]> git.ipfire.org Git - thirdparty/kernel/linux.git/commitdiff
xfs: prevent gc from picking the same zone twice
authorChristoph Hellwig <hch@lst.de>
Thu, 23 Oct 2025 15:17:02 +0000 (17:17 +0200)
committerCarlos Maiolino <cem@kernel.org>
Fri, 31 Oct 2025 11:06:03 +0000 (12:06 +0100)
When we are picking a zone for gc it might already be in the pipeline
which can lead to us moving the same data twice, resulting in write
amplification and a very unfortunate case where we keep on garbage
collecting the zone we just filled with migrated data, stopping all
forward progress.

Fix this by introducing a count of on-going GC operations on a zone, and
skip any zone with ongoing GC when picking a new victim.

Fixes: 080d01c41 ("xfs: implement zoned garbage collection")
Signed-off-by: Hans Holmberg <hans.holmberg@wdc.com>
Co-developed-by: Hans Holmberg <hans.holmberg@wdc.com>
Signed-off-by: Christoph Hellwig <hch@lst.de>
Reviewed-by: Damien Le Moal <dlemoal@kernel.org>
Reviewed-by: Carlos Maiolino <cmaiolino@redhat.com>
Reviewed-by: Darrick J. Wong <djwong@kernel.org>
Tested-by: Damien Le Moal <dlemoal@kernel.org>
Signed-off-by: Carlos Maiolino <cem@kernel.org>
fs/xfs/libxfs/xfs_rtgroup.h
fs/xfs/xfs_zone_gc.c

index d36a6ae0abe57fafc67048fd7546f61e068caf20..d4fcf591e63d08c9989439324499fbda8146a722 100644 (file)
@@ -50,6 +50,12 @@ struct xfs_rtgroup {
                uint8_t                 *rtg_rsum_cache;
                struct xfs_open_zone    *rtg_open_zone;
        };
+
+       /*
+        * Count of outstanding GC operations for zoned XFS.  Any RTG with a
+        * non-zero rtg_gccount will not be picked as new GC victim.
+        */
+       atomic_t                rtg_gccount;
 };
 
 /*
index 109877d9a6bf9e62d58f1846a89c8f7a4eab8937..4ade5444553207bf35d2f64e57f76ec402f52e7c 100644 (file)
@@ -114,6 +114,8 @@ struct xfs_gc_bio {
        /* Open Zone being written to */
        struct xfs_open_zone            *oz;
 
+       struct xfs_rtgroup              *victim_rtg;
+
        /* Bio used for reads and writes, including the bvec used by it */
        struct bio_vec                  bv;
        struct bio                      bio;    /* must be last */
@@ -264,6 +266,7 @@ xfs_zone_gc_iter_init(
        iter->rec_count = 0;
        iter->rec_idx = 0;
        iter->victim_rtg = victim_rtg;
+       atomic_inc(&victim_rtg->rtg_gccount);
 }
 
 /*
@@ -362,6 +365,7 @@ xfs_zone_gc_query(
 
        return 0;
 done:
+       atomic_dec(&iter->victim_rtg->rtg_gccount);
        xfs_rtgroup_rele(iter->victim_rtg);
        iter->victim_rtg = NULL;
        return 0;
@@ -451,6 +455,20 @@ xfs_zone_gc_pick_victim_from(
                if (!rtg)
                        continue;
 
+               /*
+                * If the zone is already undergoing GC, don't pick it again.
+                *
+                * This prevents us from picking one of the zones for which we
+                * already submitted GC I/O, but for which the remapping hasn't
+                * concluded yet.  This won't cause data corruption, but
+                * increases write amplification and slows down GC, so this is
+                * a bad thing.
+                */
+               if (atomic_read(&rtg->rtg_gccount)) {
+                       xfs_rtgroup_rele(rtg);
+                       continue;
+               }
+
                /* skip zones that are just waiting for a reset */
                if (rtg_rmap(rtg)->i_used_blocks == 0 ||
                    rtg_rmap(rtg)->i_used_blocks >= victim_used) {
@@ -688,6 +706,9 @@ xfs_zone_gc_start_chunk(
        chunk->scratch = &data->scratch[data->scratch_idx];
        chunk->data = data;
        chunk->oz = oz;
+       chunk->victim_rtg = iter->victim_rtg;
+       atomic_inc(&chunk->victim_rtg->rtg_group.xg_active_ref);
+       atomic_inc(&chunk->victim_rtg->rtg_gccount);
 
        bio->bi_iter.bi_sector = xfs_rtb_to_daddr(mp, chunk->old_startblock);
        bio->bi_end_io = xfs_zone_gc_end_io;
@@ -710,6 +731,8 @@ static void
 xfs_zone_gc_free_chunk(
        struct xfs_gc_bio       *chunk)
 {
+       atomic_dec(&chunk->victim_rtg->rtg_gccount);
+       xfs_rtgroup_rele(chunk->victim_rtg);
        list_del(&chunk->entry);
        xfs_open_zone_put(chunk->oz);
        xfs_irele(chunk->ip);
@@ -770,6 +793,10 @@ xfs_zone_gc_split_write(
        split_chunk->oz = chunk->oz;
        atomic_inc(&chunk->oz->oz_ref);
 
+       split_chunk->victim_rtg = chunk->victim_rtg;
+       atomic_inc(&chunk->victim_rtg->rtg_group.xg_active_ref);
+       atomic_inc(&chunk->victim_rtg->rtg_gccount);
+
        chunk->offset += split_len;
        chunk->len -= split_len;
        chunk->old_startblock += XFS_B_TO_FSB(data->mp, split_len);