Fix race between DROP TABLESPACE and checkpointing.

author Thomas Munro <tmunro@postgresql.org>

Wed, 16 Mar 2022 04:20:24 +0000 (17:20 +1300)

committer Thomas Munro <tmunro@postgresql.org>

Wed, 16 Mar 2022 04:41:31 +0000 (17:41 +1300)
author Thomas Munro <tmunro@postgresql.org>
Wed, 16 Mar 2022 04:20:24 +0000 (17:20 +1300)
committer Thomas Munro <tmunro@postgresql.org>
Wed, 16 Mar 2022 04:41:31 +0000 (17:41 +1300)
diff --git a/src/backend/access/transam/xlog.c b/src/backend/access/transam/xlog.c

index c64febdb53d77ab591293abe08639b71b2211c56..8e8bdde7646f728326363da21c0b8721dde925e9 100644 (file)
--- a/src/backend/access/transam/xlog.c
+++ b/src/backend/access/transam/xlog.c
@@ -8811,6 +8811,14 @@ CreateCheckPoint(int flags)
         MemSet(&CheckpointStats, 0, sizeof(CheckpointStats));
         CheckpointStats.ckpt_start_t = GetCurrentTimestamp();
  
+       /*
+        * Let smgr prepare for checkpoint; this has to happen outside the
+        * critical section and before we determine the REDO pointer.  Note that
+        * smgr must not do anything that'd have to be undone if we decide no
+        * checkpoint is needed.
+        */
+       smgrpreckpt();
+
         /*
          * Use a critical section to force system panic if we have trouble.
          */
@@ -8825,13 +8833,6 @@ CreateCheckPoint(int flags)
                 LWLockRelease(ControlFileLock);
         }
  
-       /*
-        * Let smgr prepare for checkpoint; this has to happen before we determine
-        * the REDO pointer.  Note that smgr must not do anything that'd have to
-        * be undone if we decide no checkpoint is needed.
-        */
-       smgrpreckpt();
-
         /* Begin filling in the checkpoint WAL record */
         MemSet(&checkPoint, 0, sizeof(checkPoint));
         checkPoint.time = (pg_time_t) time(NULL);
diff --git a/src/backend/storage/smgr/md.c b/src/backend/storage/smgr/md.c

index 8c98a11435477e341d4100552d6d712d64e67b5b..bfce29371fbbf1aceef1cbfe1b9874eaaf615331 100644 (file)
--- a/src/backend/storage/smgr/md.c
+++ b/src/backend/storage/smgr/md.c
@@ -1385,7 +1385,9 @@ mdsync(void)
   * counter is incremented here.
   *
   * This must be called *before* the checkpoint REDO point is determined.
- * That ensures that we won't delete files too soon.
+ * That ensures that we won't delete files too soon.  Since this calls
+ * AbsorbFsyncRequests(), which performs memory allocations, it cannot be
+ * called within a critical section.
   *
   * Note that we can't do anything here that depends on the assumption
   * that the checkpoint will be completed.
@@ -1393,6 +1395,16 @@ mdsync(void)
  void
  mdpreckpt(void)
  {
+       /*
+        * Operations such as DROP TABLESPACE assume that the next checkpoint will
+        * process all recently forwarded unlink requests, but if they aren't
+        * absorbed prior to advancing the cycle counter, they won't be processed
+        * until a future checkpoint.  The following absorb ensures that any
+        * unlink requests forwarded before the checkpoint began will be processed
+        * in the current checkpoint.
+        */
+       AbsorbFsyncRequests();
+
         /*
          * Any unlink requests arriving after this point will be assigned the next
          * cycle counter, and won't be unlinked until next checkpoint.
author	Thomas Munro <tmunro@postgresql.org>
	Wed, 16 Mar 2022 04:20:24 +0000 (17:20 +1300)
committer	Thomas Munro <tmunro@postgresql.org>
	Wed, 16 Mar 2022 04:41:31 +0000 (17:41 +1300)
src/backend/access/transam/xlog.c		patch | blob | blame | history
src/backend/storage/smgr/md.c		patch | blob | blame | history