When two base backups are started at the same time with pg_basebackup,

author Heikki Linnakangas <heikki.linnakangas@iki.fi>

Mon, 21 Mar 2011 09:25:25 +0000 (11:25 +0200)

committer Heikki Linnakangas <heikki.linnakangas@iki.fi>

Mon, 21 Mar 2011 09:25:25 +0000 (11:25 +0200)
author Heikki Linnakangas <heikki.linnakangas@iki.fi>
Mon, 21 Mar 2011 09:25:25 +0000 (11:25 +0200)
committer Heikki Linnakangas <heikki.linnakangas@iki.fi>
Mon, 21 Mar 2011 09:25:25 +0000 (11:25 +0200)
diff --git a/src/backend/access/transam/xlog.c b/src/backend/access/transam/xlog.c

index 45ba0013c8a2e21ba5ed645c37a88f022be3ab74..306ac058c365c15fd32deed7677aefe668bb6028 100644 (file)
--- a/src/backend/access/transam/xlog.c
+++ b/src/backend/access/transam/xlog.c
@@ -355,10 +355,13 @@ typedef struct XLogCtlInsert
          * exclusiveBackup is true if a backup started with pg_start_backup() is
          * in progress, and nonExclusiveBackups is a counter indicating the number
          * of streaming base backups currently in progress. forcePageWrites is
-        * set to true when either of these is non-zero.
+        * set to true when either of these is non-zero. lastBackupStart is the
+        * latest checkpoint redo location used as a starting point for an online
+        * backup.
          */
         bool            exclusiveBackup;
         int                     nonExclusiveBackups;
+       XLogRecPtr      lastBackupStart;
  } XLogCtlInsert;
  
  /*
@@ -8808,6 +8811,19 @@ do_pg_start_backup(const char *backupidstr, bool fast, char **labelfile)
                                  errmsg("backup label too long (max %d bytes)",
                                                 MAXPGPATH)));
  
+       /*
+        * Force an XLOG file switch before the checkpoint, to ensure that the WAL
+        * segment the checkpoint is written to doesn't contain pages with old
+        * timeline IDs. That would otherwise happen if you called
+        * pg_start_backup() right after restoring from a PITR archive: the first
+        * WAL segment containing the startup checkpoint has pages in the
+        * beginning with the old timeline ID. That can cause trouble at recovery:
+        * we won't have a history file covering the old timeline if pg_xlog
+        * directory was not included in the base backup and the WAL archive was
+        * cleared too before starting the backup.
+        */
+       RequestXLogSwitch();
+
         /*
          * Mark backup active in shared memory.  We must do full-page WAL writes
          * during an on-line backup even if not doing so at other times, because
@@ -8843,43 +8859,54 @@ do_pg_start_backup(const char *backupidstr, bool fast, char **labelfile)
         XLogCtl->Insert.forcePageWrites = true;
         LWLockRelease(WALInsertLock);
  
-       /*
-        * Force an XLOG file switch before the checkpoint, to ensure that the WAL
-        * segment the checkpoint is written to doesn't contain pages with old
-        * timeline IDs. That would otherwise happen if you called
-        * pg_start_backup() right after restoring from a PITR archive: the first
-        * WAL segment containing the startup checkpoint has pages in the
-        * beginning with the old timeline ID. That can cause trouble at recovery:
-        * we won't have a history file covering the old timeline if pg_xlog
-        * directory was not included in the base backup and the WAL archive was
-        * cleared too before starting the backup.
-        */
-       RequestXLogSwitch();
-
         /* Ensure we release forcePageWrites if fail below */
         PG_ENSURE_ERROR_CLEANUP(pg_start_backup_callback, (Datum) BoolGetDatum(exclusive));
         {
-               /*
-                * Force a CHECKPOINT.  Aside from being necessary to prevent torn
-                * page problems, this guarantees that two successive backup runs will
-                * have different checkpoint positions and hence different history
-                * file names, even if nothing happened in between.
-                *
-                * We use CHECKPOINT_IMMEDIATE only if requested by user (via passing
-                * fast = true).  Otherwise this can take awhile.
-                */
-               RequestCheckpoint(CHECKPOINT_FORCE | CHECKPOINT_WAIT |
-                                                 (fast ? CHECKPOINT_IMMEDIATE : 0));
+               bool gotUniqueStartpoint = false;
+               do
+               {
+                       /*
+                        * Force a CHECKPOINT.  Aside from being necessary to prevent torn
+                        * page problems, this guarantees that two successive backup runs will
+                        * have different checkpoint positions and hence different history
+                        * file names, even if nothing happened in between.
+                        *
+                        * We use CHECKPOINT_IMMEDIATE only if requested by user (via passing
+                        * fast = true).  Otherwise this can take awhile.
+                        */
+                       RequestCheckpoint(CHECKPOINT_FORCE | CHECKPOINT_WAIT |
+                                                         (fast ? CHECKPOINT_IMMEDIATE : 0));
  
-               /*
-                * Now we need to fetch the checkpoint record location, and also its
-                * REDO pointer.  The oldest point in WAL that would be needed to
-                * restore starting from the checkpoint is precisely the REDO pointer.
-                */
-               LWLockAcquire(ControlFileLock, LW_SHARED);
-               checkpointloc = ControlFile->checkPoint;
-               startpoint = ControlFile->checkPointCopy.redo;
-               LWLockRelease(ControlFileLock);
+                       /*
+                        * Now we need to fetch the checkpoint record location, and also its
+                        * REDO pointer.  The oldest point in WAL that would be needed to
+                        * restore starting from the checkpoint is precisely the REDO pointer.
+                        */
+                       LWLockAcquire(ControlFileLock, LW_SHARED);
+                       checkpointloc = ControlFile->checkPoint;
+                       startpoint = ControlFile->checkPointCopy.redo;
+                       LWLockRelease(ControlFileLock);
+
+                       /*
+                        * If two base backups are started at the same time (in WAL
+                        * sender processes), we need to make sure that they use
+                        * different checkpoints as starting locations, because we use
+                        * the starting WAL location as a unique identifier for the base
+                        * backup in the end-of-backup WAL record and when we write the
+                        * backup history file. Perhaps it would be better generate a
+                        * separate unique ID for each backup instead of forcing another
+                        * checkpoint, but taking a checkpoint right after another is
+                        * not that expensive either because only few buffers have been
+                        * dirtied yet.
+                        */
+                       LWLockAcquire(WALInsertLock, LW_SHARED);
+                       if (XLByteLT(XLogCtl->Insert.lastBackupStart, startpoint))
+                       {
+                               XLogCtl->Insert.lastBackupStart = startpoint;
+                               gotUniqueStartpoint = true;
+                       }
+                       LWLockRelease(WALInsertLock);
+               } while(!gotUniqueStartpoint);
  
                 XLByteToSeg(startpoint, _logId, _logSeg);
                 XLogFileName(xlogfilename, ThisTimeLineID, _logId, _logSeg);
author	Heikki Linnakangas <heikki.linnakangas@iki.fi>
	Mon, 21 Mar 2011 09:25:25 +0000 (11:25 +0200)
committer	Heikki Linnakangas <heikki.linnakangas@iki.fi>
	Mon, 21 Mar 2011 09:25:25 +0000 (11:25 +0200)