Flush unlogged tables' buffers when copying or moving databases.

author Andres Freund <andres@anarazel.de>

Mon, 20 Oct 2014 21:43:46 +0000 (23:43 +0200)

committer Andres Freund <andres@anarazel.de>

Mon, 20 Oct 2014 21:47:45 +0000 (23:47 +0200)
author Andres Freund <andres@anarazel.de>
Mon, 20 Oct 2014 21:43:46 +0000 (23:43 +0200)
committer Andres Freund <andres@anarazel.de>
Mon, 20 Oct 2014 21:47:45 +0000 (23:47 +0200)
diff --git a/src/backend/access/transam/xlog.c b/src/backend/access/transam/xlog.c

index 89b2fb66f8b1d19ddca928e79888d7dc46a55524..c7bdd617b2645e42977402c0715d1a2d553d8566 100644 (file)
--- a/src/backend/access/transam/xlog.c
+++ b/src/backend/access/transam/xlog.c
@@ -7537,9 +7537,9 @@ LogCheckpointStart(int flags, bool restartpoint)
          * the main message, but what about all the flags?
          */
         if (restartpoint)
-               msg = "restartpoint starting:%s%s%s%s%s%s%s";
+               msg = "restartpoint starting:%s%s%s%s%s%s%s%s";
         else
-               msg = "checkpoint starting:%s%s%s%s%s%s%s";
+               msg = "checkpoint starting:%s%s%s%s%s%s%s%s";
  
         elog(LOG, msg,
                  (flags & CHECKPOINT_IS_SHUTDOWN) ? " shutdown" : "",
@@ -7548,7 +7548,8 @@ LogCheckpointStart(int flags, bool restartpoint)
                  (flags & CHECKPOINT_FORCE) ? " force" : "",
                  (flags & CHECKPOINT_WAIT) ? " wait" : "",
                  (flags & CHECKPOINT_CAUSE_XLOG) ? " xlog" : "",
-                (flags & CHECKPOINT_CAUSE_TIME) ? " time" : "");
+                (flags & CHECKPOINT_CAUSE_TIME) ? " time" : "",
+                (flags & CHECKPOINT_FLUSH_ALL) ? " flush-all" :"");
  }
  
  /*
diff --git a/src/backend/commands/dbcommands.c b/src/backend/commands/dbcommands.c

index a850582b872dad8a5845b22c7cde6caa3a5e952d..022f907f6d502c3027029efb6e3833ff420ba065 100644 (file)
--- a/src/backend/commands/dbcommands.c
+++ b/src/backend/commands/dbcommands.c
@@ -523,15 +523,17 @@ createdb(const CreatedbStmt *stmt)
         InvokeObjectAccessHook(OAT_POST_CREATE, DatabaseRelationId, dboid, 0);
  
         /*
-        * Force a checkpoint before starting the copy. This will force dirty
-        * buffers out to disk, to ensure source database is up-to-date on disk
-        * for the copy. FlushDatabaseBuffers() would suffice for that, but we
-        * also want to process any pending unlink requests. Otherwise, if a
-        * checkpoint happened while we're copying files, a file might be deleted
-        * just when we're about to copy it, causing the lstat() call in copydir()
-        * to fail with ENOENT.
+        * Force a checkpoint before starting the copy. This will force all dirty
+        * buffers, including those of unlogged tables, out to disk, to ensure
+        * source database is up-to-date on disk for the copy.
+        * FlushDatabaseBuffers() would suffice for that, but we also want
+        * to process any pending unlink requests. Otherwise, if a checkpoint
+        * happened while we're copying files, a file might be deleted just when
+        * we're about to copy it, causing the lstat() call in copydir() to fail
+        * with ENOENT.
          */
-       RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT);
+       RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT
+                                         | CHECKPOINT_FLUSH_ALL);
  
         /*
          * Take an MVCC snapshot to use while scanning through pg_tablespace.  For
@@ -1111,8 +1113,9 @@ movedb(const char *dbname, const char *tblspcname)
         dst_dbpath = GetDatabasePath(db_id, dst_tblspcoid);
  
         /*
-        * Force a checkpoint before proceeding. This will force dirty buffers out
-        * to disk, to ensure source database is up-to-date on disk for the copy.
+        * Force a checkpoint before proceeding. This will force all dirty
+        * buffers, including those of unlogged tables, out to disk, to ensure
+        * source database is up-to-date on disk for the copy.
          * FlushDatabaseBuffers() would suffice for that, but we also want to
          * process any pending unlink requests. Otherwise, the check for existing
          * files in the target directory might fail unnecessarily, not to mention
@@ -1120,7 +1123,8 @@ movedb(const char *dbname, const char *tblspcname)
          * On Windows, this also ensures that the bgwriter doesn't hold any open
          * files, which would cause rmdir() to fail.
          */
-       RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT);
+       RequestCheckpoint(CHECKPOINT_IMMEDIATE | CHECKPOINT_FORCE | CHECKPOINT_WAIT
+                                         | CHECKPOINT_FLUSH_ALL);
  
         /*
          * Check for existence of files in the target directory, i.e., objects of
diff --git a/src/backend/storage/buffer/bufmgr.c b/src/backend/storage/buffer/bufmgr.c

index aeb814e9efcdc14af69f2f1dbdea90f60bbaa6dc..cd7108b156da2ca30f236fa91c33427474684c7d 100644 (file)
--- a/src/backend/storage/buffer/bufmgr.c
+++ b/src/backend/storage/buffer/bufmgr.c
@@ -1168,9 +1168,10 @@ UnpinBuffer(volatile BufferDesc *buf, bool fixOwner)
   *
   * This is called at checkpoint time to write out all dirty shared buffers.
   * The checkpoint request flags should be passed in.  If CHECKPOINT_IMMEDIATE
- * is set, we disable delays between writes; if CHECKPOINT_IS_SHUTDOWN is
- * set, we write even unlogged buffers, which are otherwise skipped.  The
- * remaining flags currently have no effect here.
+ * is set, we disable delays between writes; if CHECKPOINT_IS_SHUTDOWN,
+ * CHECKPOINT_END_OF_RECOVERY or CHECKPOINT_FLUSH_ALL is set, we write even
+ * unlogged buffers, which are otherwise skipped.  The remaining flags
+ * currently have no effect here.
   */
  static void
  BufferSync(int flags)
@@ -1185,10 +1186,12 @@ BufferSync(int flags)
         ResourceOwnerEnlargeBuffers(CurrentResourceOwner);
  
         /*
-        * Unless this is a shutdown checkpoint, we write only permanent, dirty
-        * buffers.  But at shutdown or end of recovery, we write all dirty buffers.
+        * Unless this is a shutdown or end-of-recovery checkpoint, or we have
+        * been explicitly told to flush everything (CHECKPOINT_FLUSH_ALL), we
+        * write only permanent, dirty buffers.  Otherwise we write all of them.
          */
-       if (!((flags & CHECKPOINT_IS_SHUTDOWN) || (flags & CHECKPOINT_END_OF_RECOVERY)))
+       if (!((flags & (CHECKPOINT_IS_SHUTDOWN | CHECKPOINT_END_OF_RECOVERY |
+                                       CHECKPOINT_FLUSH_ALL))))
                 mask |= BM_PERMANENT;
  
         /*
diff --git a/src/include/access/xlog.h b/src/include/access/xlog.h

index 41b9da891bc0d228e13b522d6c3bfd9b6d2152d6..8250254fa300089697c764a39e39a31b80ea0887 100644 (file)
--- a/src/include/access/xlog.h
+++ b/src/include/access/xlog.h
@@ -246,6 +246,8 @@ extern bool XLOG_DEBUG;
  /* These indicate the cause of a checkpoint request */
  #define CHECKPOINT_CAUSE_XLOG  0x0020  /* XLOG consumption */
  #define CHECKPOINT_CAUSE_TIME  0x0040  /* Elapsed time */
+#define CHECKPOINT_FLUSH_ALL   0x0080  /* Flush all pages, including those
+                                                                                * belonging to unlogged tables */
  
  /* Checkpoint statistics */
  typedef struct CheckpointStatsData
author	Andres Freund <andres@anarazel.de>
	Mon, 20 Oct 2014 21:43:46 +0000 (23:43 +0200)
committer	Andres Freund <andres@anarazel.de>
	Mon, 20 Oct 2014 21:47:45 +0000 (23:47 +0200)
src/backend/access/transam/xlog.c		patch \| blob \| history
src/backend/commands/dbcommands.c		patch \| blob \| history
src/backend/storage/buffer/bufmgr.c		patch \| blob \| history
src/include/access/xlog.h		patch \| blob \| history