pg_upgrade: check for clean server shutdowns

author Bruce Momjian <bruce@momjian.us>

Sat, 28 Jul 2018 19:01:55 +0000 (15:01 -0400)

committer Bruce Momjian <bruce@momjian.us>

Sat, 28 Jul 2018 19:01:55 +0000 (15:01 -0400)
author Bruce Momjian <bruce@momjian.us>
Sat, 28 Jul 2018 19:01:55 +0000 (15:01 -0400)
committer Bruce Momjian <bruce@momjian.us>
Sat, 28 Jul 2018 19:01:55 +0000 (15:01 -0400)
diff --git a/src/bin/pg_upgrade/controldata.c b/src/bin/pg_upgrade/controldata.c

index 0fe98a550e15746452f92df2fef6c37f60cd48b3..bba3b1b76e5fc4e033fb57f5e67ab60e9c5feda2 100644 (file)
--- a/src/bin/pg_upgrade/controldata.c
+++ b/src/bin/pg_upgrade/controldata.c
@@ -58,6 +58,7 @@ get_control_data(ClusterInfo *cluster, bool live_check)
         bool            got_large_object = false;
         bool            got_date_is_int = false;
         bool            got_data_checksum_version = false;
+       bool            got_cluster_state = false;
         char       *lc_collate = NULL;
         char       *lc_ctype = NULL;
         char       *lc_monetary = NULL;
@@ -422,6 +423,64 @@ get_control_data(ClusterInfo *cluster, bool live_check)
  
         pclose(output);
  
+       /*
+        * Check for clean shutdown
+        */
+
+       /* only pg_controldata outputs the cluster state */
+       snprintf(cmd, sizeof(cmd), "\"%s/pg_controldata\" \"%s\"",
+                        cluster->bindir, cluster->pgdata);
+       fflush(stdout);
+       fflush(stderr);
+
+       if ((output = popen(cmd, "r")) == NULL)
+               pg_fatal("could not get control data using %s: %s\n",
+                                cmd, strerror(errno));
+
+       /* We have the result of cmd in "output", so parse it line by line now. */
+       while (fgets(bufin, sizeof(bufin), output))
+       {
+               if ((!live_check || cluster == &new_cluster) &&
+                       (p = strstr(bufin, "Database cluster state:")) != NULL)
+               {
+                       p = strchr(p, ':');
+
+                       if (p == NULL || strlen(p) <= 1)
+                               pg_fatal("%d: database cluster state problem\n", __LINE__);
+
+                       p++;                            /* remove ':' char */
+
+                       /*
+                        * We checked earlier for a postmaster lock file, and if we found
+                        * one, we tried to start/stop the server to replay the WAL.  However,
+                        * pg_ctl -m immediate doesn't leave a lock file, but does require
+                        * WAL replay, so we check here that the server was shut down cleanly,
+                        * from the controldata perspective.
+                        */
+                       /* remove leading spaces */
+                       while (*p == ' ')
+                               p++;
+                       if (strcmp(p, "shut down\n") != 0)
+                       {
+                               if (cluster == &old_cluster)
+                                       pg_fatal("The source cluster was not shut down cleanly.\n");
+                               else
+                                       pg_fatal("The target cluster was not shut down cleanly.\n");
+                       }
+                       got_cluster_state = true;
+               }
+       }
+
+       pclose(output);
+
+       if (!got_cluster_state)
+       {
+               if (cluster == &old_cluster)
+                       pg_fatal("The source cluster lacks cluster state information:\n");
+               else
+                       pg_fatal("The target cluster lacks cluster state information:\n");
+       }
+
         /*
          * Restore environment variables
          */
diff --git a/src/bin/pg_upgrade/pg_upgrade.c b/src/bin/pg_upgrade/pg_upgrade.c

index 9fc364bf5ccc6ae93511f1972b6c226636e38bd2..b777f9d651bc05cd72a45b25c7bb7e5914ee4e93 100644 (file)
--- a/src/bin/pg_upgrade/pg_upgrade.c
+++ b/src/bin/pg_upgrade/pg_upgrade.c
@@ -220,7 +220,8 @@ setup(char *argv0, bool *live_check)
                  * start, assume the server is running.  If the pid file is left over
                  * from a server crash, this also allows any committed transactions
                  * stored in the WAL to be replayed so they are not lost, because WAL
-                * files are not transferred from old to new servers.
+                * files are not transferred from old to new servers.  We later check
+                * for a clean shutdown.
                  */
                 if (start_postmaster(&old_cluster, false))
                         stop_postmaster(false);
author	Bruce Momjian <bruce@momjian.us>
	Sat, 28 Jul 2018 19:01:55 +0000 (15:01 -0400)
committer	Bruce Momjian <bruce@momjian.us>
	Sat, 28 Jul 2018 19:01:55 +0000 (15:01 -0400)
src/bin/pg_upgrade/controldata.c		patch \| blob \| history
src/bin/pg_upgrade/pg_upgrade.c		patch \| blob \| history