Basic foreign table support.

[postgresql] / src / bin / pg_dump / pg_backup_archiver.c
diff --git a/src/bin/pg_dump/pg_backup_archiver.c b/src/bin/pg_dump/pg_backup_archiver.c

index 61e4e412226217b634dc7904de3c36925b592cf7..64d8d93dda81805540ac70dbd7afcf11390c19fc 100644 (file)
--- a/src/bin/pg_dump/pg_backup_archiver.c
+++ b/src/bin/pg_dump/pg_backup_archiver.c
@@ -15,7 +15,7 @@
   *
   *
   * IDENTIFICATION
- *             $PostgreSQL: pgsql/src/bin/pg_dump/pg_backup_archiver.c,v 1.187 2010/07/06 19:18:59 momjian Exp $
+ *             src/bin/pg_dump/pg_backup_archiver.c
   *
   *-------------------------------------------------------------------------
   */
@@ -79,6 +79,10 @@ const char *progname;
  
  static const char *modulename = gettext_noop("archiver");
  
+/* index array created by fix_dependencies -- only used in parallel restore */
+static TocEntry          **tocsByDumpId;                       /* index by dumpId - 1 */
+static DumpId          maxDumpId;                              /* length of above array */
+
  
  static ArchiveHandle *_allocAH(const char *FileSpec, const ArchiveFormat fmt,
                  const int compression, ArchiveMode mode);
@@ -102,7 +106,7 @@ static bool _tocEntryIsACL(TocEntry *te);
  static void _disableTriggersIfNecessary(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt);
  static void _enableTriggersIfNecessary(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt);
  static TocEntry *getTocEntryByDumpId(ArchiveHandle *AH, DumpId id);
-static void _moveAfter(ArchiveHandle *AH, TocEntry *pos, TocEntry *te);
+static void _moveBefore(ArchiveHandle *AH, TocEntry *pos, TocEntry *te);
  static int     _discoverArchiveFormat(ArchiveHandle *AH);
  
  static void dump_lo_buf(ArchiveHandle *AH);
@@ -134,9 +138,7 @@ static void fix_dependencies(ArchiveHandle *AH);
  static bool has_lock_conflicts(TocEntry *te1, TocEntry *te2);
  static void repoint_table_dependencies(ArchiveHandle *AH,
                                                    DumpId tableId, DumpId tableDataId);
-static void identify_locking_dependencies(TocEntry *te,
-                                                         TocEntry **tocsByDumpId,
-                                                         DumpId maxDumpId);
+static void identify_locking_dependencies(TocEntry *te);
  static void reduce_dependencies(ArchiveHandle *AH, TocEntry *te,
                                         TocEntry *ready_list);
  static void mark_create_done(ArchiveHandle *AH, TocEntry *te);
@@ -995,15 +997,11 @@ SortTocFromFile(Archive *AHX, RestoreOptions *ropt)
         char       *endptr;
         DumpId          id;
         TocEntry   *te;
-       TocEntry   *tePrev;
  
         /* Allocate space for the 'wanted' array, and init it */
         ropt->idWanted = (bool *) malloc(sizeof(bool) * AH->maxDumpId);
         memset(ropt->idWanted, 0, sizeof(bool) * AH->maxDumpId);
  
-       /* Set prev entry as head of list */
-       tePrev = AH->toc;
-
         /* Setup the file */
         fh = fopen(ropt->tocFile, PG_BINARY_R);
         if (!fh)
@@ -1018,7 +1016,7 @@ SortTocFromFile(Archive *AHX, RestoreOptions *ropt)
                         cmnt[0] = '\0';
  
                 /* Ignore if all blank */
-               if (strspn(buf, " \t\r") == strlen(buf))
+               if (strspn(buf, " \t\r\n") == strlen(buf))
                         continue;
  
                 /* Get an ID, check it's valid and not already seen */
@@ -1036,10 +1034,21 @@ SortTocFromFile(Archive *AHX, RestoreOptions *ropt)
                         die_horribly(AH, modulename, "could not find entry for ID %d\n",
                                                  id);
  
+               /* Mark it wanted */
                 ropt->idWanted[id - 1] = true;
  
-               _moveAfter(AH, tePrev, te);
-               tePrev = te;
+               /*
+                * Move each item to the end of the list as it is selected, so that
+                * they are placed in the desired order.  Any unwanted items will end
+                * up at the front of the list, which may seem unintuitive but it's
+                * what we need.  In an ordinary serial restore that makes no
+                * difference, but in a parallel restore we need to mark unrestored
+                * items' dependencies as satisfied before we start examining
+                * restorable items.  Otherwise they could have surprising
+                * side-effects on the order in which restorable items actually get
+                * restored.
+                */
+               _moveBefore(AH, AH->toc, te);
         }
  
         if (fclose(fh) != 0)
@@ -1471,33 +1480,37 @@ warn_or_die_horribly(ArchiveHandle *AH,
         va_end(ap);
  }
  
+#ifdef NOT_USED
+
  static void
  _moveAfter(ArchiveHandle *AH, TocEntry *pos, TocEntry *te)
  {
+       /* Unlink te from list */
         te->prev->next = te->next;
         te->next->prev = te->prev;
  
+       /* and insert it after "pos" */
         te->prev = pos;
         te->next = pos->next;
-
         pos->next->prev = te;
         pos->next = te;
  }
  
-#ifdef NOT_USED
+#endif
  
  static void
  _moveBefore(ArchiveHandle *AH, TocEntry *pos, TocEntry *te)
  {
+       /* Unlink te from list */
         te->prev->next = te->next;
         te->next->prev = te->prev;
  
+       /* and insert it before "pos" */
         te->prev = pos->prev;
         te->next = pos;
         pos->prev->next = te;
         pos->prev = te;
  }
-#endif
  
  static TocEntry *
  getTocEntryByDumpId(ArchiveHandle *AH, DumpId id)
@@ -2264,6 +2277,10 @@ _tocEntryRequired(TocEntry *te, RestoreOptions *ropt, bool include_acls)
         if ((!include_acls || ropt->aclsSkip) && _tocEntryIsACL(te))
                 return 0;
  
+       /* If it's security labels, maybe ignore it */
+       if (ropt->skip_seclabel && strcmp(te->desc, "SECURITY LABEL") == 0)
+               return 0;
+
         /* Ignore DATABASE entry unless we should create it */
         if (!ropt->createDB && strcmp(te->desc, "DATABASE") == 0)
                 return 0;
@@ -2330,6 +2347,8 @@ _tocEntryRequired(TocEntry *te, RestoreOptions *ropt, bool include_acls)
                         (strcmp(te->desc, "ACL") == 0 &&
                          strncmp(te->tag, "LARGE OBJECT ", 13) == 0) ||
                         (strcmp(te->desc, "COMMENT") == 0 &&
+                        strncmp(te->tag, "LARGE OBJECT ", 13) == 0) ||
+                       (strcmp(te->desc, "SECURITY LABEL") == 0 &&
                          strncmp(te->tag, "LARGE OBJECT ", 13) == 0))
                         res = res & REQ_DATA;
                 else
@@ -2707,6 +2726,7 @@ _getObjectDescription(PQExpBuffer buf, TocEntry *te, ArchiveHandle *AH)
                 strcmp(type, "DOMAIN") == 0 ||
                 strcmp(type, "TABLE") == 0 ||
                 strcmp(type, "TYPE") == 0 ||
+               strcmp(type, "FOREIGN TABLE") == 0 ||
                 strcmp(type, "TEXT SEARCH DICTIONARY") == 0 ||
                 strcmp(type, "TEXT SEARCH CONFIGURATION") == 0)
         {
@@ -2899,6 +2919,7 @@ _printTocEntry(ArchiveHandle *AH, TocEntry *te, RestoreOptions *ropt, bool isDat
                         strcmp(te->desc, "TYPE") == 0 ||
                         strcmp(te->desc, "VIEW") == 0 ||
                         strcmp(te->desc, "SEQUENCE") == 0 ||
+                       strcmp(te->desc, "FOREIGN TABLE") == 0 ||
                         strcmp(te->desc, "TEXT SEARCH DICTIONARY") == 0 ||
                         strcmp(te->desc, "TEXT SEARCH CONFIGURATION") == 0 ||
                         strcmp(te->desc, "FOREIGN DATA WRAPPER") == 0 ||
@@ -3180,13 +3201,16 @@ restore_toc_entries_parallel(ArchiveHandle *AH)
          * Do all the early stuff in a single connection in the parent. There's no
          * great point in running it in parallel, in fact it will actually run
          * faster in a single connection because we avoid all the connection and
-        * setup overhead.
+        * setup overhead.  Also, pg_dump is not currently very good about
+        * showing all the dependencies of SECTION_PRE_DATA items, so we do not
+        * risk trying to process them out-of-order.
          */
         for (next_work_item = AH->toc->next; next_work_item != AH->toc; next_work_item = next_work_item->next)
         {
+               /* Non-PRE_DATA items are just ignored for now */
                 if (next_work_item->section == SECTION_DATA ||
                         next_work_item->section == SECTION_POST_DATA)
-                       break;
+                       continue;
  
                 ahlog(AH, 1, "processing item %d %s %s\n",
                           next_work_item->dumpId,
@@ -3229,12 +3253,17 @@ restore_toc_entries_parallel(ArchiveHandle *AH)
          */
         par_list_header_init(&pending_list);
         par_list_header_init(&ready_list);
-       for (; next_work_item != AH->toc; next_work_item = next_work_item->next)
+       for (next_work_item = AH->toc->next; next_work_item != AH->toc; next_work_item = next_work_item->next)
         {
-               if (next_work_item->depCount > 0)
-                       par_list_append(&pending_list, next_work_item);
-               else
-                       par_list_append(&ready_list, next_work_item);
+               /* All PRE_DATA items were dealt with above */
+               if (next_work_item->section == SECTION_DATA ||
+                       next_work_item->section == SECTION_POST_DATA)
+               {
+                       if (next_work_item->depCount > 0)
+                               par_list_append(&pending_list, next_work_item);
+                       else
+                               par_list_append(&ready_list, next_work_item);
+               }
         }
  
         /*
@@ -3718,7 +3747,12 @@ mark_work_done(ArchiveHandle *AH, TocEntry *ready_list,
  /*
   * Process the dependency information into a form useful for parallel restore.
   *
- * We set up depCount fields that are the number of as-yet-unprocessed
+ * This function takes care of fixing up some missing or badly designed
+ * dependencies, and then prepares subsidiary data structures that will be
+ * used in the main parallel-restore logic, including:
+ * 1. We build the tocsByDumpId[] index array.
+ * 2. We build the revDeps[] arrays of incoming dependency dumpIds.
+ * 3. We set up depCount fields that are the number of as-yet-unprocessed
   * dependencies for each TOC entry.
   *
   * We also identify locking dependencies so that we can avoid trying to
@@ -3727,22 +3761,20 @@ mark_work_done(ArchiveHandle *AH, TocEntry *ready_list,
  static void
  fix_dependencies(ArchiveHandle *AH)
  {
-       TocEntry  **tocsByDumpId;
         TocEntry   *te;
-       DumpId          maxDumpId;
         int                     i;
  
         /*
-        * For some of the steps here, it is convenient to have an array that
-        * indexes the TOC entries by dump ID, rather than searching the TOC list
-        * repeatedly.  Entries for dump IDs not present in the TOC will be NULL.
+        * It is convenient to have an array that indexes the TOC entries by dump
+        * ID, rather than searching the TOC list repeatedly.  Entries for dump
+        * IDs not present in the TOC will be NULL.
          *
          * NOTE: because maxDumpId is just the highest dump ID defined in the
          * archive, there might be dependencies for IDs > maxDumpId.  All uses of
          * this array must guard against out-of-range dependency numbers.
          *
-        * Also, initialize the depCount fields, and make sure all the TOC items
-        * are marked as not being in any parallel-processing list.
+        * Also, initialize the depCount/revDeps/nRevDeps fields, and make sure
+        * the TOC items are marked as not being in any parallel-processing list.
          */
         maxDumpId = AH->maxDumpId;
         tocsByDumpId = (TocEntry **) calloc(maxDumpId, sizeof(TocEntry *));
@@ -3750,6 +3782,8 @@ fix_dependencies(ArchiveHandle *AH)
         {
                 tocsByDumpId[te->dumpId - 1] = te;
                 te->depCount = te->nDeps;
+               te->revDeps = NULL;
+               te->nRevDeps = 0;
                 te->par_prev = NULL;
                 te->par_next = NULL;
         }
@@ -3767,6 +3801,9 @@ fix_dependencies(ArchiveHandle *AH)
          * TABLE, if possible.  However, if the dependency isn't in the archive
          * then just assume it was a TABLE; this is to cover cases where the table
          * was suppressed but we have the data and some dependent post-data items.
+        *
+        * XXX this is O(N^2) if there are a lot of tables.  We ought to fix
+        * pg_dump to produce correctly-linked dependencies in the first place.
          */
         for (te = AH->toc->next; te != AH->toc; te = te->next)
         {
@@ -3813,8 +3850,14 @@ fix_dependencies(ArchiveHandle *AH)
         }
  
         /*
-        * It is possible that the dependencies list items that are not in the
-        * archive at all.      Subtract such items from the depCounts.
+        * At this point we start to build the revDeps reverse-dependency arrays,
+        * so all changes of dependencies must be complete.
+        */
+
+       /*
+        * Count the incoming dependencies for each item.  Also, it is possible
+        * that the dependencies list items that are not in the archive at
+        * all.  Subtract such items from the depCounts.
          */
         for (te = AH->toc->next; te != AH->toc; te = te->next)
         {
@@ -3822,11 +3865,43 @@ fix_dependencies(ArchiveHandle *AH)
                 {
                         DumpId          depid = te->dependencies[i];
  
-                       if (depid > maxDumpId || tocsByDumpId[depid - 1] == NULL)
+                       if (depid <= maxDumpId && tocsByDumpId[depid - 1] != NULL)
+                               tocsByDumpId[depid - 1]->nRevDeps++;
+                       else
                                 te->depCount--;
                 }
         }
  
+       /*
+        * Allocate space for revDeps[] arrays, and reset nRevDeps so we can
+        * use it as a counter below.
+        */
+       for (te = AH->toc->next; te != AH->toc; te = te->next)
+       {
+               if (te->nRevDeps > 0)
+                       te->revDeps = (DumpId *) malloc(te->nRevDeps * sizeof(DumpId));
+               te->nRevDeps = 0;
+       }
+
+       /*
+        * Build the revDeps[] arrays of incoming-dependency dumpIds.  This
+        * had better agree with the loops above.
+        */
+       for (te = AH->toc->next; te != AH->toc; te = te->next)
+       {
+               for (i = 0; i < te->nDeps; i++)
+               {
+                       DumpId          depid = te->dependencies[i];
+
+                       if (depid <= maxDumpId && tocsByDumpId[depid - 1] != NULL)
+                       {
+                               TocEntry   *otherte = tocsByDumpId[depid - 1];
+
+                               otherte->revDeps[otherte->nRevDeps++] = te->dumpId;
+                       }
+               }
+       }
+
         /*
          * Lastly, work out the locking dependencies.
          */
@@ -3834,10 +3909,8 @@ fix_dependencies(ArchiveHandle *AH)
         {
                 te->lockDeps = NULL;
                 te->nLockDeps = 0;
-               identify_locking_dependencies(te, tocsByDumpId, maxDumpId);
+               identify_locking_dependencies(te);
         }
-
-       free(tocsByDumpId);
  }
  
  /*
@@ -3871,13 +3944,9 @@ repoint_table_dependencies(ArchiveHandle *AH,
   * Identify which objects we'll need exclusive lock on in order to restore
   * the given TOC entry (*other* than the one identified by the TOC entry
   * itself).  Record their dump IDs in the entry's lockDeps[] array.
- * tocsByDumpId[] is a convenience array (of size maxDumpId) to avoid
- * searching the TOC for each dependency.
   */
  static void
-identify_locking_dependencies(TocEntry *te,
-                                                         TocEntry **tocsByDumpId,
-                                                         DumpId maxDumpId)
+identify_locking_dependencies(TocEntry *te)
  {
         DumpId     *lockids;
         int                     nlockids;
@@ -3931,31 +4000,21 @@ identify_locking_dependencies(TocEntry *te,
  static void
  reduce_dependencies(ArchiveHandle *AH, TocEntry *te, TocEntry *ready_list)
  {
-       DumpId          target = te->dumpId;
         int                     i;
  
-       ahlog(AH, 2, "reducing dependencies for %d\n", target);
+       ahlog(AH, 2, "reducing dependencies for %d\n", te->dumpId);
  
-       /*
-        * We must examine all entries, not only the ones after the target item,
-        * because if the user used a -L switch then the original dependency-
-        * respecting order has been destroyed by SortTocFromFile.
-        */
-       for (te = AH->toc->next; te != AH->toc; te = te->next)
+       for (i = 0; i < te->nRevDeps; i++)
         {
-               for (i = 0; i < te->nDeps; i++)
+               TocEntry   *otherte = tocsByDumpId[te->revDeps[i] - 1];
+
+               otherte->depCount--;
+               if (otherte->depCount == 0 && otherte->par_prev != NULL)
                 {
-                       if (te->dependencies[i] == target)
-                       {
-                               te->depCount--;
-                               if (te->depCount == 0 && te->par_prev != NULL)
-                               {
-                                       /* It must be in the pending list, so remove it ... */
-                                       par_list_remove(te);
-                                       /* ... and add to ready_list */
-                                       par_list_append(ready_list, te);
-                               }
-                       }
+                       /* It must be in the pending list, so remove it ... */
+                       par_list_remove(otherte);
+                       /* ... and add to ready_list */
+                       par_list_append(ready_list, otherte);
                 }
         }
  }