From: Heikki Linnakangas Date: Sun, 30 Dec 2012 12:26:47 +0000 (+0200) Subject: Keep timeline history files restored from archive in pg_xlog. X-Git-Tag: REL9_2_3~45 X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=7e1cf76524323755caf5894961ca973b3969c315;p=postgresql Keep timeline history files restored from archive in pg_xlog. The cascading standby patch in 9.2 changed the way WAL files are treated when restored from the archive. Before, they were restored under a temporary filename, and not kept in pg_xlog, but after the patch, they were copied under pg_xlog. This is necessary for a cascading standby to find them, but it also means that if the archive goes offline and a standby is restarted, it can recover back to where it was using the files in pg_xlog. It also means that if you take an offline backup from a standby server, it includes all the required WAL files in pg_xlog. However, the same change was not made to timeline history files, so if the WAL segment containing the checkpoint record contains a timeline switch, you will still get an error if you try to restart recovery without the archive, or recover from an offline backup taken from the standby. With this patch, timeline history files restored from archive are copied into pg_xlog like WAL files are, so that pg_xlog contains all the files required to recover. This is a corner-case pre-existing issue in 9.2, but even more important in master where it's possible for a standby to follow a timeline switch through streaming replication. To make that possible, the timeline history files must be present in pg_xlog. --- diff --git a/src/backend/access/transam/xlog.c b/src/backend/access/transam/xlog.c index ae370fb83d..6f352fd5be 100644 --- a/src/backend/access/transam/xlog.c +++ b/src/backend/access/transam/xlog.c @@ -648,6 +648,7 @@ static bool XLogPageRead(XLogRecPtr *RecPtr, int emode, bool fetching_ckpt, bool randAccess); static int emode_for_corrupt_record(int emode, XLogRecPtr RecPtr); static void XLogFileClose(void); +static void KeepFileRestoredFromArchive(char *path, char *xlogfname); static bool RestoreArchivedFile(char *path, const char *xlogfname, const char *recovername, off_t expectedSize); static void ExecuteRecoveryCommand(char *command, char *commandName, @@ -2842,74 +2843,12 @@ XLogFileRead(uint32 log, uint32 seg, int emode, TimeLineID tli, */ if (source == XLOG_FROM_ARCHIVE) { - char xlogfpath[MAXPGPATH]; - bool reload = false; - struct stat statbuf; - - XLogFilePath(xlogfpath, tli, log, seg); - if (stat(xlogfpath, &statbuf) == 0) - { - char oldpath[MAXPGPATH]; -#ifdef WIN32 - static unsigned int deletedcounter = 1; - /* - * On Windows, if another process (e.g a walsender process) holds - * the file open in FILE_SHARE_DELETE mode, unlink will succeed, - * but the file will still show up in directory listing until the - * last handle is closed, and we cannot rename the new file in its - * place until that. To avoid that problem, rename the old file to - * a temporary name first. Use a counter to create a unique - * filename, because the same file might be restored from the - * archive multiple times, and a walsender could still be holding - * onto an old deleted version of it. - */ - snprintf(oldpath, MAXPGPATH, "%s.deleted%u", - xlogfpath, deletedcounter++); - if (rename(xlogfpath, oldpath) != 0) - { - ereport(ERROR, - (errcode_for_file_access(), - errmsg("could not rename file \"%s\" to \"%s\": %m", - xlogfpath, oldpath))); - } -#else - strncpy(oldpath, xlogfpath, MAXPGPATH); -#endif - if (unlink(oldpath) != 0) - ereport(FATAL, - (errcode_for_file_access(), - errmsg("could not remove file \"%s\": %m", - xlogfpath))); - reload = true; - } - - if (rename(path, xlogfpath) < 0) - ereport(ERROR, - (errcode_for_file_access(), - errmsg("could not rename file \"%s\" to \"%s\": %m", - path, xlogfpath))); + KeepFileRestoredFromArchive(path, xlogfname); /* * Set path to point at the new file in pg_xlog. */ - strncpy(path, xlogfpath, MAXPGPATH); - - /* - * Create .done file forcibly to prevent the restored segment from - * being archived again later. - */ - XLogArchiveForceDone(xlogfname); - - /* - * If the existing segment was replaced, since walsenders might have - * it open, request them to reload a currently-open segment. - */ - if (reload) - WalSndRqstFileReload(); - - /* Signal walsender that new WAL has arrived */ - if (AllowCascadeReplication()) - WalSndWakeup(); + snprintf(path, MAXPGPATH, XLOGDIR "/%s", xlogfname); } fd = BasicOpenFile(path, O_RDONLY | PG_BINARY, 0); @@ -3024,6 +2963,83 @@ XLogFileClose(void) openLogFile = -1; } +/* + * A file was restored from the archive under a temporary filename (path), + * and now we want to keep it. Rename it under the permanent filename in + * in pg_xlog (xlogfname), replacing any existing file with the same name. + */ +static void +KeepFileRestoredFromArchive(char *path, char *xlogfname) +{ + char xlogfpath[MAXPGPATH]; + bool reload = false; + struct stat statbuf; + + snprintf(xlogfpath, MAXPGPATH, XLOGDIR "/%s", xlogfname); + + if (stat(xlogfpath, &statbuf) == 0) + { + char oldpath[MAXPGPATH]; +#ifdef WIN32 + static unsigned int deletedcounter = 1; + /* + * On Windows, if another process (e.g a walsender process) holds + * the file open in FILE_SHARE_DELETE mode, unlink will succeed, + * but the file will still show up in directory listing until the + * last handle is closed, and we cannot rename the new file in its + * place until that. To avoid that problem, rename the old file to + * a temporary name first. Use a counter to create a unique + * filename, because the same file might be restored from the + * archive multiple times, and a walsender could still be holding + * onto an old deleted version of it. + */ + snprintf(oldpath, MAXPGPATH, "%s.deleted%u", + xlogfpath, deletedcounter++); + if (rename(xlogfpath, oldpath) != 0) + { + ereport(ERROR, + (errcode_for_file_access(), + errmsg("could not rename file \"%s\" to \"%s\": %m", + xlogfpath, oldpath))); + } +#else + strncpy(oldpath, xlogfpath, MAXPGPATH); +#endif + if (unlink(oldpath) != 0) + ereport(FATAL, + (errcode_for_file_access(), + errmsg("could not remove file \"%s\": %m", + xlogfpath))); + reload = true; + } + + if (rename(path, xlogfpath) < 0) + ereport(ERROR, + (errcode_for_file_access(), + errmsg("could not rename file \"%s\" to \"%s\": %m", + path, xlogfpath))); + + /* + * Create .done file forcibly to prevent the restored segment from + * being archived again later. + */ + XLogArchiveForceDone(xlogfname); + + /* + * If the existing file was replaced, since walsenders might have it + * open, request them to reload a currently-open segment. This is only + * required for WAL segments, walsenders don't hold other files open, + * but there's no harm in doing this too often, and we don't know what + * kind of a file we're dealing with here. + */ + if (reload) + WalSndRqstFileReload(); + + /* Signal walsender that new WAL has arrived */ + if (AllowCascadeReplication()) + WalSndWakeup(); +} + /* * Attempt to retrieve the specified file from off-line archival storage. * If successful, fill "path" with its complete path (note that this will be @@ -4356,6 +4372,7 @@ readTimeLineHistory(TimeLineID targetTLI) char histfname[MAXFNAMELEN]; char fline[MAXPGPATH]; FILE *fd; + bool fromArchive = false; /* Timeline 1 does not have a history file, so no need to check */ if (targetTLI == 1) @@ -4364,7 +4381,8 @@ readTimeLineHistory(TimeLineID targetTLI) if (InArchiveRecovery) { TLHistoryFileName(histfname, targetTLI); - RestoreArchivedFile(path, histfname, "RECOVERYHISTORY", 0); + fromArchive = + RestoreArchivedFile(path, histfname, "RECOVERYHISTORY", 0); } else TLHistoryFilePath(path, targetTLI); @@ -4433,6 +4451,13 @@ readTimeLineHistory(TimeLineID targetTLI) (errmsg_internal("history of timeline %u is %s", targetTLI, nodeToString(result)))); + /* + * If the history file was fetched from archive, save it in pg_xlog for + * future reference. + */ + if (fromArchive) + KeepFileRestoredFromArchive(path, histfname); + return result; }