mirror of
https://github.com/postgres/postgres.git
synced 2025-05-20 00:03:14 -04:00
Add /contrib/pg_standby:
pg_standby is a production-ready program that can be used to create a Warm Standby server. Other configuration is required as well, all of which is described in the main server manual. Simon Riggs
This commit is contained in:
parent
528779a2c6
commit
51be14e928
18
contrib/pg_standby/Makefile
Normal file
18
contrib/pg_standby/Makefile
Normal file
@ -0,0 +1,18 @@
|
|||||||
|
|
||||||
|
# contrib/pg_standby/Makefile
#
# Declares the pg_standby program, its single object file and its README
# for the contrib / PGXS build rules included below.

PROGRAM = pg_standby
OBJS    = pg_standby.o

PG_CPPFLAGS = -I$(libpq_srcdir)
PG_LIBS     = $(libpq_pgport)

DOCS = README.pg_standby

# With USE_PGXS defined, the build rules are located through pg_config;
# otherwise they come from the enclosing source tree two levels up.
ifdef USE_PGXS
PGXS := $(shell pg_config --pgxs)
include $(PGXS)
else
subdir = contrib/pg_standby
top_builddir = ../..
include $(top_builddir)/src/Makefile.global
include $(top_srcdir)/contrib/contrib-global.mk
endif
|
164
contrib/pg_standby/README.pg_standby
Normal file
164
contrib/pg_standby/README.pg_standby
Normal file
@ -0,0 +1,164 @@
|
|||||||
|
pg_standby README 2006/12/08 Simon Riggs
|
||||||
|
|
||||||
|
o What is pg_standby?
|
||||||
|
|
||||||
|
pg_standby is a production-ready program that can be used to
|
||||||
|
create a Warm Standby server. Other configuration is required
|
||||||
|
as well, all of which is described in the main server manual.
|
||||||
|
|
||||||
|
The program is designed to be a wait-for restore_command,
|
||||||
|
required to turn a normal archive recovery into a Warm Standby.
|
||||||
|
Within the restore_command of the recovery.conf you could
|
||||||
|
configure pg_standby in the following way:
|
||||||
|
|
||||||
|
restore_command = 'pg_standby archiveDir %f %p'
|
||||||
|
|
||||||
|
which would be sufficient to define that files will be restored
|
||||||
|
from archiveDir.
|
||||||
|
|
||||||
|
o features of pg_standby
|
||||||
|
|
||||||
|
- pg_standby is written in C. So it is very portable
|
||||||
|
and easy to install.
|
||||||
|
|
||||||
|
- supports copy or link from a directory (only)
|
||||||
|
|
||||||
|
- source easy to modify, with specifically designated
|
||||||
|
sections to modify for your own needs, allowing
|
||||||
|
interfaces to be written for additional Backup Archive Restore
|
||||||
|
(BAR) systems
|
||||||
|
|
||||||
|
- portable: tested on Linux and Windows
|
||||||
|
|
||||||
|
o How to install pg_standby
|
||||||
|
|
||||||
|
$make
|
||||||
|
$make install
|
||||||
|
|
||||||
|
o How to use pg_standby?
|
||||||
|
|
||||||
|
pg_standby should be used within the restore_command of the
|
||||||
|
recovery.conf file. See the main PostgreSQL manual for details.
|
||||||
|
|
||||||
|
The basic usage should be like this:
|
||||||
|
|
||||||
|
restore_command = 'pg_standby archiveDir %f %p'
|
||||||
|
|
||||||
|
with the pg_standby command usage as
|
||||||
|
|
||||||
|
pg_standby [OPTION]... [ARCHIVELOCATION] [NEXTWALFILE] [XLOGFILEPATH]
|
||||||
|
|
||||||
|
When used within the restore_command the %f and %p macros
|
||||||
|
will provide the actual file and path required for the restore/recovery.
|
||||||
|
|
||||||
|
o options
|
||||||
|
|
||||||
|
pg_standby has a number of options.
|
||||||
|
|
||||||
|
-c
|
||||||
|
use copy/cp command to restore WAL files from archive
|
||||||
|
|
||||||
|
-d
|
||||||
|
debug/logging option.
|
||||||
|
|
||||||
|
-k numfiles
|
||||||
|
Cleanup files in the archive so that we maintain no more
|
||||||
|
than this many files in the archive.
|
||||||
|
|
||||||
|
You should be wary of setting this number too low,
|
||||||
|
since this may mean you cannot restart the standby. This
|
||||||
|
is because the last restartpoint marked in the WAL files
|
||||||
|
may be many files in the past and can vary considerably.
|
||||||
|
This should be set to a value exceeding the number of WAL
|
||||||
|
files that can be recovered in 2*checkpoint_timeout seconds,
|
||||||
|
according to the value in the warm standby postgresql.conf.
|
||||||
|
It is wholly unrelated to the setting of checkpoint_segments
|
||||||
|
on either primary or standby.
|
||||||
|
|
||||||
|
If in doubt, use a large value or do not set a value at all.
|
||||||
|
|
||||||
|
-l
|
||||||
|
use ln command to restore WAL files from archive
|
||||||
|
WAL files will remain in archive
|
||||||
|
|
||||||
|
Link is more efficient, but the default is copy to
|
||||||
|
allow you to maintain the WAL archive for recovery
|
||||||
|
purposes as well as high-availability.
|
||||||
|
|
||||||
|
This option uses the Windows Vista command mklink
|
||||||
|
to provide a file-to-file symbolic link. -l will
|
||||||
|
not work on versions of Windows prior to Vista.
|
||||||
|
Use the -c option instead.
|
||||||
|
see http://en.wikipedia.org/wiki/NTFS_symbolic_link
|
||||||
|
|
||||||
|
-r maxretries
|
||||||
|
the maximum number of times to retry the restore command if it
|
||||||
|
fails. After each failure, we wait for sleeptime * num_retries
|
||||||
|
so that the wait time increases progressively, so by default
|
||||||
|
we will wait 5 secs, 10 secs then 15 secs before reporting
|
||||||
|
the failure back to the database server. This will be
|
||||||
|
interpreted as an end of recovery and the Standby will come
|
||||||
|
up fully as a result.
|
||||||
|
Default=3
|
||||||
|
|
||||||
|
-s sleeptime
|
||||||
|
the number of seconds to sleep between testing to see
|
||||||
|
if the file to be restored is available in the archive yet.
|
||||||
|
The default setting is not necessarily recommended,
|
||||||
|
consult the main database server manual for discussion.
|
||||||
|
Default=5
|
||||||
|
|
||||||
|
-t triggerfile
|
||||||
|
the presence of the triggerfile will cause recovery to end
|
||||||
|
whether or not the next file is available
|
||||||
|
It is recommended that you use a structured filename to
|
||||||
|
avoid confusion as to which server is being triggered
|
||||||
|
when multiple servers exist on same system.
|
||||||
|
e.g. /tmp/pgsql.trigger.5432
|
||||||
|
|
||||||
|
-w maxwaittime
|
||||||
|
the maximum number of seconds to wait for the next file,
|
||||||
|
after which recovery will end and the Standby will come up.
|
||||||
|
The default setting is not necessarily recommended,
|
||||||
|
consult the main database server manual for discussion.
|
||||||
|
Default=0
|
||||||
|
|
||||||
|
Note: --help is not supported since pg_standby is not intended
|
||||||
|
for interactive use, except during dev/test
|
||||||
|
|
||||||
|
o examples
|
||||||
|
|
||||||
|
Linux
|
||||||
|
|
||||||
|
archive_command = 'cp %p ../archive/%f'
|
||||||
|
|
||||||
|
restore_command = 'pg_standby -l -d -k 255 -r 2 -s 2 -w 0 -t /tmp/pgsql.trigger.5442 $PWD/../archive %f %p 2>> standby.log'
|
||||||
|
|
||||||
|
which will
|
||||||
|
- use a ln command to restore WAL files from archive
|
||||||
|
- produce logfile output in standby.log
|
||||||
|
- keep the last 255 full WAL files, plus the current one
|
||||||
|
- sleep for 2 seconds between checks for whether the next WAL file is full
|
||||||
|
- never timeout if file not found
|
||||||
|
- stop waiting when a trigger file called /tmp/pgsql.trigger.5442 appears
|
||||||
|
|
||||||
|
Windows
|
||||||
|
|
||||||
|
archive_command = 'copy %p ..\\archive\\%f'
|
||||||
|
Note that backslashes need to be doubled in the archive_command, but
|
||||||
|
*not* in the restore_command, in 8.2, 8.1, 8.0 on Windows.
|
||||||
|
|
||||||
|
restore_command = 'pg_standby -c -d -s 5 -w 0 -t C:\pgsql.trigger.5442
|
||||||
|
..\archive %f %p 2>> standby.log'
|
||||||
|
|
||||||
|
which will
|
||||||
|
- use a copy command to restore WAL files from archive
|
||||||
|
- produce logfile output in standby.log
|
||||||
|
- sleep for 5 seconds between checks for whether the next WAL file is full
|
||||||
|
- never timeout if file not found
|
||||||
|
- stop waiting when a trigger file called C:\pgsql.trigger.5442 appears
|
||||||
|
|
||||||
|
o reported test success
|
||||||
|
|
||||||
|
SUSE Linux 10.2
|
||||||
|
Windows XP Pro
|
619
contrib/pg_standby/pg_standby.c
Normal file
619
contrib/pg_standby/pg_standby.c
Normal file
@ -0,0 +1,619 @@
|
|||||||
|
/*
|
||||||
|
* pg_standby.c
|
||||||
|
*
|
||||||
|
* Production-ready example of how to create a Warm Standby
|
||||||
|
* database server using continuous archiving as a
|
||||||
|
* replication mechanism
|
||||||
|
*
|
||||||
|
* We separate the parameters for archive and nextWALfile
|
||||||
|
* so that we can check the archive exists, even if the
|
||||||
|
* WAL file doesn't (yet).
|
||||||
|
*
|
||||||
|
* This program will be executed once in full for each file
|
||||||
|
* requested by the warm standby server.
|
||||||
|
*
|
||||||
|
* It is designed to cater to a variety of needs, as well
|
||||||
|
* as providing a customizable section.
|
||||||
|
*
|
||||||
|
* Original author: Simon Riggs simon@2ndquadrant.com
|
||||||
|
* Current maintainer: Simon Riggs
|
||||||
|
*/
|
||||||
|
#include "postgres_fe.h"
|
||||||
|
#include "pg_config_manual.h"
|
||||||
|
|
||||||
|
#include <ctype.h>
|
||||||
|
#include <dirent.h>
|
||||||
|
#include <sys/stat.h>
|
||||||
|
#include <signal.h>
|
||||||
|
|
||||||
|
#ifdef WIN32
|
||||||
|
#include "win32.h"
|
||||||
|
int getopt(int argc, char * const argv[], const char *optstring);
|
||||||
|
#else
|
||||||
|
#include <sys/time.h>
|
||||||
|
#include <unistd.h>
|
||||||
|
|
||||||
|
#ifdef HAVE_GETOPT_H
|
||||||
|
#include <getopt.h>
|
||||||
|
#endif
|
||||||
|
|
||||||
|
#endif /* ! WIN32 */
|
||||||
|
|
||||||
|
extern char *optarg;
|
||||||
|
extern int optind;
|
||||||
|
|
||||||
|
/* Options and defaults */
|
||||||
|
int sleeptime = 5; /* amount of time to sleep between file checks */
|
||||||
|
int waittime = -1; /* how long we have been waiting, -1 no wait yet */
|
||||||
|
int maxwaittime = 0; /* how long are we prepared to wait for? */
|
||||||
|
int keepfiles = 0; /* number of WAL files to keep, 0 keep all */
|
||||||
|
int maxretries = 3; /* number of retries on restore command */
|
||||||
|
bool debug = false; /* are we debugging? */
|
||||||
|
bool triggered = false;
|
||||||
|
bool signaled = false;
|
||||||
|
|
||||||
|
char *archiveLocation; /* where to find the archive? */
|
||||||
|
char *triggerPath; /* where to find the trigger file? */
|
||||||
|
char *xlogFilePath; /* where we are going to restore to */
|
||||||
|
char *nextWALFileName; /* the file we need to get from archive */
|
||||||
|
char *priorWALFileName; /* the file we need to get from archive */
|
||||||
|
char WALFilePath[MAXPGPATH];/* the file path including archive */
|
||||||
|
char restoreCommand[MAXPGPATH]; /* run this to restore */
|
||||||
|
char inclusiveCleanupFileName[MAXPGPATH]; /* the file we need to get from archive */
|
||||||
|
|
||||||
|
#define RESTORE_COMMAND_COPY 0
|
||||||
|
#define RESTORE_COMMAND_LINK 1
|
||||||
|
int restoreCommandType;
|
||||||
|
|
||||||
|
#define XLOG_DATA 0
|
||||||
|
#define XLOG_HISTORY 1
|
||||||
|
#define XLOG_BACKUP_LABEL 2
|
||||||
|
int nextWALFileType;
|
||||||
|
|
||||||
|
#define SET_RESTORE_COMMAND(cmd, arg1, arg2) \
|
||||||
|
snprintf(restoreCommand, MAXPGPATH, cmd " %s %s", arg1, arg2)
|
||||||
|
|
||||||
|
struct stat stat_buf;
|
||||||
|
|
||||||
|
/* =====================================================================
|
||||||
|
*
|
||||||
|
* Customizable section
|
||||||
|
*
|
||||||
|
* =====================================================================
|
||||||
|
*
|
||||||
|
* Currently, this section assumes that the Archive is a locally
|
||||||
|
* accessible directory. If you want to make other assumptions,
|
||||||
|
* such as using a vendor-specific archive and access API, these
|
||||||
|
* routines are the ones you'll need to change. You're
|
||||||
|
* encouraged to submit any changes to pgsql-patches@postgresql.org
|
||||||
|
* or personally to the current maintainer. Those changes may be
|
||||||
|
* folded in to later versions of this program.
|
||||||
|
*/
|
||||||
|
|
||||||
|
/* Length of a WAL data file name: three fields of 8 hex digits each */
#define XLOG_DATA_FNAME_LEN		24

/*
 * Format timeline, log and segment numbers into a WAL data file name.
 * Reworked from access/xlog_internal.h
 */
#define XLogFileName(fname, tli, log, seg) \
	snprintf((fname), XLOG_DATA_FNAME_LEN + 1, "%08X%08X%08X", (tli), (log), (seg))
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Initialize allows customized commands into the warm standby program.
|
||||||
|
*
|
||||||
|
* As an example, and probably the common case, we use either
|
||||||
|
* cp/ln commands on *nix, or copy/move command on Windows.
|
||||||
|
*
|
||||||
|
*/
|
||||||
|
static void
|
||||||
|
CustomizableInitialize(void)
|
||||||
|
{
|
||||||
|
#ifdef WIN32
|
||||||
|
snprintf(WALFilePath, MAXPGPATH, "%s\\%s", archiveLocation, nextWALFileName);
|
||||||
|
switch (restoreCommandType)
|
||||||
|
{
|
||||||
|
case RESTORE_COMMAND_LINK:
|
||||||
|
SET_RESTORE_COMMAND("mklink",WALFilePath, xlogFilePath);
|
||||||
|
case RESTORE_COMMAND_COPY:
|
||||||
|
default:
|
||||||
|
SET_RESTORE_COMMAND("copy",WALFilePath, xlogFilePath);
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
#else
|
||||||
|
snprintf(WALFilePath, MAXPGPATH, "%s/%s", archiveLocation, nextWALFileName);
|
||||||
|
switch (restoreCommandType)
|
||||||
|
{
|
||||||
|
case RESTORE_COMMAND_LINK:
|
||||||
|
#if HAVE_WORKING_LINK
|
||||||
|
SET_RESTORE_COMMAND("ln -s -f",WALFilePath, xlogFilePath);
|
||||||
|
break;
|
||||||
|
#endif
|
||||||
|
case RESTORE_COMMAND_COPY:
|
||||||
|
default:
|
||||||
|
SET_RESTORE_COMMAND("cp",WALFilePath, xlogFilePath);
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
||||||
|
/*
|
||||||
|
* This code assumes that archiveLocation is a directory
|
||||||
|
* You may wish to add code to check for tape libraries, etc..
|
||||||
|
* So, since it is a directory, we use stat to test if its accessible
|
||||||
|
*/
|
||||||
|
if (stat(archiveLocation, &stat_buf) != 0)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "pg_standby: archiveLocation \"%s\" does not exist\n", archiveLocation);
|
||||||
|
fflush(stderr);
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* CustomizableNextWALFileReady()
|
||||||
|
*
|
||||||
|
* Is the requested file ready yet?
|
||||||
|
*/
|
||||||
|
static bool
|
||||||
|
CustomizableNextWALFileReady()
|
||||||
|
{
|
||||||
|
if (stat(WALFilePath, &stat_buf) == 0)
|
||||||
|
{
|
||||||
|
/*
|
||||||
|
* If its a backup file, return immediately
|
||||||
|
* If its a regular file return only if its the right size already
|
||||||
|
*/
|
||||||
|
if (strlen(nextWALFileName) > 24 &&
|
||||||
|
strspn(nextWALFileName, "0123456789ABCDEF") == 24 &&
|
||||||
|
strcmp(nextWALFileName + strlen(nextWALFileName) - strlen(".backup"),
|
||||||
|
".backup") == 0)
|
||||||
|
{
|
||||||
|
nextWALFileType = XLOG_BACKUP_LABEL;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
if (stat_buf.st_size == XLOG_SEG_SIZE)
|
||||||
|
{
|
||||||
|
#ifdef WIN32
|
||||||
|
/*
|
||||||
|
* Windows reports that the file has the right number of bytes
|
||||||
|
* even though the file is still being copied and cannot be
|
||||||
|
* opened by pg_standby yet. So we wait for sleeptime secs
|
||||||
|
* before attempting to restore. If that is not enough, we
|
||||||
|
* will rely on the retry/holdoff mechanism.
|
||||||
|
*/
|
||||||
|
pg_usleep(sleeptime * 1000000L);
|
||||||
|
#endif
|
||||||
|
nextWALFileType = XLOG_DATA;
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If still too small, wait until it is the correct size
|
||||||
|
*/
|
||||||
|
if (stat_buf.st_size > XLOG_SEG_SIZE)
|
||||||
|
{
|
||||||
|
if (debug)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "file size greater than expected\n");
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
exit(3);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
#define MaxSegmentsPerLogFile ( 0xFFFFFFFF / XLOG_SEG_SIZE )
|
||||||
|
|
||||||
|
static void
|
||||||
|
CustomizableCleanupPriorWALFiles(void)
|
||||||
|
{
|
||||||
|
uint32 tli,
|
||||||
|
log,
|
||||||
|
seg;
|
||||||
|
int signed_log = 0;
|
||||||
|
|
||||||
|
if (keepfiles > 0)
|
||||||
|
{
|
||||||
|
sscanf(nextWALFileName, "%08X%08X%08X", &tli, &log, &seg);
|
||||||
|
signed_log = log - (keepfiles / MaxSegmentsPerLogFile);
|
||||||
|
if (keepfiles <= seg)
|
||||||
|
seg -= keepfiles;
|
||||||
|
else
|
||||||
|
{
|
||||||
|
seg = MaxSegmentsPerLogFile - (keepfiles % MaxSegmentsPerLogFile);
|
||||||
|
signed_log--;
|
||||||
|
}
|
||||||
|
log = (uint32) signed_log;
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Work out name of prior file from current filename
|
||||||
|
*/
|
||||||
|
if (keepfiles > 0 && signed_log >= 0 && nextWALFileType == XLOG_DATA)
|
||||||
|
{
|
||||||
|
int rc;
|
||||||
|
DIR *xldir;
|
||||||
|
struct dirent *xlde;
|
||||||
|
|
||||||
|
XLogFileName(inclusiveCleanupFileName, tli, log, seg);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Assume its OK to keep failing. The failure situation may change over
|
||||||
|
* time, so we'd rather keep going on the main processing than fail
|
||||||
|
* because we couldnt clean up yet.
|
||||||
|
*/
|
||||||
|
if ((xldir = opendir(archiveLocation)) != NULL)
|
||||||
|
{
|
||||||
|
while ((xlde = readdir(xldir)) != NULL)
|
||||||
|
{
|
||||||
|
/*
|
||||||
|
* We ignore the timeline part of the XLOG segment identifiers in
|
||||||
|
* deciding whether a segment is still needed. This ensures that we
|
||||||
|
* won't prematurely remove a segment from a parent timeline. We could
|
||||||
|
* probably be a little more proactive about removing segments of
|
||||||
|
* non-parent timelines, but that would be a whole lot more
|
||||||
|
* complicated.
|
||||||
|
*
|
||||||
|
* We use the alphanumeric sorting property of the filenames to decide
|
||||||
|
* which ones are earlier than the inclusiveCleanupFileName file.
|
||||||
|
*/
|
||||||
|
if (strlen(xlde->d_name) == XLOG_DATA_FNAME_LEN &&
|
||||||
|
strspn(xlde->d_name, "0123456789ABCDEF") == XLOG_DATA_FNAME_LEN &&
|
||||||
|
strcmp(xlde->d_name + 8, inclusiveCleanupFileName + 8) <= 0)
|
||||||
|
{
|
||||||
|
#ifdef WIN32
|
||||||
|
snprintf(WALFilePath, MAXPGPATH, "%s\\%s", archiveLocation, xlde->d_name);
|
||||||
|
#else
|
||||||
|
snprintf(WALFilePath, MAXPGPATH, "%s/%s", archiveLocation, xlde->d_name);
|
||||||
|
#endif
|
||||||
|
rc = unlink(WALFilePath);
|
||||||
|
|
||||||
|
if (debug)
|
||||||
|
fprintf(stderr, "\npg_standby: removed \"%s\"\n", WALFilePath);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else
|
||||||
|
fprintf(stderr, "pg_standby: archiveLocation \"%s\" open error\n", archiveLocation);
|
||||||
|
|
||||||
|
closedir(xldir);
|
||||||
|
}
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
|
||||||
|
/* =====================================================================
|
||||||
|
* End of Customizable section
|
||||||
|
* =====================================================================
|
||||||
|
*/
|
||||||
|
|
||||||
|
/*
|
||||||
|
* CheckForExternalTrigger()
|
||||||
|
*
|
||||||
|
* Is there a trigger file?
|
||||||
|
*/
|
||||||
|
static bool
|
||||||
|
CheckForExternalTrigger(void)
|
||||||
|
{
|
||||||
|
int rc;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Look for a trigger file, if that option has been selected
|
||||||
|
*
|
||||||
|
* We use stat() here because triggerPath is always a file
|
||||||
|
* rather than potentially being in an archive
|
||||||
|
*/
|
||||||
|
if (triggerPath && stat(triggerPath, &stat_buf) == 0)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "trigger file found\n");
|
||||||
|
fflush(stderr);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* If trigger file found, we *must* delete it. Here's why:
|
||||||
|
* When recovery completes, we will be asked again
|
||||||
|
* for the same file from the archive using pg_standby
|
||||||
|
* so must remove trigger file so we can reload file again
|
||||||
|
* and come up correctly.
|
||||||
|
*/
|
||||||
|
rc = unlink(triggerPath);
|
||||||
|
if (rc != 0)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "\n ERROR: unable to remove \"%s\", rc=%d", triggerPath, rc);
|
||||||
|
fflush(stderr);
|
||||||
|
exit(rc);
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* RestoreWALFileForRecovery()
|
||||||
|
*
|
||||||
|
* Perform the action required to restore the file from archive
|
||||||
|
*/
|
||||||
|
static bool
|
||||||
|
RestoreWALFileForRecovery(void)
|
||||||
|
{
|
||||||
|
int rc = 0;
|
||||||
|
int numretries = 0;
|
||||||
|
|
||||||
|
if (debug)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "\nrunning restore :");
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
|
||||||
|
while (numretries < maxretries)
|
||||||
|
{
|
||||||
|
rc = system(restoreCommand);
|
||||||
|
if (rc == 0)
|
||||||
|
{
|
||||||
|
if (debug)
|
||||||
|
{
|
||||||
|
fprintf(stderr, " success\n");
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
pg_usleep(numretries++ * sleeptime * 1000000L);
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Allow caller to add additional info
|
||||||
|
*/
|
||||||
|
if (debug)
|
||||||
|
fprintf(stderr, "not restored : ");
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
 * usage()
 *
 * Print the command-line synopsis and the option list to stderr.
 * The example uses only options accepted by main()'s getopt string.
 */
static void
usage(void)
{
	fprintf(stderr, "\npg_standby allows Warm Standby servers to be configured\n");
	fprintf(stderr, "Usage:\n");
	fprintf(stderr, " pg_standby [OPTION]... [ARCHIVELOCATION] [NEXTWALFILE] [XLOGFILEPATH]\n");
	fprintf(stderr, " note space between [ARCHIVELOCATION] and [NEXTWALFILE]\n");
	fprintf(stderr, "with main intended use via restore_command in the recovery.conf\n");
	fprintf(stderr, " restore_command = 'pg_standby [OPTION]... [ARCHIVELOCATION] %%f %%p'\n");
	/* there is no -u option, so the example must not mention one */
	fprintf(stderr, "e.g. restore_command = 'pg_standby -l /mnt/server/archiverdir %%f %%p'\n");
	fprintf(stderr, "\nOptions:\n");
	fprintf(stderr, " -c copies file from archive (default)\n");
	fprintf(stderr, " -d generate lots of debugging output (testing only)\n");
	fprintf(stderr, " -k [NUMFILESTOKEEP] keeps history of # files in archives; unlinks/removes files beyond that\n");
	fprintf(stderr, " -l links into archive (leaves file in archive)\n");
	fprintf(stderr, " -t [TRIGGERFILE] defines a trigger file to initiate failover (no default)\n");
	fprintf(stderr, " -r [MAXRETRIES] maximum number of times to retry, with progressive wait (default=3)\n");
	fprintf(stderr, " -s [SLEEPTIME] number of seconds to wait between file checks (default=5)\n");
	fprintf(stderr, " -w [MAXWAITTIME] max number of seconds to wait for a file (0 disables)(default=0)\n");
	fflush(stderr);
}
|
||||||
|
|
||||||
|
static void
|
||||||
|
sighandler(int sig)
|
||||||
|
{
|
||||||
|
triggered = true;
|
||||||
|
signaled = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
/*------------ MAIN ----------------------------------------*/
|
||||||
|
int
|
||||||
|
main(int argc, char **argv)
|
||||||
|
{
|
||||||
|
int c;
|
||||||
|
|
||||||
|
(void) signal(SIGINT, sighandler);
|
||||||
|
(void) signal(SIGQUIT, sighandler);
|
||||||
|
|
||||||
|
while ((c = getopt(argc, argv, "cdk:lr:s:t:w:")) != -1)
|
||||||
|
{
|
||||||
|
switch (c)
|
||||||
|
{
|
||||||
|
case 'c': /* Use copy */
|
||||||
|
restoreCommandType = RESTORE_COMMAND_COPY;
|
||||||
|
break;
|
||||||
|
case 'd': /* Debug mode */
|
||||||
|
debug = true;
|
||||||
|
break;
|
||||||
|
case 'k': /* keepfiles */
|
||||||
|
keepfiles = atoi(optarg);
|
||||||
|
if (keepfiles <= 0)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "usage: pg_standby -k keepfiles must be > 0\n");
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 'l': /* Use link */
|
||||||
|
restoreCommandType = RESTORE_COMMAND_LINK;
|
||||||
|
break;
|
||||||
|
case 'r': /* Retries */
|
||||||
|
maxretries = atoi(optarg);
|
||||||
|
if (maxretries < 0)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "usage: pg_standby -r maxretries must be > 0\n");
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 's': /* Sleep time */
|
||||||
|
sleeptime = atoi(optarg);
|
||||||
|
if (sleeptime <= 0 || sleeptime > 60)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "usage: pg_standby -s sleeptime incorrectly set\n");
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 't': /* Trigger file */
|
||||||
|
triggerPath = optarg;
|
||||||
|
if (CheckForExternalTrigger())
|
||||||
|
exit(1); /* Normal exit, with non-zero */
|
||||||
|
break;
|
||||||
|
case 'w': /* Max wait time */
|
||||||
|
maxwaittime = atoi(optarg);
|
||||||
|
if (maxwaittime < 0)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "usage: pg_standby -w maxwaittime incorrectly set\n");
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Parameter checking - after checking to see if trigger file present
|
||||||
|
*/
|
||||||
|
if (argc == 1)
|
||||||
|
{
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* We will go to the archiveLocation to get nextWALFileName.
|
||||||
|
* nextWALFileName may not exist yet, which would not be an error,
|
||||||
|
* so we separate the archiveLocation and nextWALFileName so we can check
|
||||||
|
* separately whether archiveLocation exists, if not that is an error
|
||||||
|
*/
|
||||||
|
if (optind < argc)
|
||||||
|
{
|
||||||
|
archiveLocation = argv[optind];
|
||||||
|
optind++;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
fprintf(stderr, "pg_standby: must specify archiveLocation\n");
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (optind < argc)
|
||||||
|
{
|
||||||
|
nextWALFileName = argv[optind];
|
||||||
|
optind++;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
fprintf(stderr, "pg_standby: use %%f to specify nextWALFileName\n");
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
|
||||||
|
if (optind < argc)
|
||||||
|
{
|
||||||
|
xlogFilePath = argv[optind];
|
||||||
|
optind++;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
fprintf(stderr, "pg_standby: use %%p to specify xlogFilePath\n");
|
||||||
|
usage();
|
||||||
|
exit(2);
|
||||||
|
}
|
||||||
|
|
||||||
|
CustomizableInitialize();
|
||||||
|
|
||||||
|
if (debug)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "\nTrigger file : %s", triggerPath ? triggerPath : "<not set>");
|
||||||
|
fprintf(stderr, "\nWaiting for WAL file : %s", WALFilePath);
|
||||||
|
fprintf(stderr, "\nWAL file path : %s", nextWALFileName);
|
||||||
|
fprintf(stderr, "\nRestoring to... : %s", xlogFilePath);
|
||||||
|
fprintf(stderr, "\nSleep interval : %d second%s",
|
||||||
|
sleeptime, (sleeptime > 1 ? "s" : " "));
|
||||||
|
fprintf(stderr, "\nMax wait interval : %d %s",
|
||||||
|
maxwaittime, (maxwaittime > 0 ? "seconds" : "forever"));
|
||||||
|
fprintf(stderr, "\nCommand for restore : %s", restoreCommand);
|
||||||
|
if (keepfiles > 0)
|
||||||
|
fprintf(stderr, "\nNum archived files kept : last %d files", keepfiles);
|
||||||
|
else
|
||||||
|
fprintf(stderr, "\nNum archived files kept : all files");
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Check for initial history file: always the first file to be requested
|
||||||
|
* It's OK if the file isn't there - all other files need to wait
|
||||||
|
*/
|
||||||
|
if (strlen(nextWALFileName) > 8 &&
|
||||||
|
strspn(nextWALFileName, "0123456789ABCDEF") == 8 &&
|
||||||
|
strcmp(nextWALFileName + strlen(nextWALFileName) - strlen(".history"),
|
||||||
|
".history") == 0)
|
||||||
|
{
|
||||||
|
nextWALFileType = XLOG_HISTORY;
|
||||||
|
if (RestoreWALFileForRecovery())
|
||||||
|
exit(0);
|
||||||
|
else
|
||||||
|
{
|
||||||
|
if (debug)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "history file not found\n");
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
exit(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Main wait loop
|
||||||
|
*/
|
||||||
|
while (!CustomizableNextWALFileReady() && !triggered)
|
||||||
|
{
|
||||||
|
if (sleeptime <= 60)
|
||||||
|
pg_usleep(sleeptime * 1000000L);
|
||||||
|
|
||||||
|
if (signaled)
|
||||||
|
{
|
||||||
|
if (debug)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "\nsignaled to exit\n");
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
|
||||||
|
if (debug)
|
||||||
|
{
|
||||||
|
fprintf(stderr, "\nWAL file not present yet.");
|
||||||
|
if (triggerPath)
|
||||||
|
fprintf(stderr, " Checking for trigger file...");
|
||||||
|
fflush(stderr);
|
||||||
|
}
|
||||||
|
|
||||||
|
waittime += sleeptime;
|
||||||
|
|
||||||
|
if (!triggered && (CheckForExternalTrigger() || (waittime >= maxwaittime && maxwaittime > 0)))
|
||||||
|
{
|
||||||
|
triggered = true;
|
||||||
|
if (debug && waittime >= maxwaittime && maxwaittime > 0)
|
||||||
|
fprintf(stderr, "\nTimed out after %d seconds\n",waittime);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Action on exit
|
||||||
|
*/
|
||||||
|
if (triggered)
|
||||||
|
exit(1); /* Normal exit, with non-zero */
|
||||||
|
else
|
||||||
|
{
|
||||||
|
/*
|
||||||
|
* Once we have restored this file successfully we
|
||||||
|
* can remove some prior WAL files.
|
||||||
|
* If this restore fails we musn't remove any
|
||||||
|
* file because some of them will be requested again
|
||||||
|
* immediately after the failed restore, or when
|
||||||
|
* we restart recovery.
|
||||||
|
*/
|
||||||
|
if (RestoreWALFileForRecovery())
|
||||||
|
CustomizableCleanupPriorWALFiles();
|
||||||
|
exit(0);
|
||||||
|
}
|
||||||
|
}
|
Loading…
x
Reference in New Issue
Block a user