PostgreSQL Source Code git master
Loading...
Searching...
No Matches
pg_basebackup.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * pg_basebackup.c - receive a base backup using streaming replication protocol
4 *
5 * Author: Magnus Hagander <magnus@hagander.net>
6 *
7 * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
8 *
9 * IDENTIFICATION
10 * src/bin/pg_basebackup/pg_basebackup.c
11 *-------------------------------------------------------------------------
12 */
13
14#include "postgres_fe.h"
15
16#include <unistd.h>
17#include <dirent.h>
18#include <limits.h>
19#include <sys/select.h>
20#include <sys/stat.h>
21#include <sys/wait.h>
22#include <signal.h>
23#include <time.h>
24#ifdef HAVE_LIBZ
25#include <zlib.h>
26#endif
27
29#include "astreamer_inject.h"
30#include "backup/basebackup.h"
31#include "common/compression.h"
32#include "common/file_perm.h"
33#include "common/file_utils.h"
34#include "common/logging.h"
37#include "getopt_long.h"
38#include "libpq/protocol.h"
39#include "receivelog.h"
40#include "streamutil.h"
41
42#define ERRCODE_DATA_CORRUPTED "XX001"
43
50
56
67
73
79
80typedef void (*WriteDataCallback) (size_t nbytes, char *buf,
81 void *callback_data);
82
83/*
84 * pg_xlog has been renamed to pg_wal in version 10. This version number
85 * should be compared with PQserverVersion().
86 */
87#define MINIMUM_VERSION_FOR_PG_WAL 100000
88
89/*
90 * Temporary replication slots are supported from version 10.
91 */
92#define MINIMUM_VERSION_FOR_TEMP_SLOTS 100000
93
94/*
95 * Backup manifests are supported from version 13.
96 */
97#define MINIMUM_VERSION_FOR_MANIFESTS 130000
98
99/*
100 * Before v15, tar files received from the server will be improperly
101 * terminated.
102 */
103#define MINIMUM_VERSION_FOR_TERMINATED_TARFILE 150000
104
105/*
106 * pg_wal/summaries exists beginning with version 17.
107 */
108#define MINIMUM_VERSION_FOR_WAL_SUMMARIES 170000
109
110/*
111 * Different ways to include WAL
112 */
119
120/*
121 * Different places to perform compression
122 */
129
130/* Global options */
131static char *basedir = NULL;
133static char *xlog_dir = NULL;
134static char format = '\0'; /* p(lain)/t(ar) */
135static char *label = "pg_basebackup base backup";
136static bool noclean = false;
137static bool checksum_failure = false;
138static bool showprogress = false;
139static bool estimatesize = true;
140static int verbose = 0;
142static bool fastcheckpoint = false;
143static bool writerecoveryconf = false;
144static bool do_sync = true;
145static int standby_message_timeout = 10 * 1000; /* 10 sec = default */
147static int32 maxrate = 0; /* no limit by default */
148static char *replication_slot = NULL;
149static bool temp_replication_slot = true;
150static char *backup_target = NULL;
151static bool create_slot = false;
152static bool no_slot = false;
153static bool verify_checksums = true;
154static bool manifest = true;
155static bool manifest_force_encode = false;
158
159static bool success = false;
160static bool made_new_pgdata = false;
161static bool found_existing_pgdata = false;
162static bool made_new_xlogdir = false;
163static bool found_existing_xlogdir = false;
164static bool made_tablespace_dirs = false;
165static bool found_tablespace_dirs = false;
166
167/* Progress indicators */
171static char *progress_filename = NULL;
172
173/* Pipe to communicate with background wal receiver process */
174#ifndef WIN32
175static int bgpipe[2] = {-1, -1};
176#endif
177
178/* Handle to child process */
179static pid_t bgchild = -1;
180static bool in_log_streamer = false;
181
182/* Flag to indicate if child process exited unexpectedly */
183static volatile sig_atomic_t bgchild_exited = false;
184
185/* End position for xlog streaming, empty string if unknown yet */
187
188#ifndef WIN32
189static int has_xlogendptr = 0;
190#else
191static volatile LONG has_xlogendptr = 0;
192#endif
193
194/* Contents of configuration file to be generated */
196
197/* Function headers */
198static void usage(void);
199static void verify_dir_is_empty_or_create(char *dirname, bool *created, bool *found);
200static void progress_update_filename(const char *filename);
201static void progress_report(int tablespacenum, bool force, bool finished);
202
203static astreamer *CreateBackupStreamer(char *archive_name, char *spclocation,
205 bool is_recovery_guc_supported,
207 pg_compress_specification *compress);
208static void ReceiveArchiveStreamChunk(size_t r, char *copybuf,
209 void *callback_data);
210static char GetCopyDataByte(size_t r, char *copybuf, size_t *cursor);
211static char *GetCopyDataString(size_t r, char *copybuf, size_t *cursor);
212static uint64 GetCopyDataUInt64(size_t r, char *copybuf, size_t *cursor);
213static void GetCopyDataEnd(size_t r, char *copybuf, size_t cursor);
214static void ReportCopyDataParseError(size_t r, char *copybuf);
215static void ReceiveTarFile(PGconn *conn, char *archive_name, char *spclocation,
216 bool tablespacenum, pg_compress_specification *compress);
217static void ReceiveTarCopyChunk(size_t r, char *copybuf, void *callback_data);
218static void ReceiveBackupManifest(PGconn *conn);
219static void ReceiveBackupManifestChunk(size_t r, char *copybuf,
220 void *callback_data);
222static void ReceiveBackupManifestInMemoryChunk(size_t r, char *copybuf,
223 void *callback_data);
228
229static bool reached_end_position(XLogRecPtr segendpos, uint32 timeline,
230 bool segment_finished);
231
232static const char *get_tablespace_mapping(const char *dir);
233static void tablespace_list_append(const char *arg);
234
235
236static void
238{
240 return;
241
242 if (!noclean && !checksum_failure)
243 {
244 if (made_new_pgdata)
245 {
246 pg_log_info("removing data directory \"%s\"", basedir);
247 if (!rmtree(basedir, true))
248 pg_log_error("failed to remove data directory");
249 }
250 else if (found_existing_pgdata)
251 {
252 pg_log_info("removing contents of data directory \"%s\"", basedir);
253 if (!rmtree(basedir, false))
254 pg_log_error("failed to remove contents of data directory");
255 }
256
258 {
259 pg_log_info("removing WAL directory \"%s\"", xlog_dir);
260 if (!rmtree(xlog_dir, true))
261 pg_log_error("failed to remove WAL directory");
262 }
263 else if (found_existing_xlogdir)
264 {
265 pg_log_info("removing contents of WAL directory \"%s\"", xlog_dir);
266 if (!rmtree(xlog_dir, false))
267 pg_log_error("failed to remove contents of WAL directory");
268 }
269 }
270 else
271 {
273 pg_log_info("data directory \"%s\" not removed at user's request", basedir);
274
276 pg_log_info("WAL directory \"%s\" not removed at user's request", xlog_dir);
277 }
278
280 pg_log_info("changes to tablespace directories will not be undone");
281}
282
283static void
285{
286 if (conn != NULL)
287 PQfinish(conn);
288}
289
290#ifndef WIN32
291/*
292 * If the bgchild exits prematurely and raises a SIGCHLD signal, we can abort
293 * processing rather than wait until the backup has finished and error out at
294 * that time. On Windows, we use a background thread which can communicate
295 * without the need for a signal handler.
296 */
297static void
302
303/*
304 * On Windows, our background thread dies along with the process. But on
305 * Unix, if we have started a subprocess, we want to kill it off so it
306 * doesn't remain running trying to stream data.
307 */
308static void
310{
311 if (bgchild > 0 && !bgchild_exited)
313}
314#endif
315
316/*
317 * Split argument into old_dir and new_dir and append to tablespace mapping
318 * list.
319 */
320static void
322{
324 char *dst;
325 char *dst_ptr;
326 const char *arg_ptr;
327
328 dst_ptr = dst = cell->old_dir;
329 for (arg_ptr = arg; *arg_ptr; arg_ptr++)
330 {
331 if (dst_ptr - dst >= MAXPGPATH)
332 pg_fatal("directory name too long");
333
334 if (*arg_ptr == '\\' && *(arg_ptr + 1) == '=')
335 ; /* skip backslash escaping = */
336 else if (*arg_ptr == '=' && (arg_ptr == arg || *(arg_ptr - 1) != '\\'))
337 {
338 if (*cell->new_dir)
339 pg_fatal("multiple \"=\" signs in tablespace mapping");
340 else
341 dst = dst_ptr = cell->new_dir;
342 }
343 else
344 *dst_ptr++ = *arg_ptr;
345 }
346
347 if (!*cell->old_dir || !*cell->new_dir)
348 pg_fatal("invalid tablespace mapping format \"%s\", must be \"OLDDIR=NEWDIR\"", arg);
349
350 /*
351 * All tablespaces are created with absolute directories, so specifying a
352 * non-absolute path here would just never match, possibly confusing
353 * users. Since we don't know whether the remote side is Windows or not,
354 * and it might be different than the local side, permit any path that
355 * could be absolute under either set of rules.
356 *
357 * (There is little practical risk of confusion here, because someone
358 * running entirely on Linux isn't likely to have a relative path that
359 * begins with a backslash or something that looks like a drive
360 * specification. If they do, and they also incorrectly believe that a
361 * relative path is acceptable here, we'll silently fail to warn them of
362 * their mistake, and the -T option will just not get applied, same as if
363 * they'd specified -T for a nonexistent tablespace.)
364 */
367 pg_fatal("old directory is not an absolute path in tablespace mapping: %s",
368 cell->old_dir);
369
370 if (!is_absolute_path(cell->new_dir))
371 pg_fatal("new directory is not an absolute path in tablespace mapping: %s",
372 cell->new_dir);
373
374 /*
375 * Comparisons done with these values should involve similarly
376 * canonicalized path values. This is particularly sensitive on Windows
377 * where path values may not necessarily use Unix slashes.
378 */
381
383 tablespace_dirs.tail->next = cell;
384 else
385 tablespace_dirs.head = cell;
386 tablespace_dirs.tail = cell;
387}
388
389
/*
 * Print the command-line help text to standard output.
 *
 * The text consists of a one-line description of the program, a usage
 * synopsis, and the available options grouped under three headings
 * (output control, general, connection), followed by the bug-report
 * address and the project home page.
 *
 * Every message is passed through _() before printing (presumably the
 * message-translation macro; it is defined outside this file), so each
 * string literal must remain a single complete message.  The program name
 * is taken from "progname", and the trailer uses PACKAGE_BUGREPORT,
 * PACKAGE_NAME and PACKAGE_URL.
 *
 * Takes no arguments and returns nothing; it only writes via printf().
 */
390static void
391usage(void)
392{
	/* Description and synopsis */
393 printf(_("%s takes a base backup of a running PostgreSQL server.\n\n"),
394 progname);
395 printf(_("Usage:\n"));
396 printf(_(" %s [OPTION]...\n"), progname);
	/* Options that determine where and in what form the backup is written */
397 printf(_("\nOptions controlling the output:\n"));
398 printf(_(" -D, --pgdata=DIRECTORY receive base backup into directory\n"));
399 printf(_(" -F, --format=p|t output format (plain (default), tar)\n"));
400 printf(_(" -i, --incremental=OLDMANIFEST\n"
401 " take incremental backup\n"));
402 printf(_(" -r, --max-rate=RATE maximum transfer rate to transfer data directory\n"
403 " (in kB/s, or use suffix \"k\" or \"M\")\n"));
404 printf(_(" -R, --write-recovery-conf\n"
405 " write configuration for replication\n"));
406 printf(_(" -t, --target=TARGET[:DETAIL]\n"
407 " backup target (if other than client)\n"));
408 printf(_(" -T, --tablespace-mapping=OLDDIR=NEWDIR\n"
409 " relocate tablespace in OLDDIR to NEWDIR\n"));
410 printf(_(" --waldir=WALDIR location for the write-ahead log directory\n"));
411 printf(_(" -X, --wal-method=none|fetch|stream\n"
412 " include required WAL files with specified method\n"));
413 printf(_(" -z, --gzip compress tar output\n"));
414 printf(_(" -Z, --compress=[{client|server}-]METHOD[:DETAIL]\n"
415 " compress on client or server as specified\n"));
416 printf(_(" -Z, --compress=none do not compress tar output\n"));
	/* General options */
417 printf(_("\nGeneral options:\n"));
418 printf(_(" -c, --checkpoint=fast|spread\n"
419 " set fast or spread (default) checkpointing\n"));
420 printf(_(" -C, --create-slot create replication slot\n"));
421 printf(_(" -l, --label=LABEL set backup label\n"));
422 printf(_(" -n, --no-clean do not clean up after errors\n"));
423 printf(_(" -N, --no-sync do not wait for changes to be written safely to disk\n"));
424 printf(_(" -P, --progress show progress information\n"));
425 printf(_(" -S, --slot=SLOTNAME replication slot to use\n"));
426 printf(_(" -v, --verbose output verbose messages\n"));
427 printf(_(" -V, --version output version information, then exit\n"));
428 printf(_(" --manifest-checksums=SHA{224,256,384,512}|CRC32C|NONE\n"
429 " use algorithm for manifest checksums\n"));
430 printf(_(" --manifest-force-encode\n"
431 " hex encode all file names in manifest\n"));
432 printf(_(" --no-estimate-size do not estimate backup size in server side\n"));
433 printf(_(" --no-manifest suppress generation of backup manifest\n"));
434 printf(_(" --no-slot prevent creation of temporary replication slot\n"));
435 printf(_(" --no-verify-checksums\n"
436 " do not verify checksums\n"));
437 printf(_(" --sync-method=METHOD\n"
438 " set method for syncing files to disk\n"));
439 printf(_(" -?, --help show this help, then exit\n"));
	/* Options describing how to reach the server */
440 printf(_("\nConnection options:\n"));
441 printf(_(" -d, --dbname=CONNSTR connection string\n"));
442 printf(_(" -h, --host=HOSTNAME database server host or socket directory\n"));
443 printf(_(" -p, --port=PORT database server port number\n"));
444 printf(_(" -s, --status-interval=INTERVAL\n"
445 " time between status packets sent to server (in seconds)\n"));
446 printf(_(" -U, --username=NAME connect as specified database user\n"));
447 printf(_(" -w, --no-password never prompt for password\n"));
448 printf(_(" -W, --password force password prompt (should happen automatically)\n"));
	/* Trailer: where to report bugs and where the project lives */
449 printf(_("\nReport bugs to <%s>.\n"), PACKAGE_BUGREPORT);
450 printf(_("%s home page: <%s>\n"), PACKAGE_NAME, PACKAGE_URL);
451}
452
453
454/*
455 * Called in the background process every time data is received.
456 * On Unix, we check to see if there is any data on our pipe
457 * (which would mean we have a stop position), and if it is, check if
458 * it is time to stop.
459 * On Windows, we are in a single process, so we can just check if it's
460 * time to stop.
461 */
462static bool
464 bool segment_finished)
465{
466 if (!has_xlogendptr)
467 {
468#ifndef WIN32
469 fd_set fds;
470 struct timeval tv = {0};
471 int r;
472
473 /*
474 * Don't have the end pointer yet - check our pipe to see if it has
475 * been sent yet.
476 */
477 FD_ZERO(&fds);
478 FD_SET(bgpipe[0], &fds);
479
480 r = select(bgpipe[0] + 1, &fds, NULL, NULL, &tv);
481 if (r == 1)
482 {
483 char xlogend[64] = {0};
484 uint32 hi,
485 lo;
486
487 r = read(bgpipe[0], xlogend, sizeof(xlogend) - 1);
488 if (r < 0)
489 pg_fatal("could not read from ready pipe: %m");
490
491 if (sscanf(xlogend, "%X/%08X", &hi, &lo) != 2)
492 pg_fatal("could not parse write-ahead log location \"%s\"",
493 xlogend);
494 xlogendptr = ((uint64) hi) << 32 | lo;
495 has_xlogendptr = 1;
496
497 /*
498 * Fall through to check if we've reached the point further
499 * already.
500 */
501 }
502 else
503 {
504 /*
505 * No data received on the pipe means we don't know the end
506 * position yet - so just say it's not time to stop yet.
507 */
508 return false;
509 }
510#else
511
512 /*
513 * On win32, has_xlogendptr is set by the main thread, so if it's not
514 * set here, we just go back and wait until it shows up.
515 */
516 return false;
517#endif
518 }
519
520 /*
521 * At this point we have an end pointer, so compare it to the current
522 * position to figure out if it's time to stop.
523 */
524 if (segendpos >= xlogendptr)
525 return true;
526
527 /*
528 * Have end pointer, but haven't reached it yet - so tell the caller to
529 * keep streaming.
530 */
531 return false;
532}
533
534typedef struct
535{
538 char xlog[MAXPGPATH]; /* directory or tarfile depending on mode */
544
545static int
547{
548 StreamCtl stream = {0};
549
550 in_log_streamer = true;
551
552 stream.startpos = param->startptr;
553 stream.timeline = param->timeline;
554 stream.sysidentifier = param->sysidentifier;
556#ifndef WIN32
557 stream.stop_socket = bgpipe[0];
558#else
560#endif
562 stream.synchronous = false;
563 /* fsync happens at the end of pg_basebackup for all data */
564 stream.do_sync = false;
565 stream.mark_done = true;
566 stream.partial_suffix = NULL;
568 if (format == 'p')
571 stream.do_sync);
572 else
573 stream.walmethod = CreateWalTarMethod(param->xlog,
575 param->wal_compress_level,
576 stream.do_sync);
577
578 if (!ReceiveXlogStream(param->bgconn, &stream))
579 {
580 /*
581 * Any errors will already have been reported in the function process,
582 * but we need to tell the parent that we didn't shutdown in a nice
583 * way.
584 */
585#ifdef WIN32
586 /*
587 * In order to signal the main thread of an ungraceful exit we set the
588 * same flag that we use on Unix to signal SIGCHLD.
589 */
590 bgchild_exited = true;
591#endif
592 return 1;
593 }
594
595 if (!stream.walmethod->ops->finish(stream.walmethod))
596 {
597 pg_log_error("could not finish writing WAL files: %m");
598#ifdef WIN32
599 bgchild_exited = true;
600#endif
601 return 1;
602 }
603
604 PQfinish(param->bgconn);
605
606 stream.walmethod->ops->free(stream.walmethod);
607
608 return 0;
609}
610
611/*
612 * Initiate background process for receiving xlog during the backup.
613 * The background stream will use its own database connection so we can
614 * stream the logfile in parallel with the backups.
615 */
616static void
617StartLogStreamer(char *startpos, uint32 timeline, char *sysidentifier,
618 pg_compress_algorithm wal_compress_algorithm,
619 int wal_compress_level)
620{
621 logstreamer_param *param;
622 uint32 hi,
623 lo;
624 char statusdir[MAXPGPATH];
625
627 param->timeline = timeline;
628 param->sysidentifier = sysidentifier;
629 param->wal_compress_algorithm = wal_compress_algorithm;
630 param->wal_compress_level = wal_compress_level;
631
632 /* Convert the starting position */
633 if (sscanf(startpos, "%X/%08X", &hi, &lo) != 2)
634 pg_fatal("could not parse write-ahead log location \"%s\"",
635 startpos);
636 param->startptr = ((uint64) hi) << 32 | lo;
637 /* Round off to even segment position */
638 param->startptr -= XLogSegmentOffset(param->startptr, WalSegSz);
639
640#ifndef WIN32
641 /* Create our background pipe */
642 if (pipe(bgpipe) < 0)
643 pg_fatal("could not create pipe for background process: %m");
644#endif
645
646 /* Get a second connection */
647 param->bgconn = GetConnection();
648 if (!param->bgconn)
649 /* Error message already written in GetConnection() */
650 exit(1);
651
652 /* In post-10 cluster, pg_xlog has been renamed to pg_wal */
653 snprintf(param->xlog, sizeof(param->xlog), "%s/%s",
654 basedir,
656 "pg_xlog" : "pg_wal");
657
658 /* Temporary replication slots are only supported in 10 and newer */
660 temp_replication_slot = false;
661
662 /*
663 * Create replication slot if requested
664 */
666 replication_slot = psprintf("pg_basebackup_%u",
667 (unsigned int) PQbackendPID(param->bgconn));
669 {
671 temp_replication_slot, true, true, false,
672 false, false))
673 exit(1);
674
675 if (verbose)
676 {
678 pg_log_info("created temporary replication slot \"%s\"",
680 else
681 pg_log_info("created replication slot \"%s\"",
683 }
684 }
685
686 if (format == 'p')
687 {
688 /*
689 * Create pg_wal/archive_status or pg_xlog/archive_status (and thus
690 * pg_wal or pg_xlog) depending on the target server so we can write
691 * to basedir/pg_wal or basedir/pg_xlog as the directory entry in the
692 * tar file may arrive later.
693 */
694 snprintf(statusdir, sizeof(statusdir), "%s/%s/archive_status",
695 basedir,
697 "pg_xlog" : "pg_wal");
698
700 pg_fatal("could not create directory \"%s\": %m", statusdir);
701
702 /*
703 * For newer server versions, likewise create pg_wal/summaries
704 */
706 {
707 char summarydir[MAXPGPATH];
708
709 snprintf(summarydir, sizeof(summarydir), "%s/%s/summaries",
710 basedir, "pg_wal");
711
713 errno != EEXIST)
714 pg_fatal("could not create directory \"%s\": %m", summarydir);
715 }
716 }
717
718 /*
719 * Start a child process and tell it to start streaming. On Unix, this is
720 * a fork(). On Windows, we create a thread.
721 */
722#ifndef WIN32
723 bgchild = fork();
724 if (bgchild == 0)
725 {
726 /* in child process */
727 exit(LogStreamerMain(param));
728 }
729 else if (bgchild < 0)
730 pg_fatal("could not create background process: %m");
731
732 /*
733 * Else we are in the parent process and all is well.
734 */
736#else /* WIN32 */
737 bgchild = _beginthreadex(NULL, 0, (void *) LogStreamerMain, param, 0, NULL);
738 if (bgchild == 0)
739 pg_fatal("could not create background thread: %m");
740#endif
741}
742
743/*
744 * Verify that the given directory exists and is empty. If it does not
745 * exist, it is created. If it exists but is not empty, an error will
746 * be given and the process ended.
747 */
748static void
749verify_dir_is_empty_or_create(char *dirname, bool *created, bool *found)
750{
751 switch (pg_check_dir(dirname))
752 {
753 case 0:
754
755 /*
756 * Does not exist, so create
757 */
758 if (pg_mkdir_p(dirname, pg_dir_create_mode) == -1)
759 pg_fatal("could not create directory \"%s\": %m", dirname);
760 if (created)
761 *created = true;
762 return;
763 case 1:
764
765 /*
766 * Exists, empty
767 */
768 if (found)
769 *found = true;
770 return;
771 case 2:
772 case 3:
773 case 4:
774
775 /*
776 * Exists, not empty
777 */
778 pg_fatal("directory \"%s\" exists but is not empty", dirname);
779 case -1:
780
781 /*
782 * Access problem
783 */
784 pg_fatal("could not access directory \"%s\": %m", dirname);
785 }
786}
787
788/*
789 * Callback to update our notion of the current filename.
790 *
791 * No other code should modify progress_filename!
792 */
793static void
795{
796 /* We needn't maintain this variable if not doing verbose reports. */
797 if (showprogress && verbose)
798 {
800 if (filename)
802 else
804 }
805}
806
807/*
808 * Print a progress report based on the global variables. If verbose output
809 * is enabled, also print the current file name.
810 *
811 * Progress report is written at maximum once per second, unless the force
812 * parameter is set to true.
813 *
814 * If finished is set to true, this is the last progress report. The cursor
815 * is moved to the next line.
816 */
817static void
818progress_report(int tablespacenum, bool force, bool finished)
819{
820 int percent;
821 char totaldone_str[32];
822 char totalsize_str[32];
824
825 if (!showprogress)
826 return;
827
828 now = time(NULL);
829 if (now == last_progress_report && !force && !finished)
830 return; /* Max once per second */
831
833 percent = totalsize_kb ? (int) ((totaldone / 1024) * 100 / totalsize_kb) : 0;
834
835 /*
836 * Avoid overflowing past 100% or the full size. This may make the total
837 * size number change as we approach the end of the backup (the estimate
838 * will always be wrong if WAL is included), but that's better than having
839 * the done column be bigger than the total.
840 */
841 if (percent > 100)
842 percent = 100;
843 if (totaldone / 1024 > totalsize_kb)
844 totalsize_kb = totaldone / 1024;
845
847 totaldone / 1024);
849
850#define VERBOSE_FILENAME_LENGTH 35
851 if (verbose)
852 {
854
855 /*
856 * No filename given, so clear the status line (used for last
857 * call)
858 */
860 ngettext("%*s/%s kB (100%%), %d/%d tablespace %*s",
861 "%*s/%s kB (100%%), %d/%d tablespaces %*s",
863 (int) strlen(totalsize_str),
865 tablespacenum, tablespacecount,
867 else
868 {
870
872 ngettext("%*s/%s kB (%d%%), %d/%d tablespace (%s%-*.*s)",
873 "%*s/%s kB (%d%%), %d/%d tablespaces (%s%-*.*s)",
875 (int) strlen(totalsize_str),
877 tablespacenum, tablespacecount,
878 /* Prefix with "..." if we do leading truncation */
879 truncate ? "..." : "",
882 /* Truncate filename at beginning if it's too long */
884 }
885 }
886 else
888 ngettext("%*s/%s kB (%d%%), %d/%d tablespace",
889 "%*s/%s kB (%d%%), %d/%d tablespaces",
891 (int) strlen(totalsize_str),
893 tablespacenum, tablespacecount);
894
895 /*
896 * Stay on the same line if reporting to a terminal and we're not done
897 * yet.
898 */
899 fputc((!finished && isatty(fileno(stderr))) ? '\r' : '\n', stderr);
900}
901
902static int32
904{
905 double result;
906 char *after_num;
907 char *suffix = NULL;
908
909 errno = 0;
910 result = strtod(src, &after_num);
911 if (src == after_num)
912 pg_fatal("transfer rate \"%s\" is not a valid value", src);
913 if (errno != 0)
914 pg_fatal("invalid transfer rate \"%s\": %m", src);
915
916 if (result <= 0)
917 {
918 /*
919 * Reject obviously wrong values here.
920 */
921 pg_fatal("transfer rate must be greater than zero");
922 }
923
924 /*
925 * Evaluate suffix, after skipping over possible whitespace. Lack of
926 * suffix means kilobytes.
927 */
928 while (*after_num != '\0' && isspace((unsigned char) *after_num))
929 after_num++;
930
931 if (*after_num != '\0')
932 {
933 suffix = after_num;
934 if (*after_num == 'k')
935 {
936 /* kilobyte is the expected unit. */
937 after_num++;
938 }
939 else if (*after_num == 'M')
940 {
941 after_num++;
942 result *= 1024.0;
943 }
944 }
945
946 /* The rest can only consist of white space. */
947 while (*after_num != '\0' && isspace((unsigned char) *after_num))
948 after_num++;
949
950 if (*after_num != '\0')
951 pg_fatal("invalid --max-rate unit: \"%s\"", suffix);
952
953 /* Valid integer? */
954 if ((uint64) result != (uint64) ((uint32) result))
955 pg_fatal("transfer rate \"%s\" exceeds integer range", src);
956
957 /*
958 * The range is checked on the server side too, but avoid the server
959 * connection if a nonsensical value was passed.
960 */
962 pg_fatal("transfer rate \"%s\" is out of range", src);
963
964 return (int32) result;
965}
966
967/*
968 * Basic parsing of a value specified for -Z/--compress.
969 *
970 * We're not concerned here with understanding exactly what behavior the
971 * user wants, but we do need to know whether the user is requesting client
972 * or server side compression or leaving it unspecified, and we need to
973 * separate the name of the compression algorithm from the detail string.
974 *
975 * For instance, if the user writes --compress client-lz4:6, we want to
976 * separate that into (a) client-side compression, (b) algorithm "lz4",
977 * and (c) detail "6". Note, however, that the client/server prefix is
978 * optional, and so is the detail. The algorithm name is required, unless
979 * the whole string is an integer, in which case we assume "gzip" as the
980 * algorithm and use the integer as the detail.
981 *
982 * We're not concerned with validation at this stage, so if the user writes
983 * --compress client-turkey:sandwich, the requested algorithm is "turkey"
984 * and the detail string is "sandwich". We'll sort out whether that's legal
985 * at a later stage.
986 */
987static void
988backup_parse_compress_options(char *option, char **algorithm, char **detail,
990{
991 /*
992 * Strip off any "client-" or "server-" prefix, calculating the location.
993 */
994 if (strncmp(option, "server-", 7) == 0)
995 {
997 option += 7;
998 }
999 else if (strncmp(option, "client-", 7) == 0)
1000 {
1002 option += 7;
1003 }
1004 else
1006
1007 /* fallback to the common parsing for the algorithm and detail */
1008 parse_compress_options(option, algorithm, detail);
1009}
1010
1011/*
1012 * Read a stream of COPY data and invoke the provided callback for each
1013 * chunk.
1014 */
1015static void
1017 void *callback_data)
1018{
1019 PGresult *res;
1020
1021 /* Get the COPY data stream. */
1022 res = PQgetResult(conn);
1023 if (PQresultStatus(res) != PGRES_COPY_OUT)
1024 pg_fatal("could not get COPY data stream: %s",
1026 PQclear(res);
1027
1028 /* Loop over chunks until done. */
1029 while (1)
1030 {
1031 int r;
1032 char *copybuf;
1033
1034 r = PQgetCopyData(conn, &copybuf, 0);
1035 if (r == -1)
1036 {
1037 /* End of chunk. */
1038 break;
1039 }
1040 else if (r == -2)
1041 pg_fatal("could not read COPY data: %s",
1043
1044 if (bgchild_exited)
1045 pg_fatal("background process terminated unexpectedly");
1046
1047 (*callback) (r, copybuf, callback_data);
1048
1050 }
1051}
1052
1053/*
1054 * Figure out what to do with an archive received from the server based on
1055 * the options selected by the user. We may just write the results directly
1056 * to a file, or we might compress first, or we might extract the tar file
1057 * and write each member separately. This function doesn't do any of that
1058 * directly, but it works out what kind of astreamer we need to create so
1059 * that the right stuff happens when, down the road, we actually receive
1060 * the data.
1061 */
1062static astreamer *
1063CreateBackupStreamer(char *archive_name, char *spclocation,
1065 bool is_recovery_guc_supported,
1067 pg_compress_specification *compress)
1068{
1069 astreamer *streamer = NULL;
1070 astreamer *manifest_inject_streamer = NULL;
1071 bool inject_manifest;
1072 bool is_tar,
1075 bool must_parse_archive;
1076
1077 /*
1078 * Normally, we emit the backup manifest as a separate file, but when
1079 * we're writing a tarfile to stdout, we don't have that option, so
1080 * include it in the one tarfile we've got.
1081 */
1082 inject_manifest = (format == 't' && strcmp(basedir, "-") == 0 && manifest);
1083
1084 /* Check whether it is a tar archive and its compression type */
1085 is_tar = parse_tar_compress_algorithm(archive_name,
1087
1088 /* Is this any kind of compressed tar? */
1091
1092 /*
1093 * Injecting the manifest into a compressed tar file would be possible if
1094 * we decompressed it, parsed the tarfile, generated a new tarfile, and
1095 * recompressed it, but compressing and decompressing multiple times just
1096 * to inject the manifest seems inefficient enough that it's probably not
1097 * what the user wants. So, instead, reject the request and tell the user
1098 * to specify something more reasonable.
1099 */
1101 {
1102 pg_log_error("cannot inject manifest into a compressed tar file");
1103 pg_log_error_hint("Use client-side compression, send the output to a directory rather than standard output, or use %s.",
1104 "--no-manifest");
1105 exit(1);
1106 }
1107
1108 /*
1109 * We have to parse the archive if (1) we're supposed to extract it, or if
1110 * (2) we need to inject backup_manifest or recovery configuration into
1111 * it. However, we only know how to parse tar archives.
1112 */
1115
1116 /* At present, we only know how to parse tar archives. */
1117 if (must_parse_archive && !is_tar)
1118 {
1119 pg_log_error("cannot parse archive \"%s\"", archive_name);
1120 pg_log_error_detail("Only tar archives can be parsed.");
1121 if (format == 'p')
1122 pg_log_error_detail("Plain format requires pg_basebackup to parse the archive.");
1123 if (inject_manifest)
1124 pg_log_error_detail("Using - as the output directory requires pg_basebackup to parse the archive.");
1126 pg_log_error_detail("The -R option requires pg_basebackup to parse the archive.");
1127 exit(1);
1128 }
1129
1130 if (format == 'p')
1131 {
1132 const char *directory;
1133
1134 /*
1135 * In plain format, we must extract the archive. The data for the main
1136 * tablespace will be written to the base directory, and the data for
1137 * other tablespaces will be written to the directory where they're
1138 * located on the server, after applying any user-specified tablespace
1139 * mappings.
1140 *
1141 * In the case of an in-place tablespace, spclocation will be a
1142 * relative path. We just convert it to an absolute path by prepending
1143 * basedir.
1144 */
1145 if (spclocation == NULL)
1147 else if (!is_absolute_path(spclocation))
1149 else
1154 }
1155 else
1156 {
1159
1160 /*
1161 * In tar format, we just write the archive without extracting it.
1162 * Normally, we write it to the archive name provided by the caller,
1163 * but when the base directory is "-" that means we need to write to
1164 * standard output.
1165 */
1166 if (strcmp(basedir, "-") == 0)
1167 {
1169 archive_file = stdout;
1170 }
1171 else
1172 {
1174 "%s/%s", basedir, archive_name);
1176 }
1177
1178 if (compress->algorithm == PG_COMPRESSION_NONE)
1180 archive_file);
1181 else if (compress->algorithm == PG_COMPRESSION_GZIP)
1182 {
1183 strlcat(archive_filename, ".gz", sizeof(archive_filename));
1185 archive_file, compress);
1186 }
1187 else if (compress->algorithm == PG_COMPRESSION_LZ4)
1188 {
1189 strlcat(archive_filename, ".lz4", sizeof(archive_filename));
1191 archive_file);
1192 streamer = astreamer_lz4_compressor_new(streamer, compress);
1193 }
1194 else if (compress->algorithm == PG_COMPRESSION_ZSTD)
1195 {
1196 strlcat(archive_filename, ".zst", sizeof(archive_filename));
1198 archive_file);
1199 streamer = astreamer_zstd_compressor_new(streamer, compress);
1200 }
1201 else
1202 {
1203 Assert(false); /* not reachable */
1204 }
1205
1206 /*
1207 * If we need to parse the archive for whatever reason, then we'll
1208 * also need to re-archive, because, if the output format is tar, the
1209 * only point of parsing the archive is to be able to inject stuff
1210 * into it.
1211 */
1213 streamer = astreamer_tar_archiver_new(streamer);
1215 }
1216
1217 /*
1218 * If we're supposed to inject the backup manifest into the results, it
1219 * should be done here, so that the file content can be injected directly,
1220 * without worrying about the details of the tar format.
1221 */
1222 if (inject_manifest)
1223 manifest_inject_streamer = streamer;
1224
1225 /*
1226 * If this is the main tablespace and we're supposed to write recovery
1227 * information, arrange to do that.
1228 */
1230 {
1232 streamer = astreamer_recovery_injector_new(streamer,
1233 is_recovery_guc_supported,
1235 }
1236
1237 /*
1238 * If we're doing anything that involves understanding the contents of the
1239 * archive, we'll need to parse it. If not, we can skip parsing it, but
1240 * old versions of the server send improperly terminated tarfiles, so if
1241 * we're talking to such a server we'll need to add the terminator here.
1242 */
1244 streamer = astreamer_tar_parser_new(streamer);
1246 streamer = astreamer_tar_terminator_new(streamer);
1247
1248 /*
1249 * If the user has requested a server compressed archive along with
1250 * archive extraction at client then we need to decompress it.
1251 */
1252 if (format == 'p' && is_compressed_tar)
1253 {
1255 streamer = astreamer_gzip_decompressor_new(streamer);
1257 streamer = astreamer_lz4_decompressor_new(streamer);
1259 streamer = astreamer_zstd_decompressor_new(streamer);
1260 }
1261
1262 /* Return the results. */
1263 *manifest_inject_streamer_p = manifest_inject_streamer;
1264 return streamer;
1265}
1266
1267/*
1268 * Receive all of the archives the server wants to send - and the backup
1269 * manifest if present - as a single COPY stream.
1270 */
1271static void
1273{
1275
1276 /* Set up initial state. */
1277 memset(&state, 0, sizeof(state));
1278 state.tablespacenum = -1;
1279 state.compress = compress;
1280
1281 /* All the real work happens in ReceiveArchiveStreamChunk. */
1283
1284 /* If we wrote the backup manifest to a file, close the file. */
1285 if (state.manifest_file !=NULL)
1286 {
1287 fclose(state.manifest_file);
1288 state.manifest_file = NULL;
1289 }
1290
1291 /*
1292 * If we buffered the backup manifest in order to inject it into the
1293 * output tarfile, do that now.
1294 */
1295 if (state.manifest_inject_streamer != NULL &&
1296 state.manifest_buffer != NULL)
1297 {
1298 astreamer_inject_file(state.manifest_inject_streamer,
1299 "backup_manifest",
1300 state.manifest_buffer->data,
1301 state.manifest_buffer->len);
1302 destroyPQExpBuffer(state.manifest_buffer);
1303 state.manifest_buffer = NULL;
1304 }
1305
1306 /* If there's still an archive in progress, end processing. */
1307 if (state.streamer != NULL)
1308 {
1309 astreamer_finalize(state.streamer);
1310 astreamer_free(state.streamer);
1311 state.streamer = NULL;
1312 }
1313}
1314
1315/*
1316 * Receive one chunk of data sent by the server as part of a single COPY
1317 * stream that includes all archives and the manifest.
1318 */
1319static void
1320ReceiveArchiveStreamChunk(size_t r, char *copybuf, void *callback_data)
1321{
1322 ArchiveStreamState *state = callback_data;
1323 size_t cursor = 0;
1324
1325 /* Each CopyData message begins with a type byte. */
1326 switch (GetCopyDataByte(r, copybuf, &cursor))
1327 {
1329 {
1330 /* New archive. */
1331 char *archive_name;
1332 char *spclocation;
1333
1334 /*
1335 * We force a progress report at the end of each tablespace. A
1336 * new tablespace starts when the previous one ends, except in
1337 * the case of the very first one.
1338 */
1339 if (++state->tablespacenum > 0)
1340 progress_report(state->tablespacenum, true, false);
1341
1342 /* Sanity check. */
1343 if (state->manifest_buffer != NULL ||
1344 state->manifest_file !=NULL)
1345 pg_fatal("archives must precede manifest");
1346
1347 /* Parse the rest of the CopyData message. */
1348 archive_name = GetCopyDataString(r, copybuf, &cursor);
1351
1352 /*
1353 * Basic sanity checks on the archive name: it shouldn't be
1354 * empty, it shouldn't start with a dot, and it shouldn't
1355 * contain a path separator.
1356 */
1357 if (archive_name[0] == '\0' || archive_name[0] == '.' ||
1358 strchr(archive_name, '/') != NULL ||
1359 strchr(archive_name, '\\') != NULL)
1360 pg_fatal("invalid archive name: \"%s\"",
1361 archive_name);
1362
1363 /*
1364 * An empty spclocation is treated as NULL. We expect this
1365 * case to occur for the data directory itself, but not for
1366 * any archives that correspond to tablespaces.
1367 */
1368 if (spclocation[0] == '\0')
1369 spclocation = NULL;
1370
1371 /* End processing of any prior archive. */
1372 if (state->streamer != NULL)
1373 {
1374 astreamer_finalize(state->streamer);
1375 astreamer_free(state->streamer);
1376 state->streamer = NULL;
1377 }
1378
1379 /*
1380 * Create an appropriate backup streamer, unless a backup
1381 * target was specified. In that case, it's up to the server
1382 * to put the backup wherever it needs to go.
1383 */
1384 if (backup_target == NULL)
1385 {
1386 /*
1387 * We know that recovery GUCs are supported, because this
1388 * protocol can only be used on v15+.
1389 */
1390 state->streamer =
1391 CreateBackupStreamer(archive_name,
1393 &state->manifest_inject_streamer,
1394 true, false,
1395 state->compress);
1396 }
1397 break;
1398 }
1399
1400 case PqMsg_CopyData:
1401 {
1402 /* Archive or manifest data. */
1403 if (state->manifest_buffer != NULL)
1404 {
1405 /* Manifest data, buffer in memory. */
1406 appendPQExpBuffer(state->manifest_buffer, copybuf + 1,
1407 r - 1);
1408 }
1409 else if (state->manifest_file !=NULL)
1410 {
1411 /* Manifest data, write to disk. */
1412 if (fwrite(copybuf + 1, r - 1, 1,
1413 state->manifest_file) != 1)
1414 {
1415 /*
1416 * If fwrite() didn't set errno, assume that the
1417 * problem is that we're out of disk space.
1418 */
1419 if (errno == 0)
1420 errno = ENOSPC;
1421 pg_fatal("could not write to file \"%s\": %m",
1422 state->manifest_filename);
1423 }
1424 }
1425 else if (state->streamer != NULL)
1426 {
1427 /* Archive data. */
1428 astreamer_content(state->streamer, NULL, copybuf + 1,
1429 r - 1, ASTREAMER_UNKNOWN);
1430 }
1431 else
1432 pg_fatal("unexpected payload data");
1433 break;
1434 }
1435
1437 {
1438 /*
1439 * Progress report.
1440 *
1441 * The remainder of the message is expected to be an 8-byte
1442 * count of bytes completed.
1443 */
1446
1447 /*
1448 * The server shouldn't send progress report messages too
1449 * often, so we force an update each time we receive one.
1450 */
1451 progress_report(state->tablespacenum, true, false);
1452 break;
1453 }
1454
1456 {
1457 /*
1458 * Manifest data will be sent next. This message is not
1459 * expected to have any further payload data.
1460 */
1462
1463 /*
1464 * If a backup target was specified, figuring out where to put
1465 * the manifest is the server's problem. Otherwise, we need to
1466 * deal with it.
1467 */
1468 if (backup_target == NULL)
1469 {
1470 /*
1471 * If we're supposed inject the manifest into the archive,
1472 * we prepare to buffer it in memory; otherwise, we
1473 * prepare to write it to a temporary file.
1474 */
1475 if (state->manifest_inject_streamer != NULL)
1476 state->manifest_buffer = createPQExpBuffer();
1477 else
1478 {
1479 snprintf(state->manifest_filename,
1480 sizeof(state->manifest_filename),
1481 "%s/backup_manifest.tmp", basedir);
1482 state->manifest_file =
1483 fopen(state->manifest_filename, "wb");
1484 if (state->manifest_file == NULL)
1485 pg_fatal("could not create file \"%s\": %m",
1486 state->manifest_filename);
1487 }
1488 }
1489 break;
1490 }
1491
1492 default:
1494 break;
1495 }
1496}
1497
1498/*
1499 * Get a single byte from a CopyData message.
1500 *
1501 * Bail out if none remain.
1502 */
1503static char
1504GetCopyDataByte(size_t r, char *copybuf, size_t *cursor)
1505{
1506 if (*cursor >= r)
1508
1509 return copybuf[(*cursor)++];
1510}
1511
1512/*
1513 * Get a NUL-terminated string from a CopyData message.
1514 *
1515 * Bail out if the terminating NUL cannot be found.
1516 */
1517static char *
1518GetCopyDataString(size_t r, char *copybuf, size_t *cursor)
1519{
1520 size_t startpos = *cursor;
1521 size_t endpos = startpos;
1522
1523 while (1)
1524 {
1525 if (endpos >= r)
1527 if (copybuf[endpos] == '\0')
1528 break;
1529 ++endpos;
1530 }
1531
1532 *cursor = endpos + 1;
1533 return &copybuf[startpos];
1534}
1535
1536/*
1537 * Get an unsigned 64-bit integer from a CopyData message.
1538 *
1539 * Bail out if there are not at least 8 bytes remaining.
1540 */
1541static uint64
1542GetCopyDataUInt64(size_t r, char *copybuf, size_t *cursor)
1543{
1544 uint64 result;
1545
1546 if (*cursor + sizeof(uint64) > r)
1548 memcpy(&result, &copybuf[*cursor], sizeof(uint64));
1549 *cursor += sizeof(uint64);
1550 return pg_ntoh64(result);
1551}
1552
1553/*
1554 * Bail out if we didn't parse the whole message.
1555 */
1556static void
1557GetCopyDataEnd(size_t r, char *copybuf, size_t cursor)
1558{
1559 if (r != cursor)
1561}
1562
1563/*
1564 * Report failure to parse a CopyData message from the server. Then exit.
1565 *
1566 * As a debugging aid, we try to give some hint about what kind of message
1567 * provoked the failure. Perhaps this is not detailed enough, but it's not
1568 * clear that it's worth expending any more code on what should be a
1569 * can't-happen case.
1570 */
1571static void
1573{
1574 if (r == 0)
1575 pg_fatal("empty COPY message");
1576 else
1577 pg_fatal("malformed COPY message of type %d, length %zu",
1578 copybuf[0], r);
1579}
1580
1581/*
1582 * Receive raw tar data from the server, and stream it to the appropriate
1583 * location. If we're writing a single tarfile to standard output, also
1584 * receive the backup manifest and inject it into that tarfile.
1585 */
1586static void
1587ReceiveTarFile(PGconn *conn, char *archive_name, char *spclocation,
1588 bool tablespacenum, pg_compress_specification *compress)
1589{
1591 astreamer *manifest_inject_streamer;
1592 bool is_recovery_guc_supported;
1594
1595 /* Pass all COPY data through to the backup streamer. */
1596 memset(&state, 0, sizeof(state));
1597 is_recovery_guc_supported =
1601 state.streamer = CreateBackupStreamer(archive_name, spclocation,
1602 &manifest_inject_streamer,
1603 is_recovery_guc_supported,
1605 compress);
1606 state.tablespacenum = tablespacenum;
1609
1610 /*
1611 * The decision as to whether we need to inject the backup manifest into
1612 * the output at this stage is made by CreateBackupStreamer; if that is
1613 * needed, manifest_inject_streamer will be non-NULL; otherwise, it will
1614 * be NULL.
1615 */
1616 if (manifest_inject_streamer != NULL)
1617 {
1619
1620 /* Slurp the entire backup manifest into a buffer. */
1624 pg_fatal("out of memory");
1625
1626 /* Inject it into the output tarfile. */
1627 astreamer_inject_file(manifest_inject_streamer, "backup_manifest",
1628 buf.data, buf.len);
1629
1630 /* Free memory. */
1632 }
1633
1634 /* Cleanup. */
1635 astreamer_finalize(state.streamer);
1636 astreamer_free(state.streamer);
1637
1638 progress_report(tablespacenum, true, false);
1639
1640 /*
1641 * Do not sync the resulting tar file yet, all files are synced once at
1642 * the end.
1643 */
1644}
1645
1646/*
1647 * Receive one chunk of tar-format data from the server.
1648 */
1649static void
1650ReceiveTarCopyChunk(size_t r, char *copybuf, void *callback_data)
1651{
1652 WriteTarState *state = callback_data;
1653
1655
1656 totaldone += r;
1657 progress_report(state->tablespacenum, false, false);
1658}
1659
1660
1661/*
1662 * Retrieve tablespace path, either relocated or original depending on whether
1663 * -T was passed or not.
1664 */
1665static const char *
1667{
1668 TablespaceListCell *cell;
1669 char canon_dir[MAXPGPATH];
1670
1671 /* Canonicalize path for comparison consistency */
1672 strlcpy(canon_dir, dir, sizeof(canon_dir));
1674
1675 for (cell = tablespace_dirs.head; cell; cell = cell->next)
1676 if (strcmp(canon_dir, cell->old_dir) == 0)
1677 return cell->new_dir;
1678
1679 return dir;
1680}
1681
1682/*
1683 * Receive the backup manifest file and write it out to a file.
1684 */
1685static void
1687{
1689
1690 snprintf(state.filename, sizeof(state.filename),
1691 "%s/backup_manifest.tmp", basedir);
1692 state.file = fopen(state.filename, "wb");
1693 if (state.file == NULL)
1694 pg_fatal("could not create file \"%s\": %m", state.filename);
1695
1697
1698 fclose(state.file);
1699}
1700
1701/*
1702 * Receive one chunk of the backup manifest file and write it out to a file.
1703 */
1704static void
1705ReceiveBackupManifestChunk(size_t r, char *copybuf, void *callback_data)
1706{
1707 WriteManifestState *state = callback_data;
1708
1709 errno = 0;
1710 if (fwrite(copybuf, r, 1, state->file) != 1)
1711 {
1712 /* if write didn't set errno, assume problem is no disk space */
1713 if (errno == 0)
1714 errno = ENOSPC;
1715 pg_fatal("could not write to file \"%s\": %m", state->filename);
1716 }
1717}
1718
1719/*
1720 * Receive the backup manifest file and write it out to a file.
1721 */
1722static void
1727
1728/*
1729 * Receive one chunk of the backup manifest file and write it out to a file.
1730 */
1731static void
1733 void *callback_data)
1734{
1735 PQExpBuffer buf = callback_data;
1736
1738}
1739
/*
 * Run one complete base backup over the connection in conn.
 *
 * As far as this listing shows, the steps are: validate the server version;
 * for an incremental backup, upload the prior manifest with UPLOAD_MANIFEST;
 * assemble and send the BASE_BACKUP command; read the starting WAL location
 * and the tablespace header; optionally start the background WAL receiver;
 * receive the archives; read the ending WAL location; wait for the
 * background process or thread; sync the results to disk; and finally rename
 * backup_manifest.tmp to backup_manifest.
 *
 * NOTE(review): the embedded line numbers in this listing skip in places
 * (for example 1740 -> 1745), so the function's name line, its parameter
 * list and a number of statements are not visible here.  Consult the
 * original file before changing any code below.
 */
1740 static void
1745 {
1746 PGresult *res;
1747 char *sysidentifier;
1749 TimeLineID starttli;
1750 char *basebkp;
1751 int i;
1752 char xlogstart[64];
1753 char xlogend[64] = {0};
1754 int minServerMajor,
1756 int serverVersion,
1759 bool use_new_option_syntax = false;
1761
1762 Assert(conn != NULL);
1764
1765 /*
1766 * Check server version. BASE_BACKUP command was introduced in 9.1, so we
1767 * can't work with servers older than 9.1.
1768 */
1769 minServerMajor = 901;
1772 serverMajor = serverVersion / 100;
1774 {
1775 const char *serverver = PQparameterStatus(conn, "server_version");
1776
1777 pg_fatal("incompatible server version %s",
1778 serverver ? serverver : "'unknown'");
1779 }
/* This flag selects the parenthesized "BASE_BACKUP (%s)" form used below. */
1780 if (serverMajor >= 1500)
1781 use_new_option_syntax = true;
1782
1783 /*
1784 * If WAL streaming was requested, also check that the server is new
1785 * enough for that.
1786 */
1788 {
1789 /*
1790 * Error message already written in CheckServerVersionForStreaming(),
1791 * but add a hint about using -X none.
1792 */
1793 pg_log_error_hint("Use -X none or -X fetch to disable log streaming.");
1794 exit(1);
1795 }
1796
1797 /*
1798 * Build contents of configuration file if requested.
1799 *
1800 * Note that we don't use the dbname from key-value pair in conn as that
1801 * would have been filled by the default dbname (dbname=replication) in
1802 * case the user didn't specify the one. The dbname written in the config
1803 * file as part of primary_conninfo would be used by slotsync worker which
1804 * doesn't use a replication connection so the default won't work for it.
1805 */
1810
1811 /*
1812 * Run IDENTIFY_SYSTEM so we can get the timeline
1813 */
1814 if (!RunIdentifySystem(conn, &sysidentifier, &latesttli, NULL, NULL))
1815 exit(1);
1816
1817 /*
1818 * If the user wants an incremental backup, we must upload the manifest
1819 * for the previous backup upon which it is to be based.
1820 */
1822 {
1823 int fd;
1824 char mbuf[65536];
1825 int nbytes;
1826
1827 /* Reject if server is too old. */
1829 pg_fatal("server does not support incremental backup");
1830
1831 /* Open the file. */
1833 if (fd < 0)
1834 pg_fatal("could not open file \"%s\": %m", incremental_manifest);
1835
1836 /* Tell the server what we want to do. */
1837 if (PQsendQuery(conn, "UPLOAD_MANIFEST") == 0)
1838 pg_fatal("could not send replication command \"%s\": %s",
1839 "UPLOAD_MANIFEST", PQerrorMessage(conn));
1840 res = PQgetResult(conn);
1841 if (PQresultStatus(res) != PGRES_COPY_IN)
1842 {
1844 pg_fatal("could not upload manifest: %s",
1846 else
1847 pg_fatal("could not upload manifest: unexpected status %s",
1849 }
1850
1851 /* Loop, reading from the file and sending the data to the server. */
1852 while ((nbytes = read(fd, mbuf, sizeof mbuf)) > 0)
1853 {
1854 if (PQputCopyData(conn, mbuf, nbytes) < 0)
1855 pg_fatal("could not send COPY data: %s",
1857 }
1858
1859 /* Bail out if we exited the loop due to an error. */
1860 if (nbytes < 0)
1861 pg_fatal("could not read file \"%s\": %m", incremental_manifest);
/*
 * NOTE(review): no close(fd) and no PQclear() of the results fetched in
 * this block are visible in this listing - confirm against the original
 * whether they are released.
 */
1862
1863 /* End the COPY operation. */
1864 if (PQputCopyEnd(conn, NULL) < 0)
1865 pg_fatal("could not send end-of-COPY: %s",
1867
1868 /* See whether the server is happy with what we sent. */
1869 res = PQgetResult(conn);
1871 pg_fatal("could not upload manifest: %s",
1873 else if (PQresultStatus(res) != PGRES_COMMAND_OK)
1874 pg_fatal("could not upload manifest: unexpected status %s",
1876
1877 /* Consume ReadyForQuery message from server. */
1878 res = PQgetResult(conn);
1879 if (res != NULL)
1880 pg_fatal("unexpected extra result while sending manifest");
1881
1882 /* Add INCREMENTAL option to BASE_BACKUP command. */
1884 }
1885
1886 /*
1887 * Continue building up the options list for the BASE_BACKUP command.
1888 */
1890 if (estimatesize)
1892 if (includewal == FETCH_WAL)
1894 if (fastcheckpoint)
1895 {
1898 "CHECKPOINT", "fast");
1899 else
1901 }
1902 if (includewal != NO_WAL)
1903 {
1906 else
1908 }
1909 if (maxrate > 0)
1911 maxrate);
1912 if (format == 't')
1914 if (!verify_checksums)
1915 {
1918 "VERIFY_CHECKSUMS", 0);
1919 else
1921 "NOVERIFY_CHECKSUMS");
1922 }
1923
1924 if (manifest)
1925 {
1927 manifest_force_encode ? "force-encode" : "yes");
1928 if (manifest_checksums != NULL)
1930 "MANIFEST_CHECKSUMS", manifest_checksums);
1931 }
1932
1933 if (backup_target != NULL)
1934 {
1935 char *colon;
1936
1937 if (serverMajor < 1500)
1938 pg_fatal("backup targets are not supported by this server version");
1939
1941 pg_fatal("recovery configuration cannot be written when a backup target is used");
1942
1944
/* A target of the form "name:detail" is split at the first colon. */
1945 if ((colon = strchr(backup_target, ':')) == NULL)
1946 {
1948 "TARGET", backup_target);
1949 }
1950 else
1951 {
1952 char *target;
1953
1956 "TARGET", target);
1958 "TARGET_DETAIL", colon + 1);
1959 }
1960 }
1961 else if (serverMajor >= 1500)
1963 "TARGET", "client");
1964
1966 {
1968 pg_fatal("server does not support server-side compression");
1970 "COMPRESSION", compression_algorithm);
1971 if (compression_detail != NULL)
1973 "COMPRESSION_DETAIL",
1975 }
1976
1977 if (verbose)
1978 pg_log_info("initiating base backup, waiting for checkpoint to complete");
1979
1980 if (showprogress && !verbose)
1981 {
1982 fprintf(stderr, _("waiting for checkpoint"));
1983 if (isatty(fileno(stderr)))
1984 fprintf(stderr, "\r");
1985 else
1986 fprintf(stderr, "\n");
1987 }
1988
1989 if (use_new_option_syntax && buf.len > 0)
1990 basebkp = psprintf("BASE_BACKUP (%s)", buf.data);
1991 else
1992 basebkp = psprintf("BASE_BACKUP %s", buf.data);
1993
1994 /* OK, try to start the backup. */
1995 if (PQsendQuery(conn, basebkp) == 0)
1996 pg_fatal("could not send replication command \"%s\": %s",
1997 "BASE_BACKUP", PQerrorMessage(conn));
1998
1999 /*
2000 * Get the starting WAL location
2001 */
2002 res = PQgetResult(conn);
2003 if (PQresultStatus(res) != PGRES_TUPLES_OK)
2004 pg_fatal("could not initiate base backup: %s",
/*
 * Only the row count is enforced here; the field count appears in the
 * message but a single-field result is tolerated further down.
 */
2006 if (PQntuples(res) != 1)
2007 pg_fatal("server returned unexpected response to BASE_BACKUP command; got %d rows and %d fields, expected %d rows and %d fields",
2008 PQntuples(res), PQnfields(res), 1, 2);
2009
2010 strlcpy(xlogstart, PQgetvalue(res, 0, 0), sizeof(xlogstart));
2011
2012 if (verbose)
2013 pg_log_info("checkpoint completed");
2014
2015 /*
2016 * 9.3 and later sends the TLI of the starting point. With older servers,
2017 * assume it's the same as the latest timeline reported by
2018 * IDENTIFY_SYSTEM.
2019 */
2020 if (PQnfields(res) >= 2)
2021 starttli = atoi(PQgetvalue(res, 0, 1));
2022 else
2023 starttli = latesttli;
2024 PQclear(res);
2025
2026 if (verbose && includewal != NO_WAL)
2027 pg_log_info("write-ahead log start point: %s on timeline %u",
2028 xlogstart, starttli);
2029
2030 /*
2031 * Get the header
2032 */
2033 res = PQgetResult(conn);
2034 if (PQresultStatus(res) != PGRES_TUPLES_OK)
2035 pg_fatal("could not get backup header: %s",
2037 if (PQntuples(res) < 1)
2038 pg_fatal("no data returned from server");
2039
2040 /*
2041 * Sum up the total size, for progress reporting
2042 */
2043 totalsize_kb = totaldone = 0;
2045 for (i = 0; i < PQntuples(res); i++)
2046 {
2047 totalsize_kb += atoll(PQgetvalue(res, i, 2));
2048
2049 /*
2050 * Verify tablespace directories are empty. Don't bother with the
2051 * first one since it can be relocated, and it will be checked before
2052 * we do anything anyway.
2053 *
2054 * Note that this is skipped for tar format backups and backups that
2055 * the server is storing to a target location, since in that case we
2056 * won't be storing anything into these directories and thus should
2057 * not create them.
2058 */
2059 if (backup_target == NULL && format == 'p' && !PQgetisnull(res, i, 1))
2060 {
2061 char *path = PQgetvalue(res, i, 1);
2062
2063 if (is_absolute_path(path))
2064 path = unconstify(char *, get_tablespace_mapping(path));
2065 else
2066 {
2067 /* This is an in-place tablespace, so prepend basedir. */
2068 path = psprintf("%s/%s", basedir, path);
2069 }
2070
2072 }
2073 }
2074
2075 /*
2076 * When writing to stdout, require a single tablespace
2077 */
2078 writing_to_stdout = format == 't' && basedir != NULL &&
2079 strcmp(basedir, "-") == 0;
2080 if (writing_to_stdout && PQntuples(res) > 1)
2081 pg_fatal("can only write single tablespace to stdout, database has %d",
2082 PQntuples(res));
2083
2084 /*
2085 * If we're streaming WAL, start the streaming session before we start
2086 * receiving the actual data chunks.
2087 */
2088 if (includewal == STREAM_WAL)
2089 {
2090 pg_compress_algorithm wal_compress_algorithm;
2091 int wal_compress_level;
2092
2093 if (verbose)
2094 pg_log_info("starting background WAL receiver");
2095
/* Only gzip carries over to the WAL receiver; anything else means none. */
2096 if (client_compress->algorithm == PG_COMPRESSION_GZIP)
2097 {
2098 wal_compress_algorithm = PG_COMPRESSION_GZIP;
2099 wal_compress_level = client_compress->level;
2100 }
2101 else
2102 {
2103 wal_compress_algorithm = PG_COMPRESSION_NONE;
2104 wal_compress_level = 0;
2105 }
2106
2107 StartLogStreamer(xlogstart, starttli, sysidentifier,
2108 wal_compress_algorithm,
2109 wal_compress_level);
2110 }
2111
2112 if (serverMajor >= 1500)
2113 {
2114 /* Receive a single tar stream with everything. */
2116 }
2117 else
2118 {
2119 /* Receive a tar file for each tablespace in turn */
2120 for (i = 0; i < PQntuples(res); i++)
2121 {
2122 char archive_name[MAXPGPATH];
2123 char *spclocation;
2124
2125 /*
2126 * If we write the data out to a tar file, it will be named
2127 * base.tar if it's the main data directory or <tablespaceoid>.tar
2128 * if it's for another tablespace. CreateBackupStreamer() will
2129 * arrange to add an extension to the archive name if
2130 * pg_basebackup is performing compression, depending on the
2131 * compression type.
2132 */
2133 if (PQgetisnull(res, i, 0))
2134 {
2135 strlcpy(archive_name, "base.tar", sizeof(archive_name));
2136 spclocation = NULL;
2137 }
2138 else
2139 {
2140 snprintf(archive_name, sizeof(archive_name),
2141 "%s.tar", PQgetvalue(res, i, 0));
2142 spclocation = PQgetvalue(res, i, 1);
2143 }
2144
2145 ReceiveTarFile(conn, archive_name, spclocation, i,
2147 }
2148
2149 /*
2150 * Now receive backup manifest, if appropriate.
2151 *
2152 * If we're writing a tarfile to stdout, ReceiveTarFile will have
2153 * already processed the backup manifest and included it in the output
2154 * tarfile. Such a configuration doesn't allow for writing multiple
2155 * files.
2156 *
2157 * If we're talking to an older server, it won't send a backup
2158 * manifest, so don't try to receive one.
2159 */
2162 }
2163
2164 if (showprogress)
2165 {
2167 progress_report(PQntuples(res), true, true);
2168 }
2169
2170 PQclear(res);
2171
2172 /*
2173 * Get the stop position
2174 */
2175 res = PQgetResult(conn);
2176 if (PQresultStatus(res) != PGRES_TUPLES_OK)
2177 pg_fatal("backup failed: %s",
2179 if (PQntuples(res) != 1)
2180 pg_fatal("no write-ahead log end position returned from server");
2181 strlcpy(xlogend, PQgetvalue(res, 0, 0), sizeof(xlogend));
2182 if (verbose && includewal != NO_WAL)
2183 pg_log_info("write-ahead log end point: %s", xlogend);
2184 PQclear(res);
2185
2186 res = PQgetResult(conn);
2187 if (PQresultStatus(res) != PGRES_COMMAND_OK)
2188 {
2189 const char *sqlstate = PQresultErrorField(res, PG_DIAG_SQLSTATE);
2190
/* A data-corruption SQLSTATE gets its own message; both paths exit(1). */
2191 if (sqlstate &&
2192 strcmp(sqlstate, ERRCODE_DATA_CORRUPTED) == 0)
2193 {
2194 pg_log_error("checksum error occurred");
2195 checksum_failure = true;
2196 }
2197 else
2198 {
2199 pg_log_error("final receive failed: %s",
2201 }
2202 exit(1);
2203 }
2204
2205 if (bgchild > 0)
2206 {
2207 #ifndef WIN32
2208 int status;
2209 pid_t r;
2210 #else
2211 DWORD status;
2212
2213 /*
2214 * get a pointer sized version of bgchild to avoid warnings about
2215 * casting to a different size on WIN64.
2216 */
2218 uint32 hi,
2219 lo;
2220 #endif
2221
2222 if (verbose)
2223 pg_log_info("waiting for background process to finish streaming ...");
2224
2225 #ifndef WIN32
2227 pg_fatal("could not send command to background pipe: %m");
2228
2229 /* Just wait for the background process to exit */
2230 r = waitpid(bgchild, &status, 0);
2231 if (r == (pid_t) -1)
2232 pg_fatal("could not wait for child process: %m");
2233 if (r != bgchild)
2234 pg_fatal("child %d died, expected %d", (int) r, (int) bgchild);
2235 if (status != 0)
2236 pg_fatal("%s", wait_result_to_str(status));
2237 /* Exited normally, we're happy! */
2238 #else /* WIN32 */
2239
2240 /*
2241 * On Windows, since we are in the same process, we can just store the
2242 * value directly in the variable, and then set the flag that says
2243 * it's there.
2244 */
2245 if (sscanf(xlogend, "%X/%08X", &hi, &lo) != 2)
2246 pg_fatal("could not parse write-ahead log location \"%s\"",
2247 xlogend);
2248 xlogendptr = ((uint64) hi) << 32 | lo;
2250
2251 /* First wait for the thread to exit */
2254 {
2256 pg_fatal("could not wait for child thread: %m");
2257 }
2258 if (GetExitCodeThread((HANDLE) bgchild_handle, &status) == 0)
2259 {
2261 pg_fatal("could not get child thread exit status: %m");
2262 }
2263 if (status != 0)
2264 pg_fatal("child thread exited with error %u",
2265 (unsigned int) status);
2266 /* Exited normally, we're happy */
2267 #endif
2268 }
2269
2270 /* Free the configuration file contents */
2272
2273 /*
2274 * End of copy data. Final result is already checked inside the loop.
2275 */
2276 PQclear(res);
2277 PQfinish(conn);
2278 conn = NULL;
2279
2280 /*
2281 * Make data persistent on disk once backup is completed. For tar format
2282 * sync the parent directory and all its contents as each tar file was not
2283 * synced after being completed. In plain format, all the data of the
2284 * base directory is synced, taking into account all the tablespaces.
2285 * Errors are not considered fatal.
2286 *
2287 * If, however, there's a backup target, we're not writing anything
2288 * locally, so in that case we skip this step.
2289 */
2290 if (do_sync && backup_target == NULL)
2291 {
2292 if (verbose)
2293 pg_log_info("syncing data to disk ...");
2294 if (format == 't')
2295 {
2296 if (strcmp(basedir, "-") != 0)
2298 }
2299 else
2300 {
2302 }
2303 }
2304
2305 /*
2306 * After synchronizing data to disk, perform a durable rename of
2307 * backup_manifest.tmp to backup_manifest, if we wrote such a file. This
2308 * way, a failure or system crash before we reach this point will leave us
2309 * without a backup_manifest file, decreasing the chances that a directory
2310 * we leave behind will be mistaken for a valid backup.
2311 */
2313 {
2314 char tmp_filename[MAXPGPATH];
2315 char filename[MAXPGPATH];
2316
2317 if (verbose)
2318 pg_log_info("renaming backup_manifest.tmp to backup_manifest");
2319
2320 snprintf(tmp_filename, MAXPGPATH, "%s/backup_manifest.tmp", basedir);
2321 snprintf(filename, MAXPGPATH, "%s/backup_manifest", basedir);
2322
2323 if (do_sync)
2324 {
2325 /* durable_rename emits its own log message in case of failure */
2327 exit(1);
2328 }
2329 else
2330 {
2331 if (rename(tmp_filename, filename) != 0)
2332 pg_fatal("could not rename file \"%s\" to \"%s\": %m",
2334 }
2335 }
2336
2337 if (verbose)
2338 pg_log_info("base backup completed");
2339 }
2340
2341
2342int
2343main(int argc, char **argv)
2344{
2345 static struct option long_options[] = {
2346 {"help", no_argument, NULL, '?'},
2347 {"version", no_argument, NULL, 'V'},
2348 {"pgdata", required_argument, NULL, 'D'},
2349 {"format", required_argument, NULL, 'F'},
2350 {"incremental", required_argument, NULL, 'i'},
2351 {"checkpoint", required_argument, NULL, 'c'},
2352 {"create-slot", no_argument, NULL, 'C'},
2353 {"max-rate", required_argument, NULL, 'r'},
2354 {"write-recovery-conf", no_argument, NULL, 'R'},
2355 {"slot", required_argument, NULL, 'S'},
2356 {"target", required_argument, NULL, 't'},
2357 {"tablespace-mapping", required_argument, NULL, 'T'},
2358 {"wal-method", required_argument, NULL, 'X'},
2359 {"gzip", no_argument, NULL, 'z'},
2360 {"compress", required_argument, NULL, 'Z'},
2361 {"label", required_argument, NULL, 'l'},
2362 {"no-clean", no_argument, NULL, 'n'},
2363 {"no-sync", no_argument, NULL, 'N'},
2364 {"dbname", required_argument, NULL, 'd'},
2365 {"host", required_argument, NULL, 'h'},
2366 {"port", required_argument, NULL, 'p'},
2367 {"username", required_argument, NULL, 'U'},
2368 {"no-password", no_argument, NULL, 'w'},
2369 {"password", no_argument, NULL, 'W'},
2370 {"status-interval", required_argument, NULL, 's'},
2371 {"verbose", no_argument, NULL, 'v'},
2372 {"progress", no_argument, NULL, 'P'},
2373 {"waldir", required_argument, NULL, 1},
2374 {"no-slot", no_argument, NULL, 2},
2375 {"no-verify-checksums", no_argument, NULL, 3},
2376 {"no-estimate-size", no_argument, NULL, 4},
2377 {"no-manifest", no_argument, NULL, 5},
2378 {"manifest-force-encode", no_argument, NULL, 6},
2379 {"manifest-checksums", required_argument, NULL, 7},
2380 {"sync-method", required_argument, NULL, 8},
2381 {NULL, 0, NULL, 0}
2382 };
2383 int c;
2384
2385 int option_index;
2386 char *compression_algorithm = "none";
2387 char *compression_detail = NULL;
2388 char *incremental_manifest = NULL;
2391
2392 pg_logging_init(argv[0]);
2393 progname = get_progname(argv[0]);
2394 set_pglocale_pgservice(argv[0], PG_TEXTDOMAIN("pg_basebackup"));
2395
2396 if (argc > 1)
2397 {
2398 if (strcmp(argv[1], "--help") == 0 || strcmp(argv[1], "-?") == 0)
2399 {
2400 usage();
2401 exit(0);
2402 }
2403 else if (strcmp(argv[1], "-V") == 0
2404 || strcmp(argv[1], "--version") == 0)
2405 {
2406 puts("pg_basebackup (PostgreSQL) " PG_VERSION);
2407 exit(0);
2408 }
2409 }
2410
2412
2413 while ((c = getopt_long(argc, argv, "c:Cd:D:F:h:i:l:nNp:Pr:Rs:S:t:T:U:vwWX:zZ:",
2414 long_options, &option_index)) != -1)
2415 {
2416 switch (c)
2417 {
2418 case 'c':
2419 if (pg_strcasecmp(optarg, "fast") == 0)
2420 fastcheckpoint = true;
2421 else if (pg_strcasecmp(optarg, "spread") == 0)
2422 fastcheckpoint = false;
2423 else
2424 pg_fatal("invalid checkpoint argument \"%s\", must be \"fast\" or \"spread\"",
2425 optarg);
2426 break;
2427 case 'C':
2428 create_slot = true;
2429 break;
2430 case 'd':
2432 break;
2433 case 'D':
2435 break;
2436 case 'F':
2437 if (strcmp(optarg, "p") == 0 || strcmp(optarg, "plain") == 0)
2438 format = 'p';
2439 else if (strcmp(optarg, "t") == 0 || strcmp(optarg, "tar") == 0)
2440 format = 't';
2441 else
2442 pg_fatal("invalid output format \"%s\", must be \"plain\" or \"tar\"",
2443 optarg);
2444 break;
2445 case 'h':
2447 break;
2448 case 'i':
2450 break;
2451 case 'l':
2453 break;
2454 case 'n':
2455 noclean = true;
2456 break;
2457 case 'N':
2458 do_sync = false;
2459 break;
2460 case 'p':
2462 break;
2463 case 'P':
2464 showprogress = true;
2465 break;
2466 case 'r':
2468 break;
2469 case 'R':
2470 writerecoveryconf = true;
2471 break;
2472 case 's':
2473 if (!option_parse_int(optarg, "-s/--status-interval", 0,
2474 INT_MAX / 1000,
2476 exit(1);
2478 break;
2479 case 'S':
2480
2481 /*
2482 * When specifying replication slot name, use a permanent
2483 * slot.
2484 */
2486 temp_replication_slot = false;
2487 break;
2488 case 't':
2490 break;
2491 case 'T':
2493 break;
2494 case 'U':
2496 break;
2497 case 'v':
2498 verbose++;
2499 break;
2500 case 'w':
2501 dbgetpassword = -1;
2502 break;
2503 case 'W':
2504 dbgetpassword = 1;
2505 break;
2506 case 'X':
2507 if (strcmp(optarg, "n") == 0 ||
2508 strcmp(optarg, "none") == 0)
2509 {
2511 }
2512 else if (strcmp(optarg, "f") == 0 ||
2513 strcmp(optarg, "fetch") == 0)
2514 {
2516 }
2517 else if (strcmp(optarg, "s") == 0 ||
2518 strcmp(optarg, "stream") == 0)
2519 {
2521 }
2522 else
2523 pg_fatal("invalid wal-method option \"%s\", must be \"fetch\", \"stream\", or \"none\"",
2524 optarg);
2525 break;
2526 case 'z':
2527 compression_algorithm = "gzip";
2530 break;
2531 case 'Z':
2534 break;
2535 case 1:
2537 break;
2538 case 2:
2539 no_slot = true;
2540 break;
2541 case 3:
2542 verify_checksums = false;
2543 break;
2544 case 4:
2545 estimatesize = false;
2546 break;
2547 case 5:
2548 manifest = false;
2549 break;
2550 case 6:
2551 manifest_force_encode = true;
2552 break;
2553 case 7:
2555 break;
2556 case 8:
2558 exit(1);
2559 break;
2560 default:
2561 /* getopt_long already emitted a complaint */
2562 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2563 exit(1);
2564 }
2565 }
2566
2567 /*
2568 * Any non-option arguments?
2569 */
2570 if (optind < argc)
2571 {
2572 pg_log_error("too many command-line arguments (first is \"%s\")",
2573 argv[optind]);
2574 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2575 exit(1);
2576 }
2577
2578 /*
2579 * Setting the backup target to 'client' is equivalent to leaving out the
2580 * option. This logic allows us to assume elsewhere that the backup is
2581 * being stored locally if and only if backup_target == NULL.
2582 */
2583 if (backup_target != NULL && strcmp(backup_target, "client") == 0)
2584 {
2587 }
2588
2589 /*
2590 * Can't use --format with --target. Without --target, default format is
2591 * plain.
2592 */
2593 if (backup_target != NULL && format != '\0')
2594 {
2595 pg_log_error("cannot specify both format and backup target");
2596 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2597 exit(1);
2598 }
2599 if (format == '\0')
2600 format = 'p';
2601
2602 /*
2603 * Either directory or backup target should be specified, but not both
2604 */
2605 if (basedir == NULL && backup_target == NULL)
2606 {
2607 pg_log_error("must specify output directory or backup target");
2608 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2609 exit(1);
2610 }
2611 if (basedir != NULL && backup_target != NULL)
2612 {
2613 pg_log_error("cannot specify both output directory and backup target");
2614 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2615 exit(1);
2616 }
2617
2618 /*
2619 * If the user has not specified where to perform backup compression,
2620 * default to the client, unless the user specified --target, in which
2621 * case the server is the only choice.
2622 */
2624 {
2625 if (backup_target == NULL)
2627 else
2629 }
2630
2631 /*
2632 * If any compression that we're doing is happening on the client side, we
2633 * must try to parse the compression algorithm and detail, but if it's all
2634 * on the server side, then we're just going to pass through whatever was
2635 * requested and let the server decide what to do.
2636 */
2638 {
2640 char *error_detail;
2641
2643 pg_fatal("unrecognized compression algorithm: \"%s\"",
2645
2648 if (error_detail != NULL)
2649 pg_fatal("invalid compression specification: %s",
2650 error_detail);
2651 }
2652 else
2653 {
2656 client_compress.options = 0;
2657 }
2658
2659 /*
2660 * Can't perform client-side compression if the backup is not being sent
2661 * to the client.
2662 */
2664 {
2665 pg_log_error("client-side compression is not possible when a backup target is specified");
2666 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2667 exit(1);
2668 }
2669
2670 /*
2671 * Client-side compression doesn't make sense unless tar format is in use.
2672 */
2673 if (format == 'p' && compressloc == COMPRESS_LOCATION_CLIENT &&
2675 {
2676 pg_log_error("only tar mode backups can be compressed");
2677 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2678 exit(1);
2679 }
2680
2681 /*
2682 * Sanity checks for WAL method.
2683 */
2685 {
2686 pg_log_error("WAL cannot be streamed when a backup target is specified");
2687 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2688 exit(1);
2689 }
2690 if (format == 't' && includewal == STREAM_WAL && strcmp(basedir, "-") == 0)
2691 {
2692 pg_log_error("cannot stream write-ahead logs in tar mode to stdout");
2693 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2694 exit(1);
2695 }
2696
2698 {
2699 pg_log_error("replication slots can only be used with WAL streaming");
2700 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2701 exit(1);
2702 }
2703
2704 /*
2705 * Sanity checks for replication slot options.
2706 */
2707 if (no_slot)
2708 {
2709 if (replication_slot)
2710 {
2711 pg_log_error("--no-slot cannot be used with slot name");
2712 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2713 exit(1);
2714 }
2715 temp_replication_slot = false;
2716 }
2717
2718 if (create_slot)
2719 {
2720 if (!replication_slot)
2721 {
2722 pg_log_error("%s needs a slot to be specified using --slot",
2723 "--create-slot");
2724 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2725 exit(1);
2726 }
2727
2728 if (no_slot)
2729 {
2730 pg_log_error("%s and %s are incompatible options",
2731 "--create-slot", "--no-slot");
2732 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2733 exit(1);
2734 }
2735 }
2736
2737 /*
2738 * Sanity checks on WAL directory.
2739 */
2740 if (xlog_dir)
2741 {
2742 if (backup_target != NULL)
2743 {
2744 pg_log_error("WAL directory location cannot be specified along with a backup target");
2745 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2746 exit(1);
2747 }
2748 if (format != 'p')
2749 {
2750 pg_log_error("WAL directory location can only be specified in plain mode");
2751 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2752 exit(1);
2753 }
2754
2755 /* clean up xlog directory name, check it's absolute */
2758 {
2759 pg_log_error("WAL directory location must be an absolute path");
2760 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2761 exit(1);
2762 }
2763 }
2764
2765 /*
2766 * Sanity checks for progress reporting options.
2767 */
2768 if (showprogress && !estimatesize)
2769 {
2770 pg_log_error("%s and %s are incompatible options",
2771 "--progress", "--no-estimate-size");
2772 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2773 exit(1);
2774 }
2775
2776 /*
2777 * Sanity checks for backup manifest options.
2778 */
2779 if (!manifest && manifest_checksums != NULL)
2780 {
2781 pg_log_error("%s and %s are incompatible options",
2782 "--no-manifest", "--manifest-checksums");
2783 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2784 exit(1);
2785 }
2786
2788 {
2789 pg_log_error("%s and %s are incompatible options",
2790 "--no-manifest", "--manifest-force-encode");
2791 pg_log_error_hint("Try \"%s --help\" for more information.", progname);
2792 exit(1);
2793 }
2794
2795 /* connection in replication mode to server */
2796 conn = GetConnection();
2797 if (!conn)
2798 {
2799 /* Error message already written in GetConnection() */
2800 exit(1);
2801 }
2803
2804#ifndef WIN32
2805
2806 /*
2807 * Trap SIGCHLD to be able to handle the WAL stream process exiting. There
2808 * is no SIGCHLD on Windows, there we rely on the background thread
2809 * setting the signal variable on unexpected but graceful exit. If the WAL
2810 * stream thread crashes on Windows it will bring down the entire process
2811 * as it's a thread, so there is nothing to catch should that happen. A
2812 * crash on UNIX will be caught by the signal handler.
2813 */
2815#endif
2816
2817 /*
2818 * Set umask so that directories/files are created with the same
2819 * permissions as directories/files in the source data directory.
2820 *
2821 * pg_mode_mask is set to owner-only by default and then updated in
2822 * GetConnection() where we get the mode from the server-side with
2823 * RetrieveDataDirCreatePerm() and then call SetDataDirectoryCreatePerm().
2824 */
2826
2827 /* Backup manifests are supported in 13 and newer versions */
2829 manifest = false;
2830
2831 /*
2832 * If an output directory was specified, verify that it exists, or create
2833 * it. Note that for a tar backup, an output directory of "-" means we are
2834 * writing to stdout, so do nothing in that case.
2835 */
2836 if (basedir != NULL && (format == 'p' || strcmp(basedir, "-") != 0))
2838
2839 /* determine remote server's xlog segment size */
2841 exit(1);
2842
2843 /* Create pg_wal symlink, if required */
2844 if (xlog_dir)
2845 {
2846 char *linkloc;
2847
2849
2850 /*
2851 * Form name of the place where the symlink must go. pg_xlog has been
2852 * renamed to pg_wal in post-10 clusters.
2853 */
2854 linkloc = psprintf("%s/%s", basedir,
2856 "pg_xlog" : "pg_wal");
2857
2858 if (symlink(xlog_dir, linkloc) != 0)
2859 pg_fatal("could not create symbolic link \"%s\": %m", linkloc);
2860 free(linkloc);
2861 }
2862
2865
2866 success = true;
2867 return 0;
2868}
static void astreamer_free(astreamer *streamer)
Definition astreamer.h:153
static void astreamer_content(astreamer *streamer, astreamer_member *member, const char *data, int len, astreamer_archive_context context)
Definition astreamer.h:135
static void astreamer_finalize(astreamer *streamer)
Definition astreamer.h:145
@ ASTREAMER_UNKNOWN
Definition astreamer.h:64
astreamer * astreamer_plain_writer_new(char *pathname, FILE *file)
astreamer * astreamer_extractor_new(const char *basepath, const char *(*link_map)(const char *), void(*report_output_file)(const char *))
astreamer * astreamer_gzip_decompressor_new(astreamer *next)
astreamer * astreamer_gzip_writer_new(char *pathname, FILE *file, pg_compress_specification *compress)
astreamer * astreamer_recovery_injector_new(astreamer *next, bool is_recovery_guc_supported, PQExpBuffer recoveryconfcontents)
void astreamer_inject_file(astreamer *streamer, char *pathname, char *data, int len)
astreamer * astreamer_lz4_compressor_new(astreamer *next, pg_compress_specification *compress)
astreamer * astreamer_lz4_decompressor_new(astreamer *next)
astreamer * astreamer_tar_parser_new(astreamer *next)
astreamer * astreamer_tar_terminator_new(astreamer *next)
astreamer * astreamer_tar_archiver_new(astreamer *next)
astreamer * astreamer_zstd_compressor_new(astreamer *next, pg_compress_specification *compress)
astreamer * astreamer_zstd_decompressor_new(astreamer *next)
Datum now(PG_FUNCTION_ARGS)
Definition timestamp.c:1600
#define MAX_RATE_UPPER
Definition basebackup.h:21
#define unconstify(underlying_type, expr)
Definition c.h:1327
#define ngettext(s, p, n)
Definition c.h:1272
#define SIGNAL_ARGS
Definition c.h:1452
#define Assert(condition)
Definition c.h:945
#define PG_TEXTDOMAIN(domain)
Definition c.h:1305
#define PG_BINARY
Definition c.h:1376
#define UINT64_FORMAT
Definition c.h:637
int32_t int32
Definition c.h:614
uint64_t uint64
Definition c.h:619
uint32_t uint32
Definition c.h:618
void set_pglocale_pgservice(const char *argv0, const char *app)
Definition exec.c:430
int main(void)
bool parse_tar_compress_algorithm(const char *fname, pg_compress_algorithm *algorithm)
Definition compression.c:49
char * validate_compress_specification(pg_compress_specification *spec)
bool parse_compress_algorithm(char *name, pg_compress_algorithm *algorithm)
Definition compression.c:79
void parse_compress_specification(pg_compress_algorithm algorithm, char *specification, pg_compress_specification *result)
pg_compress_algorithm
Definition compression.h:22
@ PG_COMPRESSION_GZIP
Definition compression.h:24
@ PG_COMPRESSION_LZ4
Definition compression.h:25
@ PG_COMPRESSION_NONE
Definition compression.h:23
@ PG_COMPRESSION_ZSTD
Definition compression.h:26
void parse_compress_options(const char *option, char **algorithm, char **detail)
#define fprintf(file, fmt, msg)
Definition cubescan.l:21
Datum arg
Definition elog.c:1322
#define _(x)
Definition elog.c:95
int durable_rename(const char *oldfile, const char *newfile, int elevel)
Definition fd.c:783
int PQserverVersion(const PGconn *conn)
const char * PQparameterStatus(const PGconn *conn, const char *paramName)
void PQfinish(PGconn *conn)
int PQbackendPID(const PGconn *conn)
char * PQerrorMessage(const PGconn *conn)
void PQfreemem(void *ptr)
Definition fe-exec.c:4049
int PQputCopyEnd(PGconn *conn, const char *errormsg)
Definition fe-exec.c:2766
int PQputCopyData(PGconn *conn, const char *buffer, int nbytes)
Definition fe-exec.c:2712
int PQsendQuery(PGconn *conn, const char *query)
Definition fe-exec.c:1433
char * PQresStatus(ExecStatusType status)
Definition fe-exec.c:3436
int PQgetCopyData(PGconn *conn, char **buffer, int async)
Definition fe-exec.c:2833
char * pg_strdup(const char *in)
Definition fe_memutils.c:85
void pg_free(void *ptr)
#define pg_malloc0_object(type)
Definition fe_memutils.h:51
int pg_mode_mask
Definition file_perm.c:25
int pg_dir_create_mode
Definition file_perm.c:18
DataDirSyncMethod
Definition file_utils.h:28
@ DATA_DIR_SYNC_METHOD_FSYNC
Definition file_utils.h:29
int getopt_long(int argc, char *const argv[], const char *optstring, const struct option *longopts, int *longindex)
Definition getopt_long.c:60
#define no_argument
Definition getopt_long.h:25
#define required_argument
Definition getopt_long.h:26
#define colon
#define write(a, b, c)
Definition win32.h:14
#define read(a, b, c)
Definition win32.h:13
int i
Definition isn.c:77
#define PQgetvalue
#define PQgetResult
#define PQclear
#define PQresultErrorField
#define PQnfields
#define PQresultStatus
#define PQgetisnull
#define PQntuples
@ PGRES_COPY_IN
Definition libpq-fe.h:138
@ PGRES_COMMAND_OK
Definition libpq-fe.h:131
@ PGRES_FATAL_ERROR
Definition libpq-fe.h:142
@ PGRES_COPY_OUT
Definition libpq-fe.h:137
@ PGRES_TUPLES_OK
Definition libpq-fe.h:134
void pg_logging_init(const char *argv0)
Definition logging.c:83
#define pg_log_error(...)
Definition logging.h:106
#define pg_log_error_hint(...)
Definition logging.h:112
#define pg_log_info(...)
Definition logging.h:124
#define pg_log_error_detail(...)
Definition logging.h:109
const char * progname
Definition main.c:44
char * pnstrdup(const char *in, Size len)
Definition mcxt.c:1792
bool option_parse_int(const char *optarg, const char *optname, int min_range, int max_range, int *result)
bool parse_sync_method(const char *optarg, DataDirSyncMethod *sync_method)
#define pg_fatal(...)
static void BaseBackup(char *compression_algorithm, char *compression_detail, CompressionLocation compressloc, pg_compress_specification *client_compress, char *incremental_manifest)
static void ReceiveArchiveStreamChunk(size_t r, char *copybuf, void *callback_data)
static int verbose
static bool checksum_failure
void(* WriteDataCallback)(size_t nbytes, char *buf, void *callback_data)
static bool noclean
static bool estimatesize
static bool found_existing_pgdata
static bool manifest
static bool found_existing_xlogdir
#define MINIMUM_VERSION_FOR_TEMP_SLOTS
static int32 maxrate
static void ReceiveTarFile(PGconn *conn, char *archive_name, char *spclocation, bool tablespacenum, pg_compress_specification *compress)
static char * backup_target
static char format
static char * xlog_dir
static void ReceiveCopyData(PGconn *conn, WriteDataCallback callback, void *callback_data)
static void StartLogStreamer(char *startpos, uint32 timeline, char *sysidentifier, pg_compress_algorithm wal_compress_algorithm, int wal_compress_level)
static void ReceiveBackupManifestChunk(size_t r, char *copybuf, void *callback_data)
static char * GetCopyDataString(size_t r, char *copybuf, size_t *cursor)
static int32 parse_max_rate(char *src)
IncludeWal
@ STREAM_WAL
@ FETCH_WAL
@ NO_WAL
static volatile sig_atomic_t bgchild_exited
static int bgpipe[2]
static bool create_slot
static void ReceiveTarCopyChunk(size_t r, char *copybuf, void *callback_data)
static int LogStreamerMain(logstreamer_param *param)
static void ReceiveArchiveStream(PGconn *conn, pg_compress_specification *compress)
static void backup_parse_compress_options(char *option, char **algorithm, char **detail, CompressionLocation *locationres)
static PQExpBuffer recoveryconfcontents
static int tablespacecount
static void progress_update_filename(const char *filename)
static pid_t bgchild
CompressionLocation
@ COMPRESS_LOCATION_UNSPECIFIED
@ COMPRESS_LOCATION_CLIENT
@ COMPRESS_LOCATION_SERVER
static bool reached_end_position(XLogRecPtr segendpos, uint32 timeline, bool segment_finished)
static int has_xlogendptr
static void verify_dir_is_empty_or_create(char *dirname, bool *created, bool *found)
static char * progress_filename
static uint64 totalsize_kb
static pg_time_t last_progress_report
static bool verify_checksums
static char * replication_slot
static void GetCopyDataEnd(size_t r, char *copybuf, size_t cursor)
static bool success
static void ReceiveBackupManifest(PGconn *conn)
static uint64 totaldone
static void progress_report(int tablespacenum, bool force, bool finished)
static bool manifest_force_encode
static char * manifest_checksums
static astreamer * CreateBackupStreamer(char *archive_name, char *spclocation, astreamer **manifest_inject_streamer_p, bool is_recovery_guc_supported, bool expect_unterminated_tarfile, pg_compress_specification *compress)
#define MINIMUM_VERSION_FOR_TERMINATED_TARFILE
static TablespaceList tablespace_dirs
static bool found_tablespace_dirs
static bool in_log_streamer
static bool made_new_xlogdir
static IncludeWal includewal
static void ReportCopyDataParseError(size_t r, char *copybuf)
static bool do_sync
static bool writerecoveryconf
static void cleanup_directories_atexit(void)
static bool temp_replication_slot
#define MINIMUM_VERSION_FOR_MANIFESTS
static bool no_slot
static bool made_tablespace_dirs
static char GetCopyDataByte(size_t r, char *copybuf, size_t *cursor)
#define VERBOSE_FILENAME_LENGTH
static uint64 GetCopyDataUInt64(size_t r, char *copybuf, size_t *cursor)
static bool fastcheckpoint
static bool made_new_pgdata
static void kill_bgchild_atexit(void)
static DataDirSyncMethod sync_method
#define ERRCODE_DATA_CORRUPTED
static char * label
static void ReceiveBackupManifestInMemoryChunk(size_t r, char *copybuf, void *callback_data)
static bool showprogress
static void usage(void)
static void tablespace_list_append(const char *arg)
static const char * get_tablespace_mapping(const char *dir)
static char * basedir
static void disconnect_atexit(void)
static void ReceiveBackupManifestInMemory(PGconn *conn, PQExpBuffer buf)
static XLogRecPtr xlogendptr
#define MINIMUM_VERSION_FOR_PG_WAL
static int standby_message_timeout
#define MINIMUM_VERSION_FOR_WAL_SUMMARIES
static void sigchld_handler(SIGNAL_ARGS)
#define pg_ntoh64(x)
Definition pg_bswap.h:126
#define MAXPGPATH
static char * filename
Definition pg_dumpall.c:133
PGDLLIMPORT int optind
Definition getopt.c:51
PGDLLIMPORT char * optarg
Definition getopt.c:53
static pg_compress_algorithm compression_algorithm
static XLogRecPtr endpos
static XLogRecPtr startpos
static char buf[DEFAULT_XLOG_SEG_SIZE]
int64 pg_time_t
Definition pgtime.h:23
#define pqsignal
Definition port.h:547
int pg_mkdir_p(char *path, int omode)
Definition pgmkdirp.c:57
#define is_absolute_path(filename)
Definition port.h:104
int pg_strcasecmp(const char *s1, const char *s2)
void canonicalize_path(char *path)
Definition path.c:337
int pg_check_dir(const char *dir)
Definition pgcheckdir.c:33
#define snprintf
Definition port.h:260
#define PGINVALID_SOCKET
Definition port.h:31
const char * get_progname(const char *argv0)
Definition path.c:652
#define is_windows_absolute_path(filename)
Definition port.h:90
#define printf(...)
Definition port.h:266
size_t strlcat(char *dst, const char *src, size_t siz)
Definition strlcat.c:33
size_t strlcpy(char *dst, const char *src, size_t siz)
Definition strlcpy.c:45
#define is_nonwindows_absolute_path(filename)
Definition port.h:83
#define PG_DIAG_SQLSTATE
PQExpBuffer createPQExpBuffer(void)
Definition pqexpbuffer.c:72
void initPQExpBuffer(PQExpBuffer str)
Definition pqexpbuffer.c:90
void appendPQExpBuffer(PQExpBuffer str, const char *fmt,...)
void destroyPQExpBuffer(PQExpBuffer str)
void termPQExpBuffer(PQExpBuffer str)
#define PQExpBufferDataBroken(buf)
Definition pqexpbuffer.h:67
char * c
static int fd(const char *x, int i)
static int fb(int x)
#define PqMsg_CopyData
Definition protocol.h:65
#define PqBackupMsg_ProgressReport
Definition protocol.h:91
#define PqBackupMsg_NewArchive
Definition protocol.h:90
#define PqBackupMsg_Manifest
Definition protocol.h:89
char * psprintf(const char *fmt,...)
Definition psprintf.c:43
bool ReceiveXlogStream(PGconn *conn, StreamCtl *stream)
Definition receivelog.c:453
bool CheckServerVersionForStreaming(PGconn *conn)
Definition receivelog.c:375
PQExpBuffer GenerateRecoveryConfig(PGconn *pgconn, const char *replication_slot, char *dbname)
char * GetDbnameFromConnectionOptions(const char *connstr)
#define MINIMUM_VERSION_FOR_RECOVERY_GUC
bool rmtree(const char *path, bool rmtopdir)
Definition rmtree.c:50
#define free(a)
void AppendIntegerCommandOption(PQExpBuffer buf, bool use_new_option_syntax, char *option_name, int32 option_value)
Definition streamutil.c:790
int dbgetpassword
Definition streamutil.c:50
PGconn * GetConnection(void)
Definition streamutil.c:60
bool RetrieveWalSegSize(PGconn *conn)
Definition streamutil.c:276
int WalSegSz
Definition streamutil.c:32
char * dbhost
Definition streamutil.c:46
char * dbport
Definition streamutil.c:48
void AppendPlainCommandOption(PQExpBuffer buf, bool use_new_option_syntax, char *option_name)
Definition streamutil.c:746
void AppendStringCommandOption(PQExpBuffer buf, bool use_new_option_syntax, char *option_name, char *option_value)
Definition streamutil.c:767
char * connection_string
Definition streamutil.c:45
PGconn * conn
Definition streamutil.c:52
bool RunIdentifySystem(PGconn *conn, char **sysid, TimeLineID *starttli, XLogRecPtr *startpos, char **db_name)
Definition streamutil.c:409
char * dbuser
Definition streamutil.c:47
char manifest_filename[MAXPGPATH]
pg_compress_specification * compress
astreamer * manifest_inject_streamer
astreamer * streamer
PQExpBuffer manifest_buffer
char * sysidentifier
Definition receivelog.h:33
TimeLineID timeline
Definition receivelog.h:32
stream_stop_callback stream_stop
Definition receivelog.h:41
char * replication_slot
Definition receivelog.h:48
XLogRecPtr startpos
Definition receivelog.h:31
bool do_sync
Definition receivelog.h:38
pgsocket stop_socket
Definition receivelog.h:43
int standby_message_timeout
Definition receivelog.h:35
WalWriteMethod * walmethod
Definition receivelog.h:46
bool mark_done
Definition receivelog.h:37
char * partial_suffix
Definition receivelog.h:47
bool synchronous
Definition receivelog.h:36
struct TablespaceListCell * next
char old_dir[MAXPGPATH]
char new_dir[MAXPGPATH]
TablespaceListCell * tail
TablespaceListCell * head
void(* free)(WalWriteMethod *wwmethod)
Definition walmethods.h:92
bool(* finish)(WalWriteMethod *wwmethod)
Definition walmethods.h:86
const WalWriteMethodOps * ops
Definition walmethods.h:105
char filename[MAXPGPATH]
astreamer * streamer
Definition type.h:138
pg_compress_algorithm wal_compress_algorithm
char xlog[MAXPGPATH]
pg_compress_algorithm algorithm
Definition compression.h:34
static StringInfo copybuf
Definition tablesync.c:129
static void callback(struct sockaddr *addr, struct sockaddr *mask, void *unused)
char * wait_result_to_str(int exitstatus)
Definition wait_error.c:33
WalWriteMethod * CreateWalTarMethod(const char *tarbase, pg_compress_algorithm compression_algorithm, int compression_level, bool sync)
WalWriteMethod * CreateWalDirectoryMethod(const char *basedir, pg_compress_algorithm compression_algorithm, int compression_level, bool sync)
Definition walmethods.c:640
static void CreateReplicationSlot(CreateReplicationSlotCmd *cmd)
Definition walsender.c:1199
#define SIGCHLD
Definition win32_port.h:168
void _dosmaperr(unsigned long)
Definition win32error.c:177
#define kill(pid, sig)
Definition win32_port.h:490
#define symlink(oldpath, newpath)
Definition win32_port.h:225
#define select(n, r, w, e, timeout)
Definition win32_port.h:500
#define XLogSegmentOffset(xlogptr, wal_segsz_bytes)
uint64 XLogRecPtr
Definition xlogdefs.h:21
uint32 TimeLineID
Definition xlogdefs.h:63
static const char * directory
Definition zic.c:648