PostgreSQL Source Code  git master
basebackup.c
Go to the documentation of this file.
1 /*-------------------------------------------------------------------------
2  *
3  * basebackup.c
4  * code for taking a base backup and streaming it to a standby
5  *
6  * Portions Copyright (c) 2010-2024, PostgreSQL Global Development Group
7  *
8  * IDENTIFICATION
9  * src/backend/backup/basebackup.c
10  *
11  *-------------------------------------------------------------------------
12  */
13 #include "postgres.h"
14 
15 #include <sys/stat.h>
16 #include <unistd.h>
17 #include <time.h>
18 
19 #include "access/xlog_internal.h"
20 #include "access/xlogbackup.h"
21 #include "backup/backup_manifest.h"
22 #include "backup/basebackup.h"
24 #include "backup/basebackup_sink.h"
26 #include "catalog/pg_tablespace_d.h"
27 #include "commands/defrem.h"
28 #include "common/compression.h"
29 #include "common/file_perm.h"
30 #include "common/file_utils.h"
31 #include "lib/stringinfo.h"
32 #include "miscadmin.h"
33 #include "nodes/pg_list.h"
34 #include "pgstat.h"
35 #include "pgtar.h"
36 #include "port.h"
37 #include "postmaster/syslogger.h"
39 #include "replication/slot.h"
40 #include "replication/walsender.h"
42 #include "storage/bufpage.h"
43 #include "storage/checksum.h"
44 #include "storage/dsm_impl.h"
45 #include "storage/ipc.h"
46 #include "storage/reinit.h"
47 #include "utils/builtins.h"
48 #include "utils/guc.h"
49 #include "utils/ps_status.h"
50 #include "utils/relcache.h"
51 #include "utils/resowner.h"
52 
53 /*
54  * How much data do we want to send in one CopyData message? Note that
55  * this may also result in reading the underlying files in chunks of this
56  * size.
57  *
58  * NB: The buffer size is required to be a multiple of the system block
59  * size, so use that value instead if it's bigger than our preference.
60  */
61 #define SINK_BUFFER_LENGTH Max(32768, BLCKSZ)
62 
63 typedef struct
64 {
65  const char *label;
66  bool progress;
68  bool nowait;
69  bool includewal;
81 
82 static int64 sendTablespace(bbsink *sink, char *path, Oid spcoid, bool sizeonly,
85 static int64 sendDir(bbsink *sink, const char *path, int basepathlen, bool sizeonly,
86  List *tablespaces, bool sendtblspclinks,
89 static bool sendFile(bbsink *sink, const char *readfilename, const char *tarfilename,
90  struct stat *statbuf, bool missing_ok,
91  Oid dboid, Oid spcoid, RelFileNumber relfilenumber,
92  unsigned segno,
94  unsigned num_incremental_blocks,
95  BlockNumber *incremental_blocks,
96  unsigned truncation_block_length);
97 static off_t read_file_data_into_buffer(bbsink *sink,
98  const char *readfilename, int fd,
99  off_t offset, size_t length,
100  BlockNumber blkno,
101  bool verify_checksum,
102  int *checksum_failures);
103 static void push_to_sink(bbsink *sink, pg_checksum_context *checksum_ctx,
104  size_t *bytes_done, void *data, size_t length);
105 static bool verify_page_checksum(Page page, XLogRecPtr start_lsn,
106  BlockNumber blkno,
107  uint16 *expected_checksum);
108 static void sendFileWithContent(bbsink *sink, const char *filename,
109  const char *content, int len,
111 static int64 _tarWriteHeader(bbsink *sink, const char *filename,
112  const char *linktarget, struct stat *statbuf,
113  bool sizeonly);
114 static void _tarWritePadding(bbsink *sink, int len);
115 static void convert_link_to_directory(const char *pathbuf, struct stat *statbuf);
116 static void perform_base_backup(basebackup_options *opt, bbsink *sink,
119 static int compareWalFileNames(const ListCell *a, const ListCell *b);
120 static ssize_t basebackup_read_file(int fd, char *buf, size_t nbytes, off_t offset,
121  const char *filename, bool partial_read_ok);
122 
123 /* Was the backup currently in-progress initiated in recovery mode? */
124 static bool backup_started_in_recovery = false;
125 
126 /* Total number of checksum failures during base backup. */
127 static long long int total_checksum_failures;
128 
129 /* Do not verify checksums. */
130 static bool noverify_checksums = false;
131 
132 /*
133  * Definition of one element part of an exclusion list, used for paths part
134  * of checksum validation or base backups. "name" is the name of the file
135  * or path to check for exclusion. If "match_prefix" is true, any items
136  * matching the name as prefix are excluded.
137  */
139 {
140  const char *name;
142 };
143 
144 /*
145  * The contents of these directories are removed or recreated during server
146  * start so they are not included in backups. The directories themselves are
147  * kept and included as empty to preserve access permissions.
148  *
149  * Note: this list should be kept in sync with the filter lists in pg_rewind's
150  * filemap.c.
151  */
152 static const char *const excludeDirContents[] =
153 {
154  /*
155  * Skip temporary statistics files. PG_STAT_TMP_DIR must be skipped
156  * because extensions like pg_stat_statements store data there.
157  */
159 
160  /*
161  * It is generally not useful to backup the contents of this directory
162  * even if the intention is to restore to another primary. See backup.sgml
163  * for a more detailed description.
164  */
166 
167  /* Contents removed on startup, see dsm_cleanup_for_mmap(). */
169 
170  /* Contents removed on startup, see AsyncShmemInit(). */
171  "pg_notify",
172 
173  /*
174  * Old contents are loaded for possible debugging but are not required for
175  * normal operation, see SerialInit().
176  */
177  "pg_serial",
178 
179  /* Contents removed on startup, see DeleteAllExportedSnapshotFiles(). */
180  "pg_snapshots",
181 
182  /* Contents zeroed on startup, see StartupSUBTRANS(). */
183  "pg_subtrans",
184 
185  /* end of list */
186  NULL
187 };
188 
189 /*
190  * List of files excluded from backups.
191  */
192 static const struct exclude_list_item excludeFiles[] =
193 {
194  /* Skip auto conf temporary file. */
195  {PG_AUTOCONF_FILENAME ".tmp", false},
196 
197  /* Skip current log file temporary file */
198  {LOG_METAINFO_DATAFILE_TMP, false},
199 
200  /*
201  * Skip relation cache because it is rebuilt on startup. This includes
202  * temporary files.
203  */
204  {RELCACHE_INIT_FILENAME, true},
205 
206  /*
207  * backup_label and tablespace_map should not exist in a running cluster
208  * capable of doing an online backup, but exclude them just in case.
209  */
210  {BACKUP_LABEL_FILE, false},
211  {TABLESPACE_MAP, false},
212 
213  /*
214  * If there's a backup_manifest, it belongs to a backup that was used to
215  * start this server. It is *not* correct for this backup. Our
216  * backup_manifest is injected into the backup separately if users want
217  * it.
218  */
219  {"backup_manifest", false},
220 
221  {"postmaster.pid", false},
222  {"postmaster.opts", false},
223 
224  /* end of list */
225  {NULL, false}
226 };
227 
228 /*
229  * Actually do a base backup for the specified tablespaces.
230  *
231  * This is split out mainly to avoid complaints about "variable might be
232  * clobbered by longjmp" from stupider versions of gcc.
233  */
234 static void
237 {
239  XLogRecPtr endptr;
240  TimeLineID endtli;
244 
245  /* Initial backup state, insofar as we know it now. */
246  state.tablespaces = NIL;
247  state.tablespace_num = 0;
248  state.bytes_done = 0;
249  state.bytes_total = 0;
250  state.bytes_total_is_valid = false;
251 
252  /* we're going to use a BufFile, so we need a ResourceOwner */
253  Assert(CurrentResourceOwner == NULL);
254  CurrentResourceOwner = ResourceOwnerCreate(NULL, "base backup");
255 
257 
260 
262 
263  /* Allocate backup related variables. */
266 
268  do_pg_backup_start(opt->label, opt->fastcheckpoint, &state.tablespaces,
270 
271  state.startptr = backup_state->startpoint;
272  state.starttli = backup_state->starttli;
273 
274  /*
275  * Once do_pg_backup_start has been called, ensure that any failure causes
276  * us to abort the backup so we don't "leak" a backup counter. For this
277  * reason, *all* functionality between do_pg_backup_start() and the end of
278  * do_pg_backup_stop() should be inside the error cleanup block!
279  */
280 
282  {
283  ListCell *lc;
284  tablespaceinfo *newti;
285 
286  /* If this is an incremental backup, execute preparatory steps. */
287  if (ib != NULL)
289 
290  /* Add a node for the base directory at the end */
291  newti = palloc0(sizeof(tablespaceinfo));
292  newti->size = -1;
293  state.tablespaces = lappend(state.tablespaces, newti);
294 
295  /*
296  * Calculate the total backup size by summing up the size of each
297  * tablespace
298  */
299  if (opt->progress)
300  {
302 
303  foreach(lc, state.tablespaces)
304  {
305  tablespaceinfo *tmp = (tablespaceinfo *) lfirst(lc);
306 
307  if (tmp->path == NULL)
308  tmp->size = sendDir(sink, ".", 1, true, state.tablespaces,
309  true, NULL, InvalidOid, NULL);
310  else
311  tmp->size = sendTablespace(sink, tmp->path, tmp->oid, true,
312  NULL, NULL);
313  state.bytes_total += tmp->size;
314  }
315  state.bytes_total_is_valid = true;
316  }
317 
318  /* notify basebackup sink about start of backup */
320 
321  /* Send off our tablespaces one by one */
322  foreach(lc, state.tablespaces)
323  {
324  tablespaceinfo *ti = (tablespaceinfo *) lfirst(lc);
325 
326  if (ti->path == NULL)
327  {
328  struct stat statbuf;
329  bool sendtblspclinks = true;
330  char *backup_label;
331 
332  bbsink_begin_archive(sink, "base.tar");
333 
334  /* In the main tar, include the backup_label first... */
335  backup_label = build_backup_content(backup_state, false);
337  backup_label, -1, &manifest);
338  pfree(backup_label);
339 
340  /* Then the tablespace_map file, if required... */
341  if (opt->sendtblspcmapfile)
342  {
344  tablespace_map->data, -1, &manifest);
345  sendtblspclinks = false;
346  }
347 
348  /* Then the bulk of the files... */
349  sendDir(sink, ".", 1, false, state.tablespaces,
350  sendtblspclinks, &manifest, InvalidOid, ib);
351 
352  /* ... and pg_control after everything else. */
353  if (lstat(XLOG_CONTROL_FILE, &statbuf) != 0)
354  ereport(ERROR,
356  errmsg("could not stat file \"%s\": %m",
359  false, InvalidOid, InvalidOid,
360  InvalidRelFileNumber, 0, &manifest, 0, NULL, 0);
361  }
362  else
363  {
364  char *archive_name = psprintf("%u.tar", ti->oid);
365 
366  bbsink_begin_archive(sink, archive_name);
367 
368  sendTablespace(sink, ti->path, ti->oid, false, &manifest, ib);
369  }
370 
371  /*
372  * If we're including WAL, and this is the main data directory we
373  * don't treat this as the end of the tablespace. Instead, we will
374  * include the xlog files below and stop afterwards. This is safe
375  * since the main data directory is always sent *last*.
376  */
377  if (opt->includewal && ti->path == NULL)
378  {
379  Assert(lnext(state.tablespaces, lc) == NULL);
380  }
381  else
382  {
383  /* Properly terminate the tarfile. */
384  StaticAssertDecl(2 * TAR_BLOCK_SIZE <= BLCKSZ,
385  "BLCKSZ too small for 2 tar blocks");
386  memset(sink->bbs_buffer, 0, 2 * TAR_BLOCK_SIZE);
388 
389  /* OK, that's the end of the archive. */
390  bbsink_end_archive(sink);
391  }
392  }
393 
396 
397  endptr = backup_state->stoppoint;
398  endtli = backup_state->stoptli;
399 
400  /* Deallocate backup-related variables. */
403  }
405 
406 
407  if (opt->includewal)
408  {
409  /*
410  * We've left the last tar file "open", so we can now append the
411  * required WAL files to it.
412  */
413  char pathbuf[MAXPGPATH];
414  XLogSegNo segno;
415  XLogSegNo startsegno;
416  XLogSegNo endsegno;
417  struct stat statbuf;
418  List *historyFileList = NIL;
419  List *walFileList = NIL;
420  char firstoff[MAXFNAMELEN];
421  char lastoff[MAXFNAMELEN];
422  DIR *dir;
423  struct dirent *de;
424  ListCell *lc;
425  TimeLineID tli;
426 
428 
429  /*
430  * I'd rather not worry about timelines here, so scan pg_wal and
431  * include all WAL files in the range between 'startptr' and 'endptr',
432  * regardless of the timeline the file is stamped with. If there are
433  * some spurious WAL files belonging to timelines that don't belong in
434  * this server's history, they will be included too. Normally there
435  * shouldn't be such files, but if there are, there's little harm in
436  * including them.
437  */
438  XLByteToSeg(state.startptr, startsegno, wal_segment_size);
439  XLogFileName(firstoff, state.starttli, startsegno, wal_segment_size);
440  XLByteToPrevSeg(endptr, endsegno, wal_segment_size);
441  XLogFileName(lastoff, endtli, endsegno, wal_segment_size);
442 
443  dir = AllocateDir("pg_wal");
444  while ((de = ReadDir(dir, "pg_wal")) != NULL)
445  {
446  /* Does it look like a WAL segment, and is it in the range? */
447  if (IsXLogFileName(de->d_name) &&
448  strcmp(de->d_name + 8, firstoff + 8) >= 0 &&
449  strcmp(de->d_name + 8, lastoff + 8) <= 0)
450  {
451  walFileList = lappend(walFileList, pstrdup(de->d_name));
452  }
453  /* Does it look like a timeline history file? */
454  else if (IsTLHistoryFileName(de->d_name))
455  {
456  historyFileList = lappend(historyFileList, pstrdup(de->d_name));
457  }
458  }
459  FreeDir(dir);
460 
461  /*
462  * Before we go any further, check that none of the WAL segments we
463  * need were removed.
464  */
465  CheckXLogRemoved(startsegno, state.starttli);
466 
467  /*
468  * Sort the WAL filenames. We want to send the files in order from
469  * oldest to newest, to reduce the chance that a file is recycled
470  * before we get a chance to send it over.
471  */
472  list_sort(walFileList, compareWalFileNames);
473 
474  /*
475  * There must be at least one xlog file in the pg_wal directory, since
476  * we are doing backup-including-xlog.
477  */
478  if (walFileList == NIL)
479  ereport(ERROR,
480  (errmsg("could not find any WAL files")));
481 
482  /*
483  * Sanity check: the first and last segment should cover startptr and
484  * endptr, with no gaps in between.
485  */
486  XLogFromFileName((char *) linitial(walFileList),
487  &tli, &segno, wal_segment_size);
488  if (segno != startsegno)
489  {
490  char startfname[MAXFNAMELEN];
491 
492  XLogFileName(startfname, state.starttli, startsegno,
494  ereport(ERROR,
495  (errmsg("could not find WAL file \"%s\"", startfname)));
496  }
497  foreach(lc, walFileList)
498  {
499  char *walFileName = (char *) lfirst(lc);
500  XLogSegNo currsegno = segno;
501  XLogSegNo nextsegno = segno + 1;
502 
503  XLogFromFileName(walFileName, &tli, &segno, wal_segment_size);
504  if (!(nextsegno == segno || currsegno == segno))
505  {
506  char nextfname[MAXFNAMELEN];
507 
508  XLogFileName(nextfname, tli, nextsegno, wal_segment_size);
509  ereport(ERROR,
510  (errmsg("could not find WAL file \"%s\"", nextfname)));
511  }
512  }
513  if (segno != endsegno)
514  {
515  char endfname[MAXFNAMELEN];
516 
517  XLogFileName(endfname, endtli, endsegno, wal_segment_size);
518  ereport(ERROR,
519  (errmsg("could not find WAL file \"%s\"", endfname)));
520  }
521 
522  /* Ok, we have everything we need. Send the WAL files. */
523  foreach(lc, walFileList)
524  {
525  char *walFileName = (char *) lfirst(lc);
526  int fd;
527  ssize_t cnt;
528  pgoff_t len = 0;
529 
530  snprintf(pathbuf, MAXPGPATH, XLOGDIR "/%s", walFileName);
531  XLogFromFileName(walFileName, &tli, &segno, wal_segment_size);
532 
533  fd = OpenTransientFile(pathbuf, O_RDONLY | PG_BINARY);
534  if (fd < 0)
535  {
536  int save_errno = errno;
537 
538  /*
539  * Most likely reason for this is that the file was already
540  * removed by a checkpoint, so check for that to get a better
541  * error message.
542  */
543  CheckXLogRemoved(segno, tli);
544 
545  errno = save_errno;
546  ereport(ERROR,
548  errmsg("could not open file \"%s\": %m", pathbuf)));
549  }
550 
551  if (fstat(fd, &statbuf) != 0)
552  ereport(ERROR,
554  errmsg("could not stat file \"%s\": %m",
555  pathbuf)));
556  if (statbuf.st_size != wal_segment_size)
557  {
558  CheckXLogRemoved(segno, tli);
559  ereport(ERROR,
561  errmsg("unexpected WAL file size \"%s\"", walFileName)));
562  }
563 
564  /* send the WAL file itself */
565  _tarWriteHeader(sink, pathbuf, NULL, &statbuf, false);
566 
567  while ((cnt = basebackup_read_file(fd, sink->bbs_buffer,
568  Min(sink->bbs_buffer_length,
570  len, pathbuf, true)) > 0)
571  {
572  CheckXLogRemoved(segno, tli);
573  bbsink_archive_contents(sink, cnt);
574 
575  len += cnt;
576 
577  if (len == wal_segment_size)
578  break;
579  }
580 
581  if (len != wal_segment_size)
582  {
583  CheckXLogRemoved(segno, tli);
584  ereport(ERROR,
586  errmsg("unexpected WAL file size \"%s\"", walFileName)));
587  }
588 
589  /*
590  * wal_segment_size is a multiple of TAR_BLOCK_SIZE, so no need
591  * for padding.
592  */
594 
596 
597  /*
598  * Mark file as archived, otherwise files can get archived again
599  * after promotion of a new node. This is in line with
600  * walreceiver.c always doing an XLogArchiveForceDone() after a
601  * complete segment.
602  */
603  StatusFilePath(pathbuf, walFileName, ".done");
604  sendFileWithContent(sink, pathbuf, "", -1, &manifest);
605  }
606 
607  /*
608  * Send timeline history files too. Only the latest timeline history
609  * file is required for recovery, and even that only if there happens
610  * to be a timeline switch in the first WAL segment that contains the
611  * checkpoint record, or if we're taking a base backup from a standby
612  * server and the target timeline changes while the backup is taken.
613  * But they are small and highly useful for debugging purposes, so
614  * better include them all, always.
615  */
616  foreach(lc, historyFileList)
617  {
618  char *fname = lfirst(lc);
619 
620  snprintf(pathbuf, MAXPGPATH, XLOGDIR "/%s", fname);
621 
622  if (lstat(pathbuf, &statbuf) != 0)
623  ereport(ERROR,
625  errmsg("could not stat file \"%s\": %m", pathbuf)));
626 
627  sendFile(sink, pathbuf, pathbuf, &statbuf, false,
629  &manifest, 0, NULL, 0);
630 
631  /* unconditionally mark file as archived */
632  StatusFilePath(pathbuf, fname, ".done");
633  sendFileWithContent(sink, pathbuf, "", -1, &manifest);
634  }
635 
636  /* Properly terminate the tar file. */
637  StaticAssertStmt(2 * TAR_BLOCK_SIZE <= BLCKSZ,
638  "BLCKSZ too small for 2 tar blocks");
639  memset(sink->bbs_buffer, 0, 2 * TAR_BLOCK_SIZE);
641 
642  /* OK, that's the end of the archive. */
643  bbsink_end_archive(sink);
644  }
645 
646  AddWALInfoToBackupManifest(&manifest, state.startptr, state.starttli,
647  endptr, endtli);
648 
650 
651  bbsink_end_backup(sink, endptr, endtli);
652 
654  {
655  if (total_checksum_failures > 1)
657  (errmsg_plural("%lld total checksum verification failure",
658  "%lld total checksum verification failures",
661 
662  ereport(ERROR,
664  errmsg("checksum verification failure during base backup")));
665  }
666 
667  /*
668  * Make sure to free the manifest before the resource owners as manifests
669  * use cryptohash contexts that may depend on resource owners (like
670  * OpenSSL).
671  */
673 
674  /* clean up the resource owner we created */
675  WalSndResourceCleanup(true);
676 
678 }
679 
680 /*
681  * list_sort comparison function, to compare log/seg portion of WAL segment
682  * filenames, ignoring the timeline portion.
683  */
684 static int
686 {
687  char *fna = (char *) lfirst(a);
688  char *fnb = (char *) lfirst(b);
689 
690  return strcmp(fna + 8, fnb + 8);
691 }
692 
693 /*
694  * Parse the base backup options passed down by the parser
695  */
696 static void
698 {
699  ListCell *lopt;
700  bool o_label = false;
701  bool o_progress = false;
702  bool o_checkpoint = false;
703  bool o_nowait = false;
704  bool o_wal = false;
705  bool o_incremental = false;
706  bool o_maxrate = false;
707  bool o_tablespace_map = false;
708  bool o_noverify_checksums = false;
709  bool o_manifest = false;
710  bool o_manifest_checksums = false;
711  bool o_target = false;
712  bool o_target_detail = false;
713  char *target_str = NULL;
714  char *target_detail_str = NULL;
715  bool o_compression = false;
716  bool o_compression_detail = false;
717  char *compression_detail_str = NULL;
718 
719  MemSet(opt, 0, sizeof(*opt));
724 
725  foreach(lopt, options)
726  {
727  DefElem *defel = (DefElem *) lfirst(lopt);
728 
729  if (strcmp(defel->defname, "label") == 0)
730  {
731  if (o_label)
732  ereport(ERROR,
733  (errcode(ERRCODE_SYNTAX_ERROR),
734  errmsg("duplicate option \"%s\"", defel->defname)));
735  opt->label = defGetString(defel);
736  o_label = true;
737  }
738  else if (strcmp(defel->defname, "progress") == 0)
739  {
740  if (o_progress)
741  ereport(ERROR,
742  (errcode(ERRCODE_SYNTAX_ERROR),
743  errmsg("duplicate option \"%s\"", defel->defname)));
744  opt->progress = defGetBoolean(defel);
745  o_progress = true;
746  }
747  else if (strcmp(defel->defname, "checkpoint") == 0)
748  {
749  char *optval = defGetString(defel);
750 
751  if (o_checkpoint)
752  ereport(ERROR,
753  (errcode(ERRCODE_SYNTAX_ERROR),
754  errmsg("duplicate option \"%s\"", defel->defname)));
755  if (pg_strcasecmp(optval, "fast") == 0)
756  opt->fastcheckpoint = true;
757  else if (pg_strcasecmp(optval, "spread") == 0)
758  opt->fastcheckpoint = false;
759  else
760  ereport(ERROR,
761  (errcode(ERRCODE_SYNTAX_ERROR),
762  errmsg("unrecognized checkpoint type: \"%s\"",
763  optval)));
764  o_checkpoint = true;
765  }
766  else if (strcmp(defel->defname, "wait") == 0)
767  {
768  if (o_nowait)
769  ereport(ERROR,
770  (errcode(ERRCODE_SYNTAX_ERROR),
771  errmsg("duplicate option \"%s\"", defel->defname)));
772  opt->nowait = !defGetBoolean(defel);
773  o_nowait = true;
774  }
775  else if (strcmp(defel->defname, "wal") == 0)
776  {
777  if (o_wal)
778  ereport(ERROR,
779  (errcode(ERRCODE_SYNTAX_ERROR),
780  errmsg("duplicate option \"%s\"", defel->defname)));
781  opt->includewal = defGetBoolean(defel);
782  o_wal = true;
783  }
784  else if (strcmp(defel->defname, "incremental") == 0)
785  {
786  if (o_incremental)
787  ereport(ERROR,
788  (errcode(ERRCODE_SYNTAX_ERROR),
789  errmsg("duplicate option \"%s\"", defel->defname)));
790  opt->incremental = defGetBoolean(defel);
791  if (opt->incremental && !summarize_wal)
792  ereport(ERROR,
793  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
794  errmsg("incremental backups cannot be taken unless WAL summarization is enabled")));
795  o_incremental = true;
796  }
797  else if (strcmp(defel->defname, "max_rate") == 0)
798  {
799  int64 maxrate;
800 
801  if (o_maxrate)
802  ereport(ERROR,
803  (errcode(ERRCODE_SYNTAX_ERROR),
804  errmsg("duplicate option \"%s\"", defel->defname)));
805 
806  maxrate = defGetInt64(defel);
807  if (maxrate < MAX_RATE_LOWER || maxrate > MAX_RATE_UPPER)
808  ereport(ERROR,
809  (errcode(ERRCODE_NUMERIC_VALUE_OUT_OF_RANGE),
810  errmsg("%d is outside the valid range for parameter \"%s\" (%d .. %d)",
811  (int) maxrate, "MAX_RATE", MAX_RATE_LOWER, MAX_RATE_UPPER)));
812 
813  opt->maxrate = (uint32) maxrate;
814  o_maxrate = true;
815  }
816  else if (strcmp(defel->defname, "tablespace_map") == 0)
817  {
818  if (o_tablespace_map)
819  ereport(ERROR,
820  (errcode(ERRCODE_SYNTAX_ERROR),
821  errmsg("duplicate option \"%s\"", defel->defname)));
822  opt->sendtblspcmapfile = defGetBoolean(defel);
823  o_tablespace_map = true;
824  }
825  else if (strcmp(defel->defname, "verify_checksums") == 0)
826  {
827  if (o_noverify_checksums)
828  ereport(ERROR,
829  (errcode(ERRCODE_SYNTAX_ERROR),
830  errmsg("duplicate option \"%s\"", defel->defname)));
832  o_noverify_checksums = true;
833  }
834  else if (strcmp(defel->defname, "manifest") == 0)
835  {
836  char *optval = defGetString(defel);
837  bool manifest_bool;
838 
839  if (o_manifest)
840  ereport(ERROR,
841  (errcode(ERRCODE_SYNTAX_ERROR),
842  errmsg("duplicate option \"%s\"", defel->defname)));
843  if (parse_bool(optval, &manifest_bool))
844  {
845  if (manifest_bool)
847  else
849  }
850  else if (pg_strcasecmp(optval, "force-encode") == 0)
852  else
853  ereport(ERROR,
854  (errcode(ERRCODE_SYNTAX_ERROR),
855  errmsg("unrecognized manifest option: \"%s\"",
856  optval)));
857  o_manifest = true;
858  }
859  else if (strcmp(defel->defname, "manifest_checksums") == 0)
860  {
861  char *optval = defGetString(defel);
862 
863  if (o_manifest_checksums)
864  ereport(ERROR,
865  (errcode(ERRCODE_SYNTAX_ERROR),
866  errmsg("duplicate option \"%s\"", defel->defname)));
867  if (!pg_checksum_parse_type(optval,
868  &opt->manifest_checksum_type))
869  ereport(ERROR,
870  (errcode(ERRCODE_SYNTAX_ERROR),
871  errmsg("unrecognized checksum algorithm: \"%s\"",
872  optval)));
873  o_manifest_checksums = true;
874  }
875  else if (strcmp(defel->defname, "target") == 0)
876  {
877  if (o_target)
878  ereport(ERROR,
879  (errcode(ERRCODE_SYNTAX_ERROR),
880  errmsg("duplicate option \"%s\"", defel->defname)));
881  target_str = defGetString(defel);
882  o_target = true;
883  }
884  else if (strcmp(defel->defname, "target_detail") == 0)
885  {
886  char *optval = defGetString(defel);
887 
888  if (o_target_detail)
889  ereport(ERROR,
890  (errcode(ERRCODE_SYNTAX_ERROR),
891  errmsg("duplicate option \"%s\"", defel->defname)));
892  target_detail_str = optval;
893  o_target_detail = true;
894  }
895  else if (strcmp(defel->defname, "compression") == 0)
896  {
897  char *optval = defGetString(defel);
898 
899  if (o_compression)
900  ereport(ERROR,
901  (errcode(ERRCODE_SYNTAX_ERROR),
902  errmsg("duplicate option \"%s\"", defel->defname)));
903  if (!parse_compress_algorithm(optval, &opt->compression))
904  ereport(ERROR,
905  (errcode(ERRCODE_SYNTAX_ERROR),
906  errmsg("unrecognized compression algorithm: \"%s\"",
907  optval)));
908  o_compression = true;
909  }
910  else if (strcmp(defel->defname, "compression_detail") == 0)
911  {
912  if (o_compression_detail)
913  ereport(ERROR,
914  (errcode(ERRCODE_SYNTAX_ERROR),
915  errmsg("duplicate option \"%s\"", defel->defname)));
916  compression_detail_str = defGetString(defel);
917  o_compression_detail = true;
918  }
919  else
920  ereport(ERROR,
921  (errcode(ERRCODE_SYNTAX_ERROR),
922  errmsg("unrecognized base backup option: \"%s\"",
923  defel->defname)));
924  }
925 
926  if (opt->label == NULL)
927  opt->label = "base backup";
928  if (opt->manifest == MANIFEST_OPTION_NO)
929  {
930  if (o_manifest_checksums)
931  ereport(ERROR,
932  (errcode(ERRCODE_SYNTAX_ERROR),
933  errmsg("manifest checksums require a backup manifest")));
935  }
936 
937  if (target_str == NULL)
938  {
939  if (target_detail_str != NULL)
940  ereport(ERROR,
941  (errcode(ERRCODE_SYNTAX_ERROR),
942  errmsg("target detail cannot be used without target")));
943  opt->use_copytblspc = true;
944  opt->send_to_client = true;
945  }
946  else if (strcmp(target_str, "client") == 0)
947  {
948  if (target_detail_str != NULL)
949  ereport(ERROR,
950  (errcode(ERRCODE_SYNTAX_ERROR),
951  errmsg("target \"%s\" does not accept a target detail",
952  target_str)));
953  opt->send_to_client = true;
954  }
955  else
956  opt->target_handle =
957  BaseBackupGetTargetHandle(target_str, target_detail_str);
958 
959  if (o_compression_detail && !o_compression)
960  ereport(ERROR,
961  (errcode(ERRCODE_SYNTAX_ERROR),
962  errmsg("compression detail cannot be specified unless compression is enabled")));
963 
964  if (o_compression)
965  {
966  char *error_detail;
967 
968  parse_compress_specification(opt->compression, compression_detail_str,
970  error_detail =
972  if (error_detail != NULL)
973  ereport(ERROR,
974  errcode(ERRCODE_SYNTAX_ERROR),
975  errmsg("invalid compression specification: %s",
976  error_detail));
977  }
978 }
979 
980 
981 /*
982  * SendBaseBackup() - send a complete base backup.
983  *
984  * The function will put the system into backup mode like pg_backup_start()
985  * does, so that the backup is consistent even though we read directly from
986  * the filesystem, bypassing the buffer cache.
987  */
988 void
990 {
991  basebackup_options opt;
992  bbsink *sink;
994 
995  if (status == SESSION_BACKUP_RUNNING)
996  ereport(ERROR,
997  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
998  errmsg("a backup is already in progress in this session")));
999 
1000  parse_basebackup_options(cmd->options, &opt);
1001 
1003 
1005  {
1006  char activitymsg[50];
1007 
1008  snprintf(activitymsg, sizeof(activitymsg), "sending backup \"%s\"",
1009  opt.label);
1010  set_ps_display(activitymsg);
1011  }
1012 
1013  /*
1014  * If we're asked to perform an incremental backup and the user has not
1015  * supplied a manifest, that's an ERROR.
1016  *
1017  * If we're asked to perform a full backup and the user did supply a
1018  * manifest, just ignore it.
1019  */
1020  if (!opt.incremental)
1021  ib = NULL;
1022  else if (ib == NULL)
1023  ereport(ERROR,
1024  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
1025  errmsg("must UPLOAD_MANIFEST before performing an incremental BASE_BACKUP")));
1026 
1027  /*
1028  * If the target is specifically 'client' then set up to stream the backup
1029  * to the client; otherwise, it's being sent someplace else and should not
1030  * be sent to the client. BaseBackupGetSink has the job of setting up a
1031  * sink to send the backup data wherever it needs to go.
1032  */
1034  if (opt.target_handle != NULL)
1035  sink = BaseBackupGetSink(opt.target_handle, sink);
1036 
1037  /* Set up network throttling, if client requested it */
1038  if (opt.maxrate > 0)
1039  sink = bbsink_throttle_new(sink, opt.maxrate);
1040 
1041  /* Set up server-side compression, if client requested it */
1042  if (opt.compression == PG_COMPRESSION_GZIP)
1043  sink = bbsink_gzip_new(sink, &opt.compression_specification);
1044  else if (opt.compression == PG_COMPRESSION_LZ4)
1045  sink = bbsink_lz4_new(sink, &opt.compression_specification);
1046  else if (opt.compression == PG_COMPRESSION_ZSTD)
1047  sink = bbsink_zstd_new(sink, &opt.compression_specification);
1048 
1049  /* Set up progress reporting. */
1050  sink = bbsink_progress_new(sink, opt.progress);
1051 
1052  /*
1053  * Perform the base backup, but make sure we clean up the bbsink even if
1054  * an error occurs.
1055  */
1056  PG_TRY();
1057  {
1058  perform_base_backup(&opt, sink, ib);
1059  }
1060  PG_FINALLY();
1061  {
1062  bbsink_cleanup(sink);
1063  }
1064  PG_END_TRY();
1065 }
1066 
1067 /*
1068  * Inject a file with given name and content in the output tar stream.
1069  *
1070  * "len" can optionally be set to an arbitrary length of data sent. If set
1071  * to -1, the content sent is treated as a string with strlen() as length.
1072  */
1073 static void
1074 sendFileWithContent(bbsink *sink, const char *filename, const char *content,
1076 {
1077  struct stat statbuf;
1078  int bytes_done = 0;
1079  pg_checksum_context checksum_ctx;
1080 
1081  if (pg_checksum_init(&checksum_ctx, manifest->checksum_type) < 0)
1082  elog(ERROR, "could not initialize checksum of file \"%s\"",
1083  filename);
1084 
1085  if (len < 0)
1086  len = strlen(content);
1087 
1088  /*
1089  * Construct a stat struct for the file we're injecting in the tar.
1090  */
1091 
1092  /* Windows doesn't have the concept of uid and gid */
1093 #ifdef WIN32
1094  statbuf.st_uid = 0;
1095  statbuf.st_gid = 0;
1096 #else
1097  statbuf.st_uid = geteuid();
1098  statbuf.st_gid = getegid();
1099 #endif
1100  statbuf.st_mtime = time(NULL);
1101  statbuf.st_mode = pg_file_create_mode;
1102  statbuf.st_size = len;
1103 
1104  _tarWriteHeader(sink, filename, NULL, &statbuf, false);
1105 
1106  if (pg_checksum_update(&checksum_ctx, (uint8 *) content, len) < 0)
1107  elog(ERROR, "could not update checksum of file \"%s\"",
1108  filename);
1109 
1110  while (bytes_done < len)
1111  {
1112  size_t remaining = len - bytes_done;
1113  size_t nbytes = Min(sink->bbs_buffer_length, remaining);
1114 
1115  memcpy(sink->bbs_buffer, content, nbytes);
1116  bbsink_archive_contents(sink, nbytes);
1117  bytes_done += nbytes;
1118  content += nbytes;
1119  }
1120 
1121  _tarWritePadding(sink, len);
1122 
1124  (pg_time_t) statbuf.st_mtime, &checksum_ctx);
1125 }
1126 
1127 /*
1128  * Include the tablespace directory pointed to by 'path' in the output tar
1129  * stream. If 'sizeonly' is true, we just calculate a total length and return
1130  * it, without actually sending anything.
1131  *
1132  * Only used to send auxiliary tablespaces, not PGDATA.
1133  */
1134 static int64
1135 sendTablespace(bbsink *sink, char *path, Oid spcoid, bool sizeonly,
1137 {
1138  int64 size;
1139  char pathbuf[MAXPGPATH];
1140  struct stat statbuf;
1141 
1142  /*
1143  * 'path' points to the tablespace location, but we only want to include
1144  * the version directory in it that belongs to us.
1145  */
1146  snprintf(pathbuf, sizeof(pathbuf), "%s/%s", path,
1148 
1149  /*
1150  * Store a directory entry in the tar file so we get the permissions
1151  * right.
1152  */
1153  if (lstat(pathbuf, &statbuf) != 0)
1154  {
1155  if (errno != ENOENT)
1156  ereport(ERROR,
1158  errmsg("could not stat file or directory \"%s\": %m",
1159  pathbuf)));
1160 
1161  /* If the tablespace went away while scanning, it's no error. */
1162  return 0;
1163  }
1164 
1165  size = _tarWriteHeader(sink, TABLESPACE_VERSION_DIRECTORY, NULL, &statbuf,
1166  sizeonly);
1167 
1168  /* Send all the files in the tablespace version directory */
1169  size += sendDir(sink, pathbuf, strlen(path), sizeonly, NIL, true, manifest,
1170  spcoid, ib);
1171 
1172  return size;
1173 }
1174 
1175 /*
1176  * Include all files from the given directory in the output tar stream. If
1177  * 'sizeonly' is true, we just calculate a total length and return it, without
1178  * actually sending anything.
1179  *
1180  * Omit any directory in the tablespaces list, to avoid backing up
1181  * tablespaces twice when they were created inside PGDATA.
1182  *
1183  * If sendtblspclinks is true, we need to include symlink
1184  * information in the tar file. If not, we can skip that
1185  * as it will be sent separately in the tablespace_map file.
1186  */
1187 static int64
1188 sendDir(bbsink *sink, const char *path, int basepathlen, bool sizeonly,
1189  List *tablespaces, bool sendtblspclinks, backup_manifest_info *manifest,
1190  Oid spcoid, IncrementalBackupInfo *ib)
1191 {
1192  DIR *dir;
1193  struct dirent *de;
1194  char pathbuf[MAXPGPATH * 2];
1195  struct stat statbuf;
1196  int64 size = 0;
1197  const char *lastDir; /* Split last dir from parent path. */
1198  bool isRelationDir = false; /* Does directory contain relations? */
1199  bool isGlobalDir = false;
1200  Oid dboid = InvalidOid;
1201  BlockNumber *relative_block_numbers = NULL;
1202 
1203  /*
1204  * Since this array is relatively large, avoid putting it on the stack.
1205  * But we don't need it at all if this is not an incremental backup.
1206  */
1207  if (ib != NULL)
1208  relative_block_numbers = palloc(sizeof(BlockNumber) * RELSEG_SIZE);
1209 
1210  /*
1211  * Determine if the current path is a database directory that can contain
1212  * relations.
1213  *
1214  * Start by finding the location of the delimiter between the parent path
1215  * and the current path.
1216  */
1217  lastDir = last_dir_separator(path);
1218 
1219  /* Does this path look like a database path (i.e. all digits)? */
1220  if (lastDir != NULL &&
1221  strspn(lastDir + 1, "0123456789") == strlen(lastDir + 1))
1222  {
1223  /* Part of path that contains the parent directory. */
1224  int parentPathLen = lastDir - path;
1225 
1226  /*
1227  * Mark path as a database directory if the parent path is either
1228  * $PGDATA/base or a tablespace version path.
1229  */
1230  if (strncmp(path, "./base", parentPathLen) == 0 ||
1231  (parentPathLen >= (sizeof(TABLESPACE_VERSION_DIRECTORY) - 1) &&
1232  strncmp(lastDir - (sizeof(TABLESPACE_VERSION_DIRECTORY) - 1),
1234  sizeof(TABLESPACE_VERSION_DIRECTORY) - 1) == 0))
1235  {
1236  isRelationDir = true;
1237  dboid = atooid(lastDir + 1);
1238  }
1239  }
1240  else if (strcmp(path, "./global") == 0)
1241  {
1242  isRelationDir = true;
1243  isGlobalDir = true;
1244  }
1245 
1246  dir = AllocateDir(path);
1247  while ((de = ReadDir(dir, path)) != NULL)
1248  {
1249  int excludeIdx;
1250  bool excludeFound;
1251  RelFileNumber relfilenumber = InvalidRelFileNumber;
1252  ForkNumber relForkNum = InvalidForkNumber;
1253  unsigned segno = 0;
1254  bool isRelationFile = false;
1255 
1256  /* Skip special stuff */
1257  if (strcmp(de->d_name, ".") == 0 || strcmp(de->d_name, "..") == 0)
1258  continue;
1259 
1260  /* Skip temporary files */
1261  if (strncmp(de->d_name,
1263  strlen(PG_TEMP_FILE_PREFIX)) == 0)
1264  continue;
1265 
1266  /* Skip macOS system files */
1267  if (strcmp(de->d_name, ".DS_Store") == 0)
1268  continue;
1269 
1270  /*
1271  * Check if the postmaster has signaled us to exit, and abort with an
1272  * error in that case. The error handler further up will call
1273  * do_pg_abort_backup() for us. Also check that if the backup was
1274  * started while still in recovery, the server wasn't promoted.
1275  * do_pg_backup_stop() will check that too, but it's better to stop
1276  * the backup early than continue to the end and fail there.
1277  */
1280  ereport(ERROR,
1281  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
1282  errmsg("the standby was promoted during online backup"),
1283  errhint("This means that the backup being taken is corrupt "
1284  "and should not be used. "
1285  "Try taking another online backup.")));
1286 
1287  /* Scan for files that should be excluded */
1288  excludeFound = false;
1289  for (excludeIdx = 0; excludeFiles[excludeIdx].name != NULL; excludeIdx++)
1290  {
1291  int cmplen = strlen(excludeFiles[excludeIdx].name);
1292 
1293  if (!excludeFiles[excludeIdx].match_prefix)
1294  cmplen++;
1295  if (strncmp(de->d_name, excludeFiles[excludeIdx].name, cmplen) == 0)
1296  {
1297  elog(DEBUG1, "file \"%s\" excluded from backup", de->d_name);
1298  excludeFound = true;
1299  break;
1300  }
1301  }
1302 
1303  if (excludeFound)
1304  continue;
1305 
1306  /*
1307  * If there could be non-temporary relation files in this directory,
1308  * try to parse the filename.
1309  */
1310  if (isRelationDir)
1311  isRelationFile =
1313  &relfilenumber,
1314  &relForkNum, &segno);
1315 
1316  /* Exclude all forks for unlogged tables except the init fork */
1317  if (isRelationFile && relForkNum != INIT_FORKNUM)
1318  {
1319  char initForkFile[MAXPGPATH];
1320 
1321  /*
1322  * If any other type of fork, check if there is an init fork with
1323  * the same RelFileNumber. If so, the file can be excluded.
1324  */
1325  snprintf(initForkFile, sizeof(initForkFile), "%s/%u_init",
1326  path, relfilenumber);
1327 
1328  if (lstat(initForkFile, &statbuf) == 0)
1329  {
1330  elog(DEBUG2,
1331  "unlogged relation file \"%s\" excluded from backup",
1332  de->d_name);
1333 
1334  continue;
1335  }
1336  }
1337 
1338  /* Exclude temporary relations */
1339  if (OidIsValid(dboid) && looks_like_temp_rel_name(de->d_name))
1340  {
1341  elog(DEBUG2,
1342  "temporary relation file \"%s\" excluded from backup",
1343  de->d_name);
1344 
1345  continue;
1346  }
1347 
1348  snprintf(pathbuf, sizeof(pathbuf), "%s/%s", path, de->d_name);
1349 
1350  /* Skip pg_control here to back up it last */
1351  if (strcmp(pathbuf, "./global/pg_control") == 0)
1352  continue;
1353 
1354  if (lstat(pathbuf, &statbuf) != 0)
1355  {
1356  if (errno != ENOENT)
1357  ereport(ERROR,
1359  errmsg("could not stat file or directory \"%s\": %m",
1360  pathbuf)));
1361 
1362  /* If the file went away while scanning, it's not an error. */
1363  continue;
1364  }
1365 
1366  /* Scan for directories whose contents should be excluded */
1367  excludeFound = false;
1368  for (excludeIdx = 0; excludeDirContents[excludeIdx] != NULL; excludeIdx++)
1369  {
1370  if (strcmp(de->d_name, excludeDirContents[excludeIdx]) == 0)
1371  {
1372  elog(DEBUG1, "contents of directory \"%s\" excluded from backup", de->d_name);
1373  convert_link_to_directory(pathbuf, &statbuf);
1374  size += _tarWriteHeader(sink, pathbuf + basepathlen + 1, NULL,
1375  &statbuf, sizeonly);
1376  excludeFound = true;
1377  break;
1378  }
1379  }
1380 
1381  if (excludeFound)
1382  continue;
1383 
1384  /*
1385  * We can skip pg_wal, the WAL segments need to be fetched from the
1386  * WAL archive anyway. But include it as an empty directory anyway, so
1387  * we get permissions right.
1388  */
1389  if (strcmp(pathbuf, "./pg_wal") == 0)
1390  {
1391  /* If pg_wal is a symlink, write it as a directory anyway */
1392  convert_link_to_directory(pathbuf, &statbuf);
1393  size += _tarWriteHeader(sink, pathbuf + basepathlen + 1, NULL,
1394  &statbuf, sizeonly);
1395 
1396  /*
1397  * Also send archive_status and summaries directories (by
1398  * hackishly reusing statbuf from above ...).
1399  */
1400  size += _tarWriteHeader(sink, "./pg_wal/archive_status", NULL,
1401  &statbuf, sizeonly);
1402  size += _tarWriteHeader(sink, "./pg_wal/summaries", NULL,
1403  &statbuf, sizeonly);
1404 
1405  continue; /* don't recurse into pg_wal */
1406  }
1407 
1408  /* Allow symbolic links in pg_tblspc only */
1409  if (strcmp(path, "./pg_tblspc") == 0 && S_ISLNK(statbuf.st_mode))
1410  {
1411  char linkpath[MAXPGPATH];
1412  int rllen;
1413 
1414  rllen = readlink(pathbuf, linkpath, sizeof(linkpath));
1415  if (rllen < 0)
1416  ereport(ERROR,
1418  errmsg("could not read symbolic link \"%s\": %m",
1419  pathbuf)));
1420  if (rllen >= sizeof(linkpath))
1421  ereport(ERROR,
1422  (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED),
1423  errmsg("symbolic link \"%s\" target is too long",
1424  pathbuf)));
1425  linkpath[rllen] = '\0';
1426 
1427  size += _tarWriteHeader(sink, pathbuf + basepathlen + 1, linkpath,
1428  &statbuf, sizeonly);
1429  }
1430  else if (S_ISDIR(statbuf.st_mode))
1431  {
1432  bool skip_this_dir = false;
1433  ListCell *lc;
1434 
1435  /*
1436  * Store a directory entry in the tar file so we can get the
1437  * permissions right.
1438  */
1439  size += _tarWriteHeader(sink, pathbuf + basepathlen + 1, NULL, &statbuf,
1440  sizeonly);
1441 
1442  /*
1443  * Call ourselves recursively for a directory, unless it happens
1444  * to be a separate tablespace located within PGDATA.
1445  */
1446  foreach(lc, tablespaces)
1447  {
1448  tablespaceinfo *ti = (tablespaceinfo *) lfirst(lc);
1449 
1450  /*
1451  * ti->rpath is the tablespace relative path within PGDATA, or
1452  * NULL if the tablespace has been properly located somewhere
1453  * else.
1454  *
1455  * Skip past the leading "./" in pathbuf when comparing.
1456  */
1457  if (ti->rpath && strcmp(ti->rpath, pathbuf + 2) == 0)
1458  {
1459  skip_this_dir = true;
1460  break;
1461  }
1462  }
1463 
1464  /*
1465  * skip sending directories inside pg_tblspc, if not required.
1466  */
1467  if (strcmp(pathbuf, "./pg_tblspc") == 0 && !sendtblspclinks)
1468  skip_this_dir = true;
1469 
1470  if (!skip_this_dir)
1471  size += sendDir(sink, pathbuf, basepathlen, sizeonly, tablespaces,
1472  sendtblspclinks, manifest, spcoid, ib);
1473  }
1474  else if (S_ISREG(statbuf.st_mode))
1475  {
1476  bool sent = false;
1477  unsigned num_blocks_required = 0;
1478  unsigned truncation_block_length = 0;
1479  char tarfilenamebuf[MAXPGPATH * 2];
1480  char *tarfilename = pathbuf + basepathlen + 1;
1482 
1483  if (ib != NULL && isRelationFile)
1484  {
1485  Oid relspcoid;
1486  char *lookup_path;
1487 
1488  if (OidIsValid(spcoid))
1489  {
1490  relspcoid = spcoid;
1491  lookup_path = psprintf("%s/%u/%s", PG_TBLSPC_DIR, spcoid,
1492  tarfilename);
1493  }
1494  else
1495  {
1496  if (isGlobalDir)
1497  relspcoid = GLOBALTABLESPACE_OID;
1498  else
1499  relspcoid = DEFAULTTABLESPACE_OID;
1500  lookup_path = pstrdup(tarfilename);
1501  }
1502 
1503  method = GetFileBackupMethod(ib, lookup_path, dboid, relspcoid,
1504  relfilenumber, relForkNum,
1505  segno, statbuf.st_size,
1506  &num_blocks_required,
1507  relative_block_numbers,
1508  &truncation_block_length);
1509  if (method == BACK_UP_FILE_INCREMENTALLY)
1510  {
1511  statbuf.st_size =
1512  GetIncrementalFileSize(num_blocks_required);
1513  snprintf(tarfilenamebuf, sizeof(tarfilenamebuf),
1514  "%s/INCREMENTAL.%s",
1515  path + basepathlen + 1,
1516  de->d_name);
1517  tarfilename = tarfilenamebuf;
1518  }
1519 
1520  pfree(lookup_path);
1521  }
1522 
1523  if (!sizeonly)
1524  sent = sendFile(sink, pathbuf, tarfilename, &statbuf,
1525  true, dboid, spcoid,
1526  relfilenumber, segno, manifest,
1527  num_blocks_required,
1528  method == BACK_UP_FILE_INCREMENTALLY ? relative_block_numbers : NULL,
1529  truncation_block_length);
1530 
1531  if (sent || sizeonly)
1532  {
1533  /* Add size. */
1534  size += statbuf.st_size;
1535 
1536  /* Pad to a multiple of the tar block size. */
1537  size += tarPaddingBytesRequired(statbuf.st_size);
1538 
1539  /* Size of the header for the file. */
1540  size += TAR_BLOCK_SIZE;
1541  }
1542  }
1543  else
1544  ereport(WARNING,
1545  (errmsg("skipping special file \"%s\"", pathbuf)));
1546  }
1547 
1548  if (relative_block_numbers != NULL)
1549  pfree(relative_block_numbers);
1550 
1551  FreeDir(dir);
1552  return size;
1553 }
1554 
1555 /*
1556  * Given the member, write the TAR header & send the file.
1557  *
1558  * If 'missing_ok' is true, will not throw an error if the file is not found.
1559  *
1560  * If dboid is anything other than InvalidOid then any checksum failures
1561  * detected will get reported to the cumulative stats system.
1562  *
1563  * If the file is to be sent incrementally, then num_incremental_blocks
1564  * should be the number of blocks to be sent, and incremental_blocks
1565  * an array of block numbers relative to the start of the current segment.
1566  * If the whole file is to be sent, then incremental_blocks should be NULL,
1567  * and num_incremental_blocks can have any value, as it will be ignored.
1568  *
1569  * Returns true if the file was successfully sent, false if 'missing_ok',
1570  * and the file did not exist.
1571  */
1572 static bool
1573 sendFile(bbsink *sink, const char *readfilename, const char *tarfilename,
1574  struct stat *statbuf, bool missing_ok, Oid dboid, Oid spcoid,
1575  RelFileNumber relfilenumber, unsigned segno,
1576  backup_manifest_info *manifest, unsigned num_incremental_blocks,
1577  BlockNumber *incremental_blocks, unsigned truncation_block_length)
1578 {
1579  int fd;
1580  BlockNumber blkno = 0;
1581  int checksum_failures = 0;
1582  off_t cnt;
1583  pgoff_t bytes_done = 0;
1584  bool verify_checksum = false;
1585  pg_checksum_context checksum_ctx;
1586  int ibindex = 0;
1587 
1588  if (pg_checksum_init(&checksum_ctx, manifest->checksum_type) < 0)
1589  elog(ERROR, "could not initialize checksum of file \"%s\"",
1590  readfilename);
1591 
1592  fd = OpenTransientFile(readfilename, O_RDONLY | PG_BINARY);
1593  if (fd < 0)
1594  {
1595  if (errno == ENOENT && missing_ok)
1596  return false;
1597  ereport(ERROR,
1599  errmsg("could not open file \"%s\": %m", readfilename)));
1600  }
1601 
1602  _tarWriteHeader(sink, tarfilename, NULL, statbuf, false);
1603 
1604  /*
1605  * Checksums are verified in multiples of BLCKSZ, so the buffer length
1606  * should be a multiple of the block size as well.
1607  */
1608  Assert((sink->bbs_buffer_length % BLCKSZ) == 0);
1609 
1610  /*
1611  * If we weren't told not to verify checksums, and if checksums are
1612  * enabled for this cluster, and if this is a relation file, then verify
1613  * the checksum.
1614  */
1616  RelFileNumberIsValid(relfilenumber))
1617  verify_checksum = true;
1618 
1619  /*
1620  * If we're sending an incremental file, write the file header.
1621  */
1622  if (incremental_blocks != NULL)
1623  {
1624  unsigned magic = INCREMENTAL_MAGIC;
1625  size_t header_bytes_done = 0;
1626  char padding[BLCKSZ];
1627  size_t paddinglen;
1628 
1629  /* Emit header data. */
1630  push_to_sink(sink, &checksum_ctx, &header_bytes_done,
1631  &magic, sizeof(magic));
1632  push_to_sink(sink, &checksum_ctx, &header_bytes_done,
1633  &num_incremental_blocks, sizeof(num_incremental_blocks));
1634  push_to_sink(sink, &checksum_ctx, &header_bytes_done,
1635  &truncation_block_length, sizeof(truncation_block_length));
1636  push_to_sink(sink, &checksum_ctx, &header_bytes_done,
1637  incremental_blocks,
1638  sizeof(BlockNumber) * num_incremental_blocks);
1639 
1640  /*
1641  * Add padding to align header to a multiple of BLCKSZ, but only if
1642  * the incremental file has some blocks, and the alignment is actually
1643  * needed (i.e. header is not already a multiple of BLCKSZ). If there
1644  * are no blocks we don't want to make the file unnecessarily large,
1645  * as that might make some filesystem optimizations impossible.
1646  */
1647  if ((num_incremental_blocks > 0) && (header_bytes_done % BLCKSZ != 0))
1648  {
1649  paddinglen = (BLCKSZ - (header_bytes_done % BLCKSZ));
1650 
1651  memset(padding, 0, paddinglen);
1652  bytes_done += paddinglen;
1653 
1654  push_to_sink(sink, &checksum_ctx, &header_bytes_done,
1655  padding, paddinglen);
1656  }
1657 
1658  /* Flush out any data still in the buffer so it's again empty. */
1659  if (header_bytes_done > 0)
1660  {
1661  bbsink_archive_contents(sink, header_bytes_done);
1662  if (pg_checksum_update(&checksum_ctx,
1663  (uint8 *) sink->bbs_buffer,
1664  header_bytes_done) < 0)
1665  elog(ERROR, "could not update checksum of base backup");
1666  }
1667 
1668  /* Update our notion of file position. */
1669  bytes_done += sizeof(magic);
1670  bytes_done += sizeof(num_incremental_blocks);
1671  bytes_done += sizeof(truncation_block_length);
1672  bytes_done += sizeof(BlockNumber) * num_incremental_blocks;
1673  }
1674 
1675  /*
1676  * Loop until we read the amount of data the caller told us to expect. The
1677  * file could be longer, if it was extended while we were sending it, but
1678  * for a base backup we can ignore such extended data. It will be restored
1679  * from WAL.
1680  */
1681  while (1)
1682  {
1683  /*
1684  * Determine whether we've read all the data that we need, and if not,
1685  * read some more.
1686  */
1687  if (incremental_blocks == NULL)
1688  {
1689  size_t remaining = statbuf->st_size - bytes_done;
1690 
1691  /*
1692  * If we've read the required number of bytes, then it's time to
1693  * stop.
1694  */
1695  if (bytes_done >= statbuf->st_size)
1696  break;
1697 
1698  /*
1699  * Read as many bytes as will fit in the buffer, or however many
1700  * are left to read, whichever is less.
1701  */
1702  cnt = read_file_data_into_buffer(sink, readfilename, fd,
1703  bytes_done, remaining,
1704  blkno + segno * RELSEG_SIZE,
1705  verify_checksum,
1706  &checksum_failures);
1707  }
1708  else
1709  {
1710  BlockNumber relative_blkno;
1711 
1712  /*
1713  * If we've read all the blocks, then it's time to stop.
1714  */
1715  if (ibindex >= num_incremental_blocks)
1716  break;
1717 
1718  /*
1719  * Read just one block, whichever one is the next that we're
1720  * supposed to include.
1721  */
1722  relative_blkno = incremental_blocks[ibindex++];
1723  cnt = read_file_data_into_buffer(sink, readfilename, fd,
1724  relative_blkno * BLCKSZ,
1725  BLCKSZ,
1726  relative_blkno + segno * RELSEG_SIZE,
1727  verify_checksum,
1728  &checksum_failures);
1729 
1730  /*
1731  * If we get a partial read, that must mean that the relation is
1732  * being truncated. Ultimately, it should be truncated to a
1733  * multiple of BLCKSZ, since this path should only be reached for
1734  * relation files, but we might transiently observe an
1735  * intermediate value.
1736  *
1737  * It should be fine to treat this just as if the entire block had
1738  * been truncated away - i.e. fill this and all later blocks with
1739  * zeroes. WAL replay will fix things up.
1740  */
1741  if (cnt < BLCKSZ)
1742  break;
1743  }
1744 
1745  /*
1746  * If the amount of data we were able to read was not a multiple of
1747  * BLCKSZ, we cannot verify checksums, which are block-level.
1748  */
1749  if (verify_checksum && (cnt % BLCKSZ != 0))
1750  {
1751  ereport(WARNING,
1752  (errmsg("could not verify checksum in file \"%s\", block "
1753  "%u: read buffer size %d and page size %d "
1754  "differ",
1755  readfilename, blkno, (int) cnt, BLCKSZ)));
1756  verify_checksum = false;
1757  }
1758 
1759  /*
1760  * If we hit end-of-file, a concurrent truncation must have occurred.
1761  * That's not an error condition, because WAL replay will fix things
1762  * up.
1763  */
1764  if (cnt == 0)
1765  break;
1766 
1767  /* Update block number and # of bytes done for next loop iteration. */
1768  blkno += cnt / BLCKSZ;
1769  bytes_done += cnt;
1770 
1771  /*
1772  * Make sure incremental files with block data are properly aligned
1773  * (header is a multiple of BLCKSZ, blocks are BLCKSZ too).
1774  */
1775  Assert(!((incremental_blocks != NULL && num_incremental_blocks > 0) &&
1776  (bytes_done % BLCKSZ != 0)));
1777 
1778  /* Archive the data we just read. */
1779  bbsink_archive_contents(sink, cnt);
1780 
1781  /* Also feed it to the checksum machinery. */
1782  if (pg_checksum_update(&checksum_ctx,
1783  (uint8 *) sink->bbs_buffer, cnt) < 0)
1784  elog(ERROR, "could not update checksum of base backup");
1785  }
1786 
1787  /* If the file was truncated while we were sending it, pad it with zeros */
1788  while (bytes_done < statbuf->st_size)
1789  {
1790  size_t remaining = statbuf->st_size - bytes_done;
1791  size_t nbytes = Min(sink->bbs_buffer_length, remaining);
1792 
1793  MemSet(sink->bbs_buffer, 0, nbytes);
1794  if (pg_checksum_update(&checksum_ctx,
1795  (uint8 *) sink->bbs_buffer,
1796  nbytes) < 0)
1797  elog(ERROR, "could not update checksum of base backup");
1798  bbsink_archive_contents(sink, nbytes);
1799  bytes_done += nbytes;
1800  }
1801 
1802  /*
1803  * Pad to a block boundary, per tar format requirements. (This small piece
1804  * of data is probably not worth throttling, and is not checksummed
1805  * because it's not actually part of the file.)
1806  */
1807  _tarWritePadding(sink, bytes_done);
1808 
1810 
1811  if (checksum_failures > 1)
1812  {
1813  ereport(WARNING,
1814  (errmsg_plural("file \"%s\" has a total of %d checksum verification failure",
1815  "file \"%s\" has a total of %d checksum verification failures",
1816  checksum_failures,
1817  readfilename, checksum_failures)));
1818 
1819  pgstat_report_checksum_failures_in_db(dboid, checksum_failures);
1820  }
1821 
1822  total_checksum_failures += checksum_failures;
1823 
1824  AddFileToBackupManifest(manifest, spcoid, tarfilename, statbuf->st_size,
1825  (pg_time_t) statbuf->st_mtime, &checksum_ctx);
1826 
1827  return true;
1828 }
1829 
1830 /*
1831  * Read some more data from the file into the bbsink's buffer, verifying
1832  * checksums as required.
1833  *
1834  * 'offset' is the file offset from which we should begin to read, and
1835  * 'length' is the amount of data that should be read. The actual amount
1836  * of data read will be less than the requested amount if the bbsink's
1837  * buffer isn't big enough to hold it all, or if the underlying file has
1838  * been truncated. The return value is the number of bytes actually read.
1839  *
1840  * 'blkno' is the block number of the first page in the bbsink's buffer
1841  * relative to the start of the relation.
1842  *
1843  * 'verify_checksum' indicates whether we should try to verify checksums
1844  * for the blocks we read. If we do this, we'll update *checksum_failures
1845  * and issue warnings as appropriate.
1846  */
1847 static off_t
1848 read_file_data_into_buffer(bbsink *sink, const char *readfilename, int fd,
1849  off_t offset, size_t length, BlockNumber blkno,
1850  bool verify_checksum, int *checksum_failures)
1851 {
1852  off_t cnt;
1853  int i;
1854  char *page;
1855 
1856  /* Try to read some more data. */
1857  cnt = basebackup_read_file(fd, sink->bbs_buffer,
1858  Min(sink->bbs_buffer_length, length),
1859  offset, readfilename, true);
1860 
1861  /* Can't verify checksums if read length is not a multiple of BLCKSZ. */
1862  if (!verify_checksum || (cnt % BLCKSZ) != 0)
1863  return cnt;
1864 
1865  /* Verify checksum for each block. */
1866  for (i = 0; i < cnt / BLCKSZ; i++)
1867  {
1868  int reread_cnt;
1869  uint16 expected_checksum;
1870 
1871  page = sink->bbs_buffer + BLCKSZ * i;
1872 
1873  /* If the page is OK, go on to the next one. */
1874  if (verify_page_checksum(page, sink->bbs_state->startptr, blkno + i,
1875  &expected_checksum))
1876  continue;
1877 
1878  /*
1879  * Retry the block on the first failure. It's possible that we read
1880  * the first 4K page of the block just before postgres updated the
1881  * entire block so it ends up looking torn to us. If, before we retry
1882  * the read, the concurrent write of the block finishes, the page LSN
1883  * will be updated and we'll realize that we should ignore this block.
1884  *
1885  * There's no guarantee that this will actually happen, though: the
1886  * torn write could take an arbitrarily long time to complete.
1887  * Retrying multiple times wouldn't fix this problem, either, though
1888  * it would reduce the chances of it happening in practice. The only
1889  * real fix here seems to be to have some kind of interlock that
1890  * allows us to wait until we can be certain that no write to the
1891  * block is in progress. Since we don't have any such thing right now,
1892  * we just do this and hope for the best.
1893  */
1894  reread_cnt =
1895  basebackup_read_file(fd, sink->bbs_buffer + BLCKSZ * i,
1896  BLCKSZ, offset + BLCKSZ * i,
1897  readfilename, false);
1898  if (reread_cnt == 0)
1899  {
1900  /*
1901  * If we hit end-of-file, a concurrent truncation must have
1902  * occurred, so reduce cnt to reflect only the blocks already
1903  * processed and break out of this loop.
1904  */
1905  cnt = BLCKSZ * i;
1906  break;
1907  }
1908 
1909  /* If the page now looks OK, go on to the next one. */
1910  if (verify_page_checksum(page, sink->bbs_state->startptr, blkno + i,
1911  &expected_checksum))
1912  continue;
1913 
1914  /* Handle checksum failure. */
1915  (*checksum_failures)++;
1916  if (*checksum_failures <= 5)
1917  ereport(WARNING,
1918  (errmsg("checksum verification failed in "
1919  "file \"%s\", block %u: calculated "
1920  "%X but expected %X",
1921  readfilename, blkno + i, expected_checksum,
1922  ((PageHeader) page)->pd_checksum)));
1923  if (*checksum_failures == 5)
1924  ereport(WARNING,
1925  (errmsg("further checksum verification "
1926  "failures in file \"%s\" will not "
1927  "be reported", readfilename)));
1928  }
1929 
1930  return cnt;
1931 }
1932 
1933 /*
1934  * Push data into a bbsink.
1935  *
1936  * It's better, when possible, to read data directly into the bbsink's buffer,
1937  * rather than using this function to copy it into the buffer; this function is
1938  * for cases where that approach is not practical.
1939  *
1940  * bytes_done should point to a count of the number of bytes that are
1941  * currently used in the bbsink's buffer. Upon return, the bytes identified by
1942  * data and length will have been copied into the bbsink's buffer, flushing
1943  * as required, and *bytes_done will have been updated accordingly. If the
1944  * buffer was flushed, the previous contents will also have been fed to
1945  * checksum_ctx.
1946  *
1947  * Note that after one or more calls to this function it is the caller's
1948  * responsibility to perform any required final flush.
1949  */
1950 static void
1952  size_t *bytes_done, void *data, size_t length)
1953 {
1954  while (length > 0)
1955  {
1956  size_t bytes_to_copy;
1957 
1958  /*
1959  * We use < here rather than <= so that if the data exactly fills the
1960  * remaining buffer space, we trigger a flush now.
1961  */
1962  if (length < sink->bbs_buffer_length - *bytes_done)
1963  {
1964  /* Append remaining data to buffer. */
1965  memcpy(sink->bbs_buffer + *bytes_done, data, length);
1966  *bytes_done += length;
1967  return;
1968  }
1969 
1970  /* Copy until buffer is full and flush it. */
1971  bytes_to_copy = sink->bbs_buffer_length - *bytes_done;
1972  memcpy(sink->bbs_buffer + *bytes_done, data, bytes_to_copy);
1973  data = ((char *) data) + bytes_to_copy;
1974  length -= bytes_to_copy;
1976  if (pg_checksum_update(checksum_ctx, (uint8 *) sink->bbs_buffer,
1977  sink->bbs_buffer_length) < 0)
1978  elog(ERROR, "could not update checksum");
1979  *bytes_done = 0;
1980  }
1981 }
1982 
1983 /*
1984  * Try to verify the checksum for the provided page, if it seems appropriate
1985  * to do so.
1986  *
1987  * Returns true if verification succeeds or if we decide not to check it,
1988  * and false if verification fails. When return false, it also sets
1989  * *expected_checksum to the computed value.
1990  */
1991 static bool
1993  uint16 *expected_checksum)
1994 {
1995  PageHeader phdr;
1996  uint16 checksum;
1997 
1998  /*
1999  * Only check pages which have not been modified since the start of the
2000  * base backup. Otherwise, they might have been written only halfway and
2001  * the checksum would not be valid. However, replaying WAL would
2002  * reinstate the correct page in this case. We also skip completely new
2003  * pages, since they don't have a checksum yet.
2004  */
2005  if (PageIsNew(page) || PageGetLSN(page) >= start_lsn)
2006  return true;
2007 
2008  /* Perform the actual checksum calculation. */
2009  checksum = pg_checksum_page(page, blkno);
2010 
2011  /* See whether it matches the value from the page. */
2012  phdr = (PageHeader) page;
2013  if (phdr->pd_checksum == checksum)
2014  return true;
2015  *expected_checksum = checksum;
2016  return false;
2017 }
2018 
2019 static int64
2020 _tarWriteHeader(bbsink *sink, const char *filename, const char *linktarget,
2021  struct stat *statbuf, bool sizeonly)
2022 {
2023  enum tarError rc;
2024 
2025  if (!sizeonly)
2026  {
2027  /*
2028  * As of this writing, the smallest supported block size is 1kB, which
2029  * is twice TAR_BLOCK_SIZE. Since the buffer size is required to be a
2030  * multiple of BLCKSZ, it should be safe to assume that the buffer is
2031  * large enough to fit an entire tar block. We double-check by means
2032  * of these assertions.
2033  */
2034  StaticAssertDecl(TAR_BLOCK_SIZE <= BLCKSZ,
2035  "BLCKSZ too small for tar block");
2037 
2038  rc = tarCreateHeader(sink->bbs_buffer, filename, linktarget,
2039  statbuf->st_size, statbuf->st_mode,
2040  statbuf->st_uid, statbuf->st_gid,
2041  statbuf->st_mtime);
2042 
2043  switch (rc)
2044  {
2045  case TAR_OK:
2046  break;
2047  case TAR_NAME_TOO_LONG:
2048  ereport(ERROR,
2049  (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED),
2050  errmsg("file name too long for tar format: \"%s\"",
2051  filename)));
2052  break;
2053  case TAR_SYMLINK_TOO_LONG:
2054  ereport(ERROR,
2055  (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED),
2056  errmsg("symbolic link target too long for tar format: "
2057  "file name \"%s\", target \"%s\"",
2058  filename, linktarget)));
2059  break;
2060  default:
2061  elog(ERROR, "unrecognized tar error: %d", rc);
2062  }
2063 
2065  }
2066 
2067  return TAR_BLOCK_SIZE;
2068 }
2069 
2070 /*
2071  * Pad with zero bytes out to a multiple of TAR_BLOCK_SIZE.
2072  */
2073 static void
2075 {
2076  int pad = tarPaddingBytesRequired(len);
2077 
2078  /*
2079  * As in _tarWriteHeader, it should be safe to assume that the buffer is
2080  * large enough that we don't need to do this in multiple chunks.
2081  */
2083  Assert(pad <= TAR_BLOCK_SIZE);
2084 
2085  if (pad > 0)
2086  {
2087  MemSet(sink->bbs_buffer, 0, pad);
2088  bbsink_archive_contents(sink, pad);
2089  }
2090 }
2091 
2092 /*
2093  * If the entry in statbuf is a link, then adjust statbuf to make it look like a
2094  * directory, so that it will be written that way.
2095  */
2096 static void
2097 convert_link_to_directory(const char *pathbuf, struct stat *statbuf)
2098 {
2099  /* If symlink, write it as a directory anyway */
2100  if (S_ISLNK(statbuf->st_mode))
2101  statbuf->st_mode = S_IFDIR | pg_dir_create_mode;
2102 }
2103 
2104 /*
2105  * Read some data from a file, setting a wait event and reporting any error
2106  * encountered.
2107  *
2108  * If partial_read_ok is false, also report an error if the number of bytes
2109  * read is not equal to the number of bytes requested.
2110  *
2111  * Returns the number of bytes read.
2112  */
2113 static ssize_t
2114 basebackup_read_file(int fd, char *buf, size_t nbytes, off_t offset,
2115  const char *filename, bool partial_read_ok)
2116 {
2117  ssize_t rc;
2118 
2119  pgstat_report_wait_start(WAIT_EVENT_BASEBACKUP_READ);
2120  rc = pg_pread(fd, buf, nbytes, offset);
2122 
2123  if (rc < 0)
2124  ereport(ERROR,
2126  errmsg("could not read file \"%s\": %m", filename)));
2127  if (!partial_read_ok && rc > 0 && rc != nbytes)
2128  ereport(ERROR,
2130  errmsg("could not read file \"%s\": read %zd of %zu",
2131  filename, rc, nbytes)));
2132 
2133  return rc;
2134 }
void InitializeBackupManifest(backup_manifest_info *manifest, backup_manifest_option want_manifest, pg_checksum_type manifest_checksum_type)
void AddFileToBackupManifest(backup_manifest_info *manifest, Oid spcoid, const char *pathname, size_t size, pg_time_t mtime, pg_checksum_context *checksum_ctx)
void AddWALInfoToBackupManifest(backup_manifest_info *manifest, XLogRecPtr startptr, TimeLineID starttli, XLogRecPtr endptr, TimeLineID endtli)
void SendBackupManifest(backup_manifest_info *manifest, bbsink *sink)
void FreeBackupManifest(backup_manifest_info *manifest)
@ MANIFEST_OPTION_NO
@ MANIFEST_OPTION_FORCE_ENCODE
@ MANIFEST_OPTION_YES
enum manifest_option backup_manifest_option
static bool sendFile(bbsink *sink, const char *readfilename, const char *tarfilename, struct stat *statbuf, bool missing_ok, Oid dboid, Oid spcoid, RelFileNumber relfilenumber, unsigned segno, backup_manifest_info *manifest, unsigned num_incremental_blocks, BlockNumber *incremental_blocks, unsigned truncation_block_length)
Definition: basebackup.c:1573
static const struct exclude_list_item excludeFiles[]
Definition: basebackup.c:192
static int compareWalFileNames(const ListCell *a, const ListCell *b)
Definition: basebackup.c:685
static void sendFileWithContent(bbsink *sink, const char *filename, const char *content, int len, backup_manifest_info *manifest)
Definition: basebackup.c:1074
static off_t read_file_data_into_buffer(bbsink *sink, const char *readfilename, int fd, off_t offset, size_t length, BlockNumber blkno, bool verify_checksum, int *checksum_failures)
Definition: basebackup.c:1848
static void push_to_sink(bbsink *sink, pg_checksum_context *checksum_ctx, size_t *bytes_done, void *data, size_t length)
Definition: basebackup.c:1951
static int64 sendDir(bbsink *sink, const char *path, int basepathlen, bool sizeonly, List *tablespaces, bool sendtblspclinks, backup_manifest_info *manifest, Oid spcoid, IncrementalBackupInfo *ib)
Definition: basebackup.c:1188
#define SINK_BUFFER_LENGTH
Definition: basebackup.c:61
static void parse_basebackup_options(List *options, basebackup_options *opt)
Definition: basebackup.c:697
static const char *const excludeDirContents[]
Definition: basebackup.c:152
static void convert_link_to_directory(const char *pathbuf, struct stat *statbuf)
Definition: basebackup.c:2097
void SendBaseBackup(BaseBackupCmd *cmd, IncrementalBackupInfo *ib)
Definition: basebackup.c:989
static bool backup_started_in_recovery
Definition: basebackup.c:124
static int64 _tarWriteHeader(bbsink *sink, const char *filename, const char *linktarget, struct stat *statbuf, bool sizeonly)
Definition: basebackup.c:2020
static void perform_base_backup(basebackup_options *opt, bbsink *sink, IncrementalBackupInfo *ib)
Definition: basebackup.c:235
static int64 sendTablespace(bbsink *sink, char *path, Oid spcoid, bool sizeonly, struct backup_manifest_info *manifest, IncrementalBackupInfo *ib)
Definition: basebackup.c:1135
static bool noverify_checksums
Definition: basebackup.c:130
static void _tarWritePadding(bbsink *sink, int len)
Definition: basebackup.c:2074
static bool verify_page_checksum(Page page, XLogRecPtr start_lsn, BlockNumber blkno, uint16 *expected_checksum)
Definition: basebackup.c:1992
static ssize_t basebackup_read_file(int fd, char *buf, size_t nbytes, off_t offset, const char *filename, bool partial_read_ok)
Definition: basebackup.c:2114
static long long int total_checksum_failures
Definition: basebackup.c:127
#define MAX_RATE_UPPER
Definition: basebackup.h:21
#define MAX_RATE_LOWER
Definition: basebackup.h:20
bbsink * bbsink_copystream_new(bool send_to_client)
bbsink * bbsink_gzip_new(bbsink *next, pg_compress_specification *compress)
size_t GetIncrementalFileSize(unsigned num_blocks_required)
FileBackupMethod GetFileBackupMethod(IncrementalBackupInfo *ib, const char *path, Oid dboid, Oid spcoid, RelFileNumber relfilenumber, ForkNumber forknum, unsigned segno, size_t size, unsigned *num_blocks_required, BlockNumber *relative_block_numbers, unsigned *truncation_block_length)
void PrepareForIncrementalBackup(IncrementalBackupInfo *ib, BackupState *backup_state)
#define INCREMENTAL_MAGIC
@ BACK_UP_FILE_INCREMENTALLY
@ BACK_UP_FILE_FULLY
bbsink * bbsink_lz4_new(bbsink *next, pg_compress_specification *compress)
void basebackup_progress_wait_checkpoint(void)
void basebackup_progress_wait_wal_archive(bbsink_state *state)
bbsink * bbsink_progress_new(bbsink *next, bool estimate_backup_size)
void basebackup_progress_done(void)
void basebackup_progress_transfer_wal(void)
void basebackup_progress_estimate_backup_size(void)
static void bbsink_begin_backup(bbsink *sink, bbsink_state *state, int buffer_length)
static void bbsink_begin_archive(bbsink *sink, const char *archive_name)
static void bbsink_end_archive(bbsink *sink)
static void bbsink_end_backup(bbsink *sink, XLogRecPtr endptr, TimeLineID endtli)
static void bbsink_cleanup(bbsink *sink)
static void bbsink_archive_contents(bbsink *sink, size_t len)
bbsink * BaseBackupGetSink(BaseBackupTargetHandle *handle, bbsink *next_sink)
BaseBackupTargetHandle * BaseBackupGetTargetHandle(char *target, char *target_detail)
bbsink * bbsink_throttle_new(bbsink *next, uint32 maxrate)
bbsink * bbsink_zstd_new(bbsink *next, pg_compress_specification *compress)
uint32 BlockNumber
Definition: block.h:31
bool parse_bool(const char *value, bool *result)
Definition: bool.c:31
PageHeaderData * PageHeader
Definition: bufpage.h:173
Pointer Page
Definition: bufpage.h:81
static bool PageIsNew(Page page)
Definition: bufpage.h:233
static XLogRecPtr PageGetLSN(const char *page)
Definition: bufpage.h:386
unsigned short uint16
Definition: c.h:505
unsigned int uint32
Definition: c.h:506
#define Min(x, y)
Definition: c.h:1004
#define Assert(condition)
Definition: c.h:858
#define PG_BINARY
Definition: c.h:1273
unsigned char uint8
Definition: c.h:504
#define MemSet(start, val, len)
Definition: c.h:1020
#define StaticAssertDecl(condition, errmessage)
Definition: c.h:936
#define StaticAssertStmt(condition, errmessage)
Definition: c.h:938
#define OidIsValid(objectId)
Definition: c.h:775
uint16 pg_checksum_page(char *page, BlockNumber blkno)
bool pg_checksum_parse_type(char *name, pg_checksum_type *type)
int pg_checksum_update(pg_checksum_context *context, const uint8 *input, size_t len)
int pg_checksum_init(pg_checksum_context *context, pg_checksum_type type)
pg_checksum_type
@ CHECKSUM_TYPE_NONE
@ CHECKSUM_TYPE_CRC32C
bool parse_compress_algorithm(char *name, pg_compress_algorithm *algorithm)
Definition: compression.c:49
void parse_compress_specification(pg_compress_algorithm algorithm, char *specification, pg_compress_specification *result)
Definition: compression.c:107
char * validate_compress_specification(pg_compress_specification *spec)
Definition: compression.c:344
pg_compress_algorithm
Definition: compression.h:22
@ PG_COMPRESSION_GZIP
Definition: compression.h:24
@ PG_COMPRESSION_LZ4
Definition: compression.h:25
@ PG_COMPRESSION_NONE
Definition: compression.h:23
@ PG_COMPRESSION_ZSTD
Definition: compression.h:26
bool defGetBoolean(DefElem *def)
Definition: define.c:107
char * defGetString(DefElem *def)
Definition: define.c:48
int64 defGetInt64(DefElem *def)
Definition: define.c:186
#define PG_DYNSHMEM_DIR
Definition: dsm_impl.h:51
int errmsg_plural(const char *fmt_singular, const char *fmt_plural, unsigned long n,...)
Definition: elog.c:1180
int errcode_for_file_access(void)
Definition: elog.c:876
int errhint(const char *fmt,...)
Definition: elog.c:1317
int errcode(int sqlerrcode)
Definition: elog.c:853
int errmsg(const char *fmt,...)
Definition: elog.c:1070
#define PG_TRY(...)
Definition: elog.h:371
#define WARNING
Definition: elog.h:36
#define DEBUG2
Definition: elog.h:29
#define PG_END_TRY(...)
Definition: elog.h:396
#define DEBUG1
Definition: elog.h:30
#define ERROR
Definition: elog.h:39
#define elog(elevel,...)
Definition: elog.h:225
#define PG_FINALLY(...)
Definition: elog.h:388
#define ereport(elevel,...)
Definition: elog.h:149
struct dirent * ReadDir(DIR *dir, const char *dirname)
Definition: fd.c:2932
int FreeDir(DIR *dir)
Definition: fd.c:2984
int CloseTransientFile(int fd)
Definition: fd.c:2832
bool looks_like_temp_rel_name(const char *name)
Definition: fd.c:3473
int OpenTransientFile(const char *fileName, int fileFlags)
Definition: fd.c:2656
DIR * AllocateDir(const char *dirname)
Definition: fd.c:2866
int pg_file_create_mode
Definition: file_perm.c:19
int pg_dir_create_mode
Definition: file_perm.c:18
#define PG_TEMP_FILE_PREFIX
Definition: file_utils.h:63
#define PG_AUTOCONF_FILENAME
Definition: guc.h:33
int remaining
Definition: informix.c:692
#define PG_ENSURE_ERROR_CLEANUP(cleanup_function, arg)
Definition: ipc.h:47
#define PG_END_ENSURE_ERROR_CLEANUP(cleanup_function, arg)
Definition: ipc.h:52
int b
Definition: isn.c:70
int a
Definition: isn.c:69
int i
Definition: isn.c:73
void list_sort(List *list, list_sort_comparator cmp)
Definition: list.c:1674
List * lappend(List *list, void *datum)
Definition: list.c:339
char * pstrdup(const char *in)
Definition: mcxt.c:1696
void pfree(void *pointer)
Definition: mcxt.c:1521
void * palloc0(Size size)
Definition: mcxt.c:1347
void * palloc(Size size)
Definition: mcxt.c:1317
#define CHECK_FOR_INTERRUPTS()
Definition: miscadmin.h:122
static bool manifest
static int32 maxrate
#define ERRCODE_DATA_CORRUPTED
Definition: pg_basebackup.c:41
#define MAXPGPATH
const void size_t len
const void * data
static char * filename
Definition: pg_dumpall.c:119
#define lfirst(lc)
Definition: pg_list.h:172
#define NIL
Definition: pg_list.h:68
#define linitial(l)
Definition: pg_list.h:178
static ListCell * lnext(const List *l, const ListCell *c)
Definition: pg_list.h:343
static char * buf
Definition: pg_test_fsync.c:73
#define PG_STAT_TMP_DIR
Definition: pgstat.h:34
void pgstat_report_checksum_failures_in_db(Oid dboid, int failurecount)
static size_t tarPaddingBytesRequired(size_t len)
Definition: pgtar.h:79
enum tarError tarCreateHeader(char *h, const char *filename, const char *linktarget, pgoff_t size, mode_t mode, uid_t uid, gid_t gid, time_t mtime)
Definition: tar.c:114
tarError
Definition: pgtar.h:20
@ TAR_SYMLINK_TOO_LONG
Definition: pgtar.h:23
@ TAR_OK
Definition: pgtar.h:21
@ TAR_NAME_TOO_LONG
Definition: pgtar.h:22
#define TAR_BLOCK_SIZE
Definition: pgtar.h:17
int64 pg_time_t
Definition: pgtime.h:23
char * last_dir_separator(const char *filename)
Definition: path.c:140
int pg_strcasecmp(const char *s1, const char *s2)
Definition: pgstrcasecmp.c:36
#define pg_pread
Definition: port.h:225
#define snprintf
Definition: port.h:238
static Datum BoolGetDatum(bool X)
Definition: postgres.h:102
#define InvalidOid
Definition: postgres_ext.h:36
unsigned int Oid
Definition: postgres_ext.h:31
#define atooid(x)
Definition: postgres_ext.h:42
static int fd(const char *x, int i)
Definition: preproc-init.c:105
bool update_process_title
Definition: ps_status.c:29
static void set_ps_display(const char *activity)
Definition: ps_status.h:40
char * psprintf(const char *fmt,...)
Definition: psprintf.c:46
bool parse_filename_for_nontemp_relation(const char *name, RelFileNumber *relnumber, ForkNumber *fork, unsigned *segno)
Definition: reinit.c:380
#define RELCACHE_INIT_FILENAME
Definition: relcache.h:25
Oid RelFileNumber
Definition: relpath.h:25
ForkNumber
Definition: relpath.h:56
@ InvalidForkNumber
Definition: relpath.h:57
@ INIT_FORKNUM
Definition: relpath.h:61
#define InvalidRelFileNumber
Definition: relpath.h:26
#define PG_TBLSPC_DIR
Definition: relpath.h:41
#define TABLESPACE_VERSION_DIRECTORY
Definition: relpath.h:33
#define RelFileNumberIsValid(relnumber)
Definition: relpath.h:27
ResourceOwner ResourceOwnerCreate(ResourceOwner parent, const char *name)
Definition: resowner.c:413
ResourceOwner CurrentResourceOwner
Definition: resowner.c:165
static pg_noinline void Size size
Definition: slab.c:607
#define PG_REPLSLOT_DIR
Definition: slot.h:21
void destroyStringInfo(StringInfo str)
Definition: stringinfo.c:361
StringInfo makeStringInfo(void)
Definition: stringinfo.c:41
TimeLineID starttli
Definition: xlogbackup.h:27
XLogRecPtr startpoint
Definition: xlogbackup.h:26
TimeLineID stoptli
Definition: xlogbackup.h:36
XLogRecPtr stoppoint
Definition: xlogbackup.h:35
List * options
Definition: replnodes.h:44
Definition: dirent.c:26
char * defname
Definition: parsenodes.h:817
Definition: pg_list.h:54
uint16 pd_checksum
Definition: bufpage.h:163
pg_compress_specification compression_specification
Definition: basebackup.c:78
pg_checksum_type manifest_checksum_type
Definition: basebackup.c:79
const char * label
Definition: basebackup.c:65
pg_compress_algorithm compression
Definition: basebackup.c:77
backup_manifest_option manifest
Definition: basebackup.c:76
BaseBackupTargetHandle * target_handle
Definition: basebackup.c:75
XLogRecPtr startptr
bbsink_state * bbs_state
char * bbs_buffer
size_t bbs_buffer_length
Definition: dirent.h:10
char d_name[MAX_PATH]
Definition: dirent.h:15
const char * name
Definition: basebackup.c:140
pg_compress_algorithm algorithm
Definition: compression.h:34
__time64_t st_mtime
Definition: win32_port.h:275
__int64 st_size
Definition: win32_port.h:273
short st_gid
Definition: win32_port.h:271
unsigned short st_mode
Definition: win32_port.h:268
short st_uid
Definition: win32_port.h:270
Definition: regguts.h:323
char * rpath
Definition: basebackup.h:32
#define LOG_METAINFO_DATAFILE_TMP
Definition: syslogger.h:103
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: wait_event.h:85
static void pgstat_report_wait_end(void)
Definition: wait_event.h:101
const char * name
void WalSndSetState(WalSndState state)
Definition: walsender.c:3812
void WalSndResourceCleanup(bool isCommit)
Definition: walsender.c:362
@ WALSNDSTATE_BACKUP
bool summarize_wal
#define lstat(path, sb)
Definition: win32_port.h:285
#define S_ISDIR(m)
Definition: win32_port.h:325
#define S_ISLNK(m)
Definition: win32_port.h:344
#define fstat
Definition: win32_port.h:283
#define readlink(path, buf, size)
Definition: win32_port.h:236
#define S_ISREG(m)
Definition: win32_port.h:328
#define pgoff_t
Definition: win32_port.h:207
bool RecoveryInProgress(void)
Definition: xlog.c:6333
void do_pg_abort_backup(int code, Datum arg)
Definition: xlog.c:9386
SessionBackupState get_backup_status(void)
Definition: xlog.c:9093
void CheckXLogRemoved(XLogSegNo segno, TimeLineID tli)
Definition: xlog.c:3720
int wal_segment_size
Definition: xlog.c:142
bool DataChecksumsEnabled(void)
Definition: xlog.c:4581
void do_pg_backup_start(const char *backupidstr, bool fast, List **tablespaces, BackupState *state, StringInfo tblspcmapfile)
Definition: xlog.c:8784
void do_pg_backup_stop(BackupState *state, bool waitforarchive)
Definition: xlog.c:9112
#define TABLESPACE_MAP
Definition: xlog.h:304
#define BACKUP_LABEL_FILE
Definition: xlog.h:301
SessionBackupState
Definition: xlog.h:285
@ SESSION_BACKUP_RUNNING
Definition: xlog.h:287
#define XLOG_CONTROL_FILE
static bool IsXLogFileName(const char *fname)
static void XLogFromFileName(const char *fname, TimeLineID *tli, XLogSegNo *logSegNo, int wal_segsz_bytes)
#define XLByteToPrevSeg(xlrp, logSegNo, wal_segsz_bytes)
static bool IsTLHistoryFileName(const char *fname)
#define MAXFNAMELEN
#define XLOGDIR
static void StatusFilePath(char *path, const char *xlog, const char *suffix)
#define XLByteToSeg(xlrp, logSegNo, wal_segsz_bytes)
static void XLogFileName(char *fname, TimeLineID tli, XLogSegNo logSegNo, int wal_segsz_bytes)
char * build_backup_content(BackupState *state, bool ishistoryfile)
Definition: xlogbackup.c:29
uint64 XLogRecPtr
Definition: xlogdefs.h:21
uint32 TimeLineID
Definition: xlogdefs.h:59
uint64 XLogSegNo
Definition: xlogdefs.h:48
static BackupState * backup_state
Definition: xlogfuncs.c:40
static StringInfo tablespace_map
Definition: xlogfuncs.c:41