PostgreSQL Source Code  git master
filemap.c
Go to the documentation of this file.
1 /*-------------------------------------------------------------------------
2  *
3  * filemap.c
4  * A data structure for keeping track of files that have changed.
5  *
6  * This source file contains the logic to decide what to do with different
7  * kinds of files, and the data structure to support it. Before modifying
8  * anything, pg_rewind collects information about all the files and their
9  * attributes in the target and source data directories. It also scans the
10  * WAL log in the target, and collects information about data blocks that
11  * were changed. All this information is stored in a hash table, using the
12  * file path relative to the root of the data directory as the key.
13  *
14  * After collecting all the information required, the decide_file_actions()
15  * function scans the hash table and decides what action needs to be taken
16  * for each file. Finally, it sorts the array to the final order that the
17  * actions should be executed in.
18  *
19  * Copyright (c) 2013-2023, PostgreSQL Global Development Group
20  *
21  *-------------------------------------------------------------------------
22  */
23 
24 #include "postgres_fe.h"
25 
26 #include <sys/stat.h>
27 #include <unistd.h>
28 
29 #include "catalog/pg_tablespace_d.h"
30 #include "common/file_utils.h"
31 #include "common/hashfn.h"
32 #include "common/string.h"
33 #include "datapagemap.h"
34 #include "filemap.h"
35 #include "pg_rewind.h"
36 
37 /*
38  * Define a hash table which we can use to store information about the files
39  * appearing in source and target systems.
40  */
41 static uint32 hash_string_pointer(const char *s);
42 #define SH_PREFIX filehash
43 #define SH_ELEMENT_TYPE file_entry_t
44 #define SH_KEY_TYPE const char *
45 #define SH_KEY path
46 #define SH_HASH_KEY(tb, key) hash_string_pointer(key)
47 #define SH_EQUAL(tb, a, b) (strcmp(a, b) == 0)
48 #define SH_SCOPE static inline
49 #define SH_RAW_ALLOCATOR pg_malloc0
50 #define SH_DECLARE
51 #define SH_DEFINE
52 #include "lib/simplehash.h"
53 
54 #define FILEHASH_INITIAL_SIZE 1000
55 
56 static filehash_hash *filehash;
57 
58 static bool isRelDataFile(const char *path);
59 static char *datasegpath(RelFileLocator rlocator, ForkNumber forknum,
60  BlockNumber segno);
61 
62 static file_entry_t *insert_filehash_entry(const char *path);
63 static file_entry_t *lookup_filehash_entry(const char *path);
64 static int final_filemap_cmp(const void *a, const void *b);
65 static bool check_file_excluded(const char *path, bool is_source);
66 
/*
 * One element of an exclusion list, used to exclude contents when
 * rewinding.
 */
struct exclude_list_item
{
	/* Name of the file or path to check for exclusion. */
	const char *name;

	/* If true, any item having "name" as a prefix is excluded as well. */
	bool		match_prefix;
};
78 
/*
 * Directories whose contents are not processed by pg_rewind, because the
 * server removes or recreates them during startup.
 *
 * Note: these lists should be kept in sync with what basebackup.c provides.
 * Unlike basebackup.c, some of the values are hardcoded here because the
 * corresponding macros live in backend-only headers, so the list is
 * maintained on a best-effort basis.
 */
static const char *const excludeDirContents[] =
{
	/*
	 * Temporary statistics files.  PG_STAT_TMP_DIR must be skipped because
	 * extensions like pg_stat_statements store data there.
	 */
	"pg_stat_tmp",				/* defined as PG_STAT_TMP_DIR */

	/*
	 * Backing up the contents of this directory is generally not useful,
	 * even when the intention is to restore to another primary.  See
	 * backup.sgml for a more detailed description.
	 */
	"pg_replslot",

	/* Removed on startup, see dsm_cleanup_for_mmap(). */
	"pg_dynshmem",				/* defined as PG_DYNSHMEM_DIR */

	/* Removed on startup, see AsyncShmemInit(). */
	"pg_notify",

	/*
	 * Old contents are loaded for possible debugging, but normal operation
	 * does not need them; see SerialInit().
	 */
	"pg_serial",

	/* Removed on startup, see DeleteAllExportedSnapshotFiles(). */
	"pg_snapshots",

	/* Zeroed on startup, see StartupSUBTRANS(). */
	"pg_subtrans",

	/* list terminator */
	NULL
};
124 
125 /*
126  * List of files excluded from filemap processing. Files are excluded
127  * if their prefix match.
128  */
129 static const struct exclude_list_item excludeFiles[] =
130 {
131  /* Skip auto conf temporary file. */
132  {"postgresql.auto.conf.tmp", false}, /* defined as PG_AUTOCONF_FILENAME */
133 
134  /* Skip current log file temporary file */
135  {"current_logfiles.tmp", false}, /* defined as
136  * LOG_METAINFO_DATAFILE_TMP */
137 
138  /* Skip relation cache because it is rebuilt on startup */
139  {"pg_internal.init", true}, /* defined as RELCACHE_INIT_FILENAME */
140 
141  /*
142  * If there is a backup_label or tablespace_map file, it indicates that a
143  * recovery failed and this cluster probably can't be rewound, but exclude
144  * them anyway if they are found.
145  */
146  {"backup_label", false}, /* defined as BACKUP_LABEL_FILE */
147  {"tablespace_map", false}, /* defined as TABLESPACE_MAP */
148 
149  /*
150  * If there's a backup_manifest, it belongs to a backup that was used to
151  * start this server. It is *not* correct for this backup. Our
152  * backup_manifest is injected into the backup separately if users want
153  * it.
154  */
155  {"backup_manifest", false},
156 
157  {"postmaster.pid", false},
158  {"postmaster.opts", false},
159 
160  /* end of list */
161  {NULL, false}
162 };
163 
164 /*
165  * Initialize the hash table for the file map.
166  */
167 void
169 {
170  filehash = filehash_create(FILEHASH_INITIAL_SIZE, NULL);
171 }
172 
173 /* Look up entry for 'path', creating a new one if it doesn't exist */
174 static file_entry_t *
175 insert_filehash_entry(const char *path)
176 {
177  file_entry_t *entry;
178  bool found;
179 
180  entry = filehash_insert(filehash, path, &found);
181  if (!found)
182  {
183  entry->path = pg_strdup(path);
184  entry->isrelfile = isRelDataFile(path);
185 
186  entry->target_exists = false;
188  entry->target_size = 0;
189  entry->target_link_target = NULL;
190  entry->target_pages_to_overwrite.bitmap = NULL;
192 
193  entry->source_exists = false;
195  entry->source_size = 0;
196  entry->source_link_target = NULL;
197 
198  entry->action = FILE_ACTION_UNDECIDED;
199  }
200 
201  return entry;
202 }
203 
204 static file_entry_t *
205 lookup_filehash_entry(const char *path)
206 {
207  return filehash_lookup(filehash, path);
208 }
209 
210 /*
211  * Callback for processing source file list.
212  *
213  * This is called once for every file in the source server. We record the
214  * type and size of the file, so that decide_file_action() can later decide what
215  * to do with it.
216  */
217 void
218 process_source_file(const char *path, file_type_t type, size_t size,
219  const char *link_target)
220 {
221  file_entry_t *entry;
222 
223  /*
224  * Pretend that pg_wal is a directory, even if it's really a symlink. We
225  * don't want to mess with the symlink itself, nor complain if it's a
226  * symlink in source but not in target or vice versa.
227  */
228  if (strcmp(path, "pg_wal") == 0 && type == FILE_TYPE_SYMLINK)
230 
231  /*
232  * sanity check: a filename that looks like a data file better be a
233  * regular file
234  */
235  if (type != FILE_TYPE_REGULAR && isRelDataFile(path))
236  pg_fatal("data file \"%s\" in source is not a regular file", path);
237 
238  /* Remember this source file */
239  entry = insert_filehash_entry(path);
240  if (entry->source_exists)
241  pg_fatal("duplicate source file \"%s\"", path);
242  entry->source_exists = true;
243  entry->source_type = type;
244  entry->source_size = size;
245  entry->source_link_target = link_target ? pg_strdup(link_target) : NULL;
246 }
247 
248 /*
249  * Callback for processing target file list.
250  *
251  * Record the type and size of the file, like process_source_file() does.
252  */
253 void
254 process_target_file(const char *path, file_type_t type, size_t size,
255  const char *link_target)
256 {
257  file_entry_t *entry;
258 
259  /*
260  * Do not apply any exclusion filters here. This has advantage to remove
261  * from the target data folder all paths which have been filtered out from
262  * the source data folder when processing the source files.
263  */
264 
265  /*
266  * Like in process_source_file, pretend that pg_wal is always a directory.
267  */
268  if (strcmp(path, "pg_wal") == 0 && type == FILE_TYPE_SYMLINK)
270 
271  /* Remember this target file */
272  entry = insert_filehash_entry(path);
273  if (entry->target_exists)
274  pg_fatal("duplicate source file \"%s\"", path);
275  entry->target_exists = true;
276  entry->target_type = type;
277  entry->target_size = size;
278  entry->target_link_target = link_target ? pg_strdup(link_target) : NULL;
279 }
280 
281 /*
282  * This callback gets called while we read the WAL in the target, for every
283  * block that has changed in the target system. It decides if the given
284  * 'blkno' in the target relfile needs to be overwritten from the source, and
285  * if so, records it in 'target_pages_to_overwrite' bitmap.
286  *
287  * NOTE: All the files on both systems must have already been added to the
288  * hash table!
289  */
290 void
292  BlockNumber blkno)
293 {
294  char *path;
295  file_entry_t *entry;
296  BlockNumber blkno_inseg;
297  int segno;
298 
299  segno = blkno / RELSEG_SIZE;
300  blkno_inseg = blkno % RELSEG_SIZE;
301 
302  path = datasegpath(rlocator, forknum, segno);
303  entry = lookup_filehash_entry(path);
304  pfree(path);
305 
306  /*
307  * If the block still exists in both systems, remember it. Otherwise we
308  * can safely ignore it.
309  *
310  * If the block is beyond the EOF in the source system, or the file
311  * doesn't exist in the source at all, we're going to truncate/remove it
312  * away from the target anyway. Likewise, if it doesn't exist in the
313  * target anymore, we will copy it over with the "tail" from the source
314  * system, anyway.
315  *
316  * It is possible to find WAL for a file that doesn't exist on either
317  * system anymore. It means that the relation was dropped later in the
318  * target system, and independently on the source system too, or that it
319  * was created and dropped in the target system and it never existed in
320  * the source. Either way, we can safely ignore it.
321  */
322  if (entry)
323  {
324  Assert(entry->isrelfile);
325 
326  if (entry->target_exists)
327  {
328  if (entry->target_type != FILE_TYPE_REGULAR)
329  pg_fatal("unexpected page modification for non-regular file \"%s\"",
330  entry->path);
331 
332  if (entry->source_exists)
333  {
334  off_t end_offset;
335 
336  end_offset = (blkno_inseg + 1) * BLCKSZ;
337  if (end_offset <= entry->source_size && end_offset <= entry->target_size)
338  datapagemap_add(&entry->target_pages_to_overwrite, blkno_inseg);
339  }
340  }
341  }
342 }
343 
344 /*
345  * Is this the path of file that pg_rewind can skip copying?
346  */
347 static bool
348 check_file_excluded(const char *path, bool is_source)
349 {
350  char localpath[MAXPGPATH];
351  int excludeIdx;
352  const char *filename;
353 
354  /*
355  * Skip all temporary files, .../pgsql_tmp/... and .../pgsql_tmp.*
356  */
357  if (strstr(path, "/" PG_TEMP_FILE_PREFIX) != NULL ||
358  strstr(path, "/" PG_TEMP_FILES_DIR "/") != NULL)
359  {
360  return true;
361  }
362 
363  /* check individual files... */
364  for (excludeIdx = 0; excludeFiles[excludeIdx].name != NULL; excludeIdx++)
365  {
366  int cmplen = strlen(excludeFiles[excludeIdx].name);
367 
369  if (filename == NULL)
370  filename = path;
371  else
372  filename++;
373 
374  if (!excludeFiles[excludeIdx].match_prefix)
375  cmplen++;
376  if (strncmp(filename, excludeFiles[excludeIdx].name, cmplen) == 0)
377  {
378  if (is_source)
379  pg_log_debug("entry \"%s\" excluded from source file list",
380  path);
381  else
382  pg_log_debug("entry \"%s\" excluded from target file list",
383  path);
384  return true;
385  }
386  }
387 
388  /*
389  * ... And check some directories. Note that this includes any contents
390  * within the directories themselves.
391  */
392  for (excludeIdx = 0; excludeDirContents[excludeIdx] != NULL; excludeIdx++)
393  {
394  snprintf(localpath, sizeof(localpath), "%s/",
395  excludeDirContents[excludeIdx]);
396  if (strstr(path, localpath) == path)
397  {
398  if (is_source)
399  pg_log_debug("entry \"%s\" excluded from source file list",
400  path);
401  else
402  pg_log_debug("entry \"%s\" excluded from target file list",
403  path);
404  return true;
405  }
406  }
407 
408  return false;
409 }
410 
411 static const char *
413 {
414  switch (action)
415  {
416  case FILE_ACTION_NONE:
417  return "NONE";
418  case FILE_ACTION_COPY:
419  return "COPY";
421  return "TRUNCATE";
423  return "COPY_TAIL";
424  case FILE_ACTION_CREATE:
425  return "CREATE";
426  case FILE_ACTION_REMOVE:
427  return "REMOVE";
428 
429  default:
430  return "unknown";
431  }
432 }
433 
434 /*
435  * Calculate the totals needed for progress reports.
436  */
437 void
439 {
440  file_entry_t *entry;
441  int i;
442 
443  filemap->total_size = 0;
444  filemap->fetch_size = 0;
445 
446  for (i = 0; i < filemap->nentries; i++)
447  {
448  entry = filemap->entries[i];
449 
450  if (entry->source_type != FILE_TYPE_REGULAR)
451  continue;
452 
453  filemap->total_size += entry->source_size;
454 
455  if (entry->action == FILE_ACTION_COPY)
456  {
457  filemap->fetch_size += entry->source_size;
458  continue;
459  }
460 
461  if (entry->action == FILE_ACTION_COPY_TAIL)
462  filemap->fetch_size += (entry->source_size - entry->target_size);
463 
464  if (entry->target_pages_to_overwrite.bitmapsize > 0)
465  {
467  BlockNumber blk;
468 
470  while (datapagemap_next(iter, &blk))
471  filemap->fetch_size += BLCKSZ;
472 
473  pg_free(iter);
474  }
475  }
476 }
477 
478 void
480 {
481  file_entry_t *entry;
482  int i;
483 
484  for (i = 0; i < filemap->nentries; i++)
485  {
486  entry = filemap->entries[i];
487  if (entry->action != FILE_ACTION_NONE ||
489  {
490  pg_log_debug("%s (%s)", entry->path,
491  action_to_str(entry->action));
492 
493  if (entry->target_pages_to_overwrite.bitmapsize > 0)
495  }
496  }
497  fflush(stdout);
498 }
499 
500 /*
501  * Does it look like a relation data file?
502  *
503  * For our purposes, only files belonging to the main fork are considered
504  * relation files. Other forks are always copied in toto, because we cannot
505  * reliably track changes to them, because WAL only contains block references
506  * for the main fork.
507  */
508 static bool
509 isRelDataFile(const char *path)
510 {
511  RelFileLocator rlocator;
512  unsigned int segNo;
513  int nmatch;
514  bool matched;
515 
516  /*----
517  * Relation data files can be in one of the following directories:
518  *
519  * global/
520  * shared relations
521  *
522  * base/<db oid>/
523  * regular relations, default tablespace
524  *
525  * pg_tblspc/<tblspc oid>/<tblspc version>/
526  * within a non-default tablespace (the name of the directory
527  * depends on version)
528  *
529  * And the relation data files themselves have a filename like:
530  *
531  * <oid>.<segment number>
532  *
533  *----
534  */
535  rlocator.spcOid = InvalidOid;
536  rlocator.dbOid = InvalidOid;
537  rlocator.relNumber = InvalidRelFileNumber;
538  segNo = 0;
539  matched = false;
540 
541  nmatch = sscanf(path, "global/%u.%u", &rlocator.relNumber, &segNo);
542  if (nmatch == 1 || nmatch == 2)
543  {
544  rlocator.spcOid = GLOBALTABLESPACE_OID;
545  rlocator.dbOid = 0;
546  matched = true;
547  }
548  else
549  {
550  nmatch = sscanf(path, "base/%u/%u.%u",
551  &rlocator.dbOid, &rlocator.relNumber, &segNo);
552  if (nmatch == 2 || nmatch == 3)
553  {
554  rlocator.spcOid = DEFAULTTABLESPACE_OID;
555  matched = true;
556  }
557  else
558  {
559  nmatch = sscanf(path, "pg_tblspc/%u/" TABLESPACE_VERSION_DIRECTORY "/%u/%u.%u",
560  &rlocator.spcOid, &rlocator.dbOid, &rlocator.relNumber,
561  &segNo);
562  if (nmatch == 3 || nmatch == 4)
563  matched = true;
564  }
565  }
566 
567  /*
568  * The sscanf tests above can match files that have extra characters at
569  * the end. To eliminate such cases, cross-check that GetRelationPath
570  * creates the exact same filename, when passed the RelFileLocator
571  * information we extracted from the filename.
572  */
573  if (matched)
574  {
575  char *check_path = datasegpath(rlocator, MAIN_FORKNUM, segNo);
576 
577  if (strcmp(check_path, path) != 0)
578  matched = false;
579 
580  pfree(check_path);
581  }
582 
583  return matched;
584 }
585 
586 /*
587  * A helper function to create the path of a relation file and segment.
588  *
589  * The returned path is palloc'd
590  */
591 static char *
593 {
594  char *path;
595  char *segpath;
596 
597  path = relpathperm(rlocator, forknum);
598  if (segno > 0)
599  {
600  segpath = psprintf("%s.%u", path, segno);
601  pfree(path);
602  return segpath;
603  }
604  else
605  return path;
606 }
607 
608 /*
609  * In the final stage, the filemap is sorted so that removals come last.
610  * From disk space usage point of view, it would be better to do removals
611  * first, but for now, safety first. If a whole directory is deleted, all
612  * files and subdirectories inside it need to removed first. On creation,
613  * parent directory needs to be created before files and directories inside
614  * it. To achieve that, the file_action_t enum is ordered so that we can
615  * just sort on that first. Furthermore, sort REMOVE entries in reverse
616  * path order, so that "foo/bar" subdirectory is removed before "foo".
617  */
618 static int
619 final_filemap_cmp(const void *a, const void *b)
620 {
621  file_entry_t *fa = *((file_entry_t **) a);
622  file_entry_t *fb = *((file_entry_t **) b);
623 
624  if (fa->action > fb->action)
625  return 1;
626  if (fa->action < fb->action)
627  return -1;
628 
629  if (fa->action == FILE_ACTION_REMOVE)
630  return strcmp(fb->path, fa->path);
631  else
632  return strcmp(fa->path, fb->path);
633 }
634 
635 /*
636  * Decide what action to perform to a file.
637  */
638 static file_action_t
640 {
641  const char *path = entry->path;
642 
643  /*
644  * Don't touch the control file. It is handled specially, after copying
645  * all the other files.
646  */
647  if (strcmp(path, "global/pg_control") == 0)
648  return FILE_ACTION_NONE;
649 
650  /*
651  * Remove all files matching the exclusion filters in the target.
652  */
653  if (check_file_excluded(path, true))
654  {
655  if (entry->target_exists)
656  return FILE_ACTION_REMOVE;
657  else
658  return FILE_ACTION_NONE;
659  }
660 
661  /*
662  * Handle cases where the file is missing from one of the systems.
663  */
664  if (!entry->target_exists && entry->source_exists)
665  {
666  /*
667  * File exists in source, but not in target. Copy it in toto. (If it's
668  * a relation data file, WAL replay after rewinding should re-create
669  * it anyway. But there's no harm in copying it now.)
670  */
671  switch (entry->source_type)
672  {
673  case FILE_TYPE_DIRECTORY:
674  case FILE_TYPE_SYMLINK:
675  return FILE_ACTION_CREATE;
676  case FILE_TYPE_REGULAR:
677  return FILE_ACTION_COPY;
678  case FILE_TYPE_UNDEFINED:
679  pg_fatal("unknown file type for \"%s\"", entry->path);
680  break;
681  }
682  }
683  else if (entry->target_exists && !entry->source_exists)
684  {
685  /* File exists in target, but not source. Remove it. */
686  return FILE_ACTION_REMOVE;
687  }
688  else if (!entry->target_exists && !entry->source_exists)
689  {
690  /*
691  * Doesn't exist in either server. Why does it have an entry in the
692  * first place??
693  */
694  Assert(false);
695  return FILE_ACTION_NONE;
696  }
697 
698  /*
699  * Otherwise, the file exists on both systems
700  */
701  Assert(entry->target_exists && entry->source_exists);
702 
703  if (entry->source_type != entry->target_type)
704  {
705  /* But it's a different kind of object. Strange.. */
706  pg_fatal("file \"%s\" is of different type in source and target", entry->path);
707  }
708 
709  /*
710  * PG_VERSION files should be identical on both systems, but avoid
711  * overwriting them for paranoia.
712  */
713  if (pg_str_endswith(entry->path, "PG_VERSION"))
714  return FILE_ACTION_NONE;
715 
716  switch (entry->source_type)
717  {
718  case FILE_TYPE_DIRECTORY:
719  return FILE_ACTION_NONE;
720 
721  case FILE_TYPE_SYMLINK:
722 
723  /*
724  * XXX: Should we check if it points to the same target?
725  */
726  return FILE_ACTION_NONE;
727 
728  case FILE_TYPE_REGULAR:
729  if (!entry->isrelfile)
730  {
731  /*
732  * It's a non-data file that we have no special processing
733  * for. Copy it in toto.
734  */
735  return FILE_ACTION_COPY;
736  }
737  else
738  {
739  /*
740  * It's a data file that exists in both systems.
741  *
742  * If it's larger in target, we can truncate it. There will
743  * also be a WAL record of the truncation in the source
744  * system, so WAL replay would eventually truncate the target
745  * too, but we might as well do it now.
746  *
747  * If it's smaller in the target, it means that it has been
748  * truncated in the target, or enlarged in the source, or
749  * both. If it was truncated in the target, we need to copy
750  * the missing tail from the source system. If it was enlarged
751  * in the source system, there will be WAL records in the
752  * source system for the new blocks, so we wouldn't need to
753  * copy them here. But we don't know which scenario we're
754  * dealing with, and there's no harm in copying the missing
755  * blocks now, so do it now.
756  *
757  * If it's the same size, do nothing here. Any blocks modified
758  * in the target will be copied based on parsing the target
759  * system's WAL, and any blocks modified in the source will be
760  * updated after rewinding, when the source system's WAL is
761  * replayed.
762  */
763  if (entry->target_size < entry->source_size)
764  return FILE_ACTION_COPY_TAIL;
765  else if (entry->target_size > entry->source_size)
766  return FILE_ACTION_TRUNCATE;
767  else
768  return FILE_ACTION_NONE;
769  }
770  break;
771 
772  case FILE_TYPE_UNDEFINED:
773  pg_fatal("unknown file type for \"%s\"", path);
774  break;
775  }
776 
777  /* unreachable */
778  pg_fatal("could not decide what to do with file \"%s\"", path);
779 }
780 
781 /*
782  * Decide what to do with each file.
783  *
784  * Returns a 'filemap' with the entries in the order that their actions
785  * should be executed.
786  */
787 filemap_t *
789 {
790  int i;
791  filehash_iterator it;
792  file_entry_t *entry;
793  filemap_t *filemap;
794 
795  filehash_start_iterate(filehash, &it);
796  while ((entry = filehash_iterate(filehash, &it)) != NULL)
797  {
798  entry->action = decide_file_action(entry);
799  }
800 
801  /*
802  * Turn the hash table into an array, and sort in the order that the
803  * actions should be performed.
804  */
805  filemap = pg_malloc(offsetof(filemap_t, entries) +
806  filehash->members * sizeof(file_entry_t *));
807  filemap->nentries = filehash->members;
808  filehash_start_iterate(filehash, &it);
809  i = 0;
810  while ((entry = filehash_iterate(filehash, &it)) != NULL)
811  {
812  filemap->entries[i++] = entry;
813  }
814 
815  qsort(&filemap->entries, filemap->nentries, sizeof(file_entry_t *),
817 
818  return filemap;
819 }
820 
821 
822 /*
823  * Helper function for filemap hash table.
824  */
825 static uint32
826 hash_string_pointer(const char *s)
827 {
828  unsigned char *ss = (unsigned char *) s;
829 
830  return hash_bytes(ss, strlen(s));
831 }
uint32 BlockNumber
Definition: block.h:31
unsigned int uint32
Definition: c.h:495
bool datapagemap_next(datapagemap_iterator_t *iter, BlockNumber *blkno)
Definition: datapagemap.c:87
void datapagemap_print(datapagemap_t *map)
Definition: datapagemap.c:117
void datapagemap_add(datapagemap_t *map, BlockNumber blkno)
Definition: datapagemap.c:32
datapagemap_iterator_t * datapagemap_iterate(datapagemap_t *map)
Definition: datapagemap.c:75
char * pg_strdup(const char *in)
Definition: fe_memutils.c:85
void pg_free(void *ptr)
Definition: fe_memutils.c:105
void * pg_malloc(size_t size)
Definition: fe_memutils.c:47
#define PG_TEMP_FILES_DIR
Definition: file_utils.h:57
#define PG_TEMP_FILE_PREFIX
Definition: file_utils.h:58
static const struct exclude_list_item excludeFiles[]
Definition: filemap.c:129
static bool isRelDataFile(const char *path)
Definition: filemap.c:509
void filehash_init(void)
Definition: filemap.c:168
void process_source_file(const char *path, file_type_t type, size_t size, const char *link_target)
Definition: filemap.c:218
static uint32 hash_string_pointer(const char *s)
Definition: filemap.c:826
static const char *const excludeDirContents[]
Definition: filemap.c:88
static const char * action_to_str(file_action_t action)
Definition: filemap.c:412
void print_filemap(filemap_t *filemap)
Definition: filemap.c:479
static char * datasegpath(RelFileLocator rlocator, ForkNumber forknum, BlockNumber segno)
Definition: filemap.c:592
static filehash_hash * filehash
Definition: filemap.c:56
void process_target_file(const char *path, file_type_t type, size_t size, const char *link_target)
Definition: filemap.c:254
void process_target_wal_block_change(ForkNumber forknum, RelFileLocator rlocator, BlockNumber blkno)
Definition: filemap.c:291
filemap_t * decide_file_actions(void)
Definition: filemap.c:788
static file_action_t decide_file_action(file_entry_t *entry)
Definition: filemap.c:639
static file_entry_t * lookup_filehash_entry(const char *path)
Definition: filemap.c:205
static file_entry_t * insert_filehash_entry(const char *path)
Definition: filemap.c:175
static bool check_file_excluded(const char *path, bool is_source)
Definition: filemap.c:348
#define FILEHASH_INITIAL_SIZE
Definition: filemap.c:54
static int final_filemap_cmp(const void *a, const void *b)
Definition: filemap.c:619
void calculate_totals(filemap_t *filemap)
Definition: filemap.c:438
file_action_t
Definition: filemap.h:17
@ FILE_ACTION_REMOVE
Definition: filemap.h:27
@ FILE_ACTION_COPY
Definition: filemap.h:21
@ FILE_ACTION_NONE
Definition: filemap.h:24
@ FILE_ACTION_COPY_TAIL
Definition: filemap.h:22
@ FILE_ACTION_UNDECIDED
Definition: filemap.h:18
@ FILE_ACTION_TRUNCATE
Definition: filemap.h:26
@ FILE_ACTION_CREATE
Definition: filemap.h:20
file_type_t
Definition: filemap.h:31
@ FILE_TYPE_UNDEFINED
Definition: filemap.h:32
@ FILE_TYPE_REGULAR
Definition: filemap.h:34
@ FILE_TYPE_SYMLINK
Definition: filemap.h:36
@ FILE_TYPE_DIRECTORY
Definition: filemap.h:35
uint32 hash_bytes(const unsigned char *k, int keylen)
Definition: hashfn.c:146
int b
Definition: isn.c:70
int a
Definition: isn.c:69
int i
Definition: isn.c:73
static void const char fflush(stdout)
Assert(fmt[strlen(fmt) - 1] !='\n')
#define pg_log_debug(...)
Definition: logging.h:133
void pfree(void *pointer)
Definition: mcxt.c:1456
#define pg_fatal(...)
#define MAXPGPATH
static char * filename
Definition: pg_dumpall.c:119
char * last_dir_separator(const char *filename)
Definition: path.c:139
#define snprintf
Definition: port.h:238
#define qsort(a, b, c, d)
Definition: port.h:445
#define InvalidOid
Definition: postgres_ext.h:36
static int fa(void)
Definition: preproc-init.c:85
static int fb(int x)
Definition: preproc-init.c:92
char * psprintf(const char *fmt,...)
Definition: psprintf.c:46
ForkNumber
Definition: relpath.h:48
@ MAIN_FORKNUM
Definition: relpath.h:50
#define InvalidRelFileNumber
Definition: relpath.h:26
#define relpathperm(rlocator, forknum)
Definition: relpath.h:90
#define TABLESPACE_VERSION_DIRECTORY
Definition: relpath.h:33
bool pg_str_endswith(const char *str, const char *end)
Definition: string.c:32
RelFileNumber relNumber
int bitmapsize
Definition: datapagemap.h:18
char * bitmap
Definition: datapagemap.h:17
const char * name
Definition: basebackup.c:118
Definition: filemap.h:50
datapagemap_t target_pages_to_overwrite
Definition: filemap.h:68
const char * path
Definition: filemap.h:53
size_t source_size
Definition: filemap.h:75
bool source_exists
Definition: filemap.h:73
bool target_exists
Definition: filemap.h:59
char * source_link_target
Definition: filemap.h:76
file_type_t source_type
Definition: filemap.h:74
char * target_link_target
Definition: filemap.h:62
size_t target_size
Definition: filemap.h:61
file_action_t action
Definition: filemap.h:81
file_type_t target_type
Definition: filemap.h:60
bool isrelfile
Definition: filemap.h:54
file_entry_t * entries[FLEXIBLE_ARRAY_MEMBER]
Definition: filemap.h:96
int nentries
Definition: filemap.h:95
uint64 total_size
Definition: filemap.h:92
uint64 fetch_size
Definition: filemap.h:93
const char * type
const char * name