PostgreSQL Source Code  git master
filemap.h File Reference
#include "datapagemap.h"
#include "storage/block.h"
#include "storage/relfilelocator.h"
Include dependency graph for filemap.h:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Data Structures

struct  file_entry_t
 
struct  filemap_t
 

Typedefs

typedef struct file_entry_t file_entry_t
 
typedef struct filemap_t filemap_t
 

Enumerations

enum  file_action_t {
  FILE_ACTION_UNDECIDED = 0 , FILE_ACTION_CREATE , FILE_ACTION_COPY , FILE_ACTION_COPY_TAIL ,
  FILE_ACTION_NONE , FILE_ACTION_TRUNCATE , FILE_ACTION_REMOVE
}
 
enum  file_type_t { FILE_TYPE_UNDEFINED = 0 , FILE_TYPE_REGULAR , FILE_TYPE_DIRECTORY , FILE_TYPE_SYMLINK }
 

Functions

void filehash_init (void)
 
void process_source_file (const char *path, file_type_t type, size_t size, const char *link_target)
 
void process_target_file (const char *path, file_type_t type, size_t size, const char *link_target)
 
void process_target_wal_block_change (ForkNumber forknum, RelFileLocator rlocator, BlockNumber blkno)
 
filemap_t * decide_file_actions (void)
 
void calculate_totals (filemap_t *filemap)
 
void print_filemap (filemap_t *filemap)
 

Typedef Documentation

◆ file_entry_t

typedef struct file_entry_t file_entry_t

◆ filemap_t

typedef struct filemap_t filemap_t

Enumeration Type Documentation

◆ file_action_t

Enumerator
FILE_ACTION_UNDECIDED 
FILE_ACTION_CREATE 
FILE_ACTION_COPY 
FILE_ACTION_COPY_TAIL 
FILE_ACTION_NONE 
FILE_ACTION_TRUNCATE 
FILE_ACTION_REMOVE 

Definition at line 16 of file filemap.h.

17 {
18  FILE_ACTION_UNDECIDED = 0, /* not decided yet */
19 
20  FILE_ACTION_CREATE, /* create local directory or symbolic link */
21  FILE_ACTION_COPY, /* copy whole file, overwriting if exists */
22  FILE_ACTION_COPY_TAIL, /* copy tail from 'source_size' to
23  * 'target_size' */
24  FILE_ACTION_NONE, /* no action (we might still copy modified
25  * blocks based on the parsed WAL) */
26  FILE_ACTION_TRUNCATE, /* truncate local file to 'newsize' bytes */
27  FILE_ACTION_REMOVE, /* remove local file / directory / symlink */
28 } file_action_t;
file_action_t
Definition: filemap.h:17
@ FILE_ACTION_REMOVE
Definition: filemap.h:27
@ FILE_ACTION_COPY
Definition: filemap.h:21
@ FILE_ACTION_NONE
Definition: filemap.h:24
@ FILE_ACTION_COPY_TAIL
Definition: filemap.h:22
@ FILE_ACTION_UNDECIDED
Definition: filemap.h:18
@ FILE_ACTION_TRUNCATE
Definition: filemap.h:26
@ FILE_ACTION_CREATE
Definition: filemap.h:20

◆ file_type_t

Enumerator
FILE_TYPE_UNDEFINED 
FILE_TYPE_REGULAR 
FILE_TYPE_DIRECTORY 
FILE_TYPE_SYMLINK 

Definition at line 30 of file filemap.h.

31 {
32  FILE_TYPE_UNDEFINED = 0,
33 
34  FILE_TYPE_REGULAR,
35  FILE_TYPE_DIRECTORY,
36  FILE_TYPE_SYMLINK,
37 } file_type_t;
file_type_t
Definition: filemap.h:31
@ FILE_TYPE_UNDEFINED
Definition: filemap.h:32
@ FILE_TYPE_REGULAR
Definition: filemap.h:34
@ FILE_TYPE_SYMLINK
Definition: filemap.h:36
@ FILE_TYPE_DIRECTORY
Definition: filemap.h:35

Function Documentation

◆ calculate_totals()

void calculate_totals ( filemap_t *  filemap)

Definition at line 437 of file filemap.c.

438 {
439  file_entry_t *entry;
440  int i;
441 
442  filemap->total_size = 0;
443  filemap->fetch_size = 0;
444 
445  for (i = 0; i < filemap->nentries; i++)
446  {
447  entry = filemap->entries[i];
448 
449  if (entry->source_type != FILE_TYPE_REGULAR)
450  continue;
451 
452  filemap->total_size += entry->source_size;
453 
454  if (entry->action == FILE_ACTION_COPY)
455  {
456  filemap->fetch_size += entry->source_size;
457  continue;
458  }
459 
460  if (entry->action == FILE_ACTION_COPY_TAIL)
461  filemap->fetch_size += (entry->source_size - entry->target_size);
462 
463  if (entry->target_pages_to_overwrite.bitmapsize > 0)
464  {
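465  datapagemap_iterator_t *iter;
466  BlockNumber blk;
467 
468  iter = datapagemap_iterate(&entry->target_pages_to_overwrite);
469  while (datapagemap_next(iter, &blk))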
470  filemap->fetch_size += BLCKSZ;
471 
472  pg_free(iter);
473  }
474  }
475 }
uint32 BlockNumber
Definition: block.h:31
bool datapagemap_next(datapagemap_iterator_t *iter, BlockNumber *blkno)
Definition: datapagemap.c:87
datapagemap_iterator_t * datapagemap_iterate(datapagemap_t *map)
Definition: datapagemap.c:75
void pg_free(void *ptr)
Definition: fe_memutils.c:105
int i
Definition: isn.c:73
int bitmapsize
Definition: datapagemap.h:18
file_entry_t
Definition: filemap.h:50
datapagemap_t target_pages_to_overwrite
Definition: filemap.h:68
size_t source_size
Definition: filemap.h:75
file_type_t source_type
Definition: filemap.h:74
size_t target_size
Definition: filemap.h:61
file_action_t action
Definition: filemap.h:81
file_entry_t * entries[FLEXIBLE_ARRAY_MEMBER]
Definition: filemap.h:96
int nentries
Definition: filemap.h:95
uint64 total_size
Definition: filemap.h:92
uint64 fetch_size
Definition: filemap.h:93

References file_entry_t::action, datapagemap::bitmapsize, datapagemap_iterate(), datapagemap_next(), filemap_t::entries, filemap_t::fetch_size, FILE_ACTION_COPY, FILE_ACTION_COPY_TAIL, FILE_TYPE_REGULAR, i, filemap_t::nentries, pg_free(), file_entry_t::source_size, file_entry_t::source_type, file_entry_t::target_pages_to_overwrite, file_entry_t::target_size, and filemap_t::total_size.

Referenced by main().

◆ decide_file_actions()

filemap_t* decide_file_actions ( void  )

Definition at line 791 of file filemap.c.

792 {
793  int i;
794  filehash_iterator it;
795  file_entry_t *entry;
796  filemap_t *filemap;
797 
798  filehash_start_iterate(filehash, &it);
799  while ((entry = filehash_iterate(filehash, &it)) != NULL)
800  {
801  entry->action = decide_file_action(entry);
802  }
803 
804  /*
805  * Turn the hash table into an array, and sort in the order that the
806  * actions should be performed.
807  */
808  filemap = pg_malloc(offsetof(filemap_t, entries) +
809  filehash->members * sizeof(file_entry_t *));
810  filemap->nentries = filehash->members;
811  filehash_start_iterate(filehash, &it);
812  i = 0;
813  while ((entry = filehash_iterate(filehash, &it)) != NULL)
814  {
815  filemap->entries[i++] = entry;
816  }
817 
818  qsort(&filemap->entries, filemap->nentries, sizeof(file_entry_t *),
819  final_filemap_cmp);
820 
821  return filemap;
822 }
void * pg_malloc(size_t size)
Definition: fe_memutils.c:47
static filehash_hash * filehash
Definition: filemap.c:55
static file_action_t decide_file_action(file_entry_t *entry)
Definition: filemap.c:638
static int final_filemap_cmp(const void *a, const void *b)
Definition: filemap.c:618
#define qsort(a, b, c, d)
Definition: port.h:447

References file_entry_t::action, decide_file_action(), filemap_t::entries, filehash, final_filemap_cmp(), i, filemap_t::nentries, pg_malloc(), and qsort.

Referenced by main().

◆ filehash_init()

void filehash_init ( void  )

Definition at line 167 of file filemap.c.

168 {
169  filehash = filehash_create(FILEHASH_INITIAL_SIZE, NULL);
170 }
#define FILEHASH_INITIAL_SIZE
Definition: filemap.c:53

References filehash, and FILEHASH_INITIAL_SIZE.

Referenced by main().

◆ print_filemap()

void print_filemap ( filemap_t *  filemap)

Definition at line 478 of file filemap.c.

479 {
480  file_entry_t *entry;
481  int i;
482 
483  for (i = 0; i < filemap->nentries; i++)
484  {
485  entry = filemap->entries[i];
486  if (entry->action != FILE_ACTION_NONE ||
487  entry->target_pages_to_overwrite.bitmapsize > 0)
488  {
489  pg_log_debug("%s (%s)", entry->path,
490  action_to_str(entry->action));
491 
492  if (entry->target_pages_to_overwrite.bitmapsize > 0)
493  datapagemap_print(&entry->target_pages_to_overwrite);
494  }
495  }
496  fflush(stdout);
497 }
void datapagemap_print(datapagemap_t *map)
Definition: datapagemap.c:117
static const char * action_to_str(file_action_t action)
Definition: filemap.c:411
static void const char fflush(stdout)
#define pg_log_debug(...)
Definition: logging.h:133
const char * path
Definition: filemap.h:53

References file_entry_t::action, action_to_str(), datapagemap::bitmapsize, datapagemap_print(), filemap_t::entries, fflush(), FILE_ACTION_NONE, i, filemap_t::nentries, file_entry_t::path, pg_log_debug, generate_unaccent_rules::stdout, and file_entry_t::target_pages_to_overwrite.

Referenced by main().

◆ process_source_file()

void process_source_file ( const char *  path,
file_type_t  type,
size_t  size,
const char *  link_target 
)

Definition at line 217 of file filemap.c.

219 {
220  file_entry_t *entry;
221 
222  /*
223  * Pretend that pg_wal is a directory, even if it's really a symlink. We
224  * don't want to mess with the symlink itself, nor complain if it's a
225  * symlink in source but not in target or vice versa.
226  */
227  if (strcmp(path, "pg_wal") == 0 && type == FILE_TYPE_SYMLINK)
228  type = FILE_TYPE_DIRECTORY;
229 
230  /*
231  * sanity check: a filename that looks like a data file better be a
232  * regular file
233  */
234  if (type != FILE_TYPE_REGULAR && isRelDataFile(path))
235  pg_fatal("data file \"%s\" in source is not a regular file", path);
236 
237  /* Remember this source file */
238  entry = insert_filehash_entry(path);
239  if (entry->source_exists)
240  pg_fatal("duplicate source file \"%s\"", path);
241  entry->source_exists = true;
242  entry->source_type = type;
243  entry->source_size = size;
244  entry->source_link_target = link_target ? pg_strdup(link_target) : NULL;
245 }
char * pg_strdup(const char *in)
Definition: fe_memutils.c:85
static bool isRelDataFile(const char *path)
Definition: filemap.c:508
static file_entry_t * insert_filehash_entry(const char *path)
Definition: filemap.c:174
#define pg_fatal(...)
static pg_noinline void Size size
Definition: slab.c:607
bool source_exists
Definition: filemap.h:73
char * source_link_target
Definition: filemap.h:76
const char * type

References FILE_TYPE_DIRECTORY, FILE_TYPE_REGULAR, FILE_TYPE_SYMLINK, insert_filehash_entry(), isRelDataFile(), pg_fatal, pg_strdup(), size, file_entry_t::source_exists, file_entry_t::source_link_target, file_entry_t::source_size, file_entry_t::source_type, and type.

Referenced by main().

◆ process_target_file()

void process_target_file ( const char *  path,
file_type_t  type,
size_t  size,
const char *  link_target 
)

Definition at line 253 of file filemap.c.

255 {
256  file_entry_t *entry;
257 
258  /*
259  * Do not apply any exclusion filters here. This has advantage to remove
260  * from the target data folder all paths which have been filtered out from
261  * the source data folder when processing the source files.
262  */
263 
264  /*
265  * Like in process_source_file, pretend that pg_wal is always a directory.
266  */
267  if (strcmp(path, "pg_wal") == 0 && type == FILE_TYPE_SYMLINK)
268  type = FILE_TYPE_DIRECTORY;
269 
270  /* Remember this target file */
271  entry = insert_filehash_entry(path);
272  if (entry->target_exists)
273  pg_fatal("duplicate source file \"%s\"", path);
274  entry->target_exists = true;
275  entry->target_type = type;
276  entry->target_size = size;
277  entry->target_link_target = link_target ? pg_strdup(link_target) : NULL;
278 }
bool target_exists
Definition: filemap.h:59
char * target_link_target
Definition: filemap.h:62
file_type_t target_type
Definition: filemap.h:60

References FILE_TYPE_DIRECTORY, FILE_TYPE_SYMLINK, insert_filehash_entry(), pg_fatal, pg_strdup(), size, file_entry_t::target_exists, file_entry_t::target_link_target, file_entry_t::target_size, file_entry_t::target_type, and type.

Referenced by main().

◆ process_target_wal_block_change()

void process_target_wal_block_change ( ForkNumber  forknum,
RelFileLocator  rlocator,
BlockNumber  blkno 
)

Definition at line 290 of file filemap.c.

292 {
293  char *path;
294  file_entry_t *entry;
295  BlockNumber blkno_inseg;
296  int segno;
297 
298  segno = blkno / RELSEG_SIZE;
299  blkno_inseg = blkno % RELSEG_SIZE;
300 
301  path = datasegpath(rlocator, forknum, segno);
302  entry = lookup_filehash_entry(path);
303  pfree(path);
304 
305  /*
306  * If the block still exists in both systems, remember it. Otherwise we
307  * can safely ignore it.
308  *
309  * If the block is beyond the EOF in the source system, or the file
310  * doesn't exist in the source at all, we're going to truncate/remove it
311  * away from the target anyway. Likewise, if it doesn't exist in the
312  * target anymore, we will copy it over with the "tail" from the source
313  * system, anyway.
314  *
315  * It is possible to find WAL for a file that doesn't exist on either
316  * system anymore. It means that the relation was dropped later in the
317  * target system, and independently on the source system too, or that it
318  * was created and dropped in the target system and it never existed in
319  * the source. Either way, we can safely ignore it.
320  */
321  if (entry)
322  {
323  Assert(entry->isrelfile);
324 
325  if (entry->target_exists)
326  {
327  if (entry->target_type != FILE_TYPE_REGULAR)
328  pg_fatal("unexpected page modification for non-regular file \"%s\"",
329  entry->path);
330 
331  if (entry->source_exists)
332  {
333  off_t end_offset;
334 
335  end_offset = (blkno_inseg + 1) * BLCKSZ;
336  if (end_offset <= entry->source_size && end_offset <= entry->target_size)
337  datapagemap_add(&entry->target_pages_to_overwrite, blkno_inseg);
338  }
339  }
340  }
341 }
#define Assert(condition)
Definition: c.h:858
void datapagemap_add(datapagemap_t *map, BlockNumber blkno)
Definition: datapagemap.c:32
static char * datasegpath(RelFileLocator rlocator, ForkNumber forknum, BlockNumber segno)
Definition: filemap.c:591
static file_entry_t * lookup_filehash_entry(const char *path)
Definition: filemap.c:204
void pfree(void *pointer)
Definition: mcxt.c:1521
bool isrelfile
Definition: filemap.h:54

References Assert, datapagemap_add(), datasegpath(), FILE_TYPE_REGULAR, file_entry_t::isrelfile, lookup_filehash_entry(), file_entry_t::path, pfree(), pg_fatal, file_entry_t::source_exists, file_entry_t::target_exists, file_entry_t::target_pages_to_overwrite, and file_entry_t::target_type.

Referenced by extractPageInfo().