PostgreSQL Source Code  git master
fd.h File Reference
#include <dirent.h>
Include dependency graph for fd.h:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Macros

#define FILE_POSSIBLY_DELETED(err)   ((err) == ENOENT)
 
#define PG_TEMP_FILES_DIR   "pgsql_tmp"
 
#define PG_TEMP_FILE_PREFIX   "pgsql_tmp"
 

Typedefs

typedef int File
 

Functions

File PathNameOpenFile (const char *fileName, int fileFlags)
 
File PathNameOpenFilePerm (const char *fileName, int fileFlags, mode_t fileMode)
 
File OpenTemporaryFile (bool interXact)
 
void FileClose (File file)
 
int FilePrefetch (File file, off_t offset, int amount, uint32 wait_event_info)
 
int FileRead (File file, char *buffer, int amount, off_t offset, uint32 wait_event_info)
 
int FileWrite (File file, char *buffer, int amount, off_t offset, uint32 wait_event_info)
 
int FileSync (File file, uint32 wait_event_info)
 
off_t FileSize (File file)
 
int FileTruncate (File file, off_t offset, uint32 wait_event_info)
 
void FileWriteback (File file, off_t offset, off_t nbytes, uint32 wait_event_info)
 
char * FilePathName (File file)
 
int FileGetRawDesc (File file)
 
int FileGetRawFlags (File file)
 
mode_t FileGetRawMode (File file)
 
File PathNameCreateTemporaryFile (const char *name, bool error_on_failure)
 
File PathNameOpenTemporaryFile (const char *path, int mode)
 
bool PathNameDeleteTemporaryFile (const char *name, bool error_on_failure)
 
void PathNameCreateTemporaryDir (const char *base, const char *name)
 
void PathNameDeleteTemporaryDir (const char *name)
 
void TempTablespacePath (char *path, Oid tablespace)
 
FILE * AllocateFile (const char *name, const char *mode)
 
int FreeFile (FILE *file)
 
FILE * OpenPipeStream (const char *command, const char *mode)
 
int ClosePipeStream (FILE *file)
 
DIRAllocateDir (const char *dirname)
 
struct direntReadDir (DIR *dir, const char *dirname)
 
struct direntReadDirExtended (DIR *dir, const char *dirname, int elevel)
 
int FreeDir (DIR *dir)
 
int OpenTransientFile (const char *fileName, int fileFlags)
 
int OpenTransientFilePerm (const char *fileName, int fileFlags, mode_t fileMode)
 
int CloseTransientFile (int fd)
 
int BasicOpenFile (const char *fileName, int fileFlags)
 
int BasicOpenFilePerm (const char *fileName, int fileFlags, mode_t fileMode)
 
bool AcquireExternalFD (void)
 
void ReserveExternalFD (void)
 
void ReleaseExternalFD (void)
 
int MakePGDirectory (const char *directoryName)
 
void InitFileAccess (void)
 
void set_max_safe_fds (void)
 
void closeAllVfds (void)
 
void SetTempTablespaces (Oid *tableSpaces, int numSpaces)
 
bool TempTablespacesAreSet (void)
 
int GetTempTablespaces (Oid *tableSpaces, int numSpaces)
 
Oid GetNextTempTableSpace (void)
 
void AtEOXact_Files (bool isCommit)
 
void AtEOSubXact_Files (bool isCommit, SubTransactionId mySubid, SubTransactionId parentSubid)
 
void RemovePgTempFiles (void)
 
void RemovePgTempFilesInDir (const char *tmpdirname, bool missing_ok, bool unlink_all)
 
bool looks_like_temp_rel_name (const char *name)
 
int pg_fsync (int fd)
 
int pg_fsync_no_writethrough (int fd)
 
int pg_fsync_writethrough (int fd)
 
int pg_fdatasync (int fd)
 
void pg_flush_data (int fd, off_t offset, off_t amount)
 
void fsync_fname (const char *fname, bool isdir)
 
int fsync_fname_ext (const char *fname, bool isdir, bool ignore_perm, int elevel)
 
int durable_rename (const char *oldfile, const char *newfile, int loglevel)
 
int durable_unlink (const char *fname, int loglevel)
 
int durable_rename_excl (const char *oldfile, const char *newfile, int loglevel)
 
void SyncDataDirectory (void)
 
int data_sync_elevel (int elevel)
 

Variables

PGDLLIMPORT int max_files_per_process
 
PGDLLIMPORT bool data_sync_retry
 
int max_safe_fds
 

Macro Definition Documentation

◆ FILE_POSSIBLY_DELETED

#define FILE_POSSIBLY_DELETED (   err)    ((err) == ENOENT)

Definition at line 69 of file fd.h.

Referenced by _mdfd_getseg(), mdopenfork(), and ProcessSyncRequests().

◆ PG_TEMP_FILE_PREFIX

#define PG_TEMP_FILE_PREFIX   "pgsql_tmp"

Definition at line 166 of file fd.h.

◆ PG_TEMP_FILES_DIR

#define PG_TEMP_FILES_DIR   "pgsql_tmp"

Definition at line 165 of file fd.h.

Typedef Documentation

◆ File

typedef int File

Definition at line 49 of file fd.h.

Function Documentation

◆ AcquireExternalFD()

bool AcquireExternalFD ( void  )

Definition at line 1048 of file fd.c.

References max_safe_fds, numExternalFDs, and ReserveExternalFD().

Referenced by connect_pg_server(), CreateWaitEventSet(), dblink_connect(), and dblink_get_conn().

1049 {
1050  /*
1051  * We don't want more than max_safe_fds / 3 FDs to be consumed for
1052  * "external" FDs.
1053  */
1054  if (numExternalFDs < max_safe_fds / 3)
1055  {
1057  return true;
1058  }
1059  errno = EMFILE;
1060  return false;
1061 }
static int numExternalFDs
Definition: fd.c:259
int max_safe_fds
Definition: fd.c:155
void ReserveExternalFD(void)
Definition: fd.c:1083

◆ AllocateDir()

DIR* AllocateDir ( const char *  dirname)

Definition at line 2583 of file fd.c.

References AllocateDescDir, AllocateDesc::create_subid, AllocateDesc::desc, AllocateDesc::dir, DO_DB, elog, ereport, errcode(), errmsg(), ERROR, GetCurrentSubTransactionId(), AllocateDesc::kind, LOG, maxAllocatedDescs, numAllocatedDescs, opendir(), ReleaseLruFile(), ReleaseLruFiles(), and reserveAllocatedDesc().

Referenced by calculate_database_size(), calculate_tablespace_size(), CheckPointLogicalRewriteHeap(), CheckPointSnapBuild(), CleanupBackupHistory(), copydir(), db_dir_size(), DeleteAllExportedSnapshotFiles(), destroy_tablespace_directories(), directory_is_empty(), do_pg_start_backup(), dsm_cleanup_for_mmap(), extension_file_exists(), get_ext_ver_list(), getInstallationPaths(), movedb(), ParseTzFile(), perform_base_backup(), pg_available_extension_versions(), pg_available_extensions(), pg_logdir_ls_internal(), pg_ls_dir(), pg_ls_dir_files(), pg_tablespace_databases(), pg_tzenumerate_next(), pg_tzenumerate_start(), pgarch_readyXlog(), pgstat_reset_remove_files(), RelationCacheInitFileRemove(), RelationCacheInitFileRemoveInDir(), RemoveNonParentXlogFiles(), RemoveOldXlogFiles(), RemovePgTempFiles(), RemovePgTempFilesInDir(), RemovePgTempRelationFiles(), RemovePgTempRelationFilesInDbspace(), RemoveTempXlogFiles(), ReorderBufferCleanupSerializedTXNs(), ResetUnloggedRelations(), ResetUnloggedRelationsInDbspaceDir(), ResetUnloggedRelationsInTablespaceDir(), restoreTwoPhaseData(), scan_directory_ci(), sendDir(), SlruScanDirectory(), StartupReorderBuffer(), StartupReplicationSlots(), UpdateLogicalMappings(), and walkdir().

2584 {
2585  DIR *dir;
2586 
2587  DO_DB(elog(LOG, "AllocateDir: Allocated %d (%s)",
2588  numAllocatedDescs, dirname));
2589 
2590  /* Can we allocate another non-virtual FD? */
2591  if (!reserveAllocatedDesc())
2592  ereport(ERROR,
2593  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
2594  errmsg("exceeded maxAllocatedDescs (%d) while trying to open directory \"%s\"",
2595  maxAllocatedDescs, dirname)));
2596 
2597  /* Close excess kernel FDs. */
2598  ReleaseLruFiles();
2599 
2600 TryAgain:
2601  if ((dir = opendir(dirname)) != NULL)
2602  {
2604 
2605  desc->kind = AllocateDescDir;
2606  desc->desc.dir = dir;
2609  return desc->desc.dir;
2610  }
2611 
2612  if (errno == EMFILE || errno == ENFILE)
2613  {
2614  int save_errno = errno;
2615 
2616  ereport(LOG,
2617  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
2618  errmsg("out of file descriptors: %m; release and retry")));
2619  errno = 0;
2620  if (ReleaseLruFile())
2621  goto TryAgain;
2622  errno = save_errno;
2623  }
2624 
2625  return NULL;
2626 }
static AllocateDesc * allocatedDescs
Definition: fd.c:254
DIR * dir
Definition: fd.c:247
#define DO_DB(A)
Definition: fd.c:170
int errcode(int sqlerrcode)
Definition: elog.c:610
static bool reserveAllocatedDesc(void)
Definition: fd.c:2247
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static bool ReleaseLruFile(void)
Definition: fd.c:1244
Definition: dirent.c:25
#define ERROR
Definition: elog.h:43
DIR * opendir(const char *)
Definition: dirent.c:33
static void ReleaseLruFiles(void)
Definition: fd.c:1266
#define ereport(elevel,...)
Definition: elog.h:144
SubTransactionId GetCurrentSubTransactionId(void)
Definition: xact.c:723
SubTransactionId create_subid
Definition: fd.c:243
union AllocateDesc::@25 desc
int errmsg(const char *fmt,...)
Definition: elog.c:824
#define elog(elevel,...)
Definition: elog.h:214
static int maxAllocatedDescs
Definition: fd.c:253
static int numAllocatedDescs
Definition: fd.c:252

◆ AllocateFile()

FILE* AllocateFile ( const char *  name,
const char *  mode 
)

Definition at line 2322 of file fd.c.

References AllocateDescFile, AllocateDesc::create_subid, AllocateDesc::desc, DO_DB, elog, ereport, errcode(), errmsg(), ERROR, AllocateDesc::file, GetCurrentSubTransactionId(), AllocateDesc::kind, LOG, maxAllocatedDescs, numAllocatedDescs, ReleaseLruFile(), ReleaseLruFiles(), and reserveAllocatedDesc().

Referenced by _ShowOption(), AlterSystemSetConfigFile(), apw_dump_now(), apw_load_buffers(), BackendRun(), BeginCopyFrom(), BeginCopyTo(), checkControlFile(), do_pg_start_backup(), do_pg_stop_backup(), entry_reset(), existsTimeLineHistory(), ExportSnapshot(), fill_hba_view(), gc_qtexts(), ImportSnapshot(), load_dh_file(), load_hba(), load_ident(), load_relcache_init_file(), parse_extension_control_file(), ParseTzFile(), pg_backup_start_time(), pg_current_logfile(), pg_file_write_internal(), pg_promote(), PGSharedMemoryAttach(), pgss_shmem_shutdown(), pgss_shmem_startup(), pgstat_read_db_statsfile(), pgstat_read_db_statsfile_timestamp(), pgstat_read_statsfiles(), pgstat_write_db_statsfile(), pgstat_write_statsfiles(), PostmasterMarkPIDForWorkerNotify(), read_backup_label(), read_binary_file(), read_tablespace_map(), read_whole_file(), readTimeLineHistory(), tokenize_inc_file(), tsearch_readline_begin(), ValidatePgVersion(), write_relcache_init_file(), XLogArchiveForceDone(), and XLogArchiveNotify().

2323 {
2324  FILE *file;
2325 
2326  DO_DB(elog(LOG, "AllocateFile: Allocated %d (%s)",
2328 
2329  /* Can we allocate another non-virtual FD? */
2330  if (!reserveAllocatedDesc())
2331  ereport(ERROR,
2332  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
2333  errmsg("exceeded maxAllocatedDescs (%d) while trying to open file \"%s\"",
2334  maxAllocatedDescs, name)));
2335 
2336  /* Close excess kernel FDs. */
2337  ReleaseLruFiles();
2338 
2339 TryAgain:
2340  if ((file = fopen(name, mode)) != NULL)
2341  {
2343 
2344  desc->kind = AllocateDescFile;
2345  desc->desc.file = file;
2348  return desc->desc.file;
2349  }
2350 
2351  if (errno == EMFILE || errno == ENFILE)
2352  {
2353  int save_errno = errno;
2354 
2355  ereport(LOG,
2356  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
2357  errmsg("out of file descriptors: %m; release and retry")));
2358  errno = 0;
2359  if (ReleaseLruFile())
2360  goto TryAgain;
2361  errno = save_errno;
2362  }
2363 
2364  return NULL;
2365 }
static PgChecksumMode mode
Definition: pg_checksums.c:61
static AllocateDesc * allocatedDescs
Definition: fd.c:254
#define DO_DB(A)
Definition: fd.c:170
int errcode(int sqlerrcode)
Definition: elog.c:610
static bool reserveAllocatedDesc(void)
Definition: fd.c:2247
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static bool ReleaseLruFile(void)
Definition: fd.c:1244
#define ERROR
Definition: elog.h:43
static void ReleaseLruFiles(void)
Definition: fd.c:1266
FILE * file
Definition: fd.c:246
#define ereport(elevel,...)
Definition: elog.h:144
SubTransactionId GetCurrentSubTransactionId(void)
Definition: xact.c:723
SubTransactionId create_subid
Definition: fd.c:243
const char * name
Definition: encode.c:561
union AllocateDesc::@25 desc
int errmsg(const char *fmt,...)
Definition: elog.c:824
#define elog(elevel,...)
Definition: elog.h:214
static int maxAllocatedDescs
Definition: fd.c:253
static int numAllocatedDescs
Definition: fd.c:252

◆ AtEOSubXact_Files()

void AtEOSubXact_Files ( bool  isCommit,
SubTransactionId  mySubid,
SubTransactionId  parentSubid 
)

Definition at line 2871 of file fd.c.

References AllocateDesc::create_subid, FreeDesc(), i, and numAllocatedDescs.

Referenced by AbortSubTransaction(), and CommitSubTransaction().

2873 {
2874  Index i;
2875 
2876  for (i = 0; i < numAllocatedDescs; i++)
2877  {
2878  if (allocatedDescs[i].create_subid == mySubid)
2879  {
2880  if (isCommit)
2881  allocatedDescs[i].create_subid = parentSubid;
2882  else
2883  {
2884  /* have to recheck the item after FreeDesc (ugly) */
2885  FreeDesc(&allocatedDescs[i--]);
2886  }
2887  }
2888  }
2889 }
static AllocateDesc * allocatedDescs
Definition: fd.c:254
static int FreeDesc(AllocateDesc *desc)
Definition: fd.c:2482
unsigned int Index
Definition: c.h:482
SubTransactionId create_subid
Definition: fd.c:243
int i
static int numAllocatedDescs
Definition: fd.c:252

◆ AtEOXact_Files()

void AtEOXact_Files ( bool  isCommit)

Definition at line 2904 of file fd.c.

References CleanupTempFiles(), numTempTableSpaces, and tempTableSpaces.

Referenced by AbortTransaction(), AutoVacLauncherMain(), BackgroundWriterMain(), CheckpointerMain(), CommitTransaction(), PrepareTransaction(), and WalWriterMain().

2905 {
2906  CleanupTempFiles(isCommit, false);
2907  tempTableSpaces = NULL;
2908  numTempTableSpaces = -1;
2909 }
static int numTempTableSpaces
Definition: fd.c:274
static Oid * tempTableSpaces
Definition: fd.c:273
static void CleanupTempFiles(bool isCommit, bool isProcExit)
Definition: fd.c:2936

◆ BasicOpenFile()

int BasicOpenFile ( const char *  fileName,
int  fileFlags 
)

Definition at line 986 of file fd.c.

References BasicOpenFilePerm(), and pg_file_create_mode.

Referenced by AlterSystemSetConfigFile(), ReadControlFile(), update_controlfile(), wal_segment_open(), WalSndSegmentOpen(), WriteControlFile(), XLogFileInit(), XLogFileOpen(), and XLogFileRead().

987 {
988  return BasicOpenFilePerm(fileName, fileFlags, pg_file_create_mode);
989 }
int pg_file_create_mode
Definition: file_perm.c:19
int BasicOpenFilePerm(const char *fileName, int fileFlags, mode_t fileMode)
Definition: fd.c:1008

◆ BasicOpenFilePerm()

int BasicOpenFilePerm ( const char *  fileName,
int  fileFlags,
mode_t  fileMode 
)

Definition at line 1008 of file fd.c.

References ereport, errcode(), errmsg(), vfd::fd, LOG, and ReleaseLruFile().

Referenced by BasicOpenFile(), LruInsert(), OpenTransientFilePerm(), PathNameOpenFilePerm(), and readRecoverySignalFile().

1009 {
1010  int fd;
1011 
1012 tryAgain:
1013  fd = open(fileName, fileFlags, fileMode);
1014 
1015  if (fd >= 0)
1016  return fd; /* success! */
1017 
1018  if (errno == EMFILE || errno == ENFILE)
1019  {
1020  int save_errno = errno;
1021 
1022  ereport(LOG,
1023  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
1024  errmsg("out of file descriptors: %m; release and retry")));
1025  errno = 0;
1026  if (ReleaseLruFile())
1027  goto tryAgain;
1028  errno = save_errno;
1029  }
1030 
1031  return -1; /* failure */
1032 }
int errcode(int sqlerrcode)
Definition: elog.c:610
#define LOG
Definition: elog.h:26
static int fd(const char *x, int i)
Definition: preproc-init.c:105
static bool ReleaseLruFile(void)
Definition: fd.c:1244
#define ereport(elevel,...)
Definition: elog.h:144
int errmsg(const char *fmt,...)
Definition: elog.c:824

◆ closeAllVfds()

void closeAllVfds ( void  )

Definition at line 2760 of file fd.c.

References Assert, FileIsNotOpen, i, LruDelete(), and SizeVfdCache.

Referenced by standard_ProcessUtility().

2761 {
2762  Index i;
2763 
2764  if (SizeVfdCache > 0)
2765  {
2766  Assert(FileIsNotOpen(0)); /* Make sure ring not corrupted */
2767  for (i = 1; i < SizeVfdCache; i++)
2768  {
2769  if (!FileIsNotOpen(i))
2770  LruDelete(i);
2771  }
2772  }
2773 }
static Size SizeVfdCache
Definition: fd.c:207
static void LruDelete(File file)
Definition: fd.c:1149
#define FileIsNotOpen(file)
Definition: fd.c:179
unsigned int Index
Definition: c.h:482
#define Assert(condition)
Definition: c.h:745
int i

◆ ClosePipeStream()

int ClosePipeStream ( FILE *  file)

Definition at line 2731 of file fd.c.

References AllocateDescPipe, AllocateDesc::desc, DO_DB, elog, AllocateDesc::file, FreeDesc(), i, AllocateDesc::kind, LOG, numAllocatedDescs, and WARNING.

Referenced by ClosePipeToProgram(), pg_import_system_collations(), and run_ssl_passphrase_command().

2732 {
2733  int i;
2734 
2735  DO_DB(elog(LOG, "ClosePipeStream: Allocated %d", numAllocatedDescs));
2736 
2737  /* Remove file from list of allocated files, if it's present */
2738  for (i = numAllocatedDescs; --i >= 0;)
2739  {
2740  AllocateDesc *desc = &allocatedDescs[i];
2741 
2742  if (desc->kind == AllocateDescPipe && desc->desc.file == file)
2743  return FreeDesc(desc);
2744  }
2745 
2746  /* Only get here if someone passes us a file not in allocatedDescs */
2747  elog(WARNING, "file passed to ClosePipeStream was not obtained from OpenPipeStream");
2748 
2749  return pclose(file);
2750 }
static AllocateDesc * allocatedDescs
Definition: fd.c:254
#define DO_DB(A)
Definition: fd.c:170
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static int FreeDesc(AllocateDesc *desc)
Definition: fd.c:2482
#define WARNING
Definition: elog.h:40
FILE * file
Definition: fd.c:246
union AllocateDesc::@25 desc
#define elog(elevel,...)
Definition: elog.h:214
int i
static int numAllocatedDescs
Definition: fd.c:252

◆ CloseTransientFile()

int CloseTransientFile ( int  fd)

Definition at line 2549 of file fd.c.

References AllocateDescRawFD, close, AllocateDesc::desc, DO_DB, elog, AllocateDesc::fd, FreeDesc(), i, AllocateDesc::kind, LOG, numAllocatedDescs, and WARNING.

Referenced by ApplyLogicalMappingFile(), be_lo_export(), CheckPointLogicalRewriteHeap(), CheckPointReplicationOrigin(), copy_file(), dsm_impl_mmap(), durable_rename(), fsync_fname_ext(), get_controlfile(), heap_xlog_logical_rewrite(), lo_import_internal(), load_relmap_file(), mdunlinkfork(), perform_base_backup(), qtext_load_file(), qtext_store(), ReadTwoPhaseFile(), RecreateTwoPhaseFile(), ReorderBufferSerializeChange(), ReorderBufferSerializeTXN(), RestoreSlotFromDisk(), SaveSlotToPath(), sendFile(), SendTimeLineHistory(), SimpleLruDoesPhysicalPageExist(), SimpleLruWriteAll(), SlruInternalWritePage(), SlruPhysicalReadPage(), SlruPhysicalWritePage(), SlruSyncFileTag(), SnapBuildRestore(), SnapBuildSerialize(), StartupReplicationOrigin(), walkdir(), write_relmap_file(), writeTimeLineHistory(), writeTimeLineHistoryFile(), and XLogFileCopy().

2550 {
2551  int i;
2552 
2553  DO_DB(elog(LOG, "CloseTransientFile: Allocated %d", numAllocatedDescs));
2554 
2555  /* Remove fd from list of allocated files, if it's present */
2556  for (i = numAllocatedDescs; --i >= 0;)
2557  {
2558  AllocateDesc *desc = &allocatedDescs[i];
2559 
2560  if (desc->kind == AllocateDescRawFD && desc->desc.fd == fd)
2561  return FreeDesc(desc);
2562  }
2563 
2564  /* Only get here if someone passes us a file not in allocatedDescs */
2565  elog(WARNING, "fd passed to CloseTransientFile was not obtained from OpenTransientFile");
2566 
2567  return close(fd);
2568 }
static AllocateDesc * allocatedDescs
Definition: fd.c:254
#define DO_DB(A)
Definition: fd.c:170
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static int fd(const char *x, int i)
Definition: preproc-init.c:105
static int FreeDesc(AllocateDesc *desc)
Definition: fd.c:2482
#define WARNING
Definition: elog.h:40
int fd
Definition: fd.c:248
union AllocateDesc::@25 desc
#define elog(elevel,...)
Definition: elog.h:214
int i
#define close(a)
Definition: win32.h:12
static int numAllocatedDescs
Definition: fd.c:252

◆ data_sync_elevel()

◆ durable_rename()

int durable_rename ( const char *  oldfile,
const char *  newfile,
int  loglevel 
)

Definition at line 659 of file fd.c.

References CloseTransientFile(), ereport, errcode_for_file_access(), errmsg(), vfd::fd, fsync_fname_ext(), fsync_parent_path(), OpenTransientFile(), PG_BINARY, and pg_fsync().

Referenced by AlterSystemSetConfigFile(), apw_dump_now(), BaseBackup(), CancelBackup(), CheckPointReplicationOrigin(), dir_close(), KeepFileRestoredFromArchive(), pgarch_archiveDone(), pgss_shmem_shutdown(), StartupXLOG(), and XLogArchiveForceDone().

660 {
661  int fd;
662 
663  /*
664  * First fsync the old and target path (if it exists), to ensure that they
665  * are properly persistent on disk. Syncing the target file is not
666  * strictly necessary, but it makes it easier to reason about crashes;
667  * because it's then guaranteed that either source or target file exists
668  * after a crash.
669  */
670  if (fsync_fname_ext(oldfile, false, false, elevel) != 0)
671  return -1;
672 
673  fd = OpenTransientFile(newfile, PG_BINARY | O_RDWR);
674  if (fd < 0)
675  {
676  if (errno != ENOENT)
677  {
678  ereport(elevel,
680  errmsg("could not open file \"%s\": %m", newfile)));
681  return -1;
682  }
683  }
684  else
685  {
686  if (pg_fsync(fd) != 0)
687  {
688  int save_errno;
689 
690  /* close file upon error, might not be in transaction context */
691  save_errno = errno;
692  CloseTransientFile(fd);
693  errno = save_errno;
694 
695  ereport(elevel,
697  errmsg("could not fsync file \"%s\": %m", newfile)));
698  return -1;
699  }
700 
701  if (CloseTransientFile(fd) != 0)
702  {
703  ereport(elevel,
705  errmsg("could not close file \"%s\": %m", newfile)));
706  return -1;
707  }
708  }
709 
710  /* Time to do the real deal... */
711  if (rename(oldfile, newfile) < 0)
712  {
713  ereport(elevel,
715  errmsg("could not rename file \"%s\" to \"%s\": %m",
716  oldfile, newfile)));
717  return -1;
718  }
719 
720  /*
721  * To guarantee renaming the file is persistent, fsync the file with its
722  * new name, and its containing directory.
723  */
724  if (fsync_fname_ext(newfile, false, false, elevel) != 0)
725  return -1;
726 
727  if (fsync_parent_path(newfile, elevel) != 0)
728  return -1;
729 
730  return 0;
731 }
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define PG_BINARY
Definition: c.h:1211
int OpenTransientFile(const char *fileName, int fileFlags)
Definition: fd.c:2372
int errcode_for_file_access(void)
Definition: elog.c:633
int CloseTransientFile(int fd)
Definition: fd.c:2549
static int elevel
Definition: vacuumlazy.c:333
#define ereport(elevel,...)
Definition: elog.h:144
int errmsg(const char *fmt,...)
Definition: elog.c:824
int pg_fsync(int fd)
Definition: fd.c:346
int fsync_fname_ext(const char *fname, bool isdir, bool ignore_perm, int elevel)
Definition: fd.c:3464
static int fsync_parent_path(const char *fname, int elevel)
Definition: fd.c:3540

◆ durable_rename_excl()

int durable_rename_excl ( const char *  oldfile,
const char *  newfile,
int  loglevel 
)

Definition at line 786 of file fd.c.

References ereport, errcode_for_file_access(), errmsg(), fsync_fname_ext(), fsync_parent_path(), and link().

Referenced by InstallXLogFileSegment(), writeTimeLineHistory(), and writeTimeLineHistoryFile().

787 {
788  /*
789  * Ensure that, if we crash directly after the rename/link, a file with
790  * valid contents is moved into place.
791  */
792  if (fsync_fname_ext(oldfile, false, false, elevel) != 0)
793  return -1;
794 
795  if (link(oldfile, newfile) < 0)
796  {
797  ereport(elevel,
799  errmsg("could not link file \"%s\" to \"%s\": %m",
800  oldfile, newfile)));
801  return -1;
802  }
803  unlink(oldfile);
804 
805  /*
806  * Make change persistent in case of an OS crash, both the new entry and
807  * its parent directory need to be flushed.
808  */
809  if (fsync_fname_ext(newfile, false, false, elevel) != 0)
810  return -1;
811 
812  /* Same for parent directory */
813  if (fsync_parent_path(newfile, elevel) != 0)
814  return -1;
815 
816  return 0;
817 }
int errcode_for_file_access(void)
Definition: elog.c:633
static int elevel
Definition: vacuumlazy.c:333
#define ereport(elevel,...)
Definition: elog.h:144
int errmsg(const char *fmt,...)
Definition: elog.c:824
int link(const char *src, const char *dst)
int fsync_fname_ext(const char *fname, bool isdir, bool ignore_perm, int elevel)
Definition: fd.c:3464
static int fsync_parent_path(const char *fname, int elevel)
Definition: fd.c:3540

◆ durable_unlink()

int durable_unlink ( const char *  fname,
int  loglevel 
)

Definition at line 749 of file fd.c.

References ereport, errcode_for_file_access(), errmsg(), and fsync_parent_path().

Referenced by do_pg_stop_backup(), exitArchiveRecovery(), InstallXLogFileSegment(), and RemoveXlogFile().

750 {
751  if (unlink(fname) < 0)
752  {
753  ereport(elevel,
755  errmsg("could not remove file \"%s\": %m",
756  fname)));
757  return -1;
758  }
759 
760  /*
761  * To guarantee that the removal of the file is persistent, fsync its
762  * parent directory.
763  */
764  if (fsync_parent_path(fname, elevel) != 0)
765  return -1;
766 
767  return 0;
768 }
int errcode_for_file_access(void)
Definition: elog.c:633
static int elevel
Definition: vacuumlazy.c:333
#define ereport(elevel,...)
Definition: elog.h:144
int errmsg(const char *fmt,...)
Definition: elog.c:824
static int fsync_parent_path(const char *fname, int elevel)
Definition: fd.c:3540

◆ FileClose()

void FileClose ( File  file)

Definition at line 1826 of file fd.c.

References Assert, close, data_sync_elevel(), Delete(), DO_DB, elog, vfd::fd, FD_DELETE_AT_CLOSE, FD_TEMP_FILE_LIMIT, vfd::fdstate, FileIsNotOpen, FileIsValid, vfd::fileName, vfd::fileSize, FreeVfd(), LOG, nfile, ReportTemporaryFileUsage(), ResourceOwnerForgetFile(), vfd::resowner, stat, temporary_files_size, and VFD_CLOSED.

Referenced by BufFileClose(), BufFileTruncateShared(), CleanupTempFiles(), logical_end_heap_rewrite(), mdclose(), mdimmedsync(), mdsyncfiletag(), mdtruncate(), ReorderBufferIterTXNFinish(), ReorderBufferRestoreChanges(), and ResourceOwnerReleaseInternal().

1827 {
1828  Vfd *vfdP;
1829 
1830  Assert(FileIsValid(file));
1831 
1832  DO_DB(elog(LOG, "FileClose: %d (%s)",
1833  file, VfdCache[file].fileName));
1834 
1835  vfdP = &VfdCache[file];
1836 
1837  if (!FileIsNotOpen(file))
1838  {
1839  /* close the file */
1840  if (close(vfdP->fd) != 0)
1841  {
1842  /*
1843  * We may need to panic on failure to close non-temporary files;
1844  * see LruDelete.
1845  */
1847  "could not close file \"%s\": %m", vfdP->fileName);
1848  }
1849 
1850  --nfile;
1851  vfdP->fd = VFD_CLOSED;
1852 
1853  /* remove the file from the lru ring */
1854  Delete(file);
1855  }
1856 
1857  if (vfdP->fdstate & FD_TEMP_FILE_LIMIT)
1858  {
1859  /* Subtract its size from current usage (do first in case of error) */
1860  temporary_files_size -= vfdP->fileSize;
1861  vfdP->fileSize = 0;
1862  }
1863 
1864  /*
1865  * Delete the file if it was temporary, and make a log entry if wanted
1866  */
1867  if (vfdP->fdstate & FD_DELETE_AT_CLOSE)
1868  {
1869  struct stat filestats;
1870  int stat_errno;
1871 
1872  /*
1873  * If we get an error, as could happen within the ereport/elog calls,
1874  * we'll come right back here during transaction abort. Reset the
1875  * flag to ensure that we can't get into an infinite loop. This code
1876  * is arranged to ensure that the worst-case consequence is failing to
1877  * emit log message(s), not failing to attempt the unlink.
1878  */
1879  vfdP->fdstate &= ~FD_DELETE_AT_CLOSE;
1880 
1881 
1882  /* first try the stat() */
1883  if (stat(vfdP->fileName, &filestats))
1884  stat_errno = errno;
1885  else
1886  stat_errno = 0;
1887 
1888  /* in any case do the unlink */
1889  if (unlink(vfdP->fileName))
1890  elog(LOG, "could not unlink file \"%s\": %m", vfdP->fileName);
1891 
1892  /* and last report the stat results */
1893  if (stat_errno == 0)
1894  ReportTemporaryFileUsage(vfdP->fileName, filestats.st_size);
1895  else
1896  {
1897  errno = stat_errno;
1898  elog(LOG, "could not stat file \"%s\": %m", vfdP->fileName);
1899  }
1900  }
1901 
1902  /* Unregister it from the resource owner */
1903  if (vfdP->resowner)
1904  ResourceOwnerForgetFile(vfdP->resowner, file);
1905 
1906  /*
1907  * Return the Vfd slot to the free list
1908  */
1909  FreeVfd(file);
1910 }
#define FD_TEMP_FILE_LIMIT
Definition: fd.c:184
#define DO_DB(A)
Definition: fd.c:170
#define FD_DELETE_AT_CLOSE
Definition: fd.c:182
static Vfd * VfdCache
Definition: fd.c:206
static void Delete(File file)
Definition: fd.c:1130
#define LOG
Definition: elog.h:26
char * fileName
Definition: fd.c:195
static int nfile
Definition: fd.c:212
unsigned short fdstate
Definition: fd.c:189
Definition: fd.c:186
off_t fileSize
Definition: fd.c:194
int fd
Definition: fd.c:188
ResourceOwner resowner
Definition: fd.c:190
static void ReportTemporaryFileUsage(const char *path, off_t size)
Definition: fd.c:1390
#define stat(a, b)
Definition: win32_port.h:255
#define FileIsNotOpen(file)
Definition: fd.c:179
int data_sync_elevel(int elevel)
Definition: fd.c:3603
#define FileIsValid(file)
Definition: fd.c:176
#define VFD_CLOSED
Definition: fd.c:174
static uint64 temporary_files_size
Definition: fd.c:226
#define Assert(condition)
Definition: c.h:745
#define elog(elevel,...)
Definition: elog.h:214
static void FreeVfd(File file)
Definition: fd.c:1334
#define close(a)
Definition: win32.h:12
void ResourceOwnerForgetFile(ResourceOwner owner, File file)
Definition: resowner.c:1277

◆ FileGetRawDesc()

int FileGetRawDesc ( File  file)

Definition at line 2216 of file fd.c.

References Assert, vfd::fd, and FileIsValid.

2217 {
2218  Assert(FileIsValid(file));
2219  return VfdCache[file].fd;
2220 }
static Vfd * VfdCache
Definition: fd.c:206
int fd
Definition: fd.c:188
#define FileIsValid(file)
Definition: fd.c:176
#define Assert(condition)
Definition: c.h:745

◆ FileGetRawFlags()

int FileGetRawFlags ( File  file)

Definition at line 2226 of file fd.c.

References Assert, vfd::fileFlags, and FileIsValid.

2227 {
2228  Assert(FileIsValid(file));
2229  return VfdCache[file].fileFlags;
2230 }
static Vfd * VfdCache
Definition: fd.c:206
#define FileIsValid(file)
Definition: fd.c:176
#define Assert(condition)
Definition: c.h:745
int fileFlags
Definition: fd.c:197

◆ FileGetRawMode()

mode_t FileGetRawMode ( File  file)

Definition at line 2236 of file fd.c.

References Assert, FileIsValid, and vfd::fileMode.

2237 {
2238  Assert(FileIsValid(file));
2239  return VfdCache[file].fileMode;
2240 }
static Vfd * VfdCache
Definition: fd.c:206
mode_t fileMode
Definition: fd.c:198
#define FileIsValid(file)
Definition: fd.c:176
#define Assert(condition)
Definition: c.h:745

◆ FilePathName()

char* FilePathName ( File  file)

Definition at line 2200 of file fd.c.

References Assert, FileIsValid, and vfd::fileName.

Referenced by _mdnblocks(), BufFileDumpBuffer(), BufFileLoadBuffer(), BufFileSeek(), BufFileSize(), BufFileTruncateShared(), mdextend(), mdimmedsync(), mdread(), mdsyncfiletag(), mdtruncate(), mdwrite(), and register_dirty_segment().

2201 {
2202  Assert(FileIsValid(file));
2203 
2204  return VfdCache[file].fileName;
2205 }
static Vfd * VfdCache
Definition: fd.c:206
char * fileName
Definition: fd.c:195
#define FileIsValid(file)
Definition: fd.c:176
#define Assert(condition)
Definition: c.h:745

◆ FilePrefetch()

int FilePrefetch ( File  file,
off_t  offset,
int  amount,
uint32  wait_event_info 
)

Definition at line 1922 of file fd.c.

References Assert, DO_DB, elog, vfd::fd, FileAccess(), FileIsValid, vfd::fileName, INT64_FORMAT, LOG, pgstat_report_wait_end(), and pgstat_report_wait_start().

Referenced by mdprefetch().

1923 {
1924 #if defined(USE_POSIX_FADVISE) && defined(POSIX_FADV_WILLNEED)
1925  int returnCode;
1926 
1927  Assert(FileIsValid(file));
1928 
1929  DO_DB(elog(LOG, "FilePrefetch: %d (%s) " INT64_FORMAT " %d",
1930  file, VfdCache[file].fileName,
1931  (int64) offset, amount));
1932 
1933  returnCode = FileAccess(file);
1934  if (returnCode < 0)
1935  return returnCode;
1936 
1937  pgstat_report_wait_start(wait_event_info);
1938  returnCode = posix_fadvise(VfdCache[file].fd, offset, amount,
1939  POSIX_FADV_WILLNEED);
1941 
1942  return returnCode;
1943 #else
1944  Assert(FileIsValid(file));
1945  return 0;
1946 #endif
1947 }
#define DO_DB(A)
Definition: fd.c:170
static Vfd * VfdCache
Definition: fd.c:206
#define LOG
Definition: elog.h:26
static int fd(const char *x, int i)
Definition: preproc-init.c:105
static void pgstat_report_wait_end(void)
Definition: pgstat.h:1386
#define FileIsValid(file)
Definition: fd.c:176
static int FileAccess(File file)
Definition: fd.c:1354
#define Assert(condition)
Definition: c.h:745
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: pgstat.h:1362
#define INT64_FORMAT
Definition: c.h:416
#define elog(elevel,...)
Definition: elog.h:214

◆ FileRead()

int FileRead ( File  file,
char *  buffer,
int  amount,
off_t  offset,
uint32  wait_event_info 
)

Definition at line 1973 of file fd.c.

References _dosmaperr(), Assert, DO_DB, EINTR, elog, error(), vfd::fd, FileAccess(), FileIsValid, vfd::fileName, INT64_FORMAT, LOG, pg_pread(), pg_usleep(), pgstat_report_wait_end(), and pgstat_report_wait_start().

Referenced by BufFileLoadBuffer(), mdread(), and ReorderBufferRestoreChanges().

1975 {
1976  int returnCode;
1977  Vfd *vfdP;
1978 
1979  Assert(FileIsValid(file));
1980 
1981  DO_DB(elog(LOG, "FileRead: %d (%s) " INT64_FORMAT " %d %p",
1982  file, VfdCache[file].fileName,
1983  (int64) offset,
1984  amount, buffer));
1985 
1986  returnCode = FileAccess(file);
1987  if (returnCode < 0)
1988  return returnCode;
1989 
1990  vfdP = &VfdCache[file];
1991 
1992 retry:
1993  pgstat_report_wait_start(wait_event_info);
1994  returnCode = pg_pread(vfdP->fd, buffer, amount, offset);
1996 
1997  if (returnCode < 0)
1998  {
1999  /*
2000  * Windows may run out of kernel buffers and return "Insufficient
2001  * system resources" error. Wait a bit and retry to solve it.
2002  *
2003  * It is rumored that EINTR is also possible on some Unix filesystems,
2004  * in which case immediate retry is indicated.
2005  */
2006 #ifdef WIN32
2007  DWORD error = GetLastError();
2008 
2009  switch (error)
2010  {
2011  case ERROR_NO_SYSTEM_RESOURCES:
2012  pg_usleep(1000L);
2013  errno = EINTR;
2014  break;
2015  default:
2016  _dosmaperr(error);
2017  break;
2018  }
2019 #endif
2020  /* OK to retry if interrupted */
2021  if (errno == EINTR)
2022  goto retry;
2023  }
2024 
2025  return returnCode;
2026 }
static void error(void)
Definition: sql-dyntest.c:147
#define DO_DB(A)
Definition: fd.c:170
void _dosmaperr(unsigned long)
Definition: win32error.c:171
static Vfd * VfdCache
Definition: fd.c:206
#define LOG
Definition: elog.h:26
ssize_t pg_pread(int fd, void *buf, size_t nbyte, off_t offset)
Definition: pread.c:27
void pg_usleep(long microsec)
Definition: signal.c:53
static void pgstat_report_wait_end(void)
Definition: pgstat.h:1386
Definition: fd.c:186
int fd
Definition: fd.c:188
#define FileIsValid(file)
Definition: fd.c:176
static int FileAccess(File file)
Definition: fd.c:1354
#define Assert(condition)
Definition: c.h:745
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: pgstat.h:1362
#define INT64_FORMAT
Definition: c.h:416
#define elog(elevel,...)
Definition: elog.h:214
#define EINTR
Definition: win32_port.h:323

◆ FileSize()

off_t FileSize ( File  file)

Definition at line 2148 of file fd.c.

References Assert, DO_DB, elog, vfd::fd, FileAccess(), FileIsNotOpen, FileIsValid, vfd::fileName, and LOG.

Referenced by _mdnblocks(), BufFileSeek(), and BufFileSize().

2149 {
2150  Assert(FileIsValid(file));
2151 
2152  DO_DB(elog(LOG, "FileSize %d (%s)",
2153  file, VfdCache[file].fileName));
2154 
2155  if (FileIsNotOpen(file))
2156  {
2157  if (FileAccess(file) < 0)
2158  return (off_t) -1;
2159  }
2160 
2161  return lseek(VfdCache[file].fd, 0, SEEK_END);
2162 }
#define DO_DB(A)
Definition: fd.c:170
static Vfd * VfdCache
Definition: fd.c:206
#define LOG
Definition: elog.h:26
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define FileIsNotOpen(file)
Definition: fd.c:179
#define FileIsValid(file)
Definition: fd.c:176
static int FileAccess(File file)
Definition: fd.c:1354
#define Assert(condition)
Definition: c.h:745
#define elog(elevel,...)
Definition: elog.h:214

◆ FileSync()

int FileSync ( File  file,
uint32  wait_event_info 
)

Definition at line 2127 of file fd.c.

References Assert, DO_DB, elog, vfd::fd, FileAccess(), FileIsValid, vfd::fileName, LOG, pg_fsync(), pgstat_report_wait_end(), and pgstat_report_wait_start().

Referenced by logical_end_heap_rewrite(), mdimmedsync(), mdsyncfiletag(), and register_dirty_segment().

2128 {
2129  int returnCode;
2130 
2131  Assert(FileIsValid(file));
2132 
2133  DO_DB(elog(LOG, "FileSync: %d (%s)",
2134  file, VfdCache[file].fileName));
2135 
2136  returnCode = FileAccess(file);
2137  if (returnCode < 0)
2138  return returnCode;
2139 
2140  pgstat_report_wait_start(wait_event_info);
2141  returnCode = pg_fsync(VfdCache[file].fd);
2143 
2144  return returnCode;
2145 }
#define DO_DB(A)
Definition: fd.c:170
static Vfd * VfdCache
Definition: fd.c:206
#define LOG
Definition: elog.h:26
static int fd(const char *x, int i)
Definition: preproc-init.c:105
static void pgstat_report_wait_end(void)
Definition: pgstat.h:1386
#define FileIsValid(file)
Definition: fd.c:176
static int FileAccess(File file)
Definition: fd.c:1354
#define Assert(condition)
Definition: c.h:745
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: pgstat.h:1362
#define elog(elevel,...)
Definition: elog.h:214
int pg_fsync(int fd)
Definition: fd.c:346

◆ FileTruncate()

int FileTruncate ( File  file,
off_t  offset,
uint32  wait_event_info 
)

Definition at line 2165 of file fd.c.

References Assert, DO_DB, elog, vfd::fd, FD_TEMP_FILE_LIMIT, vfd::fdstate, FileAccess(), FileIsValid, vfd::fileName, vfd::fileSize, ftruncate, LOG, pgstat_report_wait_end(), pgstat_report_wait_start(), and temporary_files_size.

Referenced by BufFileTruncateShared(), and mdtruncate().

2166 {
2167  int returnCode;
2168 
2169  Assert(FileIsValid(file));
2170 
2171  DO_DB(elog(LOG, "FileTruncate %d (%s)",
2172  file, VfdCache[file].fileName));
2173 
2174  returnCode = FileAccess(file);
2175  if (returnCode < 0)
2176  return returnCode;
2177 
2178  pgstat_report_wait_start(wait_event_info);
2179  returnCode = ftruncate(VfdCache[file].fd, offset);
2181 
2182  if (returnCode == 0 && VfdCache[file].fileSize > offset)
2183  {
2184  /* adjust our state for truncation of a temp file */
2185  Assert(VfdCache[file].fdstate & FD_TEMP_FILE_LIMIT);
2186  temporary_files_size -= VfdCache[file].fileSize - offset;
2187  VfdCache[file].fileSize = offset;
2188  }
2189 
2190  return returnCode;
2191 }
#define FD_TEMP_FILE_LIMIT
Definition: fd.c:184
#define DO_DB(A)
Definition: fd.c:170
static Vfd * VfdCache
Definition: fd.c:206
#define LOG
Definition: elog.h:26
static int fd(const char *x, int i)
Definition: preproc-init.c:105
static void pgstat_report_wait_end(void)
Definition: pgstat.h:1386
off_t fileSize
Definition: fd.c:194
#define FileIsValid(file)
Definition: fd.c:176
static uint64 temporary_files_size
Definition: fd.c:226
static int FileAccess(File file)
Definition: fd.c:1354
#define Assert(condition)
Definition: c.h:745
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: pgstat.h:1362
#define elog(elevel,...)
Definition: elog.h:214
#define ftruncate(a, b)
Definition: win32_port.h:59

◆ FileWrite()

int FileWrite ( File  file,
char *  buffer,
int  amount,
off_t  offset,
uint32  wait_event_info 
)

Definition at line 2029 of file fd.c.

References _dosmaperr(), Assert, DO_DB, EINTR, elog, ereport, errcode(), errmsg(), ERROR, error(), vfd::fd, FD_TEMP_FILE_LIMIT, vfd::fdstate, FileAccess(), FileIsValid, vfd::fileName, vfd::fileSize, INT64_FORMAT, LOG, pg_pwrite(), pg_usleep(), pgstat_report_wait_end(), pgstat_report_wait_start(), temp_file_limit, and temporary_files_size.

Referenced by BufFileDumpBuffer(), logical_heap_rewrite_flush_mappings(), mdextend(), and mdwrite().

2031 {
2032  int returnCode;
2033  Vfd *vfdP;
2034 
2035  Assert(FileIsValid(file));
2036 
2037  DO_DB(elog(LOG, "FileWrite: %d (%s) " INT64_FORMAT " %d %p",
2038  file, VfdCache[file].fileName,
2039  (int64) offset,
2040  amount, buffer));
2041 
2042  returnCode = FileAccess(file);
2043  if (returnCode < 0)
2044  return returnCode;
2045 
2046  vfdP = &VfdCache[file];
2047 
2048  /*
2049  * If enforcing temp_file_limit and it's a temp file, check to see if the
2050  * write would overrun temp_file_limit, and throw error if so. Note: it's
2051  * really a modularity violation to throw error here; we should set errno
2052  * and return -1. However, there's no way to report a suitable error
2053  * message if we do that. All current callers would just throw error
2054  * immediately anyway, so this is safe at present.
2055  */
2056  if (temp_file_limit >= 0 && (vfdP->fdstate & FD_TEMP_FILE_LIMIT))
2057  {
2058  off_t past_write = offset + amount;
2059 
2060  if (past_write > vfdP->fileSize)
2061  {
2062  uint64 newTotal = temporary_files_size;
2063 
2064  newTotal += past_write - vfdP->fileSize;
2065  if (newTotal > (uint64) temp_file_limit * (uint64) 1024)
2066  ereport(ERROR,
2067  (errcode(ERRCODE_CONFIGURATION_LIMIT_EXCEEDED),
2068  errmsg("temporary file size exceeds temp_file_limit (%dkB)",
2069  temp_file_limit)));
2070  }
2071  }
2072 
2073 retry:
2074  errno = 0;
2075  pgstat_report_wait_start(wait_event_info);
2076  returnCode = pg_pwrite(VfdCache[file].fd, buffer, amount, offset);
2078 
2079  /* if write didn't set errno, assume problem is no disk space */
2080  if (returnCode != amount && errno == 0)
2081  errno = ENOSPC;
2082 
2083  if (returnCode >= 0)
2084  {
2085  /*
2086  * Maintain fileSize and temporary_files_size if it's a temp file.
2087  */
2088  if (vfdP->fdstate & FD_TEMP_FILE_LIMIT)
2089  {
2090  off_t past_write = offset + amount;
2091 
2092  if (past_write > vfdP->fileSize)
2093  {
2094  temporary_files_size += past_write - vfdP->fileSize;
2095  vfdP->fileSize = past_write;
2096  }
2097  }
2098  }
2099  else
2100  {
2101  /*
2102  * See comments in FileRead()
2103  */
2104 #ifdef WIN32
2105  DWORD error = GetLastError();
2106 
2107  switch (error)
2108  {
2109  case ERROR_NO_SYSTEM_RESOURCES:
2110  pg_usleep(1000L);
2111  errno = EINTR;
2112  break;
2113  default:
2114  _dosmaperr(error);
2115  break;
2116  }
2117 #endif
2118  /* OK to retry if interrupted */
2119  if (errno == EINTR)
2120  goto retry;
2121  }
2122 
2123  return returnCode;
2124 }
static void error(void)
Definition: sql-dyntest.c:147
#define FD_TEMP_FILE_LIMIT
Definition: fd.c:184
#define DO_DB(A)
Definition: fd.c:170
void _dosmaperr(unsigned long)
Definition: win32error.c:171
static Vfd * VfdCache
Definition: fd.c:206
int errcode(int sqlerrcode)
Definition: elog.c:610
#define LOG
Definition: elog.h:26
static int fd(const char *x, int i)
Definition: preproc-init.c:105
ssize_t pg_pwrite(int fd, const void *buf, size_t nbyte, off_t offset)
Definition: pwrite.c:27
void pg_usleep(long microsec)
Definition: signal.c:53
#define ERROR
Definition: elog.h:43
static void pgstat_report_wait_end(void)
Definition: pgstat.h:1386
unsigned short fdstate
Definition: fd.c:189
Definition: fd.c:186
off_t fileSize
Definition: fd.c:194
#define FileIsValid(file)
Definition: fd.c:176
static uint64 temporary_files_size
Definition: fd.c:226
#define ereport(elevel,...)
Definition: elog.h:144
static int FileAccess(File file)
Definition: fd.c:1354
#define Assert(condition)
Definition: c.h:745
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: pgstat.h:1362
#define INT64_FORMAT
Definition: c.h:416
int errmsg(const char *fmt,...)
Definition: elog.c:824
#define elog(elevel,...)
Definition: elog.h:214
#define EINTR
Definition: win32_port.h:323
int temp_file_limit
Definition: guc.c:551

◆ FileWriteback()

void FileWriteback ( File  file,
off_t  offset,
off_t  nbytes,
uint32  wait_event_info 
)

Definition at line 1950 of file fd.c.

References Assert, DO_DB, elog, vfd::fd, FileAccess(), FileIsValid, vfd::fileName, INT64_FORMAT, LOG, pg_flush_data(), pgstat_report_wait_end(), and pgstat_report_wait_start().

Referenced by mdwriteback().

1951 {
1952  int returnCode;
1953 
1954  Assert(FileIsValid(file));
1955 
1956  DO_DB(elog(LOG, "FileWriteback: %d (%s) " INT64_FORMAT " " INT64_FORMAT,
1957  file, VfdCache[file].fileName,
1958  (int64) offset, (int64) nbytes));
1959 
1960  if (nbytes <= 0)
1961  return;
1962 
1963  returnCode = FileAccess(file);
1964  if (returnCode < 0)
1965  return;
1966 
1967  pgstat_report_wait_start(wait_event_info);
1968  pg_flush_data(VfdCache[file].fd, offset, nbytes);
1970 }
#define DO_DB(A)
Definition: fd.c:170
static Vfd * VfdCache
Definition: fd.c:206
#define LOG
Definition: elog.h:26
static int fd(const char *x, int i)
Definition: preproc-init.c:105
static void pgstat_report_wait_end(void)
Definition: pgstat.h:1386
void pg_flush_data(int fd, off_t offset, off_t nbytes)
Definition: fd.c:456
#define FileIsValid(file)
Definition: fd.c:176
static int FileAccess(File file)
Definition: fd.c:1354
#define Assert(condition)
Definition: c.h:745
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition: pgstat.h:1362
#define INT64_FORMAT
Definition: c.h:416
#define elog(elevel,...)
Definition: elog.h:214

◆ FreeDir()

int FreeDir ( DIR dir)

Definition at line 2701 of file fd.c.

References AllocateDescDir, closedir(), AllocateDesc::desc, AllocateDesc::dir, DO_DB, elog, FreeDesc(), i, AllocateDesc::kind, LOG, numAllocatedDescs, and WARNING.

Referenced by calculate_database_size(), calculate_tablespace_size(), CheckPointLogicalRewriteHeap(), CheckPointSnapBuild(), CleanupBackupHistory(), copydir(), db_dir_size(), DeleteAllExportedSnapshotFiles(), destroy_tablespace_directories(), directory_is_empty(), do_pg_start_backup(), dsm_cleanup_for_mmap(), extension_file_exists(), get_ext_ver_list(), getInstallationPaths(), movedb(), ParseTzFile(), perform_base_backup(), pg_available_extension_versions(), pg_available_extensions(), pg_logdir_ls_internal(), pg_ls_dir(), pg_ls_dir_files(), pg_tablespace_databases(), pg_tzenumerate_end(), pg_tzenumerate_next(), pgarch_readyXlog(), pgstat_reset_remove_files(), RelationCacheInitFileRemove(), RelationCacheInitFileRemoveInDir(), RemoveNonParentXlogFiles(), RemoveOldXlogFiles(), RemovePgTempFiles(), RemovePgTempFilesInDir(), RemovePgTempRelationFiles(), RemovePgTempRelationFilesInDbspace(), RemoveTempXlogFiles(), ReorderBufferCleanupSerializedTXNs(), ResetUnloggedRelations(), ResetUnloggedRelationsInDbspaceDir(), ResetUnloggedRelationsInTablespaceDir(), restoreTwoPhaseData(), scan_directory_ci(), sendDir(), SlruScanDirectory(), StartupReorderBuffer(), StartupReplicationSlots(), UpdateLogicalMappings(), and walkdir().

2702 {
2703  int i;
2704 
2705  /* Nothing to do if AllocateDir failed */
2706  if (dir == NULL)
2707  return 0;
2708 
2709  DO_DB(elog(LOG, "FreeDir: Allocated %d", numAllocatedDescs));
2710 
2711  /* Remove dir from list of allocated dirs, if it's present */
2712  for (i = numAllocatedDescs; --i >= 0;)
2713  {
2714  AllocateDesc *desc = &allocatedDescs[i];
2715 
2716  if (desc->kind == AllocateDescDir && desc->desc.dir == dir)
2717  return FreeDesc(desc);
2718  }
2719 
2720  /* Only get here if someone passes us a dir not in allocatedDescs */
2721  elog(WARNING, "dir passed to FreeDir was not obtained from AllocateDir");
2722 
2723  return closedir(dir);
2724 }
static AllocateDesc * allocatedDescs
Definition: fd.c:254
DIR * dir
Definition: fd.c:247
#define DO_DB(A)
Definition: fd.c:170
int closedir(DIR *)
Definition: dirent.c:123
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static int FreeDesc(AllocateDesc *desc)
Definition: fd.c:2482
#define WARNING
Definition: elog.h:40
union AllocateDesc::@25 desc
#define elog(elevel,...)
Definition: elog.h:214
int i
static int numAllocatedDescs
Definition: fd.c:252

◆ FreeFile()

int FreeFile ( FILE *  file)

Definition at line 2521 of file fd.c.

References AllocateDescFile, AllocateDesc::desc, DO_DB, elog, AllocateDesc::file, FreeDesc(), i, AllocateDesc::kind, LOG, numAllocatedDescs, and WARNING.

Referenced by _ShowOption(), AlterSystemSetConfigFile(), apw_dump_now(), apw_load_buffers(), BackendRun(), checkControlFile(), do_pg_start_backup(), do_pg_stop_backup(), EndCopy(), entry_reset(), existsTimeLineHistory(), ExportSnapshot(), fill_hba_view(), gc_qtexts(), ImportSnapshot(), load_dh_file(), load_hba(), load_ident(), load_relcache_init_file(), parse_extension_control_file(), ParseTzFile(), pg_backup_start_time(), pg_current_logfile(), pg_file_write_internal(), pg_promote(), PGSharedMemoryAttach(), pgss_shmem_shutdown(), pgss_shmem_startup(), pgstat_read_db_statsfile(), pgstat_read_db_statsfile_timestamp(), pgstat_read_statsfiles(), pgstat_write_db_statsfile(), pgstat_write_statsfiles(), PostmasterMarkPIDForWorkerNotify(), read_backup_label(), read_binary_file(), read_tablespace_map(), read_whole_file(), readTimeLineHistory(), tokenize_inc_file(), tsearch_readline_end(), ValidatePgVersion(), write_relcache_init_file(), XLogArchiveForceDone(), and XLogArchiveNotify().

2522 {
2523  int i;
2524 
2525  DO_DB(elog(LOG, "FreeFile: Allocated %d", numAllocatedDescs));
2526 
2527  /* Remove file from list of allocated files, if it's present */
2528  for (i = numAllocatedDescs; --i >= 0;)
2529  {
2530  AllocateDesc *desc = &allocatedDescs[i];
2531 
2532  if (desc->kind == AllocateDescFile && desc->desc.file == file)
2533  return FreeDesc(desc);
2534  }
2535 
2536  /* Only get here if someone passes us a file not in allocatedDescs */
2537  elog(WARNING, "file passed to FreeFile was not obtained from AllocateFile");
2538 
2539  return fclose(file);
2540 }
static AllocateDesc * allocatedDescs
Definition: fd.c:254
#define DO_DB(A)
Definition: fd.c:170
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static int FreeDesc(AllocateDesc *desc)
Definition: fd.c:2482
#define WARNING
Definition: elog.h:40
FILE * file
Definition: fd.c:246
union AllocateDesc::@25 desc
#define elog(elevel,...)
Definition: elog.h:214
int i
static int numAllocatedDescs
Definition: fd.c:252

◆ fsync_fname()

void fsync_fname ( const char *  fname,
bool  isdir 
)

Definition at line 633 of file fd.c.

References data_sync_elevel(), ERROR, and fsync_fname_ext().

Referenced by _CloseArchive(), CheckPointTwoPhase(), copydir(), CreateSlotOnDisk(), dir_close(), dir_finish(), dir_open_for_write(), main(), ReplicationSlotDropPtr(), ResetUnloggedRelationsInDbspaceDir(), RestoreSlotFromDisk(), SaveSlotToPath(), SimpleLruWriteAll(), SnapBuildRestore(), SnapBuildSerialize(), StartupReplicationSlots(), and tar_finish().

634 {
635  fsync_fname_ext(fname, isdir, false, data_sync_elevel(ERROR));
636 }
#define ERROR
Definition: elog.h:43
int data_sync_elevel(int elevel)
Definition: fd.c:3603
int fsync_fname_ext(const char *fname, bool isdir, bool ignore_perm, int elevel)
Definition: fd.c:3464

◆ fsync_fname_ext()

int fsync_fname_ext ( const char *  fname,
bool  isdir,
bool  ignore_perm,
int  elevel 
)

Definition at line 3464 of file fd.c.

References CloseTransientFile(), ereport, errcode_for_file_access(), errmsg(), vfd::fd, OpenTransientFile(), PG_BINARY, and pg_fsync().

Referenced by datadir_fsync_fname(), durable_rename(), durable_rename_excl(), fsync_fname(), fsync_parent_path(), and pg_file_sync().

3465 {
3466  int fd;
3467  int flags;
3468  int returncode;
3469 
3470  /*
3471  * Some OSs require directories to be opened read-only whereas other
3472  * systems don't allow us to fsync files opened read-only; so we need both
3473  * cases here. Using O_RDWR will cause us to fail to fsync files that are
3474  * not writable by our userid, but we assume that's OK.
3475  */
3476  flags = PG_BINARY;
3477  if (!isdir)
3478  flags |= O_RDWR;
3479  else
3480  flags |= O_RDONLY;
3481 
3482  fd = OpenTransientFile(fname, flags);
3483 
3484  /*
3485  * Some OSs don't allow us to open directories at all (Windows returns
3486  * EACCES), just ignore the error in that case. If desired also silently
3487  * ignoring errors about unreadable files. Log others.
3488  */
3489  if (fd < 0 && isdir && (errno == EISDIR || errno == EACCES))
3490  return 0;
3491  else if (fd < 0 && ignore_perm && errno == EACCES)
3492  return 0;
3493  else if (fd < 0)
3494  {
3495  ereport(elevel,
3497  errmsg("could not open file \"%s\": %m", fname)));
3498  return -1;
3499  }
3500 
3501  returncode = pg_fsync(fd);
3502 
3503  /*
3504  * Some OSes don't allow us to fsync directories at all, so we can ignore
3505  * those errors. Anything else needs to be logged.
3506  */
3507  if (returncode != 0 && !(isdir && (errno == EBADF || errno == EINVAL)))
3508  {
3509  int save_errno;
3510 
3511  /* close file upon error, might not be in transaction context */
3512  save_errno = errno;
3513  (void) CloseTransientFile(fd);
3514  errno = save_errno;
3515 
3516  ereport(elevel,
3518  errmsg("could not fsync file \"%s\": %m", fname)));
3519  return -1;
3520  }
3521 
3522  if (CloseTransientFile(fd) != 0)
3523  {
3524  ereport(elevel,
3526  errmsg("could not close file \"%s\": %m", fname)));
3527  return -1;
3528  }
3529 
3530  return 0;
3531 }
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define PG_BINARY
Definition: c.h:1211
int OpenTransientFile(const char *fileName, int fileFlags)
Definition: fd.c:2372
int errcode_for_file_access(void)
Definition: elog.c:633
int CloseTransientFile(int fd)
Definition: fd.c:2549
static int elevel
Definition: vacuumlazy.c:333
#define ereport(elevel,...)
Definition: elog.h:144
int errmsg(const char *fmt,...)
Definition: elog.c:824
int pg_fsync(int fd)
Definition: fd.c:346

◆ GetNextTempTableSpace()

Oid GetNextTempTableSpace ( void  )

Definition at line 2850 of file fd.c.

References InvalidOid, nextTempTableSpace, numTempTableSpaces, and tempTableSpaces.

Referenced by GetDefaultTablespace(), and OpenTemporaryFile().

2851 {
2852  if (numTempTableSpaces > 0)
2853  {
2854  /* Advance nextTempTableSpace counter with wraparound */
2856  nextTempTableSpace = 0;
2858  }
2859  return InvalidOid;
2860 }
static int numTempTableSpaces
Definition: fd.c:274
static int nextTempTableSpace
Definition: fd.c:275
#define InvalidOid
Definition: postgres_ext.h:36
static Oid * tempTableSpaces
Definition: fd.c:273

◆ GetTempTablespaces()

int GetTempTablespaces ( Oid tableSpaces,
int  numSpaces 
)

Definition at line 2832 of file fd.c.

References Assert, i, numTempTableSpaces, tempTableSpaces, and TempTablespacesAreSet().

Referenced by SharedFileSetInit().

2833 {
2834  int i;
2835 
2837  for (i = 0; i < numTempTableSpaces && i < numSpaces; ++i)
2838  tableSpaces[i] = tempTableSpaces[i];
2839 
2840  return i;
2841 }
static int numTempTableSpaces
Definition: fd.c:274
bool TempTablespacesAreSet(void)
Definition: fd.c:2817
#define Assert(condition)
Definition: c.h:745
static Oid * tempTableSpaces
Definition: fd.c:273
int i

◆ InitFileAccess()

void InitFileAccess ( void  )

Definition at line 826 of file fd.c.

References Assert, AtProcExit_Files(), ereport, errcode(), errmsg(), FATAL, vfd::fd, malloc, MemSet, on_proc_exit(), SizeVfdCache, and VFD_CLOSED.

Referenced by BaseInit().

827 {
828  Assert(SizeVfdCache == 0); /* call me only once */
829 
830  /* initialize cache header entry */
831  VfdCache = (Vfd *) malloc(sizeof(Vfd));
832  if (VfdCache == NULL)
833  ereport(FATAL,
834  (errcode(ERRCODE_OUT_OF_MEMORY),
835  errmsg("out of memory")));
836 
837  MemSet((char *) &(VfdCache[0]), 0, sizeof(Vfd));
839 
840  SizeVfdCache = 1;
841 
842  /* register proc-exit hook to ensure temp files are dropped at exit */
844 }
static void AtProcExit_Files(int code, Datum arg)
Definition: fd.c:2918
static Size SizeVfdCache
Definition: fd.c:207
void on_proc_exit(pg_on_exit_callback function, Datum arg)
Definition: ipc.c:305
static Vfd * VfdCache
Definition: fd.c:206
int errcode(int sqlerrcode)
Definition: elog.c:610
#define MemSet(start, val, len)
Definition: c.h:949
#define malloc(a)
Definition: header.h:50
#define FATAL
Definition: elog.h:52
Definition: fd.c:186
int fd
Definition: fd.c:188
#define VFD_CLOSED
Definition: fd.c:174
#define ereport(elevel,...)
Definition: elog.h:144
#define Assert(condition)
Definition: c.h:745
int errmsg(const char *fmt,...)
Definition: elog.c:824

◆ looks_like_temp_rel_name()

bool looks_like_temp_rel_name ( const char *  name)

Definition at line 3187 of file fd.c.

References forkname_chars().

Referenced by RemovePgTempRelationFilesInDbspace(), and sendDir().

3188 {
3189  int pos;
3190  int savepos;
3191 
3192  /* Must start with "t". */
3193  if (name[0] != 't')
3194  return false;
3195 
3196  /* Followed by a non-empty string of digits and then an underscore. */
3197  for (pos = 1; isdigit((unsigned char) name[pos]); ++pos)
3198  ;
3199  if (pos == 1 || name[pos] != '_')
3200  return false;
3201 
3202  /* Followed by another nonempty string of digits. */
3203  for (savepos = ++pos; isdigit((unsigned char) name[pos]); ++pos)
3204  ;
3205  if (savepos == pos)
3206  return false;
3207 
3208  /* We might have _forkname or .segment or both. */
3209  if (name[pos] == '_')
3210  {
3211  int forkchar = forkname_chars(&name[pos + 1], NULL);
3212 
3213  if (forkchar <= 0)
3214  return false;
3215  pos += forkchar + 1;
3216  }
3217  if (name[pos] == '.')
3218  {
3219  int segchar;
3220 
3221  for (segchar = 1; isdigit((unsigned char) name[pos + segchar]); ++segchar)
3222  ;
3223  if (segchar <= 1)
3224  return false;
3225  pos += segchar;
3226  }
3227 
3228  /* Now we should be at the end. */
3229  if (name[pos] != '\0')
3230  return false;
3231  return true;
3232 }
int forkname_chars(const char *str, ForkNumber *fork)
Definition: relpath.c:81
const char * name
Definition: encode.c:561

◆ MakePGDirectory()

int MakePGDirectory ( const char *  directoryName)

◆ OpenPipeStream()

FILE* OpenPipeStream ( const char *  command,
const char *  mode 
)

Definition at line 2425 of file fd.c.

References AllocateDescPipe, AllocateDesc::create_subid, AllocateDesc::desc, DO_DB, elog, ereport, errcode(), errmsg(), ERROR, AllocateDesc::file, GetCurrentSubTransactionId(), AllocateDesc::kind, LOG, maxAllocatedDescs, numAllocatedDescs, pqsignal(), ReleaseLruFile(), ReleaseLruFiles(), reserveAllocatedDesc(), SIG_DFL, SIG_IGN, SIGPIPE, and generate_unaccent_rules::stdout.

Referenced by BeginCopyFrom(), BeginCopyTo(), pg_import_system_collations(), and run_ssl_passphrase_command().

2426 {
2427  FILE *file;
2428  int save_errno;
2429 
2430  DO_DB(elog(LOG, "OpenPipeStream: Allocated %d (%s)",
2431  numAllocatedDescs, command));
2432 
2433  /* Can we allocate another non-virtual FD? */
2434  if (!reserveAllocatedDesc())
2435  ereport(ERROR,
2436  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
2437  errmsg("exceeded maxAllocatedDescs (%d) while trying to execute command \"%s\"",
2438  maxAllocatedDescs, command)));
2439 
2440  /* Close excess kernel FDs. */
2441  ReleaseLruFiles();
2442 
2443 TryAgain:
2444  fflush(stdout);
2445  fflush(stderr);
2447  errno = 0;
2448  file = popen(command, mode);
2449  save_errno = errno;
2451  errno = save_errno;
2452  if (file != NULL)
2453  {
2455 
2456  desc->kind = AllocateDescPipe;
2457  desc->desc.file = file;
2460  return desc->desc.file;
2461  }
2462 
2463  if (errno == EMFILE || errno == ENFILE)
2464  {
2465  ereport(LOG,
2466  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
2467  errmsg("out of file descriptors: %m; release and retry")));
2468  if (ReleaseLruFile())
2469  goto TryAgain;
2470  errno = save_errno;
2471  }
2472 
2473  return NULL;
2474 }
static PgChecksumMode mode
Definition: pg_checksums.c:61
static AllocateDesc * allocatedDescs
Definition: fd.c:254
#define DO_DB(A)
Definition: fd.c:170
int errcode(int sqlerrcode)
Definition: elog.c:610
static bool reserveAllocatedDesc(void)
Definition: fd.c:2247
#define SIGPIPE
Definition: win32_port.h:158
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static bool ReleaseLruFile(void)
Definition: fd.c:1244
#define ERROR
Definition: elog.h:43
#define SIG_IGN
Definition: win32_port.h:150
static void ReleaseLruFiles(void)
Definition: fd.c:1266
FILE * file
Definition: fd.c:246
#define ereport(elevel,...)
Definition: elog.h:144
pqsigfunc pqsignal(int signum, pqsigfunc handler)
Definition: signal.c:170
#define SIG_DFL
Definition: win32_port.h:148
SubTransactionId GetCurrentSubTransactionId(void)
Definition: xact.c:723
SubTransactionId create_subid
Definition: fd.c:243
union AllocateDesc::@25 desc
int errmsg(const char *fmt,...)
Definition: elog.c:824
#define elog(elevel,...)
Definition: elog.h:214
static int maxAllocatedDescs
Definition: fd.c:253
static int numAllocatedDescs
Definition: fd.c:252

◆ OpenTemporaryFile()

File OpenTemporaryFile ( bool  interXact)

Definition at line 1578 of file fd.c.

References CurrentResourceOwner, FD_DELETE_AT_CLOSE, FD_TEMP_FILE_LIMIT, vfd::fdstate, GetNextTempTableSpace(), MyDatabaseTableSpace, numTempTableSpaces, OidIsValid, OpenTemporaryFileInTablespace(), RegisterTemporaryFile(), and ResourceOwnerEnlargeFiles().

Referenced by BufFileCreateTemp(), and extendBufFile().

1579 {
1580  File file = 0;
1581 
1582  /*
1583  * Make sure the current resource owner has space for this File before we
1584  * open it, if we'll be registering it below.
1585  */
1586  if (!interXact)
1588 
1589  /*
1590  * If some temp tablespace(s) have been given to us, try to use the next
1591  * one. If a given tablespace can't be found, we silently fall back to
1592  * the database's default tablespace.
1593  *
1594  * BUT: if the temp file is slated to outlive the current transaction,
1595  * force it into the database's default tablespace, so that it will not
1596  * pose a threat to possible tablespace drop attempts.
1597  */
1598  if (numTempTableSpaces > 0 && !interXact)
1599  {
1600  Oid tblspcOid = GetNextTempTableSpace();
1601 
1602  if (OidIsValid(tblspcOid))
1603  file = OpenTemporaryFileInTablespace(tblspcOid, false);
1604  }
1605 
1606  /*
1607  * If not, or if tablespace is bad, create in database's default
1608  * tablespace. MyDatabaseTableSpace should normally be set before we get
1609  * here, but just in case it isn't, fall back to pg_default tablespace.
1610  */
1611  if (file <= 0)
1614  DEFAULTTABLESPACE_OID,
1615  true);
1616 
1617  /* Mark it for deletion at close and temporary file size limit */
1619 
1620  /* Register it with the current resource owner */
1621  if (!interXact)
1622  RegisterTemporaryFile(file);
1623 
1624  return file;
1625 }
static File OpenTemporaryFileInTablespace(Oid tblspcOid, bool rejectError)
Definition: fd.c:1656
#define FD_TEMP_FILE_LIMIT
Definition: fd.c:184
ResourceOwner CurrentResourceOwner
Definition: resowner.c:142
#define FD_DELETE_AT_CLOSE
Definition: fd.c:182
static Vfd * VfdCache
Definition: fd.c:206
static int numTempTableSpaces
Definition: fd.c:274
unsigned int Oid
Definition: postgres_ext.h:31
#define OidIsValid(objectId)
Definition: c.h:651
Oid MyDatabaseTableSpace
Definition: globals.c:87
Oid GetNextTempTableSpace(void)
Definition: fd.c:2850
unsigned short fdstate
Definition: fd.c:189
static void RegisterTemporaryFile(File file)
Definition: fd.c:1409
void ResourceOwnerEnlargeFiles(ResourceOwner owner)
Definition: resowner.c:1257
int File
Definition: fd.h:49

◆ OpenTransientFile()

◆ OpenTransientFilePerm()

int OpenTransientFilePerm ( const char *  fileName,
int  fileFlags,
mode_t  fileMode 
)

Definition at line 2381 of file fd.c.

References AllocateDescRawFD, BasicOpenFilePerm(), AllocateDesc::create_subid, AllocateDesc::desc, DO_DB, elog, ereport, errcode(), errmsg(), ERROR, vfd::fd, AllocateDesc::fd, GetCurrentSubTransactionId(), AllocateDesc::kind, LOG, maxAllocatedDescs, numAllocatedDescs, ReleaseLruFiles(), and reserveAllocatedDesc().

Referenced by be_lo_export(), and OpenTransientFile().

2382 {
2383  int fd;
2384 
2385  DO_DB(elog(LOG, "OpenTransientFile: Allocated %d (%s)",
2386  numAllocatedDescs, fileName));
2387 
2388  /* Can we allocate another non-virtual FD? */
2389  if (!reserveAllocatedDesc())
2390  ereport(ERROR,
2391  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
2392  errmsg("exceeded maxAllocatedDescs (%d) while trying to open file \"%s\"",
2393  maxAllocatedDescs, fileName)));
2394 
2395  /* Close excess kernel FDs. */
2396  ReleaseLruFiles();
2397 
2398  fd = BasicOpenFilePerm(fileName, fileFlags, fileMode);
2399 
2400  if (fd >= 0)
2401  {
2403 
2404  desc->kind = AllocateDescRawFD;
2405  desc->desc.fd = fd;
2408 
2409  return fd;
2410  }
2411 
2412  return -1; /* failure */
2413 }
static AllocateDesc * allocatedDescs
Definition: fd.c:254
#define DO_DB(A)
Definition: fd.c:170
int errcode(int sqlerrcode)
Definition: elog.c:610
static bool reserveAllocatedDesc(void)
Definition: fd.c:2247
#define LOG
Definition: elog.h:26
AllocateDescKind kind
Definition: fd.c:242
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define ERROR
Definition: elog.h:43
static void ReleaseLruFiles(void)
Definition: fd.c:1266
#define ereport(elevel,...)
Definition: elog.h:144
SubTransactionId GetCurrentSubTransactionId(void)
Definition: xact.c:723
SubTransactionId create_subid
Definition: fd.c:243
int fd
Definition: fd.c:248
union AllocateDesc::@25 desc
int errmsg(const char *fmt,...)
Definition: elog.c:824
int BasicOpenFilePerm(const char *fileName, int fileFlags, mode_t fileMode)
Definition: fd.c:1008
#define elog(elevel,...)
Definition: elog.h:214
static int maxAllocatedDescs
Definition: fd.c:253
static int numAllocatedDescs
Definition: fd.c:252

◆ PathNameCreateTemporaryDir()

void PathNameCreateTemporaryDir ( const char *  base,
const char *  name 
)

Definition at line 1514 of file fd.c.

References ereport, errcode_for_file_access(), errmsg(), ERROR, and MakePGDirectory().

Referenced by SharedFileSetCreate().

1515 {
1516  if (MakePGDirectory(directory) < 0)
1517  {
1518  if (errno == EEXIST)
1519  return;
1520 
1521  /*
1522  * Failed. Try to create basedir first in case it's missing. Tolerate
1523  * EEXIST to close a race against another process following the same
1524  * algorithm.
1525  */
1526  if (MakePGDirectory(basedir) < 0 && errno != EEXIST)
1527  ereport(ERROR,
1529  errmsg("cannot create temporary directory \"%s\": %m",
1530  basedir)));
1531 
1532  /* Try again. */
1533  if (MakePGDirectory(directory) < 0 && errno != EEXIST)
1534  ereport(ERROR,
1536  errmsg("cannot create temporary subdirectory \"%s\": %m",
1537  directory)));
1538  }
1539 }
static char * basedir
#define ERROR
Definition: elog.h:43
int errcode_for_file_access(void)
Definition: elog.c:633
#define ereport(elevel,...)
Definition: elog.h:144
int MakePGDirectory(const char *directoryName)
Definition: fd.c:3580
static const char * directory
Definition: zic.c:634
int errmsg(const char *fmt,...)
Definition: elog.c:824

◆ PathNameCreateTemporaryFile()

File PathNameCreateTemporaryFile ( const char *  name,
bool  error_on_failure 
)

Definition at line 1713 of file fd.c.

References CurrentResourceOwner, ereport, errcode_for_file_access(), errmsg(), ERROR, FD_TEMP_FILE_LIMIT, vfd::fdstate, PathNameOpenFile(), PG_BINARY, RegisterTemporaryFile(), and ResourceOwnerEnlargeFiles().

Referenced by SharedFileSetCreate().

1714 {
1715  File file;
1716 
1718 
1719  /*
1720  * Open the file. Note: we don't use O_EXCL, in case there is an orphaned
1721  * temp file that can be reused.
1722  */
1723  file = PathNameOpenFile(path, O_RDWR | O_CREAT | O_TRUNC | PG_BINARY);
1724  if (file <= 0)
1725  {
1726  if (error_on_failure)
1727  ereport(ERROR,
1729  errmsg("could not create temporary file \"%s\": %m",
1730  path)));
1731  else
1732  return file;
1733  }
1734 
1735  /* Mark it for temp_file_limit accounting. */
1737 
1738  /* Register it for automatic close. */
1739  RegisterTemporaryFile(file);
1740 
1741  return file;
1742 }
File PathNameOpenFile(const char *fileName, int fileFlags)
Definition: fd.c:1437
#define FD_TEMP_FILE_LIMIT
Definition: fd.c:184
ResourceOwner CurrentResourceOwner
Definition: resowner.c:142
static Vfd * VfdCache
Definition: fd.c:206
#define PG_BINARY
Definition: c.h:1211
#define ERROR
Definition: elog.h:43
int errcode_for_file_access(void)
Definition: elog.c:633
unsigned short fdstate
Definition: fd.c:189
#define ereport(elevel,...)
Definition: elog.h:144
static void RegisterTemporaryFile(File file)
Definition: fd.c:1409
int errmsg(const char *fmt,...)
Definition: elog.c:824
void ResourceOwnerEnlargeFiles(ResourceOwner owner)
Definition: resowner.c:1257
int File
Definition: fd.h:49

◆ PathNameDeleteTemporaryDir()

void PathNameDeleteTemporaryDir ( const char *  name)

Definition at line 1545 of file fd.c.

References LOG, stat, unlink_if_exists_fname(), and walkdir().

Referenced by SharedFileSetDeleteAll().

1546 {
1547  struct stat statbuf;
1548 
1549  /* Silently ignore missing directory. */
1550  if (stat(dirname, &statbuf) != 0 && errno == ENOENT)
1551  return;
1552 
1553  /*
1554  * Currently, walkdir doesn't offer a way for our passed in function to
1555  * maintain state. Perhaps it should, so that we could tell the caller
1556  * whether this operation succeeded or failed. Since this operation is
1557  * used in a cleanup path, we wouldn't actually behave differently: we'll
1558  * just log failures.
1559  */
1560  walkdir(dirname, unlink_if_exists_fname, false, LOG);
1561 }
static void walkdir(const char *path, void(*action)(const char *fname, bool isdir, int elevel), bool process_symlinks, int elevel)
Definition: fd.c:3331
#define LOG
Definition: elog.h:26
static void unlink_if_exists_fname(const char *fname, bool isdir, int elevel)
Definition: fd.c:3439
#define stat(a, b)
Definition: win32_port.h:255

◆ PathNameDeleteTemporaryFile()

bool PathNameDeleteTemporaryFile ( const char *  name,
bool  error_on_failure 
)

Definition at line 1780 of file fd.c.

References ereport, errcode_for_file_access(), errmsg(), ERROR, LOG, ReportTemporaryFileUsage(), and stat.

Referenced by SharedFileSetDelete(), and unlink_if_exists_fname().

1781 {
1782  struct stat filestats;
1783  int stat_errno;
1784 
1785  /* Get the final size for pgstat reporting. */
1786  if (stat(path, &filestats) != 0)
1787  stat_errno = errno;
1788  else
1789  stat_errno = 0;
1790 
1791  /*
1792  * Unlike FileClose's automatic file deletion code, we tolerate
1793  * non-existence to support BufFileDeleteShared which doesn't know how
1794  * many segments it has to delete until it runs out.
1795  */
1796  if (stat_errno == ENOENT)
1797  return false;
1798 
1799  if (unlink(path) < 0)
1800  {
1801  if (errno != ENOENT)
1802  ereport(error_on_failure ? ERROR : LOG,
1804  errmsg("could not unlink temporary file \"%s\": %m",
1805  path)));
1806  return false;
1807  }
1808 
1809  if (stat_errno == 0)
1810  ReportTemporaryFileUsage(path, filestats.st_size);
1811  else
1812  {
1813  errno = stat_errno;
1814  ereport(LOG,
1816  errmsg("could not stat file \"%s\": %m", path)));
1817  }
1818 
1819  return true;
1820 }
#define LOG
Definition: elog.h:26
#define ERROR
Definition: elog.h:43
int errcode_for_file_access(void)
Definition: elog.c:633
static void ReportTemporaryFileUsage(const char *path, off_t size)
Definition: fd.c:1390
#define stat(a, b)
Definition: win32_port.h:255
#define ereport(elevel,...)
Definition: elog.h:144
int errmsg(const char *fmt,...)
Definition: elog.c:824

◆ PathNameOpenFile()

File PathNameOpenFile ( const char *  fileName,
int  fileFlags 
)

Definition at line 1437 of file fd.c.

References PathNameOpenFilePerm(), and pg_file_create_mode.

Referenced by _mdfd_openseg(), logical_rewrite_log_mapping(), mdcreate(), mdopenfork(), mdsyncfiletag(), OpenTemporaryFileInTablespace(), PathNameCreateTemporaryFile(), PathNameOpenTemporaryFile(), and ReorderBufferRestoreChanges().

1438 {
1439  return PathNameOpenFilePerm(fileName, fileFlags, pg_file_create_mode);
1440 }
File PathNameOpenFilePerm(const char *fileName, int fileFlags, mode_t fileMode)
Definition: fd.c:1450
int pg_file_create_mode
Definition: file_perm.c:19

◆ PathNameOpenFilePerm()

File PathNameOpenFilePerm ( const char *  fileName,
int  fileFlags,
mode_t  fileMode 
)

Definition at line 1450 of file fd.c.

References AllocateVfd(), BasicOpenFilePerm(), DO_DB, elog, ereport, errcode(), errmsg(), ERROR, vfd::fd, vfd::fdstate, vfd::fileFlags, vfd::fileMode, vfd::fileName, vfd::fileSize, free, FreeVfd(), Insert(), LOG, nfile, ReleaseLruFiles(), and vfd::resowner.

Referenced by PathNameOpenFile().

1451 {
1452  char *fnamecopy;
1453  File file;
1454  Vfd *vfdP;
1455 
1456  DO_DB(elog(LOG, "PathNameOpenFilePerm: %s %x %o",
1457  fileName, fileFlags, fileMode));
1458 
1459  /*
1460  * We need a malloc'd copy of the file name; fail cleanly if no room.
1461  */
1462  fnamecopy = strdup(fileName);
1463  if (fnamecopy == NULL)
1464  ereport(ERROR,
1465  (errcode(ERRCODE_OUT_OF_MEMORY),
1466  errmsg("out of memory")));
1467 
1468  file = AllocateVfd();
1469  vfdP = &VfdCache[file];
1470 
1471  /* Close excess kernel FDs. */
1472  ReleaseLruFiles();
1473 
1474  vfdP->fd = BasicOpenFilePerm(fileName, fileFlags, fileMode);
1475 
1476  if (vfdP->fd < 0)
1477  {
1478  int save_errno = errno;
1479 
1480  FreeVfd(file);
1481  free(fnamecopy);
1482  errno = save_errno;
1483  return -1;
1484  }
1485  ++nfile;
1486  DO_DB(elog(LOG, "PathNameOpenFile: success %d",
1487  vfdP->fd));
1488 
1489  Insert(file);
1490 
1491  vfdP->fileName = fnamecopy;
1492  /* Saved flags are adjusted to be OK for re-opening file */
1493  vfdP->fileFlags = fileFlags & ~(O_CREAT | O_TRUNC | O_EXCL);
1494  vfdP->fileMode = fileMode;
1495  vfdP->fileSize = 0;
1496  vfdP->fdstate = 0x0;
1497  vfdP->resowner = NULL;
1498 
1499  return file;
1500 }
#define DO_DB(A)
Definition: fd.c:170
static Vfd * VfdCache
Definition: fd.c:206
int errcode(int sqlerrcode)
Definition: elog.c:610
#define LOG
Definition: elog.h:26
mode_t fileMode
Definition: fd.c:198
#define ERROR
Definition: elog.h:43
char * fileName
Definition: fd.c:195
static int nfile
Definition: fd.c:212
static File AllocateVfd(void)
Definition: fd.c:1276
unsigned short fdstate
Definition: fd.c:189
Definition: fd.c:186
off_t fileSize
Definition: fd.c:194
int fd
Definition: fd.c:188
static void Insert(File file)
Definition: fd.c:1175
ResourceOwner resowner
Definition: fd.c:190
static void ReleaseLruFiles(void)
Definition: fd.c:1266
#define ereport(elevel,...)
Definition: elog.h:144
#define free(a)
Definition: header.h:65
int errmsg(const char *fmt,...)
Definition: elog.c:824
int BasicOpenFilePerm(const char *fileName, int fileFlags, mode_t fileMode)
Definition: fd.c:1008
#define elog(elevel,...)
Definition: elog.h:214
static void FreeVfd(File file)
Definition: fd.c:1334
int fileFlags
Definition: fd.c:197
int File
Definition: fd.h:49

◆ PathNameOpenTemporaryFile()

File PathNameOpenTemporaryFile ( const char *  path,
int  mode 
)

Definition at line 1751 of file fd.c.

References CurrentResourceOwner, ereport, errcode_for_file_access(), errmsg(), ERROR, PathNameOpenFile(), PG_BINARY, RegisterTemporaryFile(), and ResourceOwnerEnlargeFiles().

Referenced by SharedFileSetOpen().

1752 {
1753  File file;
1754 
1756 
1757  file = PathNameOpenFile(path, mode | PG_BINARY);
1758 
1759  /* If no such file, then we don't raise an error. */
1760  if (file <= 0 && errno != ENOENT)
1761  ereport(ERROR,
1763  errmsg("could not open temporary file \"%s\": %m",
1764  path)));
1765 
1766  if (file > 0)
1767  {
1768  /* Register it for automatic close. */
1769  RegisterTemporaryFile(file);
1770  }
1771 
1772  return file;
1773 }
static PgChecksumMode mode
Definition: pg_checksums.c:61
File PathNameOpenFile(const char *fileName, int fileFlags)
Definition: fd.c:1437
ResourceOwner CurrentResourceOwner
Definition: resowner.c:142
#define PG_BINARY
Definition: c.h:1211
#define ERROR
Definition: elog.h:43
int errcode_for_file_access(void)
Definition: elog.c:633
#define ereport(elevel,...)
Definition: elog.h:144
static void RegisterTemporaryFile(File file)
Definition: fd.c:1409
int errmsg(const char *fmt,...)
Definition: elog.c:824
void ResourceOwnerEnlargeFiles(ResourceOwner owner)
Definition: resowner.c:1257
int File
Definition: fd.h:49

◆ pg_fdatasync()

int pg_fdatasync ( int  fd)

Definition at line 436 of file fd.c.

References enableFsync, and fsync.

Referenced by issue_xlog_fsync().

437 {
438  if (enableFsync)
439  {
440 #ifdef HAVE_FDATASYNC
441  return fdatasync(fd);
442 #else
443  return fsync(fd);
444 #endif
445  }
446  else
447  return 0;
448 }
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define fsync(fd)
Definition: win32_port.h:62
bool enableFsync
Definition: globals.c:119

◆ pg_flush_data()

void pg_flush_data ( int  fd,
off_t  offset,
off_t  amount 
)

Definition at line 456 of file fd.c.

References data_sync_elevel(), elevel, enableFsync, ereport, errcode_for_file_access(), errmsg(), FATAL, MAP_FAILED, and WARNING.

Referenced by copy_file(), FileWriteback(), and walkdir().

457 {
458  /*
459  * Right now file flushing is primarily used to avoid making later
460  * fsync()/fdatasync() calls have less impact. Thus don't trigger flushes
461  * if fsyncs are disabled - that's a decision we might want to make
462  * configurable at some point.
463  */
464  if (!enableFsync)
465  return;
466 
467  /*
468  * We compile all alternatives that are supported on the current platform,
469  * to find portability problems more easily.
470  */
471 #if defined(HAVE_SYNC_FILE_RANGE)
472  {
473  int rc;
474  static bool not_implemented_by_kernel = false;
475 
476  if (not_implemented_by_kernel)
477  return;
478 
479  /*
480  * sync_file_range(SYNC_FILE_RANGE_WRITE), currently linux specific,
481  * tells the OS that writeback for the specified blocks should be
482  * started, but that we don't want to wait for completion. Note that
483  * this call might block if too much dirty data exists in the range.
484  * This is the preferable method on OSs supporting it, as it works
485  * reliably when available (contrast to msync()) and doesn't flush out
486  * clean data (like FADV_DONTNEED).
487  */
488  rc = sync_file_range(fd, offset, nbytes,
489  SYNC_FILE_RANGE_WRITE);
490  if (rc != 0)
491  {
492  int elevel;
493 
494  /*
495  * For systems that don't have an implementation of
496  * sync_file_range() such as Windows WSL, generate only one
497  * warning and then suppress all further attempts by this process.
498  */
499  if (errno == ENOSYS)
500  {
501  elevel = WARNING;
502  not_implemented_by_kernel = true;
503  }
504  else
505  elevel = data_sync_elevel(WARNING);
506 
507  ereport(elevel,
509  errmsg("could not flush dirty data: %m")));
510  }
511 
512  return;
513  }
514 #endif
515 #if !defined(WIN32) && defined(MS_ASYNC)
516  {
517  void *p;
518  static int pagesize = 0;
519 
520  /*
521  * On several OSs msync(MS_ASYNC) on a mmap'ed file triggers
522  * writeback. On linux it only does so if MS_SYNC is specified, but
523  * then it does the writeback synchronously. Luckily all common linux
524  * systems have sync_file_range(). This is preferable over
525  * FADV_DONTNEED because it doesn't flush out clean data.
526  *
527  * We map the file (mmap()), tell the kernel to sync back the contents
528  * (msync()), and then remove the mapping again (munmap()).
529  */
530 
531  /* mmap() needs actual length if we want to map whole file */
532  if (offset == 0 && nbytes == 0)
533  {
534  nbytes = lseek(fd, 0, SEEK_END);
535  if (nbytes < 0)
536  {
539  errmsg("could not determine dirty data size: %m")));
540  return;
541  }
542  }
543 
544  /*
545  * Some platforms reject partial-page mmap() attempts. To deal with
546  * that, just truncate the request to a page boundary. If any extra
547  * bytes don't get flushed, well, it's only a hint anyway.
548  */
549 
550  /* fetch pagesize only once */
551  if (pagesize == 0)
552  pagesize = sysconf(_SC_PAGESIZE);
553 
554  /* align length to pagesize, dropping any fractional page */
555  if (pagesize > 0)
556  nbytes = (nbytes / pagesize) * pagesize;
557 
558  /* fractional-page request is a no-op */
559  if (nbytes <= 0)
560  return;
561 
562  /*
563  * mmap could well fail, particularly on 32-bit platforms where there
564  * may simply not be enough address space. If so, silently fall
565  * through to the next implementation.
566  */
567  if (nbytes <= (off_t) SSIZE_MAX)
568  p = mmap(NULL, nbytes, PROT_READ, MAP_SHARED, fd, offset);
569  else
570  p = MAP_FAILED;
571 
572  if (p != MAP_FAILED)
573  {
574  int rc;
575 
576  rc = msync(p, (size_t) nbytes, MS_ASYNC);
577  if (rc != 0)
578  {
581  errmsg("could not flush dirty data: %m")));
582  /* NB: need to fall through to munmap()! */
583  }
584 
585  rc = munmap(p, (size_t) nbytes);
586  if (rc != 0)
587  {
588  /* FATAL error because mapping would remain */
589  ereport(FATAL,
591  errmsg("could not munmap() while flushing data: %m")));
592  }
593 
594  return;
595  }
596  }
597 #endif
598 #if defined(USE_POSIX_FADVISE) && defined(POSIX_FADV_DONTNEED)
599  {
600  int rc;
601 
602  /*
603  * Signal the kernel that the passed in range should not be cached
604  * anymore. This has the, desired, side effect of writing out dirty
605  * data, and the, undesired, side effect of likely discarding useful
606  * clean cached blocks. For the latter reason this is the least
607  * preferable method.
608  */
609 
610  rc = posix_fadvise(fd, offset, nbytes, POSIX_FADV_DONTNEED);
611 
612  if (rc != 0)
613  {
614  /* don't error out, this is just a performance optimization */
617  errmsg("could not flush dirty data: %m")));
618  }
619 
620  return;
621  }
622 #endif
623 }
#define MAP_FAILED
Definition: mem.h:45
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define FATAL
Definition: elog.h:52
int errcode_for_file_access(void)
Definition: elog.c:633
#define WARNING
Definition: elog.h:40
static int elevel
Definition: vacuumlazy.c:333
int data_sync_elevel(int elevel)
Definition: fd.c:3603
#define ereport(elevel,...)
Definition: elog.h:144
bool enableFsync
Definition: globals.c:119
int errmsg(const char *fmt,...)
Definition: elog.c:824

◆ pg_fsync()

int pg_fsync ( int  fd)

Definition at line 346 of file fd.c.

References Assert, pg_fsync_no_writethrough(), pg_fsync_writethrough(), S_ISDIR, stat, sync_method, and SYNC_METHOD_FSYNC_WRITETHROUGH.

Referenced by AddToDataDirLockFile(), assign_xlog_sync_method(), BootStrapXLOG(), CheckPointLogicalRewriteHeap(), CreateLockFile(), do_pg_start_backup(), durable_rename(), FileSync(), fsync_fname_ext(), heap_xlog_logical_rewrite(), readRecoverySignalFile(), RecreateTwoPhaseFile(), RestoreSlotFromDisk(), SaveSlotToPath(), SlruPhysicalWritePage(), SlruSyncFileTag(), SnapBuildSerialize(), update_controlfile(), write_auto_conf_file(), write_relmap_file(), WriteControlFile(), writeTimeLineHistory(), writeTimeLineHistoryFile(), XLogFileCopy(), and XLogFileInit().

347 {
348 #if !defined(WIN32) && defined(USE_ASSERT_CHECKING)
349  struct stat st;
350 
351  /*
352  * Some operating system implementations of fsync() have requirements
353  * about the file access modes that were used when their file descriptor
354  * argument was opened, and these requirements differ depending on whether
355  * the file descriptor is for a directory.
356  *
357  * For any file descriptor that may eventually be handed to fsync(), we
358  * should have opened it with access modes that are compatible with
359  * fsync() on all supported systems, otherwise the code may not be
360  * portable, even if it runs ok on the current system.
361  *
362  * We assert here that a descriptor for a file was opened with write
363  * permissions (either O_RDWR or O_WRONLY) and for a directory without
364  * write permissions (O_RDONLY).
365  *
366  * Ignore any fstat errors and let the follow-up fsync() do its work.
367  * Doing this sanity check here counts for the case where fsync() is
368  * disabled.
369  */
370  if (fstat(fd, &st) == 0)
371  {
372  int desc_flags = fcntl(fd, F_GETFL);
373 
374  /*
375  * O_RDONLY is historically 0, so just make sure that for directories
376  * no write flags are used.
377  */
378  if (S_ISDIR(st.st_mode))
379  Assert((desc_flags & (O_RDWR | O_WRONLY)) == 0);
380  else
381  Assert((desc_flags & (O_RDWR | O_WRONLY)) != 0);
382  }
383  errno = 0;
384 #endif
385 
386  /* #if is to skip the sync_method test if there's no need for it */
387 #if defined(HAVE_FSYNC_WRITETHROUGH) && !defined(FSYNC_WRITETHROUGH_IS_FSYNC)
389  return pg_fsync_writethrough(fd);
390  else
391 #endif
393 }
#define SYNC_METHOD_FSYNC_WRITETHROUGH
Definition: xlog.h:28
int pg_fsync_writethrough(int fd)
Definition: fd.c:413
int pg_fsync_no_writethrough(int fd)
Definition: fd.c:401
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define stat(a, b)
Definition: win32_port.h:255
#define Assert(condition)
Definition: c.h:745
int sync_method
Definition: xlog.c:106
#define S_ISDIR(m)
Definition: win32_port.h:296

◆ pg_fsync_no_writethrough()

int pg_fsync_no_writethrough ( int  fd)

Definition at line 401 of file fd.c.

References enableFsync, and fsync.

Referenced by issue_xlog_fsync(), and pg_fsync().

402 {
403  if (enableFsync)
404  return fsync(fd);
405  else
406  return 0;
407 }
static int fd(const char *x, int i)
Definition: preproc-init.c:105
#define fsync(fd)
Definition: win32_port.h:62
bool enableFsync
Definition: globals.c:119

◆ pg_fsync_writethrough()

int pg_fsync_writethrough ( int  fd)

Definition at line 413 of file fd.c.

References enableFsync.

Referenced by issue_xlog_fsync(), pg_fsync(), signal_cleanup(), and test_sync().

414 {
415  if (enableFsync)
416  {
417 #ifdef WIN32
418  return _commit(fd);
419 #elif defined(F_FULLFSYNC)
420  return (fcntl(fd, F_FULLFSYNC, 0) == -1) ? -1 : 0;
421 #else
422  errno = ENOSYS;
423  return -1;
424 #endif
425  }
426  else
427  return 0;
428 }
static int fd(const char *x, int i)
Definition: preproc-init.c:105
bool enableFsync
Definition: globals.c:119

◆ ReadDir()

◆ ReadDirExtended()

struct dirent* ReadDirExtended ( DIR dir,
const char *  dirname,
int  elevel 
)

Definition at line 2664 of file fd.c.

References ereport, errcode_for_file_access(), errmsg(), and readdir().

Referenced by DeleteAllExportedSnapshotFiles(), ReadDir(), RelationCacheInitFileRemove(), RelationCacheInitFileRemoveInDir(), RemovePgTempFiles(), RemovePgTempFilesInDir(), RemovePgTempRelationFiles(), RemovePgTempRelationFilesInDbspace(), ReorderBufferCleanupSerializedTXNs(), scan_directory_ci(), and walkdir().

2665 {
2666  struct dirent *dent;
2667 
2668  /* Give a generic message for AllocateDir failure, if caller didn't */
2669  if (dir == NULL)
2670  {
2671  ereport(elevel,
2673  errmsg("could not open directory \"%s\": %m",
2674  dirname)));
2675  return NULL;
2676  }
2677 
2678  errno = 0;
2679  if ((dent = readdir(dir)) != NULL)
2680  return dent;
2681 
2682  if (errno)
2683  ereport(elevel,
2685  errmsg("could not read directory \"%s\": %m",
2686  dirname)));
2687  return NULL;
2688 }
Definition: dirent.h:9
int errcode_for_file_access(void)
Definition: elog.c:633
static int elevel
Definition: vacuumlazy.c:333
#define ereport(elevel,...)
Definition: elog.h:144
struct dirent * readdir(DIR *)
Definition: dirent.c:78
int errmsg(const char *fmt,...)
Definition: elog.c:824

◆ ReleaseExternalFD()

◆ RemovePgTempFiles()

void RemovePgTempFiles ( void  )

Definition at line 3006 of file fd.c.

References AllocateDir(), dirent::d_name, FreeDir(), LOG, MAXPGPATH, PG_TEMP_FILES_DIR, ReadDirExtended(), RemovePgTempFilesInDir(), RemovePgTempRelationFiles(), snprintf, and TABLESPACE_VERSION_DIRECTORY.

Referenced by PostmasterMain().

3007 {
3008  char temp_path[MAXPGPATH + 10 + sizeof(TABLESPACE_VERSION_DIRECTORY) + sizeof(PG_TEMP_FILES_DIR)];
3009  DIR *spc_dir;
3010  struct dirent *spc_de;
3011 
3012  /*
3013  * First process temp files in pg_default ($PGDATA/base)
3014  */
3015  snprintf(temp_path, sizeof(temp_path), "base/%s", PG_TEMP_FILES_DIR);
3016  RemovePgTempFilesInDir(temp_path, true, false);
3017  RemovePgTempRelationFiles("base");
3018 
3019  /*
3020  * Cycle through temp directories for all non-default tablespaces.
3021  */
3022  spc_dir = AllocateDir("pg_tblspc");
3023 
3024  while ((spc_de = ReadDirExtended(spc_dir, "pg_tblspc", LOG)) != NULL)
3025  {
3026  if (strcmp(spc_de->d_name, ".") == 0 ||
3027  strcmp(spc_de->d_name, "..") == 0)
3028  continue;
3029 
3030  snprintf(temp_path, sizeof(temp_path), "pg_tblspc/%s/%s/%s",
3032  RemovePgTempFilesInDir(temp_path, true, false);
3033 
3034  snprintf(temp_path, sizeof(temp_path), "pg_tblspc/%s/%s",
3036  RemovePgTempRelationFiles(temp_path);
3037  }
3038 
3039  FreeDir(spc_dir);
3040 
3041  /*
3042  * In EXEC_BACKEND case there is a pgsql_tmp directory at the top level of
3043  * DataDir as well. However, that is *not* cleaned here because doing so
3044  * would create a race condition. It's done separately, earlier in
3045  * postmaster startup.
3046  */
3047 }
struct dirent * ReadDirExtended(DIR *dir, const char *dirname, int elevel)
Definition: fd.c:2664
#define PG_TEMP_FILES_DIR
Definition: pg_checksums.c:58
#define LOG
Definition: elog.h:26
Definition: dirent.h:9
static void RemovePgTempRelationFiles(const char *tsdirname)
Definition: fd.c:3131
Definition: dirent.c:25
#define MAXPGPATH
#define TABLESPACE_VERSION_DIRECTORY
Definition: relpath.h:26
void RemovePgTempFilesInDir(const char *tmpdirname, bool missing_ok, bool unlink_all)
Definition: fd.c:3065
DIR * AllocateDir(const char *dirname)
Definition: fd.c:2583
char d_name[MAX_PATH]
Definition: dirent.h:15
#define snprintf
Definition: port.h:193
int FreeDir(DIR *dir)
Definition: fd.c:2701

◆ RemovePgTempFilesInDir()

void RemovePgTempFilesInDir ( const char *  tmpdirname,
bool  missing_ok,
bool  unlink_all 
)

Definition at line 3065 of file fd.c.

References AllocateDir(), dirent::d_name, ereport, errcode_for_file_access(), errmsg(), FreeDir(), LOG, lstat, MAXPGPATH, PG_TEMP_FILE_PREFIX, ReadDirExtended(), RemovePgTempFilesInDir(), S_ISDIR, snprintf, and stat.

Referenced by PostmasterMain(), RemovePgTempFiles(), and RemovePgTempFilesInDir().

3066 {
3067  DIR *temp_dir;
3068  struct dirent *temp_de;
3069  char rm_path[MAXPGPATH * 2];
3070 
3071  temp_dir = AllocateDir(tmpdirname);
3072 
3073  if (temp_dir == NULL && errno == ENOENT && missing_ok)
3074  return;
3075 
3076  while ((temp_de = ReadDirExtended(temp_dir, tmpdirname, LOG)) != NULL)
3077  {
3078  if (strcmp(temp_de->d_name, ".") == 0 ||
3079  strcmp(temp_de->d_name, "..") == 0)
3080  continue;
3081 
3082  snprintf(rm_path, sizeof(rm_path), "%s/%s",
3083  tmpdirname, temp_de->d_name);
3084 
3085  if (unlink_all ||
3086  strncmp(temp_de->d_name,
3088  strlen(PG_TEMP_FILE_PREFIX)) == 0)
3089  {
3090  struct stat statbuf;
3091 
3092  if (lstat(rm_path, &statbuf) < 0)
3093  {
3094  ereport(LOG,
3096  errmsg("could not stat file \"%s\": %m", rm_path)));
3097  continue;
3098  }
3099 
3100  if (S_ISDIR(statbuf.st_mode))
3101  {
3102  /* recursively remove contents, then directory itself */
3103  RemovePgTempFilesInDir(rm_path, false, true);
3104 
3105  if (rmdir(rm_path) < 0)
3106  ereport(LOG,
3108  errmsg("could not remove directory \"%s\": %m",
3109  rm_path)));
3110  }
3111  else
3112  {
3113  if (unlink(rm_path) < 0)
3114  ereport(LOG,
3116  errmsg("could not remove file \"%s\": %m",
3117  rm_path)));
3118  }
3119  }
3120  else
3121  ereport(LOG,
3122  (errmsg("unexpected file found in temporary-files directory: \"%s\"",
3123  rm_path)));
3124  }
3125 
3126  FreeDir(temp_dir);
3127 }
struct dirent * ReadDirExtended(DIR *dir, const char *dirname, int elevel)
Definition: fd.c:2664
#define LOG
Definition: elog.h:26
Definition: dirent.h:9
Definition: dirent.c:25
#define PG_TEMP_FILE_PREFIX
Definition: pg_checksums.c:59
#define MAXPGPATH
void RemovePgTempFilesInDir(const char *tmpdirname, bool missing_ok, bool unlink_all)
Definition: fd.c:3065
int errcode_for_file_access(void)
Definition: elog.c:633
DIR * AllocateDir(const char *dirname)
Definition: fd.c:2583
#define stat(a, b)
Definition: win32_port.h:255
#define ereport(elevel,...)
Definition: elog.h:144
#define S_ISDIR(m)
Definition: win32_port.h:296
#define lstat(path, sb)
Definition: win32_port.h:244
int errmsg(const char *fmt,...)
Definition: elog.c:824
char d_name[MAX_PATH]
Definition: dirent.h:15
#define snprintf
Definition: port.h:193
int FreeDir(DIR *dir)
Definition: fd.c:2701

◆ ReserveExternalFD()

void ReserveExternalFD ( void  )

Definition at line 1083 of file fd.c.

References numExternalFDs, and ReleaseLruFiles().

Referenced by AcquireExternalFD(), BackendInitialize(), dsm_impl_op(), InitializeLatchSupport(), InitPostmasterDeathWatchHandle(), pgstat_init(), PostmasterMarkPIDForWorkerNotify(), and XLogWrite().

1084 {
1085  /*
1086  * Release VFDs if needed to stay safe. Because we do this before
1087  * incrementing numExternalFDs, the final state will be as desired, i.e.,
1088  * nfile + numAllocatedDescs + numExternalFDs <= max_safe_fds.
1089  */
1090  ReleaseLruFiles();
1091 
1092  numExternalFDs++;
1093 }
static int numExternalFDs
Definition: fd.c:259
static void ReleaseLruFiles(void)
Definition: fd.c:1266

◆ set_max_safe_fds()

void set_max_safe_fds ( void  )

Definition at line 943 of file fd.c.

References count_usable_fds(), DEBUG2, elog, ereport, errcode(), errdetail(), errmsg(), FATAL, FD_MINFREE, max_files_per_process, max_safe_fds, Min, and NUM_RESERVED_FDS.

Referenced by PostmasterMain().

944 {
945  int usable_fds;
946  int already_open;
947 
948  /*----------
949  * We want to set max_safe_fds to
950  * MIN(usable_fds, max_files_per_process - already_open)
951  * less the slop factor for files that are opened without consulting
952  * fd.c. This ensures that we won't exceed either max_files_per_process
953  * or the experimentally-determined EMFILE limit.
954  *----------
955  */
957  &usable_fds, &already_open);
958 
959  max_safe_fds = Min(usable_fds, max_files_per_process - already_open);
960 
961  /*
962  * Take off the FDs reserved for system() etc.
963  */
965 
966  /*
967  * Make sure we still have enough to get by.
968  */
969  if (max_safe_fds < FD_MINFREE)
970  ereport(FATAL,
971  (errcode(ERRCODE_INSUFFICIENT_RESOURCES),
972  errmsg("insufficient file descriptors available to start server process"),
973  errdetail("System allows %d, we need at least %d.",
976 
977  elog(DEBUG2, "max_safe_fds = %d, usable_fds = %d, already_open = %d",
978  max_safe_fds, usable_fds, already_open);
979 }
static void count_usable_fds(int max_to_probe, int *usable_fds, int *already_open)
Definition: fd.c:859
#define NUM_RESERVED_FDS
Definition: fd.c:125
int max_safe_fds
Definition: fd.c:155
#define Min(x, y)
Definition: c.h:927
int errcode(int sqlerrcode)
Definition: elog.c:610
#define FATAL
Definition: elog.h:52
#define DEBUG2
Definition: elog.h:24
int errdetail(const char *fmt,...)
Definition: elog.c:957
int max_files_per_process
Definition: fd.c:142
#define ereport(elevel,...)
Definition: elog.h:144
#define FD_MINFREE
Definition: fd.c:134
int errmsg(const char *fmt,...)
Definition: elog.c:824
#define elog(elevel,...)
Definition: elog.h:214

◆ SetTempTablespaces()

void SetTempTablespaces ( Oid tableSpaces,
int  numSpaces 
)

Definition at line 2789 of file fd.c.

References Assert, nextTempTableSpace, numTempTableSpaces, random(), and tempTableSpaces.

Referenced by assign_temp_tablespaces(), and PrepareTempTablespaces().

2790 {
2791  Assert(numSpaces >= 0);
2792  tempTableSpaces = tableSpaces;
2793  numTempTableSpaces = numSpaces;
2794 
2795  /*
2796  * Select a random starting point in the list. This is to minimize
2797  * conflicts between backends that are most likely sharing the same list
2798  * of temp tablespaces. Note that if we create multiple temp files in the
2799  * same transaction, we'll advance circularly through the list --- this
2800  * ensures that large temporary sort files are nicely spread across all
2801  * available tablespaces.
2802  */
2803  if (numSpaces > 1)
2804  nextTempTableSpace = random() % numSpaces;
2805  else
2806  nextTempTableSpace = 0;
2807 }
long random(void)
Definition: random.c:22
static int numTempTableSpaces
Definition: fd.c:274
static int nextTempTableSpace
Definition: fd.c:275
#define Assert(condition)
Definition: c.h:745
static Oid * tempTableSpaces
Definition: fd.c:273

◆ SyncDataDirectory()

void SyncDataDirectory ( void  )

Definition at line 3257 of file fd.c.

References datadir_fsync_fname(), DEBUG1, enableFsync, ereport, errcode_for_file_access(), errmsg(), LOG, lstat, pgwin32_is_junction(), stat, and walkdir().

Referenced by StartupXLOG().

3258 {
3259  bool xlog_is_symlink;
3260 
3261  /* We can skip this whole thing if fsync is disabled. */
3262  if (!enableFsync)
3263  return;
3264 
3265  /*
3266  * If pg_wal is a symlink, we'll need to recurse into it separately,
3267  * because the first walkdir below will ignore it.
3268  */
3269  xlog_is_symlink = false;
3270 
3271 #ifndef WIN32
3272  {
3273  struct stat st;
3274 
3275  if (lstat("pg_wal", &st) < 0)
3276  ereport(LOG,
3278  errmsg("could not stat file \"%s\": %m",
3279  "pg_wal")));
3280  else if (S_ISLNK(st.st_mode))
3281  xlog_is_symlink = true;
3282  }
3283 #else
3284  if (pgwin32_is_junction("pg_wal"))
3285  xlog_is_symlink = true;
3286 #endif
3287 
3288  /*
3289  * If possible, hint to the kernel that we're soon going to fsync the data
3290  * directory and its contents. Errors in this step are even less
3291  * interesting than normal, so log them only at DEBUG1.
3292  */
3293 #ifdef PG_FLUSH_DATA_WORKS
3294  walkdir(".", pre_sync_fname, false, DEBUG1);
3295  if (xlog_is_symlink)
3296  walkdir("pg_wal", pre_sync_fname, false, DEBUG1);
3297  walkdir("pg_tblspc", pre_sync_fname, true, DEBUG1);
3298 #endif
3299 
3300  /*
3301  * Now we do the fsync()s in the same order.
3302  *
3303  * The main call ignores symlinks, so in addition to specially processing
3304  * pg_wal if it's a symlink, pg_tblspc has to be visited separately with
3305  * process_symlinks = true. Note that if there are any plain directories
3306  * in pg_tblspc, they'll get fsync'd twice. That's not an expected case
3307  * so we don't worry about optimizing it.
3308  */
3309  walkdir(".", datadir_fsync_fname, false, LOG);
3310  if (xlog_is_symlink)
3311  walkdir("pg_wal", datadir_fsync_fname, false, LOG);
3312  walkdir("pg_tblspc", datadir_fsync_fname, true, LOG);
3313 }
#define DEBUG1
Definition: elog.h:25
static void walkdir(const char *path, void(*action)(const char *fname, bool isdir, int elevel), bool process_symlinks, int elevel)
Definition: fd.c:3331
#define LOG
Definition: elog.h:26
int errcode_for_file_access(void)
Definition: elog.c:633
static void datadir_fsync_fname(const char *fname, bool isdir, int elevel)
Definition: fd.c:3429
#define stat(a, b)
Definition: win32_port.h:255
#define ereport(elevel,...)
Definition: elog.h:144
#define lstat(path, sb)
Definition: win32_port.h:244
bool enableFsync
Definition: globals.c:119
int errmsg(const char *fmt,...)
Definition: elog.c:824
bool pgwin32_is_junction(const char *path)

◆ TempTablespacePath()

void TempTablespacePath ( char *  path,
Oid  tablespace 
)

Definition at line 1631 of file fd.c.

References InvalidOid, MAXPGPATH, PG_TEMP_FILES_DIR, snprintf, and TABLESPACE_VERSION_DIRECTORY.

Referenced by OpenTemporaryFileInTablespace(), pg_ls_tmpdir(), SharedFileSetCreate(), and SharedFileSetPath().

1632 {
1633  /*
1634  * Identify the tempfile directory for this tablespace.
1635  *
1636  * If someone tries to specify pg_global, use pg_default instead.
1637  */
1638  if (tablespace == InvalidOid ||
1639  tablespace == DEFAULTTABLESPACE_OID ||
1640  tablespace == GLOBALTABLESPACE_OID)
1641  snprintf(path, MAXPGPATH, "base/%s", PG_TEMP_FILES_DIR);
1642  else
1643  {
1644  /* All other tablespaces are accessed via symlinks */
1645  snprintf(path, MAXPGPATH, "pg_tblspc/%u/%s/%s",
1648  }
1649 }
#define PG_TEMP_FILES_DIR
Definition: pg_checksums.c:58
#define MAXPGPATH
#define TABLESPACE_VERSION_DIRECTORY
Definition: relpath.h:26
char * tablespace
Definition: pgbench.c:189
#define InvalidOid
Definition: postgres_ext.h:36
#define snprintf
Definition: port.h:193

◆ TempTablespacesAreSet()

bool TempTablespacesAreSet ( void  )

Definition at line 2817 of file fd.c.

References numTempTableSpaces.

Referenced by GetTempTablespaces(), and PrepareTempTablespaces().

2818 {
2819  return (numTempTableSpaces >= 0);
2820 }
static int numTempTableSpaces
Definition: fd.c:274

Variable Documentation

◆ data_sync_retry

PGDLLIMPORT bool data_sync_retry

Definition at line 158 of file fd.c.

Referenced by data_sync_elevel().

◆ max_files_per_process

PGDLLIMPORT int max_files_per_process

Definition at line 142 of file fd.c.

Referenced by set_max_safe_fds().

◆ max_safe_fds