PostgreSQL Source Code git master
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
basic_archive.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * basic_archive.c
4 *
5 * This file demonstrates a basic archive library implementation that is
6 * roughly equivalent to the following shell command:
7 *
8 * test ! -f /path/to/dest && cp /path/to/src /path/to/dest
9 *
10 * One notable difference between this module and the shell command above
11 * is that this module first copies the file to a temporary destination,
12 * syncs it to disk, and then durably moves it to the final destination.
13 *
14 * Another notable difference is that if /path/to/dest already exists
15 * but has contents identical to /path/to/src, archiving will succeed,
16 * whereas the command shown above would fail. This prevents problems if
17 * a file is successfully archived and then the system crashes before
18 * a durable record of the success has been made.
19 *
20 * Copyright (c) 2022-2025, PostgreSQL Global Development Group
21 *
22 * IDENTIFICATION
23 * contrib/basic_archive/basic_archive.c
24 *
25 *-------------------------------------------------------------------------
26 */
27#include "postgres.h"
28
29#include <sys/stat.h>
30#include <sys/time.h>
31#include <unistd.h>
32
34#include "common/int.h"
35#include "miscadmin.h"
36#include "storage/copydir.h"
37#include "storage/fd.h"
38#include "utils/guc.h"
39
41 .name = "basic_archive",
42 .version = PG_VERSION
43);
44
45static char *archive_directory = NULL;
46
48static bool basic_archive_file(ArchiveModuleState *state, const char *file, const char *path);
49static bool check_archive_directory(char **newval, void **extra, GucSource source);
50static bool compare_files(const char *file1, const char *file2);
51
53 .startup_cb = NULL,
54 .check_configured_cb = basic_archive_configured,
55 .archive_file_cb = basic_archive_file,
56 .shutdown_cb = NULL
57};
58
59/*
60 * _PG_init
61 *
62 * Defines the module's GUC.
63 */
64void
66{
67 DefineCustomStringVariable("basic_archive.archive_directory",
68 gettext_noop("Archive file destination directory."),
69 NULL,
71 "",
73 0,
74 check_archive_directory, NULL, NULL);
75
76 MarkGUCPrefixReserved("basic_archive");
77}
78
79/*
80 * _PG_archive_module_init
81 *
82 * Returns the module's archiving callbacks.
83 */
86{
88}
89
90/*
91 * check_archive_directory
92 *
93 * Checks that the provided archive directory exists.
94 */
95static bool
97{
98 struct stat st;
99
100 /*
101 * The default value is an empty string, so we have to accept that value.
102 * Our check_configured callback also checks for this and prevents
103 * archiving from proceeding if it is still empty.
104 */
105 if (*newval == NULL || *newval[0] == '\0')
106 return true;
107
108 /*
109 * Make sure the file paths won't be too long. The docs indicate that the
110 * file names to be archived can be up to 64 characters long.
111 */
112 if (strlen(*newval) + 64 + 2 >= MAXPGPATH)
113 {
114 GUC_check_errdetail("Archive directory too long.");
115 return false;
116 }
117
118 /*
119 * Do a basic sanity check that the specified archive directory exists. It
120 * could be removed at some point in the future, so we still need to be
121 * prepared for it not to exist in the actual archiving logic.
122 */
123 if (stat(*newval, &st) != 0 || !S_ISDIR(st.st_mode))
124 {
125 GUC_check_errdetail("Specified archive directory does not exist.");
126 return false;
127 }
128
129 return true;
130}
131
132/*
133 * basic_archive_configured
134 *
135 * Checks that archive_directory is not blank.
136 */
137static bool
139{
140 if (archive_directory != NULL && archive_directory[0] != '\0')
141 return true;
142
143 arch_module_check_errdetail("%s is not set.",
144 "basic_archive.archive_directory");
145 return false;
146}
147
148/*
149 * basic_archive_file
150 *
151 * Archives one file.
152 */
153static bool
154basic_archive_file(ArchiveModuleState *state, const char *file, const char *path)
155{
156 char destination[MAXPGPATH];
157 char temp[MAXPGPATH + 256];
158 struct stat st;
159 struct timeval tv;
160 uint64 epoch; /* milliseconds */
161
163 (errmsg("archiving \"%s\" via basic_archive", file)));
164
165 snprintf(destination, MAXPGPATH, "%s/%s", archive_directory, file);
166
167 /*
168 * First, check if the file has already been archived. If it already
169 * exists and has the same contents as the file we're trying to archive,
170 * we can return success (after ensuring the file is persisted to disk).
171 * This scenario is possible if the server crashed after archiving the
172 * file but before renaming its .ready file to .done.
173 *
174 * If the archive file already exists but has different contents,
175 * something might be wrong, so we just fail.
176 */
177 if (stat(destination, &st) == 0)
178 {
179 if (compare_files(path, destination))
180 {
182 (errmsg("archive file \"%s\" already exists with identical contents",
183 destination)));
184
185 fsync_fname(destination, false);
187
188 return true;
189 }
190
192 (errmsg("archive file \"%s\" already exists", destination)));
193 }
194 else if (errno != ENOENT)
197 errmsg("could not stat file \"%s\": %m", destination)));
198
199 /*
200 * Pick a sufficiently unique name for the temporary file so that a
201 * collision is unlikely. This helps avoid problems in case a temporary
202 * file was left around after a crash or another server happens to be
203 * archiving to the same directory.
204 */
205 gettimeofday(&tv, NULL);
206 if (pg_mul_u64_overflow((uint64) 1000, (uint64) tv.tv_sec, &epoch) ||
207 pg_add_u64_overflow(epoch, (uint64) (tv.tv_usec / 1000), &epoch))
208 elog(ERROR, "could not generate temporary file name for archiving");
209
210 snprintf(temp, sizeof(temp), "%s/%s.%s.%d." UINT64_FORMAT,
211 archive_directory, "archtemp", file, MyProcPid, epoch);
212
213 /*
214 * Copy the file to its temporary destination. Note that this will fail
215 * if temp already exists.
216 */
217 copy_file(path, temp);
218
219 /*
220 * Sync the temporary file to disk and move it to its final destination.
221 * Note that this will overwrite any existing file, but this is only
222 * possible if someone else created the file since the stat() above.
223 */
224 (void) durable_rename(temp, destination, ERROR);
225
227 (errmsg("archived \"%s\" via basic_archive", file)));
228
229 return true;
230}
231
232/*
233 * compare_files
234 *
235 * Returns whether the contents of the files are the same.
236 */
237static bool
238compare_files(const char *file1, const char *file2)
239{
240#define CMP_BUF_SIZE (4096)
241 char buf1[CMP_BUF_SIZE];
242 char buf2[CMP_BUF_SIZE];
243 int fd1;
244 int fd2;
245 bool ret = true;
246
247 fd1 = OpenTransientFile(file1, O_RDONLY | PG_BINARY);
248 if (fd1 < 0)
251 errmsg("could not open file \"%s\": %m", file1)));
252
253 fd2 = OpenTransientFile(file2, O_RDONLY | PG_BINARY);
254 if (fd2 < 0)
257 errmsg("could not open file \"%s\": %m", file2)));
258
259 for (;;)
260 {
261 int nbytes = 0;
262 int buf1_len = 0;
263 int buf2_len = 0;
264
265 while (buf1_len < CMP_BUF_SIZE)
266 {
267 nbytes = read(fd1, buf1 + buf1_len, CMP_BUF_SIZE - buf1_len);
268 if (nbytes < 0)
271 errmsg("could not read file \"%s\": %m", file1)));
272 else if (nbytes == 0)
273 break;
274
275 buf1_len += nbytes;
276 }
277
278 while (buf2_len < CMP_BUF_SIZE)
279 {
280 nbytes = read(fd2, buf2 + buf2_len, CMP_BUF_SIZE - buf2_len);
281 if (nbytes < 0)
284 errmsg("could not read file \"%s\": %m", file2)));
285 else if (nbytes == 0)
286 break;
287
288 buf2_len += nbytes;
289 }
290
291 if (buf1_len != buf2_len || memcmp(buf1, buf2, buf1_len) != 0)
292 {
293 ret = false;
294 break;
295 }
296 else if (buf1_len == 0)
297 break;
298 }
299
300 if (CloseTransientFile(fd1) != 0)
303 errmsg("could not close file \"%s\": %m", file1)));
304
305 if (CloseTransientFile(fd2) != 0)
308 errmsg("could not close file \"%s\": %m", file2)));
309
310 return ret;
311}
#define arch_module_check_errdetail
static char * archive_directory
Definition: basic_archive.c:45
void _PG_init(void)
Definition: basic_archive.c:65
static bool basic_archive_file(ArchiveModuleState *state, const char *file, const char *path)
PG_MODULE_MAGIC_EXT(.name="basic_archive",.version=PG_VERSION)
#define CMP_BUF_SIZE
static const ArchiveModuleCallbacks basic_archive_callbacks
Definition: basic_archive.c:52
static bool compare_files(const char *file1, const char *file2)
static bool basic_archive_configured(ArchiveModuleState *state)
static bool check_archive_directory(char **newval, void **extra, GucSource source)
Definition: basic_archive.c:96
const ArchiveModuleCallbacks * _PG_archive_module_init(void)
Definition: basic_archive.c:85
#define gettext_noop(x)
Definition: c.h:1167
#define PG_BINARY
Definition: c.h:1244
#define UINT64_FORMAT
Definition: c.h:521
uint64_t uint64
Definition: c.h:503
void copy_file(const char *fromfile, const char *tofile)
Definition: copydir.c:133
int errcode_for_file_access(void)
Definition: elog.c:877
int errmsg(const char *fmt,...)
Definition: elog.c:1071
#define DEBUG3
Definition: elog.h:28
#define DEBUG1
Definition: elog.h:30
#define ERROR
Definition: elog.h:39
#define elog(elevel,...)
Definition: elog.h:225
#define ereport(elevel,...)
Definition: elog.h:149
int durable_rename(const char *oldfile, const char *newfile, int elevel)
Definition: fd.c:782
int CloseTransientFile(int fd)
Definition: fd.c:2871
void fsync_fname(const char *fname, bool isdir)
Definition: fd.c:756
int OpenTransientFile(const char *fileName, int fileFlags)
Definition: fd.c:2694
int MyProcPid
Definition: globals.c:48
void DefineCustomStringVariable(const char *name, const char *short_desc, const char *long_desc, char **valueAddr, const char *bootValue, GucContext context, int flags, GucStringCheckHook check_hook, GucStringAssignHook assign_hook, GucShowHook show_hook)
Definition: guc.c:5219
#define newval
void MarkGUCPrefixReserved(const char *className)
Definition: guc.c:5280
#define GUC_check_errdetail
Definition: guc.h:481
GucSource
Definition: guc.h:112
@ PGC_SIGHUP
Definition: guc.h:75
static bool pg_add_u64_overflow(uint64 a, uint64 b, uint64 *result)
Definition: int.h:514
static bool pg_mul_u64_overflow(uint64 a, uint64 b, uint64 *result)
Definition: int.h:548
#define read(a, b, c)
Definition: win32.h:13
#define MAXPGPATH
static rewind_source * source
Definition: pg_rewind.c:89
#define snprintf
Definition: port.h:239
ArchiveStartupCB startup_cb
unsigned short st_mode
Definition: win32_port.h:258
Definition: regguts.h:323
const char * name
#define stat
Definition: win32_port.h:274
#define S_ISDIR(m)
Definition: win32_port.h:315
static const unsigned __int64 epoch
int gettimeofday(struct timeval *tp, void *tzp)