PostgreSQL Source Code git master
astreamer_file.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * astreamer_file.c
4 *
5 * Archive streamers that write to files. astreamer_plain_writer writes
6 * the whole archive to a single file, and astreamer_extractor writes
7 * each archive member to a separate file in a given directory.
8 *
9 * Portions Copyright (c) 1996-2025, PostgreSQL Global Development Group
10 *
11 * IDENTIFICATION
12 * src/fe_utils/astreamer_file.c
13 *-------------------------------------------------------------------------
14 */
15
16#include "postgres_fe.h"
17
18#include <unistd.h>
19
20#include "common/file_perm.h"
21#include "common/logging.h"
22#include "fe_utils/astreamer.h"
23
25{
27 char *pathname;
28 FILE *file;
31
32typedef struct astreamer_extractor
33{
35 char *basepath;
36 const char *(*link_map) (const char *);
37 void (*report_output_file) (const char *);
39 FILE *file;
41
42static void astreamer_plain_writer_content(astreamer *streamer,
43 astreamer_member *member,
44 const char *data, int len,
46static void astreamer_plain_writer_finalize(astreamer *streamer);
47static void astreamer_plain_writer_free(astreamer *streamer);
48
53};
54
55static void astreamer_extractor_content(astreamer *streamer,
56 astreamer_member *member,
57 const char *data, int len,
59static void astreamer_extractor_finalize(astreamer *streamer);
60static void astreamer_extractor_free(astreamer *streamer);
61static void extract_directory(const char *filename, mode_t mode);
62static void extract_link(const char *filename, const char *linktarget);
63static FILE *create_file_for_extract(const char *filename, mode_t mode);
64
69};
70
71/*
72 * Create a astreamer that just writes data to a file.
73 *
74 * The caller must specify a pathname and may specify a file. The pathname is
75 * used for error-reporting purposes either way. If file is NULL, the pathname
76 * also identifies the file to which the data should be written: it is opened
77 * for writing and closed when done. If file is not NULL, the data is written
78 * there.
79 */
81astreamer_plain_writer_new(char *pathname, FILE *file)
82{
83 astreamer_plain_writer *streamer;
84
85 streamer = palloc0(sizeof(astreamer_plain_writer));
86 *((const astreamer_ops **) &streamer->base.bbs_ops) =
88
89 streamer->pathname = pstrdup(pathname);
90 streamer->file = file;
91
92 if (file == NULL)
93 {
94 streamer->file = fopen(pathname, "wb");
95 if (streamer->file == NULL)
96 pg_fatal("could not create file \"%s\": %m", pathname);
97 streamer->should_close_file = true;
98 }
99
100 return &streamer->base;
101}
102
103/*
104 * Write archive content to file.
105 */
106static void
108 astreamer_member *member, const char *data,
109 int len, astreamer_archive_context context)
110{
111 astreamer_plain_writer *mystreamer;
112
113 mystreamer = (astreamer_plain_writer *) streamer;
114
115 if (len == 0)
116 return;
117
118 errno = 0;
119 if (fwrite(data, len, 1, mystreamer->file) != 1)
120 {
121 /* if write didn't set errno, assume problem is no disk space */
122 if (errno == 0)
123 errno = ENOSPC;
124 pg_fatal("could not write to file \"%s\": %m",
125 mystreamer->pathname);
126 }
127}
128
129/*
130 * End-of-archive processing when writing to a plain file consists of closing
131 * the file if we opened it, but not if the caller provided it.
132 */
133static void
135{
136 astreamer_plain_writer *mystreamer;
137
138 mystreamer = (astreamer_plain_writer *) streamer;
139
140 if (mystreamer->should_close_file && fclose(mystreamer->file) != 0)
141 pg_fatal("could not close file \"%s\": %m",
142 mystreamer->pathname);
143
144 mystreamer->file = NULL;
145 mystreamer->should_close_file = false;
146}
147
148/*
149 * Free memory associated with this astreamer.
150 */
151static void
153{
154 astreamer_plain_writer *mystreamer;
155
156 mystreamer = (astreamer_plain_writer *) streamer;
157
158 Assert(!mystreamer->should_close_file);
159 Assert(mystreamer->base.bbs_next == NULL);
160
161 pfree(mystreamer->pathname);
162 pfree(mystreamer);
163}
164
165/*
166 * Create a astreamer that extracts an archive.
167 *
168 * All pathnames in the archive are interpreted relative to basepath.
169 *
170 * Unlike e.g. astreamer_plain_writer_new() we can't do anything useful here
171 * with untyped chunks; we need typed chunks which follow the rules described
172 * in astreamer.h. Assuming we have that, we don't need to worry about the
173 * original archive format; it's enough to just look at the member information
174 * provided and write to the corresponding file.
175 *
176 * 'link_map' is a function that will be applied to the target of any
177 * symbolic link, and which should return a replacement pathname to be used
178 * in its place. If NULL, the symbolic link target is used without
179 * modification.
180 *
181 * 'report_output_file' is a function that will be called each time we open a
182 * new output file. The pathname to that file is passed as an argument. If
183 * NULL, the call is skipped.
184 */
185astreamer *
186astreamer_extractor_new(const char *basepath,
187 const char *(*link_map) (const char *),
188 void (*report_output_file) (const char *))
189{
190 astreamer_extractor *streamer;
191
192 streamer = palloc0(sizeof(astreamer_extractor));
193 *((const astreamer_ops **) &streamer->base.bbs_ops) =
195 streamer->basepath = pstrdup(basepath);
196 streamer->link_map = link_map;
197 streamer->report_output_file = report_output_file;
198
199 return &streamer->base;
200}
201
202/*
203 * Extract archive contents to the filesystem.
204 */
205static void
207 const char *data, int len,
209{
210 astreamer_extractor *mystreamer = (astreamer_extractor *) streamer;
211 int fnamelen;
212
213 Assert(member != NULL || context == ASTREAMER_ARCHIVE_TRAILER);
214 Assert(context != ASTREAMER_UNKNOWN);
215
216 switch (context)
217 {
219 Assert(mystreamer->file == NULL);
220
221 /* Prepend basepath. */
222 snprintf(mystreamer->filename, sizeof(mystreamer->filename),
223 "%s/%s", mystreamer->basepath, member->pathname);
224
225 /* Remove any trailing slash. */
226 fnamelen = strlen(mystreamer->filename);
227 if (mystreamer->filename[fnamelen - 1] == '/')
228 mystreamer->filename[fnamelen - 1] = '\0';
229
230 /* Dispatch based on file type. */
231 if (member->is_directory)
232 extract_directory(mystreamer->filename, member->mode);
233 else if (member->is_link)
234 {
235 const char *linktarget = member->linktarget;
236
237 if (mystreamer->link_map)
238 linktarget = mystreamer->link_map(linktarget);
239 extract_link(mystreamer->filename, linktarget);
240 }
241 else
242 mystreamer->file =
244 member->mode);
245
246 /* Report output file change. */
247 if (mystreamer->report_output_file)
248 mystreamer->report_output_file(mystreamer->filename);
249 break;
250
252 if (mystreamer->file == NULL)
253 break;
254
255 errno = 0;
256 if (len > 0 && fwrite(data, len, 1, mystreamer->file) != 1)
257 {
258 /* if write didn't set errno, assume problem is no disk space */
259 if (errno == 0)
260 errno = ENOSPC;
261 pg_fatal("could not write to file \"%s\": %m",
262 mystreamer->filename);
263 }
264 break;
265
267 if (mystreamer->file == NULL)
268 break;
269 fclose(mystreamer->file);
270 mystreamer->file = NULL;
271 break;
272
274 break;
275
276 default:
277 /* Shouldn't happen. */
278 pg_fatal("unexpected state while extracting archive");
279 }
280}
281
282/*
283 * Should we tolerate an already-existing directory?
284 *
285 * When streaming WAL, pg_wal (or pg_xlog for pre-9.6 clusters) will have been
286 * created by the wal receiver process. Also, when the WAL directory location
287 * was specified, pg_wal (or pg_xlog) has already been created as a symbolic
288 * link before starting the actual backup. So just ignore creation failures
289 * on related directories.
290 *
291 * If in-place tablespaces are used, pg_tblspc and subdirectories may already
292 * exist when we get here. So tolerate that case, too.
293 */
294static bool
296{
297 const char *filename = last_dir_separator(pathname) + 1;
298
299 if (strcmp(filename, "pg_wal") == 0 ||
300 strcmp(filename, "pg_xlog") == 0 ||
301 strcmp(filename, "archive_status") == 0 ||
302 strcmp(filename, "summaries") == 0 ||
303 strcmp(filename, "pg_tblspc") == 0)
304 return true;
305
306 if (strspn(filename, "0123456789") == strlen(filename))
307 {
308 const char *pg_tblspc = strstr(pathname, "/pg_tblspc/");
309
310 return pg_tblspc != NULL && pg_tblspc + 11 == filename;
311 }
312
313 return false;
314}
315
316/*
317 * Create a directory.
318 */
319static void
320extract_directory(const char *filename, mode_t mode)
321{
322 if (mkdir(filename, pg_dir_create_mode) != 0 &&
323 (errno != EEXIST || !should_allow_existing_directory(filename)))
324 pg_fatal("could not create directory \"%s\": %m",
325 filename);
326
327#ifndef WIN32
328 if (chmod(filename, mode))
329 pg_fatal("could not set permissions on directory \"%s\": %m",
330 filename);
331#endif
332}
333
334/*
335 * Create a symbolic link.
336 *
337 * It's most likely a link in pg_tblspc directory, to the location of a
338 * tablespace. Apply any tablespace mapping given on the command line
339 * (--tablespace-mapping). (We blindly apply the mapping without checking that
340 * the link really is inside pg_tblspc. We don't expect there to be other
341 * symlinks in a data directory, but if there are, you can call it an
342 * undocumented feature that you can map them too.)
343 */
344static void
345extract_link(const char *filename, const char *linktarget)
346{
347 if (symlink(linktarget, filename) != 0)
348 pg_fatal("could not create symbolic link from \"%s\" to \"%s\": %m",
349 filename, linktarget);
350}
351
352/*
353 * Create a regular file.
354 *
355 * Return the resulting handle so we can write the content to the file.
356 */
357static FILE *
359{
360 FILE *file;
361
362 file = fopen(filename, "wb");
363 if (file == NULL)
364 pg_fatal("could not create file \"%s\": %m", filename);
365
366#ifndef WIN32
367 if (chmod(filename, mode))
368 pg_fatal("could not set permissions on file \"%s\": %m",
369 filename);
370#endif
371
372 return file;
373}
374
375/*
376 * End-of-stream processing for extracting an archive.
377 *
378 * There's nothing to do here but sanity checking.
379 */
380static void
382{
384 = (astreamer_extractor *) streamer;
385
386 Assert(mystreamer->file == NULL);
387}
388
389/*
390 * Free memory.
391 */
392static void
394{
395 astreamer_extractor *mystreamer = (astreamer_extractor *) streamer;
396
397 pfree(mystreamer->basepath);
398 pfree(mystreamer);
399}
astreamer_archive_context
Definition: astreamer.h:63
@ ASTREAMER_MEMBER_HEADER
Definition: astreamer.h:65
@ ASTREAMER_MEMBER_CONTENTS
Definition: astreamer.h:66
@ ASTREAMER_MEMBER_TRAILER
Definition: astreamer.h:67
@ ASTREAMER_ARCHIVE_TRAILER
Definition: astreamer.h:68
@ ASTREAMER_UNKNOWN
Definition: astreamer.h:64
astreamer * astreamer_plain_writer_new(char *pathname, FILE *file)
static void astreamer_plain_writer_content(astreamer *streamer, astreamer_member *member, const char *data, int len, astreamer_archive_context context)
static void astreamer_extractor_finalize(astreamer *streamer)
static void extract_directory(const char *filename, mode_t mode)
static FILE * create_file_for_extract(const char *filename, mode_t mode)
static const astreamer_ops astreamer_extractor_ops
struct astreamer_extractor astreamer_extractor
astreamer * astreamer_extractor_new(const char *basepath, const char *(*link_map)(const char *), void(*report_output_file)(const char *))
struct astreamer_plain_writer astreamer_plain_writer
static void astreamer_plain_writer_finalize(astreamer *streamer)
static void astreamer_extractor_free(astreamer *streamer)
static void astreamer_extractor_content(astreamer *streamer, astreamer_member *member, const char *data, int len, astreamer_archive_context context)
static const astreamer_ops astreamer_plain_writer_ops
static bool should_allow_existing_directory(const char *pathname)
static void extract_link(const char *filename, const char *linktarget)
static void astreamer_plain_writer_free(astreamer *streamer)
#define PG_USED_FOR_ASSERTS_ONLY
Definition: c.h:204
#define Assert(condition)
Definition: c.h:815
int pg_dir_create_mode
Definition: file_perm.c:18
char * pstrdup(const char *in)
Definition: mcxt.c:1696
void pfree(void *pointer)
Definition: mcxt.c:1521
void * palloc0(Size size)
Definition: mcxt.c:1347
#define pg_fatal(...)
static PgChecksumMode mode
Definition: pg_checksums.c:55
#define MAXPGPATH
const void size_t len
const void * data
static char * filename
Definition: pg_dumpall.c:119
char * last_dir_separator(const char *filename)
Definition: path.c:140
#define snprintf
Definition: port.h:238
const char *(* link_map)(const char *)
void(* report_output_file)(const char *)
char filename[MAXPGPATH]
char linktarget[MAXPGPATH]
Definition: astreamer.h:88
char pathname[MAXPGPATH]
Definition: astreamer.h:81
void(* content)(astreamer *streamer, astreamer_member *member, const char *data, int len, astreamer_archive_context context)
Definition: astreamer.h:126
const astreamer_ops * bbs_ops
Definition: astreamer.h:109
astreamer * bbs_next
Definition: astreamer.h:110
#define mkdir(a, b)
Definition: win32_port.h:80
#define symlink(oldpath, newpath)
Definition: win32_port.h:225