56 int segsize, const
char *waldir);
59#define MAX_ERRORMSG_LEN 1000
65#define DEFAULT_DECODE_BUFFER_SIZE (64 * 1024)
82 state->errormsg_deferred =
true;
95 state->decode_buffer = buffer;
96 state->decode_buffer_size = size;
97 state->decode_buffer_tail = buffer;
98 state->decode_buffer_head = buffer;
119 state->routine = *routine;
141 state->private_data = private_data;
145 if (!
state->errormsg_buf)
151 state->errormsg_buf[0] =
'\0';
164 if (
state->seg.ws_file != -1)
167 if (
state->decode_buffer &&
state->free_decode_buffer)
171 if (
state->readRecordBuf)
193 uint32 newSize = reclength;
195 newSize += XLOG_BLCKSZ - (newSize % XLOG_BLCKSZ);
196 newSize =
Max(newSize, 5 *
Max(BLCKSZ, XLOG_BLCKSZ));
198 if (
state->readRecordBuf)
201 state->readRecordBufSize = newSize;
209 int segsize,
const char *waldir)
239 state->EndRecPtr = RecPtr;
240 state->NextRecPtr = RecPtr;
262 record =
state->record;
265 state->record = NULL;
269 if (
state->decode_queue_tail == record)
270 state->decode_queue_tail = NULL;
281 Assert(
state->decode_buffer_head == (
char *) record);
288 record = record->next;
289 while (
unlikely(record && record->oversized))
290 record = record->next;
295 state->decode_buffer_head = (
char *) record;
305 state->decode_buffer_head =
state->decode_buffer;
306 state->decode_buffer_tail =
state->decode_buffer;
331 if (
state->decode_queue_head == NULL)
334 if (
state->errormsg_deferred)
336 if (
state->errormsg_buf[0] !=
'\0')
337 *errormsg =
state->errormsg_buf;
338 state->errormsg_deferred =
false;
370 return state->record;
447 if (
state->decode_buffer_size == 0)
450 state->decode_buffer_head =
state->decode_buffer;
451 state->decode_buffer_tail =
state->decode_buffer;
452 state->free_decode_buffer =
true;
456 if (
state->decode_buffer_tail >=
state->decode_buffer_head)
459 if (required_space <=
460 state->decode_buffer_size -
461 (
state->decode_buffer_tail -
state->decode_buffer))
477 else if (required_space <
478 state->decode_buffer_head -
state->decode_buffer)
499 state->decode_buffer_head -
state->decode_buffer_tail)
520 decoded =
palloc(required_space);
553 state->errormsg_buf[0] =
'\0';
559 RecPtr =
state->NextRecPtr;
586 state->nonblocking = nonblocking;
587 state->currRecPtr = RecPtr;
590 targetPagePtr = RecPtr - (RecPtr % XLOG_BLCKSZ);
591 targetRecOff = RecPtr % XLOG_BLCKSZ;
610 if (targetRecOff == 0)
615 RecPtr += pageHeaderSize;
616 targetRecOff = pageHeaderSize;
618 else if (targetRecOff < pageHeaderSize)
622 pageHeaderSize, targetRecOff);
627 targetRecOff == pageHeaderSize)
670 "invalid record length at %X/%X: expected at least %u, got %u",
687 if (decoded == NULL && nonblocking)
697 len = XLOG_BLCKSZ - RecPtr % XLOG_BLCKSZ;
712 Assert(
state->readRecordBufSize >= XLOG_BLCKSZ * 2);
716 memcpy(
state->readRecordBuf,
717 state->readBuf + RecPtr % XLOG_BLCKSZ,
len);
718 buffer =
state->readRecordBuf +
len;
724 targetPagePtr += XLOG_BLCKSZ;
750 state->overwrittenRecPtr = RecPtr;
751 RecPtr = targetPagePtr;
759 "there is no contrecord flag at %X/%X",
772 "invalid contrecord length %u (expected %lld) at %X/%X",
774 ((
long long) total_len) - gotlen,
788 contdata = (
char *)
state->readBuf + pageHeaderSize;
789 len = XLOG_BLCKSZ - pageHeaderSize;
795 pageHeaderSize +
len);
797 memcpy(buffer, contdata,
len);
817 if (total_len >
state->readRecordBufSize)
819 char save_copy[XLOG_BLCKSZ * 2];
826 Assert(gotlen <= state->readRecordBufSize);
827 memcpy(save_copy,
state->readRecordBuf, gotlen);
829 memcpy(
state->readRecordBuf, save_copy, gotlen);
830 buffer =
state->readRecordBuf + gotlen;
832 }
while (gotlen < total_len);
840 state->DecodeRecPtr = RecPtr;
841 state->NextRecPtr = targetPagePtr + pageHeaderSize
848 Min(targetRecOff + total_len, XLOG_BLCKSZ));
860 state->DecodeRecPtr = RecPtr;
866 if (record->
xl_rmid == RM_XLOG_ID &&
870 state->NextRecPtr +=
state->segcxt.ws_segsize - 1;
901 if ((
char *) decoded ==
state->decode_buffer)
904 state->decode_buffer_tail += decoded->
size;
909 if (
state->decode_queue_tail)
910 state->decode_queue_tail->
next = decoded;
911 state->decode_queue_tail = decoded;
912 if (!
state->decode_queue_head)
913 state->decode_queue_head = decoded;
929 state->abortedRecPtr = RecPtr;
930 state->missingContrecPtr = targetPagePtr;
937 state->errormsg_deferred =
true;
971 if (
state->errormsg_deferred)
978 return state->decode_queue_tail;
1008 Assert((pageptr % XLOG_BLCKSZ) == 0);
1014 if (targetSegNo ==
state->seg.ws_segno &&
1015 targetPageOff ==
state->segoff && reqLen <= state->
readLen)
1016 return state->readLen;
1037 if (targetSegNo !=
state->seg.ws_segno && targetPageOff != 0)
1039 XLogRecPtr targetSegmentPtr = pageptr - targetPageOff;
1098 state->seg.ws_segno = targetSegNo;
1099 state->segoff = targetPageOff;
1116 state->seg.ws_segno = 0;
1135 "invalid record length at %X/%X: expected at least %u, got %u",
1143 "invalid resource manager ID %u at %X/%X",
1153 if (!(record->
xl_prev < RecPtr))
1156 "record with incorrect prev-link %X/%X at %X/%X",
1169 if (record->
xl_prev != PrevRecPtr)
1172 "record with incorrect prev-link %X/%X at %X/%X",
1210 "incorrect resource manager data checksum in record at %X/%X",
1232 Assert((recptr % XLOG_BLCKSZ) == 0);
1244 "invalid magic number %04X in WAL segment %s, LSN %X/%X, offset %u",
1259 "invalid info bits %04X in WAL segment %s, LSN %X/%X, offset %u",
1271 if (
state->system_identifier &&
1275 "WAL file is from different database system: WAL file database system identifier is %" PRIu64
", pg_control database system identifier is %" PRIu64,
1277 state->system_identifier);
1283 "WAL file is from different database system: incorrect segment size in page header");
1289 "WAL file is from different database system: incorrect XLOG_BLCKSZ in page header");
1293 else if (offset == 0)
1301 "invalid info bits %04X in WAL segment %s, LSN %X/%X, offset %u",
1321 "unexpected pageaddr %X/%X in WAL segment %s, LSN %X/%X, offset %u",
1338 if (recptr >
state->latestPagePtr)
1347 "out-of-sequence timeline ID %u (after %u) in WAL segment %s, LSN %X/%X, offset %u",
1349 state->latestPageTLI,
1356 state->latestPagePtr = recptr;
1368 state->errormsg_buf[0] =
'\0';
1369 state->errormsg_deferred =
false;
1394 state->nonblocking =
false;
1417 targetRecOff = tmpRecPtr % XLOG_BLCKSZ;
1420 targetPagePtr = tmpRecPtr - targetRecOff;
1449 tmpRecPtr = targetPagePtr + XLOG_BLCKSZ;
1456 tmpRecPtr = targetPagePtr + pageHeaderSize
1463 tmpRecPtr = targetPagePtr + pageHeaderSize;
1477 if (RecPtr <= state->ReadRecPtr)
1480 found =
state->ReadRecPtr;
1532 if (
state->seg.ws_file < 0 ||
1534 tli !=
state->seg.ws_tli)
1538 if (
state->seg.ws_file >= 0)
1542 state->routine.segment_open(
state, nextSegNo, &tli);
1548 state->seg.ws_tli = tli;
1549 state->seg.ws_segno = nextSegNo;
1553 if (nbytes > (
state->segcxt.ws_segsize - startoff))
1554 segbytes =
state->segcxt.ws_segsize - startoff;
1567 readbytes =
pg_pread(
state->seg.ws_file, p, segbytes, (off_t) startoff);
1573 io_start, 1, readbytes);
1587 recptr += readbytes;
1588 nbytes -= readbytes;
1610 while ((r =
state->decode_queue_head) != NULL)
1616 state->decode_queue_tail = NULL;
1617 state->decode_queue_head = NULL;
1618 state->record = NULL;
1621 state->decode_buffer_tail =
state->decode_buffer;
1622 state->decode_buffer_head =
state->decode_buffer;
1625 state->errormsg_buf[0] =
'\0';
1626 state->errormsg_deferred =
false;
1650 size += (MAXIMUM_ALIGNOF - 1);
1654 size += (MAXIMUM_ALIGNOF - 1);
1681#define COPY_HEADER_FIELD(_dst, _size) \
1683 if (remaining < _size) \
1684 goto shortdata_err; \
1685 memcpy(_dst, ptr, _size); \
1687 remaining -= _size; \
1697 decoded->
header = *record;
1699 decoded->
next = NULL;
1705 ptr = (
char *) record;
1718 uint8 main_data_len;
1723 datatotal += main_data_len;
1734 datatotal += main_data_len;
1756 if (block_id <= decoded->max_block_id)
1759 "out-of-order block_id %u at %X/%X",
1766 blk = &decoded->
blocks[block_id];
1772 blk->
flags = fork_flags;
1783 "BKPBLOCK_HAS_DATA set, but no data included at %X/%X",
1790 "BKPBLOCK_HAS_DATA not set, but data length is %u at %X/%X",
1826 "BKPIMAGE_HAS_HOLE set, but hole offset %u length %u block image length %u at %X/%X",
1842 "BKPIMAGE_HAS_HOLE not set, but hole offset %u length %u at %X/%X",
1856 "BKPIMAGE_COMPRESSED set, but block image length %u at %X/%X",
1871 "neither BKPIMAGE_HAS_HOLE nor BKPIMAGE_COMPRESSED set, but block image length is %u at %X/%X",
1884 if (rlocator == NULL)
1887 "BKPBLOCK_SAME_REL set but no previous rel at %X/%X",
1899 "invalid block_id %u at %X/%X",
1915 out = ((
char *) decoded) +
1920 for (block_id = 0; block_id <= decoded->
max_block_id; block_id++)
1966 "record with invalid length at %X/%X",
1969 *errormsg =
state->errormsg_buf;
1989 elog(
ERROR,
"could not locate backup block with ID %d in WAL record",
1992 pg_fatal(
"could not locate backup block with ID %d in WAL record",
2023 *blknum = bkpb->
blkno;
2024 if (prefetch_buffer)
2076 "could not restore image at %X/%X with invalid block %d specified",
2095 bool decomp_success =
true;
2101 decomp_success =
false;
2106 if (LZ4_decompress_safe(ptr, tmp.
data,
2108 decomp_success =
false;
2110 report_invalid_record(record,
"could not restore image at %X/%X compressed with %s not supported by build, block %d",
2120 size_t decomp_result = ZSTD_decompress(tmp.
data,
2124 if (ZSTD_isError(decomp_result))
2125 decomp_success =
false;
2127 report_invalid_record(record,
"could not restore image at %X/%X compressed with %s not supported by build, block %d",
2136 report_invalid_record(record,
"could not restore image at %X/%X compressed with unknown method, block %d",
2142 if (!decomp_success)
2156 memcpy(page, ptr, BLCKSZ);
#define pg_attribute_printf(f, a)
#define MemSet(start, val, len)
void err(int eval, const char *fmt,...)
#define MCXT_ALLOC_NO_OOM
Assert(PointerIsAligned(start, uint64))
if(TABLE==NULL||TABLE_index==NULL)
void pfree(void *pointer)
void * palloc_extended(Size size, int flags)
#define AmStartupProcess()
#define InvalidRepOriginId
#define COMP_CRC32C(crc, data, len)
#define EQ_CRC32C(c1, c2)
int32 pglz_decompress(const char *source, int32 slen, char *dest, int32 rawsize, bool check_complete)
instr_time pgstat_prepare_io_time(bool track_io_guc)
void pgstat_count_io_op_time(IOObject io_object, IOContext io_context, IOOp io_op, instr_time start_time, uint32 cnt, uint64 bytes)
#define RmgrIdIsValid(rmid)
struct DecodedXLogRecord * next
TransactionId toplevel_xid
RepOriginId record_origin
DecodedBkpBlock blocks[FLEXIBLE_ARRAY_MEMBER]
FullTransactionId nextXid
DecodedXLogRecord * record
#define InvalidTransactionId
static FullTransactionId FullTransactionIdFromAllowableAt(FullTransactionId nextFullXid, TransactionId xid)
TransamVariablesData * TransamVariables
static void pgstat_report_wait_start(uint32 wait_event_info)
static void pgstat_report_wait_end(void)
#define XLP_FIRST_IS_CONTRECORD
XLogLongPageHeaderData * XLogLongPageHeader
#define XLP_FIRST_IS_OVERWRITE_CONTRECORD
#define XLogSegmentOffset(xlogptr, wal_segsz_bytes)
XLogPageHeaderData * XLogPageHeader
#define XLByteToSeg(xlrp, logSegNo, wal_segsz_bytes)
#define XRecOffIsValid(xlrp)
#define SizeOfXLogShortPHD
static void XLogFileName(char *fname, TimeLineID tli, XLogSegNo logSegNo, int wal_segsz_bytes)
#define XLogPageHeaderSize(hdr)
#define XLByteInSeg(xlrp, logSegNo, wal_segsz_bytes)
#define LSN_FORMAT_ARGS(lsn)
#define XLogRecPtrIsInvalid(r)
#define InvalidXLogRecPtr
bool XLogRecGetBlockTagExtended(XLogReaderState *record, uint8 block_id, RelFileLocator *rlocator, ForkNumber *forknum, BlockNumber *blknum, Buffer *prefetch_buffer)
static XLogPageReadResult XLogDecodeNextRecord(XLogReaderState *state, bool nonblocking)
XLogReaderState * XLogReaderAllocate(int wal_segment_size, const char *waldir, XLogReaderRoutine *routine, void *private_data)
void XLogReaderSetDecodeBuffer(XLogReaderState *state, void *buffer, size_t size)
DecodedXLogRecord * XLogReadAhead(XLogReaderState *state, bool nonblocking)
static void WALOpenSegmentInit(WALOpenSegment *seg, WALSegmentContext *segcxt, int segsize, const char *waldir)
char * XLogRecGetBlockData(XLogReaderState *record, uint8 block_id, Size *len)
static int ReadPageInternal(XLogReaderState *state, XLogRecPtr pageptr, int reqLen)
DecodedXLogRecord * XLogNextRecord(XLogReaderState *state, char **errormsg)
static void report_invalid_record(XLogReaderState *state, const char *fmt,...) pg_attribute_printf(2
static void static void allocate_recordbuf(XLogReaderState *state, uint32 reclength)
bool WALRead(XLogReaderState *state, char *buf, XLogRecPtr startptr, Size count, TimeLineID tli, WALReadError *errinfo)
XLogRecord * XLogReadRecord(XLogReaderState *state, char **errormsg)
void XLogReaderResetError(XLogReaderState *state)
static void XLogReaderInvalReadState(XLogReaderState *state)
#define COPY_HEADER_FIELD(_dst, _size)
bool XLogReaderValidatePageHeader(XLogReaderState *state, XLogRecPtr recptr, char *phdr)
FullTransactionId XLogRecGetFullXid(XLogReaderState *record)
void XLogReaderFree(XLogReaderState *state)
void XLogRecGetBlockTag(XLogReaderState *record, uint8 block_id, RelFileLocator *rlocator, ForkNumber *forknum, BlockNumber *blknum)
static void ResetDecoder(XLogReaderState *state)
bool DecodeXLogRecord(XLogReaderState *state, DecodedXLogRecord *decoded, XLogRecord *record, XLogRecPtr lsn, char **errormsg)
static bool ValidXLogRecord(XLogReaderState *state, XLogRecord *record, XLogRecPtr recptr)
#define DEFAULT_DECODE_BUFFER_SIZE
size_t DecodeXLogRecordRequiredSpace(size_t xl_tot_len)
static DecodedXLogRecord * XLogReadRecordAlloc(XLogReaderState *state, size_t xl_tot_len, bool allow_oversized)
XLogRecPtr XLogFindNextRecord(XLogReaderState *state, XLogRecPtr RecPtr)
void XLogBeginRead(XLogReaderState *state, XLogRecPtr RecPtr)
bool RestoreBlockImage(XLogReaderState *record, uint8 block_id, char *page)
XLogRecPtr XLogReleasePreviousRecord(XLogReaderState *state)
static bool ValidXLogRecordHeader(XLogReaderState *state, XLogRecPtr RecPtr, XLogRecPtr PrevRecPtr, XLogRecord *record, bool randAccess)
static bool XLogReaderHasQueuedRecordOrError(XLogReaderState *state)
#define XLogRecGetXid(decoder)
#define XLogRecHasBlockRef(decoder, block_id)
#define BKPIMAGE_COMPRESS_ZSTD
#define BKPBLOCK_FORK_MASK
#define BKPBLOCK_HAS_DATA
#define BKPIMAGE_HAS_HOLE
#define XLR_BLOCK_ID_DATA_LONG
#define BKPIMAGE_COMPRESS_LZ4
#define BKPIMAGE_COMPRESSED(info)
#define XLR_BLOCK_ID_TOPLEVEL_XID
#define XLR_BLOCK_ID_DATA_SHORT
#define BKPBLOCK_SAME_REL
#define BKPIMAGE_COMPRESS_PGLZ
#define XLR_BLOCK_ID_ORIGIN
#define BKPBLOCK_HAS_IMAGE