PostgreSQL Source Code git master
Loading...
Searching...
No Matches
rewriteheap.h File Reference
#include "access/htup.h"
#include "storage/itemptr.h"
#include "storage/relfilelocator.h"
#include "utils/relcache.h"
Include dependency graph for rewriteheap.h:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Data Structures

struct  LogicalRewriteMappingData
 

Macros

#define LOGICAL_REWRITE_FORMAT   "map-%x-%x-%X_%X-%x-%x"
 

Typedefs

typedef struct RewriteStateDataRewriteState
 
typedef struct LogicalRewriteMappingData LogicalRewriteMappingData
 

Functions

RewriteState begin_heap_rewrite (Relation old_heap, Relation new_heap, TransactionId oldest_xmin, TransactionId freeze_xid, MultiXactId cutoff_multi)
 
void end_heap_rewrite (RewriteState state)
 
void rewrite_heap_tuple (RewriteState state, HeapTuple old_tuple, HeapTuple new_tuple)
 
bool rewrite_heap_dead_tuple (RewriteState state, HeapTuple old_tuple)
 
void CheckPointLogicalRewriteHeap (void)
 

Macro Definition Documentation

◆ LOGICAL_REWRITE_FORMAT

#define LOGICAL_REWRITE_FORMAT   "map-%x-%x-%X_%X-%x-%x"

Definition at line 54 of file rewriteheap.h.

Typedef Documentation

◆ LogicalRewriteMappingData

◆ RewriteState

Function Documentation

◆ begin_heap_rewrite()

RewriteState begin_heap_rewrite ( Relation  old_heap,
Relation  new_heap,
TransactionId  oldest_xmin,
TransactionId  freeze_xid,
MultiXactId  cutoff_multi 
)
extern

Definition at line 234 of file rewriteheap.c.

236{
241
242 /*
243 * To ease cleanup, make a separate context that will contain the
244 * RewriteState struct itself plus all subsidiary data.
245 */
247 "Table rewrite",
250
251 /* Create and fill in the state struct */
253
254 state->rs_old_rel = old_heap;
255 state->rs_new_rel = new_heap;
256 state->rs_buffer = NULL;
257 /* new_heap needn't be empty, just locked */
259 state->rs_oldest_xmin = oldest_xmin;
260 state->rs_freeze_xid = freeze_xid;
261 state->rs_cutoff_multi = cutoff_multi;
262 state->rs_cxt = rw_cxt;
264
265 /* Initialize hash tables used to track update chains */
266 hash_ctl.keysize = sizeof(TidHashKey);
267 hash_ctl.entrysize = sizeof(UnresolvedTupData);
268 hash_ctl.hcxt = state->rs_cxt;
269
270 state->rs_unresolved_tups =
271 hash_create("Rewrite / Unresolved ctids",
272 128, /* arbitrary initial size */
273 &hash_ctl,
275
276 hash_ctl.entrysize = sizeof(OldToNewMappingData);
277
278 state->rs_old_new_tid_map =
279 hash_create("Rewrite / Old to new tid map",
280 128, /* arbitrary initial size */
281 &hash_ctl,
283
285
287
288 return state;
289}
#define RelationGetNumberOfBlocks(reln)
Definition bufmgr.h:307
BulkWriteState * smgr_bulk_start_rel(Relation rel, ForkNumber forknum)
Definition bulk_write.c:87
HTAB * hash_create(const char *tabname, int64 nelem, const HASHCTL *info, int flags)
Definition dynahash.c:358
#define palloc0_object(type)
Definition fe_memutils.h:75
#define HASH_CONTEXT
Definition hsearch.h:102
#define HASH_ELEM
Definition hsearch.h:95
#define HASH_BLOBS
Definition hsearch.h:97
MemoryContext CurrentMemoryContext
Definition mcxt.c:160
#define AllocSetContextCreate
Definition memutils.h:129
#define ALLOCSET_DEFAULT_SIZES
Definition memutils.h:160
static MemoryContext MemoryContextSwitchTo(MemoryContext context)
Definition palloc.h:124
static int fb(int x)
@ MAIN_FORKNUM
Definition relpath.h:58
static void logical_begin_heap_rewrite(RewriteState state)

References ALLOCSET_DEFAULT_SIZES, AllocSetContextCreate, CurrentMemoryContext, fb(), HASH_BLOBS, HASH_CONTEXT, hash_create(), HASH_ELEM, logical_begin_heap_rewrite(), MAIN_FORKNUM, MemoryContextSwitchTo(), palloc0_object, RelationGetNumberOfBlocks, and smgr_bulk_start_rel().

Referenced by heapam_relation_copy_for_cluster().

◆ CheckPointLogicalRewriteHeap()

void CheckPointLogicalRewriteHeap ( void  )
extern

Definition at line 1157 of file rewriteheap.c.

1158{
1159 XLogRecPtr cutoff;
1160 XLogRecPtr redo;
1162 struct dirent *mapping_de;
1163 char path[MAXPGPATH + sizeof(PG_LOGICAL_MAPPINGS_DIR)];
1164
1165 /*
1166 * We start of with a minimum of the last redo pointer. No new decoding
1167 * slot will start before that, so that's a safe upper bound for removal.
1168 */
1169 redo = GetRedoRecPtr();
1170
1171 /* now check for the restart ptrs from existing slots */
1173
1174 /* don't start earlier than the restart lsn */
1175 if (XLogRecPtrIsValid(cutoff) && redo < cutoff)
1176 cutoff = redo;
1177
1180 {
1181 Oid dboid;
1182 Oid relid;
1183 XLogRecPtr lsn;
1186 uint32 hi,
1187 lo;
1189
1190 if (strcmp(mapping_de->d_name, ".") == 0 ||
1191 strcmp(mapping_de->d_name, "..") == 0)
1192 continue;
1193
1194 snprintf(path, sizeof(path), "%s/%s", PG_LOGICAL_MAPPINGS_DIR, mapping_de->d_name);
1195 de_type = get_dirent_type(path, mapping_de, false, DEBUG1);
1196
1198 continue;
1199
1200 /* Skip over files that cannot be ours. */
1201 if (strncmp(mapping_de->d_name, "map-", 4) != 0)
1202 continue;
1203
1205 &dboid, &relid, &hi, &lo, &rewrite_xid, &create_xid) != 6)
1206 elog(ERROR, "could not parse filename \"%s\"", mapping_de->d_name);
1207
1208 lsn = ((uint64) hi) << 32 | lo;
1209
1210 if (lsn < cutoff || !XLogRecPtrIsValid(cutoff))
1211 {
1212 elog(DEBUG1, "removing logical rewrite file \"%s\"", path);
1213 if (unlink(path) < 0)
1214 ereport(ERROR,
1216 errmsg("could not remove file \"%s\": %m", path)));
1217 }
1218 else
1219 {
1220 /* on some operating systems fsyncing a file requires O_RDWR */
1221 int fd = OpenTransientFile(path, O_RDWR | PG_BINARY);
1222
1223 /*
1224 * The file cannot vanish due to concurrency since this function
1225 * is the only one removing logical mappings and only one
1226 * checkpoint can be in progress at a time.
1227 */
1228 if (fd < 0)
1229 ereport(ERROR,
1231 errmsg("could not open file \"%s\": %m", path)));
1232
1233 /*
1234 * We could try to avoid fsyncing files that either haven't
1235 * changed or have only been created since the checkpoint's start,
1236 * but it's currently not deemed worth the effort.
1237 */
1239 if (pg_fsync(fd) != 0)
1242 errmsg("could not fsync file \"%s\": %m", path)));
1244
1245 if (CloseTransientFile(fd) != 0)
1246 ereport(ERROR,
1248 errmsg("could not close file \"%s\": %m", path)));
1249 }
1250 }
1252
1253 /* persist directory entries to disk */
1255}
#define PG_BINARY
Definition c.h:1287
uint64_t uint64
Definition c.h:547
uint32_t uint32
Definition c.h:546
uint32 TransactionId
Definition c.h:666
int errcode_for_file_access(void)
Definition elog.c:886
int errmsg(const char *fmt,...)
Definition elog.c:1080
#define DEBUG1
Definition elog.h:30
#define ERROR
Definition elog.h:39
#define elog(elevel,...)
Definition elog.h:226
#define ereport(elevel,...)
Definition elog.h:150
int FreeDir(DIR *dir)
Definition fd.c:3005
int CloseTransientFile(int fd)
Definition fd.c:2851
void fsync_fname(const char *fname, bool isdir)
Definition fd.c:753
int data_sync_elevel(int elevel)
Definition fd.c:3982
DIR * AllocateDir(const char *dirname)
Definition fd.c:2887
struct dirent * ReadDir(DIR *dir, const char *dirname)
Definition fd.c:2953
int pg_fsync(int fd)
Definition fd.c:386
int OpenTransientFile(const char *fileName, int fileFlags)
Definition fd.c:2674
PGFileType get_dirent_type(const char *path, const struct dirent *de, bool look_through_symlinks, int elevel)
Definition file_utils.c:547
PGFileType
Definition file_utils.h:19
@ PGFILETYPE_REG
Definition file_utils.h:22
@ PGFILETYPE_ERROR
Definition file_utils.h:20
#define MAXPGPATH
#define snprintf
Definition port.h:260
unsigned int Oid
static int fd(const char *x, int i)
#define PG_LOGICAL_MAPPINGS_DIR
#define LOGICAL_REWRITE_FORMAT
Definition rewriteheap.h:54
XLogRecPtr ReplicationSlotsComputeLogicalRestartLSN(void)
Definition slot.c:1367
Definition dirent.c:26
static void pgstat_report_wait_start(uint32 wait_event_info)
Definition wait_event.h:69
static void pgstat_report_wait_end(void)
Definition wait_event.h:85
XLogRecPtr GetRedoRecPtr(void)
Definition xlog.c:6563
#define XLogRecPtrIsValid(r)
Definition xlogdefs.h:29
uint64 XLogRecPtr
Definition xlogdefs.h:21

References AllocateDir(), CloseTransientFile(), data_sync_elevel(), DEBUG1, elog, ereport, errcode_for_file_access(), errmsg(), ERROR, fb(), fd(), FreeDir(), fsync_fname(), get_dirent_type(), GetRedoRecPtr(), LOGICAL_REWRITE_FORMAT, MAXPGPATH, OpenTransientFile(), PG_BINARY, pg_fsync(), PG_LOGICAL_MAPPINGS_DIR, PGFILETYPE_ERROR, PGFILETYPE_REG, pgstat_report_wait_end(), pgstat_report_wait_start(), ReadDir(), ReplicationSlotsComputeLogicalRestartLSN(), snprintf, and XLogRecPtrIsValid.

Referenced by CheckPointGuts().

◆ end_heap_rewrite()

void end_heap_rewrite ( RewriteState  state)
extern

Definition at line 297 of file rewriteheap.c.

298{
301
302 /*
303 * Write any remaining tuples in the UnresolvedTups table. If we have any
304 * left, they should in fact be dead, but let's err on the safe side.
305 */
306 hash_seq_init(&seq_status, state->rs_unresolved_tups);
307
309 {
310 ItemPointerSetInvalid(&unresolved->tuple->t_data->t_ctid);
312 }
313
314 /* Write the last page, if any */
315 if (state->rs_buffer)
316 {
317 smgr_bulk_write(state->rs_bulkstate, state->rs_blockno, state->rs_buffer, true);
318 state->rs_buffer = NULL;
319 }
320
321 smgr_bulk_finish(state->rs_bulkstate);
322
324
325 /* Deleting the context frees everything */
326 MemoryContextDelete(state->rs_cxt);
327}
void smgr_bulk_write(BulkWriteState *bulkstate, BlockNumber blocknum, BulkWriteBuffer buf, bool page_std)
Definition bulk_write.c:323
void smgr_bulk_finish(BulkWriteState *bulkstate)
Definition bulk_write.c:130
void * hash_seq_search(HASH_SEQ_STATUS *status)
Definition dynahash.c:1415
void hash_seq_init(HASH_SEQ_STATUS *status, HTAB *hashp)
Definition dynahash.c:1380
static void ItemPointerSetInvalid(ItemPointerData *pointer)
Definition itemptr.h:184
void MemoryContextDelete(MemoryContext context)
Definition mcxt.c:472
static void raw_heap_insert(RewriteState state, HeapTuple tup)
static void logical_end_heap_rewrite(RewriteState state)

References fb(), hash_seq_init(), hash_seq_search(), ItemPointerSetInvalid(), logical_end_heap_rewrite(), MemoryContextDelete(), raw_heap_insert(), smgr_bulk_finish(), and smgr_bulk_write().

Referenced by heapam_relation_copy_for_cluster().

◆ rewrite_heap_dead_tuple()

bool rewrite_heap_dead_tuple ( RewriteState  state,
HeapTuple  old_tuple 
)
extern

Definition at line 546 of file rewriteheap.c.

547{
548 /*
549 * If we have already seen an earlier tuple in the update chain that
550 * points to this tuple, let's forget about that earlier tuple. It's in
551 * fact dead as well, our simple xmax < OldestXmin test in
552 * HeapTupleSatisfiesVacuum just wasn't enough to detect it. It happens
553 * when xmin of a tuple is greater than xmax, which sounds
554 * counter-intuitive but is perfectly valid.
555 *
556 * We don't bother to try to detect the situation the other way round,
557 * when we encounter the dead tuple first and then the recently dead one
558 * that points to it. If that happens, we'll have some unmatched entries
559 * in the UnresolvedTups hash table at the end. That can happen anyway,
560 * because a vacuum might have removed the dead tuple in the chain before
561 * us.
562 */
565 bool found;
566
567 memset(&hashkey, 0, sizeof(hashkey));
569 hashkey.tid = old_tuple->t_self;
570
571 unresolved = hash_search(state->rs_unresolved_tups, &hashkey,
572 HASH_FIND, NULL);
573
574 if (unresolved != NULL)
575 {
576 /* Need to free the contained tuple as well as the hashtable entry */
578 hash_search(state->rs_unresolved_tups, &hashkey,
579 HASH_REMOVE, &found);
580 Assert(found);
581 return true;
582 }
583
584 return false;
585}
#define Assert(condition)
Definition c.h:873
void * hash_search(HTAB *hashp, const void *keyPtr, HASHACTION action, bool *foundPtr)
Definition dynahash.c:952
void heap_freetuple(HeapTuple htup)
Definition heaptuple.c:1435
@ HASH_FIND
Definition hsearch.h:113
@ HASH_REMOVE
Definition hsearch.h:115
static TransactionId HeapTupleHeaderGetXmin(const HeapTupleHeaderData *tup)

References Assert, fb(), HASH_FIND, HASH_REMOVE, hash_search(), heap_freetuple(), and HeapTupleHeaderGetXmin().

Referenced by heapam_relation_copy_for_cluster().

◆ rewrite_heap_tuple()

void rewrite_heap_tuple ( RewriteState  state,
HeapTuple  old_tuple,
HeapTuple  new_tuple 
)
extern

Definition at line 341 of file rewriteheap.c.

343{
345 ItemPointerData old_tid;
347 bool found;
348 bool free_new;
349
351
352 /*
353 * Copy the original tuple's visibility information into new_tuple.
354 *
355 * XXX we might later need to copy some t_infomask2 bits, too? Right now,
356 * we intentionally clear the HOT status bits.
357 */
358 memcpy(&new_tuple->t_data->t_choice.t_heap,
359 &old_tuple->t_data->t_choice.t_heap,
360 sizeof(HeapTupleFields));
361
362 new_tuple->t_data->t_infomask &= ~HEAP_XACT_MASK;
363 new_tuple->t_data->t_infomask2 &= ~HEAP2_XACT_MASK;
364 new_tuple->t_data->t_infomask |=
365 old_tuple->t_data->t_infomask & HEAP_XACT_MASK;
366
367 /*
368 * While we have our hands on the tuple, we may as well freeze any
369 * eligible xmin or xmax, so that future VACUUM effort can be saved.
370 */
372 state->rs_old_rel->rd_rel->relfrozenxid,
373 state->rs_old_rel->rd_rel->relminmxid,
374 state->rs_freeze_xid,
375 state->rs_cutoff_multi);
376
377 /*
378 * Invalid ctid means that ctid should point to the tuple itself. We'll
379 * override it later if the tuple is part of an update chain.
380 */
381 ItemPointerSetInvalid(&new_tuple->t_data->t_ctid);
382
383 /*
384 * If the tuple has been updated, check the old-to-new mapping hash table.
385 *
386 * Note that this check relies on the HeapTupleSatisfiesVacuum() in
387 * heapam_relation_copy_for_cluster() to have set hint bits.
388 */
389 if (!((old_tuple->t_data->t_infomask & HEAP_XMAX_INVALID) ||
392 !(ItemPointerEquals(&(old_tuple->t_self),
393 &(old_tuple->t_data->t_ctid))))
394 {
396
397 memset(&hashkey, 0, sizeof(hashkey));
399 hashkey.tid = old_tuple->t_data->t_ctid;
400
402 hash_search(state->rs_old_new_tid_map, &hashkey,
403 HASH_FIND, NULL);
404
405 if (mapping != NULL)
406 {
407 /*
408 * We've already copied the tuple that t_ctid points to, so we can
409 * set the ctid of this tuple to point to the new location, and
410 * insert it right away.
411 */
412 new_tuple->t_data->t_ctid = mapping->new_tid;
413
414 /* We don't need the mapping entry anymore */
415 hash_search(state->rs_old_new_tid_map, &hashkey,
416 HASH_REMOVE, &found);
417 Assert(found);
418 }
419 else
420 {
421 /*
422 * We haven't seen the tuple t_ctid points to yet. Stash this
423 * tuple into unresolved_tups to be written later.
424 */
426
427 unresolved = hash_search(state->rs_unresolved_tups, &hashkey,
428 HASH_ENTER, &found);
429 Assert(!found);
430
431 unresolved->old_tid = old_tuple->t_self;
433
434 /*
435 * We can't do anything more now, since we don't know where the
436 * tuple will be written.
437 */
439 return;
440 }
441 }
442
443 /*
444 * Now we will write the tuple, and then check to see if it is the B tuple
445 * in any new or known pair. When we resolve a known pair, we will be
446 * able to write that pair's A tuple, and then we have to check if it
447 * resolves some other pair. Hence, we need a loop here.
448 */
449 old_tid = old_tuple->t_self;
450 free_new = false;
451
452 for (;;)
453 {
454 ItemPointerData new_tid;
455
456 /* Insert the tuple and find out where it's put in new_heap */
458 new_tid = new_tuple->t_self;
459
461
462 /*
463 * If the tuple is the updated version of a row, and the prior version
464 * wouldn't be DEAD yet, then we need to either resolve the prior
465 * version (if it's waiting in rs_unresolved_tups), or make an entry
466 * in rs_old_new_tid_map (so we can resolve it when we do see it). The
467 * previous tuple's xmax would equal this one's xmin, so it's
468 * RECENTLY_DEAD if and only if the xmin is not before OldestXmin.
469 */
470 if ((new_tuple->t_data->t_infomask & HEAP_UPDATED) &&
472 state->rs_oldest_xmin))
473 {
474 /*
475 * Okay, this is B in an update pair. See if we've seen A.
476 */
478
479 memset(&hashkey, 0, sizeof(hashkey));
481 hashkey.tid = old_tid;
482
483 unresolved = hash_search(state->rs_unresolved_tups, &hashkey,
484 HASH_FIND, NULL);
485
486 if (unresolved != NULL)
487 {
488 /*
489 * We have seen and memorized the previous tuple already. Now
490 * that we know where we inserted the tuple its t_ctid points
491 * to, fix its t_ctid and insert it to the new heap.
492 */
493 if (free_new)
495 new_tuple = unresolved->tuple;
496 free_new = true;
497 old_tid = unresolved->old_tid;
498 new_tuple->t_data->t_ctid = new_tid;
499
500 /*
501 * We don't need the hash entry anymore, but don't free its
502 * tuple just yet.
503 */
504 hash_search(state->rs_unresolved_tups, &hashkey,
505 HASH_REMOVE, &found);
506 Assert(found);
507
508 /* loop back to insert the previous tuple in the chain */
509 continue;
510 }
511 else
512 {
513 /*
514 * Remember the new tid of this tuple. We'll use it to set the
515 * ctid when we find the previous tuple in the chain.
516 */
518
519 mapping = hash_search(state->rs_old_new_tid_map, &hashkey,
520 HASH_ENTER, &found);
521 Assert(!found);
522
523 mapping->new_tid = new_tid;
524 }
525 }
526
527 /* Done with this (chain of) tuples, for now */
528 if (free_new)
530 break;
531 }
532
534}
bool heap_freeze_tuple(HeapTupleHeader tuple, TransactionId relfrozenxid, TransactionId relminmxid, TransactionId FreezeLimit, TransactionId MultiXactCutoff)
Definition heapam.c:7482
bool HeapTupleHeaderIsOnlyLocked(HeapTupleHeader tuple)
HeapTuple heap_copytuple(HeapTuple tuple)
Definition heaptuple.c:778
@ HASH_ENTER
Definition hsearch.h:114
#define HEAP_XACT_MASK
static bool HeapTupleHeaderIndicatesMovedPartitions(const HeapTupleHeaderData *tup)
#define HEAP_XMAX_INVALID
static TransactionId HeapTupleHeaderGetUpdateXid(const HeapTupleHeaderData *tup)
#define HEAP_UPDATED
bool ItemPointerEquals(const ItemPointerData *pointer1, const ItemPointerData *pointer2)
Definition itemptr.c:35
static void logical_rewrite_heap_tuple(RewriteState state, ItemPointerData old_tid, HeapTuple new_tuple)
OldToNewMappingData * OldToNewMapping
static bool TransactionIdPrecedes(TransactionId id1, TransactionId id2)
Definition transam.h:263

References Assert, fb(), HASH_ENTER, HASH_FIND, HASH_REMOVE, hash_search(), heap_copytuple(), heap_freetuple(), heap_freeze_tuple(), HEAP_UPDATED, HEAP_XACT_MASK, HEAP_XMAX_INVALID, HeapTupleHeaderGetUpdateXid(), HeapTupleHeaderGetXmin(), HeapTupleHeaderIndicatesMovedPartitions(), HeapTupleHeaderIsOnlyLocked(), ItemPointerEquals(), ItemPointerSetInvalid(), logical_rewrite_heap_tuple(), MemoryContextSwitchTo(), raw_heap_insert(), and TransactionIdPrecedes().

Referenced by reform_and_rewrite_tuple().