36#include "catalog/pg_opfamily_d.h"
55#define InvalidBtreeLevel ((uint32) InvalidBlockNumber)
56#define BTreeTupleGetNKeyAtts(itup, rel) \
57 Min(IndexRelationGetNumberOfKeyAttributes(rel), BTreeTupleGetNAtts(itup, rel))
180 void *
state,
bool readonly);
182 bool heapkeyspace,
bool readonly,
bool heapallindexed,
183 bool rootdescend,
bool checkunique);
214 bool tupleIsAlive,
void *checkstate);
257 args.heapallindexed =
false;
258 args.rootdescend =
false;
259 args.parentcheck =
false;
260 args.checkunique =
false;
289 args.heapallindexed =
false;
290 args.rootdescend =
false;
291 args.parentcheck =
true;
292 args.checkunique =
false;
321 errmsg(
"index \"%s\" lacks a main relation fork",
326 if (allequalimage && !heapkeyspace)
329 errmsg(
"index \"%s\" metapage has equalimage field set on unsupported nbtree version",
344 errmsg(
"index \"%s\" metapage incorrectly indicates that deduplication is safe",
347 ?
errhint(
"This is known of \"interval\" indexes last built on a version predating 2023-11.")
353 args->heapallindexed, args->rootdescend, args->checkunique);
381 bool readonly,
bool heapallindexed,
bool rootdescend,
391 elog(
DEBUG1,
"verifying consistency of tree structure for index \"%s\"",
394 elog(
DEBUG1,
"verifying consistency of tree structure for index \"%s\" with cross-level checks",
408 state->heaprel = heaprel;
409 state->heapkeyspace = heapkeyspace;
410 state->readonly = readonly;
411 state->heapallindexed = heapallindexed;
412 state->rootdescend = rootdescend;
413 state->checkunique = checkunique;
416 if (
state->heapallindexed)
436 state->heaptuplespresent = 0;
461 state->snapshot->xmin))
464 errmsg(
"index \"%s\" cannot be verified using transaction snapshot",
473 if (
state->checkunique)
482 if (
state->rootdescend && !
state->heapkeyspace)
485 errmsg(
"cannot verify that tuples from index \"%s\" can each be found by an independent index search",
487 errhint(
"Only B-Tree version 4 indexes support rootdescend verification.")));
512 errdetail_internal(
"Fast root block %u (level %u) differs from true root block %u (level %u).",
536 errmsg(
"index \"%s\" has no valid pages on level below %u or first level",
545 if (
state->heapallindexed)
586 elog(
DEBUG1,
"verifying that tuples from index \"%s\" are present in \"%s\"",
647 " (true root level)" : level.
level == 0 ?
" (leaf level)" :
"");
650 state->previncompletesplit =
false;
658 state->targetblock = current;
680 errmsg(
"downlink or sibling link points to deleted block in index \"%s\"",
688 errmsg(
"block %u fell off the end of index \"%s\"",
711 errmsg(
"block %u is not leftmost in index \"%s\"",
717 errmsg(
"block %u is not true root in index \"%s\"",
778 errmsg(
"leftmost down link for level points to block in index \"%s\" whose level is not one level down",
780 errdetail_internal(
"Block pointed to=%u expected level=%u level in pointed to block=%u.",
792 errmsg(
"circular link chain found in block %u of index \"%s\"",
837 while (current !=
P_NONE);
861 tid,
state->snapshot, slot);
896 if (
lVis->postingIndex >= 0)
904 errmsg(
"index uniqueness is violated for index \"%s\"",
906 errdetail(
"Index %s%s and%s%s (point to heap %s and %s) page lsn=%X/%08X.",
950 lVis->blkno = targetblock;
951 lVis->offset = offset;
952 lVis->postingIndex =
i;
977 lVis->blkno = targetblock;
978 lVis->offset = offset;
980 lVis->postingIndex = -1;
986 lVis->blkno != targetblock)
990 if (
lVis->postingIndex >= 0)
994 errmsg(
"index uniqueness can not be checked for index tid=(%u,%u) in index \"%s\"",
997 errdetail(
"It doesn't have visible heap tids and key is equal to the tid=(%u,%u)%s (points to heap tid=(%u,%u)).",
1001 errhint(
"VACUUM the table and repeat the check.")));
1049 errmsg_internal(
"harmless interrupted page deletion detected in index \"%s\"",
1108 if (!
state->readonly)
1142 state->checkstrategy);
1175 errmsg_internal(
"harmless concurrent page split detected in index \"%s\"",
1179 state->targetblock)));
1195 errmsg(
"left link/right link pair in index \"%s\" not in agreement",
1253 elog(
DEBUG2,
"verifying %u items on %s block %u", max,
1274 errmsg(
"wrong number of high key index tuple attributes in index \"%s\"",
1310 state->target, offset);
1323 errmsg(
"index tuple size does not equal lp_len in index \"%s\"",
1326 state->targetblock, offset,
1329 errhint(
"This could be a torn page problem.")));
1347 errmsg(
"wrong number of index tuple attributes in index \"%s\"",
1397 errmsg(
"could not find tuple using search from root page in index \"%s\"",
1426 errmsg_internal(
"posting list contains misplaced TID in index \"%s\"",
1479 errmsg(
"index row size %zu exceeds maximum for index \"%s\"",
1567 scantid =
skey->scantid;
1586 errmsg(
"high key invariant violated for index \"%s\"",
1595 skey->scantid = scantid;
1632 errmsg(
"item order invariant violated for index \"%s\"",
1634 errdetail_internal(
"Lower index tid=%s (points to %s tid=%s) higher index tid=%s (points to %s tid=%s) page lsn=%X/%08X.",
1650 if (
state->checkunique &&
state->indexinfo->ii_Unique &&
1659 if (
state->checkunique &&
state->indexinfo->ii_Unique &&
1663 scantid =
skey->scantid;
1685 lVis.postingIndex = -1;
1693 skey->scantid = scantid;
1733 if (!
state->readonly)
1749 errmsg(
"cross page item order invariant violated for index \"%s\"",
1752 state->targetblock, offset,
1760 if (
state->checkunique &&
state->indexinfo->ii_Unique &&
1765 elog(
DEBUG2,
"check cross page unique condition");
1802 errmsg(
"right block of leaf block is non-leaf for index \"%s\"",
1924 errmsg_internal(
"level %u sibling page in block %u of index \"%s\" was found deleted or half dead",
1926 errdetail_internal(
"Deleted page found when building scankey from right sibling.")));
2201 state->previncompletesplit =
false;
2209 errmsg(
"can't traverse from downlink %u to downlink %u of index \"%s\"",
2210 state->prevrightlink, downlink,
2226 errmsg(
"the first child of leftmost target page is not leftmost of its level in index \"%s\"",
2229 state->targetblock, blkno,
2237 errmsg(
"block found while following rightlinks from child of index \"%s\" has invalid level",
2239 errdetail_internal(
"Block pointed to=%u expected level=%u level in pointed to block=%u.",
2243 if ((!first && blkno ==
state->prevrightlink) || blkno == opaque->
btpo_prev)
2246 errmsg(
"circular link chain found in block %u of index \"%s\"",
2249 if (blkno != downlink && !
P_IGNORE(opaque))
2293 if (blkno == downlink)
2312 errmsg(
"child high key is greater than rightmost pivot key on target level in index \"%s\"",
2315 state->targetblock, blkno,
2342 errmsg(
"can't find left sibling high key in index \"%s\"",
2345 state->targetblock, blkno,
2347 itup =
state->lowkey;
2354 errmsg(
"mismatch between parent key and child high key in index \"%s\"",
2357 state->targetblock, blkno,
2363 if (blkno == downlink)
2407 state->target, downlinkoffnum);
2494 errmsg(
"downlink to deleted page found in index \"%s\"",
2535 errmsg(
"down-link lower bound invariant violated for index \"%s\"",
2537 errdetail_internal(
"Parent block=%u child index tid=(%u,%u) parent page lsn=%X/%08X.",
2605 errmsg_internal(
"harmless interrupted page split detected in index \"%s\"",
2627 errmsg(
"leaf index block lacks downlink in index \"%s\"",
2634 elog(
DEBUG1,
"checking for interrupted multi-level deletion due to missing downlink in index \"%s\"",
2652 if (
copaque->btpo_level != level - 1)
2655 errmsg_internal(
"downlink points to block in index \"%s\" whose level is not one level down",
2657 errdetail_internal(
"Top parent/under check block=%u block pointed to=%u expected level=%u level in pointed to block=%u.",
2659 level - 1,
copaque->btpo_level)));
2693 errmsg_internal(
"downlink to deleted leaf page found in index \"%s\"",
2695 errdetail_internal(
"Top parent/target block=%u leaf block=%u top parent/under check lsn=%X/%08X.",
2719 errmsg(
"internal index block lacks downlink in index \"%s\"",
2801 errmsg(
"heap tuple (%u,%u) from table \"%s\" lacks matching index tuple within index \"%s\"",
2807 ?
errhint(
"Retrying verification using the function bt_index_parent_check() might provide a more specific error.")
2810 state->heaptuplespresent++;
2878 if (att->attbyval || att->attlen != -1 || isnull[
i])
2889 errmsg(
"external varlena datum in tuple that references heap row (%u,%u) in index \"%s\"",
3018 Assert(key->heapkeyspace && key->scantid !=
NULL);
3114 Assert(!key->nextkey && key->backward);
3120 if (!key->heapkeyspace)
3176 Assert(!key->nextkey && key->backward);
3199 Assert(!key->nextkey && key->backward);
3204 if (!key->heapkeyspace)
3237 Assert(!key->nextkey && key->backward);
3245 if (!key->heapkeyspace)
3304 state->checkstrategy);
3322 errmsg(
"invalid meta page found at block %u in index \"%s\"",
3334 errmsg(
"index \"%s\" meta page is corrupt",
3341 errmsg(
"version mismatch in index \"%s\": file version %d, "
3342 "current version %d, minimum supported version %d",
3363 errmsg_internal(
"invalid leaf page level %u for block %u in index \"%s\"",
3370 errmsg_internal(
"invalid internal page level 0 for block %u in index \"%s\"",
3398 errmsg(
"Number of items on block %u of index \"%s\" exceeds MaxIndexTuplesPerPage (%u)",
3405 errmsg(
"internal block %u in index \"%s\" lacks high key and/or at least one downlink",
3411 errmsg(
"non-rightmost leaf block %u in index \"%s\" lacks high key item",
3424 errmsg(
"internal page block %u in index \"%s\" is half-dead",
3426 errhint(
"This can be caused by an interrupted VACUUM in version 9.3 or older, before upgrade. Please REINDEX it.")));
3435 errmsg_internal(
"internal page block %u in index \"%s\" has garbage items",
3441 errmsg_internal(
"full transaction id page flag appears in non-deleted block %u in index \"%s\"",
3473 skey->backward =
true;
3501 errmsg(
"line pointer points past end of tuple space in index \"%s\"",
3517 errmsg(
"invalid line pointer storage in index \"%s\"",
3546 errmsg_internal(
"block %u or its right sibling block or child block in index \"%s\" has unexpected pivot tuple",
3553 errmsg_internal(
"block %u or its right sibling block or child block in index \"%s\" has unexpected non-pivot tuple",
3561 errmsg(
"block %u or its right sibling block or child block in index \"%s\" contains non-pivot tuple that lacks a heap TID",
3592 return &itup->
t_tid;
#define InvalidBlockNumber
static bool BlockNumberIsValid(BlockNumber blockNumber)
void bloom_free(bloom_filter *filter)
bloom_filter * bloom_create(int64 total_elems, int bloom_work_mem, uint64 seed)
double bloom_prop_bits_set(bloom_filter *filter)
bool bloom_lacks_element(bloom_filter *filter, unsigned char *elem, size_t len)
void bloom_add_element(bloom_filter *filter, unsigned char *elem, size_t len)
static Datum values[MAXATTR]
void UnlockReleaseBuffer(Buffer buffer)
Buffer ReadBufferExtended(Relation reln, ForkNumber forkNum, BlockNumber blockNum, ReadBufferMode mode, BufferAccessStrategy strategy)
#define RelationGetNumberOfBlocks(reln)
static Page BufferGetPage(Buffer buffer)
static void LockBuffer(Buffer buffer, BufferLockMode mode)
static bool BufferIsValid(Buffer bufnum)
static ItemId PageGetItemId(Page page, OffsetNumber offsetNumber)
static void * PageGetItem(PageData *page, const ItemIdData *itemId)
static XLogRecPtr PageGetLSN(const PageData *page)
static OffsetNumber PageGetMaxOffsetNumber(const PageData *page)
#define Assert(condition)
memcpy(sums, checksumBaseOffsets, sizeof(checksumBaseOffsets))
int errcode(int sqlerrcode)
int int errdetail_internal(const char *fmt,...) pg_attribute_printf(1
int errhint(const char *fmt,...) pg_attribute_printf(1
int errdetail(const char *fmt,...) pg_attribute_printf(1
int int errmsg_internal(const char *fmt,...) pg_attribute_printf(1
#define ereport(elevel,...)
void ExecDropSingleTupleTableSlot(TupleTableSlot *slot)
#define palloc0_object(type)
#define PG_MODULE_MAGIC_EXT(...)
#define PG_FUNCTION_INFO_V1(funcname)
#define PG_DETOAST_DATUM(datum)
#define PG_GETARG_BOOL(n)
BufferAccessStrategy GetAccessStrategy(BufferAccessStrategyType btype)
#define TOAST_INDEX_TARGET
static TransactionId HeapTupleHeaderGetXmin(const HeapTupleHeaderData *tup)
IndexInfo * BuildIndexInfo(Relation index)
IndexTuple index_form_tuple(TupleDesc tupleDescriptor, const Datum *values, const bool *isnull)
#define ItemIdGetLength(itemId)
#define ItemIdGetOffset(itemId)
#define ItemIdIsDead(itemId)
#define ItemIdIsUsed(itemId)
#define ItemIdIsRedirected(itemId)
#define ItemIdGetFlags(itemId)
int32 ItemPointerCompare(const ItemPointerData *arg1, const ItemPointerData *arg2)
static OffsetNumber ItemPointerGetOffsetNumber(const ItemPointerData *pointer)
static OffsetNumber ItemPointerGetOffsetNumberNoCheck(const ItemPointerData *pointer)
static BlockNumber ItemPointerGetBlockNumber(const ItemPointerData *pointer)
static BlockNumber ItemPointerGetBlockNumberNoCheck(const ItemPointerData *pointer)
static void ItemPointerCopy(const ItemPointerData *fromPointer, ItemPointerData *toPointer)
static bool ItemPointerIsValid(const ItemPointerData *pointer)
static bool IndexTupleHasVarwidths(const IndexTupleData *itup)
IndexTupleData * IndexTuple
static Datum index_getattr(IndexTuple tup, int attnum, TupleDesc tupleDesc, bool *isnull)
static Size IndexTupleSize(const IndexTupleData *itup)
#define MaxIndexTuplesPerPage
void * MemoryContextAlloc(MemoryContext context, Size size)
void MemoryContextReset(MemoryContext context)
void pfree(void *pointer)
MemoryContext CurrentMemoryContext
void MemoryContextDelete(MemoryContext context)
#define AllocSetContextCreate
#define ALLOCSET_DEFAULT_SIZES
#define CHECK_FOR_INTERRUPTS()
IndexTuple _bt_form_posting(IndexTuple base, const ItemPointerData *htids, int nhtids)
void _bt_relbuf(Relation rel, Buffer buf)
void _bt_checkpage(Relation rel, Buffer buf)
void _bt_metaversion(Relation rel, bool *heapkeyspace, bool *allequalimage)
#define P_HAS_FULLXID(opaque)
#define P_ISHALFDEAD(opaque)
static uint16 BTreeTupleGetNPosting(IndexTuple posting)
static bool BTreeTupleIsPivot(IndexTuple itup)
#define BTREE_MIN_VERSION
#define P_HAS_GARBAGE(opaque)
#define BTPageGetOpaque(page)
#define P_ISDELETED(opaque)
static BlockNumber BTreeTupleGetTopParent(IndexTuple leafhikey)
#define MaxTIDsPerBTreePage
#define P_FIRSTDATAKEY(opaque)
#define P_RIGHTMOST(opaque)
#define P_INCOMPLETE_SPLIT(opaque)
static ItemPointer BTreeTupleGetPostingN(IndexTuple posting, int n)
static BlockNumber BTreeTupleGetDownLink(IndexTuple pivot)
static ItemPointer BTreeTupleGetMaxHeapTID(IndexTuple itup)
static bool BTreeTupleIsPosting(IndexTuple itup)
#define BTMaxItemSizeNoHeapTid
static ItemPointer BTreeTupleGetHeapTID(IndexTuple itup)
#define BTreeTupleGetNAtts(itup, rel)
OffsetNumber _bt_binsrch_insert(Relation rel, BTInsertState insertstate)
int32 _bt_compare(Relation rel, BTScanInsert key, Page page, OffsetNumber offnum)
BTStack _bt_search(Relation rel, Relation heaprel, BTScanInsert key, Buffer *bufP, int access, bool returnstack)
BTScanInsert _bt_mkscankey(Relation rel, IndexTuple itup)
bool _bt_check_natts(Relation rel, bool heapkeyspace, Page page, OffsetNumber offnum)
bool _bt_allequalimage(Relation rel, bool debugmessage)
#define InvalidOffsetNumber
#define OffsetNumberIsValid(offsetNumber)
#define OffsetNumberNext(offsetNumber)
static MemoryContext MemoryContextSwitchTo(MemoryContext context)
FormData_pg_attribute * Form_pg_attribute
#define ERRCODE_DATA_CORRUPTED
uint64 pg_prng_uint64(pg_prng_state *state)
pg_prng_state pg_global_prng_state
#define ERRCODE_T_R_SERIALIZATION_FAILURE
static Pointer DatumGetPointer(Datum X)
#define PointerGetDatum(X)
char * psprintf(const char *fmt,...)
static int cmp(const chr *x, const chr *y, size_t len)
static SMgrRelation RelationGetSmgr(Relation rel)
#define RelationGetDescr(relation)
#define RelationGetRelationName(relation)
#define IndexRelationGetNumberOfKeyAttributes(relation)
bool smgrexists(SMgrRelation reln, ForkNumber forknum)
Snapshot GetTransactionSnapshot(void)
void UnregisterSnapshot(Snapshot snapshot)
Snapshot RegisterSnapshot(Snapshot snapshot)
BufferAccessStrategy checkstrategy
BlockNumber prevrightlink
MemoryContext targetcontext
uint16 * ii_ExclusionStrats
struct HeapTupleData * rd_indextuple
TupleTableSlot * table_slot_create(Relation relation, List **reglist)
static double table_index_build_scan(Relation table_rel, Relation index_rel, IndexInfo *index_info, bool allow_sync, bool progress, IndexBuildCallback callback, void *callback_state, TableScanDesc scan)
static TableScanDesc table_beginscan_strat(Relation rel, Snapshot snapshot, int nkeys, ScanKeyData *key, bool allow_strat, bool allow_sync)
static bool table_tuple_fetch_row_version(Relation rel, ItemPointer tid, Snapshot snapshot, TupleTableSlot *slot)
#define TransactionIdIsValid(xid)
static bool TransactionIdPrecedes(TransactionId id1, TransactionId id2)
static FormData_pg_attribute * TupleDescAttr(TupleDesc tupdesc, int i)
static Size VARSIZE_ANY(const void *PTR)
static bool VARATT_CAN_MAKE_SHORT(const void *PTR)
static bool VARATT_IS_EXTERNAL(const void *PTR)
static char * VARDATA(const void *PTR)
static Size VARATT_CONVERTED_SHORT_SIZE(const void *PTR)
static bool VARATT_IS_COMPRESSED(const void *PTR)
static void SET_VARSIZE_SHORT(void *PTR, Size len)
void amcheck_lock_relation_and_check(Oid indrelid, Oid am_id, IndexDoCheckCallback check, LOCKMODE lockmode, void *state)
static bool offset_is_negative_infinity(BTPageOpaque opaque, OffsetNumber offset)
static bool bt_leftmost_ignoring_half_dead(BtreeCheckState *state, BlockNumber start, BTPageOpaque start_opaque)
static bool invariant_l_offset(BtreeCheckState *state, BTScanInsert key, OffsetNumber upperbound)
static ItemPointer BTreeTupleGetPointsToTID(IndexTuple itup)
static IndexTuple bt_posting_plain_tuple(IndexTuple itup, int n)
static void bt_target_page_check(BtreeCheckState *state)
static void bt_check_every_level(Relation rel, Relation heaprel, bool heapkeyspace, bool readonly, bool heapallindexed, bool rootdescend, bool checkunique)
static void bt_report_duplicate(BtreeCheckState *state, BtreeLastVisibleEntry *lVis, ItemPointer nexttid, BlockNumber nblock, OffsetNumber noffset, int nposting)
static bool bt_pivot_tuple_identical(bool heapkeyspace, IndexTuple itup1, IndexTuple itup2)
static bool invariant_leq_offset(BtreeCheckState *state, BTScanInsert key, OffsetNumber upperbound)
Datum bt_index_parent_check(PG_FUNCTION_ARGS)
static void bt_child_highkey_check(BtreeCheckState *state, OffsetNumber target_downlinkoffnum, Page loaded_child, uint32 target_level)
static bool heap_entry_is_visible(BtreeCheckState *state, ItemPointer tid)
static BTScanInsert bt_mkscankey_pivotsearch(Relation rel, IndexTuple itup)
Datum bt_index_check(PG_FUNCTION_ARGS)
static BtreeLevel bt_check_level_from_leftmost(BtreeCheckState *state, BtreeLevel level)
static void bt_downlink_missing_check(BtreeCheckState *state, bool rightsplit, BlockNumber blkno, Page page)
static ItemId PageGetItemIdCareful(BtreeCheckState *state, BlockNumber block, Page page, OffsetNumber offset)
static void bt_tuple_present_callback(Relation index, ItemPointer tid, Datum *values, bool *isnull, bool tupleIsAlive, void *checkstate)
static void bt_index_check_callback(Relation indrel, Relation heaprel, void *state, bool readonly)
static bool bt_rootdescend(BtreeCheckState *state, IndexTuple itup)
static BTScanInsert bt_right_page_check_scankey(BtreeCheckState *state, OffsetNumber *rightfirstoffset)
static bool invariant_g_offset(BtreeCheckState *state, BTScanInsert key, OffsetNumber lowerbound)
#define InvalidBtreeLevel
static Page palloc_btree_page(BtreeCheckState *state, BlockNumber blocknum)
static IndexTuple bt_normalize_tuple(BtreeCheckState *state, IndexTuple itup)
static void bt_recheck_sibling_links(BtreeCheckState *state, BlockNumber btpo_prev_from_target, BlockNumber leftcurrent)
static ItemPointer BTreeTupleGetHeapTIDCareful(BtreeCheckState *state, IndexTuple itup, bool nonpivot)
#define BTreeTupleGetNKeyAtts(itup, rel)
static void bt_child_check(BtreeCheckState *state, BTScanInsert targetkey, OffsetNumber downlinkoffnum)
static void bt_entry_unique_check(BtreeCheckState *state, IndexTuple itup, BlockNumber targetblock, OffsetNumber offset, BtreeLastVisibleEntry *lVis)
static bool invariant_l_nontarget_offset(BtreeCheckState *state, BTScanInsert key, BlockNumber nontargetblock, Page nontarget, OffsetNumber upperbound)
#define IsolationUsesXactSnapshot()
#define LSN_FORMAT_ARGS(lsn)