PostgreSQL Source Code  git master
brin.c File Reference
#include "postgres.h"
#include "access/brin.h"
#include "access/brin_page.h"
#include "access/brin_pageops.h"
#include "access/brin_xlog.h"
#include "access/relation.h"
#include "access/reloptions.h"
#include "access/relscan.h"
#include "access/table.h"
#include "access/tableam.h"
#include "access/xloginsert.h"
#include "catalog/index.h"
#include "catalog/pg_am.h"
#include "commands/vacuum.h"
#include "miscadmin.h"
#include "pgstat.h"
#include "postmaster/autovacuum.h"
#include "storage/bufmgr.h"
#include "storage/freespace.h"
#include "tcop/tcopprot.h"
#include "utils/acl.h"
#include "utils/datum.h"
#include "utils/fmgrprotos.h"
#include "utils/guc.h"
#include "utils/index_selfuncs.h"
#include "utils/memutils.h"
#include "utils/rel.h"
#include "utils/tuplesort.h"
Include dependency graph for brin.c:

Go to the source code of this file.

Data Structures

struct  BrinShared
 
struct  BrinLeader
 
struct  BrinBuildState
 
struct  BrinInsertState
 
struct  BrinOpaque
 

Macros

#define PARALLEL_KEY_BRIN_SHARED   UINT64CONST(0xB000000000000001)
 
#define PARALLEL_KEY_TUPLESORT   UINT64CONST(0xB000000000000002)
 
#define PARALLEL_KEY_QUERY_TEXT   UINT64CONST(0xB000000000000003)
 
#define PARALLEL_KEY_WAL_USAGE   UINT64CONST(0xB000000000000004)
 
#define PARALLEL_KEY_BUFFER_USAGE   UINT64CONST(0xB000000000000005)
 
#define ParallelTableScanFromBrinShared(shared)    (ParallelTableScanDesc) ((char *) (shared) + BUFFERALIGN(sizeof(BrinShared)))
 
#define BRIN_ALL_BLOCKRANGES   InvalidBlockNumber
 

Typedefs

typedef struct BrinShared BrinShared
 
typedef struct BrinLeader BrinLeader
 
typedef struct BrinBuildState BrinBuildState
 
typedef struct BrinInsertState BrinInsertState
 
typedef struct BrinOpaque BrinOpaque
 

Functions

static BrinBuildStateinitialize_brin_buildstate (Relation idxRel, BrinRevmap *revmap, BlockNumber pagesPerRange, BlockNumber tablePages)
 
static BrinInsertStateinitialize_brin_insertstate (Relation idxRel, IndexInfo *indexInfo)
 
static void terminate_brin_buildstate (BrinBuildState *state)
 
static void brinsummarize (Relation index, Relation heapRel, BlockNumber pageRange, bool include_partial, double *numSummarized, double *numExisting)
 
static void form_and_insert_tuple (BrinBuildState *state)
 
static void form_and_spill_tuple (BrinBuildState *state)
 
static void union_tuples (BrinDesc *bdesc, BrinMemTuple *a, BrinTuple *b)
 
static void brin_vacuum_scan (Relation idxrel, BufferAccessStrategy strategy)
 
static bool add_values_to_range (Relation idxRel, BrinDesc *bdesc, BrinMemTuple *dtup, const Datum *values, const bool *nulls)
 
static bool check_null_keys (BrinValues *bval, ScanKey *nullkeys, int nnullkeys)
 
static void brin_fill_empty_ranges (BrinBuildState *state, BlockNumber prevRange, BlockNumber nextRange)
 
static void _brin_begin_parallel (BrinBuildState *buildstate, Relation heap, Relation index, bool isconcurrent, int request)
 
static void _brin_end_parallel (BrinLeader *brinleader, BrinBuildState *state)
 
static Size _brin_parallel_estimate_shared (Relation heap, Snapshot snapshot)
 
static double _brin_parallel_heapscan (BrinBuildState *state)
 
static double _brin_parallel_merge (BrinBuildState *state)
 
static void _brin_leader_participate_as_worker (BrinBuildState *buildstate, Relation heap, Relation index)
 
static void _brin_parallel_scan_and_build (BrinBuildState *state, BrinShared *brinshared, Sharedsort *sharedsort, Relation heap, Relation index, int sortmem, bool progress)
 
Datum brinhandler (PG_FUNCTION_ARGS)
 
bool brininsert (Relation idxRel, Datum *values, bool *nulls, ItemPointer heaptid, Relation heapRel, IndexUniqueCheck checkUnique, bool indexUnchanged, IndexInfo *indexInfo)
 
void brininsertcleanup (Relation index, IndexInfo *indexInfo)
 
IndexScanDesc brinbeginscan (Relation r, int nkeys, int norderbys)
 
int64 bringetbitmap (IndexScanDesc scan, TIDBitmap *tbm)
 
void brinrescan (IndexScanDesc scan, ScanKey scankey, int nscankeys, ScanKey orderbys, int norderbys)
 
void brinendscan (IndexScanDesc scan)
 
static void brinbuildCallback (Relation index, ItemPointer tid, Datum *values, bool *isnull, bool tupleIsAlive, void *brstate)
 
static void brinbuildCallbackParallel (Relation index, ItemPointer tid, Datum *values, bool *isnull, bool tupleIsAlive, void *brstate)
 
IndexBuildResultbrinbuild (Relation heap, Relation index, IndexInfo *indexInfo)
 
void brinbuildempty (Relation index)
 
IndexBulkDeleteResultbrinbulkdelete (IndexVacuumInfo *info, IndexBulkDeleteResult *stats, IndexBulkDeleteCallback callback, void *callback_state)
 
IndexBulkDeleteResultbrinvacuumcleanup (IndexVacuumInfo *info, IndexBulkDeleteResult *stats)
 
byteabrinoptions (Datum reloptions, bool validate)
 
Datum brin_summarize_new_values (PG_FUNCTION_ARGS)
 
Datum brin_summarize_range (PG_FUNCTION_ARGS)
 
Datum brin_desummarize_range (PG_FUNCTION_ARGS)
 
BrinDescbrin_build_desc (Relation rel)
 
void brin_free_desc (BrinDesc *bdesc)
 
void brinGetStats (Relation index, BrinStatsData *stats)
 
static void summarize_range (IndexInfo *indexInfo, BrinBuildState *state, Relation heapRel, BlockNumber heapBlk, BlockNumber heapNumBlks)
 
void _brin_parallel_build_main (dsm_segment *seg, shm_toc *toc)
 
static void brin_build_empty_tuple (BrinBuildState *state, BlockNumber blkno)
 

Macro Definition Documentation

◆ BRIN_ALL_BLOCKRANGES

#define BRIN_ALL_BLOCKRANGES   InvalidBlockNumber

Definition at line 206 of file brin.c.

◆ PARALLEL_KEY_BRIN_SHARED

#define PARALLEL_KEY_BRIN_SHARED   UINT64CONST(0xB000000000000001)

Definition at line 47 of file brin.c.

◆ PARALLEL_KEY_BUFFER_USAGE

#define PARALLEL_KEY_BUFFER_USAGE   UINT64CONST(0xB000000000000005)

Definition at line 51 of file brin.c.

◆ PARALLEL_KEY_QUERY_TEXT

#define PARALLEL_KEY_QUERY_TEXT   UINT64CONST(0xB000000000000003)

Definition at line 49 of file brin.c.

◆ PARALLEL_KEY_TUPLESORT

#define PARALLEL_KEY_TUPLESORT   UINT64CONST(0xB000000000000002)

Definition at line 48 of file brin.c.

◆ PARALLEL_KEY_WAL_USAGE

#define PARALLEL_KEY_WAL_USAGE   UINT64CONST(0xB000000000000004)

Definition at line 50 of file brin.c.

◆ ParallelTableScanFromBrinShared

#define ParallelTableScanFromBrinShared (   shared)     (ParallelTableScanDesc) ((char *) (shared) + BUFFERALIGN(sizeof(BrinShared)))

Definition at line 113 of file brin.c.

Typedef Documentation

◆ BrinBuildState

◆ BrinInsertState

◆ BrinLeader

typedef struct BrinLeader BrinLeader

◆ BrinOpaque

typedef struct BrinOpaque BrinOpaque

◆ BrinShared

typedef struct BrinShared BrinShared

Function Documentation

◆ _brin_begin_parallel()

static void _brin_begin_parallel ( BrinBuildState buildstate,
Relation  heap,
Relation  index,
bool  isconcurrent,
int  request 
)
static

Definition at line 2352 of file brin.c.

2354 {
2355  ParallelContext *pcxt;
2356  int scantuplesortstates;
2357  Snapshot snapshot;
2358  Size estbrinshared;
2359  Size estsort;
2360  BrinShared *brinshared;
2361  Sharedsort *sharedsort;
2362  BrinLeader *brinleader = (BrinLeader *) palloc0(sizeof(BrinLeader));
2363  WalUsage *walusage;
2364  BufferUsage *bufferusage;
2365  bool leaderparticipates = true;
2366  int querylen;
2367 
2368 #ifdef DISABLE_LEADER_PARTICIPATION
2369  leaderparticipates = false;
2370 #endif
2371 
2372  /*
2373  * Enter parallel mode, and create context for parallel build of brin
2374  * index
2375  */
2377  Assert(request > 0);
2378  pcxt = CreateParallelContext("postgres", "_brin_parallel_build_main",
2379  request);
2380 
2381  scantuplesortstates = leaderparticipates ? request + 1 : request;
2382 
2383  /*
2384  * Prepare for scan of the base relation. In a normal index build, we use
2385  * SnapshotAny because we must retrieve all tuples and do our own time
2386  * qual checks (because we have to index RECENTLY_DEAD tuples). In a
2387  * concurrent build, we take a regular MVCC snapshot and index whatever's
2388  * live according to that.
2389  */
2390  if (!isconcurrent)
2391  snapshot = SnapshotAny;
2392  else
2394 
2395  /*
2396  * Estimate size for our own PARALLEL_KEY_BRIN_SHARED workspace.
2397  */
2398  estbrinshared = _brin_parallel_estimate_shared(heap, snapshot);
2399  shm_toc_estimate_chunk(&pcxt->estimator, estbrinshared);
2400  estsort = tuplesort_estimate_shared(scantuplesortstates);
2401  shm_toc_estimate_chunk(&pcxt->estimator, estsort);
2402 
2403  shm_toc_estimate_keys(&pcxt->estimator, 2);
2404 
2405  /*
2406  * Estimate space for WalUsage and BufferUsage -- PARALLEL_KEY_WAL_USAGE
2407  * and PARALLEL_KEY_BUFFER_USAGE.
2408  *
2409  * If there are no extensions loaded that care, we could skip this. We
2410  * have no way of knowing whether anyone's looking at pgWalUsage or
2411  * pgBufferUsage, so do it unconditionally.
2412  */
2414  mul_size(sizeof(WalUsage), pcxt->nworkers));
2415  shm_toc_estimate_keys(&pcxt->estimator, 1);
2417  mul_size(sizeof(BufferUsage), pcxt->nworkers));
2418  shm_toc_estimate_keys(&pcxt->estimator, 1);
2419 
2420  /* Finally, estimate PARALLEL_KEY_QUERY_TEXT space */
2421  if (debug_query_string)
2422  {
2423  querylen = strlen(debug_query_string);
2424  shm_toc_estimate_chunk(&pcxt->estimator, querylen + 1);
2425  shm_toc_estimate_keys(&pcxt->estimator, 1);
2426  }
2427  else
2428  querylen = 0; /* keep compiler quiet */
2429 
2430  /* Everyone's had a chance to ask for space, so now create the DSM */
2431  InitializeParallelDSM(pcxt);
2432 
2433  /* If no DSM segment was available, back out (do serial build) */
2434  if (pcxt->seg == NULL)
2435  {
2436  if (IsMVCCSnapshot(snapshot))
2437  UnregisterSnapshot(snapshot);
2438  DestroyParallelContext(pcxt);
2439  ExitParallelMode();
2440  return;
2441  }
2442 
2443  /* Store shared build state, for which we reserved space */
2444  brinshared = (BrinShared *) shm_toc_allocate(pcxt->toc, estbrinshared);
2445  /* Initialize immutable state */
2446  brinshared->heaprelid = RelationGetRelid(heap);
2447  brinshared->indexrelid = RelationGetRelid(index);
2448  brinshared->isconcurrent = isconcurrent;
2449  brinshared->scantuplesortstates = scantuplesortstates;
2450  brinshared->pagesPerRange = buildstate->bs_pagesPerRange;
2451  ConditionVariableInit(&brinshared->workersdonecv);
2452  SpinLockInit(&brinshared->mutex);
2453 
2454  /* Initialize mutable state */
2455  brinshared->nparticipantsdone = 0;
2456  brinshared->reltuples = 0.0;
2457  brinshared->indtuples = 0.0;
2458 
2460  ParallelTableScanFromBrinShared(brinshared),
2461  snapshot);
2462 
2463  /*
2464  * Store shared tuplesort-private state, for which we reserved space.
2465  * Then, initialize opaque state using tuplesort routine.
2466  */
2467  sharedsort = (Sharedsort *) shm_toc_allocate(pcxt->toc, estsort);
2468  tuplesort_initialize_shared(sharedsort, scantuplesortstates,
2469  pcxt->seg);
2470 
2471  /*
2472  * Store shared tuplesort-private state, for which we reserved space.
2473  * Then, initialize opaque state using tuplesort routine.
2474  */
2475  shm_toc_insert(pcxt->toc, PARALLEL_KEY_BRIN_SHARED, brinshared);
2476  shm_toc_insert(pcxt->toc, PARALLEL_KEY_TUPLESORT, sharedsort);
2477 
2478  /* Store query string for workers */
2479  if (debug_query_string)
2480  {
2481  char *sharedquery;
2482 
2483  sharedquery = (char *) shm_toc_allocate(pcxt->toc, querylen + 1);
2484  memcpy(sharedquery, debug_query_string, querylen + 1);
2485  shm_toc_insert(pcxt->toc, PARALLEL_KEY_QUERY_TEXT, sharedquery);
2486  }
2487 
2488  /*
2489  * Allocate space for each worker's WalUsage and BufferUsage; no need to
2490  * initialize.
2491  */
2492  walusage = shm_toc_allocate(pcxt->toc,
2493  mul_size(sizeof(WalUsage), pcxt->nworkers));
2494  shm_toc_insert(pcxt->toc, PARALLEL_KEY_WAL_USAGE, walusage);
2495  bufferusage = shm_toc_allocate(pcxt->toc,
2496  mul_size(sizeof(BufferUsage), pcxt->nworkers));
2497  shm_toc_insert(pcxt->toc, PARALLEL_KEY_BUFFER_USAGE, bufferusage);
2498 
2499  /* Launch workers, saving status for leader/caller */
2500  LaunchParallelWorkers(pcxt);
2501  brinleader->pcxt = pcxt;
2502  brinleader->nparticipanttuplesorts = pcxt->nworkers_launched;
2503  if (leaderparticipates)
2504  brinleader->nparticipanttuplesorts++;
2505  brinleader->brinshared = brinshared;
2506  brinleader->sharedsort = sharedsort;
2507  brinleader->snapshot = snapshot;
2508  brinleader->walusage = walusage;
2509  brinleader->bufferusage = bufferusage;
2510 
2511  /* If no workers were successfully launched, back out (do serial build) */
2512  if (pcxt->nworkers_launched == 0)
2513  {
2514  _brin_end_parallel(brinleader, NULL);
2515  return;
2516  }
2517 
2518  /* Save leader state now that it's clear build will be parallel */
2519  buildstate->bs_leader = brinleader;
2520 
2521  /* Join heap scan ourselves */
2522  if (leaderparticipates)
2523  _brin_leader_participate_as_worker(buildstate, heap, index);
2524 
2525  /*
2526  * Caller needs to wait for all launched workers when we return. Make
2527  * sure that the failure-to-start case will not hang forever.
2528  */
2530 }
void InitializeParallelDSM(ParallelContext *pcxt)
Definition: parallel.c:205
void LaunchParallelWorkers(ParallelContext *pcxt)
Definition: parallel.c:552
void DestroyParallelContext(ParallelContext *pcxt)
Definition: parallel.c:929
ParallelContext * CreateParallelContext(const char *library_name, const char *function_name, int nworkers)
Definition: parallel.c:167
void WaitForParallelWorkersToAttach(ParallelContext *pcxt)
Definition: parallel.c:672
#define PARALLEL_KEY_BUFFER_USAGE
Definition: brin.c:51
#define PARALLEL_KEY_BRIN_SHARED
Definition: brin.c:47
static void _brin_leader_participate_as_worker(BrinBuildState *buildstate, Relation heap, Relation index)
Definition: brin.c:2766
static void _brin_end_parallel(BrinLeader *brinleader, BrinBuildState *state)
Definition: brin.c:2536
static Size _brin_parallel_estimate_shared(Relation heap, Snapshot snapshot)
Definition: brin.c:2755
#define ParallelTableScanFromBrinShared(shared)
Definition: brin.c:113
#define PARALLEL_KEY_TUPLESORT
Definition: brin.c:48
#define PARALLEL_KEY_QUERY_TEXT
Definition: brin.c:49
#define PARALLEL_KEY_WAL_USAGE
Definition: brin.c:50
#define Assert(condition)
Definition: c.h:858
size_t Size
Definition: c.h:605
void ConditionVariableInit(ConditionVariable *cv)
void * palloc0(Size size)
Definition: mcxt.c:1347
const char * debug_query_string
Definition: postgres.c:88
#define RelationGetRelid(relation)
Definition: rel.h:505
void shm_toc_insert(shm_toc *toc, uint64 key, void *address)
Definition: shm_toc.c:171
void * shm_toc_allocate(shm_toc *toc, Size nbytes)
Definition: shm_toc.c:88
#define shm_toc_estimate_chunk(e, sz)
Definition: shm_toc.h:51
#define shm_toc_estimate_keys(e, cnt)
Definition: shm_toc.h:53
Size mul_size(Size s1, Size s2)
Definition: shmem.c:510
Snapshot GetTransactionSnapshot(void)
Definition: snapmgr.c:216
void UnregisterSnapshot(Snapshot snapshot)
Definition: snapmgr.c:836
Snapshot RegisterSnapshot(Snapshot snapshot)
Definition: snapmgr.c:794
#define SnapshotAny
Definition: snapmgr.h:33
#define IsMVCCSnapshot(snapshot)
Definition: snapmgr.h:62
#define SpinLockInit(lock)
Definition: spin.h:57
BlockNumber bs_pagesPerRange
Definition: brin.c:158
BrinLeader * bs_leader
Definition: brin.c:174
int nparticipanttuplesorts
Definition: brin.c:130
WalUsage * walusage
Definition: brin.c:144
BrinShared * brinshared
Definition: brin.c:141
BufferUsage * bufferusage
Definition: brin.c:145
Snapshot snapshot
Definition: brin.c:143
Sharedsort * sharedsort
Definition: brin.c:142
ParallelContext * pcxt
Definition: brin.c:122
slock_t mutex
Definition: brin.c:84
int scantuplesortstates
Definition: brin.c:68
int nparticipantsdone
Definition: brin.c:96
Oid heaprelid
Definition: brin.c:64
BlockNumber pagesPerRange
Definition: brin.c:67
ConditionVariable workersdonecv
Definition: brin.c:76
Oid indexrelid
Definition: brin.c:65
bool isconcurrent
Definition: brin.c:66
double indtuples
Definition: brin.c:98
double reltuples
Definition: brin.c:97
dsm_segment * seg
Definition: parallel.h:42
shm_toc_estimator estimator
Definition: parallel.h:41
shm_toc * toc
Definition: parallel.h:44
int nworkers_launched
Definition: parallel.h:37
Definition: type.h:95
void table_parallelscan_initialize(Relation rel, ParallelTableScanDesc pscan, Snapshot snapshot)
Definition: tableam.c:145
void tuplesort_initialize_shared(Sharedsort *shared, int nWorkers, dsm_segment *seg)
Definition: tuplesort.c:2938
Size tuplesort_estimate_shared(int nWorkers)
Definition: tuplesort.c:2917
void ExitParallelMode(void)
Definition: xact.c:1063
void EnterParallelMode(void)
Definition: xact.c:1050

References _brin_end_parallel(), _brin_leader_participate_as_worker(), _brin_parallel_estimate_shared(), Assert, BrinLeader::brinshared, BrinBuildState::bs_leader, BrinBuildState::bs_pagesPerRange, BrinLeader::bufferusage, ConditionVariableInit(), CreateParallelContext(), debug_query_string, DestroyParallelContext(), EnterParallelMode(), ParallelContext::estimator, ExitParallelMode(), GetTransactionSnapshot(), BrinShared::heaprelid, BrinShared::indexrelid, BrinShared::indtuples, InitializeParallelDSM(), BrinShared::isconcurrent, IsMVCCSnapshot, LaunchParallelWorkers(), mul_size(), BrinShared::mutex, BrinShared::nparticipantsdone, BrinLeader::nparticipanttuplesorts, ParallelContext::nworkers, ParallelContext::nworkers_launched, BrinShared::pagesPerRange, palloc0(), PARALLEL_KEY_BRIN_SHARED, PARALLEL_KEY_BUFFER_USAGE, PARALLEL_KEY_QUERY_TEXT, PARALLEL_KEY_TUPLESORT, PARALLEL_KEY_WAL_USAGE, ParallelTableScanFromBrinShared, BrinLeader::pcxt, RegisterSnapshot(), RelationGetRelid, BrinShared::reltuples, BrinShared::scantuplesortstates, ParallelContext::seg, BrinLeader::sharedsort, shm_toc_allocate(), shm_toc_estimate_chunk, shm_toc_estimate_keys, shm_toc_insert(), BrinLeader::snapshot, SnapshotAny, SpinLockInit, table_parallelscan_initialize(), ParallelContext::toc, tuplesort_estimate_shared(), tuplesort_initialize_shared(), UnregisterSnapshot(), WaitForParallelWorkersToAttach(), BrinLeader::walusage, and BrinShared::workersdonecv.

Referenced by brinbuild().

◆ _brin_end_parallel()

static void _brin_end_parallel ( BrinLeader brinleader,
BrinBuildState state 
)
static

Definition at line 2536 of file brin.c.

2537 {
2538  int i;
2539 
2540  /* Shutdown worker processes */
2541  WaitForParallelWorkersToFinish(brinleader->pcxt);
2542 
2543  /*
2544  * Next, accumulate WAL usage. (This must wait for the workers to finish,
2545  * or we might get incomplete data.)
2546  */
2547  for (i = 0; i < brinleader->pcxt->nworkers_launched; i++)
2548  InstrAccumParallelQuery(&brinleader->bufferusage[i], &brinleader->walusage[i]);
2549 
2550  /* Free last reference to MVCC snapshot, if one was used */
2551  if (IsMVCCSnapshot(brinleader->snapshot))
2552  UnregisterSnapshot(brinleader->snapshot);
2553  DestroyParallelContext(brinleader->pcxt);
2554  ExitParallelMode();
2555 }
void WaitForParallelWorkersToFinish(ParallelContext *pcxt)
Definition: parallel.c:775
void InstrAccumParallelQuery(BufferUsage *bufusage, WalUsage *walusage)
Definition: instrument.c:218
int i
Definition: isn.c:73

References BrinLeader::bufferusage, DestroyParallelContext(), ExitParallelMode(), i, InstrAccumParallelQuery(), IsMVCCSnapshot, ParallelContext::nworkers_launched, BrinLeader::pcxt, BrinLeader::snapshot, UnregisterSnapshot(), WaitForParallelWorkersToFinish(), and BrinLeader::walusage.

Referenced by _brin_begin_parallel(), and brinbuild().

◆ _brin_leader_participate_as_worker()

static void _brin_leader_participate_as_worker ( BrinBuildState buildstate,
Relation  heap,
Relation  index 
)
static

Definition at line 2766 of file brin.c.

2767 {
2768  BrinLeader *brinleader = buildstate->bs_leader;
2769  int sortmem;
2770 
2771  /*
2772  * Might as well use reliable figure when doling out maintenance_work_mem
2773  * (when requested number of workers were not launched, this will be
2774  * somewhat higher than it is for other workers).
2775  */
2776  sortmem = maintenance_work_mem / brinleader->nparticipanttuplesorts;
2777 
2778  /* Perform work common to all participants */
2779  _brin_parallel_scan_and_build(buildstate, brinleader->brinshared,
2780  brinleader->sharedsort, heap, index, sortmem, true);
2781 }
static void _brin_parallel_scan_and_build(BrinBuildState *state, BrinShared *brinshared, Sharedsort *sharedsort, Relation heap, Relation index, int sortmem, bool progress)
Definition: brin.c:2794
int maintenance_work_mem
Definition: globals.c:132

References _brin_parallel_scan_and_build(), BrinLeader::brinshared, BrinBuildState::bs_leader, maintenance_work_mem, BrinLeader::nparticipanttuplesorts, and BrinLeader::sharedsort.

Referenced by _brin_begin_parallel().

◆ _brin_parallel_build_main()

void _brin_parallel_build_main ( dsm_segment seg,
shm_toc toc 
)

Definition at line 2851 of file brin.c.

2852 {
2853  char *sharedquery;
2854  BrinShared *brinshared;
2855  Sharedsort *sharedsort;
2856  BrinBuildState *buildstate;
2857  Relation heapRel;
2858  Relation indexRel;
2859  LOCKMODE heapLockmode;
2860  LOCKMODE indexLockmode;
2861  WalUsage *walusage;
2862  BufferUsage *bufferusage;
2863  int sortmem;
2864 
2865  /*
2866  * The only possible status flag that can be set to the parallel worker is
2867  * PROC_IN_SAFE_IC.
2868  */
2869  Assert((MyProc->statusFlags == 0) ||
2871 
2872  /* Set debug_query_string for individual workers first */
2873  sharedquery = shm_toc_lookup(toc, PARALLEL_KEY_QUERY_TEXT, true);
2874  debug_query_string = sharedquery;
2875 
2876  /* Report the query string from leader */
2878 
2879  /* Look up brin shared state */
2880  brinshared = shm_toc_lookup(toc, PARALLEL_KEY_BRIN_SHARED, false);
2881 
2882  /* Open relations using lock modes known to be obtained by index.c */
2883  if (!brinshared->isconcurrent)
2884  {
2885  heapLockmode = ShareLock;
2886  indexLockmode = AccessExclusiveLock;
2887  }
2888  else
2889  {
2890  heapLockmode = ShareUpdateExclusiveLock;
2891  indexLockmode = RowExclusiveLock;
2892  }
2893 
2894  /* Open relations within worker */
2895  heapRel = table_open(brinshared->heaprelid, heapLockmode);
2896  indexRel = index_open(brinshared->indexrelid, indexLockmode);
2897 
2898  buildstate = initialize_brin_buildstate(indexRel, NULL,
2899  brinshared->pagesPerRange,
2901 
2902  /* Look up shared state private to tuplesort.c */
2903  sharedsort = shm_toc_lookup(toc, PARALLEL_KEY_TUPLESORT, false);
2904  tuplesort_attach_shared(sharedsort, seg);
2905 
2906  /* Prepare to track buffer usage during parallel execution */
2908 
2909  /*
2910  * Might as well use reliable figure when doling out maintenance_work_mem
2911  * (when requested number of workers were not launched, this will be
2912  * somewhat higher than it is for other workers).
2913  */
2914  sortmem = maintenance_work_mem / brinshared->scantuplesortstates;
2915 
2916  _brin_parallel_scan_and_build(buildstate, brinshared, sharedsort,
2917  heapRel, indexRel, sortmem, false);
2918 
2919  /* Report WAL/buffer usage during parallel execution */
2920  bufferusage = shm_toc_lookup(toc, PARALLEL_KEY_BUFFER_USAGE, false);
2921  walusage = shm_toc_lookup(toc, PARALLEL_KEY_WAL_USAGE, false);
2923  &walusage[ParallelWorkerNumber]);
2924 
2925  index_close(indexRel, indexLockmode);
2926  table_close(heapRel, heapLockmode);
2927 }
int ParallelWorkerNumber
Definition: parallel.c:112
void pgstat_report_activity(BackendState state, const char *cmd_str)
@ STATE_RUNNING
#define InvalidBlockNumber
Definition: block.h:33
static BrinBuildState * initialize_brin_buildstate(Relation idxRel, BrinRevmap *revmap, BlockNumber pagesPerRange, BlockNumber tablePages)
Definition: brin.c:1658
void index_close(Relation relation, LOCKMODE lockmode)
Definition: indexam.c:177
Relation index_open(Oid relationId, LOCKMODE lockmode)
Definition: indexam.c:133
void InstrEndParallelQuery(BufferUsage *bufusage, WalUsage *walusage)
Definition: instrument.c:208
void InstrStartParallelQuery(void)
Definition: instrument.c:200
int LOCKMODE
Definition: lockdefs.h:26
#define AccessExclusiveLock
Definition: lockdefs.h:43
#define ShareUpdateExclusiveLock
Definition: lockdefs.h:39
#define ShareLock
Definition: lockdefs.h:40
#define RowExclusiveLock
Definition: lockdefs.h:38
#define PROC_IN_SAFE_IC
Definition: proc.h:59
void * shm_toc_lookup(shm_toc *toc, uint64 key, bool noError)
Definition: shm_toc.c:232
PGPROC * MyProc
Definition: proc.c:67
uint8 statusFlags
Definition: proc.h:237
void table_close(Relation relation, LOCKMODE lockmode)
Definition: table.c:126
Relation table_open(Oid relationId, LOCKMODE lockmode)
Definition: table.c:40
void tuplesort_attach_shared(Sharedsort *shared, dsm_segment *seg)
Definition: tuplesort.c:2961

References _brin_parallel_scan_and_build(), AccessExclusiveLock, Assert, debug_query_string, BrinShared::heaprelid, index_close(), index_open(), BrinShared::indexrelid, initialize_brin_buildstate(), InstrEndParallelQuery(), InstrStartParallelQuery(), InvalidBlockNumber, BrinShared::isconcurrent, maintenance_work_mem, MyProc, BrinShared::pagesPerRange, PARALLEL_KEY_BRIN_SHARED, PARALLEL_KEY_BUFFER_USAGE, PARALLEL_KEY_QUERY_TEXT, PARALLEL_KEY_TUPLESORT, PARALLEL_KEY_WAL_USAGE, ParallelWorkerNumber, pgstat_report_activity(), PROC_IN_SAFE_IC, RowExclusiveLock, BrinShared::scantuplesortstates, ShareLock, ShareUpdateExclusiveLock, shm_toc_lookup(), STATE_RUNNING, PGPROC::statusFlags, table_close(), table_open(), and tuplesort_attach_shared().

◆ _brin_parallel_estimate_shared()

static Size _brin_parallel_estimate_shared ( Relation  heap,
Snapshot  snapshot 
)
static

Definition at line 2755 of file brin.c.

2756 {
2757  /* c.f. shm_toc_allocate as to why BUFFERALIGN is used */
2758  return add_size(BUFFERALIGN(sizeof(BrinShared)),
2759  table_parallelscan_estimate(heap, snapshot));
2760 }
#define BUFFERALIGN(LEN)
Definition: c.h:813
Size add_size(Size s1, Size s2)
Definition: shmem.c:493
Size table_parallelscan_estimate(Relation rel, Snapshot snapshot)
Definition: tableam.c:130

References add_size(), BUFFERALIGN, and table_parallelscan_estimate().

Referenced by _brin_begin_parallel().

◆ _brin_parallel_heapscan()

static double _brin_parallel_heapscan ( BrinBuildState state)
static

Definition at line 2567 of file brin.c.

2568 {
2569  BrinShared *brinshared = state->bs_leader->brinshared;
2570  int nparticipanttuplesorts;
2571 
2572  nparticipanttuplesorts = state->bs_leader->nparticipanttuplesorts;
2573  for (;;)
2574  {
2575  SpinLockAcquire(&brinshared->mutex);
2576  if (brinshared->nparticipantsdone == nparticipanttuplesorts)
2577  {
2578  /* copy the data into leader state */
2579  state->bs_reltuples = brinshared->reltuples;
2580  state->bs_numtuples = brinshared->indtuples;
2581 
2582  SpinLockRelease(&brinshared->mutex);
2583  break;
2584  }
2585  SpinLockRelease(&brinshared->mutex);
2586 
2588  WAIT_EVENT_PARALLEL_CREATE_INDEX_SCAN);
2589  }
2590 
2592 
2593  return state->bs_reltuples;
2594 }
bool ConditionVariableCancelSleep(void)
void ConditionVariableSleep(ConditionVariable *cv, uint32 wait_event_info)
#define SpinLockRelease(lock)
Definition: spin.h:61
#define SpinLockAcquire(lock)
Definition: spin.h:59
Definition: regguts.h:323

References ConditionVariableCancelSleep(), ConditionVariableSleep(), BrinShared::indtuples, BrinShared::mutex, BrinShared::nparticipantsdone, BrinShared::reltuples, SpinLockAcquire, SpinLockRelease, and BrinShared::workersdonecv.

Referenced by _brin_parallel_merge().

◆ _brin_parallel_merge()

static double _brin_parallel_merge ( BrinBuildState state)
static

Definition at line 2608 of file brin.c.

2609 {
2610  BrinTuple *btup;
2611  BrinMemTuple *memtuple = NULL;
2612  Size tuplen;
2613  BlockNumber prevblkno = InvalidBlockNumber;
2614  MemoryContext rangeCxt,
2615  oldCxt;
2616  double reltuples;
2617 
2618  /* wait for workers to scan table and produce partial results */
2619  reltuples = _brin_parallel_heapscan(state);
2620 
2621  /* do the actual sort in the leader */
2622  tuplesort_performsort(state->bs_sortstate);
2623 
2624  /*
2625  * Initialize BrinMemTuple we'll use to union summaries from workers (in
2626  * case they happened to produce parts of the same page range).
2627  */
2628  memtuple = brin_new_memtuple(state->bs_bdesc);
2629 
2630  /*
2631  * Create a memory context we'll reset to combine results for a single
2632  * page range (received from the workers). We don't expect huge number of
2633  * overlaps under regular circumstances, because for large tables the
2634  * chunk size is likely larger than the BRIN page range), but it can
2635  * happen, and the union functions may do all kinds of stuff. So we better
2636  * reset the context once in a while.
2637  */
2639  "brin union",
2641  oldCxt = MemoryContextSwitchTo(rangeCxt);
2642 
2643  /*
2644  * Read the BRIN tuples from the shared tuplesort, sorted by block number.
2645  * That probably gives us an index that is cheaper to scan, thanks to
2646  * mostly getting data from the same index page as before.
2647  */
2648  while ((btup = tuplesort_getbrintuple(state->bs_sortstate, &tuplen, true)) != NULL)
2649  {
2650  /* Ranges should be multiples of pages_per_range for the index. */
2651  Assert(btup->bt_blkno % state->bs_leader->brinshared->pagesPerRange == 0);
2652 
2653  /*
2654  * Do we need to union summaries for the same page range?
2655  *
2656  * If this is the first brin tuple we read, then just deform it into
2657  * the memtuple, and continue with the next one from tuplesort. We
2658  * however may need to insert empty summaries into the index.
2659  *
2660  * If it's the same block as the last we saw, we simply union the brin
2661  * tuple into it, and we're done - we don't even need to insert empty
2662  * ranges, because that was done earlier when we saw the first brin
2663  * tuple (for this range).
2664  *
2665  * Finally, if it's not the first brin tuple, and it's not the same
2666  * page range, we need to do the insert and then deform the tuple into
2667  * the memtuple. Then we'll insert empty ranges before the new brin
2668  * tuple, if needed.
2669  */
2670  if (prevblkno == InvalidBlockNumber)
2671  {
2672  /* First brin tuples, just deform into memtuple. */
2673  memtuple = brin_deform_tuple(state->bs_bdesc, btup, memtuple);
2674 
2675  /* continue to insert empty pages before thisblock */
2676  }
2677  else if (memtuple->bt_blkno == btup->bt_blkno)
2678  {
2679  /*
2680  * Not the first brin tuple, but same page range as the previous
2681  * one, so we can merge it into the memtuple.
2682  */
2683  union_tuples(state->bs_bdesc, memtuple, btup);
2684  continue;
2685  }
2686  else
2687  {
2688  BrinTuple *tmp;
2689  Size len;
2690 
2691  /*
2692  * We got brin tuple for a different page range, so form a brin
2693  * tuple from the memtuple, insert it, and re-init the memtuple
2694  * from the new brin tuple.
2695  */
2696  tmp = brin_form_tuple(state->bs_bdesc, memtuple->bt_blkno,
2697  memtuple, &len);
2698 
2699  brin_doinsert(state->bs_irel, state->bs_pagesPerRange, state->bs_rmAccess,
2700  &state->bs_currentInsertBuf, tmp->bt_blkno, tmp, len);
2701 
2702  /*
2703  * Reset the per-output-range context. This frees all the memory
2704  * possibly allocated by the union functions, and also the BRIN
2705  * tuple we just formed and inserted.
2706  */
2707  MemoryContextReset(rangeCxt);
2708 
2709  memtuple = brin_deform_tuple(state->bs_bdesc, btup, memtuple);
2710 
2711  /* continue to insert empty pages before thisblock */
2712  }
2713 
2714  /* Fill empty ranges for all ranges missing in the tuplesort. */
2715  brin_fill_empty_ranges(state, prevblkno, btup->bt_blkno);
2716 
2717  prevblkno = btup->bt_blkno;
2718  }
2719 
2720  tuplesort_end(state->bs_sortstate);
2721 
2722  /* Fill the BRIN tuple for the last page range with data. */
2723  if (prevblkno != InvalidBlockNumber)
2724  {
2725  BrinTuple *tmp;
2726  Size len;
2727 
2728  tmp = brin_form_tuple(state->bs_bdesc, memtuple->bt_blkno,
2729  memtuple, &len);
2730 
2731  brin_doinsert(state->bs_irel, state->bs_pagesPerRange, state->bs_rmAccess,
2732  &state->bs_currentInsertBuf, tmp->bt_blkno, tmp, len);
2733 
2734  pfree(tmp);
2735  }
2736 
2737  /* Fill empty ranges at the end, for all ranges missing in the tuplesort. */
2738  brin_fill_empty_ranges(state, prevblkno, state->bs_maxRangeStart);
2739 
2740  /*
2741  * Switch back to the original memory context, and destroy the one we
2742  * created to isolate the union_tuple calls.
2743  */
2744  MemoryContextSwitchTo(oldCxt);
2745  MemoryContextDelete(rangeCxt);
2746 
2747  return reltuples;
2748 }
uint32 BlockNumber
Definition: block.h:31
static void union_tuples(BrinDesc *bdesc, BrinMemTuple *a, BrinTuple *b)
Definition: brin.c:2020
static void brin_fill_empty_ranges(BrinBuildState *state, BlockNumber prevRange, BlockNumber nextRange)
Definition: brin.c:2978
static double _brin_parallel_heapscan(BrinBuildState *state)
Definition: brin.c:2567
OffsetNumber brin_doinsert(Relation idxrel, BlockNumber pagesPerRange, BrinRevmap *revmap, Buffer *buffer, BlockNumber heapBlk, BrinTuple *tup, Size itemsz)
Definition: brin_pageops.c:342
BrinTuple * brin_form_tuple(BrinDesc *brdesc, BlockNumber blkno, BrinMemTuple *tuple, Size *size)
Definition: brin_tuple.c:99
BrinMemTuple * brin_new_memtuple(BrinDesc *brdesc)
Definition: brin_tuple.c:482
BrinMemTuple * brin_deform_tuple(BrinDesc *brdesc, BrinTuple *tuple, BrinMemTuple *dMemtuple)
Definition: brin_tuple.c:553
void MemoryContextReset(MemoryContext context)
Definition: mcxt.c:383
void pfree(void *pointer)
Definition: mcxt.c:1521
MemoryContext CurrentMemoryContext
Definition: mcxt.c:143
void MemoryContextDelete(MemoryContext context)
Definition: mcxt.c:454
#define AllocSetContextCreate
Definition: memutils.h:129
#define ALLOCSET_DEFAULT_SIZES
Definition: memutils.h:160
const void size_t len
MemoryContextSwitchTo(old_ctx)
BlockNumber bt_blkno
Definition: brin_tuple.h:48
BlockNumber bt_blkno
Definition: brin_tuple.h:66
void tuplesort_performsort(Tuplesortstate *state)
Definition: tuplesort.c:1363
void tuplesort_end(Tuplesortstate *state)
Definition: tuplesort.c:951
BrinTuple * tuplesort_getbrintuple(Tuplesortstate *state, Size *len, bool forward)

References _brin_parallel_heapscan(), ALLOCSET_DEFAULT_SIZES, AllocSetContextCreate, Assert, brin_deform_tuple(), brin_doinsert(), brin_fill_empty_ranges(), brin_form_tuple(), brin_new_memtuple(), BrinMemTuple::bt_blkno, BrinTuple::bt_blkno, CurrentMemoryContext, InvalidBlockNumber, len, MemoryContextDelete(), MemoryContextReset(), MemoryContextSwitchTo(), pfree(), tuplesort_end(), tuplesort_getbrintuple(), tuplesort_performsort(), and union_tuples().

Referenced by brinbuild().

◆ _brin_parallel_scan_and_build()

static void _brin_parallel_scan_and_build ( BrinBuildState state,
BrinShared brinshared,
Sharedsort sharedsort,
Relation  heap,
Relation  index,
int  sortmem,
bool  progress 
)
static

Definition at line 2794 of file brin.c.

2798 {
2799  SortCoordinate coordinate;
2800  TableScanDesc scan;
2801  double reltuples;
2802  IndexInfo *indexInfo;
2803 
2804  /* Initialize local tuplesort coordination state */
2805  coordinate = palloc0(sizeof(SortCoordinateData));
2806  coordinate->isWorker = true;
2807  coordinate->nParticipants = -1;
2808  coordinate->sharedsort = sharedsort;
2809 
2810  /* Begin "partial" tuplesort */
2811  state->bs_sortstate = tuplesort_begin_index_brin(sortmem, coordinate,
2812  TUPLESORT_NONE);
2813 
2814  /* Join parallel scan */
2815  indexInfo = BuildIndexInfo(index);
2816  indexInfo->ii_Concurrent = brinshared->isconcurrent;
2817 
2818  scan = table_beginscan_parallel(heap,
2819  ParallelTableScanFromBrinShared(brinshared));
2820 
2821  reltuples = table_index_build_scan(heap, index, indexInfo, true, true,
2823 
2824  /* insert the last item */
2826 
2827  /* sort the BRIN ranges built by this worker */
2828  tuplesort_performsort(state->bs_sortstate);
2829 
2830  state->bs_reltuples += reltuples;
2831 
2832  /*
2833  * Done. Record ambuild statistics.
2834  */
2835  SpinLockAcquire(&brinshared->mutex);
2836  brinshared->nparticipantsdone++;
2837  brinshared->reltuples += state->bs_reltuples;
2838  brinshared->indtuples += state->bs_numtuples;
2839  SpinLockRelease(&brinshared->mutex);
2840 
2841  /* Notify leader */
2842  ConditionVariableSignal(&brinshared->workersdonecv);
2843 
2844  tuplesort_end(state->bs_sortstate);
2845 }
static void form_and_spill_tuple(BrinBuildState *state)
Definition: brin.c:1995
static void brinbuildCallbackParallel(Relation index, ItemPointer tid, Datum *values, bool *isnull, bool tupleIsAlive, void *brstate)
Definition: brin.c:1034
void ConditionVariableSignal(ConditionVariable *cv)
IndexInfo * BuildIndexInfo(Relation index)
Definition: index.c:2409
bool ii_Concurrent
Definition: execnodes.h:204
Sharedsort * sharedsort
Definition: tuplesort.h:58
TableScanDesc table_beginscan_parallel(Relation relation, ParallelTableScanDesc pscan)
Definition: tableam.c:165
static double table_index_build_scan(Relation table_rel, Relation index_rel, struct IndexInfo *index_info, bool allow_sync, bool progress, IndexBuildCallback callback, void *callback_state, TableScanDesc scan)
Definition: tableam.h:1775
#define TUPLESORT_NONE
Definition: tuplesort.h:93
Tuplesortstate * tuplesort_begin_index_brin(int workMem, SortCoordinate coordinate, int sortopt)

References brinbuildCallbackParallel(), BuildIndexInfo(), ConditionVariableSignal(), form_and_spill_tuple(), IndexInfo::ii_Concurrent, BrinShared::indtuples, BrinShared::isconcurrent, SortCoordinateData::isWorker, BrinShared::mutex, SortCoordinateData::nParticipants, BrinShared::nparticipantsdone, palloc0(), ParallelTableScanFromBrinShared, BrinShared::reltuples, SortCoordinateData::sharedsort, SpinLockAcquire, SpinLockRelease, table_beginscan_parallel(), table_index_build_scan(), tuplesort_begin_index_brin(), tuplesort_end(), TUPLESORT_NONE, tuplesort_performsort(), and BrinShared::workersdonecv.

Referenced by _brin_leader_participate_as_worker(), and _brin_parallel_build_main().

◆ add_values_to_range()

static bool add_values_to_range ( Relation  idxRel,
BrinDesc bdesc,
BrinMemTuple dtup,
const Datum values,
const bool nulls 
)
static

Definition at line 2194 of file brin.c.

2196 {
2197  int keyno;
2198 
2199  /* If the range starts empty, we're certainly going to modify it. */
2200  bool modified = dtup->bt_empty_range;
2201 
2202  /*
2203  * Compare the key values of the new tuple to the stored index values; our
2204  * deformed tuple will get updated if the new tuple doesn't fit the
2205  * original range (note this means we can't break out of the loop early).
2206  * Make a note of whether this happens, so that we know to insert the
2207  * modified tuple later.
2208  */
2209  for (keyno = 0; keyno < bdesc->bd_tupdesc->natts; keyno++)
2210  {
2211  Datum result;
2212  BrinValues *bval;
2213  FmgrInfo *addValue;
2214  bool has_nulls;
2215 
2216  bval = &dtup->bt_columns[keyno];
2217 
2218  /*
2219  * Does the range have actual NULL values? Either of the flags can be
2220  * set, but we ignore the state before adding first row.
2221  *
2222  * We have to remember this, because we'll modify the flags and we
2223  * need to know if the range started as empty.
2224  */
2225  has_nulls = ((!dtup->bt_empty_range) &&
2226  (bval->bv_hasnulls || bval->bv_allnulls));
2227 
2228  /*
2229  * If the value we're adding is NULL, handle it locally. Otherwise
2230  * call the BRIN_PROCNUM_ADDVALUE procedure.
2231  */
2232  if (bdesc->bd_info[keyno]->oi_regular_nulls && nulls[keyno])
2233  {
2234  /*
2235  * If the new value is null, we record that we saw it if it's the
2236  * first one; otherwise, there's nothing to do.
2237  */
2238  if (!bval->bv_hasnulls)
2239  {
2240  bval->bv_hasnulls = true;
2241  modified = true;
2242  }
2243 
2244  continue;
2245  }
2246 
2247  addValue = index_getprocinfo(idxRel, keyno + 1,
2249  result = FunctionCall4Coll(addValue,
2250  idxRel->rd_indcollation[keyno],
2251  PointerGetDatum(bdesc),
2252  PointerGetDatum(bval),
2253  values[keyno],
2254  nulls[keyno]);
2255  /* if that returned true, we need to insert the updated tuple */
2256  modified |= DatumGetBool(result);
2257 
2258  /*
2259  * If the range was had actual NULL values (i.e. did not start empty),
2260  * make sure we don't forget about the NULL values. Either the
2261  * allnulls flag is still set to true, or (if the opclass cleared it)
2262  * we need to set hasnulls=true.
2263  *
2264  * XXX This can only happen when the opclass modified the tuple, so
2265  * the modified flag should be set.
2266  */
2267  if (has_nulls && !(bval->bv_hasnulls || bval->bv_allnulls))
2268  {
2269  Assert(modified);
2270  bval->bv_hasnulls = true;
2271  }
2272  }
2273 
2274  /*
2275  * After updating summaries for all the keys, mark it as not empty.
2276  *
2277  * If we're actually changing the flag value (i.e. tuple started as
2278  * empty), we should have modified the tuple. So we should not see empty
2279  * range that was not modified.
2280  */
2281  Assert(!dtup->bt_empty_range || modified);
2282  dtup->bt_empty_range = false;
2283 
2284  return modified;
2285 }
static Datum values[MAXATTR]
Definition: bootstrap.c:150
#define BRIN_PROCNUM_ADDVALUE
Definition: brin_internal.h:71
Datum FunctionCall4Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, Datum arg3, Datum arg4)
Definition: fmgr.c:1196
FmgrInfo * index_getprocinfo(Relation irel, AttrNumber attnum, uint16 procnum)
Definition: indexam.c:860
static bool DatumGetBool(Datum X)
Definition: postgres.h:90
static Datum PointerGetDatum(const void *X)
Definition: postgres.h:322
uintptr_t Datum
Definition: postgres.h:64
TupleDesc bd_tupdesc
Definition: brin_internal.h:53
BrinOpcInfo * bd_info[FLEXIBLE_ARRAY_MEMBER]
Definition: brin_internal.h:62
BrinValues bt_columns[FLEXIBLE_ARRAY_MEMBER]
Definition: brin_tuple.h:55
bool bt_empty_range
Definition: brin_tuple.h:47
bool oi_regular_nulls
Definition: brin_internal.h:31
bool bv_hasnulls
Definition: brin_tuple.h:32
bool bv_allnulls
Definition: brin_tuple.h:33
Definition: fmgr.h:57
Oid * rd_indcollation
Definition: rel.h:217

References Assert, BrinDesc::bd_info, BrinDesc::bd_tupdesc, BRIN_PROCNUM_ADDVALUE, BrinMemTuple::bt_columns, BrinMemTuple::bt_empty_range, BrinValues::bv_allnulls, BrinValues::bv_hasnulls, DatumGetBool(), FunctionCall4Coll(), index_getprocinfo(), TupleDescData::natts, BrinOpcInfo::oi_regular_nulls, PointerGetDatum(), RelationData::rd_indcollation, and values.

Referenced by brinbuildCallback(), brinbuildCallbackParallel(), and brininsert().

◆ brin_build_desc()

BrinDesc* brin_build_desc ( Relation  rel)

Definition at line 1570 of file brin.c.

1571 {
1572  BrinOpcInfo **opcinfo;
1573  BrinDesc *bdesc;
1574  TupleDesc tupdesc;
1575  int totalstored = 0;
1576  int keyno;
1577  long totalsize;
1578  MemoryContext cxt;
1579  MemoryContext oldcxt;
1580 
1582  "brin desc cxt",
1584  oldcxt = MemoryContextSwitchTo(cxt);
1585  tupdesc = RelationGetDescr(rel);
1586 
1587  /*
1588  * Obtain BrinOpcInfo for each indexed column. While at it, accumulate
1589  * the number of columns stored, since the number is opclass-defined.
1590  */
1591  opcinfo = palloc_array(BrinOpcInfo *, tupdesc->natts);
1592  for (keyno = 0; keyno < tupdesc->natts; keyno++)
1593  {
1594  FmgrInfo *opcInfoFn;
1595  Form_pg_attribute attr = TupleDescAttr(tupdesc, keyno);
1596 
1597  opcInfoFn = index_getprocinfo(rel, keyno + 1, BRIN_PROCNUM_OPCINFO);
1598 
1599  opcinfo[keyno] = (BrinOpcInfo *)
1600  DatumGetPointer(FunctionCall1(opcInfoFn, attr->atttypid));
1601  totalstored += opcinfo[keyno]->oi_nstored;
1602  }
1603 
1604  /* Allocate our result struct and fill it in */
1605  totalsize = offsetof(BrinDesc, bd_info) +
1606  sizeof(BrinOpcInfo *) * tupdesc->natts;
1607 
1608  bdesc = palloc(totalsize);
1609  bdesc->bd_context = cxt;
1610  bdesc->bd_index = rel;
1611  bdesc->bd_tupdesc = tupdesc;
1612  bdesc->bd_disktdesc = NULL; /* generated lazily */
1613  bdesc->bd_totalstored = totalstored;
1614 
1615  for (keyno = 0; keyno < tupdesc->natts; keyno++)
1616  bdesc->bd_info[keyno] = opcinfo[keyno];
1617  pfree(opcinfo);
1618 
1619  MemoryContextSwitchTo(oldcxt);
1620 
1621  return bdesc;
1622 }
#define BRIN_PROCNUM_OPCINFO
Definition: brin_internal.h:70
#define palloc_array(type, count)
Definition: fe_memutils.h:64
#define FunctionCall1(flinfo, arg1)
Definition: fmgr.h:659
void * palloc(Size size)
Definition: mcxt.c:1317
#define ALLOCSET_SMALL_SIZES
Definition: memutils.h:170
FormData_pg_attribute * Form_pg_attribute
Definition: pg_attribute.h:209
static Pointer DatumGetPointer(Datum X)
Definition: postgres.h:312
#define RelationGetDescr(relation)
Definition: rel.h:531
int bd_totalstored
Definition: brin_internal.h:59
Relation bd_index
Definition: brin_internal.h:50
MemoryContext bd_context
Definition: brin_internal.h:47
TupleDesc bd_disktdesc
Definition: brin_internal.h:56
uint16 oi_nstored
Definition: brin_internal.h:28
#define TupleDescAttr(tupdesc, i)
Definition: tupdesc.h:92

References ALLOCSET_SMALL_SIZES, AllocSetContextCreate, BrinDesc::bd_context, BrinDesc::bd_disktdesc, BrinDesc::bd_index, BrinDesc::bd_info, BrinDesc::bd_totalstored, BrinDesc::bd_tupdesc, BRIN_PROCNUM_OPCINFO, CurrentMemoryContext, DatumGetPointer(), FunctionCall1, index_getprocinfo(), MemoryContextSwitchTo(), TupleDescData::natts, BrinOpcInfo::oi_nstored, palloc(), palloc_array, pfree(), RelationGetDescr, and TupleDescAttr.

Referenced by brin_page_items(), brinbeginscan(), initialize_brin_buildstate(), and initialize_brin_insertstate().

◆ brin_build_empty_tuple()

static void brin_build_empty_tuple ( BrinBuildState state,
BlockNumber  blkno 
)
static

Definition at line 2941 of file brin.c.

2942 {
2943  /* First time an empty tuple is requested? If yes, initialize it. */
2944  if (state->bs_emptyTuple == NULL)
2945  {
2946  MemoryContext oldcxt;
2947  BrinMemTuple *dtuple = brin_new_memtuple(state->bs_bdesc);
2948 
2949  /* Allocate the tuple in context for the whole index build. */
2950  oldcxt = MemoryContextSwitchTo(state->bs_context);
2951 
2952  state->bs_emptyTuple = brin_form_tuple(state->bs_bdesc, blkno, dtuple,
2953  &state->bs_emptyTupleLen);
2954 
2955  MemoryContextSwitchTo(oldcxt);
2956  }
2957  else
2958  {
2959  /* If we already have an empty tuple, just update the block. */
2960  state->bs_emptyTuple->bt_blkno = blkno;
2961  }
2962 }

References brin_form_tuple(), brin_new_memtuple(), and MemoryContextSwitchTo().

Referenced by brin_fill_empty_ranges().

◆ brin_desummarize_range()

Datum brin_desummarize_range ( PG_FUNCTION_ARGS  )

Definition at line 1480 of file brin.c.

1481 {
1482  Oid indexoid = PG_GETARG_OID(0);
1483  int64 heapBlk64 = PG_GETARG_INT64(1);
1484  BlockNumber heapBlk;
1485  Oid heapoid;
1486  Relation heapRel;
1487  Relation indexRel;
1488  bool done;
1489 
1490  if (RecoveryInProgress())
1491  ereport(ERROR,
1492  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
1493  errmsg("recovery is in progress"),
1494  errhint("BRIN control functions cannot be executed during recovery.")));
1495 
1496  if (heapBlk64 > MaxBlockNumber || heapBlk64 < 0)
1497  ereport(ERROR,
1498  (errcode(ERRCODE_NUMERIC_VALUE_OUT_OF_RANGE),
1499  errmsg("block number out of range: %lld",
1500  (long long) heapBlk64)));
1501  heapBlk = (BlockNumber) heapBlk64;
1502 
1503  /*
1504  * We must lock table before index to avoid deadlocks. However, if the
1505  * passed indexoid isn't an index then IndexGetRelation() will fail.
1506  * Rather than emitting a not-very-helpful error message, postpone
1507  * complaining, expecting that the is-it-an-index test below will fail.
1508  *
1509  * Unlike brin_summarize_range(), autovacuum never calls this. Hence, we
1510  * don't switch userid.
1511  */
1512  heapoid = IndexGetRelation(indexoid, true);
1513  if (OidIsValid(heapoid))
1514  heapRel = table_open(heapoid, ShareUpdateExclusiveLock);
1515  else
1516  heapRel = NULL;
1517 
1518  indexRel = index_open(indexoid, ShareUpdateExclusiveLock);
1519 
1520  /* Must be a BRIN index */
1521  if (indexRel->rd_rel->relkind != RELKIND_INDEX ||
1522  indexRel->rd_rel->relam != BRIN_AM_OID)
1523  ereport(ERROR,
1524  (errcode(ERRCODE_WRONG_OBJECT_TYPE),
1525  errmsg("\"%s\" is not a BRIN index",
1526  RelationGetRelationName(indexRel))));
1527 
1528  /* User must own the index (comparable to privileges needed for VACUUM) */
1529  if (!object_ownercheck(RelationRelationId, indexoid, GetUserId()))
1531  RelationGetRelationName(indexRel));
1532 
1533  /*
1534  * Since we did the IndexGetRelation call above without any lock, it's
1535  * barely possible that a race against an index drop/recreation could have
1536  * netted us the wrong table. Recheck.
1537  */
1538  if (heapRel == NULL || heapoid != IndexGetRelation(indexoid, false))
1539  ereport(ERROR,
1541  errmsg("could not open parent table of index \"%s\"",
1542  RelationGetRelationName(indexRel))));
1543 
1544  /* see gin_clean_pending_list() */
1545  if (indexRel->rd_index->indisvalid)
1546  {
1547  /* the revmap does the hard work */
1548  do
1549  {
1550  done = brinRevmapDesummarizeRange(indexRel, heapBlk);
1551  }
1552  while (!done);
1553  }
1554  else
1555  ereport(DEBUG1,
1556  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
1557  errmsg("index \"%s\" is not valid",
1558  RelationGetRelationName(indexRel))));
1559 
1562 
1563  PG_RETURN_VOID();
1564 }
@ ACLCHECK_NOT_OWNER
Definition: acl.h:185
void aclcheck_error(AclResult aclerr, ObjectType objtype, const char *objectname)
Definition: aclchk.c:2698
bool object_ownercheck(Oid classid, Oid objectid, Oid roleid)
Definition: aclchk.c:4140
#define MaxBlockNumber
Definition: block.h:35
bool brinRevmapDesummarizeRange(Relation idxrel, BlockNumber heapBlk)
Definition: brin_revmap.c:323
#define OidIsValid(objectId)
Definition: c.h:775
int errhint(const char *fmt,...)
Definition: elog.c:1317
int errcode(int sqlerrcode)
Definition: elog.c:853
int errmsg(const char *fmt,...)
Definition: elog.c:1070
#define DEBUG1
Definition: elog.h:30
#define ERROR
Definition: elog.h:39
#define ereport(elevel,...)
Definition: elog.h:149
#define PG_RETURN_VOID()
Definition: fmgr.h:349
#define PG_GETARG_OID(n)
Definition: fmgr.h:275
#define PG_GETARG_INT64(n)
Definition: fmgr.h:283
Oid IndexGetRelation(Oid indexId, bool missing_ok)
Definition: index.c:3531
Oid GetUserId(void)
Definition: miscinit.c:514
@ OBJECT_INDEX
Definition: parsenodes.h:2277
#define ERRCODE_UNDEFINED_TABLE
Definition: pgbench.c:78
unsigned int Oid
Definition: postgres_ext.h:31
#define RelationGetRelationName(relation)
Definition: rel.h:539
void relation_close(Relation relation, LOCKMODE lockmode)
Definition: relation.c:205
Form_pg_index rd_index
Definition: rel.h:192
Form_pg_class rd_rel
Definition: rel.h:111
bool RecoveryInProgress(void)
Definition: xlog.c:6333

References aclcheck_error(), ACLCHECK_NOT_OWNER, brinRevmapDesummarizeRange(), DEBUG1, ereport, errcode(), ERRCODE_UNDEFINED_TABLE, errhint(), errmsg(), ERROR, GetUserId(), index_open(), IndexGetRelation(), MaxBlockNumber, OBJECT_INDEX, object_ownercheck(), OidIsValid, PG_GETARG_INT64, PG_GETARG_OID, PG_RETURN_VOID, RelationData::rd_index, RelationData::rd_rel, RecoveryInProgress(), relation_close(), RelationGetRelationName, ShareUpdateExclusiveLock, and table_open().

◆ brin_fill_empty_ranges()

static void brin_fill_empty_ranges ( BrinBuildState state,
BlockNumber  prevRange,
BlockNumber  nextRange 
)
static

Definition at line 2978 of file brin.c.

2980 {
2981  BlockNumber blkno;
2982 
2983  /*
2984  * If we already summarized some ranges, we need to start with the next
2985  * one. Otherwise start from the first range of the table.
2986  */
2987  blkno = (prevRange == InvalidBlockNumber) ? 0 : (prevRange + state->bs_pagesPerRange);
2988 
2989  /* Generate empty ranges until we hit the next non-empty range. */
2990  while (blkno < nextRange)
2991  {
2992  /* Did we already build the empty tuple? If not, do it now. */
2993  brin_build_empty_tuple(state, blkno);
2994 
2995  brin_doinsert(state->bs_irel, state->bs_pagesPerRange, state->bs_rmAccess,
2996  &state->bs_currentInsertBuf,
2997  blkno, state->bs_emptyTuple, state->bs_emptyTupleLen);
2998 
2999  /* try next page range */
3000  blkno += state->bs_pagesPerRange;
3001  }
3002 }
static void brin_build_empty_tuple(BrinBuildState *state, BlockNumber blkno)
Definition: brin.c:2941

References brin_build_empty_tuple(), brin_doinsert(), and InvalidBlockNumber.

Referenced by _brin_parallel_merge(), and brinbuild().

◆ brin_free_desc()

void brin_free_desc ( BrinDesc bdesc)

Definition at line 1625 of file brin.c.

1626 {
1627  /* make sure the tupdesc is still valid */
1628  Assert(bdesc->bd_tupdesc->tdrefcount >= 1);
1629  /* no need for retail pfree */
1631 }
int tdrefcount
Definition: tupdesc.h:84

References Assert, BrinDesc::bd_context, BrinDesc::bd_tupdesc, MemoryContextDelete(), and TupleDescData::tdrefcount.

Referenced by brin_page_items(), brinendscan(), and terminate_brin_buildstate().

◆ brin_summarize_new_values()

Datum brin_summarize_new_values ( PG_FUNCTION_ARGS  )

Definition at line 1354 of file brin.c.

1355 {
1356  Datum relation = PG_GETARG_DATUM(0);
1357 
1359  relation,
1361 }
Datum brin_summarize_range(PG_FUNCTION_ARGS)
Definition: brin.c:1369
#define BRIN_ALL_BLOCKRANGES
Definition: brin.c:206
Datum Int64GetDatum(int64 X)
Definition: fmgr.c:1807
#define DirectFunctionCall2(func, arg1, arg2)
Definition: fmgr.h:643
#define PG_GETARG_DATUM(n)
Definition: fmgr.h:268

References BRIN_ALL_BLOCKRANGES, brin_summarize_range(), DirectFunctionCall2, Int64GetDatum(), and PG_GETARG_DATUM.

◆ brin_summarize_range()

Datum brin_summarize_range ( PG_FUNCTION_ARGS  )

Definition at line 1369 of file brin.c.

1370 {
1371  Oid indexoid = PG_GETARG_OID(0);
1372  int64 heapBlk64 = PG_GETARG_INT64(1);
1373  BlockNumber heapBlk;
1374  Oid heapoid;
1375  Relation indexRel;
1376  Relation heapRel;
1377  Oid save_userid;
1378  int save_sec_context;
1379  int save_nestlevel;
1380  double numSummarized = 0;
1381 
1382  if (RecoveryInProgress())
1383  ereport(ERROR,
1384  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
1385  errmsg("recovery is in progress"),
1386  errhint("BRIN control functions cannot be executed during recovery.")));
1387 
1388  if (heapBlk64 > BRIN_ALL_BLOCKRANGES || heapBlk64 < 0)
1389  ereport(ERROR,
1390  (errcode(ERRCODE_NUMERIC_VALUE_OUT_OF_RANGE),
1391  errmsg("block number out of range: %lld",
1392  (long long) heapBlk64)));
1393  heapBlk = (BlockNumber) heapBlk64;
1394 
1395  /*
1396  * We must lock table before index to avoid deadlocks. However, if the
1397  * passed indexoid isn't an index then IndexGetRelation() will fail.
1398  * Rather than emitting a not-very-helpful error message, postpone
1399  * complaining, expecting that the is-it-an-index test below will fail.
1400  */
1401  heapoid = IndexGetRelation(indexoid, true);
1402  if (OidIsValid(heapoid))
1403  {
1404  heapRel = table_open(heapoid, ShareUpdateExclusiveLock);
1405 
1406  /*
1407  * Autovacuum calls us. For its benefit, switch to the table owner's
1408  * userid, so that any index functions are run as that user. Also
1409  * lock down security-restricted operations and arrange to make GUC
1410  * variable changes local to this command. This is harmless, albeit
1411  * unnecessary, when called from SQL, because we fail shortly if the
1412  * user does not own the index.
1413  */
1414  GetUserIdAndSecContext(&save_userid, &save_sec_context);
1415  SetUserIdAndSecContext(heapRel->rd_rel->relowner,
1416  save_sec_context | SECURITY_RESTRICTED_OPERATION);
1417  save_nestlevel = NewGUCNestLevel();
1419  }
1420  else
1421  {
1422  heapRel = NULL;
1423  /* Set these just to suppress "uninitialized variable" warnings */
1424  save_userid = InvalidOid;
1425  save_sec_context = -1;
1426  save_nestlevel = -1;
1427  }
1428 
1429  indexRel = index_open(indexoid, ShareUpdateExclusiveLock);
1430 
1431  /* Must be a BRIN index */
1432  if (indexRel->rd_rel->relkind != RELKIND_INDEX ||
1433  indexRel->rd_rel->relam != BRIN_AM_OID)
1434  ereport(ERROR,
1435  (errcode(ERRCODE_WRONG_OBJECT_TYPE),
1436  errmsg("\"%s\" is not a BRIN index",
1437  RelationGetRelationName(indexRel))));
1438 
1439  /* User must own the index (comparable to privileges needed for VACUUM) */
1440  if (heapRel != NULL && !object_ownercheck(RelationRelationId, indexoid, save_userid))
1442  RelationGetRelationName(indexRel));
1443 
1444  /*
1445  * Since we did the IndexGetRelation call above without any lock, it's
1446  * barely possible that a race against an index drop/recreation could have
1447  * netted us the wrong table. Recheck.
1448  */
1449  if (heapRel == NULL || heapoid != IndexGetRelation(indexoid, false))
1450  ereport(ERROR,
1452  errmsg("could not open parent table of index \"%s\"",
1453  RelationGetRelationName(indexRel))));
1454 
1455  /* see gin_clean_pending_list() */
1456  if (indexRel->rd_index->indisvalid)
1457  brinsummarize(indexRel, heapRel, heapBlk, true, &numSummarized, NULL);
1458  else
1459  ereport(DEBUG1,
1460  (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
1461  errmsg("index \"%s\" is not valid",
1462  RelationGetRelationName(indexRel))));
1463 
1464  /* Roll back any GUC changes executed by index functions */
1465  AtEOXact_GUC(false, save_nestlevel);
1466 
1467  /* Restore userid and security context */
1468  SetUserIdAndSecContext(save_userid, save_sec_context);
1469 
1472 
1473  PG_RETURN_INT32((int32) numSummarized);
1474 }
static void brinsummarize(Relation index, Relation heapRel, BlockNumber pageRange, bool include_partial, double *numSummarized, double *numExisting)
Definition: brin.c:1876
signed int int32
Definition: c.h:494
#define PG_RETURN_INT32(x)
Definition: fmgr.h:354
int NewGUCNestLevel(void)
Definition: guc.c:2234
void RestrictSearchPath(void)
Definition: guc.c:2245
void AtEOXact_GUC(bool isCommit, int nestLevel)
Definition: guc.c:2261
#define SECURITY_RESTRICTED_OPERATION
Definition: miscadmin.h:312
void GetUserIdAndSecContext(Oid *userid, int *sec_context)
Definition: miscinit.c:635
void SetUserIdAndSecContext(Oid userid, int sec_context)
Definition: miscinit.c:642
#define InvalidOid
Definition: postgres_ext.h:36

References aclcheck_error(), ACLCHECK_NOT_OWNER, AtEOXact_GUC(), BRIN_ALL_BLOCKRANGES, brinsummarize(), DEBUG1, ereport, errcode(), ERRCODE_UNDEFINED_TABLE, errhint(), errmsg(), ERROR, GetUserIdAndSecContext(), index_open(), IndexGetRelation(), InvalidOid, NewGUCNestLevel(), OBJECT_INDEX, object_ownercheck(), OidIsValid, PG_GETARG_INT64, PG_GETARG_OID, PG_RETURN_INT32, RelationData::rd_index, RelationData::rd_rel, RecoveryInProgress(), relation_close(), RelationGetRelationName, RestrictSearchPath(), SECURITY_RESTRICTED_OPERATION, SetUserIdAndSecContext(), ShareUpdateExclusiveLock, and table_open().

Referenced by brin_summarize_new_values(), and perform_work_item().

◆ brin_vacuum_scan()

static void brin_vacuum_scan ( Relation  idxrel,
BufferAccessStrategy  strategy 
)
static

Definition at line 2161 of file brin.c.

2162 {
2163  BlockNumber nblocks;
2164  BlockNumber blkno;
2165 
2166  /*
2167  * Scan the index in physical order, and clean up any possible mess in
2168  * each page.
2169  */
2170  nblocks = RelationGetNumberOfBlocks(idxrel);
2171  for (blkno = 0; blkno < nblocks; blkno++)
2172  {
2173  Buffer buf;
2174 
2176 
2177  buf = ReadBufferExtended(idxrel, MAIN_FORKNUM, blkno,
2178  RBM_NORMAL, strategy);
2179 
2180  brin_page_cleanup(idxrel, buf);
2181 
2182  ReleaseBuffer(buf);
2183  }
2184 
2185  /*
2186  * Update all upper pages in the index's FSM, as well. This ensures not
2187  * only that we propagate leaf-page FSM updates made by brin_page_cleanup,
2188  * but also that any pre-existing damage or out-of-dateness is repaired.
2189  */
2190  FreeSpaceMapVacuum(idxrel);
2191 }
void brin_page_cleanup(Relation idxrel, Buffer buf)
Definition: brin_pageops.c:624
int Buffer
Definition: buf.h:23
void ReleaseBuffer(Buffer buffer)
Definition: bufmgr.c:4906
Buffer ReadBufferExtended(Relation reln, ForkNumber forkNum, BlockNumber blockNum, ReadBufferMode mode, BufferAccessStrategy strategy)
Definition: bufmgr.c:793
#define RelationGetNumberOfBlocks(reln)
Definition: bufmgr.h:273
@ RBM_NORMAL
Definition: bufmgr.h:45
void FreeSpaceMapVacuum(Relation rel)
Definition: freespace.c:358
#define CHECK_FOR_INTERRUPTS()
Definition: miscadmin.h:122
static char * buf
Definition: pg_test_fsync.c:73
@ MAIN_FORKNUM
Definition: relpath.h:58

References brin_page_cleanup(), buf, CHECK_FOR_INTERRUPTS, FreeSpaceMapVacuum(), MAIN_FORKNUM, RBM_NORMAL, ReadBufferExtended(), RelationGetNumberOfBlocks, and ReleaseBuffer().

Referenced by brinvacuumcleanup().

◆ brinbeginscan()

IndexScanDesc brinbeginscan ( Relation  r,
int  nkeys,
int  norderbys 
)

Definition at line 529 of file brin.c.

530 {
531  IndexScanDesc scan;
532  BrinOpaque *opaque;
533 
534  scan = RelationGetIndexScan(r, nkeys, norderbys);
535 
536  opaque = palloc_object(BrinOpaque);
537  opaque->bo_rmAccess = brinRevmapInitialize(r, &opaque->bo_pagesPerRange);
538  opaque->bo_bdesc = brin_build_desc(r);
539  scan->opaque = opaque;
540 
541  return scan;
542 }
BrinDesc * brin_build_desc(Relation rel)
Definition: brin.c:1570
BrinRevmap * brinRevmapInitialize(Relation idxrel, BlockNumber *pagesPerRange)
Definition: brin_revmap.c:70
#define palloc_object(type)
Definition: fe_memutils.h:62
IndexScanDesc RelationGetIndexScan(Relation indexRelation, int nkeys, int norderbys)
Definition: genam.c:78
BlockNumber bo_pagesPerRange
Definition: brin.c:201
BrinDesc * bo_bdesc
Definition: brin.c:203
BrinRevmap * bo_rmAccess
Definition: brin.c:202

References BrinOpaque::bo_bdesc, BrinOpaque::bo_pagesPerRange, BrinOpaque::bo_rmAccess, brin_build_desc(), brinRevmapInitialize(), IndexScanDescData::opaque, palloc_object, and RelationGetIndexScan().

Referenced by brinhandler().

◆ brinbuild()

IndexBuildResult* brinbuild ( Relation  heap,
Relation  index,
IndexInfo indexInfo 
)

Definition at line 1093 of file brin.c.

1094 {
1095  IndexBuildResult *result;
1096  double reltuples;
1097  double idxtuples;
1098  BrinRevmap *revmap;
1100  Buffer meta;
1101  BlockNumber pagesPerRange;
1102 
1103  /*
1104  * We expect to be called exactly once for any index relation.
1105  */
1106  if (RelationGetNumberOfBlocks(index) != 0)
1107  elog(ERROR, "index \"%s\" already contains data",
1109 
1110  /*
1111  * Critical section not required, because on error the creation of the
1112  * whole relation will be rolled back.
1113  */
1114 
1118 
1121  MarkBufferDirty(meta);
1122 
1123  if (RelationNeedsWAL(index))
1124  {
1125  xl_brin_createidx xlrec;
1126  XLogRecPtr recptr;
1127  Page page;
1128 
1129  xlrec.version = BRIN_CURRENT_VERSION;
1131 
1132  XLogBeginInsert();
1133  XLogRegisterData((char *) &xlrec, SizeOfBrinCreateIdx);
1135 
1136  recptr = XLogInsert(RM_BRIN_ID, XLOG_BRIN_CREATE_INDEX);
1137 
1138  page = BufferGetPage(meta);
1139  PageSetLSN(page, recptr);
1140  }
1141 
1142  UnlockReleaseBuffer(meta);
1143 
1144  /*
1145  * Initialize our state, including the deformed tuple state.
1146  */
1147  revmap = brinRevmapInitialize(index, &pagesPerRange);
1148  state = initialize_brin_buildstate(index, revmap, pagesPerRange,
1150 
1151  /*
1152  * Attempt to launch parallel worker scan when required
1153  *
1154  * XXX plan_create_index_workers makes the number of workers dependent on
1155  * maintenance_work_mem, requiring 32MB for each worker. That makes sense
1156  * for btree, but not for BRIN, which can do with much less memory. So
1157  * maybe make that somehow less strict, optionally?
1158  */
1159  if (indexInfo->ii_ParallelWorkers > 0)
1160  _brin_begin_parallel(state, heap, index, indexInfo->ii_Concurrent,
1161  indexInfo->ii_ParallelWorkers);
1162 
1163  /*
1164  * If parallel build requested and at least one worker process was
1165  * successfully launched, set up coordination state, wait for workers to
1166  * complete. Then read all tuples from the shared tuplesort and insert
1167  * them into the index.
1168  *
1169  * In serial mode, simply scan the table and build the index one index
1170  * tuple at a time.
1171  */
1172  if (state->bs_leader)
1173  {
1174  SortCoordinate coordinate;
1175 
1176  coordinate = (SortCoordinate) palloc0(sizeof(SortCoordinateData));
1177  coordinate->isWorker = false;
1178  coordinate->nParticipants =
1179  state->bs_leader->nparticipanttuplesorts;
1180  coordinate->sharedsort = state->bs_leader->sharedsort;
1181 
1182  /*
1183  * Begin leader tuplesort.
1184  *
1185  * In cases where parallelism is involved, the leader receives the
1186  * same share of maintenance_work_mem as a serial sort (it is
1187  * generally treated in the same way as a serial sort once we return).
1188  * Parallel worker Tuplesortstates will have received only a fraction
1189  * of maintenance_work_mem, though.
1190  *
1191  * We rely on the lifetime of the Leader Tuplesortstate almost not
1192  * overlapping with any worker Tuplesortstate's lifetime. There may
1193  * be some small overlap, but that's okay because we rely on leader
1194  * Tuplesortstate only allocating a small, fixed amount of memory
1195  * here. When its tuplesort_performsort() is called (by our caller),
1196  * and significant amounts of memory are likely to be used, all
1197  * workers must have already freed almost all memory held by their
1198  * Tuplesortstates (they are about to go away completely, too). The
1199  * overall effect is that maintenance_work_mem always represents an
1200  * absolute high watermark on the amount of memory used by a CREATE
1201  * INDEX operation, regardless of the use of parallelism or any other
1202  * factor.
1203  */
1204  state->bs_sortstate =
1206  TUPLESORT_NONE);
1207 
1208  /* scan the relation and merge per-worker results */
1209  reltuples = _brin_parallel_merge(state);
1210 
1211  _brin_end_parallel(state->bs_leader, state);
1212  }
1213  else /* no parallel index build */
1214  {
1215  /*
1216  * Now scan the relation. No syncscan allowed here because we want
1217  * the heap blocks in physical order (we want to produce the ranges
1218  * starting from block 0, and the callback also relies on this to not
1219  * generate summary for the same range twice).
1220  */
1221  reltuples = table_index_build_scan(heap, index, indexInfo, false, true,
1222  brinbuildCallback, (void *) state, NULL);
1223 
1224  /*
1225  * process the final batch
1226  *
1227  * XXX Note this does not update state->bs_currRangeStart, i.e. it
1228  * stays set to the last range added to the index. This is OK, because
1229  * that's what brin_fill_empty_ranges expects.
1230  */
1232 
1233  /*
1234  * Backfill the final ranges with empty data.
1235  *
1236  * This saves us from doing what amounts to full table scans when the
1237  * index with a predicate like WHERE (nonnull_column IS NULL), or
1238  * other very selective predicates.
1239  */
1241  state->bs_currRangeStart,
1242  state->bs_maxRangeStart);
1243  }
1244 
1245  /* release resources */
1246  idxtuples = state->bs_numtuples;
1247  brinRevmapTerminate(state->bs_rmAccess);
1249 
1250  /*
1251  * Return statistics
1252  */
1253  result = palloc_object(IndexBuildResult);
1254 
1255  result->heap_tuples = reltuples;
1256  result->index_tuples = idxtuples;
1257 
1258  return result;
1259 }
static double _brin_parallel_merge(BrinBuildState *state)
Definition: brin.c:2608
static void terminate_brin_buildstate(BrinBuildState *state)
Definition: brin.c:1705
static void form_and_insert_tuple(BrinBuildState *state)
Definition: brin.c:1974
static void _brin_begin_parallel(BrinBuildState *buildstate, Relation heap, Relation index, bool isconcurrent, int request)
Definition: brin.c:2352
static void brinbuildCallback(Relation index, ItemPointer tid, Datum *values, bool *isnull, bool tupleIsAlive, void *brstate)
Definition: brin.c:983
#define BrinGetPagesPerRange(relation)
Definition: brin.h:40
#define BRIN_CURRENT_VERSION
Definition: brin_page.h:72
#define BRIN_METAPAGE_BLKNO
Definition: brin_page.h:75
void brin_metapage_init(Page page, BlockNumber pagesPerRange, uint16 version)
Definition: brin_pageops.c:486
void brinRevmapTerminate(BrinRevmap *revmap)
Definition: brin_revmap.c:100
#define SizeOfBrinCreateIdx
Definition: brin_xlog.h:55
#define XLOG_BRIN_CREATE_INDEX
Definition: brin_xlog.h:31
BlockNumber BufferGetBlockNumber(Buffer buffer)
Definition: bufmgr.c:3706
Buffer ExtendBufferedRel(BufferManagerRelation bmr, ForkNumber forkNum, BufferAccessStrategy strategy, uint32 flags)
Definition: bufmgr.c:846
void UnlockReleaseBuffer(Buffer buffer)
Definition: bufmgr.c:4923
void MarkBufferDirty(Buffer buffer)
Definition: bufmgr.c:2514
static Page BufferGetPage(Buffer buffer)
Definition: bufmgr.h:400
@ EB_SKIP_EXTENSION_LOCK
Definition: bufmgr.h:74
@ EB_LOCK_FIRST
Definition: bufmgr.h:86
#define BMR_REL(p_rel)
Definition: bufmgr.h:107
Pointer Page
Definition: bufpage.h:81
static void PageSetLSN(Page page, XLogRecPtr lsn)
Definition: bufpage.h:391
#define elog(elevel,...)
Definition: elog.h:225
#define RelationNeedsWAL(relation)
Definition: rel.h:628
double heap_tuples
Definition: genam.h:32
double index_tuples
Definition: genam.h:33
int ii_ParallelWorkers
Definition: execnodes.h:208
BlockNumber pagesPerRange
Definition: brin_xlog.h:52
struct SortCoordinateData * SortCoordinate
Definition: tuplesort.h:61
uint64 XLogRecPtr
Definition: xlogdefs.h:21
XLogRecPtr XLogInsert(RmgrId rmid, uint8 info)
Definition: xloginsert.c:474
void XLogRegisterData(const char *data, uint32 len)
Definition: xloginsert.c:364
void XLogRegisterBuffer(uint8 block_id, Buffer buffer, uint8 flags)
Definition: xloginsert.c:242
void XLogBeginInsert(void)
Definition: xloginsert.c:149
#define REGBUF_STANDARD
Definition: xloginsert.h:34
#define REGBUF_WILL_INIT
Definition: xloginsert.h:33

References _brin_begin_parallel(), _brin_end_parallel(), _brin_parallel_merge(), Assert, BMR_REL, BRIN_CURRENT_VERSION, brin_fill_empty_ranges(), BRIN_METAPAGE_BLKNO, brin_metapage_init(), brinbuildCallback(), BrinGetPagesPerRange, brinRevmapInitialize(), brinRevmapTerminate(), BufferGetBlockNumber(), BufferGetPage(), EB_LOCK_FIRST, EB_SKIP_EXTENSION_LOCK, elog, ERROR, ExtendBufferedRel(), form_and_insert_tuple(), IndexBuildResult::heap_tuples, IndexInfo::ii_Concurrent, IndexInfo::ii_ParallelWorkers, IndexBuildResult::index_tuples, initialize_brin_buildstate(), SortCoordinateData::isWorker, MAIN_FORKNUM, maintenance_work_mem, MarkBufferDirty(), SortCoordinateData::nParticipants, PageSetLSN(), xl_brin_createidx::pagesPerRange, palloc0(), palloc_object, REGBUF_STANDARD, REGBUF_WILL_INIT, RelationGetNumberOfBlocks, RelationGetRelationName, RelationNeedsWAL, SortCoordinateData::sharedsort, SizeOfBrinCreateIdx, table_index_build_scan(), terminate_brin_buildstate(), tuplesort_begin_index_brin(), TUPLESORT_NONE, UnlockReleaseBuffer(), xl_brin_createidx::version, XLOG_BRIN_CREATE_INDEX, XLogBeginInsert(), XLogInsert(), XLogRegisterBuffer(), and XLogRegisterData().

Referenced by brinhandler().

◆ brinbuildCallback()

static void brinbuildCallback ( Relation  index,
ItemPointer  tid,
Datum values,
bool isnull,
bool  tupleIsAlive,
void *  brstate 
)
static

Definition at line 983 of file brin.c.

989 {
990  BrinBuildState *state = (BrinBuildState *) brstate;
991  BlockNumber thisblock;
992 
993  thisblock = ItemPointerGetBlockNumber(tid);
994 
995  /*
996  * If we're in a block that belongs to a future range, summarize what
997  * we've got and start afresh. Note the scan might have skipped many
998  * pages, if they were devoid of live tuples; make sure to insert index
999  * tuples for those too.
1000  */
1001  while (thisblock > state->bs_currRangeStart + state->bs_pagesPerRange - 1)
1002  {
1003 
1004  BRIN_elog((DEBUG2,
1005  "brinbuildCallback: completed a range: %u--%u",
1006  state->bs_currRangeStart,
1007  state->bs_currRangeStart + state->bs_pagesPerRange));
1008 
1009  /* create the index tuple and insert it */
1011 
1012  /* set state to correspond to the next range */
1013  state->bs_currRangeStart += state->bs_pagesPerRange;
1014 
1015  /* re-initialize state for it */
1016  brin_memtuple_initialize(state->bs_dtuple, state->bs_bdesc);
1017  }
1018 
1019  /* Accumulate the current tuple into the running state */
1020  (void) add_values_to_range(index, state->bs_bdesc, state->bs_dtuple,
1021  values, isnull);
1022 }
static bool add_values_to_range(Relation idxRel, BrinDesc *bdesc, BrinMemTuple *dtup, const Datum *values, const bool *nulls)
Definition: brin.c:2194
#define BRIN_elog(args)
Definition: brin_internal.h:85
BrinMemTuple * brin_memtuple_initialize(BrinMemTuple *dtuple, BrinDesc *brdesc)
Definition: brin_tuple.c:511
#define DEBUG2
Definition: elog.h:29
static BlockNumber ItemPointerGetBlockNumber(const ItemPointerData *pointer)
Definition: itemptr.h:103

References add_values_to_range(), BRIN_elog, brin_memtuple_initialize(), DEBUG2, form_and_insert_tuple(), ItemPointerGetBlockNumber(), and values.

Referenced by brinbuild(), and summarize_range().

◆ brinbuildCallbackParallel()

static void brinbuildCallbackParallel ( Relation  index,
ItemPointer  tid,
Datum values,
bool isnull,
bool  tupleIsAlive,
void *  brstate 
)
static

Definition at line 1034 of file brin.c.

1040 {
1041  BrinBuildState *state = (BrinBuildState *) brstate;
1042  BlockNumber thisblock;
1043 
1044  thisblock = ItemPointerGetBlockNumber(tid);
1045 
1046  /*
1047  * If we're in a block that belongs to a different range, summarize what
1048  * we've got and start afresh. Note the scan might have skipped many
1049  * pages, if they were devoid of live tuples; we do not create empty BRIN
1050  * ranges here - the leader is responsible for filling them in.
1051  *
1052  * Unlike serial builds, parallel index builds allow synchronized seqscans
1053  * (because that's what parallel scans do). This means the block may wrap
1054  * around to the beginning of the relation, so the condition needs to
1055  * check for both future and past ranges.
1056  */
1057  if ((thisblock < state->bs_currRangeStart) ||
1058  (thisblock > state->bs_currRangeStart + state->bs_pagesPerRange - 1))
1059  {
1060 
1061  BRIN_elog((DEBUG2,
1062  "brinbuildCallbackParallel: completed a range: %u--%u",
1063  state->bs_currRangeStart,
1064  state->bs_currRangeStart + state->bs_pagesPerRange));
1065 
1066  /* create the index tuple and write it into the tuplesort */
1068 
1069  /*
1070  * Set state to correspond to the next range (for this block).
1071  *
1072  * This skips ranges that are either empty (and so we don't get any
1073  * tuples to summarize), or processed by other workers. We can't
1074  * differentiate those cases here easily, so we leave it up to the
1075  * leader to fill empty ranges where needed.
1076  */
1077  state->bs_currRangeStart
1078  = state->bs_pagesPerRange * (thisblock / state->bs_pagesPerRange);
1079 
1080  /* re-initialize state for it */
1081  brin_memtuple_initialize(state->bs_dtuple, state->bs_bdesc);
1082  }
1083 
1084  /* Accumulate the current tuple into the running state */
1085  (void) add_values_to_range(index, state->bs_bdesc, state->bs_dtuple,
1086  values, isnull);
1087 }

References add_values_to_range(), BRIN_elog, brin_memtuple_initialize(), DEBUG2, form_and_spill_tuple(), ItemPointerGetBlockNumber(), and values.

Referenced by _brin_parallel_scan_and_build().

◆ brinbuildempty()

void brinbuildempty ( Relation  index)

Definition at line 1262 of file brin.c.

1263 {
1264  Buffer metabuf;
1265 
1266  /* An empty BRIN index has a metapage only. */
1267  metabuf = ExtendBufferedRel(BMR_REL(index), INIT_FORKNUM, NULL,
1269 
1270  /* Initialize and xlog metabuffer. */
1274  MarkBufferDirty(metabuf);
1275  log_newpage_buffer(metabuf, true);
1276  END_CRIT_SECTION();
1277 
1278  UnlockReleaseBuffer(metabuf);
1279 }
#define START_CRIT_SECTION()
Definition: miscadmin.h:149
#define END_CRIT_SECTION()
Definition: miscadmin.h:151
@ INIT_FORKNUM
Definition: relpath.h:61
XLogRecPtr log_newpage_buffer(Buffer buffer, bool page_std)
Definition: xloginsert.c:1237

References BMR_REL, BRIN_CURRENT_VERSION, brin_metapage_init(), BrinGetPagesPerRange, BufferGetPage(), EB_LOCK_FIRST, EB_SKIP_EXTENSION_LOCK, END_CRIT_SECTION, ExtendBufferedRel(), INIT_FORKNUM, log_newpage_buffer(), MarkBufferDirty(), START_CRIT_SECTION, and UnlockReleaseBuffer().

Referenced by brinhandler().

◆ brinbulkdelete()

IndexBulkDeleteResult* brinbulkdelete ( IndexVacuumInfo info,
IndexBulkDeleteResult stats,
IndexBulkDeleteCallback  callback,
void *  callback_state 
)

Definition at line 1291 of file brin.c.

1293 {
1294  /* allocate stats if first time through, else re-use existing struct */
1295  if (stats == NULL)
1297 
1298  return stats;
1299 }
#define palloc0_object(type)
Definition: fe_memutils.h:63

References palloc0_object.

Referenced by brinhandler().

◆ brinendscan()

void brinendscan ( IndexScanDesc  scan)

Definition at line 966 of file brin.c.

967 {
968  BrinOpaque *opaque = (BrinOpaque *) scan->opaque;
969 
971  brin_free_desc(opaque->bo_bdesc);
972  pfree(opaque);
973 }
void brin_free_desc(BrinDesc *bdesc)
Definition: brin.c:1625

References BrinOpaque::bo_bdesc, BrinOpaque::bo_rmAccess, brin_free_desc(), brinRevmapTerminate(), IndexScanDescData::opaque, and pfree().

Referenced by brinhandler().

◆ bringetbitmap()

int64 bringetbitmap ( IndexScanDesc  scan,
TIDBitmap tbm 
)

Definition at line 557 of file brin.c.

558 {
559  Relation idxRel = scan->indexRelation;
561  BrinDesc *bdesc;
562  Oid heapOid;
563  Relation heapRel;
564  BrinOpaque *opaque;
565  BlockNumber nblocks;
566  BlockNumber heapBlk;
567  int totalpages = 0;
568  FmgrInfo *consistentFn;
569  MemoryContext oldcxt;
570  MemoryContext perRangeCxt;
571  BrinMemTuple *dtup;
572  BrinTuple *btup = NULL;
573  Size btupsz = 0;
574  ScanKey **keys,
575  **nullkeys;
576  int *nkeys,
577  *nnullkeys;
578  char *ptr;
579  Size len;
580  char *tmp PG_USED_FOR_ASSERTS_ONLY;
581 
582  opaque = (BrinOpaque *) scan->opaque;
583  bdesc = opaque->bo_bdesc;
584  pgstat_count_index_scan(idxRel);
585 
586  /*
587  * We need to know the size of the table so that we know how long to
588  * iterate on the revmap.
589  */
590  heapOid = IndexGetRelation(RelationGetRelid(idxRel), false);
591  heapRel = table_open(heapOid, AccessShareLock);
592  nblocks = RelationGetNumberOfBlocks(heapRel);
593  table_close(heapRel, AccessShareLock);
594 
595  /*
596  * Make room for the consistent support procedures of indexed columns. We
597  * don't look them up here; we do that lazily the first time we see a scan
598  * key reference each of them. We rely on zeroing fn_oid to InvalidOid.
599  */
600  consistentFn = palloc0_array(FmgrInfo, bdesc->bd_tupdesc->natts);
601 
602  /*
603  * Make room for per-attribute lists of scan keys that we'll pass to the
604  * consistent support procedure. We don't know which attributes have scan
605  * keys, so we allocate space for all attributes. That may use more memory
606  * but it's probably cheaper than determining which attributes are used.
607  *
608  * We keep null and regular keys separate, so that we can pass just the
609  * regular keys to the consistent function easily.
610  *
611  * To reduce the allocation overhead, we allocate one big chunk and then
612  * carve it into smaller arrays ourselves. All the pieces have exactly the
613  * same lifetime, so that's OK.
614  *
615  * XXX The widest index can have 32 attributes, so the amount of wasted
616  * memory is negligible. We could invent a more compact approach (with
617  * just space for used attributes) but that would make the matching more
618  * complex so it's not a good trade-off.
619  */
620  len =
621  MAXALIGN(sizeof(ScanKey *) * bdesc->bd_tupdesc->natts) + /* regular keys */
622  MAXALIGN(sizeof(ScanKey) * scan->numberOfKeys) * bdesc->bd_tupdesc->natts +
623  MAXALIGN(sizeof(int) * bdesc->bd_tupdesc->natts) +
624  MAXALIGN(sizeof(ScanKey *) * bdesc->bd_tupdesc->natts) + /* NULL keys */
625  MAXALIGN(sizeof(ScanKey) * scan->numberOfKeys) * bdesc->bd_tupdesc->natts +
626  MAXALIGN(sizeof(int) * bdesc->bd_tupdesc->natts);
627 
628  ptr = palloc(len);
629  tmp = ptr;
630 
631  keys = (ScanKey **) ptr;
632  ptr += MAXALIGN(sizeof(ScanKey *) * bdesc->bd_tupdesc->natts);
633 
634  nullkeys = (ScanKey **) ptr;
635  ptr += MAXALIGN(sizeof(ScanKey *) * bdesc->bd_tupdesc->natts);
636 
637  nkeys = (int *) ptr;
638  ptr += MAXALIGN(sizeof(int) * bdesc->bd_tupdesc->natts);
639 
640  nnullkeys = (int *) ptr;
641  ptr += MAXALIGN(sizeof(int) * bdesc->bd_tupdesc->natts);
642 
643  for (int i = 0; i < bdesc->bd_tupdesc->natts; i++)
644  {
645  keys[i] = (ScanKey *) ptr;
646  ptr += MAXALIGN(sizeof(ScanKey) * scan->numberOfKeys);
647 
648  nullkeys[i] = (ScanKey *) ptr;
649  ptr += MAXALIGN(sizeof(ScanKey) * scan->numberOfKeys);
650  }
651 
652  Assert(tmp + len == ptr);
653 
654  /* zero the number of keys */
655  memset(nkeys, 0, sizeof(int) * bdesc->bd_tupdesc->natts);
656  memset(nnullkeys, 0, sizeof(int) * bdesc->bd_tupdesc->natts);
657 
658  /* Preprocess the scan keys - split them into per-attribute arrays. */
659  for (int keyno = 0; keyno < scan->numberOfKeys; keyno++)
660  {
661  ScanKey key = &scan->keyData[keyno];
662  AttrNumber keyattno = key->sk_attno;
663 
664  /*
665  * The collation of the scan key must match the collation used in the
666  * index column (but only if the search is not IS NULL/ IS NOT NULL).
667  * Otherwise we shouldn't be using this index ...
668  */
669  Assert((key->sk_flags & SK_ISNULL) ||
670  (key->sk_collation ==
671  TupleDescAttr(bdesc->bd_tupdesc,
672  keyattno - 1)->attcollation));
673 
674  /*
675  * First time we see this index attribute, so init as needed.
676  *
677  * This is a bit of an overkill - we don't know how many scan keys are
678  * there for this attribute, so we simply allocate the largest number
679  * possible (as if all keys were for this attribute). This may waste a
680  * bit of memory, but we only expect small number of scan keys in
681  * general, so this should be negligible, and repeated repalloc calls
682  * are not free either.
683  */
684  if (consistentFn[keyattno - 1].fn_oid == InvalidOid)
685  {
686  FmgrInfo *tmp;
687 
688  /* First time we see this attribute, so no key/null keys. */
689  Assert(nkeys[keyattno - 1] == 0);
690  Assert(nnullkeys[keyattno - 1] == 0);
691 
692  tmp = index_getprocinfo(idxRel, keyattno,
694  fmgr_info_copy(&consistentFn[keyattno - 1], tmp,
696  }
697 
698  /* Add key to the proper per-attribute array. */
699  if (key->sk_flags & SK_ISNULL)
700  {
701  nullkeys[keyattno - 1][nnullkeys[keyattno - 1]] = key;
702  nnullkeys[keyattno - 1]++;
703  }
704  else
705  {
706  keys[keyattno - 1][nkeys[keyattno - 1]] = key;
707  nkeys[keyattno - 1]++;
708  }
709  }
710 
711  /* allocate an initial in-memory tuple, out of the per-range memcxt */
712  dtup = brin_new_memtuple(bdesc);
713 
714  /*
715  * Setup and use a per-range memory context, which is reset every time we
716  * loop below. This avoids having to free the tuples within the loop.
717  */
719  "bringetbitmap cxt",
721  oldcxt = MemoryContextSwitchTo(perRangeCxt);
722 
723  /*
724  * Now scan the revmap. We start by querying for heap page 0,
725  * incrementing by the number of pages per range; this gives us a full
726  * view of the table.
727  */
728  for (heapBlk = 0; heapBlk < nblocks; heapBlk += opaque->bo_pagesPerRange)
729  {
730  bool addrange;
731  bool gottuple = false;
732  BrinTuple *tup;
733  OffsetNumber off;
734  Size size;
735 
737 
738  MemoryContextReset(perRangeCxt);
739 
740  tup = brinGetTupleForHeapBlock(opaque->bo_rmAccess, heapBlk, &buf,
741  &off, &size, BUFFER_LOCK_SHARE);
742  if (tup)
743  {
744  gottuple = true;
745  btup = brin_copy_tuple(tup, size, btup, &btupsz);
747  }
748 
749  /*
750  * For page ranges with no indexed tuple, we must return the whole
751  * range; otherwise, compare it to the scan keys.
752  */
753  if (!gottuple)
754  {
755  addrange = true;
756  }
757  else
758  {
759  dtup = brin_deform_tuple(bdesc, btup, dtup);
760  if (dtup->bt_placeholder)
761  {
762  /*
763  * Placeholder tuples are always returned, regardless of the
764  * values stored in them.
765  */
766  addrange = true;
767  }
768  else
769  {
770  int attno;
771 
772  /*
773  * Compare scan keys with summary values stored for the range.
774  * If scan keys are matched, the page range must be added to
775  * the bitmap. We initially assume the range needs to be
776  * added; in particular this serves the case where there are
777  * no keys.
778  */
779  addrange = true;
780  for (attno = 1; attno <= bdesc->bd_tupdesc->natts; attno++)
781  {
782  BrinValues *bval;
783  Datum add;
784  Oid collation;
785 
786  /*
787  * skip attributes without any scan keys (both regular and
788  * IS [NOT] NULL)
789  */
790  if (nkeys[attno - 1] == 0 && nnullkeys[attno - 1] == 0)
791  continue;
792 
793  bval = &dtup->bt_columns[attno - 1];
794 
795  /*
796  * If the BRIN tuple indicates that this range is empty,
797  * we can skip it: there's nothing to match. We don't
798  * need to examine the next columns.
799  */
800  if (dtup->bt_empty_range)
801  {
802  addrange = false;
803  break;
804  }
805 
806  /*
807  * First check if there are any IS [NOT] NULL scan keys,
808  * and if we're violating them. In that case we can
809  * terminate early, without invoking the support function.
810  *
811  * As there may be more keys, we can only determine
812  * mismatch within this loop.
813  */
814  if (bdesc->bd_info[attno - 1]->oi_regular_nulls &&
815  !check_null_keys(bval, nullkeys[attno - 1],
816  nnullkeys[attno - 1]))
817  {
818  /*
819  * If any of the IS [NOT] NULL keys failed, the page
820  * range as a whole can't pass. So terminate the loop.
821  */
822  addrange = false;
823  break;
824  }
825 
826  /*
827  * So either there are no IS [NOT] NULL keys, or all
828  * passed. If there are no regular scan keys, we're done -
829  * the page range matches. If there are regular keys, but
830  * the page range is marked as 'all nulls' it can't
831  * possibly pass (we're assuming the operators are
832  * strict).
833  */
834 
835  /* No regular scan keys - page range as a whole passes. */
836  if (!nkeys[attno - 1])
837  continue;
838 
839  Assert((nkeys[attno - 1] > 0) &&
840  (nkeys[attno - 1] <= scan->numberOfKeys));
841 
842  /* If it is all nulls, it cannot possibly be consistent. */
843  if (bval->bv_allnulls)
844  {
845  addrange = false;
846  break;
847  }
848 
849  /*
850  * Collation from the first key (has to be the same for
851  * all keys for the same attribute).
852  */
853  collation = keys[attno - 1][0]->sk_collation;
854 
855  /*
856  * Check whether the scan key is consistent with the page
857  * range values; if so, have the pages in the range added
858  * to the output bitmap.
859  *
860  * The opclass may or may not support processing of
861  * multiple scan keys. We can determine that based on the
862  * number of arguments - functions with extra parameter
863  * (number of scan keys) do support this, otherwise we
864  * have to simply pass the scan keys one by one.
865  */
866  if (consistentFn[attno - 1].fn_nargs >= 4)
867  {
868  /* Check all keys at once */
869  add = FunctionCall4Coll(&consistentFn[attno - 1],
870  collation,
871  PointerGetDatum(bdesc),
872  PointerGetDatum(bval),
873  PointerGetDatum(keys[attno - 1]),
874  Int32GetDatum(nkeys[attno - 1]));
875  addrange = DatumGetBool(add);
876  }
877  else
878  {
879  /*
880  * Check keys one by one
881  *
882  * When there are multiple scan keys, failure to meet
883  * the criteria for a single one of them is enough to
884  * discard the range as a whole, so break out of the
885  * loop as soon as a false return value is obtained.
886  */
887  int keyno;
888 
889  for (keyno = 0; keyno < nkeys[attno - 1]; keyno++)
890  {
891  add = FunctionCall3Coll(&consistentFn[attno - 1],
892  keys[attno - 1][keyno]->sk_collation,
893  PointerGetDatum(bdesc),
894  PointerGetDatum(bval),
895  PointerGetDatum(keys[attno - 1][keyno]));
896  addrange = DatumGetBool(add);
897  if (!addrange)
898  break;
899  }
900  }
901 
902  /*
903  * If we found a scan key eliminating the range, no need
904  * to check additional ones.
905  */
906  if (!addrange)
907  break;
908  }
909  }
910  }
911 
912  /* add the pages in the range to the output bitmap, if needed */
913  if (addrange)
914  {
915  BlockNumber pageno;
916 
917  for (pageno = heapBlk;
918  pageno <= Min(nblocks, heapBlk + opaque->bo_pagesPerRange) - 1;
919  pageno++)
920  {
921  MemoryContextSwitchTo(oldcxt);
922  tbm_add_page(tbm, pageno);
923  totalpages++;
924  MemoryContextSwitchTo(perRangeCxt);
925  }
926  }
927  }
928 
929  MemoryContextSwitchTo(oldcxt);
930  MemoryContextDelete(perRangeCxt);
931 
932  if (buf != InvalidBuffer)
934 
935  /*
936  * XXX We have an approximation of the number of *pages* that our scan
937  * returns, but we don't have a precise idea of the number of heap tuples
938  * involved.
939  */
940  return totalpages * 10;
941 }
int16 AttrNumber
Definition: attnum.h:21
static bool check_null_keys(BrinValues *bval, ScanKey *nullkeys, int nnullkeys)
Definition: brin.c:2288
#define BRIN_PROCNUM_CONSISTENT
Definition: brin_internal.h:72
BrinTuple * brinGetTupleForHeapBlock(BrinRevmap *revmap, BlockNumber heapBlk, Buffer *buf, OffsetNumber *off, Size *size, int mode)
Definition: brin_revmap.c:194
BrinTuple * brin_copy_tuple(BrinTuple *tuple, Size len, BrinTuple *dest, Size *destsz)
Definition: brin_tuple.c:446
#define InvalidBuffer
Definition: buf.h:25
void LockBuffer(Buffer buffer, int mode)
Definition: bufmgr.c:5140
#define BUFFER_LOCK_UNLOCK
Definition: bufmgr.h:189
#define BUFFER_LOCK_SHARE
Definition: bufmgr.h:190
#define Min(x, y)
Definition: c.h:1004
#define MAXALIGN(LEN)
Definition: c.h:811
#define PG_USED_FOR_ASSERTS_ONLY
Definition: c.h:182
#define palloc0_array(type, count)
Definition: fe_memutils.h:65
Datum FunctionCall3Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2, Datum arg3)
Definition: fmgr.c:1171
void fmgr_info_copy(FmgrInfo *dstinfo, FmgrInfo *srcinfo, MemoryContext destcxt)
Definition: fmgr.c:580
#define AccessShareLock
Definition: lockdefs.h:36
uint16 OffsetNumber
Definition: off.h:24
#define pgstat_count_index_scan(rel)
Definition: pgstat.h:658
static Datum Int32GetDatum(int32 X)
Definition: postgres.h:212
static void addrange(struct cvec *cv, chr from, chr to)
Definition: regc_cvec.c:90
#define SK_ISNULL
Definition: skey.h:115
static pg_noinline void Size size
Definition: slab.c:607
bool bt_placeholder
Definition: brin_tuple.h:46
struct ScanKeyData * keyData
Definition: relscan.h:122
Relation indexRelation
Definition: relscan.h:118
Oid sk_collation
Definition: skey.h:70
void tbm_add_page(TIDBitmap *tbm, BlockNumber pageno)
Definition: tidbitmap.c:443

References AccessShareLock, addrange(), ALLOCSET_DEFAULT_SIZES, AllocSetContextCreate, Assert, BrinDesc::bd_info, BrinDesc::bd_tupdesc, BrinOpaque::bo_bdesc, BrinOpaque::bo_pagesPerRange, BrinOpaque::bo_rmAccess, brin_copy_tuple(), brin_deform_tuple(), brin_new_memtuple(), BRIN_PROCNUM_CONSISTENT, brinGetTupleForHeapBlock(), BrinMemTuple::bt_columns, BrinMemTuple::bt_empty_range, BrinMemTuple::bt_placeholder, buf, BUFFER_LOCK_SHARE, BUFFER_LOCK_UNLOCK, BrinValues::bv_allnulls, CHECK_FOR_INTERRUPTS, check_null_keys(), CurrentMemoryContext, DatumGetBool(), fmgr_info_copy(), FunctionCall3Coll(), FunctionCall4Coll(), i, index_getprocinfo(), IndexGetRelation(), IndexScanDescData::indexRelation, Int32GetDatum(), InvalidBuffer, InvalidOid, sort-test::key, IndexScanDescData::keyData, len, LockBuffer(), MAXALIGN, MemoryContextDelete(), MemoryContextReset(), MemoryContextSwitchTo(), Min, TupleDescData::natts, IndexScanDescData::numberOfKeys, BrinOpcInfo::oi_regular_nulls, IndexScanDescData::opaque, palloc(), palloc0_array, PG_USED_FOR_ASSERTS_ONLY, pgstat_count_index_scan, PointerGetDatum(), RelationGetNumberOfBlocks, RelationGetRelid, ReleaseBuffer(), size, ScanKeyData::sk_collation, SK_ISNULL, table_close(), table_open(), tbm_add_page(), and TupleDescAttr.

Referenced by brinhandler().

◆ brinGetStats()

void brinGetStats ( Relation  index,
BrinStatsData stats 
)

Definition at line 1637 of file brin.c.

1638 {
1639  Buffer metabuffer;
1640  Page metapage;
1641  BrinMetaPageData *metadata;
1642 
1643  metabuffer = ReadBuffer(index, BRIN_METAPAGE_BLKNO);
1644  LockBuffer(metabuffer, BUFFER_LOCK_SHARE);
1645  metapage = BufferGetPage(metabuffer);
1646  metadata = (BrinMetaPageData *) PageGetContents(metapage);
1647 
1648  stats->pagesPerRange = metadata->pagesPerRange;
1649  stats->revmapNumPages = metadata->lastRevmapPage - 1;
1650 
1651  UnlockReleaseBuffer(metabuffer);
1652 }
Buffer ReadBuffer(Relation reln, BlockNumber blockNum)
Definition: bufmgr.c:746
static char * PageGetContents(Page page)
Definition: bufpage.h:257
BlockNumber lastRevmapPage
Definition: brin_page.h:69
BlockNumber pagesPerRange
Definition: brin_page.h:68
BlockNumber revmapNumPages
Definition: brin.h:35
BlockNumber pagesPerRange
Definition: brin.h:34

References BRIN_METAPAGE_BLKNO, BUFFER_LOCK_SHARE, BufferGetPage(), BrinMetaPageData::lastRevmapPage, LockBuffer(), PageGetContents(), BrinStatsData::pagesPerRange, BrinMetaPageData::pagesPerRange, ReadBuffer(), BrinStatsData::revmapNumPages, and UnlockReleaseBuffer().

Referenced by brincostestimate().

◆ brinhandler()

Datum brinhandler ( PG_FUNCTION_ARGS  )

Definition at line 247 of file brin.c.

248 {
249  IndexAmRoutine *amroutine = makeNode(IndexAmRoutine);
250 
251  amroutine->amstrategies = 0;
253  amroutine->amoptsprocnum = BRIN_PROCNUM_OPTIONS;
254  amroutine->amcanorder = false;
255  amroutine->amcanorderbyop = false;
256  amroutine->amcanbackward = false;
257  amroutine->amcanunique = false;
258  amroutine->amcanmulticol = true;
259  amroutine->amoptionalkey = true;
260  amroutine->amsearcharray = false;
261  amroutine->amsearchnulls = true;
262  amroutine->amstorage = true;
263  amroutine->amclusterable = false;
264  amroutine->ampredlocks = false;
265  amroutine->amcanparallel = false;
266  amroutine->amcanbuildparallel = true;
267  amroutine->amcaninclude = false;
268  amroutine->amusemaintenanceworkmem = false;
269  amroutine->amsummarizing = true;
270  amroutine->amparallelvacuumoptions =
272  amroutine->amkeytype = InvalidOid;
273 
274  amroutine->ambuild = brinbuild;
275  amroutine->ambuildempty = brinbuildempty;
276  amroutine->aminsert = brininsert;
277  amroutine->aminsertcleanup = brininsertcleanup;
278  amroutine->ambulkdelete = brinbulkdelete;
279  amroutine->amvacuumcleanup = brinvacuumcleanup;
280  amroutine->amcanreturn = NULL;
281  amroutine->amcostestimate = brincostestimate;
282  amroutine->amgettreeheight = NULL;
283  amroutine->amoptions = brinoptions;
284  amroutine->amproperty = NULL;
285  amroutine->ambuildphasename = NULL;
286  amroutine->amvalidate = brinvalidate;
287  amroutine->amadjustmembers = NULL;
288  amroutine->ambeginscan = brinbeginscan;
289  amroutine->amrescan = brinrescan;
290  amroutine->amgettuple = NULL;
291  amroutine->amgetbitmap = bringetbitmap;
292  amroutine->amendscan = brinendscan;
293  amroutine->ammarkpos = NULL;
294  amroutine->amrestrpos = NULL;
295  amroutine->amestimateparallelscan = NULL;
296  amroutine->aminitparallelscan = NULL;
297  amroutine->amparallelrescan = NULL;
298 
299  PG_RETURN_POINTER(amroutine);
300 }
IndexBulkDeleteResult * brinvacuumcleanup(IndexVacuumInfo *info, IndexBulkDeleteResult *stats)
Definition: brin.c:1306
void brininsertcleanup(Relation index, IndexInfo *indexInfo)
Definition: brin.c:504
void brinrescan(IndexScanDesc scan, ScanKey scankey, int nscankeys, ScanKey orderbys, int norderbys)
Definition: brin.c:947
IndexScanDesc brinbeginscan(Relation r, int nkeys, int norderbys)
Definition: brin.c:529
IndexBuildResult * brinbuild(Relation heap, Relation index, IndexInfo *indexInfo)
Definition: brin.c:1093
int64 bringetbitmap(IndexScanDesc scan, TIDBitmap *tbm)
Definition: brin.c:557
void brinbuildempty(Relation index)
Definition: brin.c:1262
bool brininsert(Relation idxRel, Datum *values, bool *nulls, ItemPointer heaptid, Relation heapRel, IndexUniqueCheck checkUnique, bool indexUnchanged, IndexInfo *indexInfo)
Definition: brin.c:336
bytea * brinoptions(Datum reloptions, bool validate)
Definition: brin.c:1336
IndexBulkDeleteResult * brinbulkdelete(IndexVacuumInfo *info, IndexBulkDeleteResult *stats, IndexBulkDeleteCallback callback, void *callback_state)
Definition: brin.c:1291
void brinendscan(IndexScanDesc scan)
Definition: brin.c:966
#define BRIN_LAST_OPTIONAL_PROCNUM
Definition: brin_internal.h:78
#define BRIN_PROCNUM_OPTIONS
Definition: brin_internal.h:75
bool brinvalidate(Oid opclassoid)
Definition: brin_validate.c:37
#define PG_RETURN_POINTER(x)
Definition: fmgr.h:361
#define makeNode(_type_)
Definition: nodes.h:155
void brincostestimate(PlannerInfo *root, IndexPath *path, double loop_count, Cost *indexStartupCost, Cost *indexTotalCost, Selectivity *indexSelectivity, double *indexCorrelation, double *indexPages)
Definition: selfuncs.c:7981
ambuildphasename_function ambuildphasename
Definition: amapi.h:285
ambuildempty_function ambuildempty
Definition: amapi.h:275
amvacuumcleanup_function amvacuumcleanup
Definition: amapi.h:279
bool amclusterable
Definition: amapi.h:249
amoptions_function amoptions
Definition: amapi.h:283
amestimateparallelscan_function amestimateparallelscan
Definition: amapi.h:297
amrestrpos_function amrestrpos
Definition: amapi.h:294
aminsert_function aminsert
Definition: amapi.h:276
amendscan_function amendscan
Definition: amapi.h:292
uint16 amoptsprocnum
Definition: amapi.h:229
amparallelrescan_function amparallelrescan
Definition: amapi.h:299
Oid amkeytype
Definition: amapi.h:265
bool ampredlocks
Definition: amapi.h:251
uint16 amsupport
Definition: amapi.h:227
amcostestimate_function amcostestimate
Definition: amapi.h:281
bool amcanorderbyop
Definition: amapi.h:233
amadjustmembers_function amadjustmembers
Definition: amapi.h:287
ambuild_function ambuild
Definition: amapi.h:274
bool amstorage
Definition: amapi.h:247
uint16 amstrategies
Definition: amapi.h:225
bool amoptionalkey
Definition: amapi.h:241
amgettuple_function amgettuple
Definition: amapi.h:290
amcanreturn_function amcanreturn
Definition: amapi.h:280
bool amcanunique
Definition: amapi.h:237
amgetbitmap_function amgetbitmap
Definition: amapi.h:291
amproperty_function amproperty
Definition: amapi.h:284
ambulkdelete_function ambulkdelete
Definition: amapi.h:278
bool amsearcharray
Definition: amapi.h:243
bool amsummarizing
Definition: amapi.h:261
amvalidate_function amvalidate
Definition: amapi.h:286
ammarkpos_function ammarkpos
Definition: amapi.h:293
bool amcanmulticol
Definition: amapi.h:239
bool amusemaintenanceworkmem
Definition: amapi.h:259
ambeginscan_function ambeginscan
Definition: amapi.h:288
bool amcanparallel
Definition: amapi.h:253
amrescan_function amrescan
Definition: amapi.h:289
bool amcanorder
Definition: amapi.h:231
bool amcanbuildparallel
Definition: amapi.h:255
aminitparallelscan_function aminitparallelscan
Definition: amapi.h:298
uint8 amparallelvacuumoptions
Definition: amapi.h:263
aminsertcleanup_function aminsertcleanup
Definition: amapi.h:277
bool amcanbackward
Definition: amapi.h:235
amgettreeheight_function amgettreeheight
Definition: amapi.h:282
bool amcaninclude
Definition: amapi.h:257
bool amsearchnulls
Definition: amapi.h:245
#define VACUUM_OPTION_PARALLEL_CLEANUP
Definition: vacuum.h:63

References IndexAmRoutine::amadjustmembers, IndexAmRoutine::ambeginscan, IndexAmRoutine::ambuild, IndexAmRoutine::ambuildempty, IndexAmRoutine::ambuildphasename, IndexAmRoutine::ambulkdelete, IndexAmRoutine::amcanbackward, IndexAmRoutine::amcanbuildparallel, IndexAmRoutine::amcaninclude, IndexAmRoutine::amcanmulticol, IndexAmRoutine::amcanorder, IndexAmRoutine::amcanorderbyop, IndexAmRoutine::amcanparallel, IndexAmRoutine::amcanreturn, IndexAmRoutine::amcanunique, IndexAmRoutine::amclusterable, IndexAmRoutine::amcostestimate, IndexAmRoutine::amendscan, IndexAmRoutine::amestimateparallelscan, IndexAmRoutine::amgetbitmap, IndexAmRoutine::amgettreeheight, IndexAmRoutine::amgettuple, IndexAmRoutine::aminitparallelscan, IndexAmRoutine::aminsert, IndexAmRoutine::aminsertcleanup, IndexAmRoutine::amkeytype, IndexAmRoutine::ammarkpos, IndexAmRoutine::amoptionalkey, IndexAmRoutine::amoptions, IndexAmRoutine::amoptsprocnum, IndexAmRoutine::amparallelrescan, IndexAmRoutine::amparallelvacuumoptions, IndexAmRoutine::ampredlocks, IndexAmRoutine::amproperty, IndexAmRoutine::amrescan, IndexAmRoutine::amrestrpos, IndexAmRoutine::amsearcharray, IndexAmRoutine::amsearchnulls, IndexAmRoutine::amstorage, IndexAmRoutine::amstrategies, IndexAmRoutine::amsummarizing, IndexAmRoutine::amsupport, IndexAmRoutine::amusemaintenanceworkmem, IndexAmRoutine::amvacuumcleanup, IndexAmRoutine::amvalidate, BRIN_LAST_OPTIONAL_PROCNUM, BRIN_PROCNUM_OPTIONS, brinbeginscan(), brinbuild(), brinbuildempty(), brinbulkdelete(), brincostestimate(), brinendscan(), bringetbitmap(), brininsert(), brininsertcleanup(), brinoptions(), brinrescan(), brinvacuumcleanup(), brinvalidate(), InvalidOid, makeNode, PG_RETURN_POINTER, and VACUUM_OPTION_PARALLEL_CLEANUP.

◆ brininsert()

bool brininsert ( Relation  idxRel,
Datum values,
bool nulls,
ItemPointer  heaptid,
Relation  heapRel,
IndexUniqueCheck  checkUnique,
bool  indexUnchanged,
IndexInfo indexInfo 
)

Definition at line 336 of file brin.c.

341 {
342  BlockNumber pagesPerRange;
343  BlockNumber origHeapBlk;
344  BlockNumber heapBlk;
345  BrinInsertState *bistate = (BrinInsertState *) indexInfo->ii_AmCache;
346  BrinRevmap *revmap;
347  BrinDesc *bdesc;
349  MemoryContext tupcxt = NULL;
351  bool autosummarize = BrinGetAutoSummarize(idxRel);
352 
353  /*
354  * If first time through in this statement, initialize the insert state
355  * that we keep for all the inserts in the command.
356  */
357  if (!bistate)
358  bistate = initialize_brin_insertstate(idxRel, indexInfo);
359 
360  revmap = bistate->bis_rmAccess;
361  bdesc = bistate->bis_desc;
362  pagesPerRange = bistate->bis_pages_per_range;
363 
364  /*
365  * origHeapBlk is the block number where the insertion occurred. heapBlk
366  * is the first block in the corresponding page range.
367  */
368  origHeapBlk = ItemPointerGetBlockNumber(heaptid);
369  heapBlk = (origHeapBlk / pagesPerRange) * pagesPerRange;
370 
371  for (;;)
372  {
373  bool need_insert = false;
374  OffsetNumber off;
375  BrinTuple *brtup;
376  BrinMemTuple *dtup;
377 
379 
380  /*
381  * If auto-summarization is enabled and we just inserted the first
382  * tuple into the first block of a new non-first page range, request a
383  * summarization run of the previous range.
384  */
385  if (autosummarize &&
386  heapBlk > 0 &&
387  heapBlk == origHeapBlk &&
389  {
390  BlockNumber lastPageRange = heapBlk - 1;
391  BrinTuple *lastPageTuple;
392 
393  lastPageTuple =
394  brinGetTupleForHeapBlock(revmap, lastPageRange, &buf, &off,
395  NULL, BUFFER_LOCK_SHARE);
396  if (!lastPageTuple)
397  {
398  bool recorded;
399 
401  RelationGetRelid(idxRel),
402  lastPageRange);
403  if (!recorded)
404  ereport(LOG,
405  (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED),
406  errmsg("request for BRIN range summarization for index \"%s\" page %u was not recorded",
407  RelationGetRelationName(idxRel),
408  lastPageRange)));
409  }
410  else
412  }
413 
414  brtup = brinGetTupleForHeapBlock(revmap, heapBlk, &buf, &off,
415  NULL, BUFFER_LOCK_SHARE);
416 
417  /* if range is unsummarized, there's nothing to do */
418  if (!brtup)
419  break;
420 
421  /* First time through in this brininsert call? */
422  if (tupcxt == NULL)
423  {
425  "brininsert cxt",
427  MemoryContextSwitchTo(tupcxt);
428  }
429 
430  dtup = brin_deform_tuple(bdesc, brtup, NULL);
431 
432  need_insert = add_values_to_range(idxRel, bdesc, dtup, values, nulls);
433 
434  if (!need_insert)
435  {
436  /*
437  * The tuple is consistent with the new values, so there's nothing
438  * to do.
439  */
441  }
442  else
443  {
444  Page page = BufferGetPage(buf);
445  ItemId lp = PageGetItemId(page, off);
446  Size origsz;
447  BrinTuple *origtup;
448  Size newsz;
449  BrinTuple *newtup;
450  bool samepage;
451 
452  /*
453  * Make a copy of the old tuple, so that we can compare it after
454  * re-acquiring the lock.
455  */
456  origsz = ItemIdGetLength(lp);
457  origtup = brin_copy_tuple(brtup, origsz, NULL, NULL);
458 
459  /*
460  * Before releasing the lock, check if we can attempt a same-page
461  * update. Another process could insert a tuple concurrently in
462  * the same page though, so downstream we must be prepared to cope
463  * if this turns out to not be possible after all.
464  */
465  newtup = brin_form_tuple(bdesc, heapBlk, dtup, &newsz);
466  samepage = brin_can_do_samepage_update(buf, origsz, newsz);
468 
469  /*
470  * Try to update the tuple. If this doesn't work for whatever
471  * reason, we need to restart from the top; the revmap might be
472  * pointing at a different tuple for this block now, so we need to
473  * recompute to ensure both our new heap tuple and the other
474  * inserter's are covered by the combined tuple. It might be that
475  * we don't need to update at all.
476  */
477  if (!brin_doupdate(idxRel, pagesPerRange, revmap, heapBlk,
478  buf, off, origtup, origsz, newtup, newsz,
479  samepage))
480  {
481  /* no luck; start over */
482  MemoryContextReset(tupcxt);
483  continue;
484  }
485  }
486 
487  /* success! */
488  break;
489  }
490 
491  if (BufferIsValid(buf))
493  MemoryContextSwitchTo(oldcxt);
494  if (tupcxt != NULL)
495  MemoryContextDelete(tupcxt);
496 
497  return false;
498 }
bool AutoVacuumRequestWork(AutoVacuumWorkItemType type, Oid relationId, BlockNumber blkno)
Definition: autovacuum.c:3211
@ AVW_BRINSummarizeRange
Definition: autovacuum.h:25
static BrinInsertState * initialize_brin_insertstate(Relation idxRel, IndexInfo *indexInfo)
Definition: brin.c:307
#define BrinGetAutoSummarize(relation)
Definition: brin.h:46
bool brin_doupdate(Relation idxrel, BlockNumber pagesPerRange, BrinRevmap *revmap, BlockNumber heapBlk, Buffer oldbuf, OffsetNumber oldoff, const BrinTuple *origtup, Size origsz, const BrinTuple *newtup, Size newsz, bool samepage)
Definition: brin_pageops.c:53
bool brin_can_do_samepage_update(Buffer buffer, Size origsz, Size newsz)
Definition: brin_pageops.c:323
static bool BufferIsValid(Buffer bufnum)
Definition: bufmgr.h:351
static ItemId PageGetItemId(Page page, OffsetNumber offsetNumber)
Definition: bufpage.h:243
#define LOG
Definition: elog.h:31
#define ItemIdGetLength(itemId)
Definition: itemid.h:59
static OffsetNumber ItemPointerGetOffsetNumber(const ItemPointerData *pointer)
Definition: itemptr.h:124
#define FirstOffsetNumber
Definition: off.h:27
BrinDesc * bis_desc
Definition: brin.c:192
BrinRevmap * bis_rmAccess
Definition: brin.c:191
BlockNumber bis_pages_per_range
Definition: brin.c:193
void * ii_AmCache
Definition: execnodes.h:210

References add_values_to_range(), ALLOCSET_DEFAULT_SIZES, AllocSetContextCreate, AutoVacuumRequestWork(), AVW_BRINSummarizeRange, BrinInsertState::bis_desc, BrinInsertState::bis_pages_per_range, BrinInsertState::bis_rmAccess, brin_can_do_samepage_update(), brin_copy_tuple(), brin_deform_tuple(), brin_doupdate(), brin_form_tuple(), BrinGetAutoSummarize, brinGetTupleForHeapBlock(), buf, BUFFER_LOCK_SHARE, BUFFER_LOCK_UNLOCK, BufferGetPage(), BufferIsValid(), CHECK_FOR_INTERRUPTS, CurrentMemoryContext, ereport, errcode(), errmsg(), FirstOffsetNumber, IndexInfo::ii_AmCache, initialize_brin_insertstate(), InvalidBuffer, ItemIdGetLength, ItemPointerGetBlockNumber(), ItemPointerGetOffsetNumber(), LockBuffer(), LOG, MemoryContextDelete(), MemoryContextReset(), MemoryContextSwitchTo(), PageGetItemId(), RelationGetRelationName, RelationGetRelid, ReleaseBuffer(), and values.

Referenced by brinhandler().

◆ brininsertcleanup()

void brininsertcleanup ( Relation  index,
IndexInfo indexInfo 
)

Definition at line 504 of file brin.c.

505 {
506  BrinInsertState *bistate = (BrinInsertState *) indexInfo->ii_AmCache;
507 
508  /* bail out if cache not initialized */
509  if (indexInfo->ii_AmCache == NULL)
510  return;
511 
512  /*
513  * Clean up the revmap. Note that the brinDesc has already been cleaned up
514  * as part of its own memory context.
515  */
517  bistate->bis_rmAccess = NULL;
518  bistate->bis_desc = NULL;
519 }
if(TABLE==NULL||TABLE_index==NULL)
Definition: isn.c:77

References BrinInsertState::bis_desc, BrinInsertState::bis_rmAccess, brinRevmapTerminate(), if(), and IndexInfo::ii_AmCache.

Referenced by brinhandler().

◆ brinoptions()

bytea* brinoptions ( Datum  reloptions,
bool  validate 
)

Definition at line 1336 of file brin.c.

1337 {
1338  static const relopt_parse_elt tab[] = {
1339  {"pages_per_range", RELOPT_TYPE_INT, offsetof(BrinOptions, pagesPerRange)},
1340  {"autosummarize", RELOPT_TYPE_BOOL, offsetof(BrinOptions, autosummarize)}
1341  };
1342 
1343  return (bytea *) build_reloptions(reloptions, validate,
1345  sizeof(BrinOptions),
1346  tab, lengthof(tab));
1347 }
#define lengthof(array)
Definition: c.h:788
void * build_reloptions(Datum reloptions, bool validate, relopt_kind kind, Size relopt_struct_size, const relopt_parse_elt *relopt_elems, int num_relopt_elems)
Definition: reloptions.c:1908
@ RELOPT_KIND_BRIN
Definition: reloptions.h:52
@ RELOPT_TYPE_INT
Definition: reloptions.h:32
@ RELOPT_TYPE_BOOL
Definition: reloptions.h:31
Definition: c.h:687

References build_reloptions(), lengthof, RELOPT_KIND_BRIN, RELOPT_TYPE_BOOL, and RELOPT_TYPE_INT.

Referenced by brinhandler().

◆ brinrescan()

void brinrescan ( IndexScanDesc  scan,
ScanKey  scankey,
int  nscankeys,
ScanKey  orderbys,
int  norderbys 
)

Definition at line 947 of file brin.c.

949 {
950  /*
951  * Other index AMs preprocess the scan keys at this point, or sometime
952  * early during the scan; this lets them optimize by removing redundant
953  * keys, or doing early returns when they are impossible to satisfy; see
954  * _bt_preprocess_keys for an example. Something like that could be added
955  * here someday, too.
956  */
957 
958  if (scankey && scan->numberOfKeys > 0)
959  memcpy(scan->keyData, scankey, scan->numberOfKeys * sizeof(ScanKeyData));
960 }

References IndexScanDescData::keyData, and IndexScanDescData::numberOfKeys.

Referenced by brinhandler().

◆ brinsummarize()

static void brinsummarize ( Relation  index,
Relation  heapRel,
BlockNumber  pageRange,
bool  include_partial,
double *  numSummarized,
double *  numExisting 
)
static

Definition at line 1876 of file brin.c.

1878 {
1879  BrinRevmap *revmap;
1880  BrinBuildState *state = NULL;
1881  IndexInfo *indexInfo = NULL;
1882  BlockNumber heapNumBlocks;
1883  BlockNumber pagesPerRange;
1884  Buffer buf;
1885  BlockNumber startBlk;
1886 
1887  revmap = brinRevmapInitialize(index, &pagesPerRange);
1888 
1889  /* determine range of pages to process */
1890  heapNumBlocks = RelationGetNumberOfBlocks(heapRel);
1891  if (pageRange == BRIN_ALL_BLOCKRANGES)
1892  startBlk = 0;
1893  else
1894  {
1895  startBlk = (pageRange / pagesPerRange) * pagesPerRange;
1896  heapNumBlocks = Min(heapNumBlocks, startBlk + pagesPerRange);
1897  }
1898  if (startBlk > heapNumBlocks)
1899  {
1900  /* Nothing to do if start point is beyond end of table */
1901  brinRevmapTerminate(revmap);
1902  return;
1903  }
1904 
1905  /*
1906  * Scan the revmap to find unsummarized items.
1907  */
1908  buf = InvalidBuffer;
1909  for (; startBlk < heapNumBlocks; startBlk += pagesPerRange)
1910  {
1911  BrinTuple *tup;
1912  OffsetNumber off;
1913 
1914  /*
1915  * Unless requested to summarize even a partial range, go away now if
1916  * we think the next range is partial. Caller would pass true when it
1917  * is typically run once bulk data loading is done
1918  * (brin_summarize_new_values), and false when it is typically the
1919  * result of arbitrarily-scheduled maintenance command (vacuuming).
1920  */
1921  if (!include_partial &&
1922  (startBlk + pagesPerRange > heapNumBlocks))
1923  break;
1924 
1926 
1927  tup = brinGetTupleForHeapBlock(revmap, startBlk, &buf, &off, NULL,
1929  if (tup == NULL)
1930  {
1931  /* no revmap entry for this heap range. Summarize it. */
1932  if (state == NULL)
1933  {
1934  /* first time through */
1935  Assert(!indexInfo);
1937  pagesPerRange,
1939  indexInfo = BuildIndexInfo(index);
1940  }
1941  summarize_range(indexInfo, state, heapRel, startBlk, heapNumBlocks);
1942 
1943  /* and re-initialize state for the next range */
1944  brin_memtuple_initialize(state->bs_dtuple, state->bs_bdesc);
1945 
1946  if (numSummarized)
1947  *numSummarized += 1.0;
1948  }
1949  else
1950  {
1951  if (numExisting)
1952  *numExisting += 1.0;
1954  }
1955  }
1956 
1957  if (BufferIsValid(buf))
1958  ReleaseBuffer(buf);
1959 
1960  /* free resources */
1961  brinRevmapTerminate(revmap);
1962  if (state)
1963  {
1965  pfree(indexInfo);
1966  }
1967 }
static void summarize_range(IndexInfo *indexInfo, BrinBuildState *state, Relation heapRel, BlockNumber heapBlk, BlockNumber heapNumBlks)
Definition: brin.c:1750

References Assert, BRIN_ALL_BLOCKRANGES, brin_memtuple_initialize(), brinGetTupleForHeapBlock(), brinRevmapInitialize(), brinRevmapTerminate(), buf, BUFFER_LOCK_SHARE, BUFFER_LOCK_UNLOCK, BufferIsValid(), BuildIndexInfo(), CHECK_FOR_INTERRUPTS, initialize_brin_buildstate(), InvalidBlockNumber, InvalidBuffer, LockBuffer(), Min, pfree(), RelationGetNumberOfBlocks, ReleaseBuffer(), summarize_range(), and terminate_brin_buildstate().

Referenced by brin_summarize_range(), and brinvacuumcleanup().

◆ brinvacuumcleanup()

IndexBulkDeleteResult* brinvacuumcleanup ( IndexVacuumInfo info,
IndexBulkDeleteResult stats 
)

Definition at line 1306 of file brin.c.

1307 {
1308  Relation heapRel;
1309 
1310  /* No-op in ANALYZE ONLY mode */
1311  if (info->analyze_only)
1312  return stats;
1313 
1314  if (!stats)
1316  stats->num_pages = RelationGetNumberOfBlocks(info->index);
1317  /* rest of stats is initialized by zeroing */
1318 
1319  heapRel = table_open(IndexGetRelation(RelationGetRelid(info->index), false),
1320  AccessShareLock);
1321 
1322  brin_vacuum_scan(info->index, info->strategy);
1323 
1324  brinsummarize(info->index, heapRel, BRIN_ALL_BLOCKRANGES, false,
1325  &stats->num_index_tuples, &stats->num_index_tuples);
1326 
1327  table_close(heapRel, AccessShareLock);
1328 
1329  return stats;
1330 }
static void brin_vacuum_scan(Relation idxrel, BufferAccessStrategy strategy)
Definition: brin.c:2161
BlockNumber num_pages
Definition: genam.h:77
double num_index_tuples
Definition: genam.h:79
Relation index
Definition: genam.h:46
bool analyze_only
Definition: genam.h:48
BufferAccessStrategy strategy
Definition: genam.h:53

References AccessShareLock, IndexVacuumInfo::analyze_only, BRIN_ALL_BLOCKRANGES, brin_vacuum_scan(), brinsummarize(), IndexVacuumInfo::index, IndexGetRelation(), IndexBulkDeleteResult::num_index_tuples, IndexBulkDeleteResult::num_pages, palloc0_object, RelationGetNumberOfBlocks, RelationGetRelid, IndexVacuumInfo::strategy, table_close(), and table_open().

Referenced by brinhandler().

◆ check_null_keys()

static bool check_null_keys ( BrinValues bval,
ScanKey nullkeys,
int  nnullkeys 
)
static

Definition at line 2288 of file brin.c.

2289 {
2290  int keyno;
2291 
2292  /*
2293  * First check if there are any IS [NOT] NULL scan keys, and if we're
2294  * violating them.
2295  */
2296  for (keyno = 0; keyno < nnullkeys; keyno++)
2297  {
2298  ScanKey key = nullkeys[keyno];
2299 
2300  Assert(key->sk_attno == bval->bv_attno);
2301 
2302  /* Handle only IS NULL/IS NOT NULL tests */
2303  if (!(key->sk_flags & SK_ISNULL))
2304  continue;
2305 
2306  if (key->sk_flags & SK_SEARCHNULL)
2307  {
2308  /* IS NULL scan key, but range has no NULLs */
2309  if (!bval->bv_allnulls && !bval->bv_hasnulls)
2310  return false;
2311  }
2312  else if (key->sk_flags & SK_SEARCHNOTNULL)
2313  {
2314  /*
2315  * For IS NOT NULL, we can only skip ranges that are known to have
2316  * only nulls.
2317  */
2318  if (bval->bv_allnulls)
2319  return false;
2320  }
2321  else
2322  {
2323  /*
2324  * Neither IS NULL nor IS NOT NULL was used; assume all indexable
2325  * operators are strict and thus return false with NULL value in
2326  * the scan key.
2327  */
2328  return false;
2329  }
2330  }
2331 
2332  return true;
2333 }
#define SK_SEARCHNOTNULL
Definition: skey.h:122
#define SK_SEARCHNULL
Definition: skey.h:121
AttrNumber bv_attno
Definition: brin_tuple.h:31

References Assert, BrinValues::bv_allnulls, BrinValues::bv_attno, BrinValues::bv_hasnulls, sort-test::key, SK_ISNULL, SK_SEARCHNOTNULL, and SK_SEARCHNULL.

Referenced by bringetbitmap().

◆ form_and_insert_tuple()

static void form_and_insert_tuple ( BrinBuildState state)
static

Definition at line 1974 of file brin.c.

1975 {
1976  BrinTuple *tup;
1977  Size size;
1978 
1979  tup = brin_form_tuple(state->bs_bdesc, state->bs_currRangeStart,
1980  state->bs_dtuple, &size);
1981  brin_doinsert(state->bs_irel, state->bs_pagesPerRange, state->bs_rmAccess,
1982  &state->bs_currentInsertBuf, state->bs_currRangeStart,
1983  tup, size);
1984  state->bs_numtuples++;
1985 
1986  pfree(tup);
1987 }

References brin_doinsert(), brin_form_tuple(), pfree(), and size.

Referenced by brinbuild(), and brinbuildCallback().

◆ form_and_spill_tuple()

static void form_and_spill_tuple ( BrinBuildState state)
static

Definition at line 1995 of file brin.c.

1996 {
1997  BrinTuple *tup;
1998  Size size;
1999 
2000  /* don't insert empty tuples in parallel build */
2001  if (state->bs_dtuple->bt_empty_range)
2002  return;
2003 
2004  tup = brin_form_tuple(state->bs_bdesc, state->bs_currRangeStart,
2005  state->bs_dtuple, &size);
2006 
2007  /* write the BRIN tuple to the tuplesort */
2008  tuplesort_putbrintuple(state->bs_sortstate, tup, size);
2009 
2010  state->bs_numtuples++;
2011 
2012  pfree(tup);
2013 }
void tuplesort_putbrintuple(Tuplesortstate *state, BrinTuple *tuple, Size size)

References brin_form_tuple(), pfree(), size, and tuplesort_putbrintuple().

Referenced by _brin_parallel_scan_and_build(), and brinbuildCallbackParallel().

◆ initialize_brin_buildstate()

static BrinBuildState * initialize_brin_buildstate ( Relation  idxRel,
BrinRevmap revmap,
BlockNumber  pagesPerRange,
BlockNumber  tablePages 
)
static

Definition at line 1658 of file brin.c.

1660 {
1662  BlockNumber lastRange = 0;
1663 
1665 
1666  state->bs_irel = idxRel;
1667  state->bs_numtuples = 0;
1668  state->bs_reltuples = 0;
1669  state->bs_currentInsertBuf = InvalidBuffer;
1670  state->bs_pagesPerRange = pagesPerRange;
1671  state->bs_currRangeStart = 0;
1672  state->bs_rmAccess = revmap;
1673  state->bs_bdesc = brin_build_desc(idxRel);
1674  state->bs_dtuple = brin_new_memtuple(state->bs_bdesc);
1675  state->bs_leader = NULL;
1676  state->bs_worker_id = 0;
1677  state->bs_sortstate = NULL;
1678  state->bs_context = CurrentMemoryContext;
1679  state->bs_emptyTuple = NULL;
1680  state->bs_emptyTupleLen = 0;
1681 
1682  /* Remember the memory context to use for an empty tuple, if needed. */
1683  state->bs_context = CurrentMemoryContext;
1684  state->bs_emptyTuple = NULL;
1685  state->bs_emptyTupleLen = 0;
1686 
1687  /*
1688  * Calculate the start of the last page range. Page numbers are 0-based,
1689  * so to calculate the index we need to subtract one. The integer division
1690  * gives us the index of the page range.
1691  */
1692  if (tablePages > 0)
1693  lastRange = ((tablePages - 1) / pagesPerRange) * pagesPerRange;
1694 
1695  /* Now calculate the start of the next range. */
1696  state->bs_maxRangeStart = lastRange + state->bs_pagesPerRange;
1697 
1698  return state;
1699 }

References brin_build_desc(), brin_new_memtuple(), CurrentMemoryContext, InvalidBuffer, and palloc_object.

Referenced by _brin_parallel_build_main(), brinbuild(), and brinsummarize().

◆ initialize_brin_insertstate()

static BrinInsertState * initialize_brin_insertstate ( Relation  idxRel,
IndexInfo indexInfo 
)
static

Definition at line 307 of file brin.c.

308 {
309  BrinInsertState *bistate;
310  MemoryContext oldcxt;
311 
312  oldcxt = MemoryContextSwitchTo(indexInfo->ii_Context);
313  bistate = palloc0(sizeof(BrinInsertState));
314  bistate->bis_desc = brin_build_desc(idxRel);
315  bistate->bis_rmAccess = brinRevmapInitialize(idxRel,
316  &bistate->bis_pages_per_range);
317  indexInfo->ii_AmCache = bistate;
318  MemoryContextSwitchTo(oldcxt);
319 
320  return bistate;
321 }
MemoryContext ii_Context
Definition: execnodes.h:211

References BrinInsertState::bis_desc, BrinInsertState::bis_pages_per_range, BrinInsertState::bis_rmAccess, brin_build_desc(), brinRevmapInitialize(), IndexInfo::ii_AmCache, IndexInfo::ii_Context, MemoryContextSwitchTo(), and palloc0().

Referenced by brininsert().

◆ summarize_range()

static void summarize_range ( IndexInfo indexInfo,
BrinBuildState state,
Relation  heapRel,
BlockNumber  heapBlk,
BlockNumber  heapNumBlks 
)
static

Definition at line 1750 of file brin.c.

1752 {
1753  Buffer phbuf;
1754  BrinTuple *phtup;
1755  Size phsz;
1756  OffsetNumber offset;
1757  BlockNumber scanNumBlks;
1758 
1759  /*
1760  * Insert the placeholder tuple
1761  */
1762  phbuf = InvalidBuffer;
1763  phtup = brin_form_placeholder_tuple(state->bs_bdesc, heapBlk, &phsz);
1764  offset = brin_doinsert(state->bs_irel, state->bs_pagesPerRange,
1765  state->bs_rmAccess, &phbuf,
1766  heapBlk, phtup, phsz);
1767 
1768  /*
1769  * Compute range end. We hold ShareUpdateExclusive lock on table, so it
1770  * cannot shrink concurrently (but it can grow).
1771  */
1772  Assert(heapBlk % state->bs_pagesPerRange == 0);
1773  if (heapBlk + state->bs_pagesPerRange > heapNumBlks)
1774  {
1775  /*
1776  * If we're asked to scan what we believe to be the final range on the
1777  * table (i.e. a range that might be partial) we need to recompute our
1778  * idea of what the latest page is after inserting the placeholder
1779  * tuple. Anyone that grows the table later will update the
1780  * placeholder tuple, so it doesn't matter that we won't scan these
1781  * pages ourselves. Careful: the table might have been extended
1782  * beyond the current range, so clamp our result.
1783  *
1784  * Fortunately, this should occur infrequently.
1785  */
1786  scanNumBlks = Min(RelationGetNumberOfBlocks(heapRel) - heapBlk,
1787  state->bs_pagesPerRange);
1788  }
1789  else
1790  {
1791  /* Easy case: range is known to be complete */
1792  scanNumBlks = state->bs_pagesPerRange;
1793  }
1794 
1795  /*
1796  * Execute the partial heap scan covering the heap blocks in the specified
1797  * page range, summarizing the heap tuples in it. This scan stops just
1798  * short of brinbuildCallback creating the new index entry.
1799  *
1800  * Note that it is critical we use the "any visible" mode of
1801  * table_index_build_range_scan here: otherwise, we would miss tuples
1802  * inserted by transactions that are still in progress, among other corner
1803  * cases.
1804  */
1805  state->bs_currRangeStart = heapBlk;
1806  table_index_build_range_scan(heapRel, state->bs_irel, indexInfo, false, true, false,
1807  heapBlk, scanNumBlks,
1808  brinbuildCallback, (void *) state, NULL);
1809 
1810  /*
1811  * Now we update the values obtained by the scan with the placeholder
1812  * tuple. We do this in a loop which only terminates if we're able to
1813  * update the placeholder tuple successfully; if we are not, this means
1814  * somebody else modified the placeholder tuple after we read it.
1815  */
1816  for (;;)
1817  {
1818  BrinTuple *newtup;
1819  Size newsize;
1820  bool didupdate;
1821  bool samepage;
1822 
1824 
1825  /*
1826  * Update the summary tuple and try to update.
1827  */
1828  newtup = brin_form_tuple(state->bs_bdesc,
1829  heapBlk, state->bs_dtuple, &newsize);
1830  samepage = brin_can_do_samepage_update(phbuf, phsz, newsize);
1831  didupdate =
1832  brin_doupdate(state->bs_irel, state->bs_pagesPerRange,
1833  state->bs_rmAccess, heapBlk, phbuf, offset,
1834  phtup, phsz, newtup, newsize, samepage);
1835  brin_free_tuple(phtup);
1836  brin_free_tuple(newtup);
1837 
1838  /* If the update succeeded, we're done. */
1839  if (didupdate)
1840  break;
1841 
1842  /*
1843  * If the update didn't work, it might be because somebody updated the
1844  * placeholder tuple concurrently. Extract the new version, union it
1845  * with the values we have from the scan, and start over. (There are
1846  * other reasons for the update to fail, but it's simple to treat them
1847  * the same.)
1848  */
1849  phtup = brinGetTupleForHeapBlock(state->bs_rmAccess, heapBlk, &phbuf,
1850  &offset, &phsz, BUFFER_LOCK_SHARE);
1851  /* the placeholder tuple must exist */
1852  if (phtup == NULL)
1853  elog(ERROR, "missing placeholder tuple");
1854  phtup = brin_copy_tuple(phtup, phsz, NULL, NULL);
1856 
1857  /* merge it into the tuple from the heap scan */
1858  union_tuples(state->bs_bdesc, state->bs_dtuple, phtup);
1859  }
1860 
1861  ReleaseBuffer(phbuf);
1862 }
void brin_free_tuple(BrinTuple *tuple)
Definition: brin_tuple.c:433
BrinTuple * brin_form_placeholder_tuple(BrinDesc *brdesc, BlockNumber blkno, Size *size)
Definition: brin_tuple.c:388
static double table_index_build_range_scan(Relation table_rel, Relation index_rel, struct IndexInfo *index_info, bool allow_sync, bool anyvisible, bool progress, BlockNumber start_blockno, BlockNumber numblocks, IndexBuildCallback callback, void *callback_state, TableScanDesc scan)
Definition: tableam.h:1808

References Assert, brin_can_do_samepage_update(), brin_copy_tuple(), brin_doinsert(), brin_doupdate(), brin_form_placeholder_tuple(), brin_form_tuple(), brin_free_tuple(), brinbuildCallback(), brinGetTupleForHeapBlock(), BUFFER_LOCK_SHARE, BUFFER_LOCK_UNLOCK, CHECK_FOR_INTERRUPTS, elog, ERROR, InvalidBuffer, LockBuffer(), Min, RelationGetNumberOfBlocks, ReleaseBuffer(), table_index_build_range_scan(), and union_tuples().

Referenced by brinsummarize().

◆ terminate_brin_buildstate()

static void terminate_brin_buildstate ( BrinBuildState state)
static

Definition at line 1705 of file brin.c.

1706 {
1707  /*
1708  * Release the last index buffer used. We might as well ensure that
1709  * whatever free space remains in that page is available in FSM, too.
1710  */
1711  if (!BufferIsInvalid(state->bs_currentInsertBuf))
1712  {
1713  Page page;
1714  Size freespace;
1715  BlockNumber blk;
1716 
1717  page = BufferGetPage(state->bs_currentInsertBuf);
1718  freespace = PageGetFreeSpace(page);
1719  blk = BufferGetBlockNumber(state->bs_currentInsertBuf);
1720  ReleaseBuffer(state->bs_currentInsertBuf);
1721  RecordPageWithFreeSpace(state->bs_irel, blk, freespace);
1722  FreeSpaceMapVacuumRange(state->bs_irel, blk, blk + 1);
1723  }
1724 
1725  brin_free_desc(state->bs_bdesc);
1726  pfree(state->bs_dtuple);
1727  pfree(state);
1728 }
#define BufferIsInvalid(buffer)
Definition: buf.h:31
Size PageGetFreeSpace(Page page)
Definition: bufpage.c:907
void FreeSpaceMapVacuumRange(Relation rel, BlockNumber start, BlockNumber end)
Definition: freespace.c:377
void RecordPageWithFreeSpace(Relation rel, BlockNumber heapBlk, Size spaceAvail)
Definition: freespace.c:194

References brin_free_desc(), BufferGetBlockNumber(), BufferGetPage(), BufferIsInvalid, FreeSpaceMapVacuumRange(), PageGetFreeSpace(), pfree(), RecordPageWithFreeSpace(), and ReleaseBuffer().

Referenced by brinbuild(), and brinsummarize().

◆ union_tuples()

static void union_tuples ( BrinDesc bdesc,
BrinMemTuple a,
BrinTuple b 
)
static

Definition at line 2020 of file brin.c.

2021 {
2022  int keyno;
2023  BrinMemTuple *db;
2024  MemoryContext cxt;
2025  MemoryContext oldcxt;
2026 
2027  /* Use our own memory context to avoid retail pfree */
2029  "brin union",
2031  oldcxt = MemoryContextSwitchTo(cxt);
2032  db = brin_deform_tuple(bdesc, b, NULL);
2033  MemoryContextSwitchTo(oldcxt);
2034 
2035  /*
2036  * Check if the ranges are empty.
2037  *
2038  * If at least one of them is empty, we don't need to call per-key union
2039  * functions at all. If "b" is empty, we just use "a" as the result (it
2040  * might be empty fine, but that's fine). If "a" is empty but "b" is not,
2041  * we use "b" as the result (but we have to copy the data into "a" first).
2042  *
2043  * Only when both ranges are non-empty, we actually do the per-key merge.
2044  */
2045 
2046  /* If "b" is empty - ignore it and just use "a" (even if it's empty etc.). */
2047  if (db->bt_empty_range)
2048  {
2049  /* skip the per-key merge */
2050  MemoryContextDelete(cxt);
2051  return;
2052  }
2053 
2054  /*
2055  * Now we know "b" is not empty. If "a" is empty, then "b" is the result.
2056  * But we need to copy the data from "b" to "a" first, because that's how
2057  * we pass result out.
2058  *
2059  * We have to copy all the global/per-key flags etc. too.
2060  */
2061  if (a->bt_empty_range)
2062  {
2063  for (keyno = 0; keyno < bdesc->bd_tupdesc->natts; keyno++)
2064  {
2065  int i;
2066  BrinValues *col_a = &a->bt_columns[keyno];
2067  BrinValues *col_b = &db->bt_columns[keyno];
2068  BrinOpcInfo *opcinfo = bdesc->bd_info[keyno];
2069 
2070  col_a->bv_allnulls = col_b->bv_allnulls;
2071  col_a->bv_hasnulls = col_b->bv_hasnulls;
2072 
2073  /* If "b" has no data, we're done. */
2074  if (col_b->bv_allnulls)
2075  continue;
2076 
2077  for (i = 0; i < opcinfo->oi_nstored; i++)
2078  col_a->bv_values[i] =
2079  datumCopy(col_b->bv_values[i],
2080  opcinfo->oi_typcache[i]->typbyval,
2081  opcinfo->oi_typcache[i]->typlen);
2082  }
2083 
2084  /* "a" started empty, but "b" was not empty, so remember that */
2085  a->bt_empty_range = false;
2086 
2087  /* skip the per-key merge */
2088  MemoryContextDelete(cxt);
2089  return;
2090  }
2091 
2092  /* Now we know neither range is empty. */
2093  for (keyno = 0; keyno < bdesc->bd_tupdesc->natts; keyno++)
2094  {
2095  FmgrInfo *unionFn;
2096  BrinValues *col_a = &a->bt_columns[keyno];
2097  BrinValues *col_b = &db->bt_columns[keyno];
2098  BrinOpcInfo *opcinfo = bdesc->bd_info[keyno];
2099 
2100  if (opcinfo->oi_regular_nulls)
2101  {
2102  /* Does the "b" summary represent any NULL values? */
2103  bool b_has_nulls = (col_b->bv_hasnulls || col_b->bv_allnulls);
2104 
2105  /* Adjust "hasnulls". */
2106  if (!col_a->bv_allnulls && b_has_nulls)
2107  col_a->bv_hasnulls = true;
2108 
2109  /* If there are no values in B, there's nothing left to do. */
2110  if (col_b->bv_allnulls)
2111  continue;
2112 
2113  /*
2114  * Adjust "allnulls". If A doesn't have values, just copy the
2115  * values from B into A, and we're done. We cannot run the
2116  * operators in this case, because values in A might contain
2117  * garbage. Note we already established that B contains values.
2118  *
2119  * Also adjust "hasnulls" in order not to forget the summary
2120  * represents NULL values. This is not redundant with the earlier
2121  * update, because that only happens when allnulls=false.
2122  */
2123  if (col_a->bv_allnulls)
2124  {
2125  int i;
2126 
2127  col_a->bv_allnulls = false;
2128  col_a->bv_hasnulls = true;
2129 
2130  for (i = 0; i < opcinfo->oi_nstored; i++)
2131  col_a->bv_values[i] =
2132  datumCopy(col_b->bv_values[i],
2133  opcinfo->oi_typcache[i]->typbyval,
2134  opcinfo->oi_typcache[i]->typlen);
2135 
2136  continue;
2137  }
2138  }
2139 
2140  unionFn = index_getprocinfo(bdesc->bd_index, keyno + 1,
2142  FunctionCall3Coll(unionFn,
2143  bdesc->bd_index->rd_indcollation[keyno],
2144  PointerGetDatum(bdesc),
2145  PointerGetDatum(col_a),
2146  PointerGetDatum(col_b));
2147  }
2148 
2149  MemoryContextDelete(cxt);
2150 }
#define BRIN_PROCNUM_UNION
Definition: brin_internal.h:73
Datum datumCopy(Datum value, bool typByVal, int typLen)
Definition: datum.c:132
int b
Definition: isn.c:70
int a
Definition: isn.c:69
TypeCacheEntry * oi_typcache[FLEXIBLE_ARRAY_MEMBER]
Definition: brin_internal.h:37
Datum * bv_values
Definition: brin_tuple.h:34
bool typbyval
Definition: typcache.h:40
int16 typlen
Definition: typcache.h:39

References a, ALLOCSET_DEFAULT_SIZES, AllocSetContextCreate, b, BrinDesc::bd_index, BrinDesc::bd_info, BrinDesc::bd_tupdesc, brin_deform_tuple(), BRIN_PROCNUM_UNION, BrinMemTuple::bt_columns, BrinMemTuple::bt_empty_range, BrinValues::bv_allnulls, BrinValues::bv_hasnulls, BrinValues::bv_values, CurrentMemoryContext, datumCopy(), FunctionCall3Coll(), i, index_getprocinfo(), MemoryContextDelete(), MemoryContextSwitchTo(), TupleDescData::natts, BrinOpcInfo::oi_nstored, BrinOpcInfo::oi_regular_nulls, BrinOpcInfo::oi_typcache, PointerGetDatum(), RelationData::rd_indcollation, TypeCacheEntry::typbyval, and TypeCacheEntry::typlen.

Referenced by _brin_parallel_merge(), and summarize_range().