bernoulli_8c_source.html

 /*-------------------------------------------------------------------------

  *

  * bernoulli.c

  *    support routines for BERNOULLI tablesample method

  *

  * To ensure repeatability of samples, it is necessary that selection of a

  * given tuple be history-independent; otherwise syncscanning would break

  * repeatability, to say nothing of logically-irrelevant maintenance such

  * as physical extension or shortening of the relation.

  *

  * To achieve that, we proceed by hashing each candidate TID together with

  * the active seed, and then selecting it if the hash is less than the

  * cutoff value computed from the selection probability by BeginSampleScan.

  *

  *

  * Portions Copyright (c) 1996-2024, PostgreSQL Global Development Group

  * Portions Copyright (c) 1994, Regents of the University of California

  *

  * IDENTIFICATION

  *    src/backend/access/tablesample/bernoulli.c

  *

  *-------------------------------------------------------------------------

  */


 #include "postgres.h"


 #include <math.h>


 #include "access/tsmapi.h"

 #include "catalog/pg_type.h"

 #include "common/hashfn.h"

 #include "optimizer/optimizer.h"

 #include "utils/fmgrprotos.h"


 /*
  * Private state for one BERNOULLI sample scan.
  *
  * Allocated (zero-filled) by bernoulli_initsamplescan, filled in by
  * bernoulli_beginsamplescan, and reached through SampleScanState.tsm_state.
  */

 typedef struct

 {

     uint64      cutoff;         /* select tuples with hash less than this;
                                  * 64 bits wide because the value can be as
                                  * large as PG_UINT32_MAX + 1 (at 100%) */

     uint32      seed;           /* random seed, mixed into every TID hash */

     OffsetNumber lt;            /* last tuple returned from current block,
                                  * or InvalidOffsetNumber if none has been
                                  * returned yet or the block was exhausted */

 } BernoulliSamplerData;


 /*
  * Forward declarations of the callbacks that tsm_bernoulli_handler stores
  * in the TsmRoutine node it returns.
  */

 static void bernoulli_samplescangetsamplesize(PlannerInfo *root,

                                               RelOptInfo *baserel,

                                               List *paramexprs,

                                               BlockNumber *pages,

                                               double *tuples);

 static void bernoulli_initsamplescan(SampleScanState *node,

                                      int eflags);

 static void bernoulli_beginsamplescan(SampleScanState *node,

                                       Datum *params,

                                       int nparams,

                                       uint32 seed);

 static OffsetNumber bernoulli_nextsampletuple(SampleScanState *node,

                                               BlockNumber blockno,

                                               OffsetNumber maxoffset);


 /*

  * Create a TsmRoutine descriptor for the BERNOULLI method.

  */

 Datum

 tsm_bernoulli_handler(PG_FUNCTION_ARGS)

 {

     TsmRoutine *tsm = makeNode(TsmRoutine);


     tsm->parameterTypes = list_make1_oid(FLOAT4OID);

     tsm->repeatable_across_queries = true;

     tsm->repeatable_across_scans = true;

     tsm->SampleScanGetSampleSize = bernoulli_samplescangetsamplesize;

     tsm->InitSampleScan = bernoulli_initsamplescan;

     tsm->BeginSampleScan = bernoulli_beginsamplescan;

     tsm->NextSampleBlock = NULL;

     tsm->NextSampleTuple = bernoulli_nextsampletuple;

     tsm->EndSampleScan = NULL;


     PG_RETURN_POINTER(tsm);

 }


 /*
  * bernoulli_samplescangetsamplesize
  *      Planner-time estimate of how much of the relation a scan will touch.
  *
  * root, baserel: planner context and the relation being sampled.
  * paramexprs: argument expressions; the first one is the sample percentage.
  * pages, tuples: output estimates.
  *
  * If the percentage reduces to a non-null constant in the range 0..100, it
  * is used (as a fraction); in every other case a fraction of 0.1 is assumed.
  * The page estimate is always the full size of the relation.
  */
 static void
 bernoulli_samplescangetsamplesize(PlannerInfo *root,
                                   RelOptInfo *baserel,
                                   List *paramexprs,
                                   BlockNumber *pages,
                                   double *tuples)
 {
     /* Start from the fallback; overwrite only with a trustworthy value */
     float4      fraction = 0.1f;
     Node       *arg;

     /* See whether the percentage argument can be estimated */
     arg = estimate_expression_value(root, (Node *) linitial(paramexprs));

     if (IsA(arg, Const))
     {
         Const      *con = (Const *) arg;

         if (!con->constisnull)
         {
             float4      pct = DatumGetFloat4(con->constvalue);

             /* NaN and out-of-range values keep the fallback */
             if (!isnan(pct) && pct >= 0 && pct <= 100)
                 fraction = pct / 100.0f;
         }
     }

     /* Every page of the relation gets visited */
     *pages = baserel->pages;

     *tuples = clamp_row_est(baserel->tuples * fraction);
 }


 /*
  * bernoulli_initsamplescan
  *      Executor-startup hook: allocate the zero-filled private sampler
  *      state and attach it to the scan node.
  *
  * eflags is not consulted here.
  */
 static void
 bernoulli_initsamplescan(SampleScanState *node, int eflags)
 {
     void       *state = palloc0(sizeof(BernoulliSamplerData));

     node->tsm_state = state;
 }


 /*
  * bernoulli_beginsamplescan
  *      Validate the sample percentage and set up the sampler for a scan.
  *
  * node: scan state whose tsm_state holds our BernoulliSamplerData.
  * params: argument values; params[0] is the float4 percentage.
  * nparams: number of arguments (not consulted here).
  * seed: random seed to mix into each TID hash.
  *
  * Raises ERRCODE_INVALID_TABLESAMPLE_ARGUMENT if the percentage is NaN or
  * lies outside 0..100.
  */
 static void
 bernoulli_beginsamplescan(SampleScanState *node,
                           Datum *params,
                           int nparams,
                           uint32 seed)
 {
     BernoulliSamplerData *state = (BernoulliSamplerData *) node->tsm_state;
     double      pct = DatumGetFloat4(params[0]);
     double      hashrange = (double) PG_UINT32_MAX + 1;

     if (isnan(pct) || pct < 0 || pct > 100)
         ereport(ERROR,
                 (errcode(ERRCODE_INVALID_TABLESAMPLE_ARGUMENT),
                  errmsg("sample percentage must be between 0 and 100")));

     state->seed = seed;
     state->lt = InvalidOffsetNumber;

     /*
      * Scale the selection probability onto the range of a 32-bit hash: the
      * cutoff is probability times (PG_UINT32_MAX + 1).  It therefore needs
      * a uint64 to hold it, and comes out exactly right at both extremes
      * (probability zero and probability one).
      */
     state->cutoff = (uint64) rint(hashrange * pct / 100);

     /*
      * All pages get scanned, so ask for bulkread.  Pagemode visibility
      * checking only pays off at larger sampling fractions; the 25%
      * threshold rests on very limited experimentation.
      */
     node->use_bulkread = true;
     node->use_pagemode = (pct >= 25);
 }


 /*
  * bernoulli_nextsampletuple
  *      Return the next selected tuple offset in block "blockno", or
  *      InvalidOffsetNumber once all offsets up to "maxoffset" have been
  *      considered (which tells SampleScan to go to the next block).
  *
  * Every offset in the block gets its own coinflip, regardless of whether a
  * visible tuple (or any tuple at all) lives there.  That is fine: all
  * tuples have the same probability of being returned, so extra coinflips
  * for invisible tuples don't matter.
  */
 static OffsetNumber
 bernoulli_nextsampletuple(SampleScanState *node,
                           BlockNumber blockno,
                           OffsetNumber maxoffset)
 {
     BernoulliSamplerData *state = (BernoulliSamplerData *) node->tsm_state;
     OffsetNumber result = InvalidOffsetNumber;
     OffsetNumber off;
     uint32      key[3];

     /* Resume just past the previous hit, or start at the top of the block */
     if (state->lt == InvalidOffsetNumber)
         off = FirstOffsetNumber;
     else
         off = (OffsetNumber) (state->lt + 1);

     /*
      * The hash key is three uint32's: block number, offset, and seed, fed
      * to hash_any.  That is cheap to set up, and with the current hash_any
      * implementation the results are machine-independent, which is handy
      * for regression testing.
      *
      * Block number and seed do not change within a block, so fill them in
      * just once.
      */
     key[0] = blockno;
     key[2] = state->seed;

     /* Walk the remaining offsets until one is selected or we run out */
     while (off <= maxoffset)
     {
         uint32      h;

         key[1] = off;
         h = DatumGetUInt32(hash_any((const unsigned char *) key,
                                     (int) sizeof(key)));

         if (h < state->cutoff)
         {
             result = off;
             break;
         }

         off++;
     }

     /* Remember where we stopped; Invalid restarts at the next block */
     state->lt = result;

     return result;
 }

bernoulli_samplescangetsamplesize
static void bernoulli_samplescangetsamplesize(PlannerInfo *root, RelOptInfo *baserel, List *paramexprs, BlockNumber *pages, double *tuples)
Definition: bernoulli.c:86

bernoulli_initsamplescan
static void bernoulli_initsamplescan(SampleScanState *node, int eflags)
Definition: bernoulli.c:127

tsm_bernoulli_handler
Datum tsm_bernoulli_handler(PG_FUNCTION_ARGS)
Definition: bernoulli.c:65

bernoulli_beginsamplescan
static void bernoulli_beginsamplescan(SampleScanState *node, Datum *params, int nparams, uint32 seed)
Definition: bernoulli.c:136

bernoulli_nextsampletuple
static OffsetNumber bernoulli_nextsampletuple(SampleScanState *node, BlockNumber blockno, OffsetNumber maxoffset)
Definition: bernoulli.c:181

BlockNumber
uint32 BlockNumber
Definition: block.h:31

uint32
unsigned int uint32
Definition: c.h:506

PG_UINT32_MAX
#define PG_UINT32_MAX
Definition: c.h:581

float4
float float4
Definition: c.h:620

estimate_expression_value
Node * estimate_expression_value(PlannerInfo *root, Node *node)
Definition: clauses.c:2395

clamp_row_est
double clamp_row_est(double nrows)
Definition: costsize.c:213

errcode
int errcode(int sqlerrcode)
Definition: elog.c:853

errmsg
int errmsg(const char *fmt,...)
Definition: elog.c:1070

ERROR
#define ERROR
Definition: elog.h:39

ereport
#define ereport(elevel,...)
Definition: elog.h:149

PG_RETURN_POINTER
#define PG_RETURN_POINTER(x)
Definition: fmgr.h:361

PG_FUNCTION_ARGS
#define PG_FUNCTION_ARGS
Definition: fmgr.h:193

hashfn.h

hash_any
static Datum hash_any(const unsigned char *k, int keylen)
Definition: hashfn.h:31

if
if(TABLE==NULL||TABLE_index==NULL)
Definition: isn.c:77

palloc0
void * palloc0(Size size)
Definition: mcxt.c:1347

IsA
#define IsA(nodeptr, _type_)
Definition: nodes.h:158

makeNode
#define makeNode(_type_)
Definition: nodes.h:155

InvalidOffsetNumber
#define InvalidOffsetNumber
Definition: off.h:26

OffsetNumber
uint16 OffsetNumber
Definition: off.h:24

FirstOffsetNumber
#define FirstOffsetNumber
Definition: off.h:27

optimizer.h

list_make1_oid
#define list_make1_oid(x1)
Definition: pg_list.h:242

linitial
#define linitial(l)
Definition: pg_list.h:178

pg_type.h

postgres.h

DatumGetUInt32
static uint32 DatumGetUInt32(Datum X)
Definition: postgres.h:222

Datum
uintptr_t Datum
Definition: postgres.h:64

DatumGetFloat4
static float4 DatumGetFloat4(Datum X)
Definition: postgres.h:458

root
tree ctl root
Definition: radixtree.h:1886

hash
static unsigned hash(unsigned *uv, int n)
Definition: rege_dfa.c:715

BernoulliSamplerData
Definition: bernoulli.c:38

BernoulliSamplerData::seed
uint32 seed
Definition: bernoulli.c:40

BernoulliSamplerData::lt
OffsetNumber lt
Definition: bernoulli.c:41

BernoulliSamplerData::cutoff
uint64 cutoff
Definition: bernoulli.c:39

Const
Definition: primnodes.h:307

List
Definition: pg_list.h:54

Node
Definition: nodes.h:129

PlannerInfo
Definition: pathnodes.h:196

RelOptInfo
Definition: pathnodes.h:860

RelOptInfo::tuples
Cardinality tuples
Definition: pathnodes.h:949

RelOptInfo::pages
BlockNumber pages
Definition: pathnodes.h:948

SampleScanState
Definition: execnodes.h:1596

SampleScanState::use_bulkread
bool use_bulkread
Definition: execnodes.h:1603

SampleScanState::tsm_state
void * tsm_state
Definition: execnodes.h:1602

SampleScanState::use_pagemode
bool use_pagemode
Definition: execnodes.h:1604

TsmRoutine
Definition: tsmapi.h:57

TsmRoutine::NextSampleTuple
NextSampleTuple_function NextSampleTuple
Definition: tsmapi.h:74

TsmRoutine::repeatable_across_scans
bool repeatable_across_scans
Definition: tsmapi.h:65

TsmRoutine::EndSampleScan
EndSampleScan_function EndSampleScan
Definition: tsmapi.h:75

TsmRoutine::SampleScanGetSampleSize
SampleScanGetSampleSize_function SampleScanGetSampleSize
Definition: tsmapi.h:68

TsmRoutine::BeginSampleScan
BeginSampleScan_function BeginSampleScan
Definition: tsmapi.h:72

TsmRoutine::NextSampleBlock
NextSampleBlock_function NextSampleBlock
Definition: tsmapi.h:73

TsmRoutine::InitSampleScan
InitSampleScan_function InitSampleScan
Definition: tsmapi.h:71

TsmRoutine::parameterTypes
List * parameterTypes
Definition: tsmapi.h:61

TsmRoutine::repeatable_across_queries
bool repeatable_across_queries
Definition: tsmapi.h:64

tsmapi.h