nodeAgg_8h_source.html

/*-------------------------------------------------------------------------

 *

 * nodeAgg.h

 *    prototypes for nodeAgg.c

 *

 *

 * Portions Copyright (c) 1996-2025, PostgreSQL Global Development Group

 * Portions Copyright (c) 1994, Regents of the University of California

 *

 * src/include/executor/nodeAgg.h

 *

 *-------------------------------------------------------------------------

 */

#ifndef NODEAGG_H

#define NODEAGG_H


#include "access/parallel.h"

#include "nodes/execnodes.h"


/*
 * AggStatePerTransData - per aggregate state value information
 *
 * Working state for updating the aggregate's state value, by calling the
 * transition function with an input row.  This struct does not store the
 * information needed to produce the final aggregate result from the
 * transition state; that is stored in AggStatePerAggData instead.  This
 * separation allows multiple aggregate results to be produced from a single
 * state value.
 */
typedef struct AggStatePerTransData
{
    /*
     * These values are set up during ExecInitAgg() and do not change
     * thereafter:
     */

    /*
     * Link to an Aggref expr this state value is for.
     *
     * There can be multiple Aggrefs sharing the same state value, so long as
     * the inputs and transition functions are identical and the final
     * functions are not read-write.  This points to the first one of them.
     */
    Aggref     *aggref;

    /*
     * Is this state value actually being shared by more than one Aggref?
     */
    bool        aggshared;

    /*
     * True for ORDER BY and DISTINCT Aggrefs that are not aggpresorted.
     */
    bool        aggsortrequired;

    /*
     * Number of aggregated input columns.  This includes ORDER BY expressions
     * in both the plain-agg and ordered-set cases.  Ordered-set direct args
     * are not counted, though.
     */
    int         numInputs;

    /*
     * Number of aggregated input columns to pass to the transfn.  This
     * includes the ORDER BY columns for ordered-set aggs, but not for plain
     * aggs.  (This doesn't count the transition state value!)
     */
    int         numTransInputs;

    /* Oid of the state transition or combine function */
    Oid         transfn_oid;

    /* Oid of the serialization function or InvalidOid */
    Oid         serialfn_oid;

    /* Oid of the deserialization function or InvalidOid */
    Oid         deserialfn_oid;

    /* Oid of state value's datatype */
    Oid         aggtranstype;

    /*
     * fmgr lookup data for transition function or combine function.  Note in
     * particular that the fn_strict flag is kept here.
     */
    FmgrInfo    transfn;

    /* fmgr lookup data for serialization function */
    FmgrInfo    serialfn;

    /* fmgr lookup data for deserialization function */
    FmgrInfo    deserialfn;

    /* Input collation derived for aggregate */
    Oid         aggCollation;

    /* number of sorting columns */
    int         numSortCols;

    /*
     * Number of sorting columns to consider in DISTINCT comparisons.  This
     * is either zero or the same as numSortCols.
     */
    int         numDistinctCols;

    /* deconstructed sorting information (arrays of length numSortCols) */
    AttrNumber *sortColIdx;
    Oid        *sortOperators;
    Oid        *sortCollations;
    bool       *sortNullsFirst;

    /*
     * Comparators for input columns --- only set/used when aggregate has
     * DISTINCT flag.  The equalfnOne version is used for single-column
     * comparisons, equalfnMulti for the case of multiple columns.
     */
    FmgrInfo    equalfnOne;
    ExprState  *equalfnMulti;

    /*
     * initial value from pg_aggregate entry
     */
    Datum       initValue;
    bool        initValueIsNull;

    /*
     * We need the len and byval info for the agg's input and transition data
     * types in order to know how to copy/delete values.
     *
     * Note that the info for the input type is used only when handling
     * DISTINCT aggs with just one argument, so there is only one input type.
     */
    int16       inputtypeLen,
                transtypeLen;
    bool        inputtypeByVal,
                transtypeByVal;

    /*
     * Slots for holding the evaluated input arguments.  These are set up
     * during ExecInitAgg() and then used for each input row requiring either
     * FILTER or ORDER BY/DISTINCT processing.
     *
     * The last* / haslast members that follow carry the previously seen
     * value for the single-column DISTINCT case.
     */
    TupleTableSlot *sortslot;   /* current input tuple */
    TupleTableSlot *uniqslot;   /* used for multi-column DISTINCT */
    TupleDesc   sortdesc;       /* descriptor of input tuples */
    Datum       lastdatum;      /* used for single-column DISTINCT */
    bool        lastisnull;     /* used for single-column DISTINCT */
    bool        haslast;        /* got a last value for DISTINCT check */

    /*
     * These values are working state that is initialized at the start of an
     * input tuple group and updated for each input tuple.
     *
     * For a simple (non DISTINCT/ORDER BY) aggregate, we just feed the input
     * values straight to the transition function.  If it's DISTINCT or
     * requires ORDER BY, we pass the input values into a Tuplesort object;
     * then at completion of the input tuple group, we scan the sorted values,
     * eliminate duplicates if needed, and run the transition function on the
     * rest.
     *
     * We need a separate tuplesort for each grouping set, hence the array of
     * pointers.
     */

    Tuplesortstate **sortstates;    /* sort objects, if DISTINCT or ORDER BY */

    /*
     * This field is a pre-initialized FunctionCallInfo struct used for
     * calling this aggregate's transfn.  We save a few cycles per row by not
     * re-initializing the unchanging fields; which isn't much, but it seems
     * worth the extra space consumption.
     */
    FunctionCallInfo transfn_fcinfo;

    /* Likewise for serialization and deserialization functions */
    FunctionCallInfo serialfn_fcinfo;

    FunctionCallInfo deserialfn_fcinfo;
}           AggStatePerTransData;


/*
 * AggStatePerAggData - per-aggregate information
 *
 * This contains the information needed to call the final function, to produce
 * a final aggregate result from the state value.  If there are multiple
 * identical Aggrefs in the query, they can all share the same per-agg data.
 *
 * These values are set up during ExecInitAgg() and do not change thereafter.
 */
typedef struct AggStatePerAggData
{
    /*
     * Link to an Aggref expr this per-agg entry is for.
     *
     * There can be multiple identical Aggrefs sharing the same per-agg entry.
     * This points to the first one of them.
     */
    Aggref     *aggref;

    /* index to the state value which this agg should use */
    int         transno;

    /* Optional Oid of final function (may be InvalidOid) */
    Oid         finalfn_oid;

    /*
     * fmgr lookup data for final function --- only valid when finalfn_oid is
     * not InvalidOid.
     */
    FmgrInfo    finalfn;

    /*
     * Number of arguments to pass to the finalfn.  This is always at least 1
     * (the transition state value) plus any ordered-set direct args.  If the
     * finalfn wants extra args then we pass nulls corresponding to the
     * aggregated input columns.
     */
    int         numFinalArgs;

    /* ExprStates for any direct-argument expressions */
    List       *aggdirectargs;

    /*
     * We need the len and byval info for the agg's result data type in order
     * to know how to copy/delete values.
     */
    int16       resulttypeLen;
    bool        resulttypeByVal;

    /*
     * "shareable" is false if this agg cannot share state values with other
     * aggregates because the final function is read-write.
     */
    bool        shareable;
}           AggStatePerAggData;


/*
 * AggStatePerGroupData - per-aggregate-per-group working state
 *
 * These values are working state that is initialized at the start of
 * an input tuple group and updated for each input tuple.
 *
 * In AGG_PLAIN and AGG_SORTED modes, we have a single array of these
 * structs (pointed to by aggstate->pergroup); we re-use the array for
 * each input group, if it's AGG_SORTED mode.  In AGG_HASHED mode, the
 * hash table contains an array of these structs for each tuple group.
 *
 * Logically, the sortstate field belongs in this struct, but we do not
 * keep it here for space reasons: we don't support DISTINCT aggregates
 * in AGG_HASHED mode, so there's no reason to use up a pointer field
 * in every entry of the hashtable.
 */
typedef struct AggStatePerGroupData
{
    /*
     * Each FIELDNO_* macro holds the zero-based position, within this
     * struct, of the member declared right after it.
     *
     * NOTE(review): presumably these are consumed by code that addresses the
     * members by index rather than by name; the macros and the member order
     * have to be changed together -- confirm against the users of FIELDNO_*.
     */
#define FIELDNO_AGGSTATEPERGROUPDATA_TRANSVALUE 0
    Datum       transValue;     /* current transition value */
#define FIELDNO_AGGSTATEPERGROUPDATA_TRANSVALUEISNULL 1
    bool        transValueIsNull;   /* is transValue currently NULL? */

#define FIELDNO_AGGSTATEPERGROUPDATA_NOTRANSVALUE 2
    bool        noTransValue;   /* true if transValue not set yet */

    /*
     * Note: noTransValue initially has the same value as transValueIsNull,
     * and if true both are cleared to false at the same time.  They are not
     * the same though: if transfn later returns a NULL, we want to keep that
     * NULL and not auto-replace it with a later input value.  Only the first
     * non-NULL input will be auto-substituted.
     */
} AggStatePerGroupData;


/*
 * AggStatePerPhaseData - per-grouping-set-phase state
 *
 * Grouping sets are divided into "phases", where a single phase can be
 * processed in one pass over the input.  If there is more than one phase,
 * then at the end of input from the current phase, state is reset and another
 * pass is taken over the data, which has been re-sorted in the meantime.
 *
 * Accordingly, each phase specifies a list of grouping sets and group clause
 * information, plus each phase after the first also has a sort order.
 */
typedef struct AggStatePerPhaseData
{
    AggStrategy aggstrategy;    /* strategy for this phase */
    int         numsets;        /* number of grouping sets (or 0) */
    int        *gset_lengths;   /* lengths of grouping sets */
    Bitmapset **grouped_cols;   /* column groupings for rollup */
    ExprState **eqfunctions;    /* expression returning equality, indexed by
                                 * nr of cols to compare */
    Agg        *aggnode;        /* Agg node for phase data */
    Sort       *sortnode;       /* Sort node for input ordering for phase */

    ExprState  *evaltrans;      /* evaluation of transition functions */

    /*----------
     * Cached variants of the compiled expression.
     * first subscript: 0: outerops; 1: TTSOpsMinimalTuple
     * second subscript: 0: no NULL check; 1: with NULL check
     *----------
     */
    ExprState  *evaltrans_cache[2][2];
}           AggStatePerPhaseData;


/*
 * AggStatePerHashData - per-hashtable state
 *
 * When doing grouping sets with hashing, we have one of these for each
 * grouping set.  (When doing hashing without grouping sets, we have just one
 * of them.)
 */
typedef struct AggStatePerHashData
{
    TupleHashTable hashtable;   /* hash table with one entry per group */
    TupleHashIterator hashiter; /* for iterating through hash table */
    TupleTableSlot *hashslot;   /* slot for loading hash table */
    FmgrInfo   *hashfunctions;  /* per-grouping-field hash fns */
    Oid        *eqfuncoids;     /* per-grouping-field equality fns */
    int         numCols;        /* number of hash key columns */
    int         numhashGrpCols; /* number of columns in hash table */
    int         largestGrpColIdx;   /* largest col required for hashing */
    AttrNumber *hashGrpColIdxInput; /* hash col indices in input slot */
    AttrNumber *hashGrpColIdxHash;  /* indices in hash table tuples */
    Agg        *aggnode;        /* original Agg node, for numGroups etc. */
}           AggStatePerHashData;


/*
 * Agg node lifecycle routines, implemented in nodeAgg.c: ExecInitAgg() takes
 * the Agg plan node and returns the AggState that the other two operate on.
 */
extern AggState *ExecInitAgg(Agg *node, EState *estate, int eflags);
extern void ExecEndAgg(AggState *node);
extern void ExecReScanAgg(AggState *node);

/*
 * Hash aggregation sizing routines.
 *
 * NOTE(review): mem_limit, ngroups_limit and num_partitions are passed by
 * pointer and look like output parameters -- confirm against nodeAgg.c.
 */
extern Size hash_agg_entry_size(int numTrans, Size tupleWidth,
                                Size transitionSpace);
extern void hash_agg_set_limits(double hashentrysize, double input_groups,
                                int used_bits, Size *mem_limit,
                                uint64 *ngroups_limit, int *num_partitions);

/* parallel instrumentation support */
extern void ExecAggEstimate(AggState *node, ParallelContext *pcxt);
extern void ExecAggInitializeDSM(AggState *node, ParallelContext *pcxt);
extern void ExecAggInitializeWorker(AggState *node, ParallelWorkerContext *pwcxt);
extern void ExecAggRetrieveInstrumentation(AggState *node);


#endif                          /* NODEAGG_H */

AttrNumber
int16 AttrNumber
Definition: attnum.h:21

int16
int16_t int16
Definition: c.h:497

uint64
uint64_t uint64
Definition: c.h:503

Size
size_t Size
Definition: c.h:576

execnodes.h

TupleHashIterator
tuplehash_iterator TupleHashIterator
Definition: execnodes.h:877

parallel.h

ExecAggEstimate
void ExecAggEstimate(AggState *node, ParallelContext *pcxt)
Definition: nodeAgg.c:4786

AggStatePerAggData
struct AggStatePerAggData AggStatePerAggData

ExecAggInitializeWorker
void ExecAggInitializeWorker(AggState *node, ParallelWorkerContext *pwcxt)
Definition: nodeAgg.c:4832

AggStatePerTransData
struct AggStatePerTransData AggStatePerTransData

ExecAggRetrieveInstrumentation
void ExecAggRetrieveInstrumentation(AggState *node)
Definition: nodeAgg.c:4845

AggStatePerGroupData
struct AggStatePerGroupData AggStatePerGroupData

ExecReScanAgg
void ExecReScanAgg(AggState *node)
Definition: nodeAgg.c:4466

hash_agg_entry_size
Size hash_agg_entry_size(int numTrans, Size tupleWidth, Size transitionSpace)
Definition: nodeAgg.c:1701

ExecAggInitializeDSM
void ExecAggInitializeDSM(AggState *node, ParallelContext *pcxt)
Definition: nodeAgg.c:4807

AggStatePerPhaseData
struct AggStatePerPhaseData AggStatePerPhaseData

AggStatePerHashData
struct AggStatePerHashData AggStatePerHashData

ExecEndAgg
void ExecEndAgg(AggState *node)
Definition: nodeAgg.c:4400

ExecInitAgg
AggState * ExecInitAgg(Agg *node, EState *estate, int eflags)
Definition: nodeAgg.c:3279

hash_agg_set_limits
void hash_agg_set_limits(double hashentrysize, double input_groups, int used_bits, Size *mem_limit, uint64 *ngroups_limit, int *num_partitions)
Definition: nodeAgg.c:1809

AggStrategy
AggStrategy
Definition: nodes.h:359

Datum
uintptr_t Datum
Definition: postgres.h:69

Oid
unsigned int Oid
Definition: postgres_ext.h:30

AggStatePerAggData
Definition: nodeAgg.h:188

AggStatePerAggData::finalfn
FmgrInfo finalfn
Definition: nodeAgg.h:207

AggStatePerAggData::shareable
bool shareable
Definition: nodeAgg.h:231

AggStatePerAggData::resulttypeByVal
bool resulttypeByVal
Definition: nodeAgg.h:225

AggStatePerAggData::aggdirectargs
List * aggdirectargs
Definition: nodeAgg.h:218

AggStatePerAggData::aggref
Aggref * aggref
Definition: nodeAgg.h:195

AggStatePerAggData::transno
int transno
Definition: nodeAgg.h:198

AggStatePerAggData::numFinalArgs
int numFinalArgs
Definition: nodeAgg.h:215

AggStatePerAggData::finalfn_oid
Oid finalfn_oid
Definition: nodeAgg.h:201

AggStatePerAggData::resulttypeLen
int16 resulttypeLen
Definition: nodeAgg.h:224

AggStatePerGroupData
Definition: nodeAgg.h:251

AggStatePerGroupData::transValue
Datum transValue
Definition: nodeAgg.h:253

AggStatePerGroupData::noTransValue
bool noTransValue
Definition: nodeAgg.h:258

AggStatePerGroupData::transValueIsNull
bool transValueIsNull
Definition: nodeAgg.h:255

AggStatePerHashData
Definition: nodeAgg.h:310

AggStatePerHashData::numhashGrpCols
int numhashGrpCols
Definition: nodeAgg.h:317

AggStatePerHashData::hashfunctions
FmgrInfo * hashfunctions
Definition: nodeAgg.h:314

AggStatePerHashData::hashtable
TupleHashTable hashtable
Definition: nodeAgg.h:311

AggStatePerHashData::aggnode
Agg * aggnode
Definition: nodeAgg.h:321

AggStatePerHashData::hashslot
TupleTableSlot * hashslot
Definition: nodeAgg.h:313

AggStatePerHashData::largestGrpColIdx
int largestGrpColIdx
Definition: nodeAgg.h:318

AggStatePerHashData::hashiter
TupleHashIterator hashiter
Definition: nodeAgg.h:312

AggStatePerHashData::hashGrpColIdxHash
AttrNumber * hashGrpColIdxHash
Definition: nodeAgg.h:320

AggStatePerHashData::numCols
int numCols
Definition: nodeAgg.h:316

AggStatePerHashData::hashGrpColIdxInput
AttrNumber * hashGrpColIdxInput
Definition: nodeAgg.h:319

AggStatePerHashData::eqfuncoids
Oid * eqfuncoids
Definition: nodeAgg.h:315

AggStatePerPhaseData
Definition: nodeAgg.h:281

AggStatePerPhaseData::aggnode
Agg * aggnode
Definition: nodeAgg.h:288

AggStatePerPhaseData::gset_lengths
int * gset_lengths
Definition: nodeAgg.h:284

AggStatePerPhaseData::grouped_cols
Bitmapset ** grouped_cols
Definition: nodeAgg.h:285

AggStatePerPhaseData::evaltrans
ExprState * evaltrans
Definition: nodeAgg.h:291

AggStatePerPhaseData::sortnode
Sort * sortnode
Definition: nodeAgg.h:289

AggStatePerPhaseData::numsets
int numsets
Definition: nodeAgg.h:283

AggStatePerPhaseData::evaltrans_cache
ExprState * evaltrans_cache[2][2]
Definition: nodeAgg.h:299

AggStatePerPhaseData::eqfunctions
ExprState ** eqfunctions
Definition: nodeAgg.h:286

AggStatePerPhaseData::aggstrategy
AggStrategy aggstrategy
Definition: nodeAgg.h:282

AggStatePerTransData
Definition: nodeAgg.h:31

AggStatePerTransData::sortNullsFirst
bool * sortNullsFirst
Definition: nodeAgg.h:108

AggStatePerTransData::serialfn
FmgrInfo serialfn
Definition: nodeAgg.h:89

AggStatePerTransData::numSortCols
int numSortCols
Definition: nodeAgg.h:98

AggStatePerTransData::equalfnOne
FmgrInfo equalfnOne
Definition: nodeAgg.h:115

AggStatePerTransData::sortCollations
Oid * sortCollations
Definition: nodeAgg.h:107

AggStatePerTransData::sortdesc
TupleDesc sortdesc
Definition: nodeAgg.h:143

AggStatePerTransData::deserialfn_oid
Oid deserialfn_oid
Definition: nodeAgg.h:77

AggStatePerTransData::aggCollation
Oid aggCollation
Definition: nodeAgg.h:95

AggStatePerTransData::inputtypeLen
int16 inputtypeLen
Definition: nodeAgg.h:131

AggStatePerTransData::sortslot
TupleTableSlot * sortslot
Definition: nodeAgg.h:141

AggStatePerTransData::transfn
FmgrInfo transfn
Definition: nodeAgg.h:86

AggStatePerTransData::transtypeByVal
bool transtypeByVal
Definition: nodeAgg.h:134

AggStatePerTransData::inputtypeByVal
bool inputtypeByVal
Definition: nodeAgg.h:133

AggStatePerTransData::aggref
Aggref * aggref
Definition: nodeAgg.h:44

AggStatePerTransData::numInputs
int numInputs
Definition: nodeAgg.h:61

AggStatePerTransData::equalfnMulti
ExprState * equalfnMulti
Definition: nodeAgg.h:116

AggStatePerTransData::sortstates
Tuplesortstate ** sortstates
Definition: nodeAgg.h:162

AggStatePerTransData::uniqslot
TupleTableSlot * uniqslot
Definition: nodeAgg.h:142

AggStatePerTransData::numDistinctCols
int numDistinctCols
Definition: nodeAgg.h:102

AggStatePerTransData::lastdatum
Datum lastdatum
Definition: nodeAgg.h:144

AggStatePerTransData::initValue
Datum initValue
Definition: nodeAgg.h:121

AggStatePerTransData::initValueIsNull
bool initValueIsNull
Definition: nodeAgg.h:122

AggStatePerTransData::deserialfn
FmgrInfo deserialfn
Definition: nodeAgg.h:92

AggStatePerTransData::sortOperators
Oid * sortOperators
Definition: nodeAgg.h:106

AggStatePerTransData::serialfn_oid
Oid serialfn_oid
Definition: nodeAgg.h:74

AggStatePerTransData::deserialfn_fcinfo
FunctionCallInfo deserialfn_fcinfo
Definition: nodeAgg.h:175

AggStatePerTransData::lastisnull
bool lastisnull
Definition: nodeAgg.h:145

AggStatePerTransData::transtypeLen
int16 transtypeLen
Definition: nodeAgg.h:132

AggStatePerTransData::aggtranstype
Oid aggtranstype
Definition: nodeAgg.h:80

AggStatePerTransData::sortColIdx
AttrNumber * sortColIdx
Definition: nodeAgg.h:105

AggStatePerTransData::numTransInputs
int numTransInputs
Definition: nodeAgg.h:68

AggStatePerTransData::serialfn_fcinfo
FunctionCallInfo serialfn_fcinfo
Definition: nodeAgg.h:173

AggStatePerTransData::aggshared
bool aggshared
Definition: nodeAgg.h:49

AggStatePerTransData::transfn_oid
Oid transfn_oid
Definition: nodeAgg.h:71

AggStatePerTransData::aggsortrequired
bool aggsortrequired
Definition: nodeAgg.h:54

AggStatePerTransData::haslast
bool haslast
Definition: nodeAgg.h:146

AggStatePerTransData::transfn_fcinfo
FunctionCallInfo transfn_fcinfo
Definition: nodeAgg.h:170

AggState
Definition: execnodes.h:2523

Agg
Definition: plannodes.h:1132

Aggref
Definition: primnodes.h:457

Bitmapset
Definition: bitmapset.h:50

EState
Definition: execnodes.h:651

ExprState
Definition: execnodes.h:87

FmgrInfo
Definition: fmgr.h:57

FunctionCallInfoBaseData
Definition: fmgr.h:86

List
Definition: pg_list.h:54

ParallelContext
Definition: parallel.h:32

ParallelWorkerContext
Definition: parallel.h:51

Sort
Definition: plannodes.h:1066

TupleDescData
Definition: tupdesc.h:136

TupleHashTableData
Definition: execnodes.h:859

TupleTableSlot
Definition: tuptable.h:115

Tuplesortstate
Definition: tuplesort.c:186