gistsplit_8c_source.html

 /*-------------------------------------------------------------------------

  *

  * gistsplit.c

  *    Multi-column page splitting algorithm

  *

  * This file is concerned with making good page-split decisions in multi-column

  * GiST indexes.  The opclass-specific picksplit functions can only be expected

  * to produce answers based on a single column.  We first run the picksplit

  * function for column 1; then, if there are more columns, we check if any of

  * the tuples are "don't cares" so far as the column 1 split is concerned

  * (that is, they could go to either side for no additional penalty).  If so,

  * we try to redistribute those tuples on the basis of the next column.

  * Repeat till we're out of columns.

  *

  * gistSplitByKey() is the entry point to this file.

  *

  *

  * Portions Copyright (c) 1996-2024, PostgreSQL Global Development Group

  * Portions Copyright (c) 1994, Regents of the University of California

  *

  * IDENTIFICATION

  *    src/backend/access/gist/gistsplit.c

  *

  *-------------------------------------------------------------------------

  */

 #include "postgres.h"


 #include "access/gist_private.h"

 #include "utils/rel.h"


 /*
  * Work descriptor handed to gistunionsubkeyvec(): it names the tuples on one
  * side of a split and says where the union keys computed for that side
  * should be stored.
  */
 typedef struct
 {
     /* tuple numbers on this side; values are 1-based (itvec[entries[i] - 1]) */
     OffsetNumber *entries;
     /* number of elements in entries[] */
     int         len;
     /* output area for union key values (passed to gistMakeUnionItVec) */
     Datum      *attr;
     /* output area for the null flags that go with attr[] */
     bool       *isnull;
     /* if not NULL, indexed by the values in entries[]; true = skip tuple */
     bool       *dontcare;
 } GistSplitUnion;


 /*
  * Build the per-column union keys for one side of a split.
  *
  * gsvp->entries[] lists the (1-based) tuple numbers belonging to the side;
  * any tuple flagged in gsvp->dontcare[] is left out of the union.  A NULL
  * gsvp->dontcare means "no tuple is excluded".  The results are written to
  * gsvp->attr[] / gsvp->isnull[] by gistMakeUnionItVec.
  *
  * Helper for gistunionsubkey.
  */
 static void
 gistunionsubkeyvec(GISTSTATE *giststate, IndexTuple *itvec,
                    GistSplitUnion *gsvp)
 {
     IndexTuple *kept;
     int         nkept = 0;
     int         pos;

     /* worst case: nothing is filtered out */
     kept = (IndexTuple *) palloc(sizeof(IndexTuple) * gsvp->len);

     for (pos = 0; pos < gsvp->len; pos++)
     {
         OffsetNumber off = gsvp->entries[pos];

         /* collect the tuple unless it is marked as a don't-care */
         if (!(gsvp->dontcare && gsvp->dontcare[off]))
         {
             kept[nkept] = itvec[off - 1];
             nkept++;
         }
     }

     gistMakeUnionItVec(giststate, kept, nkept, gsvp->attr, gsvp->isnull);

     pfree(kept);
 }


 /*
  * Rebuild the left-side and right-side union keys of a split, leaving out
  * every tuple flagged in spl->spl_dontcare[] (if that array is set).
  *
  * Union keys are always rebuilt for all index columns.  That can repeat work
  * already done for the leading column(s), but "moving this tuple costs zero
  * penalty" is not a guarantee that the union key stays unchanged, because
  * penalty functions are not perfectly accurate.
  */
 static void
 gistunionsubkey(GISTSTATE *giststate, IndexTuple *itvec, GistSplitVector *spl)
 {
     GistSplitUnion leftSide;
     GistSplitUnion rightSide;

     /* left half first: results land in spl_lattr / spl_lisnull */
     leftSide.dontcare = spl->spl_dontcare;
     leftSide.entries = spl->splitVector.spl_left;
     leftSide.len = spl->splitVector.spl_nleft;
     leftSide.attr = spl->spl_lattr;
     leftSide.isnull = spl->spl_lisnull;
     gistunionsubkeyvec(giststate, itvec, &leftSide);

     /* then the right half: results land in spl_rattr / spl_risnull */
     rightSide.dontcare = spl->spl_dontcare;
     rightSide.entries = spl->splitVector.spl_right;
     rightSide.len = spl->splitVector.spl_nright;
     rightSide.attr = spl->spl_rattr;
     rightSide.isnull = spl->spl_risnull;
     gistunionsubkeyvec(giststate, itvec, &rightSide);
 }


 /*

  * Find tuples that are "don't cares", that is could be moved to the other

  * side of the split with zero penalty, so far as the attno column is

  * concerned.

  *

  * Don't-care tuples are marked by setting the corresponding entry in

  * spl->spl_dontcare[] to "true".  Caller must have initialized that array

  * to zeroes.

  *

  * Returns number of don't-cares found.

  */

 static int

 findDontCares(Relation r, GISTSTATE *giststate, GISTENTRY *valvec,

               GistSplitVector *spl, int attno)

 {

     int         i;

     GISTENTRY   entry;

     int         NumDontCare = 0;


     /*

      * First, search the left-side tuples to see if any have zero penalty to

      * be added to the right-side union key.

      *

      * attno column is known all-not-null (see gistSplitByKey), so we need not

      * check for nulls

      */

     gistentryinit(entry, spl->splitVector.spl_rdatum, r, NULL,

                   (OffsetNumber) 0, false);

     for (i = 0; i < spl->splitVector.spl_nleft; i++)

     {

         int         j = spl->splitVector.spl_left[i];

         float       penalty = gistpenalty(giststate, attno, &entry, false,

                                           &valvec[j], false);


         if (penalty == 0.0)

         {

             spl->spl_dontcare[j] = true;

             NumDontCare++;

         }

     }


     /* And conversely for the right-side tuples */

     gistentryinit(entry, spl->splitVector.spl_ldatum, r, NULL,

                   (OffsetNumber) 0, false);

     for (i = 0; i < spl->splitVector.spl_nright; i++)

     {

         int         j = spl->splitVector.spl_right[i];

         float       penalty = gistpenalty(giststate, attno, &entry, false,

                                           &valvec[j], false);


         if (penalty == 0.0)

         {

             spl->spl_dontcare[j] = true;

             NumDontCare++;

         }

     }


     return NumDontCare;

 }


 /*
  * Compact the tuple-number array a[] (length *len) in place, dropping every
  * element that is flagged in dontcare[].  The surviving elements keep their
  * relative order and *len is updated to the new count.  Called once for
  * spl_left and once for spl_right.
  */
 static void
 removeDontCares(OffsetNumber *a, int *len, const bool *dontcare)
 {
     int         total = *len;
     int         kept = 0;
     int         rd;

     for (rd = 0; rd < total; rd++)
     {
         OffsetNumber item = a[rd];

         /* survivors are copied down to the next free slot */
         if (!dontcare[item])
         {
             a[kept] = item;
             kept++;
         }
     }

     *len = kept;
 }


 /*
  * Assign one don't-care tuple to the left or the right side of the split.
  *
  * Columns are examined in order starting at attno.  For each column the
  * penalty of merging the tuple into the already-computed left and right
  * union keys is compared; the first column where the penalties differ
  * decides, and the tuple goes to the cheaper side.  If every column ties,
  * the tuple goes left.
  *
  * off is the tuple's number, which is appended to spl_left or spl_right.
  */
 static void
 placeOne(Relation r, GISTSTATE *giststate, GistSplitVector *v,
          IndexTuple itup, OffsetNumber off, int attno)
 {
     GISTENTRY   tupKeys[INDEX_MAX_KEYS];
     bool        tupNulls[INDEX_MAX_KEYS];
     bool        sendRight = false;
     int         col;

     gistDeCompressAtt(giststate, r, itup, NULL, (OffsetNumber) 0,
                       tupKeys, tupNulls);

     for (col = attno; col < giststate->nonLeafTupdesc->natts; col++)
     {
         GISTENTRY   unionKey;
         float       costLeft;
         float       costRight;

         gistentryinit(unionKey, v->spl_lattr[col], r, NULL, 0, false);
         costLeft = gistpenalty(giststate, col, &unionKey, v->spl_lisnull[col],
                                &tupKeys[col], tupNulls[col]);

         gistentryinit(unionKey, v->spl_rattr[col], r, NULL, 0, false);
         costRight = gistpenalty(giststate, col, &unionKey, v->spl_risnull[col],
                                 &tupKeys[col], tupNulls[col]);

         /* a tie on this column means the next column gets to decide */
         if (costLeft == costRight)
             continue;

         sendRight = (costLeft > costRight);
         break;
     }

     if (sendRight)
         v->splitVector.spl_right[v->splitVector.spl_nright++] = off;
     else
         v->splitVector.spl_left[v->splitVector.spl_nleft++] = off;
 }


 /*
  * SWAPVAR(s, d, t): exchange the values of s and d, using t as scratch
  * storage.  Every argument is evaluated more than once, so pass plain
  * lvalues without side effects.  The do { } while(0) wrapper makes the
  * expansion behave as a single statement.
  */
 #define SWAPVAR( s, d, t ) \
 do {    \
     (t) = (s); \
     (s) = (d); \
     (d) = (t); \
 } while(0)


 /*
  * Clean up when we did a secondary split but the user-defined PickSplit
  * method didn't support it (leaving spl_ldatum_exists or spl_rdatum_exists
  * true).
  *
  * r, giststate: index relation and its GiST state
  * attno: column the secondary split was done on
  * sv: PickSplit output; its left/right arrays, counts and union datums may
  *     be exchanged here, and both *_exists flags are cleared on return
  * oldL, oldR: union keys of the previously chosen left and right sets
  *
  * We consider whether to swap the left and right outputs of the secondary
  * split; this can be worthwhile if the penalty for merging those tuples into
  * the previously chosen sets is less that way.
  *
  * In any case we must update the union datums for the current column by
  * adding in the previous union keys (oldL/oldR), since the user-defined
  * PickSplit method didn't do so.
  */
 static void
 supportSecondarySplit(Relation r, GISTSTATE *giststate, int attno,
                       GIST_SPLITVEC *sv, Datum oldL, Datum oldR)
 {
     bool        leaveOnLeft = true,
                 tmpBool;
     GISTENTRY   entryL,
                 entryR,
                 entrySL,
                 entrySR;

     /* entryL/entryR wrap the old unions, entrySL/entrySR the new ones */
     gistentryinit(entryL, oldL, r, NULL, 0, false);
     gistentryinit(entryR, oldR, r, NULL, 0, false);
     gistentryinit(entrySL, sv->spl_ldatum, r, NULL, 0, false);
     gistentryinit(entrySR, sv->spl_rdatum, r, NULL, 0, false);

     if (sv->spl_ldatum_exists && sv->spl_rdatum_exists)
     {
         float       penalty1,
                     penalty2;

         /* penalty1: keep sides as PickSplit gave them; penalty2: swapped */
         penalty1 = gistpenalty(giststate, attno, &entryL, false, &entrySL, false) +
             gistpenalty(giststate, attno, &entryR, false, &entrySR, false);
         penalty2 = gistpenalty(giststate, attno, &entryL, false, &entrySR, false) +
             gistpenalty(giststate, attno, &entryR, false, &entrySL, false);

         if (penalty1 > penalty2)
             leaveOnLeft = false;
     }
     else
     {
         GISTENTRY  *entry1 = (sv->spl_ldatum_exists) ? &entryL : &entryR;
         float       penalty1,
                     penalty2;

         /*
          * There is only one previously defined union, so we just choose swap
          * or not by lowest penalty for that side.  We can only get here if a
          * secondary split happened to have all NULLs in its column in the
          * tuples that the outer recursion level had assigned to one side.
          * (Note that the null checks in gistSplitByKey don't prevent the
          * case, because they'll only be checking tuples that were considered
          * don't-cares at the outer recursion level, not the tuples that went
          * into determining the passed-down left and right union keys.)
          */
         penalty1 = gistpenalty(giststate, attno, entry1, false, &entrySL, false);
         penalty2 = gistpenalty(giststate, attno, entry1, false, &entrySR, false);

         if (penalty1 < penalty2)
             leaveOnLeft = sv->spl_ldatum_exists;
         else
             leaveOnLeft = sv->spl_rdatum_exists;
     }

     if (leaveOnLeft == false)
     {
         /*
          * swap left and right
          */
         OffsetNumber *off;
         int         noff;   /* int, like spl_nleft/spl_nright themselves,
                              * so the counts are not narrowed in transit */
         Datum       datum;

         SWAPVAR(sv->spl_left, sv->spl_right, off);
         SWAPVAR(sv->spl_nleft, sv->spl_nright, noff);
         SWAPVAR(sv->spl_ldatum, sv->spl_rdatum, datum);

         /* the entry wrappers must follow the swapped datums */
         gistentryinit(entrySL, sv->spl_ldatum, r, NULL, 0, false);
         gistentryinit(entrySR, sv->spl_rdatum, r, NULL, 0, false);
     }

     /* fold the old union key into the new one on each side that had one */
     if (sv->spl_ldatum_exists)
         gistMakeUnionKey(giststate, attno, &entryL, false, &entrySL, false,
                          &sv->spl_ldatum, &tmpBool);

     if (sv->spl_rdatum_exists)
         gistMakeUnionKey(giststate, attno, &entryR, false, &entrySR, false,
                          &sv->spl_rdatum, &tmpBool);

     sv->spl_ldatum_exists = sv->spl_rdatum_exists = false;
 }


 /*
  * Fallback picksplit.  It is called only when the user-defined picksplit put
  * every key on the same side of the split; that is a bug in the user-defined
  * method, but we prefer to cope rather than fail.
  *
  * Entries FirstOffsetNumber .. entryvec->n - 1 are divided by position: the
  * first half goes left, the rest goes right.  The union datum of each side
  * is then computed with the column's union support function and stored in
  * v->spl_ldatum / v->spl_rdatum.
  */
 static void
 genericPickSplit(GISTSTATE *giststate, GistEntryVector *entryvec, GIST_SPLITVEC *v, int attno)
 {
     OffsetNumber off,
                 lastOff;
     int         half;
     int         nbytes;
     GistEntryVector *sideVec;

     lastOff = entryvec->n - 1;

     nbytes = (lastOff + 2) * sizeof(OffsetNumber);
     v->spl_left = (OffsetNumber *) palloc(nbytes);
     v->spl_right = (OffsetNumber *) palloc(nbytes);
     v->spl_nleft = 0;
     v->spl_nright = 0;

     /* offsets up to and including "half" go left, the others go right */
     half = (lastOff - FirstOffsetNumber + 1) / 2;

     for (off = FirstOffsetNumber; off <= lastOff; off = OffsetNumberNext(off))
     {
         if (off > half)
             v->spl_right[v->spl_nright++] = off;
         else
             v->spl_left[v->spl_nleft++] = off;
     }

     /*
      * Compute the union datum of each side.  Both sides are contiguous runs
      * of entryvec->vector[], so each can be copied into the scratch vector
      * with a single memcpy.  nbytes doubles as the second argument slot of
      * the union function.
      */
     sideVec = palloc(sizeof(GISTENTRY) * entryvec->n + GEVHDRSZ);

     sideVec->n = v->spl_nleft;
     memcpy(sideVec->vector, &entryvec->vector[FirstOffsetNumber],
            sizeof(GISTENTRY) * sideVec->n);
     v->spl_ldatum = FunctionCall2Coll(&giststate->unionFn[attno],
                                       giststate->supportCollation[attno],
                                       PointerGetDatum(sideVec),
                                       PointerGetDatum(&nbytes));

     sideVec->n = v->spl_nright;
     memcpy(sideVec->vector,
            &entryvec->vector[FirstOffsetNumber + v->spl_nleft],
            sizeof(GISTENTRY) * sideVec->n);
     v->spl_rdatum = FunctionCall2Coll(&giststate->unionFn[attno],
                                       giststate->supportCollation[attno],
                                       PointerGetDatum(sideVec),
                                       PointerGetDatum(&nbytes));
 }


 /*
  * Calls user picksplit method for attno column to split tuples into
  * two vectors.
  *
  * r: index relation (used for entry initialization and in the log message)
  * entryvec: keys of column attno; entries 1 .. entryvec->n - 1 are used
  * attno: zero-based column being split on
  * v: working state; v->splitVector receives the split, and the
  *    spl_lattr/spl_rattr/spl_lisnull/spl_risnull slots for attno are updated
  * itup: the tuples being split; tuple number k is itup[k - 1]
  * len: not referenced in this function's body
  * giststate: support functions and tuple descriptors for the index
  *
  * Returns false if split is complete (there are no more index columns, or
  * there is no need to consider them because split is optimal already).
  * This includes the case of exactly one don't-care tuple, which is placed
  * directly via placeOne().
  *
  * Returns true and v->spl_dontcare = NULL if the picksplit result is
  * degenerate (all tuples seem to be don't-cares), so we should just
  * disregard this column and split on the next column(s) instead.
  *
  * Returns true and v->spl_dontcare != NULL if there are don't-care tuples
  * that could be relocated based on the next column(s).  The don't-care
  * tuples have been removed from the split and must be reinserted by caller.
  * There is at least one non-don't-care tuple on each side of the split,
  * and union keys for all columns are updated to include just those tuples.
  *
  * A true result implies there is at least one more index column.
  */
 static bool
 gistUserPicksplit(Relation r, GistEntryVector *entryvec, int attno, GistSplitVector *v,
                   IndexTuple *itup, int len, GISTSTATE *giststate)
 {
     GIST_SPLITVEC *sv = &v->splitVector;

     /*
      * Prepare spl_ldatum/spl_rdatum/spl_ldatum_exists/spl_rdatum_exists in
      * case we are doing a secondary split (see comments in gist.h).
      */
     sv->spl_ldatum_exists = !(v->spl_lisnull[attno]);
     sv->spl_rdatum_exists = !(v->spl_risnull[attno]);
     sv->spl_ldatum = v->spl_lattr[attno];
     sv->spl_rdatum = v->spl_rattr[attno];

     /*
      * Let the opclass-specific PickSplit method do its thing.  Note that at
      * this point we know there are no null keys in the entryvec.
      */
     FunctionCall2Coll(&giststate->picksplitFn[attno],
                       giststate->supportCollation[attno],
                       PointerGetDatum(entryvec),
                       PointerGetDatum(sv));

     if (sv->spl_nleft == 0 || sv->spl_nright == 0)
     {
         /*
          * User-defined picksplit failed to create an actual split, ie it put
          * everything on the same side.  Complain but cope.
          */
         ereport(DEBUG1,
                 (errcode(ERRCODE_INTERNAL_ERROR),
                  errmsg("picksplit method for column %d of index \"%s\" failed",
                         attno + 1, RelationGetRelationName(r)),
                  errhint("The index is not optimal. To optimize it, contact a developer, or try to use the column as the second one in the CREATE INDEX command.")));

         /*
          * Reinit GIST_SPLITVEC. Although these fields are not used by
          * genericPickSplit(), set them up for further processing
          */
         sv->spl_ldatum_exists = !(v->spl_lisnull[attno]);
         sv->spl_rdatum_exists = !(v->spl_risnull[attno]);
         sv->spl_ldatum = v->spl_lattr[attno];
         sv->spl_rdatum = v->spl_rattr[attno];

         /* Do a generic split */
         genericPickSplit(giststate, entryvec, sv, attno);
     }
     else
     {
         /*
          * hack for compatibility with old picksplit API: a trailing
          * InvalidOffsetNumber in either output array is replaced by the
          * last entry number (entryvec->n - 1)
          */
         if (sv->spl_left[sv->spl_nleft - 1] == InvalidOffsetNumber)
             sv->spl_left[sv->spl_nleft - 1] = (OffsetNumber) (entryvec->n - 1);
         if (sv->spl_right[sv->spl_nright - 1] == InvalidOffsetNumber)
             sv->spl_right[sv->spl_nright - 1] = (OffsetNumber) (entryvec->n - 1);
     }

     /* Clean up if PickSplit didn't take care of a secondary split */
     if (sv->spl_ldatum_exists || sv->spl_rdatum_exists)
         supportSecondarySplit(r, giststate, attno, sv,
                               v->spl_lattr[attno], v->spl_rattr[attno]);

     /* emit union datums computed by PickSplit back to v arrays */
     v->spl_lattr[attno] = sv->spl_ldatum;
     v->spl_rattr[attno] = sv->spl_rdatum;
     v->spl_lisnull[attno] = false;
     v->spl_risnull[attno] = false;

     /*
      * If index columns remain, then consider whether we can improve the split
      * by using them.
      */
     v->spl_dontcare = NULL;

     if (attno + 1 < giststate->nonLeafTupdesc->natts)
     {
         int         NumDontCare;

         /*
          * Make a quick check to see if left and right union keys are equal;
          * if so, the split is certainly degenerate, so tell caller to
          * re-split with the next column.
          */
         if (gistKeyIsEQ(giststate, attno, sv->spl_ldatum, sv->spl_rdatum))
             return true;

         /*
          * Locate don't-care tuples, if any.  If there are none, the split is
          * optimal, so just fall out and return false.
          *
          * The flag array is indexed by tuple number and is zero-filled, as
          * findDontCares requires.
          */
         v->spl_dontcare = (bool *) palloc0(sizeof(bool) * (entryvec->n + 1));

         NumDontCare = findDontCares(r, giststate, entryvec->vector, v, attno);

         if (NumDontCare > 0)
         {
             /*
              * Remove don't-cares from spl_left[] and spl_right[].
              */
             removeDontCares(sv->spl_left, &sv->spl_nleft, v->spl_dontcare);
             removeDontCares(sv->spl_right, &sv->spl_nright, v->spl_dontcare);

             /*
              * If all tuples on either side were don't-cares, the split is
              * degenerate, and we're best off to ignore it and split on the
              * next column.  (We used to try to press on with a secondary
              * split by forcing a random tuple on each side to be treated as
              * non-don't-care, but it seems unlikely that that technique
              * really gives a better result.  Note that we don't want to try a
              * secondary split with empty left or right primary split sides,
              * because then there is no union key on that side for the
              * PickSplit function to try to expand, so it can have no good
              * figure of merit for what it's doing.  Also note that this check
              * ensures we can't produce a bogus one-side-only split in the
              * NumDontCare == 1 special case below.)
              */
             if (sv->spl_nleft == 0 || sv->spl_nright == 0)
             {
                 v->spl_dontcare = NULL;
                 return true;
             }

             /*
              * Recompute union keys, considering only non-don't-care tuples.
              * NOTE: this will set union keys for remaining index columns,
              * which will cause later calls of gistUserPicksplit to pass those
              * values down to user-defined PickSplit methods with
              * spl_ldatum_exists/spl_rdatum_exists set true.
              */
             gistunionsubkey(giststate, itup, v);

             if (NumDontCare == 1)
             {
                 /*
                  * If there's only one don't-care tuple then we can't do a
                  * PickSplit on it, so just choose whether to send it left or
                  * right by comparing penalties.  We needed the
                  * gistunionsubkey step anyway so that we have appropriate
                  * union keys for figuring the penalties.
                  */
                 OffsetNumber toMove;

                 /* find it ... */
                 for (toMove = FirstOffsetNumber; toMove < entryvec->n; toMove++)
                 {
                     if (v->spl_dontcare[toMove])
                         break;
                 }
                 Assert(toMove < entryvec->n);

                 /* ... and assign it to cheaper side */
                 placeOne(r, giststate, v, itup[toMove - 1], toMove, attno + 1);

                 /*
                  * At this point the union keys are wrong, but we don't care
                  * because we're done splitting.  The outermost recursion
                  * level of gistSplitByKey will fix things before returning.
                  */
             }
             else
                 return true;
         }
     }

     return false;
 }


 /*
  * Split the page roughly in half by position, without looking at keys.
  *
  * v:   split vector to fill.  spl_left and spl_right are freshly palloc'd
  *      with room for len entries each; spl_nleft and spl_nright are set.
  * len: number of tuples, numbered 1 .. len (gistSplitByKey documents that
  *      this is at least 2).
  *
  * Tuples 1 .. len/2 go to the right side and the remaining ones to the left.
  * The boundary test is inclusive so that both sides are non-empty whenever
  * len >= 2; an exclusive test would put only len/2 - 1 tuples on the right,
  * which is zero for len of 2 or 3.
  */
 static void
 gistSplitHalf(GIST_SPLITVEC *v, int len)
 {
     int         nright = len / 2;
     int         i;

     v->spl_nright = v->spl_nleft = 0;
     v->spl_left = (OffsetNumber *) palloc(len * sizeof(OffsetNumber));
     v->spl_right = (OffsetNumber *) palloc(len * sizeof(OffsetNumber));

     for (i = 1; i <= len; i++)
     {
         if (i <= nright)
             v->spl_right[v->spl_nright++] = i;
         else
             v->spl_left[v->spl_nleft++] = i;
     }

     /* we need not compute union keys, caller took care of it */
 }


 /*
  * gistSplitByKey: main entry point for page-splitting algorithm
  *
  * r: index relation
  * page: page being split
  * itup: array of IndexTuples to be processed
  * len: number of IndexTuples to be processed (must be at least 2)
  * giststate: additional info about index
  * v: working state and output area
  * attno: column we are working on (zero-based index)
  *
  * Outside caller must initialize v->spl_lisnull and v->spl_risnull arrays
  * to all-true.  On return, spl_left/spl_nleft contain indexes of tuples
  * to go left, spl_right/spl_nright contain indexes of tuples to go right,
  * spl_lattr/spl_lisnull contain left-side union key values, and
  * spl_rattr/spl_risnull contain right-side union key values.  Other fields
  * in this struct are workspace for this file.
  *
  * Tuple indexes stored in spl_left/spl_right are 1-based: index k refers to
  * itup[k - 1].
  *
  * Three cases are distinguished for the attno column: every key is null
  * (move on to the next column, or split in half if there is none), some keys
  * are null (nulls go right, non-nulls go left), or no key is null (run the
  * user-defined PickSplit via gistUserPicksplit).
  *
  * Outside caller must pass zero for attno.  The function may internally
  * recurse to the next column by passing attno+1.
  */
 void
 gistSplitByKey(Relation r, Page page, IndexTuple *itup, int len,
                GISTSTATE *giststate, GistSplitVector *v, int attno)
 {
     GistEntryVector *entryvec;
     OffsetNumber *offNullTuples;
     int         nOffNullTuples = 0;
     int         i;

     /* generate the item array, and identify tuples with null keys */
     /* note that entryvec->vector[0] goes unused in this code */
     entryvec = palloc(GEVHDRSZ + (len + 1) * sizeof(GISTENTRY));
     entryvec->n = len + 1;
     offNullTuples = (OffsetNumber *) palloc(len * sizeof(OffsetNumber));

     for (i = 1; i <= len; i++)
     {
         Datum       datum;
         bool        IsNull;

         /* index_getattr takes a 1-based attribute number, hence attno + 1 */
         datum = index_getattr(itup[i - 1], attno + 1, giststate->leafTupdesc,
                               &IsNull);
         gistdentryinit(giststate, attno, &(entryvec->vector[i]),
                        datum, r, page, i,
                        false, IsNull);
         if (IsNull)
             offNullTuples[nOffNullTuples++] = i;
     }

     if (nOffNullTuples == len)
     {
         /*
          * Corner case: All keys in attno column are null, so just transfer
          * our attention to the next column.  If there's no next column, just
          * split page in half.
          */
         v->spl_risnull[attno] = v->spl_lisnull[attno] = true;

         if (attno + 1 < giststate->nonLeafTupdesc->natts)
             gistSplitByKey(r, page, itup, len, giststate, v, attno + 1);
         else
             gistSplitHalf(&v->splitVector, len);
     }
     else if (nOffNullTuples > 0)
     {
         int         j = 0;

         /*
          * We don't want to mix NULL and not-NULL keys on one page, so split
          * nulls to right page and not-nulls to left.
          */
         v->splitVector.spl_right = offNullTuples;
         v->splitVector.spl_nright = nOffNullTuples;
         v->spl_risnull[attno] = true;

         v->splitVector.spl_left = (OffsetNumber *) palloc(len * sizeof(OffsetNumber));
         v->splitVector.spl_nleft = 0;

         /*
          * offNullTuples[] is in ascending order (it was filled while i ran
          * from 1 to len), so one pass with cursor j is enough to send every
          * index that is not listed there to the left side.
          */
         for (i = 1; i <= len; i++)
             if (j < v->splitVector.spl_nright && offNullTuples[j] == i)
                 j++;
             else
                 v->splitVector.spl_left[v->splitVector.spl_nleft++] = i;

         /* Compute union keys, unless outer recursion level will handle it */
         if (attno == 0 && giststate->nonLeafTupdesc->natts == 1)
         {
             v->spl_dontcare = NULL;
             gistunionsubkey(giststate, itup, v);
         }
     }
     else
     {
         /*
          * All keys are not-null, so apply user-defined PickSplit method
          */
         if (gistUserPicksplit(r, entryvec, attno, v, itup, len, giststate))
         {
             /*
              * Splitting on attno column is not optimal, so consider
              * redistributing don't-care tuples according to the next column
              */
             Assert(attno + 1 < giststate->nonLeafTupdesc->natts);

             if (v->spl_dontcare == NULL)
             {
                 /*
                  * This split was actually degenerate, so ignore it altogether
                  * and just split according to the next column.
                  */
                 gistSplitByKey(r, page, itup, len, giststate, v, attno + 1);
             }
             else
             {
                 /*
                  * Form an array of just the don't-care tuples to pass to a
                  * recursive invocation of this function for the next column.
                  * map[] remembers, for each position in newitup[], the
                  * tuple's 1-based index in the original itup[] array.
                  */
                 IndexTuple *newitup = (IndexTuple *) palloc(len * sizeof(IndexTuple));
                 OffsetNumber *map = (OffsetNumber *) palloc(len * sizeof(OffsetNumber));
                 int         newlen = 0;
                 GIST_SPLITVEC backupSplit;

                 for (i = 0; i < len; i++)
                 {
                     if (v->spl_dontcare[i + 1])
                     {
                         newitup[newlen] = itup[i];
                         map[newlen] = i + 1;
                         newlen++;
                     }
                 }

                 Assert(newlen > 0);

                 /*
                  * Make a backup copy of v->splitVector, since the recursive
                  * call will overwrite that with its own result.  The copied
                  * arrays are sized for len entries so that the don't-care
                  * tuples can be appended afterwards.
                  */
                 backupSplit = v->splitVector;
                 backupSplit.spl_left = (OffsetNumber *) palloc(sizeof(OffsetNumber) * len);
                 memcpy(backupSplit.spl_left, v->splitVector.spl_left, sizeof(OffsetNumber) * v->splitVector.spl_nleft);
                 backupSplit.spl_right = (OffsetNumber *) palloc(sizeof(OffsetNumber) * len);
                 memcpy(backupSplit.spl_right, v->splitVector.spl_right, sizeof(OffsetNumber) * v->splitVector.spl_nright);

                 /* Recursively decide how to split the don't-care tuples */
                 gistSplitByKey(r, page, newitup, newlen, giststate, v, attno + 1);

                 /*
                  * Merge result of subsplit with non-don't-care tuples.  The
                  * subsplit's indexes refer to newitup[], so translate them
                  * back through map[] while appending.
                  */
                 for (i = 0; i < v->splitVector.spl_nleft; i++)
                     backupSplit.spl_left[backupSplit.spl_nleft++] = map[v->splitVector.spl_left[i] - 1];
                 for (i = 0; i < v->splitVector.spl_nright; i++)
                     backupSplit.spl_right[backupSplit.spl_nright++] = map[v->splitVector.spl_right[i] - 1];

                 v->splitVector = backupSplit;
             }
         }
     }

     /*
      * If we're handling a multicolumn index, at the end of the recursion
      * recompute the left and right union datums for all index columns.  This
      * makes sure we hand back correct union datums in all corner cases,
      * including when we haven't processed all columns to start with, or when
      * a secondary split moved "don't care" tuples from one side to the other
      * (we really shouldn't assume that that didn't change the union datums).
      *
      * Note: when we're in an internal recursion (attno > 0), we do not worry
      * about whether the union datums we return with are sensible, since
      * calling levels won't care.  Also, in a single-column index, we expect
      * that PickSplit (or the special cases above) produced correct union
      * datums.
      */
     if (attno == 0 && giststate->nonLeafTupdesc->natts > 1)
     {
         v->spl_dontcare = NULL;
         gistunionsubkey(giststate, itup, v);
     }
 }

Page
Pointer Page
Definition: bufpage.h:78

Assert
#define Assert(condition)
Definition: c.h:858

errhint
int errhint(const char *fmt,...)
Definition: elog.c:1319

errcode
int errcode(int sqlerrcode)
Definition: elog.c:859

errmsg
int errmsg(const char *fmt,...)
Definition: elog.c:1072

DEBUG1
#define DEBUG1
Definition: elog.h:30

ereport
#define ereport(elevel,...)
Definition: elog.h:149

FunctionCall2Coll
Datum FunctionCall2Coll(FmgrInfo *flinfo, Oid collation, Datum arg1, Datum arg2)
Definition: fmgr.c:1149

GEVHDRSZ
#define GEVHDRSZ
Definition: gist.h:239

gistentryinit
#define gistentryinit(e, k, r, pg, o, l)
Definition: gist.h:244

gist_private.h

removeDontCares
static void removeDontCares(OffsetNumber *a, int *len, const bool *dontcare)
Definition: gistsplit.c:167

supportSecondarySplit
static void supportSecondarySplit(Relation r, GISTSTATE *giststate, int attno, GIST_SPLITVEC *sv, Datum oldL, Datum oldR)
Definition: gistsplit.c:258

genericPickSplit
static void genericPickSplit(GISTSTATE *giststate, GistEntryVector *entryvec, GIST_SPLITVEC *v, int attno)
Definition: gistsplit.c:344

placeOne
static void placeOne(Relation r, GISTSTATE *giststate, GistSplitVector *v, IndexTuple itup, OffsetNumber off, int attno)
Definition: gistsplit.c:200

gistunionsubkey
static void gistunionsubkey(GISTSTATE *giststate, IndexTuple *itvec, GistSplitVector *spl)
Definition: gistsplit.c:80

gistSplitByKey
void gistSplitByKey(Relation r, Page page, IndexTuple *itup, int len, GISTSTATE *giststate, GistSplitVector *v, int attno)
Definition: gistsplit.c:623

gistUserPicksplit
static bool gistUserPicksplit(Relation r, GistEntryVector *entryvec, int attno, GistSplitVector *v, IndexTuple *itup, int len, GISTSTATE *giststate)
Definition: gistsplit.c:415

findDontCares
static int findDontCares(Relation r, GISTSTATE *giststate, GISTENTRY *valvec, GistSplitVector *spl, int attno)
Definition: gistsplit.c:113

gistunionsubkeyvec
static void gistunionsubkeyvec(GISTSTATE *giststate, IndexTuple *itvec, GistSplitUnion *gsvp)
Definition: gistsplit.c:47

gistSplitHalf
static void gistSplitHalf(GIST_SPLITVEC *v, int len)
Definition: gistsplit.c:585

SWAPVAR
#define SWAPVAR(s, d, t)
Definition: gistsplit.c:237

gistDeCompressAtt
void gistDeCompressAtt(GISTSTATE *giststate, Relation r, IndexTuple tuple, Page p, OffsetNumber o, GISTENTRY *attdata, bool *isnull)
Definition: gistutil.c:296

gistMakeUnionKey
void gistMakeUnionKey(GISTSTATE *giststate, int attno, GISTENTRY *entry1, bool isnull1, GISTENTRY *entry2, bool isnull2, Datum *dst, bool *dstisnull)
Definition: gistutil.c:233

gistMakeUnionItVec
void gistMakeUnionItVec(GISTSTATE *giststate, IndexTuple *itvec, int len, Datum *attr, bool *isnull)
Definition: gistutil.c:155

gistKeyIsEQ
bool gistKeyIsEQ(GISTSTATE *giststate, int attno, Datum a, Datum b)
Definition: gistutil.c:281

gistdentryinit
void gistdentryinit(GISTSTATE *giststate, int nkey, GISTENTRY *e, Datum k, Relation r, Page pg, OffsetNumber o, bool l, bool isNull)
Definition: gistutil.c:547

gistpenalty
float gistpenalty(GISTSTATE *giststate, int attno, GISTENTRY *orig, bool isNullOrig, GISTENTRY *add, bool isNullAdd)
Definition: gistutil.c:724

for
for(;;)
Definition: hashfn_unstable.h:283

a
int a
Definition: isn.c:69

j
int j
Definition: isn.c:74

i
int i
Definition: isn.c:73

index_getattr
static Datum index_getattr(IndexTuple tup, int attnum, TupleDesc tupleDesc, bool *isnull)
Definition: itup.h:117

pfree
void pfree(void *pointer)
Definition: mcxt.c:1520

palloc0
void * palloc0(Size size)
Definition: mcxt.c:1346

palloc
void * palloc(Size size)
Definition: mcxt.c:1316

InvalidOffsetNumber
#define InvalidOffsetNumber
Definition: off.h:26

OffsetNumberNext
#define OffsetNumberNext(offsetNumber)
Definition: off.h:52

OffsetNumber
uint16 OffsetNumber
Definition: off.h:24

FirstOffsetNumber
#define FirstOffsetNumber
Definition: off.h:27

INDEX_MAX_KEYS
#define INDEX_MAX_KEYS
Definition: pg_config_manual.h:69

len
const void size_t len
Definition: pg_crc32c_sse42.c:24

postgres.h

PointerGetDatum
static Datum PointerGetDatum(const void *X)
Definition: postgres.h:322

Datum
uintptr_t Datum
Definition: postgres.h:64

rel.h

RelationGetRelationName
#define RelationGetRelationName(relation)
Definition: rel.h:539

GISTENTRY
Definition: gist.h:159

GISTSTATE
Definition: gist_private.h:76

GISTSTATE::leafTupdesc
TupleDesc leafTupdesc
Definition: gist_private.h:80

GISTSTATE::nonLeafTupdesc
TupleDesc nonLeafTupdesc
Definition: gist_private.h:81

GISTSTATE::supportCollation
Oid supportCollation[INDEX_MAX_KEYS]
Definition: gist_private.h:97

GISTSTATE::unionFn
FmgrInfo unionFn[INDEX_MAX_KEYS]
Definition: gist_private.h:87

GISTSTATE::picksplitFn
FmgrInfo picksplitFn[INDEX_MAX_KEYS]
Definition: gist_private.h:91

GIST_SPLITVEC
Definition: gist.h:141

GIST_SPLITVEC::spl_ldatum_exists
bool spl_ldatum_exists
Definition: gist.h:145

GIST_SPLITVEC::spl_rdatum_exists
bool spl_rdatum_exists
Definition: gist.h:150

GIST_SPLITVEC::spl_nleft
int spl_nleft
Definition: gist.h:143

GIST_SPLITVEC::spl_right
OffsetNumber * spl_right
Definition: gist.h:147

GIST_SPLITVEC::spl_ldatum
Datum spl_ldatum
Definition: gist.h:144

GIST_SPLITVEC::spl_rdatum
Datum spl_rdatum
Definition: gist.h:149

GIST_SPLITVEC::spl_nright
int spl_nright
Definition: gist.h:148

GIST_SPLITVEC::spl_left
OffsetNumber * spl_left
Definition: gist.h:142

GistEntryVector
Definition: gist.h:234

GistEntryVector::vector
GISTENTRY vector[FLEXIBLE_ARRAY_MEMBER]
Definition: gist.h:236

GistEntryVector::n
int32 n
Definition: gist.h:235

GistSplitUnion
Definition: gistsplit.c:32

GistSplitUnion::entries
OffsetNumber * entries
Definition: gistsplit.c:33

GistSplitUnion::isnull
bool * isnull
Definition: gistsplit.c:36

GistSplitUnion::len
int len
Definition: gistsplit.c:34

GistSplitUnion::dontcare
bool * dontcare
Definition: gistsplit.c:37

GistSplitUnion::attr
Datum * attr
Definition: gistsplit.c:35

GistSplitVector
Definition: gist_private.h:236

GistSplitVector::spl_dontcare
bool * spl_dontcare
Definition: gist_private.h:247

GistSplitVector::splitVector
GIST_SPLITVEC splitVector
Definition: gist_private.h:237

GistSplitVector::spl_lattr
Datum spl_lattr[INDEX_MAX_KEYS]
Definition: gist_private.h:239

GistSplitVector::spl_lisnull
bool spl_lisnull[INDEX_MAX_KEYS]
Definition: gist_private.h:241

GistSplitVector::spl_rattr
Datum spl_rattr[INDEX_MAX_KEYS]
Definition: gist_private.h:243

GistSplitVector::spl_risnull
bool spl_risnull[INDEX_MAX_KEYS]
Definition: gist_private.h:245

IndexTupleData
Definition: itup.h:36

RelationData
Definition: rel.h:56

TupleDescData::natts
int natts
Definition: tupdesc.h:81