PostgreSQL Source Code git master
spgtextproc.c File Reference
#include "postgres.h"
#include "access/spgist.h"
#include "catalog/pg_type.h"
#include "common/int.h"
#include "mb/pg_wchar.h"
#include "utils/datum.h"
#include "utils/fmgrprotos.h"
#include "utils/pg_locale.h"
#include "utils/varlena.h"
#include "varatt.h"
Include dependency graph for spgtextproc.c:

Go to the source code of this file.

Data Structures

struct  spgNodePtr
 

Macros

#define SPGIST_MAX_PREFIX_LENGTH   Max((int) (BLCKSZ - 258 * 16 - 100), 32)
 
#define SPG_STRATEGY_ADDITION   (10)
 
#define SPG_IS_COLLATION_AWARE_STRATEGY(s)
 

Typedefs

typedef struct spgNodePtr spgNodePtr
 

Functions

Datum spg_text_config (PG_FUNCTION_ARGS)
 
static Datum formTextDatum (const char *data, int datalen)
 
static int commonPrefix (const char *a, const char *b, int lena, int lenb)
 
static bool searchChar (const Datum *nodeLabels, int nNodes, int16 c, int *i)
 
Datum spg_text_choose (PG_FUNCTION_ARGS)
 
static int cmpNodePtr (const void *a, const void *b)
 
Datum spg_text_picksplit (PG_FUNCTION_ARGS)
 
Datum spg_text_inner_consistent (PG_FUNCTION_ARGS)
 
Datum spg_text_leaf_consistent (PG_FUNCTION_ARGS)
 

Macro Definition Documentation

◆ SPG_IS_COLLATION_AWARE_STRATEGY

#define SPG_IS_COLLATION_AWARE_STRATEGY (   s)
Value:
#define SPG_STRATEGY_ADDITION
Definition: spgtextproc.c:82
#define RTPrefixStrategyNumber
Definition: stratnum.h:78

Definition at line 83 of file spgtextproc.c.

◆ SPG_STRATEGY_ADDITION

#define SPG_STRATEGY_ADDITION   (10)

Definition at line 82 of file spgtextproc.c.

◆ SPGIST_MAX_PREFIX_LENGTH

#define SPGIST_MAX_PREFIX_LENGTH   Max((int) (BLCKSZ - 258 * 16 - 100), 32)

Definition at line 70 of file spgtextproc.c.

Typedef Documentation

◆ spgNodePtr

typedef struct spgNodePtr spgNodePtr

Function Documentation

◆ cmpNodePtr()

static int cmpNodePtr ( const void *  a,
const void *  b 
)
static

Definition at line 323 of file spgtextproc.c.

324{
325 const spgNodePtr *aa = (const spgNodePtr *) a;
326 const spgNodePtr *bb = (const spgNodePtr *) b;
327
328 return pg_cmp_s16(aa->c, bb->c);
329}
static int pg_cmp_s16(int16 a, int16 b)
Definition: int.h:701
int b
Definition: isn.c:74
int a
Definition: isn.c:73

References a, b, spgNodePtr::c, and pg_cmp_s16().

Referenced by spg_text_picksplit().

◆ commonPrefix()

static int commonPrefix ( const char *  a,
const char *  b,
int  lena,
int  lenb 
)
static

Definition at line 138 of file spgtextproc.c.

139{
140 int i = 0;
141
142 while (i < lena && i < lenb && *a == *b)
143 {
144 a++;
145 b++;
146 i++;
147 }
148
149 return i;
150}
int i
Definition: isn.c:77

References a, b, and i.

Referenced by spg_text_choose(), and spg_text_picksplit().

◆ formTextDatum()

static Datum formTextDatum ( const char *  data,
int  datalen 
)
static

Definition at line 113 of file spgtextproc.c.

114{
115 char *p;
116
117 p = (char *) palloc(datalen + VARHDRSZ);
118
119 if (datalen + VARHDRSZ_SHORT <= VARATT_SHORT_MAX)
120 {
121 SET_VARSIZE_SHORT(p, datalen + VARHDRSZ_SHORT);
122 if (datalen)
123 memcpy(p + VARHDRSZ_SHORT, data, datalen);
124 }
125 else
126 {
127 SET_VARSIZE(p, datalen + VARHDRSZ);
128 memcpy(p + VARHDRSZ, data, datalen);
129 }
130
131 return PointerGetDatum(p);
132}
#define VARHDRSZ
Definition: c.h:711
void * palloc(Size size)
Definition: mcxt.c:1365
const void * data
static Datum PointerGetDatum(const void *X)
Definition: postgres.h:332
#define VARHDRSZ_SHORT
Definition: varatt.h:278
static void SET_VARSIZE_SHORT(void *PTR, Size len)
Definition: varatt.h:439
#define VARATT_SHORT_MAX
Definition: varatt.h:279
static void SET_VARSIZE(void *PTR, Size len)
Definition: varatt.h:432

References data, palloc(), PointerGetDatum(), SET_VARSIZE(), SET_VARSIZE_SHORT(), VARATT_SHORT_MAX, VARHDRSZ, and VARHDRSZ_SHORT.

Referenced by spg_text_choose(), and spg_text_picksplit().

◆ searchChar()

static bool searchChar ( const Datum nodeLabels,
int  nNodes,
int16  c,
int *  i 
)
static

Definition at line 158 of file spgtextproc.c.

159{
160 int StopLow = 0,
161 StopHigh = nNodes;
162
163 while (StopLow < StopHigh)
164 {
165 int StopMiddle = (StopLow + StopHigh) >> 1;
166 int16 middle = DatumGetInt16(nodeLabels[StopMiddle]);
167
168 if (c < middle)
169 StopHigh = StopMiddle;
170 else if (c > middle)
171 StopLow = StopMiddle + 1;
172 else
173 {
174 *i = StopMiddle;
175 return true;
176 }
177 }
178
179 *i = StopHigh;
180 return false;
181}
int16_t int16
Definition: c.h:547
static int16 DatumGetInt16(Datum X)
Definition: postgres.h:172
char * c

References DatumGetInt16(), and i.

Referenced by spg_text_choose().

◆ spg_text_choose()

Datum spg_text_choose ( PG_FUNCTION_ARGS  )

Definition at line 184 of file spgtextproc.c.

185{
188 text *inText = DatumGetTextPP(in->datum);
189 char *inStr = VARDATA_ANY(inText);
190 int inSize = VARSIZE_ANY_EXHDR(inText);
191 char *prefixStr = NULL;
192 int prefixSize = 0;
193 int commonLen = 0;
194 int16 nodeChar = 0;
195 int i = 0;
196
197 /* Check for prefix match, set nodeChar to first byte after prefix */
198 if (in->hasPrefix)
199 {
200 text *prefixText = DatumGetTextPP(in->prefixDatum);
201
202 prefixStr = VARDATA_ANY(prefixText);
203 prefixSize = VARSIZE_ANY_EXHDR(prefixText);
204
205 commonLen = commonPrefix(inStr + in->level,
206 prefixStr,
207 inSize - in->level,
208 prefixSize);
209
210 if (commonLen == prefixSize)
211 {
212 if (inSize - in->level > commonLen)
213 nodeChar = *(unsigned char *) (inStr + in->level + commonLen);
214 else
215 nodeChar = -1;
216 }
217 else
218 {
219 /* Must split tuple because incoming value doesn't match prefix */
221
222 if (commonLen == 0)
223 {
224 out->result.splitTuple.prefixHasPrefix = false;
225 }
226 else
227 {
230 formTextDatum(prefixStr, commonLen);
231 }
235 Int16GetDatum(*(unsigned char *) (prefixStr + commonLen));
236
238
239 if (prefixSize - commonLen == 1)
240 {
242 }
243 else
244 {
247 formTextDatum(prefixStr + commonLen + 1,
248 prefixSize - commonLen - 1);
249 }
250
252 }
253 }
254 else if (inSize > in->level)
255 {
256 nodeChar = *(unsigned char *) (inStr + in->level);
257 }
258 else
259 {
260 nodeChar = -1;
261 }
262
263 /* Look up nodeChar in the node label array */
264 if (searchChar(in->nodeLabels, in->nNodes, nodeChar, &i))
265 {
266 /*
267 * Descend to existing node. (If in->allTheSame, the core code will
268 * ignore our nodeN specification here, but that's OK. We still have
269 * to provide the correct levelAdd and restDatum values, and those are
270 * the same regardless of which node gets chosen by core.)
271 */
272 int levelAdd;
273
275 out->result.matchNode.nodeN = i;
276 levelAdd = commonLen;
277 if (nodeChar >= 0)
278 levelAdd++;
279 out->result.matchNode.levelAdd = levelAdd;
280 if (inSize - in->level - levelAdd > 0)
282 formTextDatum(inStr + in->level + levelAdd,
283 inSize - in->level - levelAdd);
284 else
286 formTextDatum(NULL, 0);
287 }
288 else if (in->allTheSame)
289 {
290 /*
291 * Can't use AddNode action, so split the tuple. The upper tuple has
292 * the same prefix as before and uses a dummy node label -2 for the
293 * lower tuple. The lower tuple has no prefix and the same node
294 * labels as the original tuple.
295 *
296 * Note: it might seem tempting to shorten the upper tuple's prefix,
297 * if it has one, then use its last byte as label for the lower tuple.
298 * But that doesn't win since we know the incoming value matches the
299 * whole prefix: we'd just end up splitting the lower tuple again.
300 */
309 }
310 else
311 {
312 /* Add a node for the not-previously-seen nodeChar value */
313 out->resultType = spgAddNode;
314 out->result.addNode.nodeLabel = Int16GetDatum(nodeChar);
315 out->result.addNode.nodeN = i;
316 }
317
319}
#define palloc_object(type)
Definition: fe_memutils.h:74
#define PG_RETURN_VOID()
Definition: fmgr.h:349
#define DatumGetTextPP(X)
Definition: fmgr.h:292
#define PG_GETARG_POINTER(n)
Definition: fmgr.h:276
static Datum Int16GetDatum(int16 X)
Definition: postgres.h:182
uint64_t Datum
Definition: postgres.h:70
@ spgMatchNode
Definition: spgist.h:69
@ spgAddNode
Definition: spgist.h:70
@ spgSplitTuple
Definition: spgist.h:71
static int commonPrefix(const char *a, const char *b, int lena, int lenb)
Definition: spgtextproc.c:138
static Datum formTextDatum(const char *data, int datalen)
Definition: spgtextproc.c:113
static bool searchChar(const Datum *nodeLabels, int nNodes, int16 c, int *i)
Definition: spgtextproc.c:158
Datum * nodeLabels
Definition: spgist.h:64
bool hasPrefix
Definition: spgist.h:61
Datum prefixDatum
Definition: spgist.h:62
int nNodes
Definition: spgist.h:63
Datum datum
Definition: spgist.h:55
int level
Definition: spgist.h:57
bool allTheSame
Definition: spgist.h:60
bool postfixHasPrefix
Definition: spgist.h:101
int childNodeN
Definition: spgist.h:98
spgChooseResultType resultType
Definition: spgist.h:76
int levelAdd
Definition: spgist.h:82
struct spgChooseOut::@53::@54 matchNode
struct spgChooseOut::@53::@56 splitTuple
union spgChooseOut::@53 result
Datum nodeLabel
Definition: spgist.h:87
Datum * prefixNodeLabels
Definition: spgist.h:96
Datum postfixPrefixDatum
Definition: spgist.h:102
Datum restDatum
Definition: spgist.h:83
int prefixNNodes
Definition: spgist.h:95
int nodeN
Definition: spgist.h:81
struct spgChooseOut::@53::@55 addNode
Datum prefixPrefixDatum
Definition: spgist.h:94
bool prefixHasPrefix
Definition: spgist.h:93
Definition: c.h:706
static Size VARSIZE_ANY_EXHDR(const void *PTR)
Definition: varatt.h:472
static char * VARDATA_ANY(const void *PTR)
Definition: varatt.h:486

References spgChooseOut::addNode, spgChooseIn::allTheSame, spgChooseOut::childNodeN, commonPrefix(), spgChooseIn::datum, DatumGetTextPP, formTextDatum(), spgChooseIn::hasPrefix, i, Int16GetDatum(), spgChooseIn::level, spgChooseOut::levelAdd, spgChooseOut::matchNode, spgChooseIn::nNodes, spgChooseOut::nodeLabel, spgChooseIn::nodeLabels, spgChooseOut::nodeN, palloc_object, PG_GETARG_POINTER, PG_RETURN_VOID, spgChooseOut::postfixHasPrefix, spgChooseOut::postfixPrefixDatum, spgChooseIn::prefixDatum, spgChooseOut::prefixHasPrefix, spgChooseOut::prefixNNodes, spgChooseOut::prefixNodeLabels, spgChooseOut::prefixPrefixDatum, spgChooseOut::restDatum, spgChooseOut::result, spgChooseOut::resultType, searchChar(), spgAddNode, spgMatchNode, spgSplitTuple, spgChooseOut::splitTuple, VARDATA_ANY(), and VARSIZE_ANY_EXHDR().

◆ spg_text_config()

Datum spg_text_config ( PG_FUNCTION_ARGS  )

Definition at line 96 of file spgtextproc.c.

97{
98 /* spgConfigIn *cfgin = (spgConfigIn *) PG_GETARG_POINTER(0); */
100
101 cfg->prefixType = TEXTOID;
102 cfg->labelType = INT2OID;
103 cfg->canReturnData = true;
104 cfg->longValuesOK = true; /* suffixing will shorten long values */
106}
bool longValuesOK
Definition: spgist.h:47
bool canReturnData
Definition: spgist.h:46
Oid labelType
Definition: spgist.h:44
Oid prefixType
Definition: spgist.h:43

References spgConfigOut::canReturnData, spgConfigOut::labelType, spgConfigOut::longValuesOK, PG_GETARG_POINTER, PG_RETURN_VOID, and spgConfigOut::prefixType.

◆ spg_text_inner_consistent()

Datum spg_text_inner_consistent ( PG_FUNCTION_ARGS  )

Definition at line 425 of file spgtextproc.c.

426{
430 text *reconstructedValue;
431 text *reconstrText;
432 int maxReconstrLen;
433 text *prefixText = NULL;
434 int prefixSize = 0;
435 int i;
436
437 /*
438 * Reconstruct values represented at this tuple, including parent data,
439 * prefix of this tuple if any, and the node label if it's non-dummy.
440 * in->level should be the length of the previously reconstructed value,
441 * and the number of bytes added here is prefixSize or prefixSize + 1.
442 *
443 * Note: we assume that in->reconstructedValue isn't toasted and doesn't
444 * have a short varlena header. This is okay because it must have been
445 * created by a previous invocation of this routine, and we always emit
446 * long-format reconstructed values.
447 */
448 reconstructedValue = (text *) DatumGetPointer(in->reconstructedValue);
449 Assert(reconstructedValue == NULL ? in->level == 0 :
450 VARSIZE_ANY_EXHDR(reconstructedValue) == in->level);
451
452 maxReconstrLen = in->level + 1;
453 if (in->hasPrefix)
454 {
455 prefixText = DatumGetTextPP(in->prefixDatum);
456 prefixSize = VARSIZE_ANY_EXHDR(prefixText);
457 maxReconstrLen += prefixSize;
458 }
459
460 reconstrText = palloc(VARHDRSZ + maxReconstrLen);
461 SET_VARSIZE(reconstrText, VARHDRSZ + maxReconstrLen);
462
463 if (in->level)
464 memcpy(VARDATA(reconstrText),
465 VARDATA(reconstructedValue),
466 in->level);
467 if (prefixSize)
468 memcpy(((char *) VARDATA(reconstrText)) + in->level,
469 VARDATA_ANY(prefixText),
470 prefixSize);
471 /* last byte of reconstrText will be filled in below */
472
473 /*
474 * Scan the child nodes. For each one, complete the reconstructed value
475 * and see if it's consistent with the query. If so, emit an entry into
476 * the output arrays.
477 */
478 out->nodeNumbers = palloc_array(int, in->nNodes);
479 out->levelAdds = palloc_array(int, in->nNodes);
481 out->nNodes = 0;
482
483 for (i = 0; i < in->nNodes; i++)
484 {
485 int16 nodeChar = DatumGetInt16(in->nodeLabels[i]);
486 int thisLen;
487 bool res = true;
488 int j;
489
490 /* If nodeChar is a dummy value, don't include it in data */
491 if (nodeChar <= 0)
492 thisLen = maxReconstrLen - 1;
493 else
494 {
495 ((unsigned char *) VARDATA(reconstrText))[maxReconstrLen - 1] = nodeChar;
496 thisLen = maxReconstrLen;
497 }
498
499 for (j = 0; j < in->nkeys; j++)
500 {
501 StrategyNumber strategy = in->scankeys[j].sk_strategy;
502 text *inText;
503 int inSize;
504 int r;
505
506 /*
507 * If it's a collation-aware operator, but the collation is C, we
508 * can treat it as non-collation-aware. With non-C collation we
509 * need to traverse whole tree :-( so there's no point in making
510 * any check here. (Note also that our reconstructed value may
511 * well end with a partial multibyte character, so that applying
512 * any encoding-sensitive test to it would be risky anyhow.)
513 */
515 {
516 if (collate_is_c)
517 strategy -= SPG_STRATEGY_ADDITION;
518 else
519 continue;
520 }
521
522 inText = DatumGetTextPP(in->scankeys[j].sk_argument);
523 inSize = VARSIZE_ANY_EXHDR(inText);
524
525 r = memcmp(VARDATA(reconstrText), VARDATA_ANY(inText),
526 Min(inSize, thisLen));
527
528 switch (strategy)
529 {
532 if (r > 0)
533 res = false;
534 break;
536 if (r != 0 || inSize < thisLen)
537 res = false;
538 break;
541 if (r < 0)
542 res = false;
543 break;
545 if (r != 0)
546 res = false;
547 break;
548 default:
549 elog(ERROR, "unrecognized strategy number: %d",
550 in->scankeys[j].sk_strategy);
551 break;
552 }
553
554 if (!res)
555 break; /* no need to consider remaining conditions */
556 }
557
558 if (res)
559 {
560 out->nodeNumbers[out->nNodes] = i;
561 out->levelAdds[out->nNodes] = thisLen - in->level;
562 SET_VARSIZE(reconstrText, VARHDRSZ + thisLen);
563 out->reconstructedValues[out->nNodes] =
564 datumCopy(PointerGetDatum(reconstrText), false, -1);
565 out->nNodes++;
566 }
567 }
568
570}
#define Min(x, y)
Definition: c.h:1016
Datum datumCopy(Datum value, bool typByVal, int typLen)
Definition: datum.c:132
#define ERROR
Definition: elog.h:39
#define elog(elevel,...)
Definition: elog.h:226
#define palloc_array(type, count)
Definition: fe_memutils.h:76
#define PG_GET_COLLATION()
Definition: fmgr.h:198
Assert(PointerIsAligned(start, uint64))
int j
Definition: isn.c:78
pg_locale_t pg_newlocale_from_collation(Oid collid)
Definition: pg_locale.c:1186
static Pointer DatumGetPointer(Datum X)
Definition: postgres.h:322
#define SPG_IS_COLLATION_AWARE_STRATEGY(s)
Definition: spgtextproc.c:83
uint16 StrategyNumber
Definition: stratnum.h:22
#define BTGreaterStrategyNumber
Definition: stratnum.h:33
#define BTLessStrategyNumber
Definition: stratnum.h:29
#define BTEqualStrategyNumber
Definition: stratnum.h:31
#define BTLessEqualStrategyNumber
Definition: stratnum.h:30
#define BTGreaterEqualStrategyNumber
Definition: stratnum.h:32
Datum sk_argument
Definition: skey.h:72
StrategyNumber sk_strategy
Definition: skey.h:68
Datum reconstructedValue
Definition: spgist.h:140
ScanKey scankeys
Definition: spgist.h:134
Datum * nodeLabels
Definition: spgist.h:151
Datum * reconstructedValues
Definition: spgist.h:159
static char * VARDATA(const void *PTR)
Definition: varatt.h:305

References Assert(), BTEqualStrategyNumber, BTGreaterEqualStrategyNumber, BTGreaterStrategyNumber, BTLessEqualStrategyNumber, BTLessStrategyNumber, pg_locale_struct::collate_is_c, datumCopy(), DatumGetInt16(), DatumGetPointer(), DatumGetTextPP, elog, ERROR, spgInnerConsistentIn::hasPrefix, i, j, spgInnerConsistentIn::level, spgInnerConsistentOut::levelAdds, Min, spgInnerConsistentIn::nkeys, spgInnerConsistentIn::nNodes, spgInnerConsistentOut::nNodes, spgInnerConsistentIn::nodeLabels, spgInnerConsistentOut::nodeNumbers, palloc(), palloc_array, PG_GET_COLLATION, PG_GETARG_POINTER, pg_newlocale_from_collation(), PG_RETURN_VOID, PointerGetDatum(), spgInnerConsistentIn::prefixDatum, spgInnerConsistentIn::reconstructedValue, spgInnerConsistentOut::reconstructedValues, RTPrefixStrategyNumber, spgInnerConsistentIn::scankeys, SET_VARSIZE(), ScanKeyData::sk_argument, ScanKeyData::sk_strategy, SPG_IS_COLLATION_AWARE_STRATEGY, SPG_STRATEGY_ADDITION, VARDATA(), VARDATA_ANY(), VARHDRSZ, and VARSIZE_ANY_EXHDR().

◆ spg_text_leaf_consistent()

Datum spg_text_leaf_consistent ( PG_FUNCTION_ARGS  )

Definition at line 573 of file spgtextproc.c.

574{
577 int level = in->level;
578 text *leafValue,
579 *reconstrValue = NULL;
580 char *fullValue;
581 int fullLen;
582 bool res;
583 int j;
584
585 /* all tests are exact */
586 out->recheck = false;
587
588 leafValue = DatumGetTextPP(in->leafDatum);
589
590 /* As above, in->reconstructedValue isn't toasted or short. */
592 reconstrValue = (text *) DatumGetPointer(in->reconstructedValue);
593
594 Assert(reconstrValue == NULL ? level == 0 :
595 VARSIZE_ANY_EXHDR(reconstrValue) == level);
596
597 /* Reconstruct the full string represented by this leaf tuple */
598 fullLen = level + VARSIZE_ANY_EXHDR(leafValue);
599 if (VARSIZE_ANY_EXHDR(leafValue) == 0 && level > 0)
600 {
601 fullValue = VARDATA(reconstrValue);
602 out->leafValue = PointerGetDatum(reconstrValue);
603 }
604 else
605 {
606 text *fullText = palloc(VARHDRSZ + fullLen);
607
608 SET_VARSIZE(fullText, VARHDRSZ + fullLen);
609 fullValue = VARDATA(fullText);
610 if (level)
611 memcpy(fullValue, VARDATA(reconstrValue), level);
612 if (VARSIZE_ANY_EXHDR(leafValue) > 0)
613 memcpy(fullValue + level, VARDATA_ANY(leafValue),
614 VARSIZE_ANY_EXHDR(leafValue));
615 out->leafValue = PointerGetDatum(fullText);
616 }
617
618 /* Perform the required comparison(s) */
619 res = true;
620 for (j = 0; j < in->nkeys; j++)
621 {
622 StrategyNumber strategy = in->scankeys[j].sk_strategy;
624 int queryLen = VARSIZE_ANY_EXHDR(query);
625 int r;
626
627 if (strategy == RTPrefixStrategyNumber)
628 {
629 /*
630 * if level >= length of query then reconstrValue must begin with
631 * query (prefix) string, so we don't need to check it again.
632 */
633 res = (level >= queryLen) ||
636 out->leafValue,
637 PointerGetDatum(query)));
638
639 if (!res) /* no need to consider remaining conditions */
640 break;
641
642 continue;
643 }
644
646 {
647 /* Collation-aware comparison */
648 strategy -= SPG_STRATEGY_ADDITION;
649
650 /* If asserts enabled, verify encoding of reconstructed string */
651 Assert(pg_verifymbstr(fullValue, fullLen, false));
652
653 r = varstr_cmp(fullValue, fullLen,
654 VARDATA_ANY(query), queryLen,
656 }
657 else
658 {
659 /* Non-collation-aware comparison */
660 r = memcmp(fullValue, VARDATA_ANY(query), Min(queryLen, fullLen));
661
662 if (r == 0)
663 {
664 if (queryLen > fullLen)
665 r = -1;
666 else if (queryLen < fullLen)
667 r = 1;
668 }
669 }
670
671 switch (strategy)
672 {
674 res = (r < 0);
675 break;
677 res = (r <= 0);
678 break;
680 res = (r == 0);
681 break;
683 res = (r >= 0);
684 break;
686 res = (r > 0);
687 break;
688 default:
689 elog(ERROR, "unrecognized strategy number: %d",
690 in->scankeys[j].sk_strategy);
691 res = false;
692 break;
693 }
694
695 if (!res)
696 break; /* no need to consider remaining conditions */
697 }
698
699 PG_RETURN_BOOL(res);
700}
Datum DirectFunctionCall2Coll(PGFunction func, Oid collation, Datum arg1, Datum arg2)
Definition: fmgr.c:813
#define PG_RETURN_BOOL(x)
Definition: fmgr.h:359
bool pg_verifymbstr(const char *mbstr, int len, bool noError)
Definition: mbutils.c:1559
static bool DatumGetBool(Datum X)
Definition: postgres.h:100
ScanKey scankeys
Definition: spgist.h:169
Datum reconstructedValue
Definition: spgist.h:175
int varstr_cmp(const char *arg1, int len1, const char *arg2, int len2, Oid collid)
Definition: varlena.c:1308
Datum text_starts_with(PG_FUNCTION_ARGS)
Definition: varlena.c:1545

References Assert(), BTEqualStrategyNumber, BTGreaterEqualStrategyNumber, BTGreaterStrategyNumber, BTLessEqualStrategyNumber, BTLessStrategyNumber, DatumGetBool(), DatumGetPointer(), DatumGetTextPP, DirectFunctionCall2Coll(), elog, ERROR, j, spgLeafConsistentIn::leafDatum, spgLeafConsistentOut::leafValue, spgLeafConsistentIn::level, Min, spgLeafConsistentIn::nkeys, palloc(), PG_GET_COLLATION, PG_GETARG_POINTER, PG_RETURN_BOOL, pg_verifymbstr(), PointerGetDatum(), spgLeafConsistentOut::recheck, spgLeafConsistentIn::reconstructedValue, RTPrefixStrategyNumber, spgLeafConsistentIn::scankeys, SET_VARSIZE(), ScanKeyData::sk_argument, ScanKeyData::sk_strategy, SPG_IS_COLLATION_AWARE_STRATEGY, SPG_STRATEGY_ADDITION, text_starts_with(), VARDATA(), VARDATA_ANY(), VARHDRSZ, VARSIZE_ANY_EXHDR(), and varstr_cmp().

◆ spg_text_picksplit()

Datum spg_text_picksplit ( PG_FUNCTION_ARGS  )

Definition at line 332 of file spgtextproc.c.

333{
336 text *text0 = DatumGetTextPP(in->datums[0]);
337 int i,
338 commonLen;
339 spgNodePtr *nodes;
340
341 /* Identify longest common prefix, if any */
342 commonLen = VARSIZE_ANY_EXHDR(text0);
343 for (i = 1; i < in->nTuples && commonLen > 0; i++)
344 {
345 text *texti = DatumGetTextPP(in->datums[i]);
346 int tmp = commonPrefix(VARDATA_ANY(text0),
347 VARDATA_ANY(texti),
348 VARSIZE_ANY_EXHDR(text0),
349 VARSIZE_ANY_EXHDR(texti));
350
351 if (tmp < commonLen)
352 commonLen = tmp;
353 }
354
355 /*
356 * Limit the prefix length, if necessary, to ensure that the resulting
357 * inner tuple will fit on a page.
358 */
359 commonLen = Min(commonLen, SPGIST_MAX_PREFIX_LENGTH);
360
361 /* Set node prefix to be that string, if it's not empty */
362 if (commonLen == 0)
363 {
364 out->hasPrefix = false;
365 }
366 else
367 {
368 out->hasPrefix = true;
369 out->prefixDatum = formTextDatum(VARDATA_ANY(text0), commonLen);
370 }
371
372 /* Extract the node label (first non-common byte) from each value */
373 nodes = palloc_array(spgNodePtr, in->nTuples);
374
375 for (i = 0; i < in->nTuples; i++)
376 {
377 text *texti = DatumGetTextPP(in->datums[i]);
378
379 if (commonLen < VARSIZE_ANY_EXHDR(texti))
380 nodes[i].c = *(unsigned char *) (VARDATA_ANY(texti) + commonLen);
381 else
382 nodes[i].c = -1; /* use -1 if string is all common */
383 nodes[i].i = i;
384 nodes[i].d = in->datums[i];
385 }
386
387 /*
388 * Sort by label values so that we can group the values into nodes. This
389 * also ensures that the nodes are ordered by label value, allowing the
390 * use of binary search in searchChar.
391 */
392 qsort(nodes, in->nTuples, sizeof(*nodes), cmpNodePtr);
393
394 /* And emit results */
395 out->nNodes = 0;
397 out->mapTuplesToNodes = palloc_array(int, in->nTuples);
399
400 for (i = 0; i < in->nTuples; i++)
401 {
402 text *texti = DatumGetTextPP(nodes[i].d);
403 Datum leafD;
404
405 if (i == 0 || nodes[i].c != nodes[i - 1].c)
406 {
407 out->nodeLabels[out->nNodes] = Int16GetDatum(nodes[i].c);
408 out->nNodes++;
409 }
410
411 if (commonLen < VARSIZE_ANY_EXHDR(texti))
412 leafD = formTextDatum(VARDATA_ANY(texti) + commonLen + 1,
413 VARSIZE_ANY_EXHDR(texti) - commonLen - 1);
414 else
415 leafD = formTextDatum(NULL, 0);
416
417 out->leafTupleDatums[nodes[i].i] = leafD;
418 out->mapTuplesToNodes[nodes[i].i] = out->nNodes - 1;
419 }
420
422}
#define qsort(a, b, c, d)
Definition: port.h:499
static int cmpNodePtr(const void *a, const void *b)
Definition: spgtextproc.c:323
#define SPGIST_MAX_PREFIX_LENGTH
Definition: spgtextproc.c:70
Datum * datums
Definition: spgist.h:113
bool hasPrefix
Definition: spgist.h:119
int * mapTuplesToNodes
Definition: spgist.h:125
Datum * nodeLabels
Definition: spgist.h:123
Datum * leafTupleDatums
Definition: spgist.h:126
Datum prefixDatum
Definition: spgist.h:120

References spgNodePtr::c, cmpNodePtr(), commonPrefix(), spgNodePtr::d, DatumGetTextPP, spgPickSplitIn::datums, formTextDatum(), spgPickSplitOut::hasPrefix, i, spgNodePtr::i, Int16GetDatum(), spgPickSplitOut::leafTupleDatums, spgPickSplitOut::mapTuplesToNodes, Min, spgPickSplitOut::nNodes, spgPickSplitOut::nodeLabels, spgPickSplitIn::nTuples, palloc_array, PG_GETARG_POINTER, PG_RETURN_VOID, spgPickSplitOut::prefixDatum, qsort, SPGIST_MAX_PREFIX_LENGTH, VARDATA_ANY(), and VARSIZE_ANY_EXHDR().