PostgreSQL Source Code git master
All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Pages
spgtextproc.c File Reference
#include "postgres.h"
#include "access/spgist.h"
#include "catalog/pg_type.h"
#include "common/int.h"
#include "mb/pg_wchar.h"
#include "utils/datum.h"
#include "utils/fmgrprotos.h"
#include "utils/pg_locale.h"
#include "utils/varlena.h"
#include "varatt.h"
Include dependency graph for spgtextproc.c:

Go to the source code of this file.

Data Structures

struct  spgNodePtr
 

Macros

#define SPGIST_MAX_PREFIX_LENGTH   Max((int) (BLCKSZ - 258 * 16 - 100), 32)
 
#define SPG_STRATEGY_ADDITION   (10)
 
#define SPG_IS_COLLATION_AWARE_STRATEGY(s)
 

Typedefs

typedef struct spgNodePtr spgNodePtr
 

Functions

Datum spg_text_config (PG_FUNCTION_ARGS)
 
static Datum formTextDatum (const char *data, int datalen)
 
static int commonPrefix (const char *a, const char *b, int lena, int lenb)
 
static bool searchChar (Datum *nodeLabels, int nNodes, int16 c, int *i)
 
Datum spg_text_choose (PG_FUNCTION_ARGS)
 
static int cmpNodePtr (const void *a, const void *b)
 
Datum spg_text_picksplit (PG_FUNCTION_ARGS)
 
Datum spg_text_inner_consistent (PG_FUNCTION_ARGS)
 
Datum spg_text_leaf_consistent (PG_FUNCTION_ARGS)
 

Macro Definition Documentation

◆ SPG_IS_COLLATION_AWARE_STRATEGY

#define SPG_IS_COLLATION_AWARE_STRATEGY (   s)
Value:
#define SPG_STRATEGY_ADDITION
Definition: spgtextproc.c:82
#define RTPrefixStrategyNumber
Definition: stratnum.h:78

Definition at line 83 of file spgtextproc.c.

◆ SPG_STRATEGY_ADDITION

#define SPG_STRATEGY_ADDITION   (10)

Definition at line 82 of file spgtextproc.c.

◆ SPGIST_MAX_PREFIX_LENGTH

#define SPGIST_MAX_PREFIX_LENGTH   Max((int) (BLCKSZ - 258 * 16 - 100), 32)

Definition at line 70 of file spgtextproc.c.

Typedef Documentation

◆ spgNodePtr

typedef struct spgNodePtr spgNodePtr

Function Documentation

◆ cmpNodePtr()

static int cmpNodePtr ( const void *  a,
const void *  b 
)
static

Definition at line 324 of file spgtextproc.c.

325{
326 const spgNodePtr *aa = (const spgNodePtr *) a;
327 const spgNodePtr *bb = (const spgNodePtr *) b;
328
329 return pg_cmp_s16(aa->c, bb->c);
330}
static int pg_cmp_s16(int16 a, int16 b)
Definition: int.h:634
int b
Definition: isn.c:69
int a
Definition: isn.c:68

References a, b, spgNodePtr::c, and pg_cmp_s16().

Referenced by spg_text_picksplit().

◆ commonPrefix()

static int commonPrefix ( const char *  a,
const char *  b,
int  lena,
int  lenb 
)
static

Definition at line 138 of file spgtextproc.c.

139{
140 int i = 0;
141
142 while (i < lena && i < lenb && *a == *b)
143 {
144 a++;
145 b++;
146 i++;
147 }
148
149 return i;
150}
int i
Definition: isn.c:72

References a, b, and i.

Referenced by spg_text_choose(), and spg_text_picksplit().

◆ formTextDatum()

static Datum formTextDatum ( const char *  data,
int  datalen 
)
static

Definition at line 113 of file spgtextproc.c.

114{
115 char *p;
116
117 p = (char *) palloc(datalen + VARHDRSZ);
118
119 if (datalen + VARHDRSZ_SHORT <= VARATT_SHORT_MAX)
120 {
121 SET_VARSIZE_SHORT(p, datalen + VARHDRSZ_SHORT);
122 if (datalen)
123 memcpy(p + VARHDRSZ_SHORT, data, datalen);
124 }
125 else
126 {
127 SET_VARSIZE(p, datalen + VARHDRSZ);
128 memcpy(p + VARHDRSZ, data, datalen);
129 }
130
131 return PointerGetDatum(p);
132}
#define VARHDRSZ
Definition: c.h:663
void * palloc(Size size)
Definition: mcxt.c:1317
const void * data
static Datum PointerGetDatum(const void *X)
Definition: postgres.h:327
#define VARHDRSZ_SHORT
Definition: varatt.h:255
#define SET_VARSIZE_SHORT(PTR, len)
Definition: varatt.h:306
#define SET_VARSIZE(PTR, len)
Definition: varatt.h:305
#define VARATT_SHORT_MAX
Definition: varatt.h:257

References data, palloc(), PointerGetDatum(), SET_VARSIZE, SET_VARSIZE_SHORT, VARATT_SHORT_MAX, VARHDRSZ, and VARHDRSZ_SHORT.

Referenced by spg_text_choose(), and spg_text_picksplit().

◆ searchChar()

static bool searchChar ( Datum nodeLabels,
int  nNodes,
int16  c,
int *  i 
)
static

Definition at line 158 of file spgtextproc.c.

159{
160 int StopLow = 0,
161 StopHigh = nNodes;
162
163 while (StopLow < StopHigh)
164 {
165 int StopMiddle = (StopLow + StopHigh) >> 1;
166 int16 middle = DatumGetInt16(nodeLabels[StopMiddle]);
167
168 if (c < middle)
169 StopHigh = StopMiddle;
170 else if (c > middle)
171 StopLow = StopMiddle + 1;
172 else
173 {
174 *i = StopMiddle;
175 return true;
176 }
177 }
178
179 *i = StopHigh;
180 return false;
181}
int16_t int16
Definition: c.h:497
static int16 DatumGetInt16(Datum X)
Definition: postgres.h:167
char * c

References DatumGetInt16(), and i.

Referenced by spg_text_choose().

◆ spg_text_choose()

Datum spg_text_choose ( PG_FUNCTION_ARGS  )

Definition at line 184 of file spgtextproc.c.

185{
188 text *inText = DatumGetTextPP(in->datum);
189 char *inStr = VARDATA_ANY(inText);
190 int inSize = VARSIZE_ANY_EXHDR(inText);
191 char *prefixStr = NULL;
192 int prefixSize = 0;
193 int commonLen = 0;
194 int16 nodeChar = 0;
195 int i = 0;
196
197 /* Check for prefix match, set nodeChar to first byte after prefix */
198 if (in->hasPrefix)
199 {
200 text *prefixText = DatumGetTextPP(in->prefixDatum);
201
202 prefixStr = VARDATA_ANY(prefixText);
203 prefixSize = VARSIZE_ANY_EXHDR(prefixText);
204
205 commonLen = commonPrefix(inStr + in->level,
206 prefixStr,
207 inSize - in->level,
208 prefixSize);
209
210 if (commonLen == prefixSize)
211 {
212 if (inSize - in->level > commonLen)
213 nodeChar = *(unsigned char *) (inStr + in->level + commonLen);
214 else
215 nodeChar = -1;
216 }
217 else
218 {
219 /* Must split tuple because incoming value doesn't match prefix */
221
222 if (commonLen == 0)
223 {
224 out->result.splitTuple.prefixHasPrefix = false;
225 }
226 else
227 {
230 formTextDatum(prefixStr, commonLen);
231 }
234 (Datum *) palloc(sizeof(Datum));
236 Int16GetDatum(*(unsigned char *) (prefixStr + commonLen));
237
239
240 if (prefixSize - commonLen == 1)
241 {
243 }
244 else
245 {
248 formTextDatum(prefixStr + commonLen + 1,
249 prefixSize - commonLen - 1);
250 }
251
253 }
254 }
255 else if (inSize > in->level)
256 {
257 nodeChar = *(unsigned char *) (inStr + in->level);
258 }
259 else
260 {
261 nodeChar = -1;
262 }
263
264 /* Look up nodeChar in the node label array */
265 if (searchChar(in->nodeLabels, in->nNodes, nodeChar, &i))
266 {
267 /*
268 * Descend to existing node. (If in->allTheSame, the core code will
269 * ignore our nodeN specification here, but that's OK. We still have
270 * to provide the correct levelAdd and restDatum values, and those are
271 * the same regardless of which node gets chosen by core.)
272 */
273 int levelAdd;
274
276 out->result.matchNode.nodeN = i;
277 levelAdd = commonLen;
278 if (nodeChar >= 0)
279 levelAdd++;
280 out->result.matchNode.levelAdd = levelAdd;
281 if (inSize - in->level - levelAdd > 0)
283 formTextDatum(inStr + in->level + levelAdd,
284 inSize - in->level - levelAdd);
285 else
287 formTextDatum(NULL, 0);
288 }
289 else if (in->allTheSame)
290 {
291 /*
292 * Can't use AddNode action, so split the tuple. The upper tuple has
293 * the same prefix as before and uses a dummy node label -2 for the
294 * lower tuple. The lower tuple has no prefix and the same node
295 * labels as the original tuple.
296 *
297 * Note: it might seem tempting to shorten the upper tuple's prefix,
298 * if it has one, then use its last byte as label for the lower tuple.
299 * But that doesn't win since we know the incoming value matches the
300 * whole prefix: we'd just end up splitting the lower tuple again.
301 */
310 }
311 else
312 {
313 /* Add a node for the not-previously-seen nodeChar value */
314 out->resultType = spgAddNode;
315 out->result.addNode.nodeLabel = Int16GetDatum(nodeChar);
316 out->result.addNode.nodeN = i;
317 }
318
320}
#define PG_RETURN_VOID()
Definition: fmgr.h:349
#define DatumGetTextPP(X)
Definition: fmgr.h:292
#define PG_GETARG_POINTER(n)
Definition: fmgr.h:276
uintptr_t Datum
Definition: postgres.h:69
static Datum Int16GetDatum(int16 X)
Definition: postgres.h:177
@ spgMatchNode
Definition: spgist.h:69
@ spgAddNode
Definition: spgist.h:70
@ spgSplitTuple
Definition: spgist.h:71
static int commonPrefix(const char *a, const char *b, int lena, int lenb)
Definition: spgtextproc.c:138
static Datum formTextDatum(const char *data, int datalen)
Definition: spgtextproc.c:113
static bool searchChar(Datum *nodeLabels, int nNodes, int16 c, int *i)
Definition: spgtextproc.c:158
Datum * nodeLabels
Definition: spgist.h:64
bool hasPrefix
Definition: spgist.h:61
Datum prefixDatum
Definition: spgist.h:62
int nNodes
Definition: spgist.h:63
Datum datum
Definition: spgist.h:55
int level
Definition: spgist.h:57
bool allTheSame
Definition: spgist.h:60
bool postfixHasPrefix
Definition: spgist.h:101
int childNodeN
Definition: spgist.h:98
spgChooseResultType resultType
Definition: spgist.h:76
int levelAdd
Definition: spgist.h:82
struct spgChooseOut::@51::@54 splitTuple
Datum nodeLabel
Definition: spgist.h:87
Datum * prefixNodeLabels
Definition: spgist.h:96
Datum postfixPrefixDatum
Definition: spgist.h:102
Datum restDatum
Definition: spgist.h:83
int prefixNNodes
Definition: spgist.h:95
int nodeN
Definition: spgist.h:81
Datum prefixPrefixDatum
Definition: spgist.h:94
struct spgChooseOut::@51::@53 addNode
bool prefixHasPrefix
Definition: spgist.h:93
struct spgChooseOut::@51::@52 matchNode
union spgChooseOut::@51 result
Definition: c.h:658
#define VARDATA_ANY(PTR)
Definition: varatt.h:324
#define VARSIZE_ANY_EXHDR(PTR)
Definition: varatt.h:317

References spgChooseOut::addNode, spgChooseIn::allTheSame, spgChooseOut::childNodeN, commonPrefix(), spgChooseIn::datum, DatumGetTextPP, formTextDatum(), spgChooseIn::hasPrefix, i, Int16GetDatum(), spgChooseIn::level, spgChooseOut::levelAdd, spgChooseOut::matchNode, spgChooseIn::nNodes, spgChooseOut::nodeLabel, spgChooseIn::nodeLabels, spgChooseOut::nodeN, palloc(), PG_GETARG_POINTER, PG_RETURN_VOID, spgChooseOut::postfixHasPrefix, spgChooseOut::postfixPrefixDatum, spgChooseIn::prefixDatum, spgChooseOut::prefixHasPrefix, spgChooseOut::prefixNNodes, spgChooseOut::prefixNodeLabels, spgChooseOut::prefixPrefixDatum, spgChooseOut::restDatum, spgChooseOut::result, spgChooseOut::resultType, searchChar(), spgAddNode, spgMatchNode, spgSplitTuple, spgChooseOut::splitTuple, VARDATA_ANY, and VARSIZE_ANY_EXHDR.

◆ spg_text_config()

Datum spg_text_config ( PG_FUNCTION_ARGS  )

Definition at line 96 of file spgtextproc.c.

97{
98 /* spgConfigIn *cfgin = (spgConfigIn *) PG_GETARG_POINTER(0); */
100
101 cfg->prefixType = TEXTOID;
102 cfg->labelType = INT2OID;
103 cfg->canReturnData = true;
104 cfg->longValuesOK = true; /* suffixing will shorten long values */
106}
bool longValuesOK
Definition: spgist.h:47
bool canReturnData
Definition: spgist.h:46
Oid labelType
Definition: spgist.h:44
Oid prefixType
Definition: spgist.h:43

References spgConfigOut::canReturnData, spgConfigOut::labelType, spgConfigOut::longValuesOK, PG_GETARG_POINTER, PG_RETURN_VOID, and spgConfigOut::prefixType.

◆ spg_text_inner_consistent()

Datum spg_text_inner_consistent ( PG_FUNCTION_ARGS  )

Definition at line 426 of file spgtextproc.c.

427{
431 text *reconstructedValue;
432 text *reconstrText;
433 int maxReconstrLen;
434 text *prefixText = NULL;
435 int prefixSize = 0;
436 int i;
437
438 /*
439 * Reconstruct values represented at this tuple, including parent data,
440 * prefix of this tuple if any, and the node label if it's non-dummy.
441 * in->level should be the length of the previously reconstructed value,
442 * and the number of bytes added here is prefixSize or prefixSize + 1.
443 *
444 * Note: we assume that in->reconstructedValue isn't toasted and doesn't
445 * have a short varlena header. This is okay because it must have been
446 * created by a previous invocation of this routine, and we always emit
447 * long-format reconstructed values.
448 */
449 reconstructedValue = (text *) DatumGetPointer(in->reconstructedValue);
450 Assert(reconstructedValue == NULL ? in->level == 0 :
451 VARSIZE_ANY_EXHDR(reconstructedValue) == in->level);
452
453 maxReconstrLen = in->level + 1;
454 if (in->hasPrefix)
455 {
456 prefixText = DatumGetTextPP(in->prefixDatum);
457 prefixSize = VARSIZE_ANY_EXHDR(prefixText);
458 maxReconstrLen += prefixSize;
459 }
460
461 reconstrText = palloc(VARHDRSZ + maxReconstrLen);
462 SET_VARSIZE(reconstrText, VARHDRSZ + maxReconstrLen);
463
464 if (in->level)
465 memcpy(VARDATA(reconstrText),
466 VARDATA(reconstructedValue),
467 in->level);
468 if (prefixSize)
469 memcpy(((char *) VARDATA(reconstrText)) + in->level,
470 VARDATA_ANY(prefixText),
471 prefixSize);
472 /* last byte of reconstrText will be filled in below */
473
474 /*
475 * Scan the child nodes. For each one, complete the reconstructed value
476 * and see if it's consistent with the query. If so, emit an entry into
477 * the output arrays.
478 */
479 out->nodeNumbers = (int *) palloc(sizeof(int) * in->nNodes);
480 out->levelAdds = (int *) palloc(sizeof(int) * in->nNodes);
481 out->reconstructedValues = (Datum *) palloc(sizeof(Datum) * in->nNodes);
482 out->nNodes = 0;
483
484 for (i = 0; i < in->nNodes; i++)
485 {
486 int16 nodeChar = DatumGetInt16(in->nodeLabels[i]);
487 int thisLen;
488 bool res = true;
489 int j;
490
491 /* If nodeChar is a dummy value, don't include it in data */
492 if (nodeChar <= 0)
493 thisLen = maxReconstrLen - 1;
494 else
495 {
496 ((unsigned char *) VARDATA(reconstrText))[maxReconstrLen - 1] = nodeChar;
497 thisLen = maxReconstrLen;
498 }
499
500 for (j = 0; j < in->nkeys; j++)
501 {
502 StrategyNumber strategy = in->scankeys[j].sk_strategy;
503 text *inText;
504 int inSize;
505 int r;
506
507 /*
508 * If it's a collation-aware operator, but the collation is C, we
509 * can treat it as non-collation-aware. With non-C collation we
510 * need to traverse whole tree :-( so there's no point in making
511 * any check here. (Note also that our reconstructed value may
512 * well end with a partial multibyte character, so that applying
513 * any encoding-sensitive test to it would be risky anyhow.)
514 */
516 {
517 if (collate_is_c)
518 strategy -= SPG_STRATEGY_ADDITION;
519 else
520 continue;
521 }
522
523 inText = DatumGetTextPP(in->scankeys[j].sk_argument);
524 inSize = VARSIZE_ANY_EXHDR(inText);
525
526 r = memcmp(VARDATA(reconstrText), VARDATA_ANY(inText),
527 Min(inSize, thisLen));
528
529 switch (strategy)
530 {
533 if (r > 0)
534 res = false;
535 break;
537 if (r != 0 || inSize < thisLen)
538 res = false;
539 break;
542 if (r < 0)
543 res = false;
544 break;
546 if (r != 0)
547 res = false;
548 break;
549 default:
550 elog(ERROR, "unrecognized strategy number: %d",
551 in->scankeys[j].sk_strategy);
552 break;
553 }
554
555 if (!res)
556 break; /* no need to consider remaining conditions */
557 }
558
559 if (res)
560 {
561 out->nodeNumbers[out->nNodes] = i;
562 out->levelAdds[out->nNodes] = thisLen - in->level;
563 SET_VARSIZE(reconstrText, VARHDRSZ + thisLen);
564 out->reconstructedValues[out->nNodes] =
565 datumCopy(PointerGetDatum(reconstrText), false, -1);
566 out->nNodes++;
567 }
568 }
569
571}
#define Min(x, y)
Definition: c.h:975
Datum datumCopy(Datum value, bool typByVal, int typLen)
Definition: datum.c:132
#define ERROR
Definition: elog.h:39
#define elog(elevel,...)
Definition: elog.h:225
#define PG_GET_COLLATION()
Definition: fmgr.h:198
Assert(PointerIsAligned(start, uint64))
int j
Definition: isn.c:73
pg_locale_t pg_newlocale_from_collation(Oid collid)
Definition: pg_locale.c:1332
static Pointer DatumGetPointer(Datum X)
Definition: postgres.h:317
#define SPG_IS_COLLATION_AWARE_STRATEGY(s)
Definition: spgtextproc.c:83
uint16 StrategyNumber
Definition: stratnum.h:22
#define BTGreaterStrategyNumber
Definition: stratnum.h:33
#define BTLessStrategyNumber
Definition: stratnum.h:29
#define BTEqualStrategyNumber
Definition: stratnum.h:31
#define BTLessEqualStrategyNumber
Definition: stratnum.h:30
#define BTGreaterEqualStrategyNumber
Definition: stratnum.h:32
Datum sk_argument
Definition: skey.h:72
StrategyNumber sk_strategy
Definition: skey.h:68
Datum reconstructedValue
Definition: spgist.h:140
ScanKey scankeys
Definition: spgist.h:134
Datum * nodeLabels
Definition: spgist.h:151
Datum * reconstructedValues
Definition: spgist.h:159
#define VARDATA(PTR)
Definition: varatt.h:278

References Assert(), BTEqualStrategyNumber, BTGreaterEqualStrategyNumber, BTGreaterStrategyNumber, BTLessEqualStrategyNumber, BTLessStrategyNumber, pg_locale_struct::collate_is_c, datumCopy(), DatumGetInt16(), DatumGetPointer(), DatumGetTextPP, elog, ERROR, spgInnerConsistentIn::hasPrefix, i, j, spgInnerConsistentIn::level, spgInnerConsistentOut::levelAdds, Min, spgInnerConsistentIn::nkeys, spgInnerConsistentIn::nNodes, spgInnerConsistentOut::nNodes, spgInnerConsistentIn::nodeLabels, spgInnerConsistentOut::nodeNumbers, palloc(), PG_GET_COLLATION, PG_GETARG_POINTER, pg_newlocale_from_collation(), PG_RETURN_VOID, PointerGetDatum(), spgInnerConsistentIn::prefixDatum, spgInnerConsistentIn::reconstructedValue, spgInnerConsistentOut::reconstructedValues, RTPrefixStrategyNumber, spgInnerConsistentIn::scankeys, SET_VARSIZE, ScanKeyData::sk_argument, ScanKeyData::sk_strategy, SPG_IS_COLLATION_AWARE_STRATEGY, SPG_STRATEGY_ADDITION, VARDATA, VARDATA_ANY, VARHDRSZ, and VARSIZE_ANY_EXHDR.

◆ spg_text_leaf_consistent()

Datum spg_text_leaf_consistent ( PG_FUNCTION_ARGS  )

Definition at line 574 of file spgtextproc.c.

575{
578 int level = in->level;
579 text *leafValue,
580 *reconstrValue = NULL;
581 char *fullValue;
582 int fullLen;
583 bool res;
584 int j;
585
586 /* all tests are exact */
587 out->recheck = false;
588
589 leafValue = DatumGetTextPP(in->leafDatum);
590
591 /* As above, in->reconstructedValue isn't toasted or short. */
593 reconstrValue = (text *) DatumGetPointer(in->reconstructedValue);
594
595 Assert(reconstrValue == NULL ? level == 0 :
596 VARSIZE_ANY_EXHDR(reconstrValue) == level);
597
598 /* Reconstruct the full string represented by this leaf tuple */
599 fullLen = level + VARSIZE_ANY_EXHDR(leafValue);
600 if (VARSIZE_ANY_EXHDR(leafValue) == 0 && level > 0)
601 {
602 fullValue = VARDATA(reconstrValue);
603 out->leafValue = PointerGetDatum(reconstrValue);
604 }
605 else
606 {
607 text *fullText = palloc(VARHDRSZ + fullLen);
608
609 SET_VARSIZE(fullText, VARHDRSZ + fullLen);
610 fullValue = VARDATA(fullText);
611 if (level)
612 memcpy(fullValue, VARDATA(reconstrValue), level);
613 if (VARSIZE_ANY_EXHDR(leafValue) > 0)
614 memcpy(fullValue + level, VARDATA_ANY(leafValue),
615 VARSIZE_ANY_EXHDR(leafValue));
616 out->leafValue = PointerGetDatum(fullText);
617 }
618
619 /* Perform the required comparison(s) */
620 res = true;
621 for (j = 0; j < in->nkeys; j++)
622 {
623 StrategyNumber strategy = in->scankeys[j].sk_strategy;
625 int queryLen = VARSIZE_ANY_EXHDR(query);
626 int r;
627
628 if (strategy == RTPrefixStrategyNumber)
629 {
630 /*
631 * if level >= length of query then reconstrValue must begin with
632 * query (prefix) string, so we don't need to check it again.
633 */
634 res = (level >= queryLen) ||
637 out->leafValue,
638 PointerGetDatum(query)));
639
640 if (!res) /* no need to consider remaining conditions */
641 break;
642
643 continue;
644 }
645
647 {
648 /* Collation-aware comparison */
649 strategy -= SPG_STRATEGY_ADDITION;
650
651 /* If asserts enabled, verify encoding of reconstructed string */
652 Assert(pg_verifymbstr(fullValue, fullLen, false));
653
654 r = varstr_cmp(fullValue, fullLen,
655 VARDATA_ANY(query), queryLen,
657 }
658 else
659 {
660 /* Non-collation-aware comparison */
661 r = memcmp(fullValue, VARDATA_ANY(query), Min(queryLen, fullLen));
662
663 if (r == 0)
664 {
665 if (queryLen > fullLen)
666 r = -1;
667 else if (queryLen < fullLen)
668 r = 1;
669 }
670 }
671
672 switch (strategy)
673 {
675 res = (r < 0);
676 break;
678 res = (r <= 0);
679 break;
681 res = (r == 0);
682 break;
684 res = (r >= 0);
685 break;
687 res = (r > 0);
688 break;
689 default:
690 elog(ERROR, "unrecognized strategy number: %d",
691 in->scankeys[j].sk_strategy);
692 res = false;
693 break;
694 }
695
696 if (!res)
697 break; /* no need to consider remaining conditions */
698 }
699
700 PG_RETURN_BOOL(res);
701}
Datum DirectFunctionCall2Coll(PGFunction func, Oid collation, Datum arg1, Datum arg2)
Definition: fmgr.c:812
#define PG_RETURN_BOOL(x)
Definition: fmgr.h:359
bool pg_verifymbstr(const char *mbstr, int len, bool noError)
Definition: mbutils.c:1556
static bool DatumGetBool(Datum X)
Definition: postgres.h:95
ScanKey scankeys
Definition: spgist.h:169
Datum reconstructedValue
Definition: spgist.h:175
int varstr_cmp(const char *arg1, int len1, const char *arg2, int len2, Oid collid)
Definition: varlena.c:1610
Datum text_starts_with(PG_FUNCTION_ARGS)
Definition: varlena.c:1847

References Assert(), BTEqualStrategyNumber, BTGreaterEqualStrategyNumber, BTGreaterStrategyNumber, BTLessEqualStrategyNumber, BTLessStrategyNumber, DatumGetBool(), DatumGetPointer(), DatumGetTextPP, DirectFunctionCall2Coll(), elog, ERROR, j, spgLeafConsistentIn::leafDatum, spgLeafConsistentOut::leafValue, spgLeafConsistentIn::level, Min, spgLeafConsistentIn::nkeys, palloc(), PG_GET_COLLATION, PG_GETARG_POINTER, PG_RETURN_BOOL, pg_verifymbstr(), PointerGetDatum(), spgLeafConsistentOut::recheck, spgLeafConsistentIn::reconstructedValue, RTPrefixStrategyNumber, spgLeafConsistentIn::scankeys, SET_VARSIZE, ScanKeyData::sk_argument, ScanKeyData::sk_strategy, SPG_IS_COLLATION_AWARE_STRATEGY, SPG_STRATEGY_ADDITION, text_starts_with(), VARDATA, VARDATA_ANY, VARHDRSZ, VARSIZE_ANY_EXHDR, and varstr_cmp().

◆ spg_text_picksplit()

Datum spg_text_picksplit ( PG_FUNCTION_ARGS  )

Definition at line 333 of file spgtextproc.c.

334{
337 text *text0 = DatumGetTextPP(in->datums[0]);
338 int i,
339 commonLen;
340 spgNodePtr *nodes;
341
342 /* Identify longest common prefix, if any */
343 commonLen = VARSIZE_ANY_EXHDR(text0);
344 for (i = 1; i < in->nTuples && commonLen > 0; i++)
345 {
346 text *texti = DatumGetTextPP(in->datums[i]);
347 int tmp = commonPrefix(VARDATA_ANY(text0),
348 VARDATA_ANY(texti),
349 VARSIZE_ANY_EXHDR(text0),
350 VARSIZE_ANY_EXHDR(texti));
351
352 if (tmp < commonLen)
353 commonLen = tmp;
354 }
355
356 /*
357 * Limit the prefix length, if necessary, to ensure that the resulting
358 * inner tuple will fit on a page.
359 */
360 commonLen = Min(commonLen, SPGIST_MAX_PREFIX_LENGTH);
361
362 /* Set node prefix to be that string, if it's not empty */
363 if (commonLen == 0)
364 {
365 out->hasPrefix = false;
366 }
367 else
368 {
369 out->hasPrefix = true;
370 out->prefixDatum = formTextDatum(VARDATA_ANY(text0), commonLen);
371 }
372
373 /* Extract the node label (first non-common byte) from each value */
374 nodes = (spgNodePtr *) palloc(sizeof(spgNodePtr) * in->nTuples);
375
376 for (i = 0; i < in->nTuples; i++)
377 {
378 text *texti = DatumGetTextPP(in->datums[i]);
379
380 if (commonLen < VARSIZE_ANY_EXHDR(texti))
381 nodes[i].c = *(unsigned char *) (VARDATA_ANY(texti) + commonLen);
382 else
383 nodes[i].c = -1; /* use -1 if string is all common */
384 nodes[i].i = i;
385 nodes[i].d = in->datums[i];
386 }
387
388 /*
389 * Sort by label values so that we can group the values into nodes. This
390 * also ensures that the nodes are ordered by label value, allowing the
391 * use of binary search in searchChar.
392 */
393 qsort(nodes, in->nTuples, sizeof(*nodes), cmpNodePtr);
394
395 /* And emit results */
396 out->nNodes = 0;
397 out->nodeLabels = (Datum *) palloc(sizeof(Datum) * in->nTuples);
398 out->mapTuplesToNodes = (int *) palloc(sizeof(int) * in->nTuples);
399 out->leafTupleDatums = (Datum *) palloc(sizeof(Datum) * in->nTuples);
400
401 for (i = 0; i < in->nTuples; i++)
402 {
403 text *texti = DatumGetTextPP(nodes[i].d);
404 Datum leafD;
405
406 if (i == 0 || nodes[i].c != nodes[i - 1].c)
407 {
408 out->nodeLabels[out->nNodes] = Int16GetDatum(nodes[i].c);
409 out->nNodes++;
410 }
411
412 if (commonLen < VARSIZE_ANY_EXHDR(texti))
413 leafD = formTextDatum(VARDATA_ANY(texti) + commonLen + 1,
414 VARSIZE_ANY_EXHDR(texti) - commonLen - 1);
415 else
416 leafD = formTextDatum(NULL, 0);
417
418 out->leafTupleDatums[nodes[i].i] = leafD;
419 out->mapTuplesToNodes[nodes[i].i] = out->nNodes - 1;
420 }
421
423}
#define qsort(a, b, c, d)
Definition: port.h:475
static int cmpNodePtr(const void *a, const void *b)
Definition: spgtextproc.c:324
#define SPGIST_MAX_PREFIX_LENGTH
Definition: spgtextproc.c:70
Datum * datums
Definition: spgist.h:113
bool hasPrefix
Definition: spgist.h:119
int * mapTuplesToNodes
Definition: spgist.h:125
Datum * nodeLabels
Definition: spgist.h:123
Datum * leafTupleDatums
Definition: spgist.h:126
Datum prefixDatum
Definition: spgist.h:120

References spgNodePtr::c, cmpNodePtr(), commonPrefix(), spgNodePtr::d, DatumGetTextPP, spgPickSplitIn::datums, formTextDatum(), spgPickSplitOut::hasPrefix, i, spgNodePtr::i, Int16GetDatum(), spgPickSplitOut::leafTupleDatums, spgPickSplitOut::mapTuplesToNodes, Min, spgPickSplitOut::nNodes, spgPickSplitOut::nodeLabels, spgPickSplitIn::nTuples, palloc(), PG_GETARG_POINTER, PG_RETURN_VOID, spgPickSplitOut::prefixDatum, qsort, SPGIST_MAX_PREFIX_LENGTH, VARDATA_ANY, and VARSIZE_ANY_EXHDR.