PostgreSQL Source Code git master
tsquery_gist.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * tsquery_gist.c
4 * GiST index support for tsquery
5 *
6 * Portions Copyright (c) 1996-2025, PostgreSQL Global Development Group
7 *
8 *
9 * IDENTIFICATION
10 * src/backend/utils/adt/tsquery_gist.c
11 *
12 *-------------------------------------------------------------------------
13 */
14
15#include "postgres.h"
16
17#include "access/gist.h"
18#include "access/stratnum.h"
19#include "common/int.h"
20#include "tsearch/ts_utils.h"
21#include "utils/fmgrprotos.h"
22
23#define GETENTRY(vec,pos) DatumGetTSQuerySign((vec)->vector[pos].key)
24
25
/*
 * Body of the GiST "compress" support function (gtsquery_compress, per the
 * symbol index at the end of this listing).
 *
 * Visible behaviour: when the incoming entry is not a leaf key it is handed
 * back unchanged; when it is a leaf key a new GISTENTRY is palloc'd and
 * returned instead of the original.
 *
 * NOTE(review): this listing has lost several source lines -- the function
 * signature, the declaration of `entry`, a declaration inside the if-block,
 * and the beginning of the statement that ends with "entry->offset, false);".
 * The block is therefore not compilable as shown; restore the missing lines
 * from the upstream file before changing any code here.
 */
28{
/* Default: return the caller's entry untouched. */
30 GISTENTRY *retval = entry;
31
32 if (entry->leafkey)
33 {
35
/* Leaf keys get a freshly allocated entry to hold the compressed form. */
36 retval = (GISTENTRY *) palloc(sizeof(GISTENTRY));
38
/*
 * NOTE(review): the two lines below are the tail of a multi-line call whose
 * first line is missing (presumably gistentryinit(...) -- confirm).
 */
40 entry->rel, entry->page,
41 entry->offset, false);
42 }
43
44 PG_RETURN_POINTER(retval);
45}
46
/*
 * We do not need a decompress function, because the other gtsquery
 * support functions work with the compressed representation.
 */
51
/*
 * Body of the GiST "consistent" support function (gtsquery_consistent, per
 * the symbol index at the end of this listing).
 *
 * The query argument is reduced to a signature (sq) with makeTSQuerySign()
 * and compared bitwise against the index key's signature (key).  The result
 * is always flagged for recheck.
 *
 * NOTE(review): this listing has lost the function signature, the
 * declarations of `entry`, `strategy` and `key`, and both `case` labels of
 * the switch.  The block is not compilable as shown; restore those lines
 * from the upstream file before changing any code here.
 */
54{
56 TSQuery query = PG_GETARG_TSQUERY(1);
58
59 /* Oid subtype = PG_GETARG_OID(3); */
60 bool *recheck = (bool *) PG_GETARG_POINTER(4);
62 TSQuerySign sq = makeTSQuerySign(query);
63 bool retval;
64
65 /* All cases served by this function are inexact */
66 *recheck = true;
67
68 switch (strategy)
69 {
/*
 * NOTE(review): a case label is missing here (presumably
 * RTContainsStrategyNumber -- confirm).  On a leaf page every bit of the
 * query signature must be present in the key; on an inner page any shared
 * bit is enough to descend.
 */
71 if (GIST_LEAF(entry))
72 retval = (key & sq) == sq;
73 else
74 retval = (key & sq) != 0;
75 break;
/*
 * NOTE(review): a case label is missing here (presumably
 * RTContainedByStrategyNumber -- confirm).  On a leaf page every bit of the
 * key must be present in the query signature; on an inner page any shared
 * bit is enough to descend.
 */
77 if (GIST_LEAF(entry))
78 retval = (key & sq) == key;
79 else
80 retval = (key & sq) != 0;
81 break;
/* Any other strategy number never matches. */
82 default:
83 retval = false;
84 }
85 PG_RETURN_BOOL(retval);
86}
87
/*
 * Body of the GiST "union" support function (gtsquery_union, per the symbol
 * index at the end of this listing).
 *
 * Visible behaviour: OR together the signatures of all entries in entryvec
 * and report sizeof(TSQuerySign) through the `size` output argument.
 *
 * NOTE(review): this listing has lost the function signature, the
 * declarations of `entryvec` and `sign`, and the final return statement
 * (presumably PG_RETURN_TSQUERYSIGN(sign) -- confirm).  The block is not
 * compilable as shown; restore those lines from the upstream file first.
 */
90{
92 int *size = (int *) PG_GETARG_POINTER(1);
94 int i;
95
/* Start from the empty signature and accumulate every entry's bits. */
96 sign = 0;
97
98 for (i = 0; i < entryvec->n; i++)
99 sign |= GETENTRY(entryvec, i);
100
/* The union key has a fixed size. */
101 *size = sizeof(TSQuerySign);
102
104}
105
/*
 * GiST "same" support function (gtsquery_same, per the symbol index at the
 * end of this listing).
 *
 * Visible behaviour: store (a == b) into the bool pointed to by argument 2
 * and return that pointer.
 *
 * NOTE(review): this listing has lost the line carrying the function name
 * and the declarations of `a` and `b` (presumably the two signatures being
 * compared, taken from arguments 0 and 1 -- confirm).  The block is not
 * compilable as shown; restore those lines from the upstream file first.
 */
106Datum
108{
111 bool *result = (bool *) PG_GETARG_POINTER(2);
112
/* Two signatures are the same only when every bit matches. */
113 *result = (a == b);
114
115 PG_RETURN_POINTER(result);
116}
117
118static int
120{
121 int size = 0,
122 i;
123
124 for (i = 0; i < TSQS_SIGLEN; i++)
125 size += 0x01 & (sign >> i);
126
127 return size;
128}
129
130static int
132{
133 TSQuerySign res = a ^ b;
134
135 return sizebitvec(res);
136}
137
/*
 * GiST "penalty" support function (gtsquery_penalty, per the symbol index at
 * the end of this listing).
 *
 * Visible behaviour: store hemdist(origval, newval) into the float pointed
 * to by argument 2 and return that pointer.
 *
 * NOTE(review): this listing has lost the line carrying the function name
 * and the declarations of `origval` and `newval` (presumably the signatures
 * of the existing entry and of the entry being inserted -- confirm).  The
 * block is not compilable as shown; restore those lines from the upstream
 * file first.
 */
138Datum
140{
143 float *penalty = (float *) PG_GETARG_POINTER(2);
144
/* The int distance is converted to float by the assignment. */
145 *penalty = hemdist(origval, newval);
146
147 PG_RETURN_POINTER(penalty);
148}
149
150
151typedef struct
152{
153 OffsetNumber pos;
154 int32 cost;
155} SPLITCOST;
156
157static int
158comparecost(const void *a, const void *b)
159{
160 return pg_cmp_s32(((const SPLITCOST *) a)->cost,
161 ((const SPLITCOST *) b)->cost);
162}
163
/*
 * WISH_F(a, b, c) evaluates, as a double, to  -((a - b)^3) * c.
 *
 * The result is negative when a > b, positive when a < b and zero when they
 * are equal.  The cube is computed in the type of (a - b) before the
 * conversion to double.
 *
 * Each of `a` and `b` is expanded three times, so pass only expressions
 * without side effects.
 */
#define WISH_F(a,b,c) (double)( -(double)(((a)-(b))*((a)-(b))*((a)-(b)))*(c) )
165
/*
 * GiST "picksplit" support function (gtsquery_picksplit, per the symbol
 * index at the end of this listing).
 *
 * Visible algorithm:
 *	1. pick as seeds the pair of entries with the largest hemdist();
 *	2. give every entry a cost = |dist to seed_1 - dist to seed_2| and sort
 *	   the entries with comparecost();
 *	3. walk the sorted entries, assigning each to the left or right side and
 *	   OR-ing its signature into that side's union;
 *	4. publish both unions through v->spl_ldatum / v->spl_rdatum.
 *
 * NOTE(review): this listing has lost the line carrying the function name,
 * the declarations of `entryvec` and `v`, and the final statement before the
 * closing brace (presumably the return of `v` -- confirm).  The block is not
 * compilable as shown; restore those lines from the upstream file before
 * changing any code here.
 */
166Datum
168{
171 OffsetNumber maxoff = entryvec->n - 2;
172 OffsetNumber k,
173 j;
174 TSQuerySign datum_l,
175 datum_r;
176 int32 size_alpha,
177 size_beta;
178 int32 size_waste,
179 waste = -1;
180 int32 nbytes;
181 OffsetNumber seed_1 = 0,
182 seed_2 = 0;
183 OffsetNumber *left,
184 *right;
185
186 SPLITCOST *costvector;
187
/* Allocate both output offset arrays and start with empty sides. */
188 nbytes = (maxoff + 2) * sizeof(OffsetNumber);
189 left = v->spl_left = (OffsetNumber *) palloc(nbytes);
190 right = v->spl_right = (OffsetNumber *) palloc(nbytes);
191 v->spl_nleft = v->spl_nright = 0;
192
/*
 * Seed selection: examine every pair (k, j) with k < j <= maxoff and keep
 * the pair with the largest distance.  waste starts at -1, so the first
 * pair examined is always accepted.
 */
193 for (k = FirstOffsetNumber; k < maxoff; k = OffsetNumberNext(k))
194 for (j = OffsetNumberNext(k); j <= maxoff; j = OffsetNumberNext(j))
195 {
196 size_waste = hemdist(GETENTRY(entryvec, j), GETENTRY(entryvec, k));
197 if (size_waste > waste)
198 {
199 waste = size_waste;
200 seed_1 = k;
201 seed_2 = j;
202 }
203 }
204
205
/* No pair was examined above: fall back to the first two offsets. */
206 if (seed_1 == 0 || seed_2 == 0)
207 {
208 seed_1 = 1;
209 seed_2 = 2;
210 }
211
/* Each side's union starts out as its seed's signature. */
212 datum_l = GETENTRY(entryvec, seed_1);
213 datum_r = GETENTRY(entryvec, seed_2);
214
/*
 * From here on maxoff is one larger than during seed selection, so the
 * loops below also cover the entry at that extra offset.
 */
215 maxoff = OffsetNumberNext(maxoff);
216 costvector = (SPLITCOST *) palloc(sizeof(SPLITCOST) * maxoff);
217 for (j = FirstOffsetNumber; j <= maxoff; j = OffsetNumberNext(j))
218 {
/* cost = how differently far the entry is from the two seeds */
219 costvector[j - 1].pos = j;
220 size_alpha = hemdist(GETENTRY(entryvec, seed_1), GETENTRY(entryvec, j));
221 size_beta = hemdist(GETENTRY(entryvec, seed_2), GETENTRY(entryvec, j));
222 costvector[j - 1].cost = abs(size_alpha - size_beta);
223 }
224 qsort(costvector, maxoff, sizeof(SPLITCOST), comparecost);
225
/* Distribute the entries in sorted-cost order. */
226 for (k = 0; k < maxoff; k++)
227 {
228 j = costvector[k].pos;
/* The seeds go to their own side; their bits are already in the unions. */
229 if (j == seed_1)
230 {
231 *left++ = j;
232 v->spl_nleft++;
233 continue;
234 }
235 else if (j == seed_2)
236 {
237 *right++ = j;
238 v->spl_nright++;
239 continue;
240 }
/* Distance from the entry to each side's current union. */
241 size_alpha = hemdist(datum_l, GETENTRY(entryvec, j));
242 size_beta = hemdist(datum_r, GETENTRY(entryvec, j));
243
/*
 * WISH_F is negative when the left side already holds more entries than the
 * right and positive in the opposite case, so it shifts the threshold
 * against whichever side is currently larger.
 */
244 if (size_alpha < size_beta + WISH_F(v->spl_nleft, v->spl_nright, 0.05))
245 {
246 datum_l |= GETENTRY(entryvec, j);
247 *left++ = j;
248 v->spl_nleft++;
249 }
250 else
251 {
252 datum_r |= GETENTRY(entryvec, j);
253 *right++ = j;
254 v->spl_nright++;
255 }
256 }
257
/* Write FirstOffsetNumber into the slot just past the last entry of each side. */
258 *right = *left = FirstOffsetNumber;
/* Publish the two union signatures as the keys of the new pages. */
259 v->spl_ldatum = TSQuerySignGetDatum(datum_l);
260 v->spl_rdatum = TSQuerySignGetDatum(datum_r);
261
263}
264
/*
 * Formerly, gtsquery_consistent was declared in pg_proc.h with arguments
 * that did not match the documented conventions for GiST support functions.
 * We fixed that, but we still need a pg_proc entry with the old signature
 * to support reloading pre-9.6 contrib/tsearch2 opclass declarations.
 * This compatibility function should go away eventually.
 */
272Datum
274{
275 return gtsquery_consistent(fcinfo);
276}
int32_t int32
Definition: c.h:481
#define PG_GETARG_POINTER(n)
Definition: fmgr.h:276
#define PG_GETARG_UINT16(n)
Definition: fmgr.h:272
#define PG_RETURN_POINTER(x)
Definition: fmgr.h:361
#define PG_FUNCTION_ARGS
Definition: fmgr.h:193
#define PG_RETURN_BOOL(x)
Definition: fmgr.h:359
#define GIST_LEAF(entry)
Definition: gist.h:170
#define gistentryinit(e, k, r, pg, o, l)
Definition: gist.h:244
#define newval
char sign
Definition: informix.c:693
static int pg_cmp_s32(int32 a, int32 b)
Definition: int.h:646
int b
Definition: isn.c:69
int a
Definition: isn.c:68
int j
Definition: isn.c:73
int i
Definition: isn.c:72
void * palloc(Size size)
Definition: mcxt.c:1317
#define OffsetNumberNext(offsetNumber)
Definition: off.h:52
uint16 OffsetNumber
Definition: off.h:24
#define FirstOffsetNumber
Definition: off.h:27
#define qsort(a, b, c, d)
Definition: port.h:474
uintptr_t Datum
Definition: postgres.h:64
static pg_noinline void Size size
Definition: slab.c:607
uint16 StrategyNumber
Definition: stratnum.h:22
#define RTContainsStrategyNumber
Definition: stratnum.h:57
#define RTContainedByStrategyNumber
Definition: stratnum.h:58
OffsetNumber offset
Definition: gist.h:163
Datum key
Definition: gist.h:160
Page page
Definition: gist.h:162
Relation rel
Definition: gist.h:161
bool leafkey
Definition: gist.h:164
int spl_nleft
Definition: gist.h:143
OffsetNumber * spl_right
Definition: gist.h:147
Datum spl_ldatum
Definition: gist.h:144
Datum spl_rdatum
Definition: gist.h:149
int spl_nright
Definition: gist.h:148
OffsetNumber * spl_left
Definition: gist.h:142
int32 n
Definition: gist.h:235
int32 cost
Definition: hstore_gist.c:354
OffsetNumber pos
Definition: hstore_gist.c:353
static TSQuery DatumGetTSQuery(Datum X)
Definition: ts_type.h:249
#define PG_GETARG_TSQUERY(n)
Definition: ts_type.h:266
#define TSQS_SIGLEN
Definition: ts_utils.h:251
static Datum TSQuerySignGetDatum(TSQuerySign X)
Definition: ts_utils.h:254
uint64 TSQuerySign
Definition: ts_utils.h:249
static TSQuerySign DatumGetTSQuerySign(Datum X)
Definition: ts_utils.h:260
#define PG_GETARG_TSQUERYSIGN(n)
Definition: ts_utils.h:266
#define PG_RETURN_TSQUERYSIGN(X)
Definition: ts_utils.h:265
#define WISH_F(a, b, c)
Definition: tsquery_gist.c:164
#define GETENTRY(vec, pos)
Definition: tsquery_gist.c:23
Datum gtsquery_consistent(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:53
Datum gtsquery_consistent_oldsig(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:273
Datum gtsquery_union(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:89
Datum gtsquery_compress(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:27
static int sizebitvec(TSQuerySign sign)
Definition: tsquery_gist.c:119
Datum gtsquery_penalty(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:139
Datum gtsquery_same(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:107
static int hemdist(TSQuerySign a, TSQuerySign b)
Definition: tsquery_gist.c:131
Datum gtsquery_picksplit(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:167
static int comparecost(const void *a, const void *b)
Definition: tsquery_gist.c:158
TSQuerySign makeTSQuerySign(TSQuery a)
Definition: tsquery_op.c:250