PostgreSQL Source Code  git master
tsquery_gist.c
Go to the documentation of this file.
/*-------------------------------------------------------------------------
 *
 * tsquery_gist.c
 *	  GiST index support for tsquery
 *
 * Portions Copyright (c) 1996-2024, PostgreSQL Global Development Group
 *
 *
 * IDENTIFICATION
 *	  src/backend/utils/adt/tsquery_gist.c
 *
 *-------------------------------------------------------------------------
 */
14 
15 #include "postgres.h"
16 
17 #include "access/gist.h"
18 #include "access/stratnum.h"
19 #include "common/int.h"
20 #include "tsearch/ts_utils.h"
21 #include "utils/fmgrprotos.h"
22 
/* Fetch the TSQuerySign stored as the key of element "pos" of entry vector "vec". */
#define GETENTRY(vec,pos) DatumGetTSQuerySign((vec)->vector[pos].key)
24 
25 
26 Datum
28 {
29  GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
30  GISTENTRY *retval = entry;
31 
32  if (entry->leafkey)
33  {
35 
36  retval = (GISTENTRY *) palloc(sizeof(GISTENTRY));
38 
40  entry->rel, entry->page,
41  entry->offset, false);
42  }
43 
44  PG_RETURN_POINTER(retval);
45 }
46 
/*
 * We do not need a decompress function, because the other gtsquery
 * support functions work with the compressed representation.
 */
51 
52 Datum
54 {
55  GISTENTRY *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
56  TSQuery query = PG_GETARG_TSQUERY(1);
58 
59  /* Oid subtype = PG_GETARG_OID(3); */
60  bool *recheck = (bool *) PG_GETARG_POINTER(4);
62  TSQuerySign sq = makeTSQuerySign(query);
63  bool retval;
64 
65  /* All cases served by this function are inexact */
66  *recheck = true;
67 
68  switch (strategy)
69  {
71  if (GIST_LEAF(entry))
72  retval = (key & sq) == sq;
73  else
74  retval = (key & sq) != 0;
75  break;
77  if (GIST_LEAF(entry))
78  retval = (key & sq) == key;
79  else
80  retval = (key & sq) != 0;
81  break;
82  default:
83  retval = false;
84  }
85  PG_RETURN_BOOL(retval);
86 }
87 
88 Datum
90 {
92  int *size = (int *) PG_GETARG_POINTER(1);
94  int i;
95 
96  sign = 0;
97 
98  for (i = 0; i < entryvec->n; i++)
99  sign |= GETENTRY(entryvec, i);
100 
101  *size = sizeof(TSQuerySign);
102 
104 }
105 
106 Datum
108 {
111  bool *result = (bool *) PG_GETARG_POINTER(2);
112 
113  *result = (a == b);
114 
115  PG_RETURN_POINTER(result);
116 }
117 
118 static int
120 {
121  int size = 0,
122  i;
123 
124  for (i = 0; i < TSQS_SIGLEN; i++)
125  size += 0x01 & (sign >> i);
126 
127  return size;
128 }
129 
130 static int
132 {
133  TSQuerySign res = a ^ b;
134 
135  return sizebitvec(res);
136 }
137 
138 Datum
140 {
143  float *penalty = (float *) PG_GETARG_POINTER(2);
144 
145  *penalty = hemdist(origval, newval);
146 
147  PG_RETURN_POINTER(penalty);
148 }
149 
150 
151 typedef struct
152 {
153  OffsetNumber pos;
154  int32 cost;
155 } SPLITCOST;
156 
157 static int
158 comparecost(const void *a, const void *b)
159 {
160  return pg_cmp_s32(((const SPLITCOST *) a)->cost,
161  ((const SPLITCOST *) b)->cost);
162 }
163 
/*
 * WISH_F(a, b, c) = -((a - b)^3) * c, as a double.
 *
 * gtsquery_picksplit adds this to the right-hand distance with a = number of
 * entries already on the left and b = number already on the right, so the
 * fuller side becomes less attractive.  The difference is cubed in double
 * arithmetic so that a large difference cannot overflow int.  Note that
 * "a" and "b" are each evaluated three times.
 */
#define WISH_F(a,b,c) \
	((double) (-(((double) (a) - (double) (b)) * \
				 ((double) (a) - (double) (b)) * \
				 ((double) (a) - (double) (b))) * (c)))
165 
166 Datum
168 {
171  OffsetNumber maxoff = entryvec->n - 2;
172  OffsetNumber k,
173  j;
174  TSQuerySign datum_l,
175  datum_r;
176  int32 size_alpha,
177  size_beta;
178  int32 size_waste,
179  waste = -1;
180  int32 nbytes;
181  OffsetNumber seed_1 = 0,
182  seed_2 = 0;
183  OffsetNumber *left,
184  *right;
185 
186  SPLITCOST *costvector;
187 
188  nbytes = (maxoff + 2) * sizeof(OffsetNumber);
189  left = v->spl_left = (OffsetNumber *) palloc(nbytes);
190  right = v->spl_right = (OffsetNumber *) palloc(nbytes);
191  v->spl_nleft = v->spl_nright = 0;
192 
193  for (k = FirstOffsetNumber; k < maxoff; k = OffsetNumberNext(k))
194  for (j = OffsetNumberNext(k); j <= maxoff; j = OffsetNumberNext(j))
195  {
196  size_waste = hemdist(GETENTRY(entryvec, j), GETENTRY(entryvec, k));
197  if (size_waste > waste)
198  {
199  waste = size_waste;
200  seed_1 = k;
201  seed_2 = j;
202  }
203  }
204 
205 
206  if (seed_1 == 0 || seed_2 == 0)
207  {
208  seed_1 = 1;
209  seed_2 = 2;
210  }
211 
212  datum_l = GETENTRY(entryvec, seed_1);
213  datum_r = GETENTRY(entryvec, seed_2);
214 
215  maxoff = OffsetNumberNext(maxoff);
216  costvector = (SPLITCOST *) palloc(sizeof(SPLITCOST) * maxoff);
217  for (j = FirstOffsetNumber; j <= maxoff; j = OffsetNumberNext(j))
218  {
219  costvector[j - 1].pos = j;
220  size_alpha = hemdist(GETENTRY(entryvec, seed_1), GETENTRY(entryvec, j));
221  size_beta = hemdist(GETENTRY(entryvec, seed_2), GETENTRY(entryvec, j));
222  costvector[j - 1].cost = abs(size_alpha - size_beta);
223  }
224  qsort(costvector, maxoff, sizeof(SPLITCOST), comparecost);
225 
226  for (k = 0; k < maxoff; k++)
227  {
228  j = costvector[k].pos;
229  if (j == seed_1)
230  {
231  *left++ = j;
232  v->spl_nleft++;
233  continue;
234  }
235  else if (j == seed_2)
236  {
237  *right++ = j;
238  v->spl_nright++;
239  continue;
240  }
241  size_alpha = hemdist(datum_l, GETENTRY(entryvec, j));
242  size_beta = hemdist(datum_r, GETENTRY(entryvec, j));
243 
244  if (size_alpha < size_beta + WISH_F(v->spl_nleft, v->spl_nright, 0.05))
245  {
246  datum_l |= GETENTRY(entryvec, j);
247  *left++ = j;
248  v->spl_nleft++;
249  }
250  else
251  {
252  datum_r |= GETENTRY(entryvec, j);
253  *right++ = j;
254  v->spl_nright++;
255  }
256  }
257 
258  *right = *left = FirstOffsetNumber;
259  v->spl_ldatum = TSQuerySignGetDatum(datum_l);
260  v->spl_rdatum = TSQuerySignGetDatum(datum_r);
261 
263 }
264 
265 /*
266  * Formerly, gtsquery_consistent was declared in pg_proc.h with arguments
267  * that did not match the documented conventions for GiST support functions.
268  * We fixed that, but we still need a pg_proc entry with the old signature
269  * to support reloading pre-9.6 contrib/tsearch2 opclass declarations.
270  * This compatibility function should go away eventually.
271  */
272 Datum
274 {
275  return gtsquery_consistent(fcinfo);
276 }
signed int int32
Definition: c.h:494
#define PG_GETARG_POINTER(n)
Definition: fmgr.h:276
#define PG_GETARG_UINT16(n)
Definition: fmgr.h:272
#define PG_RETURN_POINTER(x)
Definition: fmgr.h:361
#define PG_FUNCTION_ARGS
Definition: fmgr.h:193
#define PG_RETURN_BOOL(x)
Definition: fmgr.h:359
#define GIST_LEAF(entry)
Definition: gist.h:170
#define gistentryinit(e, k, r, pg, o, l)
Definition: gist.h:244
#define newval
char sign
Definition: informix.c:674
static int pg_cmp_s32(int32 a, int32 b)
Definition: int.h:483
int b
Definition: isn.c:70
int a
Definition: isn.c:69
int j
Definition: isn.c:74
int i
Definition: isn.c:73
void * palloc(Size size)
Definition: mcxt.c:1316
#define OffsetNumberNext(offsetNumber)
Definition: off.h:52
uint16 OffsetNumber
Definition: off.h:24
#define FirstOffsetNumber
Definition: off.h:27
#define qsort(a, b, c, d)
Definition: port.h:449
uintptr_t Datum
Definition: postgres.h:64
static pg_noinline void Size size
Definition: slab.c:607
uint16 StrategyNumber
Definition: stratnum.h:22
#define RTContainsStrategyNumber
Definition: stratnum.h:57
#define RTContainedByStrategyNumber
Definition: stratnum.h:58
OffsetNumber offset
Definition: gist.h:163
Datum key
Definition: gist.h:160
Page page
Definition: gist.h:162
Relation rel
Definition: gist.h:161
bool leafkey
Definition: gist.h:164
int spl_nleft
Definition: gist.h:143
OffsetNumber * spl_right
Definition: gist.h:147
Datum spl_ldatum
Definition: gist.h:144
Datum spl_rdatum
Definition: gist.h:149
int spl_nright
Definition: gist.h:148
OffsetNumber * spl_left
Definition: gist.h:142
int32 n
Definition: gist.h:235
int32 cost
Definition: hstore_gist.c:354
OffsetNumber pos
Definition: hstore_gist.c:353
static TSQuery DatumGetTSQuery(Datum X)
Definition: ts_type.h:249
#define PG_GETARG_TSQUERY(n)
Definition: ts_type.h:266
#define TSQS_SIGLEN
Definition: ts_utils.h:251
static Datum TSQuerySignGetDatum(TSQuerySign X)
Definition: ts_utils.h:254
uint64 TSQuerySign
Definition: ts_utils.h:249
static TSQuerySign DatumGetTSQuerySign(Datum X)
Definition: ts_utils.h:260
#define PG_GETARG_TSQUERYSIGN(n)
Definition: ts_utils.h:266
#define PG_RETURN_TSQUERYSIGN(X)
Definition: ts_utils.h:265
#define WISH_F(a, b, c)
Definition: tsquery_gist.c:164
#define GETENTRY(vec, pos)
Definition: tsquery_gist.c:23
Datum gtsquery_consistent(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:53
Datum gtsquery_consistent_oldsig(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:273
Datum gtsquery_union(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:89
Datum gtsquery_compress(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:27
static int sizebitvec(TSQuerySign sign)
Definition: tsquery_gist.c:119
Datum gtsquery_penalty(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:139
Datum gtsquery_same(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:107
static int hemdist(TSQuerySign a, TSQuerySign b)
Definition: tsquery_gist.c:131
Datum gtsquery_picksplit(PG_FUNCTION_ARGS)
Definition: tsquery_gist.c:167
static int comparecost(const void *a, const void *b)
Definition: tsquery_gist.c:158
TSQuerySign makeTSQuerySign(TSQuery a)
Definition: tsquery_op.c:250