Age Owner TLA Line data Source code
1 : /*-------------------------------------------------------------------------
2 : *
3 : * gistscan.c
4 : * routines to manage scans on GiST index relations
5 : *
6 : *
7 : * Portions Copyright (c) 1996-2023, PostgreSQL Global Development Group
8 : * Portions Copyright (c) 1994, Regents of the University of California
9 : *
10 : * IDENTIFICATION
11 : * src/backend/access/gist/gistscan.c
12 : *
13 : *-------------------------------------------------------------------------
14 : */
15 : #include "postgres.h"
16 :
17 : #include "access/gist_private.h"
18 : #include "access/gistscan.h"
19 : #include "access/relscan.h"
20 : #include "utils/float.h"
21 : #include "utils/lsyscache.h"
22 : #include "utils/memutils.h"
23 : #include "utils/rel.h"
24 :
25 :
26 : /*
27 : * Pairing heap comparison function for the GISTSearchItem queue
28 : */
29 : static int
3030 heikki.linnakangas 30 CBC 175972 : pairingheap_GISTSearchItem_cmp(const pairingheap_node *a, const pairingheap_node *b, void *arg)
31 : {
32 175972 : const GISTSearchItem *sa = (const GISTSearchItem *) a;
33 175972 : const GISTSearchItem *sb = (const GISTSearchItem *) b;
4510 tgl 34 175972 : IndexScanDesc scan = (IndexScanDesc) arg;
35 : int i;
36 :
37 : /* Order according to distance comparison */
38 178055 : for (i = 0; i < scan->numberOfOrderBys; i++)
39 : {
1298 akorotkov 40 34325 : if (sa->distances[i].isnull)
41 : {
42 54 : if (!sb->distances[i].isnull)
1309 43 54 : return -1;
44 : }
1298 45 34271 : else if (sb->distances[i].isnull)
46 : {
1309 47 7 : return 1;
48 : }
49 : else
50 : {
1298 51 68528 : int cmp = -float8_cmp_internal(sa->distances[i].value,
52 34264 : sb->distances[i].value);
53 :
1309 54 34264 : if (cmp != 0)
55 32181 : return cmp;
56 : }
57 : }
58 :
59 : /* Heap items go before inner pages, to ensure a depth-first search */
3030 heikki.linnakangas 60 143730 : if (GISTSearchItemIsHeap(*sa) && !GISTSearchItemIsHeap(*sb))
3030 heikki.linnakangas 61 UBC 0 : return 1;
2973 heikki.linnakangas 62 CBC 143730 : if (!GISTSearchItemIsHeap(*sa) && GISTSearchItemIsHeap(*sb))
63 1 : return -1;
64 :
3030 65 143729 : return 0;
66 : }
67 :
68 :
69 : /*
70 : * Index AM API functions for scanning GiST indexes
71 : */
72 :
73 : IndexScanDesc
2639 tgl 74 1258 : gistbeginscan(Relation r, int nkeys, int norderbys)
75 : {
76 : IndexScanDesc scan;
77 : GISTSTATE *giststate;
78 : GISTScanOpaque so;
79 : MemoryContext oldCxt;
80 :
4511 81 1258 : scan = RelationGetIndexScan(r, nkeys, norderbys);
82 :
83 : /* First, set up a GISTSTATE with a scan-lifespan memory context */
4209 84 1258 : giststate = initGISTstate(scan->indexRelation);
85 :
86 : /*
87 : * Everything made below is in the scanCxt, or is a child of the scanCxt,
88 : * so it'll all go away automatically in gistendscan.
89 : */
90 1258 : oldCxt = MemoryContextSwitchTo(giststate->scanCxt);
91 :
92 : /* initialize opaque data */
4510 93 1258 : so = (GISTScanOpaque) palloc0(sizeof(GISTScanOpaqueData));
4209 94 1258 : so->giststate = giststate;
95 1258 : giststate->tempCxt = createTempGistContext();
96 1258 : so->queue = NULL;
3955 bruce 97 1258 : so->queueCxt = giststate->scanCxt; /* see gistrescan */
98 :
99 : /* workspaces with size dependent on numberOfOrderBys: */
1298 akorotkov 100 1258 : so->distances = palloc(sizeof(so->distances[0]) * scan->numberOfOrderBys);
4510 tgl 101 1258 : so->qual_ok = true; /* in case there are zero keys */
2886 heikki.linnakangas 102 1258 : if (scan->numberOfOrderBys > 0)
103 : {
2878 tgl 104 63 : scan->xs_orderbyvals = palloc0(sizeof(Datum) * scan->numberOfOrderBys);
2886 heikki.linnakangas 105 63 : scan->xs_orderbynulls = palloc(sizeof(bool) * scan->numberOfOrderBys);
2878 tgl 106 63 : memset(scan->xs_orderbynulls, true, sizeof(bool) * scan->numberOfOrderBys);
107 : }
108 :
2769 teodor 109 1258 : so->killedItems = NULL; /* until needed */
110 1258 : so->numKilled = 0;
111 1258 : so->curBlkno = InvalidBlockNumber;
112 1258 : so->curPageLSN = InvalidXLogRecPtr;
113 :
4511 tgl 114 1258 : scan->opaque = so;
115 :
116 : /*
117 : * All fields required for index-only scans are initialized in gistrescan,
118 : * as we don't know yet if we're doing an index-only scan or not.
119 : */
120 :
4209 121 1258 : MemoryContextSwitchTo(oldCxt);
122 :
2639 123 1258 : return scan;
124 : }
125 :
126 : void
127 1303 : gistrescan(IndexScanDesc scan, ScanKey key, int nkeys,
128 : ScanKey orderbys, int norderbys)
129 : {
130 : /* nkeys and norderbys arguments are ignored */
4511 131 1303 : GISTScanOpaque so = (GISTScanOpaque) scan->opaque;
132 : bool first_time;
133 : int i;
134 : MemoryContext oldCxt;
135 :
136 : /* rescan an existing indexscan --- reset state */
137 :
138 : /*
139 : * The first time through, we create the search queue in the scanCxt.
140 : * Subsequent times through, we create the queue in a separate queueCxt,
141 : * which is created on the second call and reset on later calls. Thus, in
142 : * the common case where a scan is only rescan'd once, we just put the
143 : * queue in scanCxt and don't pay the overhead of making a second memory
144 : * context. If we do rescan more than once, the first queue is just left
145 : * for dead until end of scan; this small wastage seems worth the savings
146 : * in the common case.
147 : */
4209 148 1303 : if (so->queue == NULL)
149 : {
150 : /* first time through */
151 1258 : Assert(so->queueCxt == so->giststate->scanCxt);
152 1258 : first_time = true;
153 : }
154 45 : else if (so->queueCxt == so->giststate->scanCxt)
155 : {
156 : /* second time through */
157 15 : so->queueCxt = AllocSetContextCreate(so->giststate->scanCxt,
158 : "GiST queue context",
159 : ALLOCSET_DEFAULT_SIZES);
160 15 : first_time = false;
161 : }
162 : else
163 : {
164 : /* third or later time through */
165 30 : MemoryContextReset(so->queueCxt);
166 30 : first_time = false;
167 : }
168 :
169 : /*
170 : * If we're doing an index-only scan, on the first call, also initialize a
171 : * tuple descriptor to represent the returned index tuples and create a
172 : * memory context to hold them during the scan.
173 : */
2232 174 1303 : if (scan->xs_want_itup && !scan->xs_hitupdesc)
175 : {
176 : int natts;
177 : int nkeyatts;
178 : int attno;
179 :
180 : /*
181 : * The storage type of the index can be different from the original
182 : * datatype being indexed, so we cannot just grab the index's tuple
183 : * descriptor. Instead, construct a descriptor with the original data
184 : * types.
185 : */
2878 bruce 186 334 : natts = RelationGetNumberOfAttributes(scan->indexRelation);
1491 akorotkov 187 334 : nkeyatts = IndexRelationGetNumberOfKeyAttributes(scan->indexRelation);
1601 andres 188 334 : so->giststate->fetchTupdesc = CreateTemplateTupleDesc(natts);
1491 akorotkov 189 681 : for (attno = 1; attno <= nkeyatts; attno++)
190 : {
2936 heikki.linnakangas 191 347 : TupleDescInitEntry(so->giststate->fetchTupdesc, attno, NULL,
192 347 : scan->indexRelation->rd_opcintype[attno - 1],
193 : -1, 0);
194 : }
195 :
1491 akorotkov 196 334 : for (; attno <= natts; attno++)
197 : {
198 : /* taking opcintype from giststate->tupdesc */
1491 akorotkov 199 UBC 0 : TupleDescInitEntry(so->giststate->fetchTupdesc, attno, NULL,
200 0 : TupleDescAttr(so->giststate->leafTupdesc,
201 : attno - 1)->atttypid,
202 : -1, 0);
203 : }
2232 tgl 204 CBC 334 : scan->xs_hitupdesc = so->giststate->fetchTupdesc;
205 :
206 : /* Also create a memory context that will hold the returned tuples */
2936 heikki.linnakangas 207 334 : so->pageDataCxt = AllocSetContextCreate(so->giststate->scanCxt,
208 : "GiST page data context",
209 : ALLOCSET_DEFAULT_SIZES);
210 : }
211 :
212 : /* create new, empty pairing heap for search queue */
4510 tgl 213 1303 : oldCxt = MemoryContextSwitchTo(so->queueCxt);
3030 heikki.linnakangas 214 1303 : so->queue = pairingheap_allocate(pairingheap_GISTSearchItem_cmp, scan);
4510 tgl 215 1303 : MemoryContextSwitchTo(oldCxt);
216 :
217 1303 : so->firstCall = true;
218 :
219 : /* Update scan key, if a new one is given */
6536 neilc 220 1303 : if (key && scan->numberOfKeys > 0)
221 : {
3622 tgl 222 1228 : void **fn_extras = NULL;
223 :
224 : /*
225 : * If this isn't the first time through, preserve the fn_extra
226 : * pointers, so that if the consistentFns are using them to cache
227 : * data, that data is not leaked across a rescan.
228 : */
4209 229 1228 : if (!first_time)
230 : {
3622 231 15 : fn_extras = (void **) palloc(scan->numberOfKeys * sizeof(void *));
4209 232 30 : for (i = 0; i < scan->numberOfKeys; i++)
3622 233 15 : fn_extras[i] = scan->keyData[i].sk_func.fn_extra;
234 : }
235 :
6536 neilc 236 1228 : memmove(scan->keyData, key,
237 1228 : scan->numberOfKeys * sizeof(ScanKeyData));
238 :
239 : /*
240 : * Modify the scan key so that the Consistent method is called for all
241 : * comparisons. The original operator is passed to the Consistent
242 : * function in the form of its strategy number, which is available
243 : * from the sk_strategy field, and its subtype from the sk_subtype
244 : * field.
245 : *
246 : * Next, if any of keys is a NULL and that key is not marked with
247 : * SK_SEARCHNULL/SK_SEARCHNOTNULL then nothing can be found (ie, we
248 : * assume all indexable operators are strict).
249 : */
4510 tgl 250 1228 : so->qual_ok = true;
251 :
5050 bruce 252 2518 : for (i = 0; i < scan->numberOfKeys; i++)
253 : {
4510 tgl 254 1290 : ScanKey skey = scan->keyData + i;
255 :
256 : /*
257 : * Copy consistent support function to ScanKey structure instead
258 : * of function implementing filtering operator.
259 : */
3622 260 1290 : fmgr_info_copy(&(skey->sk_func),
261 1290 : &(so->giststate->consistentFn[skey->sk_attno - 1]),
262 1290 : so->giststate->scanCxt);
263 :
264 : /* Restore prior fn_extra pointers, if not first time */
265 1290 : if (!first_time)
266 15 : skey->sk_func.fn_extra = fn_extras[i];
267 :
4846 268 1290 : if (skey->sk_flags & SK_ISNULL)
269 : {
270 13 : if (!(skey->sk_flags & (SK_SEARCHNULL | SK_SEARCHNOTNULL)))
5287 teodor 271 UBC 0 : so->qual_ok = false;
272 : }
273 : }
274 :
3622 tgl 275 CBC 1228 : if (!first_time)
276 15 : pfree(fn_extras);
277 : }
278 :
279 : /* Update order-by key, if a new one is given */
4510 280 1303 : if (orderbys && scan->numberOfOrderBys > 0)
281 : {
3622 282 99 : void **fn_extras = NULL;
283 :
284 : /* As above, preserve fn_extra if not first time through */
4209 285 99 : if (!first_time)
286 : {
3622 287 36 : fn_extras = (void **) palloc(scan->numberOfOrderBys * sizeof(void *));
4209 288 72 : for (i = 0; i < scan->numberOfOrderBys; i++)
3622 289 36 : fn_extras[i] = scan->orderByData[i].sk_func.fn_extra;
290 : }
291 :
4510 292 99 : memmove(scan->orderByData, orderbys,
293 99 : scan->numberOfOrderBys * sizeof(ScanKeyData));
294 :
2886 heikki.linnakangas 295 99 : so->orderByTypes = (Oid *) palloc(scan->numberOfOrderBys * sizeof(Oid));
296 :
297 : /*
298 : * Modify the order-by key so that the Distance method is called for
299 : * all comparisons. The original operator is passed to the Distance
300 : * function in the form of its strategy number, which is available
301 : * from the sk_strategy field, and its subtype from the sk_subtype
302 : * field.
303 : */
4510 tgl 304 198 : for (i = 0; i < scan->numberOfOrderBys; i++)
305 : {
306 99 : ScanKey skey = scan->orderByData + i;
3622 307 99 : FmgrInfo *finfo = &(so->giststate->distanceFn[skey->sk_attno - 1]);
308 :
309 : /* Check we actually have a distance function ... */
310 99 : if (!OidIsValid(finfo->fn_oid))
4510 tgl 311 UBC 0 : elog(ERROR, "missing support function %d for attribute %d of index \"%s\"",
312 : GIST_DISTANCE_PROC, skey->sk_attno,
313 : RelationGetRelationName(scan->indexRelation));
314 :
315 : /*
316 : * Look up the datatype returned by the original ordering
317 : * operator. GiST always uses a float8 for the distance function,
318 : * but the ordering operator could be anything else.
319 : *
320 : * XXX: The distance function is only allowed to be lossy if the
321 : * ordering operator's result type is float4 or float8. Otherwise
322 : * we don't know how to return the distance to the executor. But
323 : * we cannot check that here, as we won't know if the distance
324 : * function is lossy until it returns *recheck = true for the
325 : * first time.
326 : */
2886 heikki.linnakangas 327 CBC 99 : so->orderByTypes[i] = get_func_rettype(skey->sk_func.fn_oid);
328 :
329 : /*
330 : * Copy distance support function to ScanKey structure instead of
331 : * function implementing ordering operator.
332 : */
2623 teodor 333 99 : fmgr_info_copy(&(skey->sk_func), finfo, so->giststate->scanCxt);
334 :
335 : /* Restore prior fn_extra pointers, if not first time */
3622 tgl 336 99 : if (!first_time)
337 36 : skey->sk_func.fn_extra = fn_extras[i];
338 : }
339 :
340 99 : if (!first_time)
341 36 : pfree(fn_extras);
342 : }
343 :
344 : /* any previous xs_hitup will have been pfree'd in context resets above */
2166 345 1303 : scan->xs_hitup = NULL;
9722 scrappy 346 1303 : }
347 :
348 : void
2639 tgl 349 1230 : gistendscan(IndexScanDesc scan)
350 : {
4511 351 1230 : GISTScanOpaque so = (GISTScanOpaque) scan->opaque;
352 :
353 : /*
354 : * freeGISTstate is enough to clean up everything made by gistbeginscan,
355 : * as well as the queueCxt if there is a separate context for it.
356 : */
4510 357 1230 : freeGISTstate(so->giststate);
9722 scrappy 358 1230 : }
|