1 | /*------------------------------------------------------------------------- |
2 | * |
3 | * gistscan.c |
4 | * routines to manage scans on GiST index relations |
5 | * |
6 | * |
7 | * Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group |
8 | * Portions Copyright (c) 1994, Regents of the University of California |
9 | * |
10 | * IDENTIFICATION |
11 | * src/backend/access/gist/gistscan.c |
12 | * |
13 | *------------------------------------------------------------------------- |
14 | */ |
15 | #include "postgres.h" |
16 | |
17 | #include "access/gist_private.h" |
18 | #include "access/gistscan.h" |
19 | #include "access/relscan.h" |
20 | #include "utils/float.h" |
21 | #include "utils/lsyscache.h" |
22 | #include "utils/memutils.h" |
23 | #include "utils/rel.h" |
24 | |
25 | |
26 | /* |
27 | * Pairing heap comparison function for the GISTSearchItem queue |
28 | */ |
29 | static int |
30 | pairingheap_GISTSearchItem_cmp(const pairingheap_node *a, const pairingheap_node *b, void *arg) |
31 | { |
32 | const GISTSearchItem *sa = (const GISTSearchItem *) a; |
33 | const GISTSearchItem *sb = (const GISTSearchItem *) b; |
34 | IndexScanDesc scan = (IndexScanDesc) arg; |
35 | int i; |
36 | |
37 | /* Order according to distance comparison */ |
38 | for (i = 0; i < scan->numberOfOrderBys; i++) |
39 | { |
40 | if (sa->distances[i].isnull) |
41 | { |
42 | if (!sb->distances[i].isnull) |
43 | return -1; |
44 | } |
45 | else if (sb->distances[i].isnull) |
46 | { |
47 | return 1; |
48 | } |
49 | else |
50 | { |
51 | int cmp = -float8_cmp_internal(sa->distances[i].value, |
52 | sb->distances[i].value); |
53 | |
54 | if (cmp != 0) |
55 | return cmp; |
56 | } |
57 | } |
58 | |
59 | /* Heap items go before inner pages, to ensure a depth-first search */ |
60 | if (GISTSearchItemIsHeap(*sa) && !GISTSearchItemIsHeap(*sb)) |
61 | return 1; |
62 | if (!GISTSearchItemIsHeap(*sa) && GISTSearchItemIsHeap(*sb)) |
63 | return -1; |
64 | |
65 | return 0; |
66 | } |
67 | |
68 | |
69 | /* |
70 | * Index AM API functions for scanning GiST indexes |
71 | */ |
72 | |
73 | IndexScanDesc |
74 | gistbeginscan(Relation r, int nkeys, int norderbys) |
75 | { |
76 | IndexScanDesc scan; |
77 | GISTSTATE *giststate; |
78 | GISTScanOpaque so; |
79 | MemoryContext oldCxt; |
80 | |
81 | scan = RelationGetIndexScan(r, nkeys, norderbys); |
82 | |
83 | /* First, set up a GISTSTATE with a scan-lifespan memory context */ |
84 | giststate = initGISTstate(scan->indexRelation); |
85 | |
86 | /* |
87 | * Everything made below is in the scanCxt, or is a child of the scanCxt, |
88 | * so it'll all go away automatically in gistendscan. |
89 | */ |
90 | oldCxt = MemoryContextSwitchTo(giststate->scanCxt); |
91 | |
92 | /* initialize opaque data */ |
93 | so = (GISTScanOpaque) palloc0(sizeof(GISTScanOpaqueData)); |
94 | so->giststate = giststate; |
95 | giststate->tempCxt = createTempGistContext(); |
96 | so->queue = NULL; |
97 | so->queueCxt = giststate->scanCxt; /* see gistrescan */ |
98 | |
99 | /* workspaces with size dependent on numberOfOrderBys: */ |
100 | so->distances = palloc(sizeof(so->distances[0]) * scan->numberOfOrderBys); |
101 | so->qual_ok = true; /* in case there are zero keys */ |
102 | if (scan->numberOfOrderBys > 0) |
103 | { |
104 | scan->xs_orderbyvals = palloc0(sizeof(Datum) * scan->numberOfOrderBys); |
105 | scan->xs_orderbynulls = palloc(sizeof(bool) * scan->numberOfOrderBys); |
106 | memset(scan->xs_orderbynulls, true, sizeof(bool) * scan->numberOfOrderBys); |
107 | } |
108 | |
109 | so->killedItems = NULL; /* until needed */ |
110 | so->numKilled = 0; |
111 | so->curBlkno = InvalidBlockNumber; |
112 | so->curPageLSN = InvalidXLogRecPtr; |
113 | |
114 | scan->opaque = so; |
115 | |
116 | /* |
117 | * All fields required for index-only scans are initialized in gistrescan, |
118 | * as we don't know yet if we're doing an index-only scan or not. |
119 | */ |
120 | |
121 | MemoryContextSwitchTo(oldCxt); |
122 | |
123 | return scan; |
124 | } |
125 | |
126 | void |
127 | gistrescan(IndexScanDesc scan, ScanKey key, int nkeys, |
128 | ScanKey orderbys, int norderbys) |
129 | { |
130 | /* nkeys and norderbys arguments are ignored */ |
131 | GISTScanOpaque so = (GISTScanOpaque) scan->opaque; |
132 | bool first_time; |
133 | int i; |
134 | MemoryContext oldCxt; |
135 | |
136 | /* rescan an existing indexscan --- reset state */ |
137 | |
138 | /* |
139 | * The first time through, we create the search queue in the scanCxt. |
140 | * Subsequent times through, we create the queue in a separate queueCxt, |
141 | * which is created on the second call and reset on later calls. Thus, in |
142 | * the common case where a scan is only rescan'd once, we just put the |
143 | * queue in scanCxt and don't pay the overhead of making a second memory |
144 | * context. If we do rescan more than once, the first queue is just left |
145 | * for dead until end of scan; this small wastage seems worth the savings |
146 | * in the common case. |
147 | */ |
148 | if (so->queue == NULL) |
149 | { |
150 | /* first time through */ |
151 | Assert(so->queueCxt == so->giststate->scanCxt); |
152 | first_time = true; |
153 | } |
154 | else if (so->queueCxt == so->giststate->scanCxt) |
155 | { |
156 | /* second time through */ |
157 | so->queueCxt = AllocSetContextCreate(so->giststate->scanCxt, |
158 | "GiST queue context" , |
159 | ALLOCSET_DEFAULT_SIZES); |
160 | first_time = false; |
161 | } |
162 | else |
163 | { |
164 | /* third or later time through */ |
165 | MemoryContextReset(so->queueCxt); |
166 | first_time = false; |
167 | } |
168 | |
169 | /* |
170 | * If we're doing an index-only scan, on the first call, also initialize a |
171 | * tuple descriptor to represent the returned index tuples and create a |
172 | * memory context to hold them during the scan. |
173 | */ |
174 | if (scan->xs_want_itup && !scan->xs_hitupdesc) |
175 | { |
176 | int natts; |
177 | int nkeyatts; |
178 | int attno; |
179 | |
180 | /* |
181 | * The storage type of the index can be different from the original |
182 | * datatype being indexed, so we cannot just grab the index's tuple |
183 | * descriptor. Instead, construct a descriptor with the original data |
184 | * types. |
185 | */ |
186 | natts = RelationGetNumberOfAttributes(scan->indexRelation); |
187 | nkeyatts = IndexRelationGetNumberOfKeyAttributes(scan->indexRelation); |
188 | so->giststate->fetchTupdesc = CreateTemplateTupleDesc(natts); |
189 | for (attno = 1; attno <= nkeyatts; attno++) |
190 | { |
191 | TupleDescInitEntry(so->giststate->fetchTupdesc, attno, NULL, |
192 | scan->indexRelation->rd_opcintype[attno - 1], |
193 | -1, 0); |
194 | } |
195 | |
196 | for (; attno <= natts; attno++) |
197 | { |
198 | /* taking opcintype from giststate->tupdesc */ |
199 | TupleDescInitEntry(so->giststate->fetchTupdesc, attno, NULL, |
200 | TupleDescAttr(so->giststate->leafTupdesc, |
201 | attno - 1)->atttypid, |
202 | -1, 0); |
203 | } |
204 | scan->xs_hitupdesc = so->giststate->fetchTupdesc; |
205 | |
206 | /* Also create a memory context that will hold the returned tuples */ |
207 | so->pageDataCxt = AllocSetContextCreate(so->giststate->scanCxt, |
208 | "GiST page data context" , |
209 | ALLOCSET_DEFAULT_SIZES); |
210 | } |
211 | |
212 | /* create new, empty pairing heap for search queue */ |
213 | oldCxt = MemoryContextSwitchTo(so->queueCxt); |
214 | so->queue = pairingheap_allocate(pairingheap_GISTSearchItem_cmp, scan); |
215 | MemoryContextSwitchTo(oldCxt); |
216 | |
217 | so->firstCall = true; |
218 | |
219 | /* Update scan key, if a new one is given */ |
220 | if (key && scan->numberOfKeys > 0) |
221 | { |
222 | void ** = NULL; |
223 | |
224 | /* |
225 | * If this isn't the first time through, preserve the fn_extra |
226 | * pointers, so that if the consistentFns are using them to cache |
227 | * data, that data is not leaked across a rescan. |
228 | */ |
229 | if (!first_time) |
230 | { |
231 | fn_extras = (void **) palloc(scan->numberOfKeys * sizeof(void *)); |
232 | for (i = 0; i < scan->numberOfKeys; i++) |
233 | fn_extras[i] = scan->keyData[i].sk_func.fn_extra; |
234 | } |
235 | |
236 | memmove(scan->keyData, key, |
237 | scan->numberOfKeys * sizeof(ScanKeyData)); |
238 | |
239 | /* |
240 | * Modify the scan key so that the Consistent method is called for all |
241 | * comparisons. The original operator is passed to the Consistent |
242 | * function in the form of its strategy number, which is available |
243 | * from the sk_strategy field, and its subtype from the sk_subtype |
244 | * field. |
245 | * |
246 | * Next, if any of keys is a NULL and that key is not marked with |
247 | * SK_SEARCHNULL/SK_SEARCHNOTNULL then nothing can be found (ie, we |
248 | * assume all indexable operators are strict). |
249 | */ |
250 | so->qual_ok = true; |
251 | |
252 | for (i = 0; i < scan->numberOfKeys; i++) |
253 | { |
254 | ScanKey skey = scan->keyData + i; |
255 | |
256 | /* |
257 | * Copy consistent support function to ScanKey structure instead |
258 | * of function implementing filtering operator. |
259 | */ |
260 | fmgr_info_copy(&(skey->sk_func), |
261 | &(so->giststate->consistentFn[skey->sk_attno - 1]), |
262 | so->giststate->scanCxt); |
263 | |
264 | /* Restore prior fn_extra pointers, if not first time */ |
265 | if (!first_time) |
266 | skey->sk_func.fn_extra = fn_extras[i]; |
267 | |
268 | if (skey->sk_flags & SK_ISNULL) |
269 | { |
270 | if (!(skey->sk_flags & (SK_SEARCHNULL | SK_SEARCHNOTNULL))) |
271 | so->qual_ok = false; |
272 | } |
273 | } |
274 | |
275 | if (!first_time) |
276 | pfree(fn_extras); |
277 | } |
278 | |
279 | /* Update order-by key, if a new one is given */ |
280 | if (orderbys && scan->numberOfOrderBys > 0) |
281 | { |
282 | void ** = NULL; |
283 | |
284 | /* As above, preserve fn_extra if not first time through */ |
285 | if (!first_time) |
286 | { |
287 | fn_extras = (void **) palloc(scan->numberOfOrderBys * sizeof(void *)); |
288 | for (i = 0; i < scan->numberOfOrderBys; i++) |
289 | fn_extras[i] = scan->orderByData[i].sk_func.fn_extra; |
290 | } |
291 | |
292 | memmove(scan->orderByData, orderbys, |
293 | scan->numberOfOrderBys * sizeof(ScanKeyData)); |
294 | |
295 | so->orderByTypes = (Oid *) palloc(scan->numberOfOrderBys * sizeof(Oid)); |
296 | |
297 | /* |
298 | * Modify the order-by key so that the Distance method is called for |
299 | * all comparisons. The original operator is passed to the Distance |
300 | * function in the form of its strategy number, which is available |
301 | * from the sk_strategy field, and its subtype from the sk_subtype |
302 | * field. |
303 | */ |
304 | for (i = 0; i < scan->numberOfOrderBys; i++) |
305 | { |
306 | ScanKey skey = scan->orderByData + i; |
307 | FmgrInfo *finfo = &(so->giststate->distanceFn[skey->sk_attno - 1]); |
308 | |
309 | /* Check we actually have a distance function ... */ |
310 | if (!OidIsValid(finfo->fn_oid)) |
311 | elog(ERROR, "missing support function %d for attribute %d of index \"%s\"" , |
312 | GIST_DISTANCE_PROC, skey->sk_attno, |
313 | RelationGetRelationName(scan->indexRelation)); |
314 | |
315 | /* |
316 | * Look up the datatype returned by the original ordering |
317 | * operator. GiST always uses a float8 for the distance function, |
318 | * but the ordering operator could be anything else. |
319 | * |
320 | * XXX: The distance function is only allowed to be lossy if the |
321 | * ordering operator's result type is float4 or float8. Otherwise |
322 | * we don't know how to return the distance to the executor. But |
323 | * we cannot check that here, as we won't know if the distance |
324 | * function is lossy until it returns *recheck = true for the |
325 | * first time. |
326 | */ |
327 | so->orderByTypes[i] = get_func_rettype(skey->sk_func.fn_oid); |
328 | |
329 | /* |
330 | * Copy distance support function to ScanKey structure instead of |
331 | * function implementing ordering operator. |
332 | */ |
333 | fmgr_info_copy(&(skey->sk_func), finfo, so->giststate->scanCxt); |
334 | |
335 | /* Restore prior fn_extra pointers, if not first time */ |
336 | if (!first_time) |
337 | skey->sk_func.fn_extra = fn_extras[i]; |
338 | } |
339 | |
340 | if (!first_time) |
341 | pfree(fn_extras); |
342 | } |
343 | |
344 | /* any previous xs_hitup will have been pfree'd in context resets above */ |
345 | scan->xs_hitup = NULL; |
346 | } |
347 | |
348 | void |
349 | gistendscan(IndexScanDesc scan) |
350 | { |
351 | GISTScanOpaque so = (GISTScanOpaque) scan->opaque; |
352 | |
353 | /* |
354 | * freeGISTstate is enough to clean up everything made by gistbeginscan, |
355 | * as well as the queueCxt if there is a separate context for it. |
356 | */ |
357 | freeGISTstate(so->giststate); |
358 | } |
359 | |