1 | /*------------------------------------------------------------------------- |
2 | * |
3 | * sortsupport.h |
4 | * Framework for accelerated sorting. |
5 | * |
6 | * Traditionally, PostgreSQL has implemented sorting by repeatedly invoking |
7 | * an SQL-callable comparison function "cmp(x, y) returns int" on pairs of |
8 | * values to be compared, where the comparison function is the BTORDER_PROC |
9 | * pg_amproc support function of the appropriate btree index opclass. |
10 | * |
11 | * This file defines alternative APIs that allow sorting to be performed with |
12 | * reduced overhead. To support lower-overhead sorting, a btree opclass may |
13 | * provide a BTSORTSUPPORT_PROC pg_amproc entry, which must take a single |
14 | * argument of type internal and return void. The argument is actually a |
15 | * pointer to a SortSupportData struct, which is defined below. |
16 | * |
17 | * If provided, the BTSORTSUPPORT function will be called during sort setup, |
18 | * and it must initialize the provided struct with pointers to function(s) |
19 | * that can be called to perform sorting. This API is defined to allow |
20 | * multiple acceleration mechanisms to be supported, but no opclass is |
21 | * required to provide all of them. The BTSORTSUPPORT function should |
22 | * simply not set any function pointers for mechanisms it doesn't support. |
23 | * Opclasses that provide BTSORTSUPPORT and don't provide a comparator |
24 | * function will have a shim set up by sort support automatically. However, |
25 | * opclasses that support the optional additional abbreviated key capability |
26 | * must always provide an authoritative comparator used to tie-break |
27 | * inconclusive abbreviated comparisons and also used when aborting |
28 | * abbreviation. Furthermore, a converter and abort/costing function must be |
29 | * provided. |
30 | * |
31 | * All sort support functions will be passed the address of the |
32 | * SortSupportData struct when called, so they can use it to store |
33 | * additional private data as needed. In particular, for collation-aware |
34 | * datatypes, the ssup_collation field is set before calling BTSORTSUPPORT |
35 | * and is available to all support functions. Additional opclass-dependent |
36 | * data can be stored using the ssup_extra field. Any such data |
37 | * should be allocated in the ssup_cxt memory context. |
38 | * |
39 | * Note: since pg_amproc functions are indexed by (lefttype, righttype) |
40 | * it is possible to associate a BTSORTSUPPORT function with a cross-type |
41 | * comparison. This could sensibly be used to provide a fast comparator |
42 | * function for such cases, but probably not any other acceleration method. |
43 | * |
44 | * |
45 | * Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group |
46 | * Portions Copyright (c) 1994, Regents of the University of California |
47 | * |
48 | * src/include/utils/sortsupport.h |
49 | * |
50 | *------------------------------------------------------------------------- |
51 | */ |
52 | #ifndef SORTSUPPORT_H |
53 | #define SORTSUPPORT_H |
54 | |
55 | #include "access/attnum.h" |
56 | #include "utils/relcache.h" |
57 | |
58 | typedef struct SortSupportData *SortSupport; |
59 | |
60 | typedef struct SortSupportData |
61 | { |
62 | /* |
63 | * These fields are initialized before calling the BTSORTSUPPORT function |
64 | * and should not be changed later. |
65 | */ |
66 | MemoryContext ssup_cxt; /* Context containing sort info */ |
67 | Oid ssup_collation; /* Collation to use, or InvalidOid */ |
68 | |
69 | /* |
70 | * Additional sorting parameters; but unlike ssup_collation, these can be |
71 | * changed after BTSORTSUPPORT is called, so don't use them in selecting |
72 | * sort support functions. |
73 | */ |
74 | bool ssup_reverse; /* descending-order sort? */ |
75 | bool ssup_nulls_first; /* sort nulls first? */ |
76 | |
77 | /* |
78 | * These fields are workspace for callers, and should not be touched by |
79 | * opclass-specific functions. |
80 | */ |
81 | AttrNumber ssup_attno; /* column number to sort */ |
82 | |
83 | /* |
84 | * ssup_extra is zeroed before calling the BTSORTSUPPORT function, and is |
85 | * not touched subsequently by callers. |
86 | */ |
87 | void *; /* Workspace for opclass functions */ |
88 | |
89 | /* |
90 | * Function pointers are zeroed before calling the BTSORTSUPPORT function, |
91 | * and must be set by it for any acceleration methods it wants to supply. |
92 | * The comparator pointer must be set, others are optional. |
93 | */ |
94 | |
95 | /* |
96 | * Comparator function has the same API as the traditional btree |
97 | * comparison function, ie, return <0, 0, or >0 according as x is less |
98 | * than, equal to, or greater than y. Note that x and y are guaranteed |
99 | * not null, and there is no way to return null either. |
100 | * |
101 | * This may be either the authoritative comparator, or the abbreviated |
102 | * comparator. Core code may switch this over the initial preference of |
103 | * an opclass support function despite originally indicating abbreviation |
104 | * was applicable, by assigning the authoritative comparator back. |
105 | */ |
106 | int (*comparator) (Datum x, Datum y, SortSupport ssup); |
107 | |
108 | /* |
109 | * "Abbreviated key" infrastructure follows. |
110 | * |
111 | * All callbacks must be set by sortsupport opclasses that make use of |
112 | * this optional additional infrastructure (unless for whatever reasons |
113 | * the opclass doesn't proceed with abbreviation, in which case |
114 | * abbrev_converter must not be set). |
115 | * |
116 | * This allows opclass authors to supply a conversion routine, used to |
117 | * create an alternative representation of the underlying type (an |
118 | * "abbreviated key"). This representation must be pass-by-value and |
119 | * typically will use some ad-hoc format that only the opclass has |
120 | * knowledge of. An alternative comparator, used only with this |
121 | * alternative representation must also be provided (which is assigned to |
122 | * "comparator"). This representation is a simple approximation of the |
123 | * original Datum. It must be possible to compare datums of this |
124 | * representation with each other using the supplied alternative |
125 | * comparator, and have any non-zero return value be a reliable proxy for |
126 | * what a proper comparison would indicate. Returning zero from the |
127 | * alternative comparator does not indicate equality, as with a |
128 | * conventional support routine 1, though -- it indicates that it wasn't |
129 | * possible to determine how the two abbreviated values compared. A |
130 | * proper comparison, using "abbrev_full_comparator"/ |
131 | * ApplySortAbbrevFullComparator() is therefore required. In many cases |
132 | * this results in most or all comparisons only using the cheap |
133 | * alternative comparison func, which is typically implemented as code |
134 | * that compiles to just a few CPU instructions. CPU cache miss penalties |
135 | * are expensive; to get good overall performance, sort infrastructure |
136 | * must heavily weigh cache performance. |
137 | * |
138 | * Opclass authors must consider the final cardinality of abbreviated keys |
139 | * when devising an encoding scheme. It's possible for a strategy to work |
140 | * better than an alternative strategy with one usage pattern, while the |
141 | * reverse might be true for another usage pattern. All of these factors |
142 | * must be considered. |
143 | */ |
144 | |
145 | /* |
146 | * "abbreviate" concerns whether or not the abbreviated key optimization |
147 | * is applicable in principle (that is, the sortsupport routine needs to |
148 | * know if its dealing with a key where an abbreviated representation can |
149 | * usefully be packed together. Conventionally, this is the leading |
150 | * attribute key). Note, however, that in order to determine that |
151 | * abbreviation is not in play, the core code always checks whether or not |
152 | * the opclass has set abbrev_converter. This is a one way, one time |
153 | * message to the opclass. |
154 | */ |
155 | bool abbreviate; |
156 | |
157 | /* |
158 | * Converter to abbreviated format, from original representation. Core |
159 | * code uses this callback to convert from a pass-by-reference "original" |
160 | * Datum to a pass-by-value abbreviated key Datum. Note that original is |
161 | * guaranteed NOT NULL, because it doesn't make sense to factor NULLness |
162 | * into ad-hoc cost model. |
163 | * |
164 | * abbrev_converter is tested to see if abbreviation is in play. Core |
165 | * code may set it to NULL to indicate abbreviation should not be used |
166 | * (which is something sortsupport routines need not concern themselves |
167 | * with). However, sortsupport routines must not set it when it is |
168 | * immediately established that abbreviation should not proceed (e.g., for |
169 | * !abbreviate calls, or due to platform-specific impediments to using |
170 | * abbreviation). |
171 | */ |
172 | Datum (*abbrev_converter) (Datum original, SortSupport ssup); |
173 | |
174 | /* |
175 | * abbrev_abort callback allows clients to verify that the current |
176 | * strategy is working out, using a sortsupport routine defined ad-hoc |
177 | * cost model. If there is a lot of duplicate abbreviated keys in |
178 | * practice, it's useful to be able to abandon the strategy before paying |
179 | * too high a cost in conversion (perhaps certain opclass-specific |
180 | * adaptations are useful too). |
181 | */ |
182 | bool (*abbrev_abort) (int memtupcount, SortSupport ssup); |
183 | |
184 | /* |
185 | * Full, authoritative comparator for key that an abbreviated |
186 | * representation was generated for, used when an abbreviated comparison |
187 | * was inconclusive (by calling ApplySortAbbrevFullComparator()), or used |
188 | * to replace "comparator" when core system ultimately decides against |
189 | * abbreviation. |
190 | */ |
191 | int (*abbrev_full_comparator) (Datum x, Datum y, SortSupport ssup); |
192 | } SortSupportData; |
193 | |
194 | |
195 | /* |
196 | * Apply a sort comparator function and return a 3-way comparison result. |
197 | * This takes care of handling reverse-sort and NULLs-ordering properly. |
198 | */ |
199 | static inline int |
200 | ApplySortComparator(Datum datum1, bool isNull1, |
201 | Datum datum2, bool isNull2, |
202 | SortSupport ssup) |
203 | { |
204 | int compare; |
205 | |
206 | if (isNull1) |
207 | { |
208 | if (isNull2) |
209 | compare = 0; /* NULL "=" NULL */ |
210 | else if (ssup->ssup_nulls_first) |
211 | compare = -1; /* NULL "<" NOT_NULL */ |
212 | else |
213 | compare = 1; /* NULL ">" NOT_NULL */ |
214 | } |
215 | else if (isNull2) |
216 | { |
217 | if (ssup->ssup_nulls_first) |
218 | compare = 1; /* NOT_NULL ">" NULL */ |
219 | else |
220 | compare = -1; /* NOT_NULL "<" NULL */ |
221 | } |
222 | else |
223 | { |
224 | compare = ssup->comparator(datum1, datum2, ssup); |
225 | if (ssup->ssup_reverse) |
226 | INVERT_COMPARE_RESULT(compare); |
227 | } |
228 | |
229 | return compare; |
230 | } |
231 | |
232 | /* |
233 | * Apply a sort comparator function and return a 3-way comparison using full, |
234 | * authoritative comparator. This takes care of handling reverse-sort and |
235 | * NULLs-ordering properly. |
236 | */ |
237 | static inline int |
238 | ApplySortAbbrevFullComparator(Datum datum1, bool isNull1, |
239 | Datum datum2, bool isNull2, |
240 | SortSupport ssup) |
241 | { |
242 | int compare; |
243 | |
244 | if (isNull1) |
245 | { |
246 | if (isNull2) |
247 | compare = 0; /* NULL "=" NULL */ |
248 | else if (ssup->ssup_nulls_first) |
249 | compare = -1; /* NULL "<" NOT_NULL */ |
250 | else |
251 | compare = 1; /* NULL ">" NOT_NULL */ |
252 | } |
253 | else if (isNull2) |
254 | { |
255 | if (ssup->ssup_nulls_first) |
256 | compare = 1; /* NOT_NULL ">" NULL */ |
257 | else |
258 | compare = -1; /* NOT_NULL "<" NULL */ |
259 | } |
260 | else |
261 | { |
262 | compare = ssup->abbrev_full_comparator(datum1, datum2, ssup); |
263 | if (ssup->ssup_reverse) |
264 | INVERT_COMPARE_RESULT(compare); |
265 | } |
266 | |
267 | return compare; |
268 | } |
269 | |
270 | /* Other functions in utils/sort/sortsupport.c */ |
271 | extern void PrepareSortSupportComparisonShim(Oid cmpFunc, SortSupport ssup); |
272 | extern void PrepareSortSupportFromOrderingOp(Oid orderingOp, SortSupport ssup); |
273 | extern void PrepareSortSupportFromIndexRel(Relation indexRel, int16 strategy, |
274 | SortSupport ssup); |
275 | |
276 | #endif /* SORTSUPPORT_H */ |
277 | |