1 /*-------------------------------------------------------------------------
2  *
3  * sortsupport.h
4  *	  Framework for accelerated sorting.
5  *
6  * Traditionally, PostgreSQL has implemented sorting by repeatedly invoking
7  * an SQL-callable comparison function "cmp(x, y) returns int" on pairs of
8  * values to be compared, where the comparison function is the BTORDER_PROC
9  * pg_amproc support function of the appropriate btree index opclass.
10  *
11  * This file defines alternative APIs that allow sorting to be performed with
12  * reduced overhead.  To support lower-overhead sorting, a btree opclass may
13  * provide a BTSORTSUPPORT_PROC pg_amproc entry, which must take a single
14  * argument of type internal and return void.  The argument is actually a
15  * pointer to a SortSupportData struct, which is defined below.
16  *
17  * If provided, the BTSORTSUPPORT function will be called during sort setup,
18  * and it must initialize the provided struct with pointers to function(s)
19  * that can be called to perform sorting.  This API is defined to allow
20  * multiple acceleration mechanisms to be supported, but no opclass is
21  * required to provide all of them.  The BTSORTSUPPORT function should
22  * simply not set any function pointers for mechanisms it doesn't support.
23  * Opclasses that provide BTSORTSUPPORT and don't provide a comparator
24  * function will have a shim set up by sort support automatically.  However,
25  * opclasses that support the optional additional abbreviated key capability
26  * must always provide an authoritative comparator used to tie-break
27  * inconclusive abbreviated comparisons and also used  when aborting
28  * abbreviation.  Furthermore, a converter and abort/costing function must be
29  * provided.
30  *
31  * All sort support functions will be passed the address of the
32  * SortSupportData struct when called, so they can use it to store
33  * additional private data as needed.  In particular, for collation-aware
34  * datatypes, the ssup_collation field is set before calling BTSORTSUPPORT
35  * and is available to all support functions.  Additional opclass-dependent
36  * data can be stored using the ssup_extra field.  Any such data
37  * should be allocated in the ssup_cxt memory context.
38  *
39  * Note: since pg_amproc functions are indexed by (lefttype, righttype)
40  * it is possible to associate a BTSORTSUPPORT function with a cross-type
41  * comparison.  This could sensibly be used to provide a fast comparator
42  * function for such cases, but probably not any other acceleration method.
43  *
44  *
45  * Portions Copyright (c) 1996-2019, PostgreSQL Global Development Group
46  * Portions Copyright (c) 1994, Regents of the University of California
47  *
48  * src/include/utils/sortsupport.h
49  *
50  *-------------------------------------------------------------------------
51  */
52 #ifndef SORTSUPPORT_H
53 #define SORTSUPPORT_H
54 
55 #include "access/attnum.h"
56 #include "utils/relcache.h"
57 
58 typedef struct SortSupportData *SortSupport;
59 
60 typedef struct SortSupportData
61 {
62 	/*
63 	 * These fields are initialized before calling the BTSORTSUPPORT function
64 	 * and should not be changed later.
65 	 */
66 	MemoryContext ssup_cxt;		/* Context containing sort info */
67 	Oid			ssup_collation; /* Collation to use, or InvalidOid */
68 
69 	/*
70 	 * Additional sorting parameters; but unlike ssup_collation, these can be
71 	 * changed after BTSORTSUPPORT is called, so don't use them in selecting
72 	 * sort support functions.
73 	 */
74 	bool		ssup_reverse;	/* descending-order sort? */
75 	bool		ssup_nulls_first;	/* sort nulls first? */
76 
77 	/*
78 	 * These fields are workspace for callers, and should not be touched by
79 	 * opclass-specific functions.
80 	 */
81 	AttrNumber	ssup_attno;		/* column number to sort */
82 
83 	/*
84 	 * ssup_extra is zeroed before calling the BTSORTSUPPORT function, and is
85 	 * not touched subsequently by callers.
86 	 */
87 	void	   *ssup_extra;		/* Workspace for opclass functions */
88 
89 	/*
90 	 * Function pointers are zeroed before calling the BTSORTSUPPORT function,
91 	 * and must be set by it for any acceleration methods it wants to supply.
92 	 * The comparator pointer must be set, others are optional.
93 	 */
94 
95 	/*
96 	 * Comparator function has the same API as the traditional btree
97 	 * comparison function, ie, return <0, 0, or >0 according as x is less
98 	 * than, equal to, or greater than y.  Note that x and y are guaranteed
99 	 * not null, and there is no way to return null either.
100 	 *
101 	 * This may be either the authoritative comparator, or the abbreviated
102 	 * comparator.  Core code may switch this over the initial preference of
103 	 * an opclass support function despite originally indicating abbreviation
104 	 * was applicable, by assigning the authoritative comparator back.
105 	 */
106 	int			(*comparator) (Datum x, Datum y, SortSupport ssup);
107 
108 	/*
109 	 * "Abbreviated key" infrastructure follows.
110 	 *
111 	 * All callbacks must be set by sortsupport opclasses that make use of
112 	 * this optional additional infrastructure (unless for whatever reasons
113 	 * the opclass doesn't proceed with abbreviation, in which case
114 	 * abbrev_converter must not be set).
115 	 *
116 	 * This allows opclass authors to supply a conversion routine, used to
117 	 * create an alternative representation of the underlying type (an
118 	 * "abbreviated key").  This representation must be pass-by-value and
119 	 * typically will use some ad-hoc format that only the opclass has
120 	 * knowledge of.  An alternative comparator, used only with this
121 	 * alternative representation must also be provided (which is assigned to
122 	 * "comparator").  This representation is a simple approximation of the
123 	 * original Datum.  It must be possible to compare datums of this
124 	 * representation with each other using the supplied alternative
125 	 * comparator, and have any non-zero return value be a reliable proxy for
126 	 * what a proper comparison would indicate. Returning zero from the
127 	 * alternative comparator does not indicate equality, as with a
128 	 * conventional support routine 1, though -- it indicates that it wasn't
129 	 * possible to determine how the two abbreviated values compared.  A
130 	 * proper comparison, using "abbrev_full_comparator"/
131 	 * ApplySortAbbrevFullComparator() is therefore required.  In many cases
132 	 * this results in most or all comparisons only using the cheap
133 	 * alternative comparison func, which is typically implemented as code
134 	 * that compiles to just a few CPU instructions.  CPU cache miss penalties
135 	 * are expensive; to get good overall performance, sort infrastructure
136 	 * must heavily weigh cache performance.
137 	 *
138 	 * Opclass authors must consider the final cardinality of abbreviated keys
139 	 * when devising an encoding scheme.  It's possible for a strategy to work
140 	 * better than an alternative strategy with one usage pattern, while the
141 	 * reverse might be true for another usage pattern.  All of these factors
142 	 * must be considered.
143 	 */
144 
145 	/*
146 	 * "abbreviate" concerns whether or not the abbreviated key optimization
147 	 * is applicable in principle (that is, the sortsupport routine needs to
148 	 * know if its dealing with a key where an abbreviated representation can
149 	 * usefully be packed together.  Conventionally, this is the leading
150 	 * attribute key).  Note, however, that in order to determine that
151 	 * abbreviation is not in play, the core code always checks whether or not
152 	 * the opclass has set abbrev_converter.  This is a one way, one time
153 	 * message to the opclass.
154 	 */
155 	bool		abbreviate;
156 
157 	/*
158 	 * Converter to abbreviated format, from original representation.  Core
159 	 * code uses this callback to convert from a pass-by-reference "original"
160 	 * Datum to a pass-by-value abbreviated key Datum.  Note that original is
161 	 * guaranteed NOT NULL, because it doesn't make sense to factor NULLness
162 	 * into ad-hoc cost model.
163 	 *
164 	 * abbrev_converter is tested to see if abbreviation is in play.  Core
165 	 * code may set it to NULL to indicate abbreviation should not be used
166 	 * (which is something sortsupport routines need not concern themselves
167 	 * with). However, sortsupport routines must not set it when it is
168 	 * immediately established that abbreviation should not proceed (e.g., for
169 	 * !abbreviate calls, or due to platform-specific impediments to using
170 	 * abbreviation).
171 	 */
172 	Datum		(*abbrev_converter) (Datum original, SortSupport ssup);
173 
174 	/*
175 	 * abbrev_abort callback allows clients to verify that the current
176 	 * strategy is working out, using a sortsupport routine defined ad-hoc
177 	 * cost model. If there is a lot of duplicate abbreviated keys in
178 	 * practice, it's useful to be able to abandon the strategy before paying
179 	 * too high a cost in conversion (perhaps certain opclass-specific
180 	 * adaptations are useful too).
181 	 */
182 	bool		(*abbrev_abort) (int memtupcount, SortSupport ssup);
183 
184 	/*
185 	 * Full, authoritative comparator for key that an abbreviated
186 	 * representation was generated for, used when an abbreviated comparison
187 	 * was inconclusive (by calling ApplySortAbbrevFullComparator()), or used
188 	 * to replace "comparator" when core system ultimately decides against
189 	 * abbreviation.
190 	 */
191 	int			(*abbrev_full_comparator) (Datum x, Datum y, SortSupport ssup);
192 } SortSupportData;
193 
194 
195 /*
196  * Apply a sort comparator function and return a 3-way comparison result.
197  * This takes care of handling reverse-sort and NULLs-ordering properly.
198  */
199 static inline int
ApplySortComparator(Datum datum1,bool isNull1,Datum datum2,bool isNull2,SortSupport ssup)200 ApplySortComparator(Datum datum1, bool isNull1,
201 					Datum datum2, bool isNull2,
202 					SortSupport ssup)
203 {
204 	int			compare;
205 
206 	if (isNull1)
207 	{
208 		if (isNull2)
209 			compare = 0;		/* NULL "=" NULL */
210 		else if (ssup->ssup_nulls_first)
211 			compare = -1;		/* NULL "<" NOT_NULL */
212 		else
213 			compare = 1;		/* NULL ">" NOT_NULL */
214 	}
215 	else if (isNull2)
216 	{
217 		if (ssup->ssup_nulls_first)
218 			compare = 1;		/* NOT_NULL ">" NULL */
219 		else
220 			compare = -1;		/* NOT_NULL "<" NULL */
221 	}
222 	else
223 	{
224 		compare = ssup->comparator(datum1, datum2, ssup);
225 		if (ssup->ssup_reverse)
226 			INVERT_COMPARE_RESULT(compare);
227 	}
228 
229 	return compare;
230 }
231 
232 /*
233  * Apply a sort comparator function and return a 3-way comparison using full,
234  * authoritative comparator.  This takes care of handling reverse-sort and
235  * NULLs-ordering properly.
236  */
237 static inline int
ApplySortAbbrevFullComparator(Datum datum1,bool isNull1,Datum datum2,bool isNull2,SortSupport ssup)238 ApplySortAbbrevFullComparator(Datum datum1, bool isNull1,
239 							  Datum datum2, bool isNull2,
240 							  SortSupport ssup)
241 {
242 	int			compare;
243 
244 	if (isNull1)
245 	{
246 		if (isNull2)
247 			compare = 0;		/* NULL "=" NULL */
248 		else if (ssup->ssup_nulls_first)
249 			compare = -1;		/* NULL "<" NOT_NULL */
250 		else
251 			compare = 1;		/* NULL ">" NOT_NULL */
252 	}
253 	else if (isNull2)
254 	{
255 		if (ssup->ssup_nulls_first)
256 			compare = 1;		/* NOT_NULL ">" NULL */
257 		else
258 			compare = -1;		/* NOT_NULL "<" NULL */
259 	}
260 	else
261 	{
262 		compare = ssup->abbrev_full_comparator(datum1, datum2, ssup);
263 		if (ssup->ssup_reverse)
264 			INVERT_COMPARE_RESULT(compare);
265 	}
266 
267 	return compare;
268 }
269 
270 /* Other functions in utils/sort/sortsupport.c */
271 extern void PrepareSortSupportComparisonShim(Oid cmpFunc, SortSupport ssup);
272 extern void PrepareSortSupportFromOrderingOp(Oid orderingOp, SortSupport ssup);
273 extern void PrepareSortSupportFromIndexRel(Relation indexRel, int16 strategy,
274 										   SortSupport ssup);
275 
276 #endif							/* SORTSUPPORT_H */
277