1 /*-------------------------------------------------------------------------
2 *
3 * ginbulk.c
4 * routines for fast build of inverted index
5 *
6 *
7 * Portions Copyright (c) 1996-2018, PostgreSQL Global Development Group
8 * Portions Copyright (c) 1994, Regents of the University of California
9 *
10 * IDENTIFICATION
11 * src/backend/access/gin/ginbulk.c
12 *-------------------------------------------------------------------------
13 */
14
15 #include "postgres.h"
16
17 #include <limits.h>
18
19 #include "access/gin_private.h"
20 #include "utils/datum.h"
21 #include "utils/memutils.h"
22
23
24 #define DEF_NENTRY 2048 /* GinEntryAccumulator allocation quantum */
25 #define DEF_NPTR 5 /* ItemPointer initial allocation quantum */
26
27
28 /* Combiner function for rbtree.c */
29 static void
ginCombineData(RBTNode * existing,const RBTNode * newdata,void * arg)30 ginCombineData(RBTNode *existing, const RBTNode *newdata, void *arg)
31 {
32 GinEntryAccumulator *eo = (GinEntryAccumulator *) existing;
33 const GinEntryAccumulator *en = (const GinEntryAccumulator *) newdata;
34 BuildAccumulator *accum = (BuildAccumulator *) arg;
35
36 /*
37 * Note this code assumes that newdata contains only one itempointer.
38 */
39 if (eo->count >= eo->maxcount)
40 {
41 if (eo->maxcount > INT_MAX)
42 ereport(ERROR,
43 (errcode(ERRCODE_PROGRAM_LIMIT_EXCEEDED),
44 errmsg("posting list is too long"),
45 errhint("Reduce maintenance_work_mem.")));
46
47 accum->allocatedMemory -= GetMemoryChunkSpace(eo->list);
48 eo->maxcount *= 2;
49 eo->list = (ItemPointerData *)
50 repalloc_huge(eo->list, sizeof(ItemPointerData) * eo->maxcount);
51 accum->allocatedMemory += GetMemoryChunkSpace(eo->list);
52 }
53
54 /* If item pointers are not ordered, they will need to be sorted later */
55 if (eo->shouldSort == false)
56 {
57 int res;
58
59 res = ginCompareItemPointers(eo->list + eo->count - 1, en->list);
60 Assert(res != 0);
61
62 if (res > 0)
63 eo->shouldSort = true;
64 }
65
66 eo->list[eo->count] = en->list[0];
67 eo->count++;
68 }
69
70 /* Comparator function for rbtree.c */
71 static int
cmpEntryAccumulator(const RBTNode * a,const RBTNode * b,void * arg)72 cmpEntryAccumulator(const RBTNode *a, const RBTNode *b, void *arg)
73 {
74 const GinEntryAccumulator *ea = (const GinEntryAccumulator *) a;
75 const GinEntryAccumulator *eb = (const GinEntryAccumulator *) b;
76 BuildAccumulator *accum = (BuildAccumulator *) arg;
77
78 return ginCompareAttEntries(accum->ginstate,
79 ea->attnum, ea->key, ea->category,
80 eb->attnum, eb->key, eb->category);
81 }
82
83 /* Allocator function for rbtree.c */
84 static RBTNode *
ginAllocEntryAccumulator(void * arg)85 ginAllocEntryAccumulator(void *arg)
86 {
87 BuildAccumulator *accum = (BuildAccumulator *) arg;
88 GinEntryAccumulator *ea;
89
90 /*
91 * Allocate memory by rather big chunks to decrease overhead. We have no
92 * need to reclaim RBTNodes individually, so this costs nothing.
93 */
94 if (accum->entryallocator == NULL || accum->eas_used >= DEF_NENTRY)
95 {
96 accum->entryallocator = palloc(sizeof(GinEntryAccumulator) * DEF_NENTRY);
97 accum->allocatedMemory += GetMemoryChunkSpace(accum->entryallocator);
98 accum->eas_used = 0;
99 }
100
101 /* Allocate new RBTNode from current chunk */
102 ea = accum->entryallocator + accum->eas_used;
103 accum->eas_used++;
104
105 return (RBTNode *) ea;
106 }
107
108 void
ginInitBA(BuildAccumulator * accum)109 ginInitBA(BuildAccumulator *accum)
110 {
111 /* accum->ginstate is intentionally not set here */
112 accum->allocatedMemory = 0;
113 accum->entryallocator = NULL;
114 accum->eas_used = 0;
115 accum->tree = rbt_create(sizeof(GinEntryAccumulator),
116 cmpEntryAccumulator,
117 ginCombineData,
118 ginAllocEntryAccumulator,
119 NULL, /* no freefunc needed */
120 (void *) accum);
121 }
122
123 /*
124 * This is basically the same as datumCopy(), but extended to count
125 * palloc'd space in accum->allocatedMemory.
126 */
127 static Datum
getDatumCopy(BuildAccumulator * accum,OffsetNumber attnum,Datum value)128 getDatumCopy(BuildAccumulator *accum, OffsetNumber attnum, Datum value)
129 {
130 Form_pg_attribute att;
131 Datum res;
132
133 att = TupleDescAttr(accum->ginstate->origTupdesc, attnum - 1);
134 if (att->attbyval)
135 res = value;
136 else
137 {
138 res = datumCopy(value, false, att->attlen);
139 accum->allocatedMemory += GetMemoryChunkSpace(DatumGetPointer(res));
140 }
141 return res;
142 }
143
144 /*
145 * Find/store one entry from indexed value.
146 */
147 static void
ginInsertBAEntry(BuildAccumulator * accum,ItemPointer heapptr,OffsetNumber attnum,Datum key,GinNullCategory category)148 ginInsertBAEntry(BuildAccumulator *accum,
149 ItemPointer heapptr, OffsetNumber attnum,
150 Datum key, GinNullCategory category)
151 {
152 GinEntryAccumulator eatmp;
153 GinEntryAccumulator *ea;
154 bool isNew;
155
156 /*
157 * For the moment, fill only the fields of eatmp that will be looked at by
158 * cmpEntryAccumulator or ginCombineData.
159 */
160 eatmp.attnum = attnum;
161 eatmp.key = key;
162 eatmp.category = category;
163 /* temporarily set up single-entry itempointer list */
164 eatmp.list = heapptr;
165
166 ea = (GinEntryAccumulator *) rbt_insert(accum->tree, (RBTNode *) &eatmp,
167 &isNew);
168
169 if (isNew)
170 {
171 /*
172 * Finish initializing new tree entry, including making permanent
173 * copies of the datum (if it's not null) and itempointer.
174 */
175 if (category == GIN_CAT_NORM_KEY)
176 ea->key = getDatumCopy(accum, attnum, key);
177 ea->maxcount = DEF_NPTR;
178 ea->count = 1;
179 ea->shouldSort = false;
180 ea->list =
181 (ItemPointerData *) palloc(sizeof(ItemPointerData) * DEF_NPTR);
182 ea->list[0] = *heapptr;
183 accum->allocatedMemory += GetMemoryChunkSpace(ea->list);
184 }
185 else
186 {
187 /*
188 * ginCombineData did everything needed.
189 */
190 }
191 }
192
193 /*
194 * Insert the entries for one heap pointer.
195 *
196 * Since the entries are being inserted into a balanced binary tree, you
197 * might think that the order of insertion wouldn't be critical, but it turns
198 * out that inserting the entries in sorted order results in a lot of
199 * rebalancing operations and is slow. To prevent this, we attempt to insert
200 * the nodes in an order that will produce a nearly-balanced tree if the input
201 * is in fact sorted.
202 *
203 * We do this as follows. First, we imagine that we have an array whose size
204 * is the smallest power of two greater than or equal to the actual array
205 * size. Second, we insert the middle entry of our virtual array into the
206 * tree; then, we insert the middles of each half of our virtual array, then
207 * middles of quarters, etc.
208 */
209 void
ginInsertBAEntries(BuildAccumulator * accum,ItemPointer heapptr,OffsetNumber attnum,Datum * entries,GinNullCategory * categories,int32 nentries)210 ginInsertBAEntries(BuildAccumulator *accum,
211 ItemPointer heapptr, OffsetNumber attnum,
212 Datum *entries, GinNullCategory *categories,
213 int32 nentries)
214 {
215 uint32 step = nentries;
216
217 if (nentries <= 0)
218 return;
219
220 Assert(ItemPointerIsValid(heapptr) && attnum >= FirstOffsetNumber);
221
222 /*
223 * step will contain largest power of 2 and <= nentries
224 */
225 step |= (step >> 1);
226 step |= (step >> 2);
227 step |= (step >> 4);
228 step |= (step >> 8);
229 step |= (step >> 16);
230 step >>= 1;
231 step++;
232
233 while (step > 0)
234 {
235 int i;
236
237 for (i = step - 1; i < nentries && i >= 0; i += step << 1 /* *2 */ )
238 ginInsertBAEntry(accum, heapptr, attnum,
239 entries[i], categories[i]);
240
241 step >>= 1; /* /2 */
242 }
243 }
244
245 static int
qsortCompareItemPointers(const void * a,const void * b)246 qsortCompareItemPointers(const void *a, const void *b)
247 {
248 int res = ginCompareItemPointers((ItemPointer) a, (ItemPointer) b);
249
250 /* Assert that there are no equal item pointers being sorted */
251 Assert(res != 0);
252 return res;
253 }
254
255 /* Prepare to read out the rbtree contents using ginGetBAEntry */
256 void
ginBeginBAScan(BuildAccumulator * accum)257 ginBeginBAScan(BuildAccumulator *accum)
258 {
259 rbt_begin_iterate(accum->tree, LeftRightWalk, &accum->tree_walk);
260 }
261
262 /*
263 * Get the next entry in sequence from the BuildAccumulator's rbtree.
264 * This consists of a single key datum and a list (array) of one or more
265 * heap TIDs in which that key is found. The list is guaranteed sorted.
266 */
267 ItemPointerData *
ginGetBAEntry(BuildAccumulator * accum,OffsetNumber * attnum,Datum * key,GinNullCategory * category,uint32 * n)268 ginGetBAEntry(BuildAccumulator *accum,
269 OffsetNumber *attnum, Datum *key, GinNullCategory *category,
270 uint32 *n)
271 {
272 GinEntryAccumulator *entry;
273 ItemPointerData *list;
274
275 entry = (GinEntryAccumulator *) rbt_iterate(&accum->tree_walk);
276
277 if (entry == NULL)
278 return NULL; /* no more entries */
279
280 *attnum = entry->attnum;
281 *key = entry->key;
282 *category = entry->category;
283 list = entry->list;
284 *n = entry->count;
285
286 Assert(list != NULL && entry->count > 0);
287
288 if (entry->shouldSort && entry->count > 1)
289 qsort(list, entry->count, sizeof(ItemPointerData),
290 qsortCompareItemPointers);
291
292 return list;
293 }
294