Line data Source code
1 : /*-------------------------------------------------------------------------
2 : *
3 : * gininsert.c
4 : * insert routines for the postgres inverted index access method.
5 : *
6 : *
7 : * Portions Copyright (c) 1996-2025, PostgreSQL Global Development Group
8 : * Portions Copyright (c) 1994, Regents of the University of California
9 : *
10 : * IDENTIFICATION
11 : * src/backend/access/gin/gininsert.c
12 : *-------------------------------------------------------------------------
13 : */
14 :
15 : #include "postgres.h"
16 :
17 : #include "access/gin_private.h"
18 : #include "access/tableam.h"
19 : #include "access/xloginsert.h"
20 : #include "miscadmin.h"
21 : #include "nodes/execnodes.h"
22 : #include "storage/bufmgr.h"
23 : #include "storage/predicate.h"
24 : #include "utils/memutils.h"
25 : #include "utils/rel.h"
26 :
27 : typedef struct
28 : {
29 : GinState ginstate;
30 : double indtuples;
31 : GinStatsData buildStats;
32 : MemoryContext tmpCtx;
33 : MemoryContext funcCtx;
34 : BuildAccumulator accum;
35 : } GinBuildState;
36 :
37 :
38 : /*
39 : * Adds array of item pointers to tuple's posting list, or
40 : * creates posting tree and tuple pointing to tree in case
41 : * of not enough space. Max size of tuple is defined in
42 : * GinFormTuple(). Returns a new, modified index tuple.
43 : * items[] must be in sorted order with no duplicates.
44 : */
45 : static IndexTuple
46 32676 : addItemPointersToLeafTuple(GinState *ginstate,
47 : IndexTuple old,
48 : ItemPointerData *items, uint32 nitem,
49 : GinStatsData *buildStats, Buffer buffer)
50 : {
51 : OffsetNumber attnum;
52 : Datum key;
53 : GinNullCategory category;
54 : IndexTuple res;
55 : ItemPointerData *newItems,
56 : *oldItems;
57 : int oldNPosting,
58 : newNPosting;
59 : GinPostingList *compressedList;
60 :
61 : Assert(!GinIsPostingTree(old));
62 :
63 32676 : attnum = gintuple_get_attrnum(ginstate, old);
64 32676 : key = gintuple_get_key(ginstate, old, &category);
65 :
66 : /* merge the old and new posting lists */
67 32676 : oldItems = ginReadTuple(ginstate, attnum, old, &oldNPosting);
68 :
69 32676 : newItems = ginMergeItemPointers(items, nitem,
70 : oldItems, oldNPosting,
71 : &newNPosting);
72 :
73 : /* Compress the posting list, and try to a build tuple with room for it */
74 32676 : res = NULL;
75 32676 : compressedList = ginCompressPostingList(newItems, newNPosting, GinMaxItemSize,
76 : NULL);
77 32676 : pfree(newItems);
78 32676 : if (compressedList)
79 : {
80 32676 : res = GinFormTuple(ginstate, attnum, key, category,
81 : (char *) compressedList,
82 32676 : SizeOfGinPostingList(compressedList),
83 : newNPosting,
84 : false);
85 32676 : pfree(compressedList);
86 : }
87 32676 : if (!res)
88 : {
89 : /* posting list would be too big, convert to posting tree */
90 : BlockNumber postingRoot;
91 :
92 : /*
93 : * Initialize posting tree with the old tuple's posting list. It's
94 : * surely small enough to fit on one posting-tree page, and should
95 : * already be in order with no duplicates.
96 : */
97 28 : postingRoot = createPostingTree(ginstate->index,
98 : oldItems,
99 : oldNPosting,
100 : buildStats,
101 : buffer);
102 :
103 : /* Now insert the TIDs-to-be-added into the posting tree */
104 28 : ginInsertItemPointers(ginstate->index, postingRoot,
105 : items, nitem,
106 : buildStats);
107 :
108 : /* And build a new posting-tree-only result tuple */
109 28 : res = GinFormTuple(ginstate, attnum, key, category, NULL, 0, 0, true);
110 28 : GinSetPostingTree(res, postingRoot);
111 : }
112 32676 : pfree(oldItems);
113 :
114 32676 : return res;
115 : }
116 :
117 : /*
118 : * Build a fresh leaf tuple, either posting-list or posting-tree format
119 : * depending on whether the given items list will fit.
120 : * items[] must be in sorted order with no duplicates.
121 : *
122 : * This is basically the same logic as in addItemPointersToLeafTuple,
123 : * but working from slightly different input.
124 : */
125 : static IndexTuple
126 689426 : buildFreshLeafTuple(GinState *ginstate,
127 : OffsetNumber attnum, Datum key, GinNullCategory category,
128 : ItemPointerData *items, uint32 nitem,
129 : GinStatsData *buildStats, Buffer buffer)
130 : {
131 689426 : IndexTuple res = NULL;
132 : GinPostingList *compressedList;
133 :
134 : /* try to build a posting list tuple with all the items */
135 689426 : compressedList = ginCompressPostingList(items, nitem, GinMaxItemSize, NULL);
136 689426 : if (compressedList)
137 : {
138 689426 : res = GinFormTuple(ginstate, attnum, key, category,
139 : (char *) compressedList,
140 689426 : SizeOfGinPostingList(compressedList),
141 : nitem, false);
142 689426 : pfree(compressedList);
143 : }
144 689426 : if (!res)
145 : {
146 : /* posting list would be too big, build posting tree */
147 : BlockNumber postingRoot;
148 :
149 : /*
150 : * Build posting-tree-only result tuple. We do this first so as to
151 : * fail quickly if the key is too big.
152 : */
153 100 : res = GinFormTuple(ginstate, attnum, key, category, NULL, 0, 0, true);
154 :
155 : /*
156 : * Initialize a new posting tree with the TIDs.
157 : */
158 100 : postingRoot = createPostingTree(ginstate->index, items, nitem,
159 : buildStats, buffer);
160 :
161 : /* And save the root link in the result tuple */
162 100 : GinSetPostingTree(res, postingRoot);
163 : }
164 :
165 689426 : return res;
166 : }
167 :
168 : /*
169 : * Insert one or more heap TIDs associated with the given key value.
170 : * This will either add a single key entry, or enlarge a pre-existing entry.
171 : *
172 : * During an index build, buildStats is non-null and the counters
173 : * it contains should be incremented as needed.
174 : */
175 : void
176 771506 : ginEntryInsert(GinState *ginstate,
177 : OffsetNumber attnum, Datum key, GinNullCategory category,
178 : ItemPointerData *items, uint32 nitem,
179 : GinStatsData *buildStats)
180 : {
181 : GinBtreeData btree;
182 : GinBtreeEntryInsertData insertdata;
183 : GinBtreeStack *stack;
184 : IndexTuple itup;
185 : Page page;
186 :
187 771506 : insertdata.isDelete = false;
188 :
189 771506 : ginPrepareEntryScan(&btree, attnum, key, category, ginstate);
190 771506 : btree.isBuild = (buildStats != NULL);
191 :
192 771506 : stack = ginFindLeafPage(&btree, false, false);
193 771506 : page = BufferGetPage(stack->buffer);
194 :
195 771506 : if (btree.findItem(&btree, stack))
196 : {
197 : /* found pre-existing entry */
198 82076 : itup = (IndexTuple) PageGetItem(page, PageGetItemId(page, stack->off));
199 :
200 82076 : if (GinIsPostingTree(itup))
201 : {
202 : /* add entries to existing posting tree */
203 49392 : BlockNumber rootPostingTree = GinGetPostingTree(itup);
204 :
205 : /* release all stack */
206 49392 : LockBuffer(stack->buffer, GIN_UNLOCK);
207 49392 : freeGinBtreeStack(stack);
208 :
209 : /* insert into posting tree */
210 49392 : ginInsertItemPointers(ginstate->index, rootPostingTree,
211 : items, nitem,
212 : buildStats);
213 49388 : return;
214 : }
215 :
216 32684 : CheckForSerializableConflictIn(ginstate->index, NULL,
217 : BufferGetBlockNumber(stack->buffer));
218 : /* modify an existing leaf entry */
219 32676 : itup = addItemPointersToLeafTuple(ginstate, itup,
220 : items, nitem, buildStats, stack->buffer);
221 :
222 32676 : insertdata.isDelete = true;
223 : }
224 : else
225 : {
226 689430 : CheckForSerializableConflictIn(ginstate->index, NULL,
227 : BufferGetBlockNumber(stack->buffer));
228 : /* no match, so construct a new leaf entry */
229 689426 : itup = buildFreshLeafTuple(ginstate, attnum, key, category,
230 : items, nitem, buildStats, stack->buffer);
231 :
232 : /*
233 : * nEntries counts leaf tuples, so increment it only when we make a
234 : * new one.
235 : */
236 689426 : if (buildStats)
237 149146 : buildStats->nEntries++;
238 : }
239 :
240 : /* Insert the new or modified leaf tuple */
241 722102 : insertdata.entry = itup;
242 722102 : ginInsertValue(&btree, stack, &insertdata, buildStats);
243 722098 : pfree(itup);
244 : }
245 :
246 : /*
247 : * Extract index entries for a single indexable item, and add them to the
248 : * BuildAccumulator's state.
249 : *
250 : * This function is used only during initial index creation.
251 : */
252 : static void
253 869230 : ginHeapTupleBulkInsert(GinBuildState *buildstate, OffsetNumber attnum,
254 : Datum value, bool isNull,
255 : ItemPointer heapptr)
256 : {
257 : Datum *entries;
258 : GinNullCategory *categories;
259 : int32 nentries;
260 : MemoryContext oldCtx;
261 :
262 869230 : oldCtx = MemoryContextSwitchTo(buildstate->funcCtx);
263 869230 : entries = ginExtractEntries(buildstate->accum.ginstate, attnum,
264 : value, isNull,
265 : &nentries, &categories);
266 869230 : MemoryContextSwitchTo(oldCtx);
267 :
268 869230 : ginInsertBAEntries(&buildstate->accum, heapptr, attnum,
269 : entries, categories, nentries);
270 :
271 869230 : buildstate->indtuples += nentries;
272 :
273 869230 : MemoryContextReset(buildstate->funcCtx);
274 869230 : }
275 :
276 : static void
277 868612 : ginBuildCallback(Relation index, ItemPointer tid, Datum *values,
278 : bool *isnull, bool tupleIsAlive, void *state)
279 : {
280 868612 : GinBuildState *buildstate = (GinBuildState *) state;
281 : MemoryContext oldCtx;
282 : int i;
283 :
284 868612 : oldCtx = MemoryContextSwitchTo(buildstate->tmpCtx);
285 :
286 1737842 : for (i = 0; i < buildstate->ginstate.origTupdesc->natts; i++)
287 869230 : ginHeapTupleBulkInsert(buildstate, (OffsetNumber) (i + 1),
288 869230 : values[i], isnull[i], tid);
289 :
290 : /* If we've maxed out our available memory, dump everything to the index */
291 868612 : if (buildstate->accum.allocatedMemory >= (Size) maintenance_work_mem * 1024L)
292 : {
293 : ItemPointerData *list;
294 : Datum key;
295 : GinNullCategory category;
296 : uint32 nlist;
297 : OffsetNumber attnum;
298 :
299 0 : ginBeginBAScan(&buildstate->accum);
300 0 : while ((list = ginGetBAEntry(&buildstate->accum,
301 : &attnum, &key, &category, &nlist)) != NULL)
302 : {
303 : /* there could be many entries, so be willing to abort here */
304 0 : CHECK_FOR_INTERRUPTS();
305 0 : ginEntryInsert(&buildstate->ginstate, attnum, key, category,
306 : list, nlist, &buildstate->buildStats);
307 : }
308 :
309 0 : MemoryContextReset(buildstate->tmpCtx);
310 0 : ginInitBA(&buildstate->accum);
311 : }
312 :
313 868612 : MemoryContextSwitchTo(oldCtx);
314 868612 : }
315 :
316 : IndexBuildResult *
317 314 : ginbuild(Relation heap, Relation index, IndexInfo *indexInfo)
318 : {
319 : IndexBuildResult *result;
320 : double reltuples;
321 : GinBuildState buildstate;
322 : Buffer RootBuffer,
323 : MetaBuffer;
324 : ItemPointerData *list;
325 : Datum key;
326 : GinNullCategory category;
327 : uint32 nlist;
328 : MemoryContext oldCtx;
329 : OffsetNumber attnum;
330 :
331 314 : if (RelationGetNumberOfBlocks(index) != 0)
332 0 : elog(ERROR, "index \"%s\" already contains data",
333 : RelationGetRelationName(index));
334 :
335 314 : initGinState(&buildstate.ginstate, index);
336 314 : buildstate.indtuples = 0;
337 314 : memset(&buildstate.buildStats, 0, sizeof(GinStatsData));
338 :
339 : /* initialize the meta page */
340 314 : MetaBuffer = GinNewBuffer(index);
341 :
342 : /* initialize the root page */
343 314 : RootBuffer = GinNewBuffer(index);
344 :
345 314 : START_CRIT_SECTION();
346 314 : GinInitMetabuffer(MetaBuffer);
347 314 : MarkBufferDirty(MetaBuffer);
348 314 : GinInitBuffer(RootBuffer, GIN_LEAF);
349 314 : MarkBufferDirty(RootBuffer);
350 :
351 :
352 314 : UnlockReleaseBuffer(MetaBuffer);
353 314 : UnlockReleaseBuffer(RootBuffer);
354 314 : END_CRIT_SECTION();
355 :
356 : /* count the root as first entry page */
357 314 : buildstate.buildStats.nEntryPages++;
358 :
359 : /*
360 : * create a temporary memory context that is used to hold data not yet
361 : * dumped out to the index
362 : */
363 314 : buildstate.tmpCtx = AllocSetContextCreate(CurrentMemoryContext,
364 : "Gin build temporary context",
365 : ALLOCSET_DEFAULT_SIZES);
366 :
367 : /*
368 : * create a temporary memory context that is used for calling
369 : * ginExtractEntries(), and can be reset after each tuple
370 : */
371 314 : buildstate.funcCtx = AllocSetContextCreate(CurrentMemoryContext,
372 : "Gin build temporary context for user-defined function",
373 : ALLOCSET_DEFAULT_SIZES);
374 :
375 314 : buildstate.accum.ginstate = &buildstate.ginstate;
376 314 : ginInitBA(&buildstate.accum);
377 :
378 : /*
379 : * Do the heap scan. We disallow sync scan here because dataPlaceToPage
380 : * prefers to receive tuples in TID order.
381 : */
382 314 : reltuples = table_index_build_scan(heap, index, indexInfo, false, true,
383 : ginBuildCallback, &buildstate, NULL);
384 :
385 : /* dump remaining entries to the index */
386 314 : oldCtx = MemoryContextSwitchTo(buildstate.tmpCtx);
387 314 : ginBeginBAScan(&buildstate.accum);
388 149460 : while ((list = ginGetBAEntry(&buildstate.accum,
389 : &attnum, &key, &category, &nlist)) != NULL)
390 : {
391 : /* there could be many entries, so be willing to abort here */
392 149146 : CHECK_FOR_INTERRUPTS();
393 149146 : ginEntryInsert(&buildstate.ginstate, attnum, key, category,
394 : list, nlist, &buildstate.buildStats);
395 : }
396 314 : MemoryContextSwitchTo(oldCtx);
397 :
398 314 : MemoryContextDelete(buildstate.funcCtx);
399 314 : MemoryContextDelete(buildstate.tmpCtx);
400 :
401 : /*
402 : * Update metapage stats
403 : */
404 314 : buildstate.buildStats.nTotalPages = RelationGetNumberOfBlocks(index);
405 314 : ginUpdateStats(index, &buildstate.buildStats, true);
406 :
407 : /*
408 : * We didn't write WAL records as we built the index, so if WAL-logging is
409 : * required, write all pages to the WAL now.
410 : */
411 314 : if (RelationNeedsWAL(index))
412 : {
413 190 : log_newpage_range(index, MAIN_FORKNUM,
414 : 0, RelationGetNumberOfBlocks(index),
415 : true);
416 : }
417 :
418 : /*
419 : * Return statistics
420 : */
421 314 : result = (IndexBuildResult *) palloc(sizeof(IndexBuildResult));
422 :
423 314 : result->heap_tuples = reltuples;
424 314 : result->index_tuples = buildstate.indtuples;
425 :
426 314 : return result;
427 : }
428 :
429 : /*
430 : * ginbuildempty() -- build an empty gin index in the initialization fork
431 : */
432 : void
433 6 : ginbuildempty(Relation index)
434 : {
435 : Buffer RootBuffer,
436 : MetaBuffer;
437 :
438 : /* An empty GIN index has two pages. */
439 6 : MetaBuffer = ExtendBufferedRel(BMR_REL(index), INIT_FORKNUM, NULL,
440 : EB_LOCK_FIRST | EB_SKIP_EXTENSION_LOCK);
441 6 : RootBuffer = ExtendBufferedRel(BMR_REL(index), INIT_FORKNUM, NULL,
442 : EB_LOCK_FIRST | EB_SKIP_EXTENSION_LOCK);
443 :
444 : /* Initialize and xlog metabuffer and root buffer. */
445 6 : START_CRIT_SECTION();
446 6 : GinInitMetabuffer(MetaBuffer);
447 6 : MarkBufferDirty(MetaBuffer);
448 6 : log_newpage_buffer(MetaBuffer, true);
449 6 : GinInitBuffer(RootBuffer, GIN_LEAF);
450 6 : MarkBufferDirty(RootBuffer);
451 6 : log_newpage_buffer(RootBuffer, false);
452 6 : END_CRIT_SECTION();
453 :
454 : /* Unlock and release the buffers. */
455 6 : UnlockReleaseBuffer(MetaBuffer);
456 6 : UnlockReleaseBuffer(RootBuffer);
457 6 : }
458 :
459 : /*
460 : * Insert index entries for a single indexable item during "normal"
461 : * (non-fast-update) insertion
462 : */
463 : static void
464 33896 : ginHeapTupleInsert(GinState *ginstate, OffsetNumber attnum,
465 : Datum value, bool isNull,
466 : ItemPointer item)
467 : {
468 : Datum *entries;
469 : GinNullCategory *categories;
470 : int32 i,
471 : nentries;
472 :
473 33896 : entries = ginExtractEntries(ginstate, attnum, value, isNull,
474 : &nentries, &categories);
475 :
476 290142 : for (i = 0; i < nentries; i++)
477 256266 : ginEntryInsert(ginstate, attnum, entries[i], categories[i],
478 : item, 1, NULL);
479 33876 : }
480 :
481 : bool
482 298846 : gininsert(Relation index, Datum *values, bool *isnull,
483 : ItemPointer ht_ctid, Relation heapRel,
484 : IndexUniqueCheck checkUnique,
485 : bool indexUnchanged,
486 : IndexInfo *indexInfo)
487 : {
488 298846 : GinState *ginstate = (GinState *) indexInfo->ii_AmCache;
489 : MemoryContext oldCtx;
490 : MemoryContext insertCtx;
491 : int i;
492 :
493 : /* Initialize GinState cache if first call in this statement */
494 298846 : if (ginstate == NULL)
495 : {
496 2006 : oldCtx = MemoryContextSwitchTo(indexInfo->ii_Context);
497 2006 : ginstate = (GinState *) palloc(sizeof(GinState));
498 2006 : initGinState(ginstate, index);
499 2006 : indexInfo->ii_AmCache = ginstate;
500 2006 : MemoryContextSwitchTo(oldCtx);
501 : }
502 :
503 298846 : insertCtx = AllocSetContextCreate(CurrentMemoryContext,
504 : "Gin insert temporary context",
505 : ALLOCSET_DEFAULT_SIZES);
506 :
507 298846 : oldCtx = MemoryContextSwitchTo(insertCtx);
508 :
509 298846 : if (GinGetUseFastUpdate(index))
510 264944 : {
511 : GinTupleCollector collector;
512 :
513 264950 : memset(&collector, 0, sizeof(GinTupleCollector));
514 :
515 649978 : for (i = 0; i < ginstate->origTupdesc->natts; i++)
516 385028 : ginHeapTupleFastCollect(ginstate, &collector,
517 385028 : (OffsetNumber) (i + 1),
518 385028 : values[i], isnull[i],
519 : ht_ctid);
520 :
521 264950 : ginHeapTupleFastInsert(ginstate, &collector);
522 : }
523 : else
524 : {
525 67772 : for (i = 0; i < ginstate->origTupdesc->natts; i++)
526 33896 : ginHeapTupleInsert(ginstate, (OffsetNumber) (i + 1),
527 33896 : values[i], isnull[i],
528 : ht_ctid);
529 : }
530 :
531 298820 : MemoryContextSwitchTo(oldCtx);
532 298820 : MemoryContextDelete(insertCtx);
533 :
534 298820 : return false;
535 : }
|