LCOV - code coverage report
Current view: top level - src/backend/access/gin - ginscan.c (source / functions) Hit Total Coverage
Test: PostgreSQL 19devel Lines: 190 201 94.5 %
Date: 2026-02-02 14:17:46 Functions: 8 8 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*-------------------------------------------------------------------------
       2             :  *
       3             :  * ginscan.c
       4             :  *    routines to manage scans of inverted index relations
       5             :  *
       6             :  *
       7             :  * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
       8             :  * Portions Copyright (c) 1994, Regents of the University of California
       9             :  *
      10             :  * IDENTIFICATION
      11             :  *          src/backend/access/gin/ginscan.c
      12             :  *-------------------------------------------------------------------------
      13             :  */
      14             : 
      15             : #include "postgres.h"
      16             : 
      17             : #include "access/gin_private.h"
      18             : #include "access/relscan.h"
      19             : #include "executor/instrument_node.h"
      20             : #include "pgstat.h"
      21             : #include "utils/memutils.h"
      22             : #include "utils/rel.h"
      23             : 
      24             : 
      25             : IndexScanDesc
      26        1948 : ginbeginscan(Relation rel, int nkeys, int norderbys)
      27             : {
      28             :     IndexScanDesc scan;
      29             :     GinScanOpaque so;
      30             : 
      31             :     /* no order by operators allowed */
      32             :     Assert(norderbys == 0);
      33             : 
      34        1948 :     scan = RelationGetIndexScan(rel, nkeys, norderbys);
      35             : 
      36             :     /* allocate private workspace */
      37        1948 :     so = (GinScanOpaque) palloc_object(GinScanOpaqueData);
      38        1948 :     so->keys = NULL;
      39        1948 :     so->nkeys = 0;
      40        1948 :     so->tempCtx = AllocSetContextCreate(CurrentMemoryContext,
      41             :                                         "Gin scan temporary context",
      42             :                                         ALLOCSET_DEFAULT_SIZES);
      43        1948 :     so->keyCtx = AllocSetContextCreate(CurrentMemoryContext,
      44             :                                        "Gin scan key context",
      45             :                                        ALLOCSET_DEFAULT_SIZES);
      46        1948 :     initGinState(&so->ginstate, scan->indexRelation);
      47             : 
      48        1948 :     scan->opaque = so;
      49             : 
      50        1948 :     return scan;
      51             : }
      52             : 
      53             : /*
      54             :  * Create a new GinScanEntry, unless an equivalent one already exists,
      55             :  * in which case just return it
      56             :  */
      57             : static GinScanEntry
      58        7076 : ginFillScanEntry(GinScanOpaque so, OffsetNumber attnum,
      59             :                  StrategyNumber strategy, int32 searchMode,
      60             :                  Datum queryKey, GinNullCategory queryCategory,
      61             :                  bool isPartialMatch, Pointer extra_data)
      62             : {
      63        7076 :     GinState   *ginstate = &so->ginstate;
      64             :     GinScanEntry scanEntry;
      65             :     uint32      i;
      66             : 
      67             :     /*
      68             :      * Look for an existing equivalent entry.
      69             :      *
      70             :      * Entries with non-null extra_data are never considered identical, since
      71             :      * we can't know exactly what the opclass might be doing with that.
      72             :      *
      73             :      * Also, give up de-duplication once we have 100 entries.  That avoids
      74             :      * spending O(N^2) time on probably-fruitless de-duplication of large
      75             :      * search-key sets.  The threshold of 100 is arbitrary but matches
      76             :      * predtest.c's threshold for what's a large array.
      77             :      */
      78        7076 :     if (extra_data == NULL && so->totalentries < 100)
      79             :     {
      80       56134 :         for (i = 0; i < so->totalentries; i++)
      81             :         {
      82       53090 :             GinScanEntry prevEntry = so->entries[i];
      83             : 
      84       53090 :             if (prevEntry->extra_data == NULL &&
      85       52790 :                 prevEntry->isPartialMatch == isPartialMatch &&
      86       52790 :                 prevEntry->strategy == strategy &&
      87       52650 :                 prevEntry->searchMode == searchMode &&
      88      105276 :                 prevEntry->attnum == attnum &&
      89       52626 :                 ginCompareEntries(ginstate, attnum,
      90             :                                   prevEntry->queryKey,
      91       52626 :                                   prevEntry->queryCategory,
      92             :                                   queryKey,
      93             :                                   queryCategory) == 0)
      94             :             {
      95             :                 /* Successful match */
      96           0 :                 return prevEntry;
      97             :             }
      98             :         }
      99             :     }
     100             : 
     101             :     /* Nope, create a new entry */
     102        7076 :     scanEntry = palloc_object(GinScanEntryData);
     103        7076 :     scanEntry->queryKey = queryKey;
     104        7076 :     scanEntry->queryCategory = queryCategory;
     105        7076 :     scanEntry->isPartialMatch = isPartialMatch;
     106        7076 :     scanEntry->extra_data = extra_data;
     107        7076 :     scanEntry->strategy = strategy;
     108        7076 :     scanEntry->searchMode = searchMode;
     109        7076 :     scanEntry->attnum = attnum;
     110             : 
     111        7076 :     scanEntry->buffer = InvalidBuffer;
     112        7076 :     ItemPointerSetMin(&scanEntry->curItem);
     113        7076 :     scanEntry->matchBitmap = NULL;
     114        7076 :     scanEntry->matchIterator = NULL;
     115        7076 :     scanEntry->matchResult.blockno = InvalidBlockNumber;
     116        7076 :     scanEntry->matchNtuples = -1;
     117        7076 :     scanEntry->list = NULL;
     118        7076 :     scanEntry->nlist = 0;
     119        7076 :     scanEntry->offset = InvalidOffsetNumber;
     120        7076 :     scanEntry->isFinished = false;
     121        7076 :     scanEntry->reduceResult = false;
     122             : 
     123             :     /* Add it to so's array */
     124        7076 :     if (so->totalentries >= so->allocentries)
     125             :     {
     126          46 :         so->allocentries *= 2;
     127          46 :         so->entries = repalloc_array(so->entries, GinScanEntry, so->allocentries);
     128             :     }
     129        7076 :     so->entries[so->totalentries++] = scanEntry;
     130             : 
     131        7076 :     return scanEntry;
     132             : }
     133             : 
     134             : /*
     135             :  * Append hidden scan entry of given category to the scan key.
     136             :  *
     137             :  * NB: this had better be called at most once per scan key, since
     138             :  * ginFillScanKey leaves room for only one hidden entry.  Currently,
     139             :  * it seems sufficiently clear that this is true that we don't bother
     140             :  * with any cross-check logic.
     141             :  */
     142             : static void
     143         326 : ginScanKeyAddHiddenEntry(GinScanOpaque so, GinScanKey key,
     144             :                          GinNullCategory queryCategory)
     145             : {
     146         326 :     int         i = key->nentries++;
     147             : 
     148             :     /* strategy is of no interest because this is not a partial-match item */
     149         326 :     key->scanEntry[i] = ginFillScanEntry(so, key->attnum,
     150             :                                          InvalidStrategy, key->searchMode,
     151             :                                          (Datum) 0, queryCategory,
     152             :                                          false, NULL);
     153         326 : }
     154             : 
     155             : /*
     156             :  * Initialize the next GinScanKey using the output from the extractQueryFn
     157             :  */
     158             : static void
     159        2074 : ginFillScanKey(GinScanOpaque so, OffsetNumber attnum,
     160             :                StrategyNumber strategy, int32 searchMode,
     161             :                Datum query, uint32 nQueryValues,
     162             :                Datum *queryValues, GinNullCategory *queryCategories,
     163             :                bool *partial_matches, Pointer *extra_data)
     164             : {
     165        2074 :     GinScanKey  key = &(so->keys[so->nkeys++]);
     166        2074 :     GinState   *ginstate = &so->ginstate;
     167             :     uint32      i;
     168             : 
     169        2074 :     key->nentries = nQueryValues;
     170        2074 :     key->nuserentries = nQueryValues;
     171             : 
     172             :     /* Allocate one extra array slot for possible "hidden" entry */
     173        2074 :     key->scanEntry = palloc_array(GinScanEntry, nQueryValues + 1);
     174        2074 :     key->entryRes = palloc0_array(GinTernaryValue, nQueryValues + 1);
     175             : 
     176        2074 :     key->query = query;
     177        2074 :     key->queryValues = queryValues;
     178        2074 :     key->queryCategories = queryCategories;
     179        2074 :     key->extra_data = extra_data;
     180        2074 :     key->strategy = strategy;
     181        2074 :     key->searchMode = searchMode;
     182        2074 :     key->attnum = attnum;
     183             : 
     184             :     /*
     185             :      * Initially, scan keys of GIN_SEARCH_MODE_ALL mode are marked
     186             :      * excludeOnly.  This might get changed later.
     187             :      */
     188        2074 :     key->excludeOnly = (searchMode == GIN_SEARCH_MODE_ALL);
     189             : 
     190        2074 :     ItemPointerSetMin(&key->curItem);
     191        2074 :     key->curItemMatches = false;
     192        2074 :     key->recheckCurItem = false;
     193        2074 :     key->isFinished = false;
     194        2074 :     key->nrequired = 0;
     195        2074 :     key->nadditional = 0;
     196        2074 :     key->requiredEntries = NULL;
     197        2074 :     key->additionalEntries = NULL;
     198             : 
     199        2074 :     ginInitConsistentFunction(ginstate, key);
     200             : 
     201             :     /* Set up normal scan entries using extractQueryFn's outputs */
     202        8824 :     for (i = 0; i < nQueryValues; i++)
     203             :     {
     204             :         Datum       queryKey;
     205             :         GinNullCategory queryCategory;
     206             :         bool        isPartialMatch;
     207             :         Pointer     this_extra;
     208             : 
     209        6750 :         queryKey = queryValues[i];
     210        6750 :         queryCategory = queryCategories[i];
     211        6750 :         isPartialMatch =
     212        6750 :             (ginstate->canPartialMatch[attnum - 1] && partial_matches)
     213        6750 :             ? partial_matches[i] : false;
     214        6750 :         this_extra = (extra_data) ? extra_data[i] : NULL;
     215             : 
     216        6750 :         key->scanEntry[i] = ginFillScanEntry(so, attnum,
     217             :                                              strategy, searchMode,
     218             :                                              queryKey, queryCategory,
     219             :                                              isPartialMatch, this_extra);
     220             :     }
     221             : 
     222             :     /*
     223             :      * For GIN_SEARCH_MODE_INCLUDE_EMPTY and GIN_SEARCH_MODE_EVERYTHING search
     224             :      * modes, we add the "hidden" entry immediately.  GIN_SEARCH_MODE_ALL is
     225             :      * handled later, since we might be able to omit the hidden entry for it.
     226             :      */
     227        2074 :     if (searchMode == GIN_SEARCH_MODE_INCLUDE_EMPTY)
     228          44 :         ginScanKeyAddHiddenEntry(so, key, GIN_CAT_EMPTY_ITEM);
     229        2030 :     else if (searchMode == GIN_SEARCH_MODE_EVERYTHING)
     230           0 :         ginScanKeyAddHiddenEntry(so, key, GIN_CAT_EMPTY_QUERY);
     231        2074 : }
     232             : 
     233             : /*
     234             :  * Release current scan keys, if any.
     235             :  */
     236             : void
     237        5856 : ginFreeScanKeys(GinScanOpaque so)
     238             : {
     239             :     uint32      i;
     240             : 
     241        5856 :     if (so->keys == NULL)
     242        3902 :         return;
     243             : 
     244        9030 :     for (i = 0; i < so->totalentries; i++)
     245             :     {
     246        7076 :         GinScanEntry entry = so->entries[i];
     247             : 
     248        7076 :         if (entry->buffer != InvalidBuffer)
     249           0 :             ReleaseBuffer(entry->buffer);
     250        7076 :         if (entry->list)
     251        4454 :             pfree(entry->list);
     252        7076 :         if (entry->matchIterator)
     253           0 :             tbm_end_private_iterate(entry->matchIterator);
     254        7076 :         if (entry->matchBitmap)
     255         880 :             tbm_free(entry->matchBitmap);
     256             :     }
     257             : 
     258        1954 :     MemoryContextReset(so->keyCtx);
     259             : 
     260        1954 :     so->keys = NULL;
     261        1954 :     so->nkeys = 0;
     262        1954 :     so->entries = NULL;
     263        1954 :     so->totalentries = 0;
     264             : }
     265             : 
     266             : void
     267        1954 : ginNewScanKey(IndexScanDesc scan)
     268             : {
     269        1954 :     ScanKey     scankey = scan->keyData;
     270        1954 :     GinScanOpaque so = (GinScanOpaque) scan->opaque;
     271             :     int         i;
     272             :     int         numExcludeOnly;
     273        1954 :     bool        hasNullQuery = false;
     274        1954 :     bool        attrHasNormalScan[INDEX_MAX_KEYS] = {false};
     275             :     MemoryContext oldCtx;
     276             : 
     277             :     /*
     278             :      * Allocate all the scan key information in the key context. (If
     279             :      * extractQuery leaks anything there, it won't be reset until the end of
     280             :      * scan or rescan, but that's OK.)
     281             :      */
     282        1954 :     oldCtx = MemoryContextSwitchTo(so->keyCtx);
     283             : 
     284             :     /* if no scan keys provided, allocate extra EVERYTHING GinScanKey */
     285        1954 :     so->keys = (GinScanKey)
     286        1954 :         palloc(Max(scan->numberOfKeys, 1) * sizeof(GinScanKeyData));
     287        1954 :     so->nkeys = 0;
     288             : 
     289             :     /* initialize expansible array of GinScanEntry pointers */
     290        1954 :     so->totalentries = 0;
     291        1954 :     so->allocentries = 32;
     292        1954 :     so->entries = (GinScanEntry *)
     293        1954 :         palloc(so->allocentries * sizeof(GinScanEntry));
     294             : 
     295        1954 :     so->isVoidRes = false;
     296             : 
     297        4028 :     for (i = 0; i < scan->numberOfKeys; i++)
     298             :     {
     299        2086 :         ScanKey     skey = &scankey[i];
     300             :         Datum      *queryValues;
     301        2086 :         int32       nQueryValues = 0;
     302        2086 :         bool       *partial_matches = NULL;
     303        2086 :         Pointer    *extra_data = NULL;
     304        2086 :         bool       *nullFlags = NULL;
     305             :         GinNullCategory *categories;
     306        2086 :         int32       searchMode = GIN_SEARCH_MODE_DEFAULT;
     307             : 
     308             :         /*
     309             :          * We assume that GIN-indexable operators are strict, so a null query
     310             :          * argument means an unsatisfiable query.
     311             :          */
     312        2086 :         if (skey->sk_flags & SK_ISNULL)
     313             :         {
     314           0 :             so->isVoidRes = true;
     315          12 :             break;
     316             :         }
     317             : 
     318             :         /* OK to call the extractQueryFn */
     319             :         queryValues = (Datum *)
     320        6258 :             DatumGetPointer(FunctionCall7Coll(&so->ginstate.extractQueryFn[skey->sk_attno - 1],
     321        2086 :                                               so->ginstate.supportCollation[skey->sk_attno - 1],
     322             :                                               skey->sk_argument,
     323             :                                               PointerGetDatum(&nQueryValues),
     324        2086 :                                               UInt16GetDatum(skey->sk_strategy),
     325             :                                               PointerGetDatum(&partial_matches),
     326             :                                               PointerGetDatum(&extra_data),
     327             :                                               PointerGetDatum(&nullFlags),
     328             :                                               PointerGetDatum(&searchMode)));
     329             : 
     330             :         /*
     331             :          * If bogus searchMode is returned, treat as GIN_SEARCH_MODE_ALL; note
     332             :          * in particular we don't allow extractQueryFn to select
     333             :          * GIN_SEARCH_MODE_EVERYTHING.
     334             :          */
     335        2086 :         if (searchMode < GIN_SEARCH_MODE_DEFAULT ||
     336        2086 :             searchMode > GIN_SEARCH_MODE_ALL)
     337           0 :             searchMode = GIN_SEARCH_MODE_ALL;
     338             : 
     339             :         /* Non-default modes require the index to have placeholders */
     340        2086 :         if (searchMode != GIN_SEARCH_MODE_DEFAULT)
     341         368 :             hasNullQuery = true;
     342             : 
     343             :         /*
     344             :          * In default mode, no keys means an unsatisfiable query.
     345             :          */
     346        2086 :         if (queryValues == NULL || nQueryValues <= 0)
     347             :         {
     348         308 :             if (searchMode == GIN_SEARCH_MODE_DEFAULT)
     349             :             {
     350          12 :                 so->isVoidRes = true;
     351          12 :                 break;
     352             :             }
     353         296 :             nQueryValues = 0;   /* ensure sane value */
     354             :         }
     355             : 
     356             :         /*
     357             :          * Create GinNullCategory representation.  If the extractQueryFn
     358             :          * didn't create a nullFlags array, we assume everything is non-null.
     359             :          * While at it, detect whether any null keys are present.
     360             :          */
     361        2074 :         categories = (GinNullCategory *) palloc0(nQueryValues * sizeof(GinNullCategory));
     362        2074 :         if (nullFlags)
     363             :         {
     364             :             int32       j;
     365             : 
     366        4034 :             for (j = 0; j < nQueryValues; j++)
     367             :             {
     368        3464 :                 if (nullFlags[j])
     369             :                 {
     370           0 :                     categories[j] = GIN_CAT_NULL_KEY;
     371           0 :                     hasNullQuery = true;
     372             :                 }
     373             :             }
     374             :         }
     375             : 
     376        2074 :         ginFillScanKey(so, skey->sk_attno,
     377        2074 :                        skey->sk_strategy, searchMode,
     378             :                        skey->sk_argument, nQueryValues,
     379             :                        queryValues, categories,
     380             :                        partial_matches, extra_data);
     381             : 
     382             :         /* Remember if we had any non-excludeOnly keys */
     383        2074 :         if (searchMode != GIN_SEARCH_MODE_ALL)
     384        1750 :             attrHasNormalScan[skey->sk_attno - 1] = true;
     385             :     }
     386             : 
     387             :     /*
     388             :      * Processing GIN_SEARCH_MODE_ALL scan keys requires us to make a second
     389             :      * pass over the scan keys.  Above we marked each such scan key as
     390             :      * excludeOnly.  If the involved column has any normal (not excludeOnly)
     391             :      * scan key as well, then we can leave it like that.  Otherwise, one
     392             :      * excludeOnly scan key must receive a GIN_CAT_EMPTY_QUERY hidden entry
     393             :      * and be set to normal (excludeOnly = false).
     394             :      */
     395        1954 :     numExcludeOnly = 0;
     396        4028 :     for (i = 0; i < so->nkeys; i++)
     397             :     {
     398        2074 :         GinScanKey  key = &so->keys[i];
     399             : 
     400        2074 :         if (key->searchMode != GIN_SEARCH_MODE_ALL)
     401        1750 :             continue;
     402             : 
     403         324 :         if (!attrHasNormalScan[key->attnum - 1])
     404             :         {
     405         282 :             key->excludeOnly = false;
     406         282 :             ginScanKeyAddHiddenEntry(so, key, GIN_CAT_EMPTY_QUERY);
     407         282 :             attrHasNormalScan[key->attnum - 1] = true;
     408             :         }
     409             :         else
     410          42 :             numExcludeOnly++;
     411             :     }
     412             : 
     413             :     /*
     414             :      * If we left any excludeOnly scan keys as-is, move them to the end of the
     415             :      * scan key array: they must appear after normal key(s).
     416             :      */
     417        1954 :     if (numExcludeOnly > 0)
     418             :     {
     419             :         GinScanKey  tmpkeys;
     420             :         int         iNormalKey;
     421             :         int         iExcludeOnly;
     422             : 
     423             :         /* We'd better have made at least one normal key */
     424             :         Assert(numExcludeOnly < so->nkeys);
     425             :         /* Make a temporary array to hold the re-ordered scan keys */
     426          42 :         tmpkeys = (GinScanKey) palloc(so->nkeys * sizeof(GinScanKeyData));
     427             :         /* Re-order the keys ... */
     428          42 :         iNormalKey = 0;
     429          42 :         iExcludeOnly = so->nkeys - numExcludeOnly;
     430         150 :         for (i = 0; i < so->nkeys; i++)
     431             :         {
     432         108 :             GinScanKey  key = &so->keys[i];
     433             : 
     434         108 :             if (key->excludeOnly)
     435             :             {
     436          42 :                 memcpy(tmpkeys + iExcludeOnly, key, sizeof(GinScanKeyData));
     437          42 :                 iExcludeOnly++;
     438             :             }
     439             :             else
     440             :             {
     441          66 :                 memcpy(tmpkeys + iNormalKey, key, sizeof(GinScanKeyData));
     442          66 :                 iNormalKey++;
     443             :             }
     444             :         }
     445             :         Assert(iNormalKey == so->nkeys - numExcludeOnly);
     446             :         Assert(iExcludeOnly == so->nkeys);
     447             :         /* ... and copy them back to so->keys[] */
     448          42 :         memcpy(so->keys, tmpkeys, so->nkeys * sizeof(GinScanKeyData));
     449          42 :         pfree(tmpkeys);
     450             :     }
     451             : 
     452             :     /*
     453             :      * If there are no regular scan keys, generate an EVERYTHING scankey to
     454             :      * drive a full-index scan.
     455             :      */
     456        1954 :     if (so->nkeys == 0 && !so->isVoidRes)
     457             :     {
     458           0 :         hasNullQuery = true;
     459           0 :         ginFillScanKey(so, FirstOffsetNumber,
     460             :                        InvalidStrategy, GIN_SEARCH_MODE_EVERYTHING,
     461             :                        (Datum) 0, 0,
     462             :                        NULL, NULL, NULL, NULL);
     463             :     }
     464             : 
     465             :     /*
     466             :      * If the index is version 0, it may be missing null and placeholder
     467             :      * entries, which would render searches for nulls and full-index scans
     468             :      * unreliable.  Throw an error if so.
     469             :      */
     470        1954 :     if (hasNullQuery && !so->isVoidRes)
     471             :     {
     472             :         GinStatsData ginStats;
     473             : 
     474         328 :         ginGetStats(scan->indexRelation, &ginStats);
     475         328 :         if (ginStats.ginVersion < 1)
     476           0 :             ereport(ERROR,
     477             :                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     478             :                      errmsg("old GIN indexes do not support whole-index scans nor searches for nulls"),
     479             :                      errhint("To fix this, do REINDEX INDEX \"%s\".",
     480             :                              RelationGetRelationName(scan->indexRelation))));
     481             :     }
     482             : 
     483        1954 :     MemoryContextSwitchTo(oldCtx);
     484             : 
     485        1954 :     pgstat_count_index_scan(scan->indexRelation);
     486        1954 :     if (scan->instrument)
     487        1954 :         scan->instrument->nsearches++;
     488        1954 : }
     489             : 
     490             : void
     491        1954 : ginrescan(IndexScanDesc scan, ScanKey scankey, int nscankeys,
     492             :           ScanKey orderbys, int norderbys)
     493             : {
     494        1954 :     GinScanOpaque so = (GinScanOpaque) scan->opaque;
     495             : 
     496        1954 :     ginFreeScanKeys(so);
     497             : 
     498        1954 :     if (scankey && scan->numberOfKeys > 0)
     499        1954 :         memcpy(scan->keyData, scankey, scan->numberOfKeys * sizeof(ScanKeyData));
     500        1954 : }
     501             : 
     502             : 
     503             : void
     504        1948 : ginendscan(IndexScanDesc scan)
     505             : {
     506        1948 :     GinScanOpaque so = (GinScanOpaque) scan->opaque;
     507             : 
     508        1948 :     ginFreeScanKeys(so);
     509             : 
     510        1948 :     MemoryContextDelete(so->tempCtx);
     511        1948 :     MemoryContextDelete(so->keyCtx);
     512             : 
     513        1948 :     pfree(so);
     514        1948 : }

Generated by: LCOV version 1.16