LCOV - code coverage report
Current view: top level - src/include/tsearch - ts_type.h (source / functions) Hit Total Coverage
Test: PostgreSQL 18devel Lines: 12 12 100.0 %
Date: 2024-11-21 08:14:44 Functions: 6 6 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*-------------------------------------------------------------------------
       2             :  *
       3             :  * ts_type.h
       4             :  *    Definitions for the tsvector and tsquery types
       5             :  *
       6             :  * Copyright (c) 1998-2024, PostgreSQL Global Development Group
       7             :  *
       8             :  * src/include/tsearch/ts_type.h
       9             :  *
      10             :  *-------------------------------------------------------------------------
      11             :  */
      12             : #ifndef _PG_TSTYPE_H_
      13             : #define _PG_TSTYPE_H_
      14             : 
      15             : #include "fmgr.h"
      16             : #include "utils/memutils.h"
      17             : 
      18             : 
      19             : /*
      20             :  * TSVector type.
      21             :  *
      22             :  * Structure of tsvector datatype:
      23             :  * 1) standard varlena header
      24             :  * 2) int32     size - number of lexemes (WordEntry array entries)
      25             :  * 3) Array of WordEntry - one per lexeme; must be sorted according to
      26             :  *              tsCompareString() (ie, memcmp of lexeme strings).
      27             :  *              WordEntry->pos gives the number of bytes from end of WordEntry
      28             :  *              array to start of lexeme's string, which is of length len.
      29             :  * 4) Per-lexeme data storage:
      30             :  *    lexeme string (not null-terminated)
      31             :  *    if haspos is true:
      32             :  *      padding byte if necessary to make the position data 2-byte aligned
      33             :  *      uint16          number of positions that follow
      34             :  *      WordEntryPos[]  positions
      35             :  *
      36             :  * The positions for each lexeme must be sorted.
      37             :  *
      38             :  * Note, tsvectorsend/recv believe that sizeof(WordEntry) == 4
      39             :  */
      40             : 
      41             : typedef struct
      42             : {
      43             :     uint32
      44             :                 haspos:1,
      45             :                 len:11,         /* MAX 2Kb */
      46             :                 pos:20;         /* MAX 1Mb */
      47             : } WordEntry;
      48             : 
      49             : #define MAXSTRLEN ( (1<<11) - 1)
      50             : #define MAXSTRPOS ( (1<<20) - 1)
      51             : 
      52             : extern int  compareWordEntryPos(const void *a, const void *b);
      53             : 
      54             : /*
      55             :  * Equivalent to
      56             :  * typedef struct {
      57             :  *      uint16
      58             :  *          weight:2,
      59             :  *          pos:14;
      60             :  * }
      61             :  */
      62             : 
      63             : typedef uint16 WordEntryPos;
      64             : 
      65             : typedef struct
      66             : {
      67             :     uint16      npos;
      68             :     WordEntryPos pos[FLEXIBLE_ARRAY_MEMBER];
      69             : } WordEntryPosVector;
      70             : 
      71             : /* WordEntryPosVector with exactly 1 entry */
      72             : typedef struct
      73             : {
      74             :     uint16      npos;
      75             :     WordEntryPos pos[1];
      76             : } WordEntryPosVector1;
      77             : 
      78             : 
      79             : #define WEP_GETWEIGHT(x)    ( (x) >> 14 )
      80             : #define WEP_GETPOS(x)       ( (x) & 0x3fff )
      81             : 
      82             : #define WEP_SETWEIGHT(x,v)  ( (x) = ( (v) << 14 ) | ( (x) & 0x3fff ) )
      83             : #define WEP_SETPOS(x,v)     ( (x) = ( (x) & 0xc000 ) | ( (v) & 0x3fff ) )
      84             : 
      85             : #define MAXENTRYPOS (1<<14)
      86             : #define MAXNUMPOS   (256)
      87             : #define LIMITPOS(x) ( ( (x) >= MAXENTRYPOS ) ? (MAXENTRYPOS-1) : (x) )
      88             : 
      89             : /* This struct represents a complete tsvector datum */
      90             : typedef struct
      91             : {
      92             :     int32       vl_len_;        /* varlena header (do not touch directly!) */
      93             :     int32       size;
      94             :     WordEntry   entries[FLEXIBLE_ARRAY_MEMBER];
      95             :     /* lexemes follow the entries[] array */
      96             : } TSVectorData;
      97             : 
      98             : typedef TSVectorData *TSVector;
      99             : 
     100             : #define DATAHDRSIZE (offsetof(TSVectorData, entries))
     101             : #define CALCDATASIZE(nentries, lenstr) (DATAHDRSIZE + (nentries) * sizeof(WordEntry) + (lenstr) )
     102             : 
     103             : /* pointer to start of a tsvector's WordEntry array */
     104             : #define ARRPTR(x)   ( (x)->entries )
     105             : 
     106             : /* pointer to start of a tsvector's lexeme storage */
     107             : #define STRPTR(x)   ( (char *) &(x)->entries[(x)->size] )
     108             : 
     109             : #define _POSVECPTR(x, e)    ((WordEntryPosVector *)(STRPTR(x) + SHORTALIGN((e)->pos + (e)->len)))
     110             : #define POSDATALEN(x,e) ( ( (e)->haspos ) ? (_POSVECPTR(x,e)->npos) : 0 )
     111             : #define POSDATAPTR(x,e) (_POSVECPTR(x,e)->pos)
     112             : 
     113             : /*
     114             :  * fmgr interface functions
     115             :  */
     116             : 
     117             : static inline TSVector
     118      246714 : DatumGetTSVector(Datum X)
     119             : {
     120      246714 :     return (TSVector) PG_DETOAST_DATUM(X);
     121             : }
     122             : 
     123             : static inline TSVector
     124          30 : DatumGetTSVectorCopy(Datum X)
     125             : {
     126          30 :     return (TSVector) PG_DETOAST_DATUM_COPY(X);
     127             : }
     128             : 
     129             : static inline Datum
     130        7598 : TSVectorGetDatum(const TSVectorData *X)
     131             : {
     132        7598 :     return PointerGetDatum(X);
     133             : }
     134             : 
     135             : #define PG_GETARG_TSVECTOR(n)       DatumGetTSVector(PG_GETARG_DATUM(n))
     136             : #define PG_GETARG_TSVECTOR_COPY(n)  DatumGetTSVectorCopy(PG_GETARG_DATUM(n))
     137             : #define PG_RETURN_TSVECTOR(x)       return TSVectorGetDatum(x)
     138             : 
     139             : 
     140             : /*
     141             :  * TSQuery
     142             :  *
     143             :  *
     144             :  */
     145             : 
     146             : typedef int8 QueryItemType;
     147             : 
     148             : /* Valid values for QueryItemType: */
     149             : #define QI_VAL 1
     150             : #define QI_OPR 2
     151             : #define QI_VALSTOP 3            /* This is only used in an intermediate stack
     152             :                                  * representation in parse_tsquery. It's not a
     153             :                                  * legal type elsewhere. */
     154             : 
     155             : /*
     156             :  * QueryItem is one node in tsquery - operator or operand.
     157             :  */
     158             : typedef struct
     159             : {
     160             :     QueryItemType type;         /* operand or kind of operator (ts_tokentype) */
     161             :     uint8       weight;         /* weights of operand to search. It's a
     162             :                                  * bitmask of allowed weights. if it =0 then
     163             :                                  * any weight are allowed. Weights and bit
     164             :                                  * map: A: 1<<3 B: 1<<2 C: 1<<1 D: 1<<0 */
     165             :     bool        prefix;         /* true if it's a prefix search */
     166             :     int32       valcrc;         /* XXX: pg_crc32 would be a more appropriate
     167             :                                  * data type, but we use comparisons to signed
     168             :                                  * integers in the code. They would need to be
     169             :                                  * changed as well. */
     170             : 
     171             :     /* pointer to text value of operand, must correlate with WordEntry */
     172             :     uint32
     173             :                 length:12,
     174             :                 distance:20;
     175             : } QueryOperand;
     176             : 
     177             : 
     178             : /*
     179             :  * Legal values for QueryOperator.operator.
     180             :  */
     181             : #define OP_NOT          1
     182             : #define OP_AND          2
     183             : #define OP_OR           3
     184             : #define OP_PHRASE       4       /* highest code, tsquery_cleanup.c */
     185             : #define OP_COUNT        4
     186             : 
     187             : extern PGDLLIMPORT const int tsearch_op_priority[OP_COUNT];
     188             : 
     189             : /* get operation priority by its code */
     190             : #define OP_PRIORITY(x)  ( tsearch_op_priority[(x) - 1] )
     191             : /* get QueryOperator priority */
     192             : #define QO_PRIORITY(x)  OP_PRIORITY(((QueryOperator *) (x))->oper)
     193             : 
     194             : typedef struct
     195             : {
     196             :     QueryItemType type;
     197             :     int8        oper;           /* see above */
     198             :     int16       distance;       /* distance between agrs for OP_PHRASE */
     199             :     uint32      left;           /* pointer to left operand. Right operand is
     200             :                                  * item + 1, left operand is placed
     201             :                                  * item+item->left */
     202             : } QueryOperator;
     203             : 
     204             : /*
     205             :  * Note: TSQuery is 4-bytes aligned, so make sure there's no fields
     206             :  * inside QueryItem requiring 8-byte alignment, like int64.
     207             :  */
     208             : typedef union
     209             : {
     210             :     QueryItemType type;
     211             :     QueryOperator qoperator;
     212             :     QueryOperand qoperand;
     213             : } QueryItem;
     214             : 
     215             : /*
     216             :  * Storage:
     217             :  *  (len)(size)(array of QueryItem)(operands as '\0'-terminated c-strings)
     218             :  */
     219             : 
     220             : typedef struct
     221             : {
     222             :     int32       vl_len_;        /* varlena header (do not touch directly!) */
     223             :     int32       size;           /* number of QueryItems */
     224             :     char        data[FLEXIBLE_ARRAY_MEMBER];    /* data starts here */
     225             : } TSQueryData;
     226             : 
     227             : typedef TSQueryData *TSQuery;
     228             : 
     229             : #define HDRSIZETQ   ( VARHDRSZ + sizeof(int32) )
     230             : 
     231             : /* Computes the size of header and all QueryItems. size is the number of
     232             :  * QueryItems, and lenofoperand is the total length of all operands
     233             :  */
     234             : #define COMPUTESIZE(size, lenofoperand) ( HDRSIZETQ + (size) * sizeof(QueryItem) + (lenofoperand) )
     235             : #define TSQUERY_TOO_BIG(size, lenofoperand) \
     236             :     ((size) > (MaxAllocSize - HDRSIZETQ - (lenofoperand)) / sizeof(QueryItem))
     237             : 
     238             : /* Returns a pointer to the first QueryItem in a TSQuery */
     239             : #define GETQUERY(x)  ((QueryItem*)( (char*)(x)+HDRSIZETQ ))
     240             : 
     241             : /* Returns a pointer to the beginning of operands in a TSQuery */
     242             : #define GETOPERAND(x)   ( (char*)GETQUERY(x) + ((TSQuery)(x))->size * sizeof(QueryItem) )
     243             : 
     244             : /*
     245             :  * fmgr interface functions
     246             :  * Note, TSQuery type marked as plain storage, so it can't be toasted
     247             :  * but PG_DETOAST_DATUM_COPY is used for simplicity
     248             :  */
     249             : 
     250             : static inline TSQuery
     251      565556 : DatumGetTSQuery(Datum X)
     252             : {
     253      565556 :     return (TSQuery) DatumGetPointer(X);
     254             : }
     255             : 
     256             : static inline TSQuery
     257        1296 : DatumGetTSQueryCopy(Datum X)
     258             : {
     259        1296 :     return (TSQuery) PG_DETOAST_DATUM_COPY(X);
     260             : }
     261             : 
     262             : static inline Datum
     263        3914 : TSQueryGetDatum(const TSQueryData *X)
     264             : {
     265        3914 :     return PointerGetDatum(X);
     266             : }
     267             : 
     268             : #define PG_GETARG_TSQUERY(n)        DatumGetTSQuery(PG_GETARG_DATUM(n))
     269             : #define PG_GETARG_TSQUERY_COPY(n)   DatumGetTSQueryCopy(PG_GETARG_DATUM(n))
     270             : #define PG_RETURN_TSQUERY(x)        return TSQueryGetDatum(x)
     271             : 
     272             : #endif                          /* _PG_TSTYPE_H_ */

Generated by: LCOV version 1.14