LCOV - code coverage report
Current view: top level - src/backend/commands - indexcmds.c (source / functions) Hit Total Coverage
Test: PostgreSQL 17devel Lines: 1223 1334 91.7 %
Date: 2024-05-09 12:10:51 Functions: 26 26 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*-------------------------------------------------------------------------
       2             :  *
       3             :  * indexcmds.c
       4             :  *    POSTGRES define and remove index code.
       5             :  *
       6             :  * Portions Copyright (c) 1996-2024, PostgreSQL Global Development Group
       7             :  * Portions Copyright (c) 1994, Regents of the University of California
       8             :  *
       9             :  *
      10             :  * IDENTIFICATION
      11             :  *    src/backend/commands/indexcmds.c
      12             :  *
      13             :  *-------------------------------------------------------------------------
      14             :  */
      15             : 
      16             : #include "postgres.h"
      17             : 
      18             : #include "access/amapi.h"
      19             : #include "access/gist.h"
      20             : #include "access/heapam.h"
      21             : #include "access/htup_details.h"
      22             : #include "access/reloptions.h"
      23             : #include "access/sysattr.h"
      24             : #include "access/tableam.h"
      25             : #include "access/xact.h"
      26             : #include "catalog/catalog.h"
      27             : #include "catalog/index.h"
      28             : #include "catalog/indexing.h"
      29             : #include "catalog/namespace.h"
      30             : #include "catalog/pg_am.h"
      31             : #include "catalog/pg_authid.h"
      32             : #include "catalog/pg_constraint.h"
      33             : #include "catalog/pg_database.h"
      34             : #include "catalog/pg_inherits.h"
      35             : #include "catalog/pg_namespace.h"
      36             : #include "catalog/pg_opclass.h"
      37             : #include "catalog/pg_opfamily.h"
      38             : #include "catalog/pg_tablespace.h"
      39             : #include "catalog/pg_type.h"
      40             : #include "commands/comment.h"
      41             : #include "commands/dbcommands.h"
      42             : #include "commands/defrem.h"
      43             : #include "commands/event_trigger.h"
      44             : #include "commands/progress.h"
      45             : #include "commands/tablecmds.h"
      46             : #include "commands/tablespace.h"
      47             : #include "mb/pg_wchar.h"
      48             : #include "miscadmin.h"
      49             : #include "nodes/makefuncs.h"
      50             : #include "nodes/nodeFuncs.h"
      51             : #include "optimizer/optimizer.h"
      52             : #include "parser/parse_coerce.h"
      53             : #include "parser/parse_oper.h"
      54             : #include "partitioning/partdesc.h"
      55             : #include "pgstat.h"
      56             : #include "rewrite/rewriteManip.h"
      57             : #include "storage/lmgr.h"
      58             : #include "storage/proc.h"
      59             : #include "storage/procarray.h"
      60             : #include "storage/sinvaladt.h"
      61             : #include "utils/acl.h"
      62             : #include "utils/builtins.h"
      63             : #include "utils/fmgroids.h"
      64             : #include "utils/guc.h"
      65             : #include "utils/inval.h"
      66             : #include "utils/lsyscache.h"
      67             : #include "utils/memutils.h"
      68             : #include "utils/partcache.h"
      69             : #include "utils/pg_rusage.h"
      70             : #include "utils/regproc.h"
      71             : #include "utils/snapmgr.h"
      72             : #include "utils/syscache.h"
      73             : 
      74             : 
      75             : /* non-export function prototypes */
      76             : static bool CompareOpclassOptions(const Datum *opts1, const Datum *opts2, int natts);
      77             : static void CheckPredicate(Expr *predicate);
      78             : static void ComputeIndexAttrs(IndexInfo *indexInfo,
      79             :                               Oid *typeOids,
      80             :                               Oid *collationOids,
      81             :                               Oid *opclassOids,
      82             :                               Datum *opclassOptions,
      83             :                               int16 *colOptions,
      84             :                               const List *attList,
      85             :                               const List *exclusionOpNames,
      86             :                               Oid relId,
      87             :                               const char *accessMethodName,
      88             :                               Oid accessMethodId,
      89             :                               bool amcanorder,
      90             :                               bool isconstraint,
      91             :                               bool iswithoutoverlaps,
      92             :                               Oid ddl_userid,
      93             :                               int ddl_sec_context,
      94             :                               int *ddl_save_nestlevel);
      95             : static char *ChooseIndexName(const char *tabname, Oid namespaceId,
      96             :                              const List *colnames, const List *exclusionOpNames,
      97             :                              bool primary, bool isconstraint);
      98             : static char *ChooseIndexNameAddition(const List *colnames);
      99             : static List *ChooseIndexColumnNames(const List *indexElems);
     100             : static void ReindexIndex(const ReindexStmt *stmt, const ReindexParams *params,
     101             :                          bool isTopLevel);
     102             : static void RangeVarCallbackForReindexIndex(const RangeVar *relation,
     103             :                                             Oid relId, Oid oldRelId, void *arg);
     104             : static Oid  ReindexTable(const ReindexStmt *stmt, const ReindexParams *params,
     105             :                          bool isTopLevel);
     106             : static void ReindexMultipleTables(const ReindexStmt *stmt,
     107             :                                   const ReindexParams *params);
     108             : static void reindex_error_callback(void *arg);
     109             : static void ReindexPartitions(const ReindexStmt *stmt, Oid relid,
     110             :                               const ReindexParams *params, bool isTopLevel);
     111             : static void ReindexMultipleInternal(const ReindexStmt *stmt, const List *relids,
     112             :                                     const ReindexParams *params);
     113             : static bool ReindexRelationConcurrently(const ReindexStmt *stmt,
     114             :                                         Oid relationOid,
     115             :                                         const ReindexParams *params);
     116             : static void update_relispartition(Oid relationId, bool newval);
     117             : static inline void set_indexsafe_procflags(void);
     118             : 
     119             : /*
     120             :  * callback argument type for RangeVarCallbackForReindexIndex()
     121             :  */
     122             : struct ReindexIndexCallbackState
     123             : {
     124             :     ReindexParams params;       /* options from statement */
     125             :     Oid         locked_table_oid;   /* tracks previously locked table */
     126             : };
     127             : 
     128             : /*
     129             :  * callback arguments for reindex_error_callback()
     130             :  */
     131             : typedef struct ReindexErrorInfo
     132             : {
     133             :     char       *relname;
     134             :     char       *relnamespace;
     135             :     char        relkind;
     136             : } ReindexErrorInfo;
     137             : 
     138             : /*
     139             :  * CheckIndexCompatible
     140             :  *      Determine whether an existing index definition is compatible with a
     141             :  *      prospective index definition, such that the existing index storage
     142             :  *      could become the storage of the new index, avoiding a rebuild.
     143             :  *
     144             :  * 'oldId': the OID of the existing index
     145             :  * 'accessMethodName': name of the AM to use.
     146             :  * 'attributeList': a list of IndexElem specifying columns and expressions
     147             :  *      to index on.
     148             :  * 'exclusionOpNames': list of names of exclusion-constraint operators,
     149             :  *      or NIL if not an exclusion constraint.
     150             :  * 'isWithoutOverlaps': true iff this index has a WITHOUT OVERLAPS clause.
     151             :  *
     152             :  * This is tailored to the needs of ALTER TABLE ALTER TYPE, which recreates
     153             :  * any indexes that depended on a changing column from their pg_get_indexdef
     154             :  * or pg_get_constraintdef definitions.  We omit some of the sanity checks of
     155             :  * DefineIndex.  We assume that the old and new indexes have the same number
     156             :  * of columns and that if one has an expression column or predicate, both do.
     157             :  * Errors arising from the attribute list still apply.
     158             :  *
     159             :  * Most column type changes that can skip a table rewrite do not invalidate
     160             :  * indexes.  We acknowledge this when all operator classes, collations and
     161             :  * exclusion operators match.  Though we could further permit intra-opfamily
     162             :  * changes for btree and hash indexes, that adds subtle complexity with no
     163             :  * concrete benefit for core types. Note, that INCLUDE columns aren't
     164             :  * checked by this function, for them it's enough that table rewrite is
     165             :  * skipped.
     166             :  *
     167             :  * When a comparison or exclusion operator has a polymorphic input type, the
     168             :  * actual input types must also match.  This defends against the possibility
     169             :  * that operators could vary behavior in response to get_fn_expr_argtype().
     170             :  * At present, this hazard is theoretical: check_exclusion_constraint() and
     171             :  * all core index access methods decline to set fn_expr for such calls.
     172             :  *
     173             :  * We do not yet implement a test to verify compatibility of expression
     174             :  * columns or predicates, so assume any such index is incompatible.
     175             :  */
     176             : bool
     177         102 : CheckIndexCompatible(Oid oldId,
     178             :                      const char *accessMethodName,
     179             :                      const List *attributeList,
     180             :                      const List *exclusionOpNames,
     181             :                      bool isWithoutOverlaps)
     182             : {
     183             :     bool        isconstraint;
     184             :     Oid        *typeIds;
     185             :     Oid        *collationIds;
     186             :     Oid        *opclassIds;
     187             :     Datum      *opclassOptions;
     188             :     Oid         accessMethodId;
     189             :     Oid         relationId;
     190             :     HeapTuple   tuple;
     191             :     Form_pg_index indexForm;
     192             :     Form_pg_am  accessMethodForm;
     193             :     IndexAmRoutine *amRoutine;
     194             :     bool        amcanorder;
     195             :     bool        amsummarizing;
     196             :     int16      *coloptions;
     197             :     IndexInfo  *indexInfo;
     198             :     int         numberOfAttributes;
     199             :     int         old_natts;
     200         102 :     bool        ret = true;
     201             :     oidvector  *old_indclass;
     202             :     oidvector  *old_indcollation;
     203             :     Relation    irel;
     204             :     int         i;
     205             :     Datum       d;
     206             : 
     207             :     /* Caller should already have the relation locked in some way. */
     208         102 :     relationId = IndexGetRelation(oldId, false);
     209             : 
     210             :     /*
     211             :      * We can pretend isconstraint = false unconditionally.  It only serves to
     212             :      * decide the text of an error message that should never happen for us.
     213             :      */
     214         102 :     isconstraint = false;
     215             : 
     216         102 :     numberOfAttributes = list_length(attributeList);
     217             :     Assert(numberOfAttributes > 0);
     218             :     Assert(numberOfAttributes <= INDEX_MAX_KEYS);
     219             : 
     220             :     /* look up the access method */
     221         102 :     tuple = SearchSysCache1(AMNAME, PointerGetDatum(accessMethodName));
     222         102 :     if (!HeapTupleIsValid(tuple))
     223           0 :         ereport(ERROR,
     224             :                 (errcode(ERRCODE_UNDEFINED_OBJECT),
     225             :                  errmsg("access method \"%s\" does not exist",
     226             :                         accessMethodName)));
     227         102 :     accessMethodForm = (Form_pg_am) GETSTRUCT(tuple);
     228         102 :     accessMethodId = accessMethodForm->oid;
     229         102 :     amRoutine = GetIndexAmRoutine(accessMethodForm->amhandler);
     230         102 :     ReleaseSysCache(tuple);
     231             : 
     232         102 :     amcanorder = amRoutine->amcanorder;
     233         102 :     amsummarizing = amRoutine->amsummarizing;
     234             : 
     235             :     /*
     236             :      * Compute the operator classes, collations, and exclusion operators for
     237             :      * the new index, so we can test whether it's compatible with the existing
     238             :      * one.  Note that ComputeIndexAttrs might fail here, but that's OK:
     239             :      * DefineIndex would have failed later.  Our attributeList contains only
     240             :      * key attributes, thus we're filling ii_NumIndexAttrs and
     241             :      * ii_NumIndexKeyAttrs with same value.
     242             :      */
     243         102 :     indexInfo = makeIndexInfo(numberOfAttributes, numberOfAttributes,
     244             :                               accessMethodId, NIL, NIL, false, false,
     245             :                               false, false, amsummarizing);
     246         102 :     typeIds = palloc_array(Oid, numberOfAttributes);
     247         102 :     collationIds = palloc_array(Oid, numberOfAttributes);
     248         102 :     opclassIds = palloc_array(Oid, numberOfAttributes);
     249         102 :     opclassOptions = palloc_array(Datum, numberOfAttributes);
     250         102 :     coloptions = palloc_array(int16, numberOfAttributes);
     251         102 :     ComputeIndexAttrs(indexInfo,
     252             :                       typeIds, collationIds, opclassIds, opclassOptions,
     253             :                       coloptions, attributeList,
     254             :                       exclusionOpNames, relationId,
     255             :                       accessMethodName, accessMethodId,
     256             :                       amcanorder, isconstraint, isWithoutOverlaps, InvalidOid,
     257             :                       0, NULL);
     258             : 
     259             :     /* Get the soon-obsolete pg_index tuple. */
     260         102 :     tuple = SearchSysCache1(INDEXRELID, ObjectIdGetDatum(oldId));
     261         102 :     if (!HeapTupleIsValid(tuple))
     262           0 :         elog(ERROR, "cache lookup failed for index %u", oldId);
     263         102 :     indexForm = (Form_pg_index) GETSTRUCT(tuple);
     264             : 
     265             :     /*
     266             :      * We don't assess expressions or predicates; assume incompatibility.
     267             :      * Also, if the index is invalid for any reason, treat it as incompatible.
     268             :      */
     269         204 :     if (!(heap_attisnull(tuple, Anum_pg_index_indpred, NULL) &&
     270         102 :           heap_attisnull(tuple, Anum_pg_index_indexprs, NULL) &&
     271         102 :           indexForm->indisvalid))
     272             :     {
     273           0 :         ReleaseSysCache(tuple);
     274           0 :         return false;
     275             :     }
     276             : 
     277             :     /* Any change in operator class or collation breaks compatibility. */
     278         102 :     old_natts = indexForm->indnkeyatts;
     279             :     Assert(old_natts == numberOfAttributes);
     280             : 
     281         102 :     d = SysCacheGetAttrNotNull(INDEXRELID, tuple, Anum_pg_index_indcollation);
     282         102 :     old_indcollation = (oidvector *) DatumGetPointer(d);
     283             : 
     284         102 :     d = SysCacheGetAttrNotNull(INDEXRELID, tuple, Anum_pg_index_indclass);
     285         102 :     old_indclass = (oidvector *) DatumGetPointer(d);
     286             : 
     287         204 :     ret = (memcmp(old_indclass->values, opclassIds, old_natts * sizeof(Oid)) == 0 &&
     288         102 :            memcmp(old_indcollation->values, collationIds, old_natts * sizeof(Oid)) == 0);
     289             : 
     290         102 :     ReleaseSysCache(tuple);
     291             : 
     292         102 :     if (!ret)
     293           0 :         return false;
     294             : 
     295             :     /* For polymorphic opcintype, column type changes break compatibility. */
     296         102 :     irel = index_open(oldId, AccessShareLock);  /* caller probably has a lock */
     297         210 :     for (i = 0; i < old_natts; i++)
     298             :     {
     299         108 :         if (IsPolymorphicType(get_opclass_input_type(opclassIds[i])) &&
     300           0 :             TupleDescAttr(irel->rd_att, i)->atttypid != typeIds[i])
     301             :         {
     302           0 :             ret = false;
     303           0 :             break;
     304             :         }
     305             :     }
     306             : 
     307             :     /* Any change in opclass options break compatibility. */
     308         102 :     if (ret)
     309             :     {
     310         102 :         Datum      *oldOpclassOptions = palloc_array(Datum, old_natts);
     311             : 
     312         210 :         for (i = 0; i < old_natts; i++)
     313         108 :             oldOpclassOptions[i] = get_attoptions(oldId, i + 1);
     314             : 
     315         102 :         ret = CompareOpclassOptions(oldOpclassOptions, opclassOptions, old_natts);
     316             : 
     317         102 :         pfree(oldOpclassOptions);
     318             :     }
     319             : 
     320             :     /* Any change in exclusion operator selections breaks compatibility. */
     321         102 :     if (ret && indexInfo->ii_ExclusionOps != NULL)
     322             :     {
     323             :         Oid        *old_operators,
     324             :                    *old_procs;
     325             :         uint16     *old_strats;
     326             : 
     327           0 :         RelationGetExclusionInfo(irel, &old_operators, &old_procs, &old_strats);
     328           0 :         ret = memcmp(old_operators, indexInfo->ii_ExclusionOps,
     329             :                      old_natts * sizeof(Oid)) == 0;
     330             : 
     331             :         /* Require an exact input type match for polymorphic operators. */
     332           0 :         if (ret)
     333             :         {
     334           0 :             for (i = 0; i < old_natts && ret; i++)
     335             :             {
     336             :                 Oid         left,
     337             :                             right;
     338             : 
     339           0 :                 op_input_types(indexInfo->ii_ExclusionOps[i], &left, &right);
     340           0 :                 if ((IsPolymorphicType(left) || IsPolymorphicType(right)) &&
     341           0 :                     TupleDescAttr(irel->rd_att, i)->atttypid != typeIds[i])
     342             :                 {
     343           0 :                     ret = false;
     344           0 :                     break;
     345             :                 }
     346             :             }
     347             :         }
     348             :     }
     349             : 
     350         102 :     index_close(irel, NoLock);
     351         102 :     return ret;
     352             : }
     353             : 
     354             : /*
     355             :  * CompareOpclassOptions
     356             :  *
     357             :  * Compare per-column opclass options which are represented by arrays of text[]
     358             :  * datums.  Both elements of arrays and array themselves can be NULL.
     359             :  */
     360             : static bool
     361         102 : CompareOpclassOptions(const Datum *opts1, const Datum *opts2, int natts)
     362             : {
     363             :     int         i;
     364             : 
     365         102 :     if (!opts1 && !opts2)
     366           0 :         return true;
     367             : 
     368         210 :     for (i = 0; i < natts; i++)
     369             :     {
     370         108 :         Datum       opt1 = opts1 ? opts1[i] : (Datum) 0;
     371         108 :         Datum       opt2 = opts2 ? opts2[i] : (Datum) 0;
     372             : 
     373         108 :         if (opt1 == (Datum) 0)
     374             :         {
     375         108 :             if (opt2 == (Datum) 0)
     376         108 :                 continue;
     377             :             else
     378           0 :                 return false;
     379             :         }
     380           0 :         else if (opt2 == (Datum) 0)
     381           0 :             return false;
     382             : 
     383             :         /* Compare non-NULL text[] datums. */
     384           0 :         if (!DatumGetBool(DirectFunctionCall2(array_eq, opt1, opt2)))
     385           0 :             return false;
     386             :     }
     387             : 
     388         102 :     return true;
     389             : }
     390             : 
     391             : /*
     392             :  * WaitForOlderSnapshots
     393             :  *
     394             :  * Wait for transactions that might have an older snapshot than the given xmin
     395             :  * limit, because it might not contain tuples deleted just before it has
     396             :  * been taken. Obtain a list of VXIDs of such transactions, and wait for them
     397             :  * individually. This is used when building an index concurrently.
     398             :  *
     399             :  * We can exclude any running transactions that have xmin > the xmin given;
     400             :  * their oldest snapshot must be newer than our xmin limit.
     401             :  * We can also exclude any transactions that have xmin = zero, since they
     402             :  * evidently have no live snapshot at all (and any one they might be in
     403             :  * process of taking is certainly newer than ours).  Transactions in other
     404             :  * DBs can be ignored too, since they'll never even be able to see the
     405             :  * index being worked on.
     406             :  *
     407             :  * We can also exclude autovacuum processes and processes running manual
     408             :  * lazy VACUUMs, because they won't be fazed by missing index entries
     409             :  * either.  (Manual ANALYZEs, however, can't be excluded because they
     410             :  * might be within transactions that are going to do arbitrary operations
     411             :  * later.)  Processes running CREATE INDEX CONCURRENTLY or REINDEX CONCURRENTLY
     412             :  * on indexes that are neither expressional nor partial are also safe to
     413             :  * ignore, since we know that those processes won't examine any data
     414             :  * outside the table they're indexing.
     415             :  *
     416             :  * Also, GetCurrentVirtualXIDs never reports our own vxid, so we need not
     417             :  * check for that.
     418             :  *
     419             :  * If a process goes idle-in-transaction with xmin zero, we do not need to
     420             :  * wait for it anymore, per the above argument.  We do not have the
     421             :  * infrastructure right now to stop waiting if that happens, but we can at
     422             :  * least avoid the folly of waiting when it is idle at the time we would
     423             :  * begin to wait.  We do this by repeatedly rechecking the output of
     424             :  * GetCurrentVirtualXIDs.  If, during any iteration, a particular vxid
     425             :  * doesn't show up in the output, we know we can forget about it.
     426             :  */
     427             : void
     428         628 : WaitForOlderSnapshots(TransactionId limitXmin, bool progress)
     429             : {
     430             :     int         n_old_snapshots;
     431             :     int         i;
     432             :     VirtualTransactionId *old_snapshots;
     433             : 
     434         628 :     old_snapshots = GetCurrentVirtualXIDs(limitXmin, true, false,
     435             :                                           PROC_IS_AUTOVACUUM | PROC_IN_VACUUM
     436             :                                           | PROC_IN_SAFE_IC,
     437             :                                           &n_old_snapshots);
     438         628 :     if (progress)
     439         614 :         pgstat_progress_update_param(PROGRESS_WAITFOR_TOTAL, n_old_snapshots);
     440             : 
     441         920 :     for (i = 0; i < n_old_snapshots; i++)
     442             :     {
     443         292 :         if (!VirtualTransactionIdIsValid(old_snapshots[i]))
     444          56 :             continue;           /* found uninteresting in previous cycle */
     445             : 
     446         236 :         if (i > 0)
     447             :         {
     448             :             /* see if anything's changed ... */
     449             :             VirtualTransactionId *newer_snapshots;
     450             :             int         n_newer_snapshots;
     451             :             int         j;
     452             :             int         k;
     453             : 
     454          68 :             newer_snapshots = GetCurrentVirtualXIDs(limitXmin,
     455             :                                                     true, false,
     456             :                                                     PROC_IS_AUTOVACUUM | PROC_IN_VACUUM
     457             :                                                     | PROC_IN_SAFE_IC,
     458             :                                                     &n_newer_snapshots);
     459         250 :             for (j = i; j < n_old_snapshots; j++)
     460             :             {
     461         182 :                 if (!VirtualTransactionIdIsValid(old_snapshots[j]))
     462          12 :                     continue;   /* found uninteresting in previous cycle */
     463         486 :                 for (k = 0; k < n_newer_snapshots; k++)
     464             :                 {
     465         392 :                     if (VirtualTransactionIdEquals(old_snapshots[j],
     466             :                                                    newer_snapshots[k]))
     467          76 :                         break;
     468             :                 }
     469         170 :                 if (k >= n_newer_snapshots) /* not there anymore */
     470          94 :                     SetInvalidVirtualTransactionId(old_snapshots[j]);
     471             :             }
     472          68 :             pfree(newer_snapshots);
     473             :         }
     474             : 
     475         236 :         if (VirtualTransactionIdIsValid(old_snapshots[i]))
     476             :         {
     477             :             /* If requested, publish who we're going to wait for. */
     478         198 :             if (progress)
     479             :             {
     480         198 :                 PGPROC     *holder = ProcNumberGetProc(old_snapshots[i].procNumber);
     481             : 
     482         198 :                 if (holder)
     483         198 :                     pgstat_progress_update_param(PROGRESS_WAITFOR_CURRENT_PID,
     484         198 :                                                  holder->pid);
     485             :             }
     486         198 :             VirtualXactLock(old_snapshots[i], true);
     487             :         }
     488             : 
     489         236 :         if (progress)
     490         236 :             pgstat_progress_update_param(PROGRESS_WAITFOR_DONE, i + 1);
     491             :     }
     492         628 : }
     493             : 
     494             : 
     495             : /*
     496             :  * DefineIndex
     497             :  *      Creates a new index.
     498             :  *
     499             :  * This function manages the current userid according to the needs of pg_dump.
     500             :  * Recreating old-database catalog entries in new-database is fine, regardless
     501             :  * of which users would have permission to recreate those entries now.  That's
     502             :  * just preservation of state.  Running opaque expressions, like calling a
     503             :  * function named in a catalog entry or evaluating a pg_node_tree in a catalog
     504             :  * entry, as anyone other than the object owner, is not fine.  To adhere to
     505             :  * those principles and to remain fail-safe, use the table owner userid for
     506             :  * most ACL checks.  Use the original userid for ACL checks reached without
     507             :  * traversing opaque expressions.  (pg_dump can predict such ACL checks from
     508             :  * catalogs.)  Overall, this is a mess.  Future DDL development should
     509             :  * consider offering one DDL command for catalog setup and a separate DDL
     510             :  * command for steps that run opaque expressions.
     511             :  *
     512             :  * 'tableId': the OID of the table relation on which the index is to be
     513             :  *      created
     514             :  * 'stmt': IndexStmt describing the properties of the new index.
     515             :  * 'indexRelationId': normally InvalidOid, but during bootstrap can be
     516             :  *      nonzero to specify a preselected OID for the index.
     517             :  * 'parentIndexId': the OID of the parent index; InvalidOid if not the child
     518             :  *      of a partitioned index.
     519             :  * 'parentConstraintId': the OID of the parent constraint; InvalidOid if not
     520             :  *      the child of a constraint (only used when recursing)
     521             :  * 'total_parts': total number of direct and indirect partitions of relation;
     522             :  *      pass -1 if not known or rel is not partitioned.
     523             :  * 'is_alter_table': this is due to an ALTER rather than a CREATE operation.
     524             :  * 'check_rights': check for CREATE rights in namespace and tablespace.  (This
     525             :  *      should be true except when ALTER is deleting/recreating an index.)
     526             :  * 'check_not_in_use': check for table not already in use in current session.
     527             :  *      This should be true unless caller is holding the table open, in which
     528             :  *      case the caller had better have checked it earlier.
     529             :  * 'skip_build': make the catalog entries but don't create the index files
     530             :  * 'quiet': suppress the NOTICE chatter ordinarily provided for constraints.
     531             :  *
     532             :  * Returns the object address of the created index.
     533             :  */
     534             : ObjectAddress
     535       27250 : DefineIndex(Oid tableId,
     536             :             IndexStmt *stmt,
     537             :             Oid indexRelationId,
     538             :             Oid parentIndexId,
     539             :             Oid parentConstraintId,
     540             :             int total_parts,
     541             :             bool is_alter_table,
     542             :             bool check_rights,
     543             :             bool check_not_in_use,
     544             :             bool skip_build,
     545             :             bool quiet)
     546             : {
     547             :     bool        concurrent;
     548             :     char       *indexRelationName;
     549             :     char       *accessMethodName;
     550             :     Oid        *typeIds;
     551             :     Oid        *collationIds;
     552             :     Oid        *opclassIds;
     553             :     Datum      *opclassOptions;
     554             :     Oid         accessMethodId;
     555             :     Oid         namespaceId;
     556             :     Oid         tablespaceId;
     557       27250 :     Oid         createdConstraintId = InvalidOid;
     558             :     List       *indexColNames;
     559             :     List       *allIndexParams;
     560             :     Relation    rel;
     561             :     HeapTuple   tuple;
     562             :     Form_pg_am  accessMethodForm;
     563             :     IndexAmRoutine *amRoutine;
     564             :     bool        amcanorder;
     565             :     bool        amissummarizing;
     566             :     amoptions_function amoptions;
     567             :     bool        exclusion;
     568             :     bool        partitioned;
     569             :     bool        safe_index;
     570             :     Datum       reloptions;
     571             :     int16      *coloptions;
     572             :     IndexInfo  *indexInfo;
     573             :     bits16      flags;
     574             :     bits16      constr_flags;
     575             :     int         numberOfAttributes;
     576             :     int         numberOfKeyAttributes;
     577             :     TransactionId limitXmin;
     578             :     ObjectAddress address;
     579             :     LockRelId   heaprelid;
     580             :     LOCKTAG     heaplocktag;
     581             :     LOCKMODE    lockmode;
     582             :     Snapshot    snapshot;
     583             :     Oid         root_save_userid;
     584             :     int         root_save_sec_context;
     585             :     int         root_save_nestlevel;
     586             : 
     587       27250 :     root_save_nestlevel = NewGUCNestLevel();
     588             : 
     589       27250 :     RestrictSearchPath();
     590             : 
     591             :     /*
     592             :      * Some callers need us to run with an empty default_tablespace; this is a
     593             :      * necessary hack to be able to reproduce catalog state accurately when
     594             :      * recreating indexes after table-rewriting ALTER TABLE.
     595             :      */
     596       27250 :     if (stmt->reset_default_tblspc)
     597         512 :         (void) set_config_option("default_tablespace", "",
     598             :                                  PGC_USERSET, PGC_S_SESSION,
     599             :                                  GUC_ACTION_SAVE, true, 0, false);
     600             : 
     601             :     /*
     602             :      * Force non-concurrent build on temporary relations, even if CONCURRENTLY
     603             :      * was requested.  Other backends can't access a temporary relation, so
     604             :      * there's no harm in grabbing a stronger lock, and a non-concurrent DROP
     605             :      * is more efficient.  Do this before any use of the concurrent option is
     606             :      * done.
     607             :      */
     608       27250 :     if (stmt->concurrent && get_rel_persistence(tableId) != RELPERSISTENCE_TEMP)
     609         170 :         concurrent = true;
     610             :     else
     611       27080 :         concurrent = false;
     612             : 
     613             :     /*
     614             :      * Start progress report.  If we're building a partition, this was already
     615             :      * done.
     616             :      */
     617       27250 :     if (!OidIsValid(parentIndexId))
     618             :     {
     619       24424 :         pgstat_progress_start_command(PROGRESS_COMMAND_CREATE_INDEX, tableId);
     620       24424 :         pgstat_progress_update_param(PROGRESS_CREATEIDX_COMMAND,
     621             :                                      concurrent ?
     622             :                                      PROGRESS_CREATEIDX_COMMAND_CREATE_CONCURRENTLY :
     623             :                                      PROGRESS_CREATEIDX_COMMAND_CREATE);
     624             :     }
     625             : 
     626             :     /*
     627             :      * No index OID to report yet
     628             :      */
     629       27250 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_INDEX_OID,
     630             :                                  InvalidOid);
     631             : 
     632             :     /*
     633             :      * count key attributes in index
     634             :      */
     635       27250 :     numberOfKeyAttributes = list_length(stmt->indexParams);
     636             : 
     637             :     /*
     638             :      * Calculate the new list of index columns including both key columns and
     639             :      * INCLUDE columns.  Later we can determine which of these are key
     640             :      * columns, and which are just part of the INCLUDE list by checking the
     641             :      * list position.  A list item in a position less than ii_NumIndexKeyAttrs
     642             :      * is part of the key columns, and anything equal to and over is part of
     643             :      * the INCLUDE columns.
     644             :      */
     645       27250 :     allIndexParams = list_concat_copy(stmt->indexParams,
     646       27250 :                                       stmt->indexIncludingParams);
     647       27250 :     numberOfAttributes = list_length(allIndexParams);
     648             : 
     649       27250 :     if (numberOfKeyAttributes <= 0)
     650           0 :         ereport(ERROR,
     651             :                 (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
     652             :                  errmsg("must specify at least one column")));
     653       27250 :     if (numberOfAttributes > INDEX_MAX_KEYS)
     654           0 :         ereport(ERROR,
     655             :                 (errcode(ERRCODE_TOO_MANY_COLUMNS),
     656             :                  errmsg("cannot use more than %d columns in an index",
     657             :                         INDEX_MAX_KEYS)));
     658             : 
     659             :     /*
     660             :      * Only SELECT ... FOR UPDATE/SHARE are allowed while doing a standard
     661             :      * index build; but for concurrent builds we allow INSERT/UPDATE/DELETE
     662             :      * (but not VACUUM).
     663             :      *
     664             :      * NB: Caller is responsible for making sure that tableId refers to the
     665             :      * relation on which the index should be built; except in bootstrap mode,
     666             :      * this will typically require the caller to have already locked the
     667             :      * relation.  To avoid lock upgrade hazards, that lock should be at least
     668             :      * as strong as the one we take here.
     669             :      *
     670             :      * NB: If the lock strength here ever changes, code that is run by
     671             :      * parallel workers under the control of certain particular ambuild
     672             :      * functions will need to be updated, too.
     673             :      */
     674       27250 :     lockmode = concurrent ? ShareUpdateExclusiveLock : ShareLock;
     675       27250 :     rel = table_open(tableId, lockmode);
     676             : 
     677             :     /*
     678             :      * Switch to the table owner's userid, so that any index functions are run
     679             :      * as that user.  Also lock down security-restricted operations.  We
     680             :      * already arranged to make GUC variable changes local to this command.
     681             :      */
     682       27250 :     GetUserIdAndSecContext(&root_save_userid, &root_save_sec_context);
     683       27250 :     SetUserIdAndSecContext(rel->rd_rel->relowner,
     684             :                            root_save_sec_context | SECURITY_RESTRICTED_OPERATION);
     685             : 
     686       27250 :     namespaceId = RelationGetNamespace(rel);
     687             : 
     688             :     /*
     689             :      * It has exclusion constraint behavior if it's an EXCLUDE constraint or a
     690             :      * temporal PRIMARY KEY/UNIQUE constraint
     691             :      */
     692       27250 :     exclusion = stmt->excludeOpNames || stmt->iswithoutoverlaps;
     693             : 
     694             :     /* Ensure that it makes sense to index this kind of relation */
     695       27250 :     switch (rel->rd_rel->relkind)
     696             :     {
     697       27244 :         case RELKIND_RELATION:
     698             :         case RELKIND_MATVIEW:
     699             :         case RELKIND_PARTITIONED_TABLE:
     700             :             /* OK */
     701       27244 :             break;
     702           6 :         default:
     703           6 :             ereport(ERROR,
     704             :                     (errcode(ERRCODE_WRONG_OBJECT_TYPE),
     705             :                      errmsg("cannot create index on relation \"%s\"",
     706             :                             RelationGetRelationName(rel)),
     707             :                      errdetail_relkind_not_supported(rel->rd_rel->relkind)));
     708             :             break;
     709             :     }
     710             : 
     711             :     /*
     712             :      * Establish behavior for partitioned tables, and verify sanity of
     713             :      * parameters.
     714             :      *
     715             :      * We do not build an actual index in this case; we only create a few
     716             :      * catalog entries.  The actual indexes are built by recursing for each
     717             :      * partition.
     718             :      */
     719       27244 :     partitioned = rel->rd_rel->relkind == RELKIND_PARTITIONED_TABLE;
     720       27244 :     if (partitioned)
     721             :     {
     722             :         /*
     723             :          * Note: we check 'stmt->concurrent' rather than 'concurrent', so that
     724             :          * the error is thrown also for temporary tables.  Seems better to be
     725             :          * consistent, even though we could do it on temporary table because
     726             :          * we're not actually doing it concurrently.
     727             :          */
     728        2050 :         if (stmt->concurrent)
     729           6 :             ereport(ERROR,
     730             :                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     731             :                      errmsg("cannot create index on partitioned table \"%s\" concurrently",
     732             :                             RelationGetRelationName(rel))));
     733             :     }
     734             : 
     735             :     /*
     736             :      * Don't try to CREATE INDEX on temp tables of other backends.
     737             :      */
     738       27238 :     if (RELATION_IS_OTHER_TEMP(rel))
     739           0 :         ereport(ERROR,
     740             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     741             :                  errmsg("cannot create indexes on temporary tables of other sessions")));
     742             : 
     743             :     /*
     744             :      * Unless our caller vouches for having checked this already, insist that
     745             :      * the table not be in use by our own session, either.  Otherwise we might
     746             :      * fail to make entries in the new index (for instance, if an INSERT or
     747             :      * UPDATE is in progress and has already made its list of target indexes).
     748             :      */
     749       27238 :     if (check_not_in_use)
     750       13784 :         CheckTableNotInUse(rel, "CREATE INDEX");
     751             : 
     752             :     /*
     753             :      * Verify we (still) have CREATE rights in the rel's namespace.
     754             :      * (Presumably we did when the rel was created, but maybe not anymore.)
     755             :      * Skip check if caller doesn't want it.  Also skip check if
     756             :      * bootstrapping, since permissions machinery may not be working yet.
     757             :      */
     758       27232 :     if (check_rights && !IsBootstrapProcessingMode())
     759             :     {
     760             :         AclResult   aclresult;
     761             : 
     762       14870 :         aclresult = object_aclcheck(NamespaceRelationId, namespaceId, root_save_userid,
     763             :                                     ACL_CREATE);
     764       14870 :         if (aclresult != ACLCHECK_OK)
     765           0 :             aclcheck_error(aclresult, OBJECT_SCHEMA,
     766           0 :                            get_namespace_name(namespaceId));
     767             :     }
     768             : 
     769             :     /*
     770             :      * Select tablespace to use.  If not specified, use default tablespace
     771             :      * (which may in turn default to database's default).
     772             :      */
     773       27232 :     if (stmt->tableSpace)
     774             :     {
     775         200 :         tablespaceId = get_tablespace_oid(stmt->tableSpace, false);
     776         200 :         if (partitioned && tablespaceId == MyDatabaseTableSpace)
     777           6 :             ereport(ERROR,
     778             :                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     779             :                      errmsg("cannot specify default tablespace for partitioned relations")));
     780             :     }
     781             :     else
     782             :     {
     783       27032 :         tablespaceId = GetDefaultTablespace(rel->rd_rel->relpersistence,
     784             :                                             partitioned);
     785             :         /* note InvalidOid is OK in this case */
     786             :     }
     787             : 
     788             :     /* Check tablespace permissions */
     789       27220 :     if (check_rights &&
     790         104 :         OidIsValid(tablespaceId) && tablespaceId != MyDatabaseTableSpace)
     791             :     {
     792             :         AclResult   aclresult;
     793             : 
     794         104 :         aclresult = object_aclcheck(TableSpaceRelationId, tablespaceId, root_save_userid,
     795             :                                     ACL_CREATE);
     796         104 :         if (aclresult != ACLCHECK_OK)
     797           0 :             aclcheck_error(aclresult, OBJECT_TABLESPACE,
     798           0 :                            get_tablespace_name(tablespaceId));
     799             :     }
     800             : 
     801             :     /*
     802             :      * Force shared indexes into the pg_global tablespace.  This is a bit of a
     803             :      * hack but seems simpler than marking them in the BKI commands.  On the
     804             :      * other hand, if it's not shared, don't allow it to be placed there.
     805             :      */
     806       27220 :     if (rel->rd_rel->relisshared)
     807        1680 :         tablespaceId = GLOBALTABLESPACE_OID;
     808       25540 :     else if (tablespaceId == GLOBALTABLESPACE_OID)
     809           0 :         ereport(ERROR,
     810             :                 (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
     811             :                  errmsg("only shared relations can be placed in pg_global tablespace")));
     812             : 
     813             :     /*
     814             :      * Choose the index column names.
     815             :      */
     816       27220 :     indexColNames = ChooseIndexColumnNames(allIndexParams);
     817             : 
     818             :     /*
     819             :      * Select name for index if caller didn't specify
     820             :      */
     821       27220 :     indexRelationName = stmt->idxname;
     822       27220 :     if (indexRelationName == NULL)
     823       11140 :         indexRelationName = ChooseIndexName(RelationGetRelationName(rel),
     824             :                                             namespaceId,
     825             :                                             indexColNames,
     826       11140 :                                             stmt->excludeOpNames,
     827       11140 :                                             stmt->primary,
     828       11140 :                                             stmt->isconstraint);
     829             : 
     830             :     /*
     831             :      * look up the access method, verify it can handle the requested features
     832             :      */
     833       27220 :     accessMethodName = stmt->accessMethod;
     834       27220 :     tuple = SearchSysCache1(AMNAME, PointerGetDatum(accessMethodName));
     835       27220 :     if (!HeapTupleIsValid(tuple))
     836             :     {
     837             :         /*
     838             :          * Hack to provide more-or-less-transparent updating of old RTREE
     839             :          * indexes to GiST: if RTREE is requested and not found, use GIST.
     840             :          */
     841           6 :         if (strcmp(accessMethodName, "rtree") == 0)
     842             :         {
     843           6 :             ereport(NOTICE,
     844             :                     (errmsg("substituting access method \"gist\" for obsolete method \"rtree\"")));
     845           6 :             accessMethodName = "gist";
     846           6 :             tuple = SearchSysCache1(AMNAME, PointerGetDatum(accessMethodName));
     847             :         }
     848             : 
     849           6 :         if (!HeapTupleIsValid(tuple))
     850           0 :             ereport(ERROR,
     851             :                     (errcode(ERRCODE_UNDEFINED_OBJECT),
     852             :                      errmsg("access method \"%s\" does not exist",
     853             :                             accessMethodName)));
     854             :     }
     855       27220 :     accessMethodForm = (Form_pg_am) GETSTRUCT(tuple);
     856       27220 :     accessMethodId = accessMethodForm->oid;
     857       27220 :     amRoutine = GetIndexAmRoutine(accessMethodForm->amhandler);
     858             : 
     859       27220 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_ACCESS_METHOD_OID,
     860             :                                  accessMethodId);
     861             : 
     862       27220 :     if (stmt->unique && !stmt->iswithoutoverlaps && !amRoutine->amcanunique)
     863           0 :         ereport(ERROR,
     864             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     865             :                  errmsg("access method \"%s\" does not support unique indexes",
     866             :                         accessMethodName)));
     867       27220 :     if (stmt->indexIncludingParams != NIL && !amRoutine->amcaninclude)
     868          18 :         ereport(ERROR,
     869             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     870             :                  errmsg("access method \"%s\" does not support included columns",
     871             :                         accessMethodName)));
     872       27202 :     if (numberOfKeyAttributes > 1 && !amRoutine->amcanmulticol)
     873           0 :         ereport(ERROR,
     874             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     875             :                  errmsg("access method \"%s\" does not support multicolumn indexes",
     876             :                         accessMethodName)));
     877       27202 :     if (exclusion && amRoutine->amgettuple == NULL)
     878           0 :         ereport(ERROR,
     879             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     880             :                  errmsg("access method \"%s\" does not support exclusion constraints",
     881             :                         accessMethodName)));
     882             : 
     883       27202 :     amcanorder = amRoutine->amcanorder;
     884       27202 :     amoptions = amRoutine->amoptions;
     885       27202 :     amissummarizing = amRoutine->amsummarizing;
     886             : 
     887       27202 :     pfree(amRoutine);
     888       27202 :     ReleaseSysCache(tuple);
     889             : 
     890             :     /*
     891             :      * Validate predicate, if given
     892             :      */
     893       27202 :     if (stmt->whereClause)
     894         400 :         CheckPredicate((Expr *) stmt->whereClause);
     895             : 
     896             :     /*
     897             :      * Parse AM-specific options, convert to text array form, validate.
     898             :      */
     899       27202 :     reloptions = transformRelOptions((Datum) 0, stmt->options,
     900             :                                      NULL, NULL, false, false);
     901             : 
     902       27196 :     (void) index_reloptions(amoptions, reloptions, true);
     903             : 
     904             :     /*
     905             :      * Prepare arguments for index_create, primarily an IndexInfo structure.
     906             :      * Note that predicates must be in implicit-AND format.  In a concurrent
     907             :      * build, mark it not-ready-for-inserts.
     908             :      */
     909       27132 :     indexInfo = makeIndexInfo(numberOfAttributes,
     910             :                               numberOfKeyAttributes,
     911             :                               accessMethodId,
     912             :                               NIL,  /* expressions, NIL for now */
     913       27132 :                               make_ands_implicit((Expr *) stmt->whereClause),
     914       27132 :                               stmt->unique,
     915       27132 :                               stmt->nulls_not_distinct,
     916       27132 :                               !concurrent,
     917             :                               concurrent,
     918       27132 :                               amissummarizing);
     919             : 
     920       27132 :     typeIds = palloc_array(Oid, numberOfAttributes);
     921       27132 :     collationIds = palloc_array(Oid, numberOfAttributes);
     922       27132 :     opclassIds = palloc_array(Oid, numberOfAttributes);
     923       27132 :     opclassOptions = palloc_array(Datum, numberOfAttributes);
     924       27132 :     coloptions = palloc_array(int16, numberOfAttributes);
     925       27132 :     ComputeIndexAttrs(indexInfo,
     926             :                       typeIds, collationIds, opclassIds, opclassOptions,
     927             :                       coloptions, allIndexParams,
     928       27132 :                       stmt->excludeOpNames, tableId,
     929             :                       accessMethodName, accessMethodId,
     930       27132 :                       amcanorder, stmt->isconstraint, stmt->iswithoutoverlaps,
     931             :                       root_save_userid, root_save_sec_context,
     932             :                       &root_save_nestlevel);
     933             : 
     934             :     /*
     935             :      * Extra checks when creating a PRIMARY KEY index.
     936             :      */
     937       26902 :     if (stmt->primary)
     938        8412 :         index_check_primary_key(rel, indexInfo, is_alter_table, stmt);
     939             : 
     940             :     /*
     941             :      * If this table is partitioned and we're creating a unique index, primary
     942             :      * key, or exclusion constraint, make sure that the partition key is a
     943             :      * subset of the index's columns.  Otherwise it would be possible to
     944             :      * violate uniqueness by putting values that ought to be unique in
     945             :      * different partitions.
     946             :      *
     947             :      * We could lift this limitation if we had global indexes, but those have
     948             :      * their own problems, so this is a useful feature combination.
     949             :      */
     950       26860 :     if (partitioned && (stmt->unique || exclusion))
     951             :     {
     952        1168 :         PartitionKey key = RelationGetPartitionKey(rel);
     953             :         const char *constraint_type;
     954             :         int         i;
     955             : 
     956        1168 :         if (stmt->primary)
     957         866 :             constraint_type = "PRIMARY KEY";
     958         302 :         else if (stmt->unique)
     959         202 :             constraint_type = "UNIQUE";
     960         100 :         else if (stmt->excludeOpNames)
     961         100 :             constraint_type = "EXCLUDE";
     962             :         else
     963             :         {
     964           0 :             elog(ERROR, "unknown constraint type");
     965             :             constraint_type = NULL; /* keep compiler quiet */
     966             :         }
     967             : 
     968             :         /*
     969             :          * Verify that all the columns in the partition key appear in the
     970             :          * unique key definition, with the same notion of equality.
     971             :          */
     972        2334 :         for (i = 0; i < key->partnatts; i++)
     973             :         {
     974        1270 :             bool        found = false;
     975             :             int         eq_strategy;
     976             :             Oid         ptkey_eqop;
     977             :             int         j;
     978             : 
     979             :             /*
     980             :              * Identify the equality operator associated with this partkey
     981             :              * column.  For list and range partitioning, partkeys use btree
     982             :              * operator classes; hash partitioning uses hash operator classes.
     983             :              * (Keep this in sync with ComputePartitionAttrs!)
     984             :              */
     985        1270 :             if (key->strategy == PARTITION_STRATEGY_HASH)
     986          46 :                 eq_strategy = HTEqualStrategyNumber;
     987             :             else
     988        1224 :                 eq_strategy = BTEqualStrategyNumber;
     989             : 
     990        1270 :             ptkey_eqop = get_opfamily_member(key->partopfamily[i],
     991        1270 :                                              key->partopcintype[i],
     992        1270 :                                              key->partopcintype[i],
     993             :                                              eq_strategy);
     994        1270 :             if (!OidIsValid(ptkey_eqop))
     995           0 :                 elog(ERROR, "missing operator %d(%u,%u) in partition opfamily %u",
     996             :                      eq_strategy, key->partopcintype[i], key->partopcintype[i],
     997             :                      key->partopfamily[i]);
     998             : 
     999             :             /*
    1000             :              * We'll need to be able to identify the equality operators
    1001             :              * associated with index columns, too.  We know what to do with
    1002             :              * btree opclasses; if there are ever any other index types that
    1003             :              * support unique indexes, this logic will need extension. But if
    1004             :              * we have an exclusion constraint (or a temporal PK), it already
    1005             :              * knows the operators, so we don't have to infer them.
    1006             :              */
    1007        1270 :             if (stmt->unique && !stmt->iswithoutoverlaps && accessMethodId != BTREE_AM_OID)
    1008           0 :                 ereport(ERROR,
    1009             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    1010             :                          errmsg("cannot match partition key to an index using access method \"%s\"",
    1011             :                                 accessMethodName)));
    1012             : 
    1013             :             /*
    1014             :              * It may be possible to support UNIQUE constraints when partition
    1015             :              * keys are expressions, but is it worth it?  Give up for now.
    1016             :              */
    1017        1270 :             if (key->partattrs[i] == 0)
    1018          12 :                 ereport(ERROR,
    1019             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    1020             :                          errmsg("unsupported %s constraint with partition key definition",
    1021             :                                 constraint_type),
    1022             :                          errdetail("%s constraints cannot be used when partition keys include expressions.",
    1023             :                                    constraint_type)));
    1024             : 
    1025             :             /* Search the index column(s) for a match */
    1026        1428 :             for (j = 0; j < indexInfo->ii_NumIndexKeyAttrs; j++)
    1027             :             {
    1028        1350 :                 if (key->partattrs[i] == indexInfo->ii_IndexAttrNumbers[j])
    1029             :                 {
    1030             :                     /*
    1031             :                      * Matched the column, now what about the collation and
    1032             :                      * equality op?
    1033             :                      */
    1034             :                     Oid         idx_opfamily;
    1035             :                     Oid         idx_opcintype;
    1036             : 
    1037        1180 :                     if (key->partcollation[i] != collationIds[j])
    1038           0 :                         continue;
    1039             : 
    1040        1180 :                     if (get_opclass_opfamily_and_input_type(opclassIds[j],
    1041             :                                                             &idx_opfamily,
    1042             :                                                             &idx_opcintype))
    1043             :                     {
    1044        1180 :                         Oid         idx_eqop = InvalidOid;
    1045             : 
    1046        1180 :                         if (stmt->unique && !stmt->iswithoutoverlaps)
    1047        1044 :                             idx_eqop = get_opfamily_member(idx_opfamily,
    1048             :                                                            idx_opcintype,
    1049             :                                                            idx_opcintype,
    1050             :                                                            BTEqualStrategyNumber);
    1051         136 :                         else if (exclusion)
    1052         136 :                             idx_eqop = indexInfo->ii_ExclusionOps[j];
    1053             :                         Assert(idx_eqop);
    1054             : 
    1055        1180 :                         if (ptkey_eqop == idx_eqop)
    1056             :                         {
    1057        1166 :                             found = true;
    1058        1166 :                             break;
    1059             :                         }
    1060          14 :                         else if (exclusion)
    1061             :                         {
    1062             :                             /*
    1063             :                              * We found a match, but it's not an equality
    1064             :                              * operator. Instead of failing below with an
    1065             :                              * error message about a missing column, fail now
    1066             :                              * and explain that the operator is wrong.
    1067             :                              */
    1068          14 :                             Form_pg_attribute att = TupleDescAttr(RelationGetDescr(rel), key->partattrs[i] - 1);
    1069             : 
    1070          14 :                             ereport(ERROR,
    1071             :                                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    1072             :                                      errmsg("cannot match partition key to index on column \"%s\" using non-equal operator \"%s\"",
    1073             :                                             NameStr(att->attname),
    1074             :                                             get_opname(indexInfo->ii_ExclusionOps[j]))));
    1075             :                         }
    1076             :                     }
    1077             :                 }
    1078             :             }
    1079             : 
    1080        1244 :             if (!found)
    1081             :             {
    1082             :                 Form_pg_attribute att;
    1083             : 
    1084          78 :                 att = TupleDescAttr(RelationGetDescr(rel),
    1085             :                                     key->partattrs[i] - 1);
    1086          78 :                 ereport(ERROR,
    1087             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    1088             :                          errmsg("unique constraint on partitioned table must include all partitioning columns"),
    1089             :                          errdetail("%s constraint on table \"%s\" lacks column \"%s\" which is part of the partition key.",
    1090             :                                    constraint_type, RelationGetRelationName(rel),
    1091             :                                    NameStr(att->attname))));
    1092             :             }
    1093             :         }
    1094             :     }
    1095             : 
    1096             : 
    1097             :     /*
    1098             :      * We disallow indexes on system columns.  They would not necessarily get
    1099             :      * updated correctly, and they don't seem useful anyway.
    1100             :      */
    1101       64040 :     for (int i = 0; i < indexInfo->ii_NumIndexAttrs; i++)
    1102             :     {
    1103       37284 :         AttrNumber  attno = indexInfo->ii_IndexAttrNumbers[i];
    1104             : 
    1105       37284 :         if (attno < 0)
    1106           0 :             ereport(ERROR,
    1107             :                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    1108             :                      errmsg("index creation on system columns is not supported")));
    1109             :     }
    1110             : 
    1111             :     /*
    1112             :      * Also check for system columns used in expressions or predicates.
    1113             :      */
    1114       26756 :     if (indexInfo->ii_Expressions || indexInfo->ii_Predicate)
    1115             :     {
    1116        1098 :         Bitmapset  *indexattrs = NULL;
    1117             : 
    1118        1098 :         pull_varattnos((Node *) indexInfo->ii_Expressions, 1, &indexattrs);
    1119        1098 :         pull_varattnos((Node *) indexInfo->ii_Predicate, 1, &indexattrs);
    1120             : 
    1121        7674 :         for (int i = FirstLowInvalidHeapAttributeNumber + 1; i < 0; i++)
    1122             :         {
    1123        6588 :             if (bms_is_member(i - FirstLowInvalidHeapAttributeNumber,
    1124             :                               indexattrs))
    1125          12 :                 ereport(ERROR,
    1126             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    1127             :                          errmsg("index creation on system columns is not supported")));
    1128             :         }
    1129             :     }
    1130             : 
    1131             :     /* Is index safe for others to ignore?  See set_indexsafe_procflags() */
    1132       52696 :     safe_index = indexInfo->ii_Expressions == NIL &&
    1133       25952 :         indexInfo->ii_Predicate == NIL;
    1134             : 
    1135             :     /*
    1136             :      * Report index creation if appropriate (delay this till after most of the
    1137             :      * error checks)
    1138             :      */
    1139       26744 :     if (stmt->isconstraint && !quiet)
    1140             :     {
    1141             :         const char *constraint_type;
    1142             : 
    1143        9212 :         if (stmt->primary)
    1144        8214 :             constraint_type = "PRIMARY KEY";
    1145         998 :         else if (stmt->unique)
    1146         822 :             constraint_type = "UNIQUE";
    1147         176 :         else if (stmt->excludeOpNames)
    1148         176 :             constraint_type = "EXCLUDE";
    1149             :         else
    1150             :         {
    1151           0 :             elog(ERROR, "unknown constraint type");
    1152             :             constraint_type = NULL; /* keep compiler quiet */
    1153             :         }
    1154             : 
    1155        9212 :         ereport(DEBUG1,
    1156             :                 (errmsg_internal("%s %s will create implicit index \"%s\" for table \"%s\"",
    1157             :                                  is_alter_table ? "ALTER TABLE / ADD" : "CREATE TABLE /",
    1158             :                                  constraint_type,
    1159             :                                  indexRelationName, RelationGetRelationName(rel))));
    1160             :     }
    1161             : 
    1162             :     /*
    1163             :      * A valid stmt->oldNumber implies that we already have a built form of
    1164             :      * the index.  The caller should also decline any index build.
    1165             :      */
    1166             :     Assert(!RelFileNumberIsValid(stmt->oldNumber) || (skip_build && !concurrent));
    1167             : 
    1168             :     /*
    1169             :      * Make the catalog entries for the index, including constraints. This
    1170             :      * step also actually builds the index, except if caller requested not to
    1171             :      * or in concurrent mode, in which case it'll be done later, or doing a
    1172             :      * partitioned index (because those don't have storage).
    1173             :      */
    1174       26744 :     flags = constr_flags = 0;
    1175       26744 :     if (stmt->isconstraint)
    1176        9446 :         flags |= INDEX_CREATE_ADD_CONSTRAINT;
    1177       26744 :     if (skip_build || concurrent || partitioned)
    1178       12440 :         flags |= INDEX_CREATE_SKIP_BUILD;
    1179       26744 :     if (stmt->if_not_exists)
    1180          18 :         flags |= INDEX_CREATE_IF_NOT_EXISTS;
    1181       26744 :     if (concurrent)
    1182         164 :         flags |= INDEX_CREATE_CONCURRENT;
    1183       26744 :     if (partitioned)
    1184        1928 :         flags |= INDEX_CREATE_PARTITIONED;
    1185       26744 :     if (stmt->primary)
    1186        8340 :         flags |= INDEX_CREATE_IS_PRIMARY;
    1187             : 
    1188             :     /*
    1189             :      * If the table is partitioned, and recursion was declined but partitions
    1190             :      * exist, mark the index as invalid.
    1191             :      */
    1192       26744 :     if (partitioned && stmt->relation && !stmt->relation->inh)
    1193             :     {
    1194         228 :         PartitionDesc pd = RelationGetPartitionDesc(rel, true);
    1195             : 
    1196         228 :         if (pd->nparts != 0)
    1197         214 :             flags |= INDEX_CREATE_INVALID;
    1198             :     }
    1199             : 
    1200       26744 :     if (stmt->deferrable)
    1201         138 :         constr_flags |= INDEX_CONSTR_CREATE_DEFERRABLE;
    1202       26744 :     if (stmt->initdeferred)
    1203          38 :         constr_flags |= INDEX_CONSTR_CREATE_INIT_DEFERRED;
    1204       26744 :     if (stmt->iswithoutoverlaps)
    1205         404 :         constr_flags |= INDEX_CONSTR_CREATE_WITHOUT_OVERLAPS;
    1206             : 
    1207             :     indexRelationId =
    1208       26744 :         index_create(rel, indexRelationName, indexRelationId, parentIndexId,
    1209             :                      parentConstraintId,
    1210             :                      stmt->oldNumber, indexInfo, indexColNames,
    1211             :                      accessMethodId, tablespaceId,
    1212             :                      collationIds, opclassIds, opclassOptions,
    1213             :                      coloptions, NULL, reloptions,
    1214             :                      flags, constr_flags,
    1215       26744 :                      allowSystemTableMods, !check_rights,
    1216       26744 :                      &createdConstraintId);
    1217             : 
    1218       26560 :     ObjectAddressSet(address, RelationRelationId, indexRelationId);
    1219             : 
    1220       26560 :     if (!OidIsValid(indexRelationId))
    1221             :     {
    1222             :         /*
    1223             :          * Roll back any GUC changes executed by index functions.  Also revert
    1224             :          * to original default_tablespace if we changed it above.
    1225             :          */
    1226          18 :         AtEOXact_GUC(false, root_save_nestlevel);
    1227             : 
    1228             :         /* Restore userid and security context */
    1229          18 :         SetUserIdAndSecContext(root_save_userid, root_save_sec_context);
    1230             : 
    1231          18 :         table_close(rel, NoLock);
    1232             : 
    1233             :         /* If this is the top-level index, we're done */
    1234          18 :         if (!OidIsValid(parentIndexId))
    1235          18 :             pgstat_progress_end_command();
    1236             : 
    1237          18 :         return address;
    1238             :     }
    1239             : 
    1240             :     /*
    1241             :      * Roll back any GUC changes executed by index functions, and keep
    1242             :      * subsequent changes local to this command.  This is essential if some
    1243             :      * index function changed a behavior-affecting GUC, e.g. search_path.
    1244             :      */
    1245       26542 :     AtEOXact_GUC(false, root_save_nestlevel);
    1246       26542 :     root_save_nestlevel = NewGUCNestLevel();
    1247             : 
    1248             :     /* Add any requested comment */
    1249       26542 :     if (stmt->idxcomment != NULL)
    1250          90 :         CreateComments(indexRelationId, RelationRelationId, 0,
    1251          90 :                        stmt->idxcomment);
    1252             : 
    1253       26542 :     if (partitioned)
    1254             :     {
    1255             :         PartitionDesc partdesc;
    1256             : 
    1257             :         /*
    1258             :          * Unless caller specified to skip this step (via ONLY), process each
    1259             :          * partition to make sure they all contain a corresponding index.
    1260             :          *
    1261             :          * If we're called internally (no stmt->relation), recurse always.
    1262             :          */
    1263        1928 :         partdesc = RelationGetPartitionDesc(rel, true);
    1264        1928 :         if ((!stmt->relation || stmt->relation->inh) && partdesc->nparts > 0)
    1265             :         {
    1266         574 :             int         nparts = partdesc->nparts;
    1267         574 :             Oid        *part_oids = palloc_array(Oid, nparts);
    1268         574 :             bool        invalidate_parent = false;
    1269             :             Relation    parentIndex;
    1270             :             TupleDesc   parentDesc;
    1271             : 
    1272             :             /*
    1273             :              * Report the total number of partitions at the start of the
    1274             :              * command; don't update it when being called recursively.
    1275             :              */
    1276         574 :             if (!OidIsValid(parentIndexId))
    1277             :             {
    1278             :                 /*
    1279             :                  * When called by ProcessUtilitySlow, the number of partitions
    1280             :                  * is passed in as an optimization; but other callers pass -1
    1281             :                  * since they don't have the value handy.  This should count
    1282             :                  * partitions the same way, ie one less than the number of
    1283             :                  * relations find_all_inheritors reports.
    1284             :                  *
    1285             :                  * We assume we needn't ask find_all_inheritors to take locks,
    1286             :                  * because that should have happened already for all callers.
    1287             :                  * Even if it did not, this is safe as long as we don't try to
    1288             :                  * touch the partitions here; the worst consequence would be a
    1289             :                  * bogus progress-reporting total.
    1290             :                  */
    1291         462 :                 if (total_parts < 0)
    1292             :                 {
    1293         128 :                     List       *children = find_all_inheritors(tableId, NoLock, NULL);
    1294             : 
    1295         128 :                     total_parts = list_length(children) - 1;
    1296         128 :                     list_free(children);
    1297             :                 }
    1298             : 
    1299         462 :                 pgstat_progress_update_param(PROGRESS_CREATEIDX_PARTITIONS_TOTAL,
    1300             :                                              total_parts);
    1301             :             }
    1302             : 
    1303             :             /* Make a local copy of partdesc->oids[], just for safety */
    1304         574 :             memcpy(part_oids, partdesc->oids, sizeof(Oid) * nparts);
    1305             : 
    1306             :             /*
    1307             :              * We'll need an IndexInfo describing the parent index.  The one
    1308             :              * built above is almost good enough, but not quite, because (for
    1309             :              * example) its predicate expression if any hasn't been through
    1310             :              * expression preprocessing.  The most reliable way to get an
    1311             :              * IndexInfo that will match those for child indexes is to build
    1312             :              * it the same way, using BuildIndexInfo().
    1313             :              */
    1314         574 :             parentIndex = index_open(indexRelationId, lockmode);
    1315         574 :             indexInfo = BuildIndexInfo(parentIndex);
    1316             : 
    1317         574 :             parentDesc = RelationGetDescr(rel);
    1318             : 
    1319             :             /*
    1320             :              * For each partition, scan all existing indexes; if one matches
    1321             :              * our index definition and is not already attached to some other
    1322             :              * parent index, attach it to the one we just created.
    1323             :              *
    1324             :              * If none matches, build a new index by calling ourselves
    1325             :              * recursively with the same options (except for the index name).
    1326             :              */
    1327        1590 :             for (int i = 0; i < nparts; i++)
    1328             :             {
    1329        1040 :                 Oid         childRelid = part_oids[i];
    1330             :                 Relation    childrel;
    1331             :                 Oid         child_save_userid;
    1332             :                 int         child_save_sec_context;
    1333             :                 int         child_save_nestlevel;
    1334             :                 List       *childidxs;
    1335             :                 ListCell   *cell;
    1336             :                 AttrMap    *attmap;
    1337        1040 :                 bool        found = false;
    1338             : 
    1339        1040 :                 childrel = table_open(childRelid, lockmode);
    1340             : 
    1341        1040 :                 GetUserIdAndSecContext(&child_save_userid,
    1342             :                                        &child_save_sec_context);
    1343        1040 :                 SetUserIdAndSecContext(childrel->rd_rel->relowner,
    1344             :                                        child_save_sec_context | SECURITY_RESTRICTED_OPERATION);
    1345        1040 :                 child_save_nestlevel = NewGUCNestLevel();
    1346        1040 :                 RestrictSearchPath();
    1347             : 
    1348             :                 /*
    1349             :                  * Don't try to create indexes on foreign tables, though. Skip
    1350             :                  * those if a regular index, or fail if trying to create a
    1351             :                  * constraint index.
    1352             :                  */
    1353        1040 :                 if (childrel->rd_rel->relkind == RELKIND_FOREIGN_TABLE)
    1354             :                 {
    1355          18 :                     if (stmt->unique || stmt->primary)
    1356          12 :                         ereport(ERROR,
    1357             :                                 (errcode(ERRCODE_WRONG_OBJECT_TYPE),
    1358             :                                  errmsg("cannot create unique index on partitioned table \"%s\"",
    1359             :                                         RelationGetRelationName(rel)),
    1360             :                                  errdetail("Table \"%s\" contains partitions that are foreign tables.",
    1361             :                                            RelationGetRelationName(rel))));
    1362             : 
    1363           6 :                     AtEOXact_GUC(false, child_save_nestlevel);
    1364           6 :                     SetUserIdAndSecContext(child_save_userid,
    1365             :                                            child_save_sec_context);
    1366           6 :                     table_close(childrel, lockmode);
    1367           6 :                     continue;
    1368             :                 }
    1369             : 
    1370        1022 :                 childidxs = RelationGetIndexList(childrel);
    1371             :                 attmap =
    1372        1022 :                     build_attrmap_by_name(RelationGetDescr(childrel),
    1373             :                                           parentDesc,
    1374             :                                           false);
    1375             : 
    1376        1364 :                 foreach(cell, childidxs)
    1377             :                 {
    1378         402 :                     Oid         cldidxid = lfirst_oid(cell);
    1379             :                     Relation    cldidx;
    1380             :                     IndexInfo  *cldIdxInfo;
    1381             : 
    1382             :                     /* this index is already partition of another one */
    1383         402 :                     if (has_superclass(cldidxid))
    1384         318 :                         continue;
    1385             : 
    1386          84 :                     cldidx = index_open(cldidxid, lockmode);
    1387          84 :                     cldIdxInfo = BuildIndexInfo(cldidx);
    1388          84 :                     if (CompareIndexInfo(cldIdxInfo, indexInfo,
    1389          84 :                                          cldidx->rd_indcollation,
    1390          84 :                                          parentIndex->rd_indcollation,
    1391          84 :                                          cldidx->rd_opfamily,
    1392          84 :                                          parentIndex->rd_opfamily,
    1393             :                                          attmap))
    1394             :                     {
    1395          60 :                         Oid         cldConstrOid = InvalidOid;
    1396             : 
    1397             :                         /*
    1398             :                          * Found a match.
    1399             :                          *
    1400             :                          * If this index is being created in the parent
    1401             :                          * because of a constraint, then the child needs to
    1402             :                          * have a constraint also, so look for one.  If there
    1403             :                          * is no such constraint, this index is no good, so
    1404             :                          * keep looking.
    1405             :                          */
    1406          60 :                         if (createdConstraintId != InvalidOid)
    1407             :                         {
    1408             :                             cldConstrOid =
    1409          12 :                                 get_relation_idx_constraint_oid(childRelid,
    1410             :                                                                 cldidxid);
    1411          12 :                             if (cldConstrOid == InvalidOid)
    1412             :                             {
    1413           0 :                                 index_close(cldidx, lockmode);
    1414           0 :                                 continue;
    1415             :                             }
    1416             :                         }
    1417             : 
    1418             :                         /* Attach index to parent and we're done. */
    1419          60 :                         IndexSetParentIndex(cldidx, indexRelationId);
    1420          60 :                         if (createdConstraintId != InvalidOid)
    1421          12 :                             ConstraintSetParentConstraint(cldConstrOid,
    1422             :                                                           createdConstraintId,
    1423             :                                                           childRelid);
    1424             : 
    1425          60 :                         if (!cldidx->rd_index->indisvalid)
    1426          18 :                             invalidate_parent = true;
    1427             : 
    1428          60 :                         found = true;
    1429             : 
    1430             :                         /*
    1431             :                          * Report this partition as processed.  Note that if
    1432             :                          * the partition has children itself, we'd ideally
    1433             :                          * count the children and update the progress report
    1434             :                          * for all of them; but that seems unduly expensive.
    1435             :                          * Instead, the progress report will act like all such
    1436             :                          * indirect children were processed in zero time at
    1437             :                          * the end of the command.
    1438             :                          */
    1439          60 :                         pgstat_progress_incr_param(PROGRESS_CREATEIDX_PARTITIONS_DONE, 1);
    1440             : 
    1441             :                         /* keep lock till commit */
    1442          60 :                         index_close(cldidx, NoLock);
    1443          60 :                         break;
    1444             :                     }
    1445             : 
    1446          24 :                     index_close(cldidx, lockmode);
    1447             :                 }
    1448             : 
    1449        1022 :                 list_free(childidxs);
    1450        1022 :                 AtEOXact_GUC(false, child_save_nestlevel);
    1451        1022 :                 SetUserIdAndSecContext(child_save_userid,
    1452             :                                        child_save_sec_context);
    1453        1022 :                 table_close(childrel, NoLock);
    1454             : 
    1455             :                 /*
    1456             :                  * If no matching index was found, create our own.
    1457             :                  */
    1458        1022 :                 if (!found)
    1459             :                 {
    1460         962 :                     IndexStmt  *childStmt = copyObject(stmt);
    1461             :                     bool        found_whole_row;
    1462             :                     ListCell   *lc;
    1463             :                     ObjectAddress childAddr;
    1464             : 
    1465             :                     /*
    1466             :                      * We can't use the same index name for the child index,
    1467             :                      * so clear idxname to let the recursive invocation choose
    1468             :                      * a new name.  Likewise, the existing target relation
    1469             :                      * field is wrong, and if indexOid or oldNumber are set,
    1470             :                      * they mustn't be applied to the child either.
    1471             :                      */
    1472         962 :                     childStmt->idxname = NULL;
    1473         962 :                     childStmt->relation = NULL;
    1474         962 :                     childStmt->indexOid = InvalidOid;
    1475         962 :                     childStmt->oldNumber = InvalidRelFileNumber;
    1476         962 :                     childStmt->oldCreateSubid = InvalidSubTransactionId;
    1477         962 :                     childStmt->oldFirstRelfilelocatorSubid = InvalidSubTransactionId;
    1478             : 
    1479             :                     /*
    1480             :                      * Adjust any Vars (both in expressions and in the index's
    1481             :                      * WHERE clause) to match the partition's column numbering
    1482             :                      * in case it's different from the parent's.
    1483             :                      */
    1484        2124 :                     foreach(lc, childStmt->indexParams)
    1485             :                     {
    1486        1162 :                         IndexElem  *ielem = lfirst(lc);
    1487             : 
    1488             :                         /*
    1489             :                          * If the index parameter is an expression, we must
    1490             :                          * translate it to contain child Vars.
    1491             :                          */
    1492        1162 :                         if (ielem->expr)
    1493             :                         {
    1494          84 :                             ielem->expr =
    1495          84 :                                 map_variable_attnos((Node *) ielem->expr,
    1496             :                                                     1, 0, attmap,
    1497             :                                                     InvalidOid,
    1498             :                                                     &found_whole_row);
    1499          84 :                             if (found_whole_row)
    1500           0 :                                 elog(ERROR, "cannot convert whole-row table reference");
    1501             :                         }
    1502             :                     }
    1503         962 :                     childStmt->whereClause =
    1504         962 :                         map_variable_attnos(stmt->whereClause, 1, 0,
    1505             :                                             attmap,
    1506             :                                             InvalidOid, &found_whole_row);
    1507         962 :                     if (found_whole_row)
    1508           0 :                         elog(ERROR, "cannot convert whole-row table reference");
    1509             : 
    1510             :                     /*
    1511             :                      * Recurse as the starting user ID.  Callee will use that
    1512             :                      * for permission checks, then switch again.
    1513             :                      */
    1514             :                     Assert(GetUserId() == child_save_userid);
    1515         962 :                     SetUserIdAndSecContext(root_save_userid,
    1516             :                                            root_save_sec_context);
    1517             :                     childAddr =
    1518         962 :                         DefineIndex(childRelid, childStmt,
    1519             :                                     InvalidOid, /* no predefined OID */
    1520             :                                     indexRelationId,    /* this is our child */
    1521             :                                     createdConstraintId,
    1522             :                                     -1,
    1523             :                                     is_alter_table, check_rights,
    1524             :                                     check_not_in_use,
    1525             :                                     skip_build, quiet);
    1526         950 :                     SetUserIdAndSecContext(child_save_userid,
    1527             :                                            child_save_sec_context);
    1528             : 
    1529             :                     /*
    1530             :                      * Check if the index just created is valid or not, as it
    1531             :                      * could be possible that it has been switched as invalid
    1532             :                      * when recursing across multiple partition levels.
    1533             :                      */
    1534         950 :                     if (!get_index_isvalid(childAddr.objectId))
    1535           6 :                         invalidate_parent = true;
    1536             :                 }
    1537             : 
    1538        1010 :                 free_attrmap(attmap);
    1539             :             }
    1540             : 
    1541         550 :             index_close(parentIndex, lockmode);
    1542             : 
    1543             :             /*
    1544             :              * The pg_index row we inserted for this index was marked
    1545             :              * indisvalid=true.  But if we attached an existing index that is
    1546             :              * invalid, this is incorrect, so update our row to invalid too.
    1547             :              */
    1548         550 :             if (invalidate_parent)
    1549             :             {
    1550          24 :                 Relation    pg_index = table_open(IndexRelationId, RowExclusiveLock);
    1551             :                 HeapTuple   tup,
    1552             :                             newtup;
    1553             : 
    1554          24 :                 tup = SearchSysCache1(INDEXRELID,
    1555             :                                       ObjectIdGetDatum(indexRelationId));
    1556          24 :                 if (!HeapTupleIsValid(tup))
    1557           0 :                     elog(ERROR, "cache lookup failed for index %u",
    1558             :                          indexRelationId);
    1559          24 :                 newtup = heap_copytuple(tup);
    1560          24 :                 ((Form_pg_index) GETSTRUCT(newtup))->indisvalid = false;
    1561          24 :                 CatalogTupleUpdate(pg_index, &tup->t_self, newtup);
    1562          24 :                 ReleaseSysCache(tup);
    1563          24 :                 table_close(pg_index, RowExclusiveLock);
    1564          24 :                 heap_freetuple(newtup);
    1565             : 
    1566             :                 /*
    1567             :                  * CCI here to make this update visible, in case this recurses
    1568             :                  * across multiple partition levels.
    1569             :                  */
    1570          24 :                 CommandCounterIncrement();
    1571             :             }
    1572             :         }
    1573             : 
    1574             :         /*
    1575             :          * Indexes on partitioned tables are not themselves built, so we're
    1576             :          * done here.
    1577             :          */
    1578        1904 :         AtEOXact_GUC(false, root_save_nestlevel);
    1579        1904 :         SetUserIdAndSecContext(root_save_userid, root_save_sec_context);
    1580        1904 :         table_close(rel, NoLock);
    1581        1904 :         if (!OidIsValid(parentIndexId))
    1582        1634 :             pgstat_progress_end_command();
    1583             :         else
    1584             :         {
    1585             :             /* Update progress for an intermediate partitioned index itself */
    1586         270 :             pgstat_progress_incr_param(PROGRESS_CREATEIDX_PARTITIONS_DONE, 1);
    1587             :         }
    1588             : 
    1589        1904 :         return address;
    1590             :     }
    1591             : 
    1592       24614 :     AtEOXact_GUC(false, root_save_nestlevel);
    1593       24614 :     SetUserIdAndSecContext(root_save_userid, root_save_sec_context);
    1594             : 
    1595       24614 :     if (!concurrent)
    1596             :     {
    1597             :         /* Close the heap and we're done, in the non-concurrent case */
    1598       24462 :         table_close(rel, NoLock);
    1599             : 
    1600             :         /*
    1601             :          * If this is the top-level index, the command is done overall;
    1602             :          * otherwise, increment progress to report one child index is done.
    1603             :          */
    1604       24462 :         if (!OidIsValid(parentIndexId))
    1605       21942 :             pgstat_progress_end_command();
    1606             :         else
    1607        2520 :             pgstat_progress_incr_param(PROGRESS_CREATEIDX_PARTITIONS_DONE, 1);
    1608             : 
    1609       24462 :         return address;
    1610             :     }
    1611             : 
    1612             :     /* save lockrelid and locktag for below, then close rel */
    1613         152 :     heaprelid = rel->rd_lockInfo.lockRelId;
    1614         152 :     SET_LOCKTAG_RELATION(heaplocktag, heaprelid.dbId, heaprelid.relId);
    1615         152 :     table_close(rel, NoLock);
    1616             : 
    1617             :     /*
    1618             :      * For a concurrent build, it's important to make the catalog entries
    1619             :      * visible to other transactions before we start to build the index. That
    1620             :      * will prevent them from making incompatible HOT updates.  The new index
    1621             :      * will be marked not indisready and not indisvalid, so that no one else
    1622             :      * tries to either insert into it or use it for queries.
    1623             :      *
    1624             :      * We must commit our current transaction so that the index becomes
    1625             :      * visible; then start another.  Note that all the data structures we just
    1626             :      * built are lost in the commit.  The only data we keep past here are the
    1627             :      * relation IDs.
    1628             :      *
    1629             :      * Before committing, get a session-level lock on the table, to ensure
    1630             :      * that neither it nor the index can be dropped before we finish. This
    1631             :      * cannot block, even if someone else is waiting for access, because we
    1632             :      * already have the same lock within our transaction.
    1633             :      *
    1634             :      * Note: we don't currently bother with a session lock on the index,
    1635             :      * because there are no operations that could change its state while we
    1636             :      * hold lock on the parent table.  This might need to change later.
    1637             :      */
    1638         152 :     LockRelationIdForSession(&heaprelid, ShareUpdateExclusiveLock);
    1639             : 
    1640         152 :     PopActiveSnapshot();
    1641         152 :     CommitTransactionCommand();
    1642         152 :     StartTransactionCommand();
    1643             : 
    1644             :     /* Tell concurrent index builds to ignore us, if index qualifies */
    1645         152 :     if (safe_index)
    1646         112 :         set_indexsafe_procflags();
    1647             : 
    1648             :     /*
    1649             :      * The index is now visible, so we can report the OID.  While on it,
    1650             :      * include the report for the beginning of phase 2.
    1651             :      */
    1652             :     {
    1653         152 :         const int   progress_cols[] = {
    1654             :             PROGRESS_CREATEIDX_INDEX_OID,
    1655             :             PROGRESS_CREATEIDX_PHASE
    1656             :         };
    1657         152 :         const int64 progress_vals[] = {
    1658             :             indexRelationId,
    1659             :             PROGRESS_CREATEIDX_PHASE_WAIT_1
    1660             :         };
    1661             : 
    1662         152 :         pgstat_progress_update_multi_param(2, progress_cols, progress_vals);
    1663             :     }
    1664             : 
    1665             :     /*
    1666             :      * Phase 2 of concurrent index build (see comments for validate_index()
    1667             :      * for an overview of how this works)
    1668             :      *
    1669             :      * Now we must wait until no running transaction could have the table open
    1670             :      * with the old list of indexes.  Use ShareLock to consider running
    1671             :      * transactions that hold locks that permit writing to the table.  Note we
    1672             :      * do not need to worry about xacts that open the table for writing after
    1673             :      * this point; they will see the new index when they open it.
    1674             :      *
    1675             :      * Note: the reason we use actual lock acquisition here, rather than just
    1676             :      * checking the ProcArray and sleeping, is that deadlock is possible if
    1677             :      * one of the transactions in question is blocked trying to acquire an
    1678             :      * exclusive lock on our table.  The lock code will detect deadlock and
    1679             :      * error out properly.
    1680             :      */
    1681         152 :     WaitForLockers(heaplocktag, ShareLock, true);
    1682             : 
    1683             :     /*
    1684             :      * At this moment we are sure that there are no transactions with the
    1685             :      * table open for write that don't have this new index in their list of
    1686             :      * indexes.  We have waited out all the existing transactions and any new
    1687             :      * transaction will have the new index in its list, but the index is still
    1688             :      * marked as "not-ready-for-inserts".  The index is consulted while
    1689             :      * deciding HOT-safety though.  This arrangement ensures that no new HOT
    1690             :      * chains can be created where the new tuple and the old tuple in the
    1691             :      * chain have different index keys.
    1692             :      *
    1693             :      * We now take a new snapshot, and build the index using all tuples that
    1694             :      * are visible in this snapshot.  We can be sure that any HOT updates to
    1695             :      * these tuples will be compatible with the index, since any updates made
    1696             :      * by transactions that didn't know about the index are now committed or
    1697             :      * rolled back.  Thus, each visible tuple is either the end of its
    1698             :      * HOT-chain or the extension of the chain is HOT-safe for this index.
    1699             :      */
    1700             : 
    1701             :     /* Set ActiveSnapshot since functions in the indexes may need it */
    1702         152 :     PushActiveSnapshot(GetTransactionSnapshot());
    1703             : 
    1704             :     /* Perform concurrent build of index */
    1705         152 :     index_concurrently_build(tableId, indexRelationId);
    1706             : 
    1707             :     /* we can do away with our snapshot */
    1708         134 :     PopActiveSnapshot();
    1709             : 
    1710             :     /*
    1711             :      * Commit this transaction to make the indisready update visible.
    1712             :      */
    1713         134 :     CommitTransactionCommand();
    1714         134 :     StartTransactionCommand();
    1715             : 
    1716             :     /* Tell concurrent index builds to ignore us, if index qualifies */
    1717         134 :     if (safe_index)
    1718         100 :         set_indexsafe_procflags();
    1719             : 
    1720             :     /*
    1721             :      * Phase 3 of concurrent index build
    1722             :      *
    1723             :      * We once again wait until no transaction can have the table open with
    1724             :      * the index marked as read-only for updates.
    1725             :      */
    1726         134 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_PHASE,
    1727             :                                  PROGRESS_CREATEIDX_PHASE_WAIT_2);
    1728         134 :     WaitForLockers(heaplocktag, ShareLock, true);
    1729             : 
    1730             :     /*
    1731             :      * Now take the "reference snapshot" that will be used by validate_index()
    1732             :      * to filter candidate tuples.  Beware!  There might still be snapshots in
    1733             :      * use that treat some transaction as in-progress that our reference
    1734             :      * snapshot treats as committed.  If such a recently-committed transaction
    1735             :      * deleted tuples in the table, we will not include them in the index; yet
    1736             :      * those transactions which see the deleting one as still-in-progress will
    1737             :      * expect such tuples to be there once we mark the index as valid.
    1738             :      *
    1739             :      * We solve this by waiting for all endangered transactions to exit before
    1740             :      * we mark the index as valid.
    1741             :      *
    1742             :      * We also set ActiveSnapshot to this snap, since functions in indexes may
    1743             :      * need a snapshot.
    1744             :      */
    1745         134 :     snapshot = RegisterSnapshot(GetTransactionSnapshot());
    1746         134 :     PushActiveSnapshot(snapshot);
    1747             : 
    1748             :     /*
    1749             :      * Scan the index and the heap, insert any missing index entries.
    1750             :      */
    1751         134 :     validate_index(tableId, indexRelationId, snapshot);
    1752             : 
    1753             :     /*
    1754             :      * Drop the reference snapshot.  We must do this before waiting out other
    1755             :      * snapshot holders, else we will deadlock against other processes also
    1756             :      * doing CREATE INDEX CONCURRENTLY, which would see our snapshot as one
    1757             :      * they must wait for.  But first, save the snapshot's xmin to use as
    1758             :      * limitXmin for GetCurrentVirtualXIDs().
    1759             :      */
    1760         134 :     limitXmin = snapshot->xmin;
    1761             : 
    1762         134 :     PopActiveSnapshot();
    1763         134 :     UnregisterSnapshot(snapshot);
    1764             : 
    1765             :     /*
    1766             :      * The snapshot subsystem could still contain registered snapshots that
    1767             :      * are holding back our process's advertised xmin; in particular, if
    1768             :      * default_transaction_isolation = serializable, there is a transaction
    1769             :      * snapshot that is still active.  The CatalogSnapshot is likewise a
    1770             :      * hazard.  To ensure no deadlocks, we must commit and start yet another
    1771             :      * transaction, and do our wait before any snapshot has been taken in it.
    1772             :      */
    1773         134 :     CommitTransactionCommand();
    1774         134 :     StartTransactionCommand();
    1775             : 
    1776             :     /* Tell concurrent index builds to ignore us, if index qualifies */
    1777         134 :     if (safe_index)
    1778         100 :         set_indexsafe_procflags();
    1779             : 
    1780             :     /* We should now definitely not be advertising any xmin. */
    1781             :     Assert(MyProc->xmin == InvalidTransactionId);
    1782             : 
    1783             :     /*
    1784             :      * The index is now valid in the sense that it contains all currently
    1785             :      * interesting tuples.  But since it might not contain tuples deleted just
    1786             :      * before the reference snap was taken, we have to wait out any
    1787             :      * transactions that might have older snapshots.
    1788             :      */
    1789         134 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_PHASE,
    1790             :                                  PROGRESS_CREATEIDX_PHASE_WAIT_3);
    1791         134 :     WaitForOlderSnapshots(limitXmin, true);
    1792             : 
    1793             :     /*
    1794             :      * Index can now be marked valid -- update its pg_index entry
    1795             :      */
    1796         134 :     index_set_state_flags(indexRelationId, INDEX_CREATE_SET_VALID);
    1797             : 
    1798             :     /*
    1799             :      * The pg_index update will cause backends (including this one) to update
    1800             :      * relcache entries for the index itself, but we should also send a
    1801             :      * relcache inval on the parent table to force replanning of cached plans.
    1802             :      * Otherwise existing sessions might fail to use the new index where it
    1803             :      * would be useful.  (Note that our earlier commits did not create reasons
    1804             :      * to replan; so relcache flush on the index itself was sufficient.)
    1805             :      */
    1806         134 :     CacheInvalidateRelcacheByRelid(heaprelid.relId);
    1807             : 
    1808             :     /*
    1809             :      * Last thing to do is release the session-level lock on the parent table.
    1810             :      */
    1811         134 :     UnlockRelationIdForSession(&heaprelid, ShareUpdateExclusiveLock);
    1812             : 
    1813         134 :     pgstat_progress_end_command();
    1814             : 
    1815         134 :     return address;
    1816             : }
    1817             : 
    1818             : 
    1819             : /*
    1820             :  * CheckPredicate
    1821             :  *      Checks that the given partial-index predicate is valid.
    1822             :  *
    1823             :  * This used to also constrain the form of the predicate to forms that
    1824             :  * indxpath.c could do something with.  However, that seems overly
    1825             :  * restrictive.  One useful application of partial indexes is to apply
    1826             :  * a UNIQUE constraint across a subset of a table, and in that scenario
    1827             :  * any evaluable predicate will work.  So accept any predicate here
    1828             :  * (except ones requiring a plan), and let indxpath.c fend for itself.
    1829             :  */
    1830             : static void
    1831         400 : CheckPredicate(Expr *predicate)
    1832             : {
    1833             :     /*
    1834             :      * transformExpr() should have already rejected subqueries, aggregates,
    1835             :      * and window functions, based on the EXPR_KIND_ for a predicate.
    1836             :      */
    1837             : 
    1838             :     /*
    1839             :      * A predicate using mutable functions is probably wrong, for the same
    1840             :      * reasons that we don't allow an index expression to use one.
    1841             :      */
    1842         400 :     if (contain_mutable_functions_after_planning(predicate))
    1843           0 :         ereport(ERROR,
    1844             :                 (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
    1845             :                  errmsg("functions in index predicate must be marked IMMUTABLE")));
    1846         400 : }
    1847             : 
    1848             : /*
    1849             :  * Compute per-index-column information, including indexed column numbers
    1850             :  * or index expressions, opclasses and their options. Note, all output vectors
    1851             :  * should be allocated for all columns, including "including" ones.
    1852             :  *
    1853             :  * If the caller switched to the table owner, ddl_userid is the role for ACL
    1854             :  * checks reached without traversing opaque expressions.  Otherwise, it's
    1855             :  * InvalidOid, and other ddl_* arguments are undefined.
    1856             :  */
    1857             : static void
    1858       27234 : ComputeIndexAttrs(IndexInfo *indexInfo,
    1859             :                   Oid *typeOids,
    1860             :                   Oid *collationOids,
    1861             :                   Oid *opclassOids,
    1862             :                   Datum *opclassOptions,
    1863             :                   int16 *colOptions,
    1864             :                   const List *attList,  /* list of IndexElem's */
    1865             :                   const List *exclusionOpNames,
    1866             :                   Oid relId,
    1867             :                   const char *accessMethodName,
    1868             :                   Oid accessMethodId,
    1869             :                   bool amcanorder,
    1870             :                   bool isconstraint,
    1871             :                   bool iswithoutoverlaps,
    1872             :                   Oid ddl_userid,
    1873             :                   int ddl_sec_context,
    1874             :                   int *ddl_save_nestlevel)
    1875             : {
    1876             :     ListCell   *nextExclOp;
    1877             :     ListCell   *lc;
    1878             :     int         attn;
    1879       27234 :     int         nkeycols = indexInfo->ii_NumIndexKeyAttrs;
    1880             :     Oid         save_userid;
    1881             :     int         save_sec_context;
    1882             : 
    1883             :     /* Allocate space for exclusion operator info, if needed */
    1884       27234 :     if (exclusionOpNames)
    1885             :     {
    1886             :         Assert(list_length(exclusionOpNames) == nkeycols);
    1887         288 :         indexInfo->ii_ExclusionOps = palloc_array(Oid, nkeycols);
    1888         288 :         indexInfo->ii_ExclusionProcs = palloc_array(Oid, nkeycols);
    1889         288 :         indexInfo->ii_ExclusionStrats = palloc_array(uint16, nkeycols);
    1890         288 :         nextExclOp = list_head(exclusionOpNames);
    1891             :     }
    1892             :     else
    1893       26946 :         nextExclOp = NULL;
    1894             : 
    1895             :     /* exclusionOpNames can be non-NIL if we are creating a partition */
    1896       27234 :     if (iswithoutoverlaps && exclusionOpNames == NIL)
    1897             :     {
    1898         368 :         indexInfo->ii_ExclusionOps = palloc_array(Oid, nkeycols);
    1899         368 :         indexInfo->ii_ExclusionProcs = palloc_array(Oid, nkeycols);
    1900         368 :         indexInfo->ii_ExclusionStrats = palloc_array(uint16, nkeycols);
    1901             :     }
    1902             : 
    1903       27234 :     if (OidIsValid(ddl_userid))
    1904       27132 :         GetUserIdAndSecContext(&save_userid, &save_sec_context);
    1905             : 
    1906             :     /*
    1907             :      * process attributeList
    1908             :      */
    1909       27234 :     attn = 0;
    1910       64804 :     foreach(lc, attList)
    1911             :     {
    1912       37800 :         IndexElem  *attribute = (IndexElem *) lfirst(lc);
    1913             :         Oid         atttype;
    1914             :         Oid         attcollation;
    1915             : 
    1916             :         /*
    1917             :          * Process the column-or-expression to be indexed.
    1918             :          */
    1919       37800 :         if (attribute->name != NULL)
    1920             :         {
    1921             :             /* Simple index attribute */
    1922             :             HeapTuple   atttuple;
    1923             :             Form_pg_attribute attform;
    1924             : 
    1925             :             Assert(attribute->expr == NULL);
    1926       36794 :             atttuple = SearchSysCacheAttName(relId, attribute->name);
    1927       36794 :             if (!HeapTupleIsValid(atttuple))
    1928             :             {
    1929             :                 /* difference in error message spellings is historical */
    1930          30 :                 if (isconstraint)
    1931          18 :                     ereport(ERROR,
    1932             :                             (errcode(ERRCODE_UNDEFINED_COLUMN),
    1933             :                              errmsg("column \"%s\" named in key does not exist",
    1934             :                                     attribute->name)));
    1935             :                 else
    1936          12 :                     ereport(ERROR,
    1937             :                             (errcode(ERRCODE_UNDEFINED_COLUMN),
    1938             :                              errmsg("column \"%s\" does not exist",
    1939             :                                     attribute->name)));
    1940             :             }
    1941       36764 :             attform = (Form_pg_attribute) GETSTRUCT(atttuple);
    1942       36764 :             indexInfo->ii_IndexAttrNumbers[attn] = attform->attnum;
    1943       36764 :             atttype = attform->atttypid;
    1944       36764 :             attcollation = attform->attcollation;
    1945       36764 :             ReleaseSysCache(atttuple);
    1946             :         }
    1947             :         else
    1948             :         {
    1949             :             /* Index expression */
    1950        1006 :             Node       *expr = attribute->expr;
    1951             : 
    1952             :             Assert(expr != NULL);
    1953             : 
    1954        1006 :             if (attn >= nkeycols)
    1955           0 :                 ereport(ERROR,
    1956             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    1957             :                          errmsg("expressions are not supported in included columns")));
    1958        1006 :             atttype = exprType(expr);
    1959        1006 :             attcollation = exprCollation(expr);
    1960             : 
    1961             :             /*
    1962             :              * Strip any top-level COLLATE clause.  This ensures that we treat
    1963             :              * "x COLLATE y" and "(x COLLATE y)" alike.
    1964             :              */
    1965        1036 :             while (IsA(expr, CollateExpr))
    1966          30 :                 expr = (Node *) ((CollateExpr *) expr)->arg;
    1967             : 
    1968        1006 :             if (IsA(expr, Var) &&
    1969          12 :                 ((Var *) expr)->varattno != InvalidAttrNumber)
    1970             :             {
    1971             :                 /*
    1972             :                  * User wrote "(column)" or "(column COLLATE something)".
    1973             :                  * Treat it like simple attribute anyway.
    1974             :                  */
    1975          12 :                 indexInfo->ii_IndexAttrNumbers[attn] = ((Var *) expr)->varattno;
    1976             :             }
    1977             :             else
    1978             :             {
    1979         994 :                 indexInfo->ii_IndexAttrNumbers[attn] = 0;    /* marks expression */
    1980         994 :                 indexInfo->ii_Expressions = lappend(indexInfo->ii_Expressions,
    1981             :                                                     expr);
    1982             : 
    1983             :                 /*
    1984             :                  * transformExpr() should have already rejected subqueries,
    1985             :                  * aggregates, and window functions, based on the EXPR_KIND_
    1986             :                  * for an index expression.
    1987             :                  */
    1988             : 
    1989             :                 /*
    1990             :                  * An expression using mutable functions is probably wrong,
    1991             :                  * since if you aren't going to get the same result for the
    1992             :                  * same data every time, it's not clear what the index entries
    1993             :                  * mean at all.
    1994             :                  */
    1995         994 :                 if (contain_mutable_functions_after_planning((Expr *) expr))
    1996         168 :                     ereport(ERROR,
    1997             :                             (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
    1998             :                              errmsg("functions in index expression must be marked IMMUTABLE")));
    1999             :             }
    2000             :         }
    2001             : 
    2002       37602 :         typeOids[attn] = atttype;
    2003             : 
    2004             :         /*
    2005             :          * Included columns have no collation, no opclass and no ordering
    2006             :          * options.
    2007             :          */
    2008       37602 :         if (attn >= nkeycols)
    2009             :         {
    2010         644 :             if (attribute->collation)
    2011           0 :                 ereport(ERROR,
    2012             :                         (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
    2013             :                          errmsg("including column does not support a collation")));
    2014         644 :             if (attribute->opclass)
    2015           0 :                 ereport(ERROR,
    2016             :                         (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
    2017             :                          errmsg("including column does not support an operator class")));
    2018         644 :             if (attribute->ordering != SORTBY_DEFAULT)
    2019           0 :                 ereport(ERROR,
    2020             :                         (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
    2021             :                          errmsg("including column does not support ASC/DESC options")));
    2022         644 :             if (attribute->nulls_ordering != SORTBY_NULLS_DEFAULT)
    2023           0 :                 ereport(ERROR,
    2024             :                         (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
    2025             :                          errmsg("including column does not support NULLS FIRST/LAST options")));
    2026             : 
    2027         644 :             opclassOids[attn] = InvalidOid;
    2028         644 :             opclassOptions[attn] = (Datum) 0;
    2029         644 :             colOptions[attn] = 0;
    2030         644 :             collationOids[attn] = InvalidOid;
    2031         644 :             attn++;
    2032             : 
    2033         644 :             continue;
    2034             :         }
    2035             : 
    2036             :         /*
    2037             :          * Apply collation override if any.  Use of ddl_userid is necessary
    2038             :          * due to ACL checks therein, and it's safe because collations don't
    2039             :          * contain opaque expressions (or non-opaque expressions).
    2040             :          */
    2041       36958 :         if (attribute->collation)
    2042             :         {
    2043         112 :             if (OidIsValid(ddl_userid))
    2044             :             {
    2045         112 :                 AtEOXact_GUC(false, *ddl_save_nestlevel);
    2046         112 :                 SetUserIdAndSecContext(ddl_userid, ddl_sec_context);
    2047             :             }
    2048         112 :             attcollation = get_collation_oid(attribute->collation, false);
    2049         110 :             if (OidIsValid(ddl_userid))
    2050             :             {
    2051         110 :                 SetUserIdAndSecContext(save_userid, save_sec_context);
    2052         110 :                 *ddl_save_nestlevel = NewGUCNestLevel();
    2053             :             }
    2054             :         }
    2055             : 
    2056             :         /*
    2057             :          * Check we have a collation iff it's a collatable type.  The only
    2058             :          * expected failures here are (1) COLLATE applied to a noncollatable
    2059             :          * type, or (2) index expression had an unresolved collation.  But we
    2060             :          * might as well code this to be a complete consistency check.
    2061             :          */
    2062       36956 :         if (type_is_collatable(atttype))
    2063             :         {
    2064        5784 :             if (!OidIsValid(attcollation))
    2065           0 :                 ereport(ERROR,
    2066             :                         (errcode(ERRCODE_INDETERMINATE_COLLATION),
    2067             :                          errmsg("could not determine which collation to use for index expression"),
    2068             :                          errhint("Use the COLLATE clause to set the collation explicitly.")));
    2069             :         }
    2070             :         else
    2071             :         {
    2072       31172 :             if (OidIsValid(attcollation))
    2073          12 :                 ereport(ERROR,
    2074             :                         (errcode(ERRCODE_DATATYPE_MISMATCH),
    2075             :                          errmsg("collations are not supported by type %s",
    2076             :                                 format_type_be(atttype))));
    2077             :         }
    2078             : 
    2079       36944 :         collationOids[attn] = attcollation;
    2080             : 
    2081             :         /*
    2082             :          * Identify the opclass to use.  Use of ddl_userid is necessary due to
    2083             :          * ACL checks therein.  This is safe despite opclasses containing
    2084             :          * opaque expressions (specifically, functions), because only
    2085             :          * superusers can define opclasses.
    2086             :          */
    2087       36944 :         if (OidIsValid(ddl_userid))
    2088             :         {
    2089       36836 :             AtEOXact_GUC(false, *ddl_save_nestlevel);
    2090       36836 :             SetUserIdAndSecContext(ddl_userid, ddl_sec_context);
    2091             :         }
    2092       36944 :         opclassOids[attn] = ResolveOpClass(attribute->opclass,
    2093             :                                            atttype,
    2094             :                                            accessMethodName,
    2095             :                                            accessMethodId);
    2096       36926 :         if (OidIsValid(ddl_userid))
    2097             :         {
    2098       36818 :             SetUserIdAndSecContext(save_userid, save_sec_context);
    2099       36818 :             *ddl_save_nestlevel = NewGUCNestLevel();
    2100             :         }
    2101             : 
    2102             :         /*
    2103             :          * Identify the exclusion operator, if any.
    2104             :          */
    2105       36926 :         if (nextExclOp)
    2106             :         {
    2107         444 :             List       *opname = (List *) lfirst(nextExclOp);
    2108             :             Oid         opid;
    2109             :             Oid         opfamily;
    2110             :             int         strat;
    2111             : 
    2112             :             /*
    2113             :              * Find the operator --- it must accept the column datatype
    2114             :              * without runtime coercion (but binary compatibility is OK).
    2115             :              * Operators contain opaque expressions (specifically, functions).
    2116             :              * compatible_oper_opid() boils down to oper() and
    2117             :              * IsBinaryCoercible().  PostgreSQL would have security problems
    2118             :              * elsewhere if oper() started calling opaque expressions.
    2119             :              */
    2120         444 :             if (OidIsValid(ddl_userid))
    2121             :             {
    2122         444 :                 AtEOXact_GUC(false, *ddl_save_nestlevel);
    2123         444 :                 SetUserIdAndSecContext(ddl_userid, ddl_sec_context);
    2124             :             }
    2125         444 :             opid = compatible_oper_opid(opname, atttype, atttype, false);
    2126         444 :             if (OidIsValid(ddl_userid))
    2127             :             {
    2128         444 :                 SetUserIdAndSecContext(save_userid, save_sec_context);
    2129         444 :                 *ddl_save_nestlevel = NewGUCNestLevel();
    2130             :             }
    2131             : 
    2132             :             /*
    2133             :              * Only allow commutative operators to be used in exclusion
    2134             :              * constraints. If X conflicts with Y, but Y does not conflict
    2135             :              * with X, bad things will happen.
    2136             :              */
    2137         444 :             if (get_commutator(opid) != opid)
    2138           0 :                 ereport(ERROR,
    2139             :                         (errcode(ERRCODE_WRONG_OBJECT_TYPE),
    2140             :                          errmsg("operator %s is not commutative",
    2141             :                                 format_operator(opid)),
    2142             :                          errdetail("Only commutative operators can be used in exclusion constraints.")));
    2143             : 
    2144             :             /*
    2145             :              * Operator must be a member of the right opfamily, too
    2146             :              */
    2147         444 :             opfamily = get_opclass_family(opclassOids[attn]);
    2148         444 :             strat = get_op_opfamily_strategy(opid, opfamily);
    2149         444 :             if (strat == 0)
    2150             :             {
    2151             :                 HeapTuple   opftuple;
    2152             :                 Form_pg_opfamily opfform;
    2153             : 
    2154             :                 /*
    2155             :                  * attribute->opclass might not explicitly name the opfamily,
    2156             :                  * so fetch the name of the selected opfamily for use in the
    2157             :                  * error message.
    2158             :                  */
    2159           0 :                 opftuple = SearchSysCache1(OPFAMILYOID,
    2160             :                                            ObjectIdGetDatum(opfamily));
    2161           0 :                 if (!HeapTupleIsValid(opftuple))
    2162           0 :                     elog(ERROR, "cache lookup failed for opfamily %u",
    2163             :                          opfamily);
    2164           0 :                 opfform = (Form_pg_opfamily) GETSTRUCT(opftuple);
    2165             : 
    2166           0 :                 ereport(ERROR,
    2167             :                         (errcode(ERRCODE_WRONG_OBJECT_TYPE),
    2168             :                          errmsg("operator %s is not a member of operator family \"%s\"",
    2169             :                                 format_operator(opid),
    2170             :                                 NameStr(opfform->opfname)),
    2171             :                          errdetail("The exclusion operator must be related to the index operator class for the constraint.")));
    2172             :             }
    2173             : 
    2174         444 :             indexInfo->ii_ExclusionOps[attn] = opid;
    2175         444 :             indexInfo->ii_ExclusionProcs[attn] = get_opcode(opid);
    2176         444 :             indexInfo->ii_ExclusionStrats[attn] = strat;
    2177         444 :             nextExclOp = lnext(exclusionOpNames, nextExclOp);
    2178             :         }
    2179       36482 :         else if (iswithoutoverlaps)
    2180             :         {
    2181             :             StrategyNumber strat;
    2182             :             Oid         opid;
    2183             : 
    2184         752 :             if (attn == nkeycols - 1)
    2185         356 :                 strat = RTOverlapStrategyNumber;
    2186             :             else
    2187         396 :                 strat = RTEqualStrategyNumber;
    2188         752 :             GetOperatorFromWellKnownStrategy(opclassOids[attn], InvalidOid,
    2189             :                                              &opid, &strat);
    2190         752 :             indexInfo->ii_ExclusionOps[attn] = opid;
    2191         752 :             indexInfo->ii_ExclusionProcs[attn] = get_opcode(opid);
    2192         752 :             indexInfo->ii_ExclusionStrats[attn] = strat;
    2193             :         }
    2194             : 
    2195             :         /*
    2196             :          * Set up the per-column options (indoption field).  For now, this is
    2197             :          * zero for any un-ordered index, while ordered indexes have DESC and
    2198             :          * NULLS FIRST/LAST options.
    2199             :          */
    2200       36926 :         colOptions[attn] = 0;
    2201       36926 :         if (amcanorder)
    2202             :         {
    2203             :             /* default ordering is ASC */
    2204       33288 :             if (attribute->ordering == SORTBY_DESC)
    2205          42 :                 colOptions[attn] |= INDOPTION_DESC;
    2206             :             /* default null ordering is LAST for ASC, FIRST for DESC */
    2207       33288 :             if (attribute->nulls_ordering == SORTBY_NULLS_DEFAULT)
    2208             :             {
    2209       33258 :                 if (attribute->ordering == SORTBY_DESC)
    2210          30 :                     colOptions[attn] |= INDOPTION_NULLS_FIRST;
    2211             :             }
    2212          30 :             else if (attribute->nulls_ordering == SORTBY_NULLS_FIRST)
    2213          12 :                 colOptions[attn] |= INDOPTION_NULLS_FIRST;
    2214             :         }
    2215             :         else
    2216             :         {
    2217             :             /* index AM does not support ordering */
    2218        3638 :             if (attribute->ordering != SORTBY_DEFAULT)
    2219           0 :                 ereport(ERROR,
    2220             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    2221             :                          errmsg("access method \"%s\" does not support ASC/DESC options",
    2222             :                                 accessMethodName)));
    2223        3638 :             if (attribute->nulls_ordering != SORTBY_NULLS_DEFAULT)
    2224           0 :                 ereport(ERROR,
    2225             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    2226             :                          errmsg("access method \"%s\" does not support NULLS FIRST/LAST options",
    2227             :                                 accessMethodName)));
    2228             :         }
    2229             : 
    2230             :         /* Set up the per-column opclass options (attoptions field). */
    2231       36926 :         if (attribute->opclassopts)
    2232             :         {
    2233             :             Assert(attn < nkeycols);
    2234             : 
    2235         138 :             opclassOptions[attn] =
    2236         138 :                 transformRelOptions((Datum) 0, attribute->opclassopts,
    2237             :                                     NULL, NULL, false, false);
    2238             :         }
    2239             :         else
    2240       36788 :             opclassOptions[attn] = (Datum) 0;
    2241             : 
    2242       36926 :         attn++;
    2243             :     }
    2244       27004 : }
    2245             : 
    2246             : /*
    2247             :  * Resolve possibly-defaulted operator class specification
    2248             :  *
    2249             :  * Note: This is used to resolve operator class specifications in index and
    2250             :  * partition key definitions.
    2251             :  */
    2252             : Oid
    2253       37076 : ResolveOpClass(const List *opclass, Oid attrType,
    2254             :                const char *accessMethodName, Oid accessMethodId)
    2255             : {
    2256             :     char       *schemaname;
    2257             :     char       *opcname;
    2258             :     HeapTuple   tuple;
    2259             :     Form_pg_opclass opform;
    2260             :     Oid         opClassId,
    2261             :                 opInputType;
    2262             : 
    2263       37076 :     if (opclass == NIL)
    2264             :     {
    2265             :         /* no operator class specified, so find the default */
    2266       19420 :         opClassId = GetDefaultOpClass(attrType, accessMethodId);
    2267       19420 :         if (!OidIsValid(opClassId))
    2268          18 :             ereport(ERROR,
    2269             :                     (errcode(ERRCODE_UNDEFINED_OBJECT),
    2270             :                      errmsg("data type %s has no default operator class for access method \"%s\"",
    2271             :                             format_type_be(attrType), accessMethodName),
    2272             :                      errhint("You must specify an operator class for the index or define a default operator class for the data type.")));
    2273       19402 :         return opClassId;
    2274             :     }
    2275             : 
    2276             :     /*
    2277             :      * Specific opclass name given, so look up the opclass.
    2278             :      */
    2279             : 
    2280             :     /* deconstruct the name list */
    2281       17656 :     DeconstructQualifiedName(opclass, &schemaname, &opcname);
    2282             : 
    2283       17656 :     if (schemaname)
    2284             :     {
    2285             :         /* Look in specific schema only */
    2286             :         Oid         namespaceId;
    2287             : 
    2288          10 :         namespaceId = LookupExplicitNamespace(schemaname, false);
    2289          10 :         tuple = SearchSysCache3(CLAAMNAMENSP,
    2290             :                                 ObjectIdGetDatum(accessMethodId),
    2291             :                                 PointerGetDatum(opcname),
    2292             :                                 ObjectIdGetDatum(namespaceId));
    2293             :     }
    2294             :     else
    2295             :     {
    2296             :         /* Unqualified opclass name, so search the search path */
    2297       17646 :         opClassId = OpclassnameGetOpcid(accessMethodId, opcname);
    2298       17646 :         if (!OidIsValid(opClassId))
    2299          12 :             ereport(ERROR,
    2300             :                     (errcode(ERRCODE_UNDEFINED_OBJECT),
    2301             :                      errmsg("operator class \"%s\" does not exist for access method \"%s\"",
    2302             :                             opcname, accessMethodName)));
    2303       17634 :         tuple = SearchSysCache1(CLAOID, ObjectIdGetDatum(opClassId));
    2304             :     }
    2305             : 
    2306       17644 :     if (!HeapTupleIsValid(tuple))
    2307           0 :         ereport(ERROR,
    2308             :                 (errcode(ERRCODE_UNDEFINED_OBJECT),
    2309             :                  errmsg("operator class \"%s\" does not exist for access method \"%s\"",
    2310             :                         NameListToString(opclass), accessMethodName)));
    2311             : 
    2312             :     /*
    2313             :      * Verify that the index operator class accepts this datatype.  Note we
    2314             :      * will accept binary compatibility.
    2315             :      */
    2316       17644 :     opform = (Form_pg_opclass) GETSTRUCT(tuple);
    2317       17644 :     opClassId = opform->oid;
    2318       17644 :     opInputType = opform->opcintype;
    2319             : 
    2320       17644 :     if (!IsBinaryCoercible(attrType, opInputType))
    2321           0 :         ereport(ERROR,
    2322             :                 (errcode(ERRCODE_DATATYPE_MISMATCH),
    2323             :                  errmsg("operator class \"%s\" does not accept data type %s",
    2324             :                         NameListToString(opclass), format_type_be(attrType))));
    2325             : 
    2326       17644 :     ReleaseSysCache(tuple);
    2327             : 
    2328       17644 :     return opClassId;
    2329             : }
    2330             : 
    2331             : /*
    2332             :  * GetDefaultOpClass
    2333             :  *
    2334             :  * Given the OIDs of a datatype and an access method, find the default
    2335             :  * operator class, if any.  Returns InvalidOid if there is none.
    2336             :  */
    2337             : Oid
    2338       93718 : GetDefaultOpClass(Oid type_id, Oid am_id)
    2339             : {
    2340       93718 :     Oid         result = InvalidOid;
    2341       93718 :     int         nexact = 0;
    2342       93718 :     int         ncompatible = 0;
    2343       93718 :     int         ncompatiblepreferred = 0;
    2344             :     Relation    rel;
    2345             :     ScanKeyData skey[1];
    2346             :     SysScanDesc scan;
    2347             :     HeapTuple   tup;
    2348             :     TYPCATEGORY tcategory;
    2349             : 
    2350             :     /* If it's a domain, look at the base type instead */
    2351       93718 :     type_id = getBaseType(type_id);
    2352             : 
    2353       93718 :     tcategory = TypeCategory(type_id);
    2354             : 
    2355             :     /*
    2356             :      * We scan through all the opclasses available for the access method,
    2357             :      * looking for one that is marked default and matches the target type
    2358             :      * (either exactly or binary-compatibly, but prefer an exact match).
    2359             :      *
    2360             :      * We could find more than one binary-compatible match.  If just one is
    2361             :      * for a preferred type, use that one; otherwise we fail, forcing the user
    2362             :      * to specify which one he wants.  (The preferred-type special case is a
    2363             :      * kluge for varchar: it's binary-compatible to both text and bpchar, so
    2364             :      * we need a tiebreaker.)  If we find more than one exact match, then
    2365             :      * someone put bogus entries in pg_opclass.
    2366             :      */
    2367       93718 :     rel = table_open(OperatorClassRelationId, AccessShareLock);
    2368             : 
    2369       93718 :     ScanKeyInit(&skey[0],
    2370             :                 Anum_pg_opclass_opcmethod,
    2371             :                 BTEqualStrategyNumber, F_OIDEQ,
    2372             :                 ObjectIdGetDatum(am_id));
    2373             : 
    2374       93718 :     scan = systable_beginscan(rel, OpclassAmNameNspIndexId, true,
    2375             :                               NULL, 1, skey);
    2376             : 
    2377     4110166 :     while (HeapTupleIsValid(tup = systable_getnext(scan)))
    2378             :     {
    2379     4016448 :         Form_pg_opclass opclass = (Form_pg_opclass) GETSTRUCT(tup);
    2380             : 
    2381             :         /* ignore altogether if not a default opclass */
    2382     4016448 :         if (!opclass->opcdefault)
    2383      603220 :             continue;
    2384     3413228 :         if (opclass->opcintype == type_id)
    2385             :         {
    2386       83454 :             nexact++;
    2387       83454 :             result = opclass->oid;
    2388             :         }
    2389     4989904 :         else if (nexact == 0 &&
    2390     1660130 :                  IsBinaryCoercible(type_id, opclass->opcintype))
    2391             :         {
    2392       20504 :             if (IsPreferredType(tcategory, opclass->opcintype))
    2393             :             {
    2394        1742 :                 ncompatiblepreferred++;
    2395        1742 :                 result = opclass->oid;
    2396             :             }
    2397       18762 :             else if (ncompatiblepreferred == 0)
    2398             :             {
    2399       18762 :                 ncompatible++;
    2400       18762 :                 result = opclass->oid;
    2401             :             }
    2402             :         }
    2403             :     }
    2404             : 
    2405       93718 :     systable_endscan(scan);
    2406             : 
    2407       93718 :     table_close(rel, AccessShareLock);
    2408             : 
    2409             :     /* raise error if pg_opclass contains inconsistent data */
    2410       93718 :     if (nexact > 1)
    2411           0 :         ereport(ERROR,
    2412             :                 (errcode(ERRCODE_DUPLICATE_OBJECT),
    2413             :                  errmsg("there are multiple default operator classes for data type %s",
    2414             :                         format_type_be(type_id))));
    2415             : 
    2416       93718 :     if (nexact == 1 ||
    2417        8524 :         ncompatiblepreferred == 1 ||
    2418        8524 :         (ncompatiblepreferred == 0 && ncompatible == 1))
    2419       92726 :         return result;
    2420             : 
    2421         992 :     return InvalidOid;
    2422             : }
    2423             : 
    2424             : /*
    2425             :  * GetOperatorFromWellKnownStrategy
    2426             :  *
    2427             :  * opclass - the opclass to use
    2428             :  * rhstype - the type for the right-hand side, or InvalidOid to use the type of the given opclass.
    2429             :  * opid - holds the operator we found
    2430             :  * strat - holds the input and output strategy number
    2431             :  *
    2432             :  * Finds an operator from a "well-known" strategy number.  This is used for
    2433             :  * temporal index constraints (and other temporal features) to look up
    2434             :  * equality and overlaps operators, since the strategy numbers for non-btree
    2435             :  * indexams need not follow any fixed scheme.  We ask an opclass support
    2436             :  * function to translate from the well-known number to the internal value.  If
    2437             :  * the function isn't defined or it gives no result, we return
    2438             :  * InvalidStrategy.
    2439             :  */
    2440             : void
    2441        1556 : GetOperatorFromWellKnownStrategy(Oid opclass, Oid rhstype,
    2442             :                                  Oid *opid, StrategyNumber *strat)
    2443             : {
    2444             :     Oid         opfamily;
    2445             :     Oid         opcintype;
    2446        1556 :     StrategyNumber instrat = *strat;
    2447             : 
    2448             :     Assert(instrat == RTEqualStrategyNumber || instrat == RTOverlapStrategyNumber || instrat == RTContainedByStrategyNumber);
    2449             : 
    2450        1556 :     *opid = InvalidOid;
    2451             : 
    2452        1556 :     if (get_opclass_opfamily_and_input_type(opclass, &opfamily, &opcintype))
    2453             :     {
    2454             :         /*
    2455             :          * Ask the opclass to translate to its internal stratnum
    2456             :          *
    2457             :          * For now we only need GiST support, but this could support other
    2458             :          * indexams if we wanted.
    2459             :          */
    2460        1556 :         *strat = GistTranslateStratnum(opclass, instrat);
    2461        1556 :         if (*strat == InvalidStrategy)
    2462             :         {
    2463             :             HeapTuple   tuple;
    2464             : 
    2465           0 :             tuple = SearchSysCache1(CLAOID, ObjectIdGetDatum(opclass));
    2466           0 :             if (!HeapTupleIsValid(tuple))
    2467           0 :                 elog(ERROR, "cache lookup failed for operator class %u", opclass);
    2468             : 
    2469           0 :             ereport(ERROR,
    2470             :                     errcode(ERRCODE_UNDEFINED_OBJECT),
    2471             :                     instrat == RTEqualStrategyNumber ? errmsg("could not identify an equality operator for type %s", format_type_be(opcintype)) :
    2472             :                     instrat == RTOverlapStrategyNumber ? errmsg("could not identify an overlaps operator for type %s", format_type_be(opcintype)) :
    2473             :                     instrat == RTContainedByStrategyNumber ? errmsg("could not identify a contained-by operator for type %s", format_type_be(opcintype)) : 0,
    2474             :                     errdetail("Could not translate strategy number %d for operator class \"%s\" for access method \"%s\".",
    2475             :                               instrat, NameStr(((Form_pg_opclass) GETSTRUCT(tuple))->opcname), "gist"));
    2476             :         }
    2477             : 
    2478             :         /*
    2479             :          * We parameterize rhstype so foreign keys can ask for a <@ operator
    2480             :          * whose rhs matches the aggregate function. For example range_agg
    2481             :          * returns anymultirange.
    2482             :          */
    2483        1556 :         if (!OidIsValid(rhstype))
    2484        1154 :             rhstype = opcintype;
    2485        1556 :         *opid = get_opfamily_member(opfamily, opcintype, rhstype, *strat);
    2486             :     }
    2487             : 
    2488        1556 :     if (!OidIsValid(*opid))
    2489             :     {
    2490             :         HeapTuple   tuple;
    2491             : 
    2492           0 :         tuple = SearchSysCache1(OPFAMILYOID, ObjectIdGetDatum(opfamily));
    2493           0 :         if (!HeapTupleIsValid(tuple))
    2494           0 :             elog(ERROR, "cache lookup failed for operator family %u", opfamily);
    2495             : 
    2496           0 :         ereport(ERROR,
    2497             :                 errcode(ERRCODE_UNDEFINED_OBJECT),
    2498             :                 instrat == RTEqualStrategyNumber ? errmsg("could not identify an equality operator for type %s", format_type_be(opcintype)) :
    2499             :                 instrat == RTOverlapStrategyNumber ? errmsg("could not identify an overlaps operator for type %s", format_type_be(opcintype)) :
    2500             :                 instrat == RTContainedByStrategyNumber ? errmsg("could not identify a contained-by operator for type %s", format_type_be(opcintype)) : 0,
    2501             :                 errdetail("There is no suitable operator in operator family \"%s\" for access method \"%s\".",
    2502             :                           NameStr(((Form_pg_opfamily) GETSTRUCT(tuple))->opfname), "gist"));
    2503             :     }
    2504        1556 : }
    2505             : 
    2506             : /*
    2507             :  *  makeObjectName()
    2508             :  *
    2509             :  *  Create a name for an implicitly created index, sequence, constraint,
    2510             :  *  extended statistics, etc.
    2511             :  *
    2512             :  *  The parameters are typically: the original table name, the original field
    2513             :  *  name, and a "type" string (such as "seq" or "pkey").    The field name
    2514             :  *  and/or type can be NULL if not relevant.
    2515             :  *
    2516             :  *  The result is a palloc'd string.
    2517             :  *
    2518             :  *  The basic result we want is "name1_name2_label", omitting "_name2" or
    2519             :  *  "_label" when those parameters are NULL.  However, we must generate
    2520             :  *  a name with less than NAMEDATALEN characters!  So, we truncate one or
    2521             :  *  both names if necessary to make a short-enough string.  The label part
    2522             :  *  is never truncated (so it had better be reasonably short).
    2523             :  *
    2524             :  *  The caller is responsible for checking uniqueness of the generated
    2525             :  *  name and retrying as needed; retrying will be done by altering the
    2526             :  *  "label" string (which is why we never truncate that part).
    2527             :  */
    2528             : char *
    2529       86192 : makeObjectName(const char *name1, const char *name2, const char *label)
    2530             : {
    2531             :     char       *name;
    2532       86192 :     int         overhead = 0;   /* chars needed for label and underscores */
    2533             :     int         availchars;     /* chars available for name(s) */
    2534             :     int         name1chars;     /* chars allocated to name1 */
    2535             :     int         name2chars;     /* chars allocated to name2 */
    2536             :     int         ndx;
    2537             : 
    2538       86192 :     name1chars = strlen(name1);
    2539       86192 :     if (name2)
    2540             :     {
    2541       77214 :         name2chars = strlen(name2);
    2542       77214 :         overhead++;             /* allow for separating underscore */
    2543             :     }
    2544             :     else
    2545        8978 :         name2chars = 0;
    2546       86192 :     if (label)
    2547       26212 :         overhead += strlen(label) + 1;
    2548             : 
    2549       86192 :     availchars = NAMEDATALEN - 1 - overhead;
    2550             :     Assert(availchars > 0);      /* else caller chose a bad label */
    2551             : 
    2552             :     /*
    2553             :      * If we must truncate, preferentially truncate the longer name. This
    2554             :      * logic could be expressed without a loop, but it's simple and obvious as
    2555             :      * a loop.
    2556             :      */
    2557       86258 :     while (name1chars + name2chars > availchars)
    2558             :     {
    2559          66 :         if (name1chars > name2chars)
    2560           0 :             name1chars--;
    2561             :         else
    2562          66 :             name2chars--;
    2563             :     }
    2564             : 
    2565       86192 :     name1chars = pg_mbcliplen(name1, name1chars, name1chars);
    2566       86192 :     if (name2)
    2567       77214 :         name2chars = pg_mbcliplen(name2, name2chars, name2chars);
    2568             : 
    2569             :     /* Now construct the string using the chosen lengths */
    2570       86192 :     name = palloc(name1chars + name2chars + overhead + 1);
    2571       86192 :     memcpy(name, name1, name1chars);
    2572       86192 :     ndx = name1chars;
    2573       86192 :     if (name2)
    2574             :     {
    2575       77214 :         name[ndx++] = '_';
    2576       77214 :         memcpy(name + ndx, name2, name2chars);
    2577       77214 :         ndx += name2chars;
    2578             :     }
    2579       86192 :     if (label)
    2580             :     {
    2581       26212 :         name[ndx++] = '_';
    2582       26212 :         strcpy(name + ndx, label);
    2583             :     }
    2584             :     else
    2585       59980 :         name[ndx] = '\0';
    2586             : 
    2587       86192 :     return name;
    2588             : }
    2589             : 
    2590             : /*
    2591             :  * Select a nonconflicting name for a new relation.  This is ordinarily
    2592             :  * used to choose index names (which is why it's here) but it can also
    2593             :  * be used for sequences, or any autogenerated relation kind.
    2594             :  *
    2595             :  * name1, name2, and label are used the same way as for makeObjectName(),
    2596             :  * except that the label can't be NULL; digits will be appended to the label
    2597             :  * if needed to create a name that is unique within the specified namespace.
    2598             :  *
    2599             :  * If isconstraint is true, we also avoid choosing a name matching any
    2600             :  * existing constraint in the same namespace.  (This is stricter than what
    2601             :  * Postgres itself requires, but the SQL standard says that constraint names
    2602             :  * should be unique within schemas, so we follow that for autogenerated
    2603             :  * constraint names.)
    2604             :  *
    2605             :  * Note: it is theoretically possible to get a collision anyway, if someone
    2606             :  * else chooses the same name concurrently.  This is fairly unlikely to be
    2607             :  * a problem in practice, especially if one is holding an exclusive lock on
    2608             :  * the relation identified by name1.  However, if choosing multiple names
    2609             :  * within a single command, you'd better create the new object and do
    2610             :  * CommandCounterIncrement before choosing the next one!
    2611             :  *
    2612             :  * Returns a palloc'd string.
    2613             :  */
    2614             : char *
    2615       13246 : ChooseRelationName(const char *name1, const char *name2,
    2616             :                    const char *label, Oid namespaceid,
    2617             :                    bool isconstraint)
    2618             : {
    2619       13246 :     int         pass = 0;
    2620       13246 :     char       *relname = NULL;
    2621             :     char        modlabel[NAMEDATALEN];
    2622             : 
    2623             :     /* try the unmodified label first */
    2624       13246 :     strlcpy(modlabel, label, sizeof(modlabel));
    2625             : 
    2626             :     for (;;)
    2627             :     {
    2628       14338 :         relname = makeObjectName(name1, name2, modlabel);
    2629             : 
    2630       14338 :         if (!OidIsValid(get_relname_relid(relname, namespaceid)))
    2631             :         {
    2632       13252 :             if (!isconstraint ||
    2633        8390 :                 !ConstraintNameExists(relname, namespaceid))
    2634             :                 break;
    2635             :         }
    2636             : 
    2637             :         /* found a conflict, so try a new name component */
    2638        1092 :         pfree(relname);
    2639        1092 :         snprintf(modlabel, sizeof(modlabel), "%s%d", label, ++pass);
    2640             :     }
    2641             : 
    2642       13246 :     return relname;
    2643             : }
    2644             : 
    2645             : /*
    2646             :  * Select the name to be used for an index.
    2647             :  *
    2648             :  * The argument list is pretty ad-hoc :-(
    2649             :  */
    2650             : static char *
    2651       11140 : ChooseIndexName(const char *tabname, Oid namespaceId,
    2652             :                 const List *colnames, const List *exclusionOpNames,
    2653             :                 bool primary, bool isconstraint)
    2654             : {
    2655             :     char       *indexname;
    2656             : 
    2657       11140 :     if (primary)
    2658             :     {
    2659             :         /* the primary key's name does not depend on the specific column(s) */
    2660        7500 :         indexname = ChooseRelationName(tabname,
    2661             :                                        NULL,
    2662             :                                        "pkey",
    2663             :                                        namespaceId,
    2664             :                                        true);
    2665             :     }
    2666        3640 :     else if (exclusionOpNames != NIL)
    2667             :     {
    2668         206 :         indexname = ChooseRelationName(tabname,
    2669         206 :                                        ChooseIndexNameAddition(colnames),
    2670             :                                        "excl",
    2671             :                                        namespaceId,
    2672             :                                        true);
    2673             :     }
    2674        3434 :     else if (isconstraint)
    2675             :     {
    2676         678 :         indexname = ChooseRelationName(tabname,
    2677         678 :                                        ChooseIndexNameAddition(colnames),
    2678             :                                        "key",
    2679             :                                        namespaceId,
    2680             :                                        true);
    2681             :     }
    2682             :     else
    2683             :     {
    2684        2756 :         indexname = ChooseRelationName(tabname,
    2685        2756 :                                        ChooseIndexNameAddition(colnames),
    2686             :                                        "idx",
    2687             :                                        namespaceId,
    2688             :                                        false);
    2689             :     }
    2690             : 
    2691       11140 :     return indexname;
    2692             : }
    2693             : 
    2694             : /*
    2695             :  * Generate "name2" for a new index given the list of column names for it
    2696             :  * (as produced by ChooseIndexColumnNames).  This will be passed to
    2697             :  * ChooseRelationName along with the parent table name and a suitable label.
    2698             :  *
    2699             :  * We know that less than NAMEDATALEN characters will actually be used,
    2700             :  * so we can truncate the result once we've generated that many.
    2701             :  *
    2702             :  * XXX See also ChooseForeignKeyConstraintNameAddition and
    2703             :  * ChooseExtendedStatisticNameAddition.
    2704             :  */
    2705             : static char *
    2706        3640 : ChooseIndexNameAddition(const List *colnames)
    2707             : {
    2708             :     char        buf[NAMEDATALEN * 2];
    2709        3640 :     int         buflen = 0;
    2710             :     ListCell   *lc;
    2711             : 
    2712        3640 :     buf[0] = '\0';
    2713        8294 :     foreach(lc, colnames)
    2714             :     {
    2715        4654 :         const char *name = (const char *) lfirst(lc);
    2716             : 
    2717        4654 :         if (buflen > 0)
    2718        1014 :             buf[buflen++] = '_';    /* insert _ between names */
    2719             : 
    2720             :         /*
    2721             :          * At this point we have buflen <= NAMEDATALEN.  name should be less
    2722             :          * than NAMEDATALEN already, but use strlcpy for paranoia.
    2723             :          */
    2724        4654 :         strlcpy(buf + buflen, name, NAMEDATALEN);
    2725        4654 :         buflen += strlen(buf + buflen);
    2726        4654 :         if (buflen >= NAMEDATALEN)
    2727           0 :             break;
    2728             :     }
    2729        3640 :     return pstrdup(buf);
    2730             : }
    2731             : 
    2732             : /*
    2733             :  * Select the actual names to be used for the columns of an index, given the
    2734             :  * list of IndexElems for the columns.  This is mostly about ensuring the
    2735             :  * names are unique so we don't get a conflicting-attribute-names error.
    2736             :  *
    2737             :  * Returns a List of plain strings (char *, not String nodes).
    2738             :  */
    2739             : static List *
    2740       27220 : ChooseIndexColumnNames(const List *indexElems)
    2741             : {
    2742       27220 :     List       *result = NIL;
    2743             :     ListCell   *lc;
    2744             : 
    2745       65058 :     foreach(lc, indexElems)
    2746             :     {
    2747       37838 :         IndexElem  *ielem = (IndexElem *) lfirst(lc);
    2748             :         const char *origname;
    2749             :         const char *curname;
    2750             :         int         i;
    2751             :         char        buf[NAMEDATALEN];
    2752             : 
    2753             :         /* Get the preliminary name from the IndexElem */
    2754       37838 :         if (ielem->indexcolname)
    2755        2852 :             origname = ielem->indexcolname; /* caller-specified name */
    2756       34986 :         else if (ielem->name)
    2757       34588 :             origname = ielem->name; /* simple column reference */
    2758             :         else
    2759         398 :             origname = "expr";    /* default name for expression */
    2760             : 
    2761             :         /* If it conflicts with any previous column, tweak it */
    2762       37838 :         curname = origname;
    2763       37838 :         for (i = 1;; i++)
    2764          62 :         {
    2765             :             ListCell   *lc2;
    2766             :             char        nbuf[32];
    2767             :             int         nlen;
    2768             : 
    2769       60002 :             foreach(lc2, result)
    2770             :             {
    2771       22164 :                 if (strcmp(curname, (char *) lfirst(lc2)) == 0)
    2772          62 :                     break;
    2773             :             }
    2774       37900 :             if (lc2 == NULL)
    2775       37838 :                 break;          /* found nonconflicting name */
    2776             : 
    2777          62 :             sprintf(nbuf, "%d", i);
    2778             : 
    2779             :             /* Ensure generated names are shorter than NAMEDATALEN */
    2780          62 :             nlen = pg_mbcliplen(origname, strlen(origname),
    2781          62 :                                 NAMEDATALEN - 1 - strlen(nbuf));
    2782          62 :             memcpy(buf, origname, nlen);
    2783          62 :             strcpy(buf + nlen, nbuf);
    2784          62 :             curname = buf;
    2785             :         }
    2786             : 
    2787             :         /* And attach to the result list */
    2788       37838 :         result = lappend(result, pstrdup(curname));
    2789             :     }
    2790       27220 :     return result;
    2791             : }
    2792             : 
    2793             : /*
    2794             :  * ExecReindex
    2795             :  *
    2796             :  * Primary entry point for manual REINDEX commands.  This is mainly a
    2797             :  * preparation wrapper for the real operations that will happen in
    2798             :  * each subroutine of REINDEX.
    2799             :  */
    2800             : void
    2801        1058 : ExecReindex(ParseState *pstate, const ReindexStmt *stmt, bool isTopLevel)
    2802             : {
    2803        1058 :     ReindexParams params = {0};
    2804             :     ListCell   *lc;
    2805        1058 :     bool        concurrently = false;
    2806        1058 :     bool        verbose = false;
    2807        1058 :     char       *tablespacename = NULL;
    2808             : 
    2809             :     /* Parse option list */
    2810        1782 :     foreach(lc, stmt->params)
    2811             :     {
    2812         724 :         DefElem    *opt = (DefElem *) lfirst(lc);
    2813             : 
    2814         724 :         if (strcmp(opt->defname, "verbose") == 0)
    2815          14 :             verbose = defGetBoolean(opt);
    2816         710 :         else if (strcmp(opt->defname, "concurrently") == 0)
    2817         582 :             concurrently = defGetBoolean(opt);
    2818         128 :         else if (strcmp(opt->defname, "tablespace") == 0)
    2819         128 :             tablespacename = defGetString(opt);
    2820             :         else
    2821           0 :             ereport(ERROR,
    2822             :                     (errcode(ERRCODE_SYNTAX_ERROR),
    2823             :                      errmsg("unrecognized REINDEX option \"%s\"",
    2824             :                             opt->defname),
    2825             :                      parser_errposition(pstate, opt->location)));
    2826             :     }
    2827             : 
    2828        1058 :     if (concurrently)
    2829         582 :         PreventInTransactionBlock(isTopLevel,
    2830             :                                   "REINDEX CONCURRENTLY");
    2831             : 
    2832        1040 :     params.options =
    2833        2080 :         (verbose ? REINDEXOPT_VERBOSE : 0) |
    2834        1040 :         (concurrently ? REINDEXOPT_CONCURRENTLY : 0);
    2835             : 
    2836             :     /*
    2837             :      * Assign the tablespace OID to move indexes to, with InvalidOid to do
    2838             :      * nothing.
    2839             :      */
    2840        1040 :     if (tablespacename != NULL)
    2841             :     {
    2842         128 :         params.tablespaceOid = get_tablespace_oid(tablespacename, false);
    2843             : 
    2844             :         /* Check permissions except when moving to database's default */
    2845         128 :         if (OidIsValid(params.tablespaceOid) &&
    2846         128 :             params.tablespaceOid != MyDatabaseTableSpace)
    2847             :         {
    2848             :             AclResult   aclresult;
    2849             : 
    2850         128 :             aclresult = object_aclcheck(TableSpaceRelationId, params.tablespaceOid,
    2851             :                                         GetUserId(), ACL_CREATE);
    2852         128 :             if (aclresult != ACLCHECK_OK)
    2853          12 :                 aclcheck_error(aclresult, OBJECT_TABLESPACE,
    2854          12 :                                get_tablespace_name(params.tablespaceOid));
    2855             :         }
    2856             :     }
    2857             :     else
    2858         912 :         params.tablespaceOid = InvalidOid;
    2859             : 
    2860        1028 :     switch (stmt->kind)
    2861             :     {
    2862         366 :         case REINDEX_OBJECT_INDEX:
    2863         366 :             ReindexIndex(stmt, &params, isTopLevel);
    2864         260 :             break;
    2865         480 :         case REINDEX_OBJECT_TABLE:
    2866         480 :             ReindexTable(stmt, &params, isTopLevel);
    2867         358 :             break;
    2868         182 :         case REINDEX_OBJECT_SCHEMA:
    2869             :         case REINDEX_OBJECT_SYSTEM:
    2870             :         case REINDEX_OBJECT_DATABASE:
    2871             : 
    2872             :             /*
    2873             :              * This cannot run inside a user transaction block; if we were
    2874             :              * inside a transaction, then its commit- and
    2875             :              * start-transaction-command calls would not have the intended
    2876             :              * effect!
    2877             :              */
    2878         182 :             PreventInTransactionBlock(isTopLevel,
    2879         250 :                                       (stmt->kind == REINDEX_OBJECT_SCHEMA) ? "REINDEX SCHEMA" :
    2880          68 :                                       (stmt->kind == REINDEX_OBJECT_SYSTEM) ? "REINDEX SYSTEM" :
    2881             :                                       "REINDEX DATABASE");
    2882         176 :             ReindexMultipleTables(stmt, &params);
    2883         126 :             break;
    2884           0 :         default:
    2885           0 :             elog(ERROR, "unrecognized object type: %d",
    2886             :                  (int) stmt->kind);
    2887             :             break;
    2888             :     }
    2889         744 : }
    2890             : 
    2891             : /*
    2892             :  * ReindexIndex
    2893             :  *      Recreate a specific index.
    2894             :  */
    2895             : static void
    2896         366 : ReindexIndex(const ReindexStmt *stmt, const ReindexParams *params, bool isTopLevel)
    2897             : {
    2898         366 :     const RangeVar *indexRelation = stmt->relation;
    2899             :     struct ReindexIndexCallbackState state;
    2900             :     Oid         indOid;
    2901             :     char        persistence;
    2902             :     char        relkind;
    2903             : 
    2904             :     /*
    2905             :      * Find and lock index, and check permissions on table; use callback to
    2906             :      * obtain lock on table first, to avoid deadlock hazard.  The lock level
    2907             :      * used here must match the index lock obtained in reindex_index().
    2908             :      *
    2909             :      * If it's a temporary index, we will perform a non-concurrent reindex,
    2910             :      * even if CONCURRENTLY was requested.  In that case, reindex_index() will
    2911             :      * upgrade the lock, but that's OK, because other sessions can't hold
    2912             :      * locks on our temporary table.
    2913             :      */
    2914         366 :     state.params = *params;
    2915         366 :     state.locked_table_oid = InvalidOid;
    2916         366 :     indOid = RangeVarGetRelidExtended(indexRelation,
    2917         366 :                                       (params->options & REINDEXOPT_CONCURRENTLY) != 0 ?
    2918             :                                       ShareUpdateExclusiveLock : AccessExclusiveLock,
    2919             :                                       0,
    2920             :                                       RangeVarCallbackForReindexIndex,
    2921             :                                       &state);
    2922             : 
    2923             :     /*
    2924             :      * Obtain the current persistence and kind of the existing index.  We
    2925             :      * already hold a lock on the index.
    2926             :      */
    2927         318 :     persistence = get_rel_persistence(indOid);
    2928         318 :     relkind = get_rel_relkind(indOid);
    2929             : 
    2930         318 :     if (relkind == RELKIND_PARTITIONED_INDEX)
    2931          36 :         ReindexPartitions(stmt, indOid, params, isTopLevel);
    2932         282 :     else if ((params->options & REINDEXOPT_CONCURRENTLY) != 0 &&
    2933             :              persistence != RELPERSISTENCE_TEMP)
    2934         162 :         ReindexRelationConcurrently(stmt, indOid, params);
    2935             :     else
    2936             :     {
    2937         120 :         ReindexParams newparams = *params;
    2938             : 
    2939         120 :         newparams.options |= REINDEXOPT_REPORT_PROGRESS;
    2940         120 :         reindex_index(stmt, indOid, false, persistence, &newparams);
    2941             :     }
    2942         260 : }
    2943             : 
    2944             : /*
    2945             :  * Check permissions on table before acquiring relation lock; also lock
    2946             :  * the heap before the RangeVarGetRelidExtended takes the index lock, to avoid
    2947             :  * deadlocks.
    2948             :  */
    2949             : static void
    2950         372 : RangeVarCallbackForReindexIndex(const RangeVar *relation,
    2951             :                                 Oid relId, Oid oldRelId, void *arg)
    2952             : {
    2953             :     char        relkind;
    2954         372 :     struct ReindexIndexCallbackState *state = arg;
    2955             :     LOCKMODE    table_lockmode;
    2956             :     Oid         table_oid;
    2957             : 
    2958             :     /*
    2959             :      * Lock level here should match table lock in reindex_index() for
    2960             :      * non-concurrent case and table locks used by index_concurrently_*() for
    2961             :      * concurrent case.
    2962             :      */
    2963         744 :     table_lockmode = (state->params.options & REINDEXOPT_CONCURRENTLY) != 0 ?
    2964         372 :         ShareUpdateExclusiveLock : ShareLock;
    2965             : 
    2966             :     /*
    2967             :      * If we previously locked some other index's heap, and the name we're
    2968             :      * looking up no longer refers to that relation, release the now-useless
    2969             :      * lock.
    2970             :      */
    2971         372 :     if (relId != oldRelId && OidIsValid(oldRelId))
    2972             :     {
    2973           6 :         UnlockRelationOid(state->locked_table_oid, table_lockmode);
    2974           6 :         state->locked_table_oid = InvalidOid;
    2975             :     }
    2976             : 
    2977             :     /* If the relation does not exist, there's nothing more to do. */
    2978         372 :     if (!OidIsValid(relId))
    2979          12 :         return;
    2980             : 
    2981             :     /*
    2982             :      * If the relation does exist, check whether it's an index.  But note that
    2983             :      * the relation might have been dropped between the time we did the name
    2984             :      * lookup and now.  In that case, there's nothing to do.
    2985             :      */
    2986         360 :     relkind = get_rel_relkind(relId);
    2987         360 :     if (!relkind)
    2988           0 :         return;
    2989         360 :     if (relkind != RELKIND_INDEX &&
    2990             :         relkind != RELKIND_PARTITIONED_INDEX)
    2991          24 :         ereport(ERROR,
    2992             :                 (errcode(ERRCODE_WRONG_OBJECT_TYPE),
    2993             :                  errmsg("\"%s\" is not an index", relation->relname)));
    2994             : 
    2995             :     /* Check permissions */
    2996         336 :     table_oid = IndexGetRelation(relId, true);
    2997         336 :     if (OidIsValid(table_oid))
    2998             :     {
    2999             :         AclResult   aclresult;
    3000             : 
    3001         336 :         aclresult = pg_class_aclcheck(table_oid, GetUserId(), ACL_MAINTAIN);
    3002         336 :         if (aclresult != ACLCHECK_OK)
    3003          12 :             aclcheck_error(aclresult, OBJECT_INDEX, relation->relname);
    3004             :     }
    3005             : 
    3006             :     /* Lock heap before index to avoid deadlock. */
    3007         324 :     if (relId != oldRelId)
    3008             :     {
    3009             :         /*
    3010             :          * If the OID isn't valid, it means the index was concurrently
    3011             :          * dropped, which is not a problem for us; just return normally.
    3012             :          */
    3013         324 :         if (OidIsValid(table_oid))
    3014             :         {
    3015         324 :             LockRelationOid(table_oid, table_lockmode);
    3016         324 :             state->locked_table_oid = table_oid;
    3017             :         }
    3018             :     }
    3019             : }
    3020             : 
    3021             : /*
    3022             :  * ReindexTable
    3023             :  *      Recreate all indexes of a table (and of its toast table, if any)
    3024             :  */
    3025             : static Oid
    3026         480 : ReindexTable(const ReindexStmt *stmt, const ReindexParams *params, bool isTopLevel)
    3027             : {
    3028             :     Oid         heapOid;
    3029             :     bool        result;
    3030         480 :     const RangeVar *relation = stmt->relation;
    3031             : 
    3032             :     /*
    3033             :      * The lock level used here should match reindex_relation().
    3034             :      *
    3035             :      * If it's a temporary table, we will perform a non-concurrent reindex,
    3036             :      * even if CONCURRENTLY was requested.  In that case, reindex_relation()
    3037             :      * will upgrade the lock, but that's OK, because other sessions can't hold
    3038             :      * locks on our temporary table.
    3039             :      */
    3040         480 :     heapOid = RangeVarGetRelidExtended(relation,
    3041         480 :                                        (params->options & REINDEXOPT_CONCURRENTLY) != 0 ?
    3042             :                                        ShareUpdateExclusiveLock : ShareLock,
    3043             :                                        0,
    3044             :                                        RangeVarCallbackMaintainsTable, NULL);
    3045             : 
    3046         434 :     if (get_rel_relkind(heapOid) == RELKIND_PARTITIONED_TABLE)
    3047          70 :         ReindexPartitions(stmt, heapOid, params, isTopLevel);
    3048         598 :     else if ((params->options & REINDEXOPT_CONCURRENTLY) != 0 &&
    3049         234 :              get_rel_persistence(heapOid) != RELPERSISTENCE_TEMP)
    3050             :     {
    3051         222 :         result = ReindexRelationConcurrently(stmt, heapOid, params);
    3052             : 
    3053         184 :         if (!result)
    3054          18 :             ereport(NOTICE,
    3055             :                     (errmsg("table \"%s\" has no indexes that can be reindexed concurrently",
    3056             :                             relation->relname)));
    3057             :     }
    3058             :     else
    3059             :     {
    3060         142 :         ReindexParams newparams = *params;
    3061             : 
    3062         142 :         newparams.options |= REINDEXOPT_REPORT_PROGRESS;
    3063         142 :         result = reindex_relation(stmt, heapOid,
    3064             :                                   REINDEX_REL_PROCESS_TOAST |
    3065             :                                   REINDEX_REL_CHECK_CONSTRAINTS,
    3066             :                                   &newparams);
    3067         110 :         if (!result)
    3068          12 :             ereport(NOTICE,
    3069             :                     (errmsg("table \"%s\" has no indexes to reindex",
    3070             :                             relation->relname)));
    3071             :     }
    3072             : 
    3073         358 :     return heapOid;
    3074             : }
    3075             : 
    3076             : /*
    3077             :  * ReindexMultipleTables
    3078             :  *      Recreate indexes of tables selected by objectName/objectKind.
    3079             :  *
    3080             :  * To reduce the probability of deadlocks, each table is reindexed in a
    3081             :  * separate transaction, so we can release the lock on it right away.
    3082             :  * That means this must not be called within a user transaction block!
    3083             :  */
    3084             : static void
    3085         176 : ReindexMultipleTables(const ReindexStmt *stmt, const ReindexParams *params)
    3086             : {
    3087             : 
    3088             :     Oid         objectOid;
    3089             :     Relation    relationRelation;
    3090             :     TableScanDesc scan;
    3091             :     ScanKeyData scan_keys[1];
    3092             :     HeapTuple   tuple;
    3093             :     MemoryContext private_context;
    3094             :     MemoryContext old;
    3095         176 :     List       *relids = NIL;
    3096             :     int         num_keys;
    3097         176 :     bool        concurrent_warning = false;
    3098         176 :     bool        tablespace_warning = false;
    3099         176 :     const char *objectName = stmt->name;
    3100         176 :     const ReindexObjectType objectKind = stmt->kind;
    3101             : 
    3102             :     Assert(objectKind == REINDEX_OBJECT_SCHEMA ||
    3103             :            objectKind == REINDEX_OBJECT_SYSTEM ||
    3104             :            objectKind == REINDEX_OBJECT_DATABASE);
    3105             : 
    3106             :     /*
    3107             :      * This matches the options enforced by the grammar, where the object name
    3108             :      * is optional for DATABASE and SYSTEM.
    3109             :      */
    3110             :     Assert(objectName || objectKind != REINDEX_OBJECT_SCHEMA);
    3111             : 
    3112         176 :     if (objectKind == REINDEX_OBJECT_SYSTEM &&
    3113          34 :         (params->options & REINDEXOPT_CONCURRENTLY) != 0)
    3114          20 :         ereport(ERROR,
    3115             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3116             :                  errmsg("cannot reindex system catalogs concurrently")));
    3117             : 
    3118             :     /*
    3119             :      * Get OID of object to reindex, being the database currently being used
    3120             :      * by session for a database or for system catalogs, or the schema defined
    3121             :      * by caller. At the same time do permission checks that need different
    3122             :      * processing depending on the object type.
    3123             :      */
    3124         156 :     if (objectKind == REINDEX_OBJECT_SCHEMA)
    3125             :     {
    3126         108 :         objectOid = get_namespace_oid(objectName, false);
    3127             : 
    3128         102 :         if (!object_ownercheck(NamespaceRelationId, objectOid, GetUserId()) &&
    3129          24 :             !has_privs_of_role(GetUserId(), ROLE_PG_MAINTAIN))
    3130          18 :             aclcheck_error(ACLCHECK_NOT_OWNER, OBJECT_SCHEMA,
    3131             :                            objectName);
    3132             :     }
    3133             :     else
    3134             :     {
    3135          48 :         objectOid = MyDatabaseId;
    3136             : 
    3137          48 :         if (objectName && strcmp(objectName, get_database_name(objectOid)) != 0)
    3138           6 :             ereport(ERROR,
    3139             :                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3140             :                      errmsg("can only reindex the currently open database")));
    3141          42 :         if (!object_ownercheck(DatabaseRelationId, objectOid, GetUserId()) &&
    3142           0 :             !has_privs_of_role(GetUserId(), ROLE_PG_MAINTAIN))
    3143           0 :             aclcheck_error(ACLCHECK_NOT_OWNER, OBJECT_DATABASE,
    3144           0 :                            get_database_name(objectOid));
    3145             :     }
    3146             : 
    3147             :     /*
    3148             :      * Create a memory context that will survive forced transaction commits we
    3149             :      * do below.  Since it is a child of PortalContext, it will go away
    3150             :      * eventually even if we suffer an error; there's no need for special
    3151             :      * abort cleanup logic.
    3152             :      */
    3153         126 :     private_context = AllocSetContextCreate(PortalContext,
    3154             :                                             "ReindexMultipleTables",
    3155             :                                             ALLOCSET_SMALL_SIZES);
    3156             : 
    3157             :     /*
    3158             :      * Define the search keys to find the objects to reindex. For a schema, we
    3159             :      * select target relations using relnamespace, something not necessary for
    3160             :      * a database-wide operation.
    3161             :      */
    3162         126 :     if (objectKind == REINDEX_OBJECT_SCHEMA)
    3163             :     {
    3164          84 :         num_keys = 1;
    3165          84 :         ScanKeyInit(&scan_keys[0],
    3166             :                     Anum_pg_class_relnamespace,
    3167             :                     BTEqualStrategyNumber, F_OIDEQ,
    3168             :                     ObjectIdGetDatum(objectOid));
    3169             :     }
    3170             :     else
    3171          42 :         num_keys = 0;
    3172             : 
    3173             :     /*
    3174             :      * Scan pg_class to build a list of the relations we need to reindex.
    3175             :      *
    3176             :      * We only consider plain relations and materialized views here (toast
    3177             :      * rels will be processed indirectly by reindex_relation).
    3178             :      */
    3179         126 :     relationRelation = table_open(RelationRelationId, AccessShareLock);
    3180         126 :     scan = table_beginscan_catalog(relationRelation, num_keys, scan_keys);
    3181       20176 :     while ((tuple = heap_getnext(scan, ForwardScanDirection)) != NULL)
    3182             :     {
    3183       20050 :         Form_pg_class classtuple = (Form_pg_class) GETSTRUCT(tuple);
    3184       20050 :         Oid         relid = classtuple->oid;
    3185             : 
    3186             :         /*
    3187             :          * Only regular tables and matviews can have indexes, so ignore any
    3188             :          * other kind of relation.
    3189             :          *
    3190             :          * Partitioned tables/indexes are skipped but matching leaf partitions
    3191             :          * are processed.
    3192             :          */
    3193       20050 :         if (classtuple->relkind != RELKIND_RELATION &&
    3194       16492 :             classtuple->relkind != RELKIND_MATVIEW)
    3195       16474 :             continue;
    3196             : 
    3197             :         /* Skip temp tables of other backends; we can't reindex them at all */
    3198        3576 :         if (classtuple->relpersistence == RELPERSISTENCE_TEMP &&
    3199          36 :             !isTempNamespace(classtuple->relnamespace))
    3200           0 :             continue;
    3201             : 
    3202             :         /*
    3203             :          * Check user/system classification.  SYSTEM processes all the
    3204             :          * catalogs, and DATABASE processes everything that's not a catalog.
    3205             :          */
    3206        3576 :         if (objectKind == REINDEX_OBJECT_SYSTEM &&
    3207         984 :             !IsCatalogRelationOid(relid))
    3208          88 :             continue;
    3209        5408 :         else if (objectKind == REINDEX_OBJECT_DATABASE &&
    3210        1920 :                  IsCatalogRelationOid(relid))
    3211        1792 :             continue;
    3212             : 
    3213             :         /*
    3214             :          * We already checked privileges on the database or schema, but we
    3215             :          * further restrict reindexing shared catalogs to roles with the
    3216             :          * MAINTAIN privilege on the relation.
    3217             :          */
    3218        1938 :         if (classtuple->relisshared &&
    3219         242 :             pg_class_aclcheck(relid, GetUserId(), ACL_MAINTAIN) != ACLCHECK_OK)
    3220           0 :             continue;
    3221             : 
    3222             :         /*
    3223             :          * Skip system tables, since index_create() would reject indexing them
    3224             :          * concurrently (and it would likely fail if we tried).
    3225             :          */
    3226        2178 :         if ((params->options & REINDEXOPT_CONCURRENTLY) != 0 &&
    3227         482 :             IsCatalogRelationOid(relid))
    3228             :         {
    3229         384 :             if (!concurrent_warning)
    3230           6 :                 ereport(WARNING,
    3231             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3232             :                          errmsg("cannot reindex system catalogs concurrently, skipping all")));
    3233         384 :             concurrent_warning = true;
    3234         384 :             continue;
    3235             :         }
    3236             : 
    3237             :         /*
    3238             :          * If a new tablespace is set, check if this relation has to be
    3239             :          * skipped.
    3240             :          */
    3241        1312 :         if (OidIsValid(params->tablespaceOid))
    3242             :         {
    3243           0 :             bool        skip_rel = false;
    3244             : 
    3245             :             /*
    3246             :              * Mapped relations cannot be moved to different tablespaces (in
    3247             :              * particular this eliminates all shared catalogs.).
    3248             :              */
    3249           0 :             if (RELKIND_HAS_STORAGE(classtuple->relkind) &&
    3250           0 :                 !RelFileNumberIsValid(classtuple->relfilenode))
    3251           0 :                 skip_rel = true;
    3252             : 
    3253             :             /*
    3254             :              * A system relation is always skipped, even with
    3255             :              * allow_system_table_mods enabled.
    3256             :              */
    3257           0 :             if (IsSystemClass(relid, classtuple))
    3258           0 :                 skip_rel = true;
    3259             : 
    3260           0 :             if (skip_rel)
    3261             :             {
    3262           0 :                 if (!tablespace_warning)
    3263           0 :                     ereport(WARNING,
    3264             :                             (errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
    3265             :                              errmsg("cannot move system relations, skipping all")));
    3266           0 :                 tablespace_warning = true;
    3267           0 :                 continue;
    3268             :             }
    3269             :         }
    3270             : 
    3271             :         /* Save the list of relation OIDs in private context */
    3272        1312 :         old = MemoryContextSwitchTo(private_context);
    3273             : 
    3274             :         /*
    3275             :          * We always want to reindex pg_class first if it's selected to be
    3276             :          * reindexed.  This ensures that if there is any corruption in
    3277             :          * pg_class' indexes, they will be fixed before we process any other
    3278             :          * tables.  This is critical because reindexing itself will try to
    3279             :          * update pg_class.
    3280             :          */
    3281        1312 :         if (relid == RelationRelationId)
    3282          16 :             relids = lcons_oid(relid, relids);
    3283             :         else
    3284        1296 :             relids = lappend_oid(relids, relid);
    3285             : 
    3286        1312 :         MemoryContextSwitchTo(old);
    3287             :     }
    3288         126 :     table_endscan(scan);
    3289         126 :     table_close(relationRelation, AccessShareLock);
    3290             : 
    3291             :     /*
    3292             :      * Process each relation listed in a separate transaction.  Note that this
    3293             :      * commits and then starts a new transaction immediately.
    3294             :      */
    3295         126 :     ReindexMultipleInternal(stmt, relids, params);
    3296             : 
    3297         126 :     MemoryContextDelete(private_context);
    3298         126 : }
    3299             : 
    3300             : /*
    3301             :  * Error callback specific to ReindexPartitions().
    3302             :  */
    3303             : static void
    3304          12 : reindex_error_callback(void *arg)
    3305             : {
    3306          12 :     ReindexErrorInfo *errinfo = (ReindexErrorInfo *) arg;
    3307             : 
    3308             :     Assert(RELKIND_HAS_PARTITIONS(errinfo->relkind));
    3309             : 
    3310          12 :     if (errinfo->relkind == RELKIND_PARTITIONED_TABLE)
    3311           6 :         errcontext("while reindexing partitioned table \"%s.%s\"",
    3312             :                    errinfo->relnamespace, errinfo->relname);
    3313           6 :     else if (errinfo->relkind == RELKIND_PARTITIONED_INDEX)
    3314           6 :         errcontext("while reindexing partitioned index \"%s.%s\"",
    3315             :                    errinfo->relnamespace, errinfo->relname);
    3316          12 : }
    3317             : 
    3318             : /*
    3319             :  * ReindexPartitions
    3320             :  *
    3321             :  * Reindex a set of partitions, per the partitioned index or table given
    3322             :  * by the caller.
    3323             :  */
    3324             : static void
    3325         106 : ReindexPartitions(const ReindexStmt *stmt, Oid relid, const ReindexParams *params, bool isTopLevel)
    3326             : {
    3327         106 :     List       *partitions = NIL;
    3328         106 :     char        relkind = get_rel_relkind(relid);
    3329         106 :     char       *relname = get_rel_name(relid);
    3330         106 :     char       *relnamespace = get_namespace_name(get_rel_namespace(relid));
    3331             :     MemoryContext reindex_context;
    3332             :     List       *inhoids;
    3333             :     ListCell   *lc;
    3334             :     ErrorContextCallback errcallback;
    3335             :     ReindexErrorInfo errinfo;
    3336             : 
    3337             :     Assert(RELKIND_HAS_PARTITIONS(relkind));
    3338             : 
    3339             :     /*
    3340             :      * Check if this runs in a transaction block, with an error callback to
    3341             :      * provide more context under which a problem happens.
    3342             :      */
    3343         106 :     errinfo.relname = pstrdup(relname);
    3344         106 :     errinfo.relnamespace = pstrdup(relnamespace);
    3345         106 :     errinfo.relkind = relkind;
    3346         106 :     errcallback.callback = reindex_error_callback;
    3347         106 :     errcallback.arg = (void *) &errinfo;
    3348         106 :     errcallback.previous = error_context_stack;
    3349         106 :     error_context_stack = &errcallback;
    3350             : 
    3351         106 :     PreventInTransactionBlock(isTopLevel,
    3352             :                               relkind == RELKIND_PARTITIONED_TABLE ?
    3353             :                               "REINDEX TABLE" : "REINDEX INDEX");
    3354             : 
    3355             :     /* Pop the error context stack */
    3356          94 :     error_context_stack = errcallback.previous;
    3357             : 
    3358             :     /*
    3359             :      * Create special memory context for cross-transaction storage.
    3360             :      *
    3361             :      * Since it is a child of PortalContext, it will go away eventually even
    3362             :      * if we suffer an error so there is no need for special abort cleanup
    3363             :      * logic.
    3364             :      */
    3365          94 :     reindex_context = AllocSetContextCreate(PortalContext, "Reindex",
    3366             :                                             ALLOCSET_DEFAULT_SIZES);
    3367             : 
    3368             :     /* ShareLock is enough to prevent schema modifications */
    3369          94 :     inhoids = find_all_inheritors(relid, ShareLock, NULL);
    3370             : 
    3371             :     /*
    3372             :      * The list of relations to reindex are the physical partitions of the
    3373             :      * tree so discard any partitioned table or index.
    3374             :      */
    3375         364 :     foreach(lc, inhoids)
    3376             :     {
    3377         270 :         Oid         partoid = lfirst_oid(lc);
    3378         270 :         char        partkind = get_rel_relkind(partoid);
    3379             :         MemoryContext old_context;
    3380             : 
    3381             :         /*
    3382             :          * This discards partitioned tables, partitioned indexes and foreign
    3383             :          * tables.
    3384             :          */
    3385         270 :         if (!RELKIND_HAS_STORAGE(partkind))
    3386         158 :             continue;
    3387             : 
    3388             :         Assert(partkind == RELKIND_INDEX ||
    3389             :                partkind == RELKIND_RELATION);
    3390             : 
    3391             :         /* Save partition OID */
    3392         112 :         old_context = MemoryContextSwitchTo(reindex_context);
    3393         112 :         partitions = lappend_oid(partitions, partoid);
    3394         112 :         MemoryContextSwitchTo(old_context);
    3395             :     }
    3396             : 
    3397             :     /*
    3398             :      * Process each partition listed in a separate transaction.  Note that
    3399             :      * this commits and then starts a new transaction immediately.
    3400             :      */
    3401          94 :     ReindexMultipleInternal(stmt, partitions, params);
    3402             : 
    3403             :     /*
    3404             :      * Clean up working storage --- note we must do this after
    3405             :      * StartTransactionCommand, else we might be trying to delete the active
    3406             :      * context!
    3407             :      */
    3408          94 :     MemoryContextDelete(reindex_context);
    3409          94 : }
    3410             : 
    3411             : /*
    3412             :  * ReindexMultipleInternal
    3413             :  *
    3414             :  * Reindex a list of relations, each one being processed in its own
    3415             :  * transaction.  This commits the existing transaction immediately,
    3416             :  * and starts a new transaction when finished.
    3417             :  */
    3418             : static void
    3419         220 : ReindexMultipleInternal(const ReindexStmt *stmt, const List *relids, const ReindexParams *params)
    3420             : {
    3421             :     ListCell   *l;
    3422             : 
    3423         220 :     PopActiveSnapshot();
    3424         220 :     CommitTransactionCommand();
    3425             : 
    3426        1644 :     foreach(l, relids)
    3427             :     {
    3428        1424 :         Oid         relid = lfirst_oid(l);
    3429             :         char        relkind;
    3430             :         char        relpersistence;
    3431             : 
    3432        1424 :         StartTransactionCommand();
    3433             : 
    3434             :         /* functions in indexes may want a snapshot set */
    3435        1424 :         PushActiveSnapshot(GetTransactionSnapshot());
    3436             : 
    3437             :         /* check if the relation still exists */
    3438        1424 :         if (!SearchSysCacheExists1(RELOID, ObjectIdGetDatum(relid)))
    3439             :         {
    3440           4 :             PopActiveSnapshot();
    3441           4 :             CommitTransactionCommand();
    3442           4 :             continue;
    3443             :         }
    3444             : 
    3445             :         /*
    3446             :          * Check permissions except when moving to database's default if a new
    3447             :          * tablespace is chosen.  Note that this check also happens in
    3448             :          * ExecReindex(), but we do an extra check here as this runs across
    3449             :          * multiple transactions.
    3450             :          */
    3451        1420 :         if (OidIsValid(params->tablespaceOid) &&
    3452          12 :             params->tablespaceOid != MyDatabaseTableSpace)
    3453             :         {
    3454             :             AclResult   aclresult;
    3455             : 
    3456          12 :             aclresult = object_aclcheck(TableSpaceRelationId, params->tablespaceOid,
    3457             :                                         GetUserId(), ACL_CREATE);
    3458          12 :             if (aclresult != ACLCHECK_OK)
    3459           0 :                 aclcheck_error(aclresult, OBJECT_TABLESPACE,
    3460           0 :                                get_tablespace_name(params->tablespaceOid));
    3461             :         }
    3462             : 
    3463        1420 :         relkind = get_rel_relkind(relid);
    3464        1420 :         relpersistence = get_rel_persistence(relid);
    3465             : 
    3466             :         /*
    3467             :          * Partitioned tables and indexes can never be processed directly, and
    3468             :          * a list of their leaves should be built first.
    3469             :          */
    3470             :         Assert(!RELKIND_HAS_PARTITIONS(relkind));
    3471             : 
    3472        1420 :         if ((params->options & REINDEXOPT_CONCURRENTLY) != 0 &&
    3473             :             relpersistence != RELPERSISTENCE_TEMP)
    3474         122 :         {
    3475         122 :             ReindexParams newparams = *params;
    3476             : 
    3477         122 :             newparams.options |= REINDEXOPT_MISSING_OK;
    3478         122 :             (void) ReindexRelationConcurrently(stmt, relid, &newparams);
    3479         122 :             if (ActiveSnapshotSet())
    3480          26 :                 PopActiveSnapshot();
    3481             :             /* ReindexRelationConcurrently() does the verbose output */
    3482             :         }
    3483        1298 :         else if (relkind == RELKIND_INDEX)
    3484             :         {
    3485          18 :             ReindexParams newparams = *params;
    3486             : 
    3487          18 :             newparams.options |=
    3488             :                 REINDEXOPT_REPORT_PROGRESS | REINDEXOPT_MISSING_OK;
    3489          18 :             reindex_index(stmt, relid, false, relpersistence, &newparams);
    3490          18 :             PopActiveSnapshot();
    3491             :             /* reindex_index() does the verbose output */
    3492             :         }
    3493             :         else
    3494             :         {
    3495             :             bool        result;
    3496        1280 :             ReindexParams newparams = *params;
    3497             : 
    3498        1280 :             newparams.options |=
    3499             :                 REINDEXOPT_REPORT_PROGRESS | REINDEXOPT_MISSING_OK;
    3500        1280 :             result = reindex_relation(stmt, relid,
    3501             :                                       REINDEX_REL_PROCESS_TOAST |
    3502             :                                       REINDEX_REL_CHECK_CONSTRAINTS,
    3503             :                                       &newparams);
    3504             : 
    3505        1280 :             if (result && (params->options & REINDEXOPT_VERBOSE) != 0)
    3506           0 :                 ereport(INFO,
    3507             :                         (errmsg("table \"%s.%s\" was reindexed",
    3508             :                                 get_namespace_name(get_rel_namespace(relid)),
    3509             :                                 get_rel_name(relid))));
    3510             : 
    3511        1280 :             PopActiveSnapshot();
    3512             :         }
    3513             : 
    3514        1420 :         CommitTransactionCommand();
    3515             :     }
    3516             : 
    3517         220 :     StartTransactionCommand();
    3518         220 : }
    3519             : 
    3520             : 
    3521             : /*
    3522             :  * ReindexRelationConcurrently - process REINDEX CONCURRENTLY for given
    3523             :  * relation OID
    3524             :  *
    3525             :  * 'relationOid' can either belong to an index, a table or a materialized
    3526             :  * view.  For tables and materialized views, all its indexes will be rebuilt,
    3527             :  * excluding invalid indexes and any indexes used in exclusion constraints,
    3528             :  * but including its associated toast table indexes.  For indexes, the index
    3529             :  * itself will be rebuilt.
    3530             :  *
    3531             :  * The locks taken on parent tables and involved indexes are kept until the
    3532             :  * transaction is committed, at which point a session lock is taken on each
    3533             :  * relation.  Both of these protect against concurrent schema changes.
    3534             :  *
    3535             :  * Returns true if any indexes have been rebuilt (including toast table's
    3536             :  * indexes, when relevant), otherwise returns false.
    3537             :  *
    3538             :  * NOTE: This cannot be used on temporary relations.  A concurrent build would
    3539             :  * cause issues with ON COMMIT actions triggered by the transactions of the
    3540             :  * concurrent build.  Temporary relations are not subject to concurrent
    3541             :  * concerns, so there's no need for the more complicated concurrent build,
    3542             :  * anyway, and a non-concurrent reindex is more efficient.
    3543             :  */
    3544             : static bool
    3545         506 : ReindexRelationConcurrently(const ReindexStmt *stmt, Oid relationOid, const ReindexParams *params)
    3546             : {
    3547             :     typedef struct ReindexIndexInfo
    3548             :     {
    3549             :         Oid         indexId;
    3550             :         Oid         tableId;
    3551             :         Oid         amId;
    3552             :         bool        safe;       /* for set_indexsafe_procflags */
    3553             :     } ReindexIndexInfo;
    3554         506 :     List       *heapRelationIds = NIL;
    3555         506 :     List       *indexIds = NIL;
    3556         506 :     List       *newIndexIds = NIL;
    3557         506 :     List       *relationLocks = NIL;
    3558         506 :     List       *lockTags = NIL;
    3559             :     ListCell   *lc,
    3560             :                *lc2;
    3561             :     MemoryContext private_context;
    3562             :     MemoryContext oldcontext;
    3563             :     char        relkind;
    3564         506 :     char       *relationName = NULL;
    3565         506 :     char       *relationNamespace = NULL;
    3566             :     PGRUsage    ru0;
    3567         506 :     const int   progress_index[] = {
    3568             :         PROGRESS_CREATEIDX_COMMAND,
    3569             :         PROGRESS_CREATEIDX_PHASE,
    3570             :         PROGRESS_CREATEIDX_INDEX_OID,
    3571             :         PROGRESS_CREATEIDX_ACCESS_METHOD_OID
    3572             :     };
    3573             :     int64       progress_vals[4];
    3574             : 
    3575             :     /*
    3576             :      * Create a memory context that will survive forced transaction commits we
    3577             :      * do below.  Since it is a child of PortalContext, it will go away
    3578             :      * eventually even if we suffer an error; there's no need for special
    3579             :      * abort cleanup logic.
    3580             :      */
    3581         506 :     private_context = AllocSetContextCreate(PortalContext,
    3582             :                                             "ReindexConcurrent",
    3583             :                                             ALLOCSET_SMALL_SIZES);
    3584             : 
    3585         506 :     if ((params->options & REINDEXOPT_VERBOSE) != 0)
    3586             :     {
    3587             :         /* Save data needed by REINDEX VERBOSE in private context */
    3588           4 :         oldcontext = MemoryContextSwitchTo(private_context);
    3589             : 
    3590           4 :         relationName = get_rel_name(relationOid);
    3591           4 :         relationNamespace = get_namespace_name(get_rel_namespace(relationOid));
    3592             : 
    3593           4 :         pg_rusage_init(&ru0);
    3594             : 
    3595           4 :         MemoryContextSwitchTo(oldcontext);
    3596             :     }
    3597             : 
    3598         506 :     relkind = get_rel_relkind(relationOid);
    3599             : 
    3600             :     /*
    3601             :      * Extract the list of indexes that are going to be rebuilt based on the
    3602             :      * relation Oid given by caller.
    3603             :      */
    3604         506 :     switch (relkind)
    3605             :     {
    3606         320 :         case RELKIND_RELATION:
    3607             :         case RELKIND_MATVIEW:
    3608             :         case RELKIND_TOASTVALUE:
    3609             :             {
    3610             :                 /*
    3611             :                  * In the case of a relation, find all its indexes including
    3612             :                  * toast indexes.
    3613             :                  */
    3614             :                 Relation    heapRelation;
    3615             : 
    3616             :                 /* Save the list of relation OIDs in private context */
    3617         320 :                 oldcontext = MemoryContextSwitchTo(private_context);
    3618             : 
    3619             :                 /* Track this relation for session locks */
    3620         320 :                 heapRelationIds = lappend_oid(heapRelationIds, relationOid);
    3621             : 
    3622         320 :                 MemoryContextSwitchTo(oldcontext);
    3623             : 
    3624         320 :                 if (IsCatalogRelationOid(relationOid))
    3625          36 :                     ereport(ERROR,
    3626             :                             (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3627             :                              errmsg("cannot reindex system catalogs concurrently")));
    3628             : 
    3629             :                 /* Open relation to get its indexes */
    3630         284 :                 if ((params->options & REINDEXOPT_MISSING_OK) != 0)
    3631             :                 {
    3632          98 :                     heapRelation = try_table_open(relationOid,
    3633             :                                                   ShareUpdateExclusiveLock);
    3634             :                     /* leave if relation does not exist */
    3635          98 :                     if (!heapRelation)
    3636           0 :                         break;
    3637             :                 }
    3638             :                 else
    3639         186 :                     heapRelation = table_open(relationOid,
    3640             :                                               ShareUpdateExclusiveLock);
    3641             : 
    3642         306 :                 if (OidIsValid(params->tablespaceOid) &&
    3643          22 :                     IsSystemRelation(heapRelation))
    3644           2 :                     ereport(ERROR,
    3645             :                             (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3646             :                              errmsg("cannot move system relation \"%s\"",
    3647             :                                     RelationGetRelationName(heapRelation))));
    3648             : 
    3649             :                 /* Add all the valid indexes of relation to list */
    3650         544 :                 foreach(lc, RelationGetIndexList(heapRelation))
    3651             :                 {
    3652         262 :                     Oid         cellOid = lfirst_oid(lc);
    3653         262 :                     Relation    indexRelation = index_open(cellOid,
    3654             :                                                            ShareUpdateExclusiveLock);
    3655             : 
    3656         262 :                     if (!indexRelation->rd_index->indisvalid)
    3657           6 :                         ereport(WARNING,
    3658             :                                 (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
    3659             :                                  errmsg("skipping reindex of invalid index \"%s.%s\"",
    3660             :                                         get_namespace_name(get_rel_namespace(cellOid)),
    3661             :                                         get_rel_name(cellOid)),
    3662             :                                  errhint("Use DROP INDEX or REINDEX INDEX.")));
    3663         256 :                     else if (indexRelation->rd_index->indisexclusion)
    3664           6 :                         ereport(WARNING,
    3665             :                                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3666             :                                  errmsg("cannot reindex exclusion constraint index \"%s.%s\" concurrently, skipping",
    3667             :                                         get_namespace_name(get_rel_namespace(cellOid)),
    3668             :                                         get_rel_name(cellOid))));
    3669             :                     else
    3670             :                     {
    3671             :                         ReindexIndexInfo *idx;
    3672             : 
    3673             :                         /* Save the list of relation OIDs in private context */
    3674         250 :                         oldcontext = MemoryContextSwitchTo(private_context);
    3675             : 
    3676         250 :                         idx = palloc_object(ReindexIndexInfo);
    3677         250 :                         idx->indexId = cellOid;
    3678             :                         /* other fields set later */
    3679             : 
    3680         250 :                         indexIds = lappend(indexIds, idx);
    3681             : 
    3682         250 :                         MemoryContextSwitchTo(oldcontext);
    3683             :                     }
    3684             : 
    3685         262 :                     index_close(indexRelation, NoLock);
    3686             :                 }
    3687             : 
    3688             :                 /* Also add the toast indexes */
    3689         282 :                 if (OidIsValid(heapRelation->rd_rel->reltoastrelid))
    3690             :                 {
    3691          82 :                     Oid         toastOid = heapRelation->rd_rel->reltoastrelid;
    3692          82 :                     Relation    toastRelation = table_open(toastOid,
    3693             :                                                            ShareUpdateExclusiveLock);
    3694             : 
    3695             :                     /* Save the list of relation OIDs in private context */
    3696          82 :                     oldcontext = MemoryContextSwitchTo(private_context);
    3697             : 
    3698             :                     /* Track this relation for session locks */
    3699          82 :                     heapRelationIds = lappend_oid(heapRelationIds, toastOid);
    3700             : 
    3701          82 :                     MemoryContextSwitchTo(oldcontext);
    3702             : 
    3703         164 :                     foreach(lc2, RelationGetIndexList(toastRelation))
    3704             :                     {
    3705          82 :                         Oid         cellOid = lfirst_oid(lc2);
    3706          82 :                         Relation    indexRelation = index_open(cellOid,
    3707             :                                                                ShareUpdateExclusiveLock);
    3708             : 
    3709          82 :                         if (!indexRelation->rd_index->indisvalid)
    3710           0 :                             ereport(WARNING,
    3711             :                                     (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
    3712             :                                      errmsg("skipping reindex of invalid index \"%s.%s\"",
    3713             :                                             get_namespace_name(get_rel_namespace(cellOid)),
    3714             :                                             get_rel_name(cellOid)),
    3715             :                                      errhint("Use DROP INDEX or REINDEX INDEX.")));
    3716             :                         else
    3717             :                         {
    3718             :                             ReindexIndexInfo *idx;
    3719             : 
    3720             :                             /*
    3721             :                              * Save the list of relation OIDs in private
    3722             :                              * context
    3723             :                              */
    3724          82 :                             oldcontext = MemoryContextSwitchTo(private_context);
    3725             : 
    3726          82 :                             idx = palloc_object(ReindexIndexInfo);
    3727          82 :                             idx->indexId = cellOid;
    3728          82 :                             indexIds = lappend(indexIds, idx);
    3729             :                             /* other fields set later */
    3730             : 
    3731          82 :                             MemoryContextSwitchTo(oldcontext);
    3732             :                         }
    3733             : 
    3734          82 :                         index_close(indexRelation, NoLock);
    3735             :                     }
    3736             : 
    3737          82 :                     table_close(toastRelation, NoLock);
    3738             :                 }
    3739             : 
    3740         282 :                 table_close(heapRelation, NoLock);
    3741         282 :                 break;
    3742             :             }
    3743         186 :         case RELKIND_INDEX:
    3744             :             {
    3745         186 :                 Oid         heapId = IndexGetRelation(relationOid,
    3746         186 :                                                       (params->options & REINDEXOPT_MISSING_OK) != 0);
    3747             :                 Relation    heapRelation;
    3748             :                 ReindexIndexInfo *idx;
    3749             : 
    3750             :                 /* if relation is missing, leave */
    3751         186 :                 if (!OidIsValid(heapId))
    3752           0 :                     break;
    3753             : 
    3754         186 :                 if (IsCatalogRelationOid(heapId))
    3755          18 :                     ereport(ERROR,
    3756             :                             (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3757             :                              errmsg("cannot reindex system catalogs concurrently")));
    3758             : 
    3759             :                 /*
    3760             :                  * Don't allow reindex for an invalid index on TOAST table, as
    3761             :                  * if rebuilt it would not be possible to drop it.  Match
    3762             :                  * error message in reindex_index().
    3763             :                  */
    3764         168 :                 if (IsToastNamespace(get_rel_namespace(relationOid)) &&
    3765          56 :                     !get_index_isvalid(relationOid))
    3766           0 :                     ereport(ERROR,
    3767             :                             (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3768             :                              errmsg("cannot reindex invalid index on TOAST table")));
    3769             : 
    3770             :                 /*
    3771             :                  * Check if parent relation can be locked and if it exists,
    3772             :                  * this needs to be done at this stage as the list of indexes
    3773             :                  * to rebuild is not complete yet, and REINDEXOPT_MISSING_OK
    3774             :                  * should not be used once all the session locks are taken.
    3775             :                  */
    3776         168 :                 if ((params->options & REINDEXOPT_MISSING_OK) != 0)
    3777             :                 {
    3778          24 :                     heapRelation = try_table_open(heapId,
    3779             :                                                   ShareUpdateExclusiveLock);
    3780             :                     /* leave if relation does not exist */
    3781          24 :                     if (!heapRelation)
    3782           0 :                         break;
    3783             :                 }
    3784             :                 else
    3785         144 :                     heapRelation = table_open(heapId,
    3786             :                                               ShareUpdateExclusiveLock);
    3787             : 
    3788         176 :                 if (OidIsValid(params->tablespaceOid) &&
    3789           8 :                     IsSystemRelation(heapRelation))
    3790           2 :                     ereport(ERROR,
    3791             :                             (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3792             :                              errmsg("cannot move system relation \"%s\"",
    3793             :                                     get_rel_name(relationOid))));
    3794             : 
    3795         166 :                 table_close(heapRelation, NoLock);
    3796             : 
    3797             :                 /* Save the list of relation OIDs in private context */
    3798         166 :                 oldcontext = MemoryContextSwitchTo(private_context);
    3799             : 
    3800             :                 /* Track the heap relation of this index for session locks */
    3801         166 :                 heapRelationIds = list_make1_oid(heapId);
    3802             : 
    3803             :                 /*
    3804             :                  * Save the list of relation OIDs in private context.  Note
    3805             :                  * that invalid indexes are allowed here.
    3806             :                  */
    3807         166 :                 idx = palloc_object(ReindexIndexInfo);
    3808         166 :                 idx->indexId = relationOid;
    3809         166 :                 indexIds = lappend(indexIds, idx);
    3810             :                 /* other fields set later */
    3811             : 
    3812         166 :                 MemoryContextSwitchTo(oldcontext);
    3813         166 :                 break;
    3814             :             }
    3815             : 
    3816           0 :         case RELKIND_PARTITIONED_TABLE:
    3817             :         case RELKIND_PARTITIONED_INDEX:
    3818             :         default:
    3819             :             /* Return error if type of relation is not supported */
    3820           0 :             ereport(ERROR,
    3821             :                     (errcode(ERRCODE_WRONG_OBJECT_TYPE),
    3822             :                      errmsg("cannot reindex this type of relation concurrently")));
    3823             :             break;
    3824             :     }
    3825             : 
    3826             :     /*
    3827             :      * Definitely no indexes, so leave.  Any checks based on
    3828             :      * REINDEXOPT_MISSING_OK should be done only while the list of indexes to
    3829             :      * work on is built as the session locks taken before this transaction
    3830             :      * commits will make sure that they cannot be dropped by a concurrent
    3831             :      * session until this operation completes.
    3832             :      */
    3833         448 :     if (indexIds == NIL)
    3834          44 :         return false;
    3835             : 
    3836             :     /* It's not a shared catalog, so refuse to move it to shared tablespace */
    3837         404 :     if (params->tablespaceOid == GLOBALTABLESPACE_OID)
    3838           6 :         ereport(ERROR,
    3839             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
    3840             :                  errmsg("cannot move non-shared relation to tablespace \"%s\"",
    3841             :                         get_tablespace_name(params->tablespaceOid))));
    3842             : 
    3843             :     Assert(heapRelationIds != NIL);
    3844             : 
    3845             :     /*-----
    3846             :      * Now we have all the indexes we want to process in indexIds.
    3847             :      *
    3848             :      * The phases now are:
    3849             :      *
    3850             :      * 1. create new indexes in the catalog
    3851             :      * 2. build new indexes
    3852             :      * 3. let new indexes catch up with tuples inserted in the meantime
    3853             :      * 4. swap index names
    3854             :      * 5. mark old indexes as dead
    3855             :      * 6. drop old indexes
    3856             :      *
    3857             :      * We process each phase for all indexes before moving to the next phase,
    3858             :      * for efficiency.
    3859             :      */
    3860             : 
    3861             :     /*
    3862             :      * Phase 1 of REINDEX CONCURRENTLY
    3863             :      *
    3864             :      * Create a new index with the same properties as the old one, but it is
    3865             :      * only registered in catalogs and will be built later.  Then get session
    3866             :      * locks on all involved tables.  See analogous code in DefineIndex() for
    3867             :      * more detailed comments.
    3868             :      */
    3869             : 
    3870         884 :     foreach(lc, indexIds)
    3871             :     {
    3872             :         char       *concurrentName;
    3873         492 :         ReindexIndexInfo *idx = lfirst(lc);
    3874             :         ReindexIndexInfo *newidx;
    3875             :         Oid         newIndexId;
    3876             :         Relation    indexRel;
    3877             :         Relation    heapRel;
    3878             :         Oid         save_userid;
    3879             :         int         save_sec_context;
    3880             :         int         save_nestlevel;
    3881             :         Relation    newIndexRel;
    3882             :         LockRelId  *lockrelid;
    3883             :         Oid         tablespaceid;
    3884             : 
    3885         492 :         indexRel = index_open(idx->indexId, ShareUpdateExclusiveLock);
    3886         492 :         heapRel = table_open(indexRel->rd_index->indrelid,
    3887             :                              ShareUpdateExclusiveLock);
    3888             : 
    3889             :         /*
    3890             :          * Switch to the table owner's userid, so that any index functions are
    3891             :          * run as that user.  Also lock down security-restricted operations
    3892             :          * and arrange to make GUC variable changes local to this command.
    3893             :          */
    3894         492 :         GetUserIdAndSecContext(&save_userid, &save_sec_context);
    3895         492 :         SetUserIdAndSecContext(heapRel->rd_rel->relowner,
    3896             :                                save_sec_context | SECURITY_RESTRICTED_OPERATION);
    3897         492 :         save_nestlevel = NewGUCNestLevel();
    3898         492 :         RestrictSearchPath();
    3899             : 
    3900             :         /* determine safety of this index for set_indexsafe_procflags */
    3901         966 :         idx->safe = (indexRel->rd_indexprs == NIL &&
    3902         474 :                      indexRel->rd_indpred == NIL);
    3903         492 :         idx->tableId = RelationGetRelid(heapRel);
    3904         492 :         idx->amId = indexRel->rd_rel->relam;
    3905             : 
    3906             :         /* This function shouldn't be called for temporary relations. */
    3907         492 :         if (indexRel->rd_rel->relpersistence == RELPERSISTENCE_TEMP)
    3908           0 :             elog(ERROR, "cannot reindex a temporary table concurrently");
    3909             : 
    3910         492 :         pgstat_progress_start_command(PROGRESS_COMMAND_CREATE_INDEX, idx->tableId);
    3911             : 
    3912         492 :         progress_vals[0] = PROGRESS_CREATEIDX_COMMAND_REINDEX_CONCURRENTLY;
    3913         492 :         progress_vals[1] = 0;   /* initializing */
    3914         492 :         progress_vals[2] = idx->indexId;
    3915         492 :         progress_vals[3] = idx->amId;
    3916         492 :         pgstat_progress_update_multi_param(4, progress_index, progress_vals);
    3917             : 
    3918             :         /* Choose a temporary relation name for the new index */
    3919         492 :         concurrentName = ChooseRelationName(get_rel_name(idx->indexId),
    3920             :                                             NULL,
    3921             :                                             "ccnew",
    3922         492 :                                             get_rel_namespace(indexRel->rd_index->indrelid),
    3923             :                                             false);
    3924             : 
    3925             :         /* Choose the new tablespace, indexes of toast tables are not moved */
    3926         492 :         if (OidIsValid(params->tablespaceOid) &&
    3927          28 :             heapRel->rd_rel->relkind != RELKIND_TOASTVALUE)
    3928          20 :             tablespaceid = params->tablespaceOid;
    3929             :         else
    3930         472 :             tablespaceid = indexRel->rd_rel->reltablespace;
    3931             : 
    3932             :         /* Create new index definition based on given index */
    3933         492 :         newIndexId = index_concurrently_create_copy(heapRel,
    3934             :                                                     idx->indexId,
    3935             :                                                     tablespaceid,
    3936             :                                                     concurrentName);
    3937             : 
    3938             :         /*
    3939             :          * Now open the relation of the new index, a session-level lock is
    3940             :          * also needed on it.
    3941             :          */
    3942         486 :         newIndexRel = index_open(newIndexId, ShareUpdateExclusiveLock);
    3943             : 
    3944             :         /*
    3945             :          * Save the list of OIDs and locks in private context
    3946             :          */
    3947         486 :         oldcontext = MemoryContextSwitchTo(private_context);
    3948             : 
    3949         486 :         newidx = palloc_object(ReindexIndexInfo);
    3950         486 :         newidx->indexId = newIndexId;
    3951         486 :         newidx->safe = idx->safe;
    3952         486 :         newidx->tableId = idx->tableId;
    3953         486 :         newidx->amId = idx->amId;
    3954             : 
    3955         486 :         newIndexIds = lappend(newIndexIds, newidx);
    3956             : 
    3957             :         /*
    3958             :          * Save lockrelid to protect each relation from drop then close
    3959             :          * relations. The lockrelid on parent relation is not taken here to
    3960             :          * avoid multiple locks taken on the same relation, instead we rely on
    3961             :          * parentRelationIds built earlier.
    3962             :          */
    3963         486 :         lockrelid = palloc_object(LockRelId);
    3964         486 :         *lockrelid = indexRel->rd_lockInfo.lockRelId;
    3965         486 :         relationLocks = lappend(relationLocks, lockrelid);
    3966         486 :         lockrelid = palloc_object(LockRelId);
    3967         486 :         *lockrelid = newIndexRel->rd_lockInfo.lockRelId;
    3968         486 :         relationLocks = lappend(relationLocks, lockrelid);
    3969             : 
    3970         486 :         MemoryContextSwitchTo(oldcontext);
    3971             : 
    3972         486 :         index_close(indexRel, NoLock);
    3973         486 :         index_close(newIndexRel, NoLock);
    3974             : 
    3975             :         /* Roll back any GUC changes executed by index functions */
    3976         486 :         AtEOXact_GUC(false, save_nestlevel);
    3977             : 
    3978             :         /* Restore userid and security context */
    3979         486 :         SetUserIdAndSecContext(save_userid, save_sec_context);
    3980             : 
    3981         486 :         table_close(heapRel, NoLock);
    3982             : 
    3983             :         /*
    3984             :          * If a statement is available, telling that this comes from a REINDEX
    3985             :          * command, collect the new index for event triggers.
    3986             :          */
    3987         486 :         if (stmt)
    3988             :         {
    3989             :             ObjectAddress address;
    3990             : 
    3991         486 :             ObjectAddressSet(address, RelationRelationId, newIndexId);
    3992         486 :             EventTriggerCollectSimpleCommand(address,
    3993             :                                              InvalidObjectAddress,
    3994             :                                              (Node *) stmt);
    3995             :         }
    3996             :     }
    3997             : 
    3998             :     /*
    3999             :      * Save the heap lock for following visibility checks with other backends
    4000             :      * might conflict with this session.
    4001             :      */
    4002         866 :     foreach(lc, heapRelationIds)
    4003             :     {
    4004         474 :         Relation    heapRelation = table_open(lfirst_oid(lc), ShareUpdateExclusiveLock);
    4005             :         LockRelId  *lockrelid;
    4006             :         LOCKTAG    *heaplocktag;
    4007             : 
    4008             :         /* Save the list of locks in private context */
    4009         474 :         oldcontext = MemoryContextSwitchTo(private_context);
    4010             : 
    4011             :         /* Add lockrelid of heap relation to the list of locked relations */
    4012         474 :         lockrelid = palloc_object(LockRelId);
    4013         474 :         *lockrelid = heapRelation->rd_lockInfo.lockRelId;
    4014         474 :         relationLocks = lappend(relationLocks, lockrelid);
    4015             : 
    4016         474 :         heaplocktag = palloc_object(LOCKTAG);
    4017             : 
    4018             :         /* Save the LOCKTAG for this parent relation for the wait phase */
    4019         474 :         SET_LOCKTAG_RELATION(*heaplocktag, lockrelid->dbId, lockrelid->relId);
    4020         474 :         lockTags = lappend(lockTags, heaplocktag);
    4021             : 
    4022         474 :         MemoryContextSwitchTo(oldcontext);
    4023             : 
    4024             :         /* Close heap relation */
    4025         474 :         table_close(heapRelation, NoLock);
    4026             :     }
    4027             : 
    4028             :     /* Get a session-level lock on each table. */
    4029        1838 :     foreach(lc, relationLocks)
    4030             :     {
    4031        1446 :         LockRelId  *lockrelid = (LockRelId *) lfirst(lc);
    4032             : 
    4033        1446 :         LockRelationIdForSession(lockrelid, ShareUpdateExclusiveLock);
    4034             :     }
    4035             : 
    4036         392 :     PopActiveSnapshot();
    4037         392 :     CommitTransactionCommand();
    4038         392 :     StartTransactionCommand();
    4039             : 
    4040             :     /*
    4041             :      * Because we don't take a snapshot in this transaction, there's no need
    4042             :      * to set the PROC_IN_SAFE_IC flag here.
    4043             :      */
    4044             : 
    4045             :     /*
    4046             :      * Phase 2 of REINDEX CONCURRENTLY
    4047             :      *
    4048             :      * Build the new indexes in a separate transaction for each index to avoid
    4049             :      * having open transactions for an unnecessary long time.  But before
    4050             :      * doing that, wait until no running transactions could have the table of
    4051             :      * the index open with the old list of indexes.  See "phase 2" in
    4052             :      * DefineIndex() for more details.
    4053             :      */
    4054             : 
    4055         392 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_PHASE,
    4056             :                                  PROGRESS_CREATEIDX_PHASE_WAIT_1);
    4057         392 :     WaitForLockersMultiple(lockTags, ShareLock, true);
    4058         392 :     CommitTransactionCommand();
    4059             : 
    4060         872 :     foreach(lc, newIndexIds)
    4061             :     {
    4062         486 :         ReindexIndexInfo *newidx = lfirst(lc);
    4063             : 
    4064             :         /* Start new transaction for this index's concurrent build */
    4065         486 :         StartTransactionCommand();
    4066             : 
    4067             :         /*
    4068             :          * Check for user-requested abort.  This is inside a transaction so as
    4069             :          * xact.c does not issue a useless WARNING, and ensures that
    4070             :          * session-level locks are cleaned up on abort.
    4071             :          */
    4072         486 :         CHECK_FOR_INTERRUPTS();
    4073             : 
    4074             :         /* Tell concurrent indexing to ignore us, if index qualifies */
    4075         486 :         if (newidx->safe)
    4076         462 :             set_indexsafe_procflags();
    4077             : 
    4078             :         /* Set ActiveSnapshot since functions in the indexes may need it */
    4079         486 :         PushActiveSnapshot(GetTransactionSnapshot());
    4080             : 
    4081             :         /*
    4082             :          * Update progress for the index to build, with the correct parent
    4083             :          * table involved.
    4084             :          */
    4085         486 :         pgstat_progress_start_command(PROGRESS_COMMAND_CREATE_INDEX, newidx->tableId);
    4086         486 :         progress_vals[0] = PROGRESS_CREATEIDX_COMMAND_REINDEX_CONCURRENTLY;
    4087         486 :         progress_vals[1] = PROGRESS_CREATEIDX_PHASE_BUILD;
    4088         486 :         progress_vals[2] = newidx->indexId;
    4089         486 :         progress_vals[3] = newidx->amId;
    4090         486 :         pgstat_progress_update_multi_param(4, progress_index, progress_vals);
    4091             : 
    4092             :         /* Perform concurrent build of new index */
    4093         486 :         index_concurrently_build(newidx->tableId, newidx->indexId);
    4094             : 
    4095         480 :         PopActiveSnapshot();
    4096         480 :         CommitTransactionCommand();
    4097             :     }
    4098             : 
    4099         386 :     StartTransactionCommand();
    4100             : 
    4101             :     /*
    4102             :      * Because we don't take a snapshot or Xid in this transaction, there's no
    4103             :      * need to set the PROC_IN_SAFE_IC flag here.
    4104             :      */
    4105             : 
    4106             :     /*
    4107             :      * Phase 3 of REINDEX CONCURRENTLY
    4108             :      *
    4109             :      * During this phase the old indexes catch up with any new tuples that
    4110             :      * were created during the previous phase.  See "phase 3" in DefineIndex()
    4111             :      * for more details.
    4112             :      */
    4113             : 
    4114         386 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_PHASE,
    4115             :                                  PROGRESS_CREATEIDX_PHASE_WAIT_2);
    4116         386 :     WaitForLockersMultiple(lockTags, ShareLock, true);
    4117         386 :     CommitTransactionCommand();
    4118             : 
    4119         866 :     foreach(lc, newIndexIds)
    4120             :     {
    4121         480 :         ReindexIndexInfo *newidx = lfirst(lc);
    4122             :         TransactionId limitXmin;
    4123             :         Snapshot    snapshot;
    4124             : 
    4125         480 :         StartTransactionCommand();
    4126             : 
    4127             :         /*
    4128             :          * Check for user-requested abort.  This is inside a transaction so as
    4129             :          * xact.c does not issue a useless WARNING, and ensures that
    4130             :          * session-level locks are cleaned up on abort.
    4131             :          */
    4132         480 :         CHECK_FOR_INTERRUPTS();
    4133             : 
    4134             :         /* Tell concurrent indexing to ignore us, if index qualifies */
    4135         480 :         if (newidx->safe)
    4136         456 :             set_indexsafe_procflags();
    4137             : 
    4138             :         /*
    4139             :          * Take the "reference snapshot" that will be used by validate_index()
    4140             :          * to filter candidate tuples.
    4141             :          */
    4142         480 :         snapshot = RegisterSnapshot(GetTransactionSnapshot());
    4143         480 :         PushActiveSnapshot(snapshot);
    4144             : 
    4145             :         /*
    4146             :          * Update progress for the index to build, with the correct parent
    4147             :          * table involved.
    4148             :          */
    4149         480 :         pgstat_progress_start_command(PROGRESS_COMMAND_CREATE_INDEX, newidx->tableId);
    4150         480 :         progress_vals[0] = PROGRESS_CREATEIDX_COMMAND_REINDEX_CONCURRENTLY;
    4151         480 :         progress_vals[1] = PROGRESS_CREATEIDX_PHASE_VALIDATE_IDXSCAN;
    4152         480 :         progress_vals[2] = newidx->indexId;
    4153         480 :         progress_vals[3] = newidx->amId;
    4154         480 :         pgstat_progress_update_multi_param(4, progress_index, progress_vals);
    4155             : 
    4156         480 :         validate_index(newidx->tableId, newidx->indexId, snapshot);
    4157             : 
    4158             :         /*
    4159             :          * We can now do away with our active snapshot, we still need to save
    4160             :          * the xmin limit to wait for older snapshots.
    4161             :          */
    4162         480 :         limitXmin = snapshot->xmin;
    4163             : 
    4164         480 :         PopActiveSnapshot();
    4165         480 :         UnregisterSnapshot(snapshot);
    4166             : 
    4167             :         /*
    4168             :          * To ensure no deadlocks, we must commit and start yet another
    4169             :          * transaction, and do our wait before any snapshot has been taken in
    4170             :          * it.
    4171             :          */
    4172         480 :         CommitTransactionCommand();
    4173         480 :         StartTransactionCommand();
    4174             : 
    4175             :         /*
    4176             :          * The index is now valid in the sense that it contains all currently
    4177             :          * interesting tuples.  But since it might not contain tuples deleted
    4178             :          * just before the reference snap was taken, we have to wait out any
    4179             :          * transactions that might have older snapshots.
    4180             :          *
    4181             :          * Because we don't take a snapshot or Xid in this transaction,
    4182             :          * there's no need to set the PROC_IN_SAFE_IC flag here.
    4183             :          */
    4184         480 :         pgstat_progress_update_param(PROGRESS_CREATEIDX_PHASE,
    4185             :                                      PROGRESS_CREATEIDX_PHASE_WAIT_3);
    4186         480 :         WaitForOlderSnapshots(limitXmin, true);
    4187             : 
    4188         480 :         CommitTransactionCommand();
    4189             :     }
    4190             : 
    4191             :     /*
    4192             :      * Phase 4 of REINDEX CONCURRENTLY
    4193             :      *
    4194             :      * Now that the new indexes have been validated, swap each new index with
    4195             :      * its corresponding old index.
    4196             :      *
    4197             :      * We mark the new indexes as valid and the old indexes as not valid at
    4198             :      * the same time to make sure we only get constraint violations from the
    4199             :      * indexes with the correct names.
    4200             :      */
    4201             : 
    4202         386 :     StartTransactionCommand();
    4203             : 
    4204             :     /*
    4205             :      * Because this transaction only does catalog manipulations and doesn't do
    4206             :      * any index operations, we can set the PROC_IN_SAFE_IC flag here
    4207             :      * unconditionally.
    4208             :      */
    4209         386 :     set_indexsafe_procflags();
    4210             : 
    4211         866 :     forboth(lc, indexIds, lc2, newIndexIds)
    4212             :     {
    4213         480 :         ReindexIndexInfo *oldidx = lfirst(lc);
    4214         480 :         ReindexIndexInfo *newidx = lfirst(lc2);
    4215             :         char       *oldName;
    4216             : 
    4217             :         /*
    4218             :          * Check for user-requested abort.  This is inside a transaction so as
    4219             :          * xact.c does not issue a useless WARNING, and ensures that
    4220             :          * session-level locks are cleaned up on abort.
    4221             :          */
    4222         480 :         CHECK_FOR_INTERRUPTS();
    4223             : 
    4224             :         /* Choose a relation name for old index */
    4225         480 :         oldName = ChooseRelationName(get_rel_name(oldidx->indexId),
    4226             :                                      NULL,
    4227             :                                      "ccold",
    4228             :                                      get_rel_namespace(oldidx->tableId),
    4229             :                                      false);
    4230             : 
    4231             :         /*
    4232             :          * Swap old index with the new one.  This also marks the new one as
    4233             :          * valid and the old one as not valid.
    4234             :          */
    4235         480 :         index_concurrently_swap(newidx->indexId, oldidx->indexId, oldName);
    4236             : 
    4237             :         /*
    4238             :          * Invalidate the relcache for the table, so that after this commit
    4239             :          * all sessions will refresh any cached plans that might reference the
    4240             :          * index.
    4241             :          */
    4242         480 :         CacheInvalidateRelcacheByRelid(oldidx->tableId);
    4243             : 
    4244             :         /*
    4245             :          * CCI here so that subsequent iterations see the oldName in the
    4246             :          * catalog and can choose a nonconflicting name for their oldName.
    4247             :          * Otherwise, this could lead to conflicts if a table has two indexes
    4248             :          * whose names are equal for the first NAMEDATALEN-minus-a-few
    4249             :          * characters.
    4250             :          */
    4251         480 :         CommandCounterIncrement();
    4252             :     }
    4253             : 
    4254             :     /* Commit this transaction and make index swaps visible */
    4255         386 :     CommitTransactionCommand();
    4256         386 :     StartTransactionCommand();
    4257             : 
    4258             :     /*
    4259             :      * While we could set PROC_IN_SAFE_IC if all indexes qualified, there's no
    4260             :      * real need for that, because we only acquire an Xid after the wait is
    4261             :      * done, and that lasts for a very short period.
    4262             :      */
    4263             : 
    4264             :     /*
    4265             :      * Phase 5 of REINDEX CONCURRENTLY
    4266             :      *
    4267             :      * Mark the old indexes as dead.  First we must wait until no running
    4268             :      * transaction could be using the index for a query.  See also
    4269             :      * index_drop() for more details.
    4270             :      */
    4271             : 
    4272         386 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_PHASE,
    4273             :                                  PROGRESS_CREATEIDX_PHASE_WAIT_4);
    4274         386 :     WaitForLockersMultiple(lockTags, AccessExclusiveLock, true);
    4275             : 
    4276         866 :     foreach(lc, indexIds)
    4277             :     {
    4278         480 :         ReindexIndexInfo *oldidx = lfirst(lc);
    4279             : 
    4280             :         /*
    4281             :          * Check for user-requested abort.  This is inside a transaction so as
    4282             :          * xact.c does not issue a useless WARNING, and ensures that
    4283             :          * session-level locks are cleaned up on abort.
    4284             :          */
    4285         480 :         CHECK_FOR_INTERRUPTS();
    4286             : 
    4287         480 :         index_concurrently_set_dead(oldidx->tableId, oldidx->indexId);
    4288             :     }
    4289             : 
    4290             :     /* Commit this transaction to make the updates visible. */
    4291         386 :     CommitTransactionCommand();
    4292         386 :     StartTransactionCommand();
    4293             : 
    4294             :     /*
    4295             :      * While we could set PROC_IN_SAFE_IC if all indexes qualified, there's no
    4296             :      * real need for that, because we only acquire an Xid after the wait is
    4297             :      * done, and that lasts for a very short period.
    4298             :      */
    4299             : 
    4300             :     /*
    4301             :      * Phase 6 of REINDEX CONCURRENTLY
    4302             :      *
    4303             :      * Drop the old indexes.
    4304             :      */
    4305             : 
    4306         386 :     pgstat_progress_update_param(PROGRESS_CREATEIDX_PHASE,
    4307             :                                  PROGRESS_CREATEIDX_PHASE_WAIT_5);
    4308         386 :     WaitForLockersMultiple(lockTags, AccessExclusiveLock, true);
    4309             : 
    4310         386 :     PushActiveSnapshot(GetTransactionSnapshot());
    4311             : 
    4312             :     {
    4313         386 :         ObjectAddresses *objects = new_object_addresses();
    4314             : 
    4315         866 :         foreach(lc, indexIds)
    4316             :         {
    4317         480 :             ReindexIndexInfo *idx = lfirst(lc);
    4318             :             ObjectAddress object;
    4319             : 
    4320         480 :             object.classId = RelationRelationId;
    4321         480 :             object.objectId = idx->indexId;
    4322         480 :             object.objectSubId = 0;
    4323             : 
    4324         480 :             add_exact_object_address(&object, objects);
    4325             :         }
    4326             : 
    4327             :         /*
    4328             :          * Use PERFORM_DELETION_CONCURRENT_LOCK so that index_drop() uses the
    4329             :          * right lock level.
    4330             :          */
    4331         386 :         performMultipleDeletions(objects, DROP_RESTRICT,
    4332             :                                  PERFORM_DELETION_CONCURRENT_LOCK | PERFORM_DELETION_INTERNAL);
    4333             :     }
    4334             : 
    4335         386 :     PopActiveSnapshot();
    4336         386 :     CommitTransactionCommand();
    4337             : 
    4338             :     /*
    4339             :      * Finally, release the session-level lock on the table.
    4340             :      */
    4341        1814 :     foreach(lc, relationLocks)
    4342             :     {
    4343        1428 :         LockRelId  *lockrelid = (LockRelId *) lfirst(lc);
    4344             : 
    4345        1428 :         UnlockRelationIdForSession(lockrelid, ShareUpdateExclusiveLock);
    4346             :     }
    4347             : 
    4348             :     /* Start a new transaction to finish process properly */
    4349         386 :     StartTransactionCommand();
    4350             : 
    4351             :     /* Log what we did */
    4352         386 :     if ((params->options & REINDEXOPT_VERBOSE) != 0)
    4353             :     {
    4354           4 :         if (relkind == RELKIND_INDEX)
    4355           0 :             ereport(INFO,
    4356             :                     (errmsg("index \"%s.%s\" was reindexed",
    4357             :                             relationNamespace, relationName),
    4358             :                      errdetail("%s.",
    4359             :                                pg_rusage_show(&ru0))));
    4360             :         else
    4361             :         {
    4362          12 :             foreach(lc, newIndexIds)
    4363             :             {
    4364           8 :                 ReindexIndexInfo *idx = lfirst(lc);
    4365           8 :                 Oid         indOid = idx->indexId;
    4366             : 
    4367           8 :                 ereport(INFO,
    4368             :                         (errmsg("index \"%s.%s\" was reindexed",
    4369             :                                 get_namespace_name(get_rel_namespace(indOid)),
    4370             :                                 get_rel_name(indOid))));
    4371             :                 /* Don't show rusage here, since it's not per index. */
    4372             :             }
    4373             : 
    4374           4 :             ereport(INFO,
    4375             :                     (errmsg("table \"%s.%s\" was reindexed",
    4376             :                             relationNamespace, relationName),
    4377             :                      errdetail("%s.",
    4378             :                                pg_rusage_show(&ru0))));
    4379             :         }
    4380             :     }
    4381             : 
    4382         386 :     MemoryContextDelete(private_context);
    4383             : 
    4384         386 :     pgstat_progress_end_command();
    4385             : 
    4386         386 :     return true;
    4387             : }
    4388             : 
    4389             : /*
    4390             :  * Insert or delete an appropriate pg_inherits tuple to make the given index
    4391             :  * be a partition of the indicated parent index.
    4392             :  *
    4393             :  * This also corrects the pg_depend information for the affected index.
    4394             :  */
    4395             : void
    4396         870 : IndexSetParentIndex(Relation partitionIdx, Oid parentOid)
    4397             : {
    4398             :     Relation    pg_inherits;
    4399             :     ScanKeyData key[2];
    4400             :     SysScanDesc scan;
    4401         870 :     Oid         partRelid = RelationGetRelid(partitionIdx);
    4402             :     HeapTuple   tuple;
    4403             :     bool        fix_dependencies;
    4404             : 
    4405             :     /* Make sure this is an index */
    4406             :     Assert(partitionIdx->rd_rel->relkind == RELKIND_INDEX ||
    4407             :            partitionIdx->rd_rel->relkind == RELKIND_PARTITIONED_INDEX);
    4408             : 
    4409             :     /*
    4410             :      * Scan pg_inherits for rows linking our index to some parent.
    4411             :      */
    4412         870 :     pg_inherits = relation_open(InheritsRelationId, RowExclusiveLock);
    4413         870 :     ScanKeyInit(&key[0],
    4414             :                 Anum_pg_inherits_inhrelid,
    4415             :                 BTEqualStrategyNumber, F_OIDEQ,
    4416             :                 ObjectIdGetDatum(partRelid));
    4417         870 :     ScanKeyInit(&key[1],
    4418             :                 Anum_pg_inherits_inhseqno,
    4419             :                 BTEqualStrategyNumber, F_INT4EQ,
    4420             :                 Int32GetDatum(1));
    4421         870 :     scan = systable_beginscan(pg_inherits, InheritsRelidSeqnoIndexId, true,
    4422             :                               NULL, 2, key);
    4423         870 :     tuple = systable_getnext(scan);
    4424             : 
    4425         870 :     if (!HeapTupleIsValid(tuple))
    4426             :     {
    4427         544 :         if (parentOid == InvalidOid)
    4428             :         {
    4429             :             /*
    4430             :              * No pg_inherits row, and no parent wanted: nothing to do in this
    4431             :              * case.
    4432             :              */
    4433           0 :             fix_dependencies = false;
    4434             :         }
    4435             :         else
    4436             :         {
    4437         544 :             StoreSingleInheritance(partRelid, parentOid, 1);
    4438         544 :             fix_dependencies = true;
    4439             :         }
    4440             :     }
    4441             :     else
    4442             :     {
    4443         326 :         Form_pg_inherits inhForm = (Form_pg_inherits) GETSTRUCT(tuple);
    4444             : 
    4445         326 :         if (parentOid == InvalidOid)
    4446             :         {
    4447             :             /*
    4448             :              * There exists a pg_inherits row, which we want to clear; do so.
    4449             :              */
    4450         326 :             CatalogTupleDelete(pg_inherits, &tuple->t_self);
    4451         326 :             fix_dependencies = true;
    4452             :         }
    4453             :         else
    4454             :         {
    4455             :             /*
    4456             :              * A pg_inherits row exists.  If it's the same we want, then we're
    4457             :              * good; if it differs, that amounts to a corrupt catalog and
    4458             :              * should not happen.
    4459             :              */
    4460           0 :             if (inhForm->inhparent != parentOid)
    4461             :             {
    4462             :                 /* unexpected: we should not get called in this case */
    4463           0 :                 elog(ERROR, "bogus pg_inherit row: inhrelid %u inhparent %u",
    4464             :                      inhForm->inhrelid, inhForm->inhparent);
    4465             :             }
    4466             : 
    4467             :             /* already in the right state */
    4468           0 :             fix_dependencies = false;
    4469             :         }
    4470             :     }
    4471             : 
    4472             :     /* done with pg_inherits */
    4473         870 :     systable_endscan(scan);
    4474         870 :     relation_close(pg_inherits, RowExclusiveLock);
    4475             : 
    4476             :     /* set relhassubclass if an index partition has been added to the parent */
    4477         870 :     if (OidIsValid(parentOid))
    4478         544 :         SetRelationHasSubclass(parentOid, true);
    4479             : 
    4480             :     /* set relispartition correctly on the partition */
    4481         870 :     update_relispartition(partRelid, OidIsValid(parentOid));
    4482             : 
    4483         870 :     if (fix_dependencies)
    4484             :     {
    4485             :         /*
    4486             :          * Insert/delete pg_depend rows.  If setting a parent, add PARTITION
    4487             :          * dependencies on the parent index and the table; if removing a
    4488             :          * parent, delete PARTITION dependencies.
    4489             :          */
    4490         870 :         if (OidIsValid(parentOid))
    4491             :         {
    4492             :             ObjectAddress partIdx;
    4493             :             ObjectAddress parentIdx;
    4494             :             ObjectAddress partitionTbl;
    4495             : 
    4496         544 :             ObjectAddressSet(partIdx, RelationRelationId, partRelid);
    4497         544 :             ObjectAddressSet(parentIdx, RelationRelationId, parentOid);
    4498         544 :             ObjectAddressSet(partitionTbl, RelationRelationId,
    4499             :                              partitionIdx->rd_index->indrelid);
    4500         544 :             recordDependencyOn(&partIdx, &parentIdx,
    4501             :                                DEPENDENCY_PARTITION_PRI);
    4502         544 :             recordDependencyOn(&partIdx, &partitionTbl,
    4503             :                                DEPENDENCY_PARTITION_SEC);
    4504             :         }
    4505             :         else
    4506             :         {
    4507         326 :             deleteDependencyRecordsForClass(RelationRelationId, partRelid,
    4508             :                                             RelationRelationId,
    4509             :                                             DEPENDENCY_PARTITION_PRI);
    4510         326 :             deleteDependencyRecordsForClass(RelationRelationId, partRelid,
    4511             :                                             RelationRelationId,
    4512             :                                             DEPENDENCY_PARTITION_SEC);
    4513             :         }
    4514             : 
    4515             :         /* make our updates visible */
    4516         870 :         CommandCounterIncrement();
    4517             :     }
    4518         870 : }
    4519             : 
    4520             : /*
    4521             :  * Subroutine of IndexSetParentIndex to update the relispartition flag of the
    4522             :  * given index to the given value.
    4523             :  */
    4524             : static void
    4525         870 : update_relispartition(Oid relationId, bool newval)
    4526             : {
    4527             :     HeapTuple   tup;
    4528             :     Relation    classRel;
    4529             : 
    4530         870 :     classRel = table_open(RelationRelationId, RowExclusiveLock);
    4531         870 :     tup = SearchSysCacheCopy1(RELOID, ObjectIdGetDatum(relationId));
    4532         870 :     if (!HeapTupleIsValid(tup))
    4533           0 :         elog(ERROR, "cache lookup failed for relation %u", relationId);
    4534             :     Assert(((Form_pg_class) GETSTRUCT(tup))->relispartition != newval);
    4535         870 :     ((Form_pg_class) GETSTRUCT(tup))->relispartition = newval;
    4536         870 :     CatalogTupleUpdate(classRel, &tup->t_self, tup);
    4537         870 :     heap_freetuple(tup);
    4538         870 :     table_close(classRel, RowExclusiveLock);
    4539         870 : }
    4540             : 
    4541             : /*
    4542             :  * Set the PROC_IN_SAFE_IC flag in MyProc->statusFlags.
    4543             :  *
    4544             :  * When doing concurrent index builds, we can set this flag
    4545             :  * to tell other processes concurrently running CREATE
    4546             :  * INDEX CONCURRENTLY or REINDEX CONCURRENTLY to ignore us when
    4547             :  * doing their waits for concurrent snapshots.  On one hand it
    4548             :  * avoids pointlessly waiting for a process that's not interesting
    4549             :  * anyway; but more importantly it avoids deadlocks in some cases.
    4550             :  *
    4551             :  * This can be done safely only for indexes that don't execute any
    4552             :  * expressions that could access other tables, so index must not be
    4553             :  * expressional nor partial.  Caller is responsible for only calling
    4554             :  * this routine when that assumption holds true.
    4555             :  *
    4556             :  * (The flag is reset automatically at transaction end, so it must be
    4557             :  * set for each transaction.)
    4558             :  */
    4559             : static inline void
    4560        1616 : set_indexsafe_procflags(void)
    4561             : {
    4562             :     /*
    4563             :      * This should only be called before installing xid or xmin in MyProc;
    4564             :      * otherwise, concurrent processes could see an Xmin that moves backwards.
    4565             :      */
    4566             :     Assert(MyProc->xid == InvalidTransactionId &&
    4567             :            MyProc->xmin == InvalidTransactionId);
    4568             : 
    4569        1616 :     LWLockAcquire(ProcArrayLock, LW_EXCLUSIVE);
    4570        1616 :     MyProc->statusFlags |= PROC_IN_SAFE_IC;
    4571        1616 :     ProcGlobal->statusFlags[MyProc->pgxactoff] = MyProc->statusFlags;
    4572        1616 :     LWLockRelease(ProcArrayLock);
    4573        1616 : }

Generated by: LCOV version 1.14