LCOV - code coverage report
Current view: top level - src/backend/commands - statscmds.c (source / functions) Hit Total Coverage
Test: PostgreSQL 18devel Lines: 252 278 90.6 %
Date: 2025-01-18 04:15:08 Functions: 8 8 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*-------------------------------------------------------------------------
       2             :  *
       3             :  * statscmds.c
       4             :  *    Commands for creating and altering extended statistics objects
       5             :  *
       6             :  * Portions Copyright (c) 1996-2025, PostgreSQL Global Development Group
       7             :  * Portions Copyright (c) 1994, Regents of the University of California
       8             :  *
       9             :  *
      10             :  * IDENTIFICATION
      11             :  *    src/backend/commands/statscmds.c
      12             :  *
      13             :  *-------------------------------------------------------------------------
      14             :  */
      15             : #include "postgres.h"
      16             : 
      17             : #include "access/relation.h"
      18             : #include "access/table.h"
      19             : #include "catalog/catalog.h"
      20             : #include "catalog/dependency.h"
      21             : #include "catalog/indexing.h"
      22             : #include "catalog/namespace.h"
      23             : #include "catalog/objectaccess.h"
      24             : #include "catalog/pg_namespace.h"
      25             : #include "catalog/pg_statistic_ext.h"
      26             : #include "catalog/pg_statistic_ext_data.h"
      27             : #include "commands/comment.h"
      28             : #include "commands/defrem.h"
      29             : #include "miscadmin.h"
      30             : #include "nodes/nodeFuncs.h"
      31             : #include "optimizer/optimizer.h"
      32             : #include "statistics/statistics.h"
      33             : #include "utils/acl.h"
      34             : #include "utils/builtins.h"
      35             : #include "utils/inval.h"
      36             : #include "utils/lsyscache.h"
      37             : #include "utils/rel.h"
      38             : #include "utils/syscache.h"
      39             : #include "utils/typcache.h"
      40             : 
      41             : 
      42             : static char *ChooseExtendedStatisticName(const char *name1, const char *name2,
      43             :                                          const char *label, Oid namespaceid);
      44             : static char *ChooseExtendedStatisticNameAddition(List *exprs);
      45             : 
      46             : 
      47             : /* qsort comparator for the attnums in CreateStatistics */
      48             : static int
      49         512 : compare_int16(const void *a, const void *b)
      50             : {
      51         512 :     int         av = *(const int16 *) a;
      52         512 :     int         bv = *(const int16 *) b;
      53             : 
      54             :     /* this can't overflow if int is wider than int16 */
      55         512 :     return (av - bv);
      56             : }
      57             : 
      58             : /*
      59             :  *      CREATE STATISTICS
      60             :  */
      61             : ObjectAddress
      62         632 : CreateStatistics(CreateStatsStmt *stmt)
      63             : {
      64             :     int16       attnums[STATS_MAX_DIMENSIONS];
      65         632 :     int         nattnums = 0;
      66             :     int         numcols;
      67             :     char       *namestr;
      68             :     NameData    stxname;
      69             :     Oid         statoid;
      70             :     Oid         namespaceId;
      71         632 :     Oid         stxowner = GetUserId();
      72             :     HeapTuple   htup;
      73             :     Datum       values[Natts_pg_statistic_ext];
      74             :     bool        nulls[Natts_pg_statistic_ext];
      75             :     int2vector *stxkeys;
      76         632 :     List       *stxexprs = NIL;
      77             :     Datum       exprsDatum;
      78             :     Relation    statrel;
      79         632 :     Relation    rel = NULL;
      80             :     Oid         relid;
      81             :     ObjectAddress parentobject,
      82             :                 myself;
      83             :     Datum       types[4];       /* one for each possible type of statistic */
      84             :     int         ntypes;
      85             :     ArrayType  *stxkind;
      86             :     bool        build_ndistinct;
      87             :     bool        build_dependencies;
      88             :     bool        build_mcv;
      89             :     bool        build_expressions;
      90         632 :     bool        requested_type = false;
      91             :     int         i;
      92             :     ListCell   *cell;
      93             :     ListCell   *cell2;
      94             : 
      95             :     Assert(IsA(stmt, CreateStatsStmt));
      96             : 
      97             :     /*
      98             :      * Examine the FROM clause.  Currently, we only allow it to be a single
      99             :      * simple table, but later we'll probably allow multiple tables and JOIN
     100             :      * syntax.  The grammar is already prepared for that, so we have to check
     101             :      * here that what we got is what we can support.
     102             :      */
     103         632 :     if (list_length(stmt->relations) != 1)
     104           0 :         ereport(ERROR,
     105             :                 (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     106             :                  errmsg("only a single relation is allowed in CREATE STATISTICS")));
     107             : 
     108        1234 :     foreach(cell, stmt->relations)
     109             :     {
     110         632 :         Node       *rln = (Node *) lfirst(cell);
     111             : 
     112         632 :         if (!IsA(rln, RangeVar))
     113           0 :             ereport(ERROR,
     114             :                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     115             :                      errmsg("only a single relation is allowed in CREATE STATISTICS")));
     116             : 
     117             :         /*
     118             :          * CREATE STATISTICS will influence future execution plans but does
     119             :          * not interfere with currently executing plans.  So it should be
     120             :          * enough to take only ShareUpdateExclusiveLock on relation,
     121             :          * conflicting with ANALYZE and other DDL that sets statistical
     122             :          * information, but not with normal queries.
     123             :          */
     124         632 :         rel = relation_openrv((RangeVar *) rln, ShareUpdateExclusiveLock);
     125             : 
     126             :         /* Restrict to allowed relation types */
     127         632 :         if (rel->rd_rel->relkind != RELKIND_RELATION &&
     128          54 :             rel->rd_rel->relkind != RELKIND_MATVIEW &&
     129          48 :             rel->rd_rel->relkind != RELKIND_FOREIGN_TABLE &&
     130          42 :             rel->rd_rel->relkind != RELKIND_PARTITIONED_TABLE)
     131          30 :             ereport(ERROR,
     132             :                     (errcode(ERRCODE_WRONG_OBJECT_TYPE),
     133             :                      errmsg("cannot define statistics for relation \"%s\"",
     134             :                             RelationGetRelationName(rel)),
     135             :                      errdetail_relkind_not_supported(rel->rd_rel->relkind)));
     136             : 
     137             :         /* You must own the relation to create stats on it */
     138         602 :         if (!object_ownercheck(RelationRelationId, RelationGetRelid(rel), stxowner))
     139           0 :             aclcheck_error(ACLCHECK_NOT_OWNER, get_relkind_objtype(rel->rd_rel->relkind),
     140           0 :                            RelationGetRelationName(rel));
     141             : 
     142             :         /* Creating statistics on system catalogs is not allowed */
     143         602 :         if (!allowSystemTableMods && IsSystemRelation(rel))
     144           0 :             ereport(ERROR,
     145             :                     (errcode(ERRCODE_INSUFFICIENT_PRIVILEGE),
     146             :                      errmsg("permission denied: \"%s\" is a system catalog",
     147             :                             RelationGetRelationName(rel))));
     148             :     }
     149             : 
     150             :     Assert(rel);
     151         602 :     relid = RelationGetRelid(rel);
     152             : 
     153             :     /*
     154             :      * If the node has a name, split it up and determine creation namespace.
     155             :      * If not, put the object in the same namespace as the relation, and cons
     156             :      * up a name for it.  (This can happen either via "CREATE STATISTICS ..."
     157             :      * or via "CREATE TABLE ... (LIKE)".)
     158             :      */
     159         602 :     if (stmt->defnames)
     160         518 :         namespaceId = QualifiedNameGetCreationNamespace(stmt->defnames,
     161             :                                                         &namestr);
     162             :     else
     163             :     {
     164          84 :         namespaceId = RelationGetNamespace(rel);
     165          84 :         namestr = ChooseExtendedStatisticName(RelationGetRelationName(rel),
     166          84 :                                               ChooseExtendedStatisticNameAddition(stmt->exprs),
     167             :                                               "stat",
     168             :                                               namespaceId);
     169             :     }
     170         602 :     namestrcpy(&stxname, namestr);
     171             : 
     172             :     /*
     173             :      * Deal with the possibility that the statistics object already exists.
     174             :      */
     175         602 :     if (SearchSysCacheExists2(STATEXTNAMENSP,
     176             :                               CStringGetDatum(namestr),
     177             :                               ObjectIdGetDatum(namespaceId)))
     178             :     {
     179           6 :         if (stmt->if_not_exists)
     180             :         {
     181             :             /*
     182             :              * Since stats objects aren't members of extensions (see comments
     183             :              * below), no need for checkMembershipInCurrentExtension here.
     184             :              */
     185           6 :             ereport(NOTICE,
     186             :                     (errcode(ERRCODE_DUPLICATE_OBJECT),
     187             :                      errmsg("statistics object \"%s\" already exists, skipping",
     188             :                             namestr)));
     189           6 :             relation_close(rel, NoLock);
     190           6 :             return InvalidObjectAddress;
     191             :         }
     192             : 
     193           0 :         ereport(ERROR,
     194             :                 (errcode(ERRCODE_DUPLICATE_OBJECT),
     195             :                  errmsg("statistics object \"%s\" already exists", namestr)));
     196             :     }
     197             : 
     198             :     /*
     199             :      * Make sure no more than STATS_MAX_DIMENSIONS columns are used. There
     200             :      * might be duplicates and so on, but we'll deal with those later.
     201             :      */
     202         596 :     numcols = list_length(stmt->exprs);
     203         596 :     if (numcols > STATS_MAX_DIMENSIONS)
     204          18 :         ereport(ERROR,
     205             :                 (errcode(ERRCODE_TOO_MANY_COLUMNS),
     206             :                  errmsg("cannot have more than %d columns in statistics",
     207             :                         STATS_MAX_DIMENSIONS)));
     208             : 
     209             :     /*
     210             :      * Convert the expression list to a simple array of attnums, but also keep
     211             :      * a list of more complex expressions.  While at it, enforce some
     212             :      * constraints - we don't allow extended statistics on system attributes,
     213             :      * and we require the data type to have a less-than operator.
     214             :      *
     215             :      * There are many ways to "mask" a simple attribute reference as an
     216             :      * expression, for example "(a+0)" etc. We can't possibly detect all of
     217             :      * them, but we handle at least the simple case with the attribute in
     218             :      * parens. There'll always be a way around this, if the user is determined
     219             :      * (like the "(a+0)" example), but this makes it somewhat consistent with
     220             :      * how indexes treat attributes/expressions.
     221             :      */
     222        1916 :     foreach(cell, stmt->exprs)
     223             :     {
     224        1344 :         StatsElem  *selem = lfirst_node(StatsElem, cell);
     225             : 
     226        1344 :         if (selem->name)     /* column reference */
     227             :         {
     228             :             char       *attname;
     229             :             HeapTuple   atttuple;
     230             :             Form_pg_attribute attForm;
     231             :             TypeCacheEntry *type;
     232             : 
     233         954 :             attname = selem->name;
     234             : 
     235         954 :             atttuple = SearchSysCacheAttName(relid, attname);
     236         954 :             if (!HeapTupleIsValid(atttuple))
     237           6 :                 ereport(ERROR,
     238             :                         (errcode(ERRCODE_UNDEFINED_COLUMN),
     239             :                          errmsg("column \"%s\" does not exist",
     240             :                                 attname)));
     241         948 :             attForm = (Form_pg_attribute) GETSTRUCT(atttuple);
     242             : 
     243             :             /* Disallow use of system attributes in extended stats */
     244         948 :             if (attForm->attnum <= 0)
     245           0 :                 ereport(ERROR,
     246             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     247             :                          errmsg("statistics creation on system columns is not supported")));
     248             : 
     249             :             /* Disallow data types without a less-than operator */
     250         948 :             type = lookup_type_cache(attForm->atttypid, TYPECACHE_LT_OPR);
     251         948 :             if (type->lt_opr == InvalidOid)
     252           0 :                 ereport(ERROR,
     253             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     254             :                          errmsg("column \"%s\" cannot be used in statistics because its type %s has no default btree operator class",
     255             :                                 attname, format_type_be(attForm->atttypid))));
     256             : 
     257         948 :             attnums[nattnums] = attForm->attnum;
     258         948 :             nattnums++;
     259         948 :             ReleaseSysCache(atttuple);
     260             :         }
     261         390 :         else if (IsA(selem->expr, Var)) /* column reference in parens */
     262             :         {
     263           6 :             Var        *var = (Var *) selem->expr;
     264             :             TypeCacheEntry *type;
     265             : 
     266             :             /* Disallow use of system attributes in extended stats */
     267           6 :             if (var->varattno <= 0)
     268           0 :                 ereport(ERROR,
     269             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     270             :                          errmsg("statistics creation on system columns is not supported")));
     271             : 
     272             :             /* Disallow data types without a less-than operator */
     273           6 :             type = lookup_type_cache(var->vartype, TYPECACHE_LT_OPR);
     274           6 :             if (type->lt_opr == InvalidOid)
     275           0 :                 ereport(ERROR,
     276             :                         (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     277             :                          errmsg("column \"%s\" cannot be used in statistics because its type %s has no default btree operator class",
     278             :                                 get_attname(relid, var->varattno, false), format_type_be(var->vartype))));
     279             : 
     280           6 :             attnums[nattnums] = var->varattno;
     281           6 :             nattnums++;
     282             :         }
     283             :         else                    /* expression */
     284             :         {
     285         384 :             Node       *expr = selem->expr;
     286             :             Oid         atttype;
     287             :             TypeCacheEntry *type;
     288         384 :             Bitmapset  *attnums = NULL;
     289             :             int         k;
     290             : 
     291             :             Assert(expr != NULL);
     292             : 
     293             :             /* Disallow expressions referencing system attributes. */
     294         384 :             pull_varattnos(expr, 1, &attnums);
     295             : 
     296         384 :             k = -1;
     297         894 :             while ((k = bms_next_member(attnums, k)) >= 0)
     298             :             {
     299         510 :                 AttrNumber  attnum = k + FirstLowInvalidHeapAttributeNumber;
     300             : 
     301         510 :                 if (attnum <= 0)
     302           0 :                     ereport(ERROR,
     303             :                             (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     304             :                              errmsg("statistics creation on system columns is not supported")));
     305             :             }
     306             : 
     307             :             /*
     308             :              * Disallow data types without a less-than operator.
     309             :              *
     310             :              * We ignore this for statistics on a single expression, in which
     311             :              * case we'll build the regular statistics only (and that code can
     312             :              * deal with such data types).
     313             :              */
     314         384 :             if (list_length(stmt->exprs) > 1)
     315             :             {
     316         304 :                 atttype = exprType(expr);
     317         304 :                 type = lookup_type_cache(atttype, TYPECACHE_LT_OPR);
     318         304 :                 if (type->lt_opr == InvalidOid)
     319           0 :                     ereport(ERROR,
     320             :                             (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     321             :                              errmsg("expression cannot be used in multivariate statistics because its type %s has no default btree operator class",
     322             :                                     format_type_be(atttype))));
     323             :             }
     324             : 
     325         384 :             stxexprs = lappend(stxexprs, expr);
     326             :         }
     327             :     }
     328             : 
     329             :     /*
     330             :      * Parse the statistics kinds.
     331             :      *
     332             :      * First check that if this is the case with a single expression, there
     333             :      * are no statistics kinds specified (we don't allow that for the simple
     334             :      * CREATE STATISTICS form).
     335             :      */
     336         572 :     if ((list_length(stmt->exprs) == 1) && (list_length(stxexprs) == 1))
     337             :     {
     338             :         /* statistics kinds not specified */
     339          80 :         if (stmt->stat_types != NIL)
     340           0 :             ereport(ERROR,
     341             :                     (errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
     342             :                      errmsg("when building statistics on a single expression, statistics kinds may not be specified")));
     343             :     }
     344             : 
     345             :     /* OK, let's check that we recognize the statistics kinds. */
     346         572 :     build_ndistinct = false;
     347         572 :     build_dependencies = false;
     348         572 :     build_mcv = false;
     349         924 :     foreach(cell, stmt->stat_types)
     350             :     {
     351         358 :         char       *type = strVal(lfirst(cell));
     352             : 
     353         358 :         if (strcmp(type, "ndistinct") == 0)
     354             :         {
     355          98 :             build_ndistinct = true;
     356          98 :             requested_type = true;
     357             :         }
     358         260 :         else if (strcmp(type, "dependencies") == 0)
     359             :         {
     360          84 :             build_dependencies = true;
     361          84 :             requested_type = true;
     362             :         }
     363         176 :         else if (strcmp(type, "mcv") == 0)
     364             :         {
     365         170 :             build_mcv = true;
     366         170 :             requested_type = true;
     367             :         }
     368             :         else
     369           6 :             ereport(ERROR,
     370             :                     (errcode(ERRCODE_SYNTAX_ERROR),
     371             :                      errmsg("unrecognized statistics kind \"%s\"",
     372             :                             type)));
     373             :     }
     374             : 
     375             :     /*
     376             :      * If no statistic type was specified, build them all (but only when the
     377             :      * statistics is defined on more than one column/expression).
     378             :      */
     379         566 :     if ((!requested_type) && (numcols >= 2))
     380             :     {
     381         188 :         build_ndistinct = true;
     382         188 :         build_dependencies = true;
     383         188 :         build_mcv = true;
     384             :     }
     385             : 
     386             :     /*
     387             :      * When there are non-trivial expressions, build the expression stats
     388             :      * automatically. This allows calculating good estimates for stats that
     389             :      * consider per-clause estimates (e.g. functional dependencies).
     390             :      */
     391         566 :     build_expressions = (stxexprs != NIL);
     392             : 
     393             :     /*
     394             :      * Check that at least two columns were specified in the statement, or
     395             :      * that we're building statistics on a single expression.
     396             :      */
     397         566 :     if ((numcols < 2) && (list_length(stxexprs) != 1))
     398           6 :         ereport(ERROR,
     399             :                 (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
     400             :                  errmsg("extended statistics require at least 2 columns")));
     401             : 
     402             :     /*
     403             :      * Sort the attnums, which makes detecting duplicates somewhat easier, and
     404             :      * it does not hurt (it does not matter for the contents, unlike for
     405             :      * indexes, for example).
     406             :      */
     407         560 :     qsort(attnums, nattnums, sizeof(int16), compare_int16);
     408             : 
     409             :     /*
     410             :      * Check for duplicates in the list of columns. The attnums are sorted so
     411             :      * just check consecutive elements.
     412             :      */
     413        1060 :     for (i = 1; i < nattnums; i++)
     414             :     {
     415         506 :         if (attnums[i] == attnums[i - 1])
     416           6 :             ereport(ERROR,
     417             :                     (errcode(ERRCODE_DUPLICATE_COLUMN),
     418             :                      errmsg("duplicate column name in statistics definition")));
     419             :     }
     420             : 
     421             :     /*
     422             :      * Check for duplicate expressions. We do two loops, counting the
     423             :      * occurrences of each expression. This is O(N^2) but we only allow small
     424             :      * number of expressions and it's not executed often.
     425             :      *
     426             :      * XXX We don't cross-check attributes and expressions, because it does
     427             :      * not seem worth it. In principle we could check that expressions don't
     428             :      * contain trivial attribute references like "(a)", but the reasoning is
     429             :      * similar to why we don't bother with extracting columns from
     430             :      * expressions. It's either expensive or very easy to defeat for
     431             :      * determined user, and there's no risk if we allow such statistics (the
     432             :      * statistics is useless, but harmless).
     433             :      */
     434         926 :     foreach(cell, stxexprs)
     435             :     {
     436         378 :         Node       *expr1 = (Node *) lfirst(cell);
     437         378 :         int         cnt = 0;
     438             : 
     439        1222 :         foreach(cell2, stxexprs)
     440             :         {
     441         844 :             Node       *expr2 = (Node *) lfirst(cell2);
     442             : 
     443         844 :             if (equal(expr1, expr2))
     444         384 :                 cnt += 1;
     445             :         }
     446             : 
     447             :         /* every expression should find at least itself */
     448             :         Assert(cnt >= 1);
     449             : 
     450         378 :         if (cnt > 1)
     451           6 :             ereport(ERROR,
     452             :                     (errcode(ERRCODE_DUPLICATE_COLUMN),
     453             :                      errmsg("duplicate expression in statistics definition")));
     454             :     }
     455             : 
     456             :     /* Form an int2vector representation of the sorted column list */
     457         548 :     stxkeys = buildint2vector(attnums, nattnums);
     458             : 
     459             :     /* construct the char array of enabled statistic types */
     460         548 :     ntypes = 0;
     461         548 :     if (build_ndistinct)
     462         274 :         types[ntypes++] = CharGetDatum(STATS_EXT_NDISTINCT);
     463         548 :     if (build_dependencies)
     464         260 :         types[ntypes++] = CharGetDatum(STATS_EXT_DEPENDENCIES);
     465         548 :     if (build_mcv)
     466         346 :         types[ntypes++] = CharGetDatum(STATS_EXT_MCV);
     467         548 :     if (build_expressions)
     468         210 :         types[ntypes++] = CharGetDatum(STATS_EXT_EXPRESSIONS);
     469             :     Assert(ntypes > 0 && ntypes <= lengthof(types));
     470         548 :     stxkind = construct_array_builtin(types, ntypes, CHAROID);
     471             : 
     472             :     /* convert the expressions (if any) to a text datum */
     473         548 :     if (stxexprs != NIL)
     474             :     {
     475             :         char       *exprsString;
     476             : 
     477         210 :         exprsString = nodeToString(stxexprs);
     478         210 :         exprsDatum = CStringGetTextDatum(exprsString);
     479         210 :         pfree(exprsString);
     480             :     }
     481             :     else
     482         338 :         exprsDatum = (Datum) 0;
     483             : 
     484         548 :     statrel = table_open(StatisticExtRelationId, RowExclusiveLock);
     485             : 
     486             :     /*
     487             :      * Everything seems fine, so let's build the pg_statistic_ext tuple.
     488             :      */
     489         548 :     memset(values, 0, sizeof(values));
     490         548 :     memset(nulls, false, sizeof(nulls));
     491             : 
     492         548 :     statoid = GetNewOidWithIndex(statrel, StatisticExtOidIndexId,
     493             :                                  Anum_pg_statistic_ext_oid);
     494         548 :     values[Anum_pg_statistic_ext_oid - 1] = ObjectIdGetDatum(statoid);
     495         548 :     values[Anum_pg_statistic_ext_stxrelid - 1] = ObjectIdGetDatum(relid);
     496         548 :     values[Anum_pg_statistic_ext_stxname - 1] = NameGetDatum(&stxname);
     497         548 :     values[Anum_pg_statistic_ext_stxnamespace - 1] = ObjectIdGetDatum(namespaceId);
     498         548 :     values[Anum_pg_statistic_ext_stxowner - 1] = ObjectIdGetDatum(stxowner);
     499         548 :     values[Anum_pg_statistic_ext_stxkeys - 1] = PointerGetDatum(stxkeys);
     500         548 :     nulls[Anum_pg_statistic_ext_stxstattarget - 1] = true;
     501         548 :     values[Anum_pg_statistic_ext_stxkind - 1] = PointerGetDatum(stxkind);
     502             : 
     503         548 :     values[Anum_pg_statistic_ext_stxexprs - 1] = exprsDatum;
     504         548 :     if (exprsDatum == (Datum) 0)
     505         338 :         nulls[Anum_pg_statistic_ext_stxexprs - 1] = true;
     506             : 
     507             :     /* insert it into pg_statistic_ext */
     508         548 :     htup = heap_form_tuple(statrel->rd_att, values, nulls);
     509         548 :     CatalogTupleInsert(statrel, htup);
     510         548 :     heap_freetuple(htup);
     511             : 
     512         548 :     relation_close(statrel, RowExclusiveLock);
     513             : 
     514             :     /*
     515             :      * We used to create the pg_statistic_ext_data tuple too, but it's not
     516             :      * clear what value should the stxdinherit flag have (it depends on
     517             :      * whether the rel is partitioned, contains data, etc.)
     518             :      */
     519             : 
     520         548 :     InvokeObjectPostCreateHook(StatisticExtRelationId, statoid, 0);
     521             : 
     522             :     /*
     523             :      * Invalidate relcache so that others see the new statistics object.
     524             :      */
     525         548 :     CacheInvalidateRelcache(rel);
     526             : 
     527         548 :     relation_close(rel, NoLock);
     528             : 
     529             :     /*
     530             :      * Add an AUTO dependency on each column used in the stats, so that the
     531             :      * stats object goes away if any or all of them get dropped.
     532             :      */
     533         548 :     ObjectAddressSet(myself, StatisticExtRelationId, statoid);
     534             : 
     535             :     /* add dependencies for plain column references */
     536        1460 :     for (i = 0; i < nattnums; i++)
     537             :     {
     538         912 :         ObjectAddressSubSet(parentobject, RelationRelationId, relid, attnums[i]);
     539         912 :         recordDependencyOn(&myself, &parentobject, DEPENDENCY_AUTO);
     540             :     }
     541             : 
     542             :     /*
     543             :      * If there are no dependencies on a column, give the statistics object an
     544             :      * auto dependency on the whole table.  In most cases, this will be
     545             :      * redundant, but it might not be if the statistics expressions contain no
     546             :      * Vars (which might seem strange but possible). This is consistent with
     547             :      * what we do for indexes in index_create.
     548             :      *
     549             :      * XXX We intentionally don't consider the expressions before adding this
     550             :      * dependency, because recordDependencyOnSingleRelExpr may not create any
     551             :      * dependencies for whole-row Vars.
     552             :      */
     553         548 :     if (!nattnums)
     554             :     {
     555         136 :         ObjectAddressSet(parentobject, RelationRelationId, relid);
     556         136 :         recordDependencyOn(&myself, &parentobject, DEPENDENCY_AUTO);
     557             :     }
     558             : 
     559             :     /*
     560             :      * Store dependencies on anything mentioned in statistics expressions,
     561             :      * just like we do for index expressions.
     562             :      */
     563         548 :     if (stxexprs)
     564         210 :         recordDependencyOnSingleRelExpr(&myself,
     565             :                                         (Node *) stxexprs,
     566             :                                         relid,
     567             :                                         DEPENDENCY_NORMAL,
     568             :                                         DEPENDENCY_AUTO, false);
     569             : 
     570             :     /*
     571             :      * Also add dependencies on namespace and owner.  These are required
     572             :      * because the stats object might have a different namespace and/or owner
     573             :      * than the underlying table(s).
     574             :      */
     575         548 :     ObjectAddressSet(parentobject, NamespaceRelationId, namespaceId);
     576         548 :     recordDependencyOn(&myself, &parentobject, DEPENDENCY_NORMAL);
     577             : 
     578         548 :     recordDependencyOnOwner(StatisticExtRelationId, statoid, stxowner);
     579             : 
     580             :     /*
     581             :      * XXX probably there should be a recordDependencyOnCurrentExtension call
     582             :      * here too, but we'd have to add support for ALTER EXTENSION ADD/DROP
     583             :      * STATISTICS, which is more work than it seems worth.
     584             :      */
     585             : 
     586             :     /* Add any requested comment */
     587         548 :     if (stmt->stxcomment != NULL)
     588          36 :         CreateComments(statoid, StatisticExtRelationId, 0,
     589          36 :                        stmt->stxcomment);
     590             : 
     591             :     /* Return stats object's address */
     592         548 :     return myself;
     593             : }
     594             : 
     595             : /*
     596             :  *      ALTER STATISTICS
     597             :  */
     598             : ObjectAddress
     599          26 : AlterStatistics(AlterStatsStmt *stmt)
     600             : {
     601             :     Relation    rel;
     602             :     Oid         stxoid;
     603             :     HeapTuple   oldtup;
     604             :     HeapTuple   newtup;
     605             :     Datum       repl_val[Natts_pg_statistic_ext];
     606             :     bool        repl_null[Natts_pg_statistic_ext];
     607             :     bool        repl_repl[Natts_pg_statistic_ext];
     608             :     ObjectAddress address;
     609          26 :     int         newtarget = 0;
     610             :     bool        newtarget_default;
     611             : 
     612             :     /* -1 was used in previous versions for the default setting */
     613          26 :     if (stmt->stxstattarget && intVal(stmt->stxstattarget) != -1)
     614             :     {
     615          20 :         newtarget = intVal(stmt->stxstattarget);
     616          20 :         newtarget_default = false;
     617             :     }
     618             :     else
     619           6 :         newtarget_default = true;
     620             : 
     621          26 :     if (!newtarget_default)
     622             :     {
     623             :         /* Limit statistics target to a sane range */
     624          20 :         if (newtarget < 0)
     625             :         {
     626           0 :             ereport(ERROR,
     627             :                     (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
     628             :                      errmsg("statistics target %d is too low",
     629             :                             newtarget)));
     630             :         }
     631          20 :         else if (newtarget > MAX_STATISTICS_TARGET)
     632             :         {
     633           0 :             newtarget = MAX_STATISTICS_TARGET;
     634           0 :             ereport(WARNING,
     635             :                     (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
     636             :                      errmsg("lowering statistics target to %d",
     637             :                             newtarget)));
     638             :         }
     639             :     }
     640             : 
     641             :     /* lookup OID of the statistics object */
     642          26 :     stxoid = get_statistics_object_oid(stmt->defnames, stmt->missing_ok);
     643             : 
     644             :     /*
     645             :      * If we got here and the OID is not valid, it means the statistics object
     646             :      * does not exist, but the command specified IF EXISTS. So report this as
     647             :      * a simple NOTICE and we're done.
     648             :      */
     649          20 :     if (!OidIsValid(stxoid))
     650             :     {
     651             :         char       *schemaname;
     652             :         char       *statname;
     653             : 
     654             :         Assert(stmt->missing_ok);
     655             : 
     656           6 :         DeconstructQualifiedName(stmt->defnames, &schemaname, &statname);
     657             : 
     658           6 :         if (schemaname)
     659           0 :             ereport(NOTICE,
     660             :                     (errmsg("statistics object \"%s.%s\" does not exist, skipping",
     661             :                             schemaname, statname)));
     662             :         else
     663           6 :             ereport(NOTICE,
     664             :                     (errmsg("statistics object \"%s\" does not exist, skipping",
     665             :                             statname)));
     666             : 
     667           6 :         return InvalidObjectAddress;
     668             :     }
     669             : 
     670             :     /* Search pg_statistic_ext */
     671          14 :     rel = table_open(StatisticExtRelationId, RowExclusiveLock);
     672             : 
     673          14 :     oldtup = SearchSysCache1(STATEXTOID, ObjectIdGetDatum(stxoid));
     674          14 :     if (!HeapTupleIsValid(oldtup))
     675           0 :         elog(ERROR, "cache lookup failed for extended statistics object %u", stxoid);
     676             : 
     677             :     /* Must be owner of the existing statistics object */
     678          14 :     if (!object_ownercheck(StatisticExtRelationId, stxoid, GetUserId()))
     679           0 :         aclcheck_error(ACLCHECK_NOT_OWNER, OBJECT_STATISTIC_EXT,
     680           0 :                        NameListToString(stmt->defnames));
     681             : 
     682             :     /* Build new tuple. */
     683          14 :     memset(repl_val, 0, sizeof(repl_val));
     684          14 :     memset(repl_null, false, sizeof(repl_null));
     685          14 :     memset(repl_repl, false, sizeof(repl_repl));
     686             : 
     687             :     /* replace the stxstattarget column */
     688          14 :     repl_repl[Anum_pg_statistic_ext_stxstattarget - 1] = true;
     689          14 :     if (!newtarget_default)
     690           8 :         repl_val[Anum_pg_statistic_ext_stxstattarget - 1] = Int16GetDatum(newtarget);
     691             :     else
     692           6 :         repl_null[Anum_pg_statistic_ext_stxstattarget - 1] = true;
     693             : 
     694          14 :     newtup = heap_modify_tuple(oldtup, RelationGetDescr(rel),
     695             :                                repl_val, repl_null, repl_repl);
     696             : 
     697             :     /* Update system catalog. */
     698          14 :     CatalogTupleUpdate(rel, &newtup->t_self, newtup);
     699             : 
     700          14 :     InvokeObjectPostAlterHook(StatisticExtRelationId, stxoid, 0);
     701             : 
     702          14 :     ObjectAddressSet(address, StatisticExtRelationId, stxoid);
     703             : 
     704             :     /*
     705             :      * NOTE: because we only support altering the statistics target, not the
     706             :      * other fields, there is no need to update dependencies.
     707             :      */
     708             : 
     709          14 :     heap_freetuple(newtup);
     710          14 :     ReleaseSysCache(oldtup);
     711             : 
     712          14 :     table_close(rel, RowExclusiveLock);
     713             : 
     714          14 :     return address;
     715             : }
     716             : 
     717             : /*
     718             :  * Delete entry in pg_statistic_ext_data catalog. We don't know if the row
     719             :  * exists, so don't error out.
     720             :  */
     721             : void
     722        1370 : RemoveStatisticsDataById(Oid statsOid, bool inh)
     723             : {
     724             :     Relation    relation;
     725             :     HeapTuple   tup;
     726             : 
     727        1370 :     relation = table_open(StatisticExtDataRelationId, RowExclusiveLock);
     728             : 
     729        1370 :     tup = SearchSysCache2(STATEXTDATASTXOID, ObjectIdGetDatum(statsOid),
     730             :                           BoolGetDatum(inh));
     731             : 
     732             :     /* We don't know if the data row for inh value exists. */
     733        1370 :     if (HeapTupleIsValid(tup))
     734             :     {
     735         354 :         CatalogTupleDelete(relation, &tup->t_self);
     736             : 
     737         354 :         ReleaseSysCache(tup);
     738             :     }
     739             : 
     740        1370 :     table_close(relation, RowExclusiveLock);
     741        1370 : }
     742             : 
     743             : /*
     744             :  * Guts of statistics object deletion.
     745             :  */
     746             : void
     747         496 : RemoveStatisticsById(Oid statsOid)
     748             : {
     749             :     Relation    relation;
     750             :     Relation    rel;
     751             :     HeapTuple   tup;
     752             :     Form_pg_statistic_ext statext;
     753             :     Oid         relid;
     754             : 
     755             :     /*
     756             :      * Delete the pg_statistic_ext tuple.  Also send out a cache inval on the
     757             :      * associated table, so that dependent plans will be rebuilt.
     758             :      */
     759         496 :     relation = table_open(StatisticExtRelationId, RowExclusiveLock);
     760             : 
     761         496 :     tup = SearchSysCache1(STATEXTOID, ObjectIdGetDatum(statsOid));
     762             : 
     763         496 :     if (!HeapTupleIsValid(tup)) /* should not happen */
     764           0 :         elog(ERROR, "cache lookup failed for statistics object %u", statsOid);
     765             : 
     766         496 :     statext = (Form_pg_statistic_ext) GETSTRUCT(tup);
     767         496 :     relid = statext->stxrelid;
     768             : 
     769             :     /*
     770             :      * Delete the pg_statistic_ext_data tuples holding the actual statistical
     771             :      * data. There might be data with/without inheritance, so attempt deleting
     772             :      * both. We lock the user table first, to prevent other processes (e.g.
     773             :      * DROP STATISTICS) from removing the row concurrently.
     774             :      */
     775         496 :     rel = table_open(relid, ShareUpdateExclusiveLock);
     776             : 
     777         496 :     RemoveStatisticsDataById(statsOid, true);
     778         496 :     RemoveStatisticsDataById(statsOid, false);
     779             : 
     780         496 :     CacheInvalidateRelcacheByRelid(relid);
     781             : 
     782         496 :     CatalogTupleDelete(relation, &tup->t_self);
     783             : 
     784         496 :     ReleaseSysCache(tup);
     785             : 
     786             :     /* Keep lock until the end of the transaction. */
     787         496 :     table_close(rel, NoLock);
     788             : 
     789         496 :     table_close(relation, RowExclusiveLock);
     790         496 : }
     791             : 
     792             : /*
     793             :  * Select a nonconflicting name for a new statistics object.
     794             :  *
     795             :  * name1, name2, and label are used the same way as for makeObjectName(),
     796             :  * except that the label can't be NULL; digits will be appended to the label
     797             :  * if needed to create a name that is unique within the specified namespace.
     798             :  *
     799             :  * Returns a palloc'd string.
     800             :  *
     801             :  * Note: it is theoretically possible to get a collision anyway, if someone
     802             :  * else chooses the same name concurrently.  This is fairly unlikely to be
     803             :  * a problem in practice, especially if one is holding a share update
     804             :  * exclusive lock on the relation identified by name1.  However, if choosing
     805             :  * multiple names within a single command, you'd better create the new object
     806             :  * and do CommandCounterIncrement before choosing the next one!
     807             :  */
     808             : static char *
     809          84 : ChooseExtendedStatisticName(const char *name1, const char *name2,
     810             :                             const char *label, Oid namespaceid)
     811             : {
     812          84 :     int         pass = 0;
     813          84 :     char       *stxname = NULL;
     814             :     char        modlabel[NAMEDATALEN];
     815             : 
     816             :     /* try the unmodified label first */
     817          84 :     strlcpy(modlabel, label, sizeof(modlabel));
     818             : 
     819             :     for (;;)
     820          24 :     {
     821             :         Oid         existingstats;
     822             : 
     823         108 :         stxname = makeObjectName(name1, name2, modlabel);
     824             : 
     825         108 :         existingstats = GetSysCacheOid2(STATEXTNAMENSP, Anum_pg_statistic_ext_oid,
     826             :                                         PointerGetDatum(stxname),
     827             :                                         ObjectIdGetDatum(namespaceid));
     828         108 :         if (!OidIsValid(existingstats))
     829          84 :             break;
     830             : 
     831             :         /* found a conflict, so try a new name component */
     832          24 :         pfree(stxname);
     833          24 :         snprintf(modlabel, sizeof(modlabel), "%s%d", label, ++pass);
     834             :     }
     835             : 
     836          84 :     return stxname;
     837             : }
     838             : 
     839             : /*
     840             :  * Generate "name2" for a new statistics object given the list of column
     841             :  * names for it.  This will be passed to ChooseExtendedStatisticName along
     842             :  * with the parent table name and a suitable label.
     843             :  *
     844             :  * We know that less than NAMEDATALEN characters will actually be used,
     845             :  * so we can truncate the result once we've generated that many.
     846             :  *
     847             :  * XXX see also ChooseForeignKeyConstraintNameAddition and
     848             :  * ChooseIndexNameAddition.
     849             :  */
     850             : static char *
     851          84 : ChooseExtendedStatisticNameAddition(List *exprs)
     852             : {
     853             :     char        buf[NAMEDATALEN * 2];
     854          84 :     int         buflen = 0;
     855             :     ListCell   *lc;
     856             : 
     857          84 :     buf[0] = '\0';
     858         252 :     foreach(lc, exprs)
     859             :     {
     860         168 :         StatsElem  *selem = (StatsElem *) lfirst(lc);
     861             :         const char *name;
     862             : 
     863             :         /* It should be one of these, but just skip if it happens not to be */
     864         168 :         if (!IsA(selem, StatsElem))
     865           0 :             continue;
     866             : 
     867         168 :         name = selem->name;
     868             : 
     869         168 :         if (buflen > 0)
     870          84 :             buf[buflen++] = '_';    /* insert _ between names */
     871             : 
     872             :         /*
     873             :          * We use fixed 'expr' for expressions, which have empty column names.
     874             :          * For indexes this is handled in ChooseIndexColumnNames, but we have
     875             :          * no such function for stats and it does not seem worth adding. If a
     876             :          * better name is needed, the user can specify it explicitly.
     877             :          */
     878         168 :         if (!name)
     879          60 :             name = "expr";
     880             : 
     881             :         /*
     882             :          * At this point we have buflen <= NAMEDATALEN.  name should be less
     883             :          * than NAMEDATALEN already, but use strlcpy for paranoia.
     884             :          */
     885         168 :         strlcpy(buf + buflen, name, NAMEDATALEN);
     886         168 :         buflen += strlen(buf + buflen);
     887         168 :         if (buflen >= NAMEDATALEN)
     888           0 :             break;
     889             :     }
     890          84 :     return pstrdup(buf);
     891             : }
     892             : 
     893             : /*
     894             :  * StatisticsGetRelation: given a statistics object's OID, get the OID of
     895             :  * the relation it is defined on.  Uses the system cache.
     896             :  */
     897             : Oid
     898          14 : StatisticsGetRelation(Oid statId, bool missing_ok)
     899             : {
     900             :     HeapTuple   tuple;
     901             :     Form_pg_statistic_ext stx;
     902             :     Oid         result;
     903             : 
     904          14 :     tuple = SearchSysCache1(STATEXTOID, ObjectIdGetDatum(statId));
     905          14 :     if (!HeapTupleIsValid(tuple))
     906             :     {
     907           0 :         if (missing_ok)
     908           0 :             return InvalidOid;
     909           0 :         elog(ERROR, "cache lookup failed for statistics object %u", statId);
     910             :     }
     911          14 :     stx = (Form_pg_statistic_ext) GETSTRUCT(tuple);
     912             :     Assert(stx->oid == statId);
     913             : 
     914          14 :     result = stx->stxrelid;
     915          14 :     ReleaseSysCache(tuple);
     916          14 :     return result;
     917             : }

Generated by: LCOV version 1.14