LCOV - code coverage report
Current view: top level - src/include/utils - pgstat_internal.h (source / functions) Coverage Total Hit
Test: PostgreSQL 19devel Lines: 97.6 % 42 41
Test Date: 2026-05-06 12:16:27 Functions: 100.0 % 11 11
Legend: Lines:     hit not hit

            Line data    Source code
       1              : /* ----------
       2              :  * pgstat_internal.h
       3              :  *
       4              :  * Definitions for the PostgreSQL cumulative statistics system that should
       5              :  * only be needed by files implementing statistics support (rather than ones
       6              :  * reporting / querying stats).
       7              :  *
       8              :  * Copyright (c) 2001-2026, PostgreSQL Global Development Group
       9              :  *
      10              :  * src/include/utils/pgstat_internal.h
      11              :  * ----------
      12              :  */
      13              : #ifndef PGSTAT_INTERNAL_H
      14              : #define PGSTAT_INTERNAL_H
      15              : 
      16              : 
      17              : #include "common/hashfn_unstable.h"
      18              : #include "lib/dshash.h"
      19              : #include "lib/ilist.h"
      20              : #include "pgstat.h"
      21              : #include "storage/lwlock.h"
      22              : #include "utils/dsa.h"
      23              : 
      24              : 
      25              : /*
      26              :  * Types related to shared memory storage of statistics.
      27              :  *
      28              :  * Per-object statistics are stored in the "shared stats" hashtable. That
      29              :  * table's entries (PgStatShared_HashEntry) contain a pointer to the actual stats
      30              :  * data for the object (the size of the stats data varies depending on the
      31              :  * kind of stats). The table is keyed by PgStat_HashKey.
      32              :  *
      33              :  * Once a backend has a reference to a shared stats entry, it increments the
      34              :  * entry's refcount. Even after stats data is dropped (e.g., due to a DROP
      35              :  * TABLE), the entry itself can only be deleted once all references have been
      36              :  * released.
      37              :  *
      38              :  * These refcounts, in combination with a backend local hashtable
      39              :  * (pgStatEntryRefHash, with entries pointing to PgStat_EntryRef) in front of
      40              :  * the shared hash table, mean that most stats work can happen without
      41              :  * touching the shared hash table, reducing contention.
      42              :  *
      43              :  * Once there are pending stats updates for a table, PgStat_EntryRef->pending
      44              :  * is allocated to contain a working space for as-of-yet-unapplied stats
      45              :  * updates. Once the stats are flushed, PgStat_EntryRef->pending is freed.
      46              :  *
      47              :  * Each stat kind in the shared hash table has a fixed member
      48              :  * PgStatShared_Common as the first element.
      49              :  */
      50              : 
      51              : /*
      52              :  * Struct for shared statistics hash entry key.
      53              :  *
      54              :  * NB: We assume that this struct contains no padding (enforced by a static
      55              :  * assertion below).  The 8 bytes allocated for the object ID are enough to
      56              :  * keep hash keys unique, hence adding new fields is not recommended.
      57              :  */
      58              : typedef struct PgStat_HashKey
      59              : {
      60              :     PgStat_Kind kind;           /* statistics entry kind */
      61              :     Oid         dboid;          /* database ID. InvalidOid for shared objects. */
      62              :     uint64      objid;          /* object ID (table, function, etc.), or
      63              :                                  * identifier. */
      64              : } PgStat_HashKey;
      65              : 
      66              : /*
      67              :  * Tracks whether the stats file is being read, written or discarded; passed
      68              :  * to the PgStat_KindInfo->finish callback.
      69              :  *
      70              :  * These states allow plugins that create auxiliary data files to determine
      71              :  * the current operation and perform any necessary file cleanup.
      72              :  */
      73              : typedef enum PgStat_StatsFileOp
      74              : {
      75              :     STATS_WRITE,                /* stats file is being written */
      76              :     STATS_READ,                 /* stats file is being read */
      77              :     STATS_DISCARD,              /* stats file is being discarded */
      78              : } PgStat_StatsFileOp;
      79              : 
      80              : /*
      81              :  * PgStat_HashKey should not have any padding.  Checking that the structure
      82              :  * size matches the sum of its field sizes is a simple enough way to enforce
      83              :  * this policy at compile time.
      84              :  */
      85              : StaticAssertDecl((sizeof(PgStat_Kind) + sizeof(uint64) + sizeof(Oid)) ==
      86              :                  sizeof(PgStat_HashKey),
      87              :                  "PgStat_HashKey should have no padding");
      88              : 
      89              : /*
      90              :  * Shared statistics hash entry. Doesn't itself contain any stats, but points
      91              :  * to them (with ->body). That allows the stats entries themselves to be of
      92              :  * variable size.
      93              :  */
      94              : typedef struct PgStatShared_HashEntry
      95              : {
      96              :     PgStat_HashKey key;         /* hash key */
      97              : 
      98              :     /*
      99              :      * If dropped is set, backends need to release their references so that
     100              :      * the memory for the entry can be freed. No new references may be made
     101              :      * once marked as dropped.
     102              :      */
     103              :     bool        dropped;
     104              : 
     105              :     /*
     106              :      * Refcount managing lifetime of the entry itself (as opposed to the
     107              :      * dshash entry pointing to it). The stats lifetime has to be separate
     108              :      * from the hash table entry lifetime because we allow backends to point
     109              :      * to a stats entry without holding a hash table lock (and some other
     110              :      * reasons).
     111              :      *
     112              :      * As long as the entry is not dropped, 1 is added to the refcount
     113              :      * representing that the entry should not be dropped. In addition, each
     114              :      * backend that has a reference to the entry needs to keep the refcount
     115              :      * incremented for as long as it holds that reference.
     116              :      *
     117              :      * May only be incremented / decremented while holding at least a shared
     118              :      * lock on the dshash partition containing the entry. It needs to be an
     119              :      * atomic variable because multiple backends can increment the refcount
     120              :      * with just a shared lock.
     121              :      *
     122              :      * When the refcount reaches 0 the entry needs to be freed.
     123              :      */
     124              :     pg_atomic_uint32 refcount;
     125              : 
     126              :     /*
     127              :      * Counter tracking the number of times the entry has been reused.
     128              :      *
     129              :      * Set to 0 when the entry is created, and incremented by one each time
     130              :      * the shared entry is reinitialized with pgstat_reinit_entry().
     131              :      *
     132              :      * May only be incremented / decremented while holding at least a shared
     133              :      * lock on the dshash partition containing the entry. Like refcount, it
     134              :      * needs to be an atomic variable because multiple backends can increment
     135              :      * the generation with just a shared lock.
     136              :      */
     137              :     pg_atomic_uint32 generation;
     138              : 
     139              :     /*
     140              :      * Pointer to shared stats. The stats entry always starts with
     141              :      * PgStatShared_Common, embedded in a larger struct containing the
     142              :      * PgStat_Kind specific stats fields.
     143              :      */
     144              :     dsa_pointer body;
     145              : } PgStatShared_HashEntry;
     146              : 
     147              : /*
     148              :  * Common header of variable-amount PgStatShared_* structs (first member).
     149              :  */
     150              : typedef struct PgStatShared_Common
     151              : {
     152              :     uint32      magic;          /* just a validity cross-check */
     153              :     /* lock protecting stats contents (i.e. data following the header) */
     154              :     LWLock      lock;
     155              : } PgStatShared_Common;
     156              : 
     157              : /*
     158              :  * A backend local reference to a shared stats entry. As long as at least one
     159              :  * such reference exists, the shared stats entry will not be released.
     160              :  *
     161              :  * If there are pending stats updates for the shared stats, they are stored
     162              :  * in ->pending.
     163              :  */
     164              : typedef struct PgStat_EntryRef
     165              : {
     166              :     /*
     167              :      * Pointer to the PgStatShared_HashEntry entry in the shared stats
     168              :      * hashtable.
     169              :      */
     170              :     PgStatShared_HashEntry *shared_entry;
     171              : 
     172              :     /*
     173              :      * Pointer to the stats data (i.e. PgStatShared_HashEntry->body), resolved
     174              :      * as a local pointer, to avoid repeated dsa_get_address() calls.
     175              :      */
     176              :     PgStatShared_Common *shared_stats;
     177              : 
     178              :     /*
     179              :      * Local copy of PgStatShared_HashEntry->generation, recording the
     180              :      * "generation" (number of times reused) of the shared entry retrieved.
     181              :      */
     182              :     uint32      generation;
     183              : 
     184              :     /*
     185              :      * Pending statistics data that will need to be flushed to shared memory
     186              :      * stats eventually. Each stats kind utilizing pending data defines what
     187              :      * format its pending data has and needs to provide a
     188              :      * PgStat_KindInfo->flush_pending_cb callback to merge pending entries
     189              :      * into the shared stats hash table.
     190              :      */
     191              :     void       *pending;
     192              :     dlist_node  pending_node;   /* membership in pgStatPending list */
     193              : } PgStat_EntryRef;
     194              : 
     195              : 
     196              : /*
     197              :  * Some stats changes are transactional. To maintain those, a stack of
     198              :  * PgStat_SubXactStatus entries is maintained, which contain data pertaining
     199              :  * to the current transaction and its active subtransactions.
     200              :  */
     201              : typedef struct PgStat_SubXactStatus
     202              : {
     203              :     int         nest_level;     /* subtransaction nest level */
     204              : 
     205              :     struct PgStat_SubXactStatus *prev;  /* higher-level subxact if any */
     206              : 
     207              :     /*
     208              :      * Statistics for transactionally dropped objects need to be
     209              :      * transactionally dropped as well. Collect the stats dropped in the
     210              :      * current (sub-)transaction and only execute the stats drop once we know
     211              :      * whether the transaction commits or aborts. To handle replicas and
     212              :      * crashes, stats drops are included in commit / abort records.
     213              :      */
     214              :     dclist_head pending_drops;
     215              : 
     216              :     /*
     217              :      * Tuple insertion/deletion counts for an open transaction can't be
     218              :      * propagated into PgStat_TableStatus counters until we know if it is
     219              :      * going to commit or abort.  Hence, we keep these counts in per-subxact
     220              :      * structs that live in TopTransactionContext.  This data structure is
     221              :      * designed on the assumption that subxacts won't usually modify very many
     222              :      * tables.
     223              :      */
     224              :     PgStat_TableXactStatus *first;  /* head of list for this subxact */
     225              : } PgStat_SubXactStatus;
     226              : 
     227              : 
     228              : /*
     229              :  * Metadata for a specific kind of statistics.
     230              :  */
     231              : typedef struct PgStat_KindInfo
     232              : {
     233              :     /*
     234              :      * Do a fixed number of stats objects exist for this kind of stats (e.g.
     235              :      * bgwriter stats) or not (e.g. tables).
     236              :      */
     237              :     bool        fixed_amount:1;
     238              : 
     239              :     /*
     240              :      * Can stats of this kind be accessed from another database? Determines
     241              :      * whether a stats object gets included in stats snapshots.
     242              :      */
     243              :     bool        accessed_across_databases:1;
     244              : 
     245              :     /* Should stats be written to the on-disk stats file? */
     246              :     bool        write_to_file:1;
     247              : 
     248              :     /*
     249              :      * Should the number of entries be tracked?  For variable-numbered stats;
     250              :      * if set, this kind's PgStat_ShmemControl.entry_counts slot is updated.
     251              :      */
     252              :     bool        track_entry_count:1;
     253              : 
     254              :     /*
     255              :      * The size of an entry in the shared stats hash table (pointed to by
     256              :      * PgStatShared_HashEntry->body).  For fixed-numbered statistics, this is
     257              :      * the size of an entry in PgStat_ShmemControl->custom_data.
     258              :      */
     259              :     uint32      shared_size;
     260              : 
     261              :     /*
     262              :      * The offset of the statistics struct in the cached statistics snapshot
     263              :      * PgStat_Snapshot, for fixed-numbered statistics.
     264              :      */
     265              :     uint32      snapshot_ctl_off;
     266              : 
     267              :     /*
     268              :      * The offset of the statistics struct in the containing shared memory
     269              :      * control structure PgStat_ShmemControl, for fixed-numbered statistics.
     270              :      */
     271              :     uint32      shared_ctl_off;
     272              : 
     273              :     /*
     274              :      * The offset/size of statistics inside the shared stats entry. Used when
     275              :      * [de-]serializing statistics to / from disk respectively. Separate from
     276              :      * shared_size because [de-]serialization may not include in-memory state
     277              :      * like lwlocks.
     278              :      */
     279              :     uint32      shared_data_off;
     280              :     uint32      shared_data_len;
     281              : 
     282              :     /*
     283              :      * The size of the pending data for this kind. E.g. how large
     284              :      * PgStat_EntryRef->pending is. Used for allocations.
     285              :      *
     286              :      * 0 signals that an entry of this kind should never have a pending entry.
     287              :      */
     288              :     uint32      pending_size;
     289              : 
     290              :     /*
     291              :      * Perform custom actions when initializing a backend (standalone or under
     292              :      * postmaster). Optional.
     293              :      */
     294              :     void        (*init_backend_cb) (void);
     295              : 
     296              :     /*
     297              :      * For variable-numbered stats: flush pending stats. Required if pending
     298              :      * data is used. See flush_static_cb when dealing with stats data that
     299              :      * cannot use PgStat_EntryRef->pending.
     300              :      */
     301              :     bool        (*flush_pending_cb) (PgStat_EntryRef *sr, bool nowait);
     302              : 
     303              :     /*
     304              :      * For variable-numbered stats: delete pending stats. Optional.
     305              :      */
     306              :     void        (*delete_pending_cb) (PgStat_EntryRef *sr);
     307              : 
     308              :     /*
     309              :      * For variable-numbered stats: reset the reset timestamp. Optional.
     310              :      */
     311              :     void        (*reset_timestamp_cb) (PgStatShared_Common *header, TimestampTz ts);
     312              : 
     313              :     /*
     314              :      * For variable-numbered stats. Optional.
     315              :      */
     316              :     void        (*to_serialized_name) (const PgStat_HashKey *key,
     317              :                                        const PgStatShared_Common *header, NameData *name);
     318              :     bool        (*from_serialized_name) (const NameData *name, PgStat_HashKey *key);
     319              : 
     320              :     /*
     321              :      * For variable-numbered stats: read or write additional data related to
     322              :      * an entry, in the stats file or optionally in a different file.
     323              :      * Optional.
     324              :      *
     325              :      * to_serialized_data: write auxiliary data for an entry.
     326              :      *
     327              :      * from_serialized_data: read auxiliary data for an entry.  Returns true
     328              :      * on success, false on read error.
     329              :      *
     330              :      * "statfile" is a pointer to the on-disk stats file, named
     331              :      * PGSTAT_STAT_PERMANENT_FILENAME.  "key" is the hash key of the entry
     332              :      * just written or read.  "header" is a pointer to the stats data; it may
     333              :      * be modified only in from_serialized_data to reconstruct an entry.
     334              :      */
     335              :     void        (*to_serialized_data) (const PgStat_HashKey *key,
     336              :                                        const PgStatShared_Common *header,
     337              :                                        FILE *statfile);
     338              :     bool        (*from_serialized_data) (const PgStat_HashKey *key,
     339              :                                          PgStatShared_Common *header,
     340              :                                          FILE *statfile);
     341              : 
     342              :     /*
     343              :      * For fixed-numbered or variable-numbered statistics.
     344              :      *
     345              :      * Perform custom actions when done processing the on-disk stats file
     346              :      * after all the stats entries have been processed.  Optional.
     347              :      *
     348              :      * "status" tracks the operation done for the on-disk stats file (read,
     349              :      * write, discard).
     350              :      */
     351              :     void        (*finish) (PgStat_StatsFileOp status);
     352              : 
     353              :     /*
     354              :      * For fixed-numbered statistics: Initialize shared memory state.
     355              :      *
     356              :      * "stats" is the pointer to the allocated shared memory area.
     357              :      */
     358              :     void        (*init_shmem_cb) (void *stats);
     359              : 
     360              :     /*
     361              :      * For fixed-numbered or variable-numbered statistics: Flush pending stats
     362              :      * entries, for stats kinds that do not use PgStat_EntryRef->pending.
     363              :      *
     364              :      * Returns true if some of the stats could not be flushed, due to lock
     365              :      * contention for example. Optional.
     366              :      *
     367              :      * "pgstat_report_fixed" needs to be set to trigger the flush of pending
     368              :      * stats.
     369              :      */
     370              :     bool        (*flush_static_cb) (bool nowait);
     371              : 
     372              :     /*
     373              :      * For fixed-numbered statistics: Reset All.
     374              :      */
     375              :     void        (*reset_all_cb) (TimestampTz ts);
     376              : 
     377              :     /*
     378              :      * For fixed-numbered statistics: Build snapshot for entry.
     379              :      */
     380              :     void        (*snapshot_cb) (void);
     381              : 
     382              :     /* name of the kind of stats */
     383              :     const char *const name;
     384              : } PgStat_KindInfo;
     385              : 
     386              : 
     387              : /*
     388              :  * List of SLRU names that we keep stats for.  There is no central registry of
     389              :  * SLRUs, so we use this fixed list instead.  The "other" entry is used for
     390              :  * all SLRUs without an explicit entry (e.g. SLRUs in extensions).
     391              :  *
     392              :  * This is only defined here so that SLRU_NUM_ELEMENTS is known for later type
     393              :  * definitions.
     394              :  */
     395              : static const char *const slru_names[] = {
     396              :     "commit_timestamp",
     397              :     "multixact_member",
     398              :     "multixact_offset",
     399              :     "notify",
     400              :     "serializable",
     401              :     "subtransaction",
     402              :     "transaction",
     403              :     "other"                       /* has to be last */
     404              : };
     405              : 
     406              : #define SLRU_NUM_ELEMENTS   lengthof(slru_names)    /* sizes PgStatShared_SLRU.stats */
     407              : 
     408              : 
     409              : /* ----------
     410              :  * Types and definitions for different kinds of fixed-amount stats.
     411              :  *
     412              :  * Single-writer stats use the changecount mechanism to achieve low-overhead
     413              :  * writes - they're obviously more performance critical than reads. Check the
     414              :  * definition of struct PgBackendStatus for some explanation of the
     415              :  * changecount mechanism.
     416              :  *
     417              :  * Because the obvious implementation of resetting single-writer stats isn't
     418              :  * compatible with that (another backend needs to write), we don't scribble on
     419              :  * shared stats while resetting. Instead, just record the current counter
     420              :  * values in a copy of the stats data, which is protected by ->lock. See
     421              :  * pgstat_fetch_stat_(archiver|bgwriter|checkpointer) for the reader side.
     422              :  *
     423              :  * The only exception to that is the stat_reset_timestamp in these structs,
     424              :  * which is protected by ->lock, because it has to be written by another
     425              :  * backend while resetting.
     426              :  * ----------
     427              :  */
     428              : 
     429              : typedef struct PgStatShared_Archiver
     430              : {
     431              :     /* lock protects ->reset_offset as well as stats->stat_reset_timestamp */
     432              :     LWLock      lock;
     433              :     uint32      changecount;    /* changecount for single-writer ->stats */
     434              :     PgStat_ArchiverStats stats;
     435              :     PgStat_ArchiverStats reset_offset;  /* counter values recorded at reset */
     436              : } PgStatShared_Archiver;
     437              : 
     438              : typedef struct PgStatShared_BgWriter
     439              : {
     440              :     /* lock protects ->reset_offset as well as stats->stat_reset_timestamp */
     441              :     LWLock      lock;
     442              :     uint32      changecount;    /* changecount for single-writer ->stats */
     443              :     PgStat_BgWriterStats stats;
     444              :     PgStat_BgWriterStats reset_offset;  /* counter values recorded at reset */
     445              : } PgStatShared_BgWriter;
     446              : 
     447              : typedef struct PgStatShared_Checkpointer
     448              : {
     449              :     /* lock protects ->reset_offset as well as stats->stat_reset_timestamp */
     450              :     LWLock      lock;
     451              :     uint32      changecount;    /* changecount for single-writer ->stats */
     452              :     PgStat_CheckpointerStats stats;
     453              :     PgStat_CheckpointerStats reset_offset;  /* counter values recorded at reset */
     454              : } PgStatShared_Checkpointer;
     455              : 
     456              : /* Shared-memory ready PgStat_IO: the stats plus the locks protecting them */
     457              : typedef struct PgStatShared_IO
     458              : {
     459              :     /*
     460              :      * locks[i] protects stats.stats[i]. locks[0] also protects
     461              :      * stats.stat_reset_timestamp.
     462              :      */
     463              :     LWLock      locks[BACKEND_NUM_TYPES];
     464              :     PgStat_IO   stats;
     465              : } PgStatShared_IO;
     466              : 
     467              : typedef struct PgStatShared_Lock
     468              : {
     469              :     /* lock protects ->stats */
     470              :     LWLock      lock;
     471              :     PgStat_Lock stats;          /* stats data, protected by ->lock */
     472              : } PgStatShared_Lock;
     473              : 
     474              : typedef struct PgStatShared_SLRU
     475              : {
     476              :     /* lock protects ->stats */
     477              :     LWLock      lock;
     478              :     PgStat_SLRUStats stats[SLRU_NUM_ELEMENTS];  /* one per slru_names[] entry */
     479              : } PgStatShared_SLRU;
     480              : 
     481              : typedef struct PgStatShared_Wal
     482              : {
     483              :     /* lock protects ->stats */
     484              :     LWLock      lock;
     485              :     PgStat_WalStats stats;      /* stats data, protected by ->lock */
     486              : } PgStatShared_Wal;
     487              : 
     488              : 
     489              : 
     490              : /* ----------
     491              :  * Types and definitions for different kinds of variable-amount stats.
     492              :  *
     493              :  * Each struct has to start with PgStatShared_Common, containing information
     494              :  * common across the different types of stats. Kind-specific data follows.
     495              :  * ----------
     496              :  */
     497              : 
     498              : typedef struct PgStatShared_Database
     499              : {
     500              :     PgStatShared_Common header; /* common header; has to be first */
     501              :     PgStat_StatDBEntry stats;   /* kind-specific data */
     502              : } PgStatShared_Database;
     503              : 
     504              : typedef struct PgStatShared_Relation
     505              : {
     506              :     PgStatShared_Common header; /* common header; has to be first */
     507              :     PgStat_StatTabEntry stats;  /* kind-specific data */
     508              : } PgStatShared_Relation;
     509              : 
     510              : typedef struct PgStatShared_Function
     511              : {
     512              :     PgStatShared_Common header; /* common header; has to be first */
     513              :     PgStat_StatFuncEntry stats; /* kind-specific data */
     514              : } PgStatShared_Function;
     515              : 
     516              : typedef struct PgStatShared_Subscription
     517              : {
     518              :     PgStatShared_Common header; /* common header; has to be first */
     519              :     PgStat_StatSubEntry stats;  /* kind-specific data */
     520              : } PgStatShared_Subscription;
     521              : 
     522              : typedef struct PgStatShared_ReplSlot
     523              : {
     524              :     PgStatShared_Common header; /* common header; has to be first */
     525              :     PgStat_StatReplSlotEntry stats; /* kind-specific data */
     526              : } PgStatShared_ReplSlot;
     527              : 
     528              : typedef struct PgStatShared_Backend
     529              : {
     530              :     PgStatShared_Common header; /* common header; has to be first */
     531              :     PgStat_Backend stats;       /* kind-specific data */
     532              : } PgStatShared_Backend;
     533              : 
     534              : /*
     535              :  * Central shared memory entry for the cumulative stats system.
     536              :  *
     537              :  * Fixed amount stats, the dynamic shared memory hash table for
     538              :  * non-fixed-amount stats, as well as remaining bits and pieces are all
     539              :  * reached from here.
     540              :  */
     541              : typedef struct PgStat_ShmemControl
     542              : {
     543              :     void       *raw_dsa_area;   /* NOTE(review): untyped pointer, presumably the memory backing the stats DSA area -- confirm in pgstat_shmem.c */
     544              : 
     545              :     /*
     546              :      * Stats for variable-numbered objects are kept in this shared hash table.
     547              :      * See comment above PgStat_Kind for details.
     548              :      */
     549              :     dshash_table_handle hash_handle;    /* handle of the shared stats hash table */
     550              : 
     551              :     /* Has the stats system already been shut down? Just a debugging check. */
     552              :     bool        is_shutdown;
     553              : 
     554              :     /*
     555              :      * Whenever statistics for dropped objects could not be freed - because
     556              :      * backends still have references - the dropping backend calls
     557              :      * pgstat_request_entry_refs_gc() incrementing this counter. Eventually
     558              :      * that causes backends to run pgstat_gc_entry_refs(), allowing memory to
     559              :      * be reclaimed.
     560              :      */
     561              :     pg_atomic_uint64 gc_request_count;
     562              : 
     563              :     /*
     564              :      * Counters for the number of entries associated with a single stats kind
     565              :      * that uses variable-numbered objects stored in the shared hash table.
     566              :      * These counters can be enabled on a per-kind basis, when
     567              :      * track_entry_count is set.  This counter is incremented each time a new
     568              :      * entry is created (not reused) in the shared hash table, and is
     569              :      * decremented each time an entry is freed from the shared hash table.
     570              :      */
     571              :     pg_atomic_uint64 entry_counts[PGSTAT_KIND_MAX]; /* read by pgstat_get_entry_count(), which uses slot (kind - 1) */
     572              : 
     573              :     /*
     574              :      * Stats data for fixed-numbered objects.
     575              :      */
     576              :     PgStatShared_Archiver archiver;
     577              :     PgStatShared_BgWriter bgwriter;
     578              :     PgStatShared_Checkpointer checkpointer;
     579              :     PgStatShared_IO io;
     580              :     PgStatShared_Lock lock;
     581              :     PgStatShared_SLRU slru;
     582              :     PgStatShared_Wal wal;
     583              : 
     584              :     /*
     585              :      * Custom stats data with fixed-numbered objects, indexed by (PgStat_Kind
     586              :      * - PGSTAT_KIND_CUSTOM_MIN).
     587              :      */
     588              :     void       *custom_data[PGSTAT_KIND_CUSTOM_SIZE];   /* returned by pgstat_get_custom_shmem_data() */
     589              : 
     590              : } PgStat_ShmemControl;
     591              : 
     592              : 
     593              : /*
     594              :  * Cached statistics snapshot.  One instance is embedded in PgStat_LocalState.
     595              :  */
     596              : typedef struct PgStat_Snapshot
     597              : {
     598              :     PgStat_FetchConsistency mode;   /* consistency mode this snapshot was built under */
     599              : 
     600              :     /* time at which snapshot was taken */
     601              :     TimestampTz snapshot_timestamp;
     602              : 
     603              :     bool        fixed_valid[PGSTAT_KIND_BUILTIN_SIZE];  /* NOTE(review): presumably per-kind validity of the builtin members below; index mapping not visible here -- confirm in pgstat.c */
     604              : 
     605              :     PgStat_ArchiverStats archiver;
     606              : 
     607              :     PgStat_BgWriterStats bgwriter;
     608              : 
     609              :     PgStat_CheckpointerStats checkpointer;
     610              : 
     611              :     PgStat_IO   io;
     612              : 
     613              :     PgStat_Lock lock;
     614              : 
     615              :     PgStat_SLRUStats slru[SLRU_NUM_ELEMENTS];
     616              : 
     617              :     PgStat_WalStats wal;
     618              : 
     619              :     /*
     620              :      * Data in snapshot for custom fixed-numbered statistics, indexed by
     621              :      * (PgStat_Kind - PGSTAT_KIND_CUSTOM_MIN).  Each entry is allocated in
     622              :      * TopMemoryContext, for a size of PgStat_KindInfo->shared_data_len.
     623              :      */
     624              :     bool        custom_valid[PGSTAT_KIND_CUSTOM_SIZE];
     625              :     void       *custom_data[PGSTAT_KIND_CUSTOM_SIZE];   /* returned by pgstat_get_custom_snapshot_data() */
     626              : 
     627              :     /* to free snapshot in bulk */
     628              :     MemoryContext context;
     629              :     struct pgstat_snapshot_hash *stats; /* NOTE(review): presumably the hash of snapshotted variable-numbered entries -- confirm in pgstat.c */
     630              : } PgStat_Snapshot;
     631              : 
     632              : 
     633              : /*
     634              :  * Collection of backend-local stats state.  The single instance is the pgStatLocal variable declared further down in this header.
     635              :  */
     636              : typedef struct PgStat_LocalState
     637              : {
     638              :     PgStat_ShmemControl *shmem; /* shared control struct; dereferenced by the inline accessors in this header */
     639              :     dsa_area   *dsa;            /* NOTE(review): presumably this backend's attachment to the stats DSA area -- confirm in pgstat_shmem.c */
     640              :     dshash_table *shared_hash;  /* NOTE(review): presumably this backend's attachment to the shared stats hash -- confirm in pgstat_shmem.c */
     641              : 
     642              :     /* the current statistics snapshot */
     643              :     PgStat_Snapshot snapshot;
     644              : } PgStat_LocalState;
     645              : 
     646              : 
     647              : /*
     648              :  * Inline functions defined further below.  (pgstat_get_entry_count() is also defined below but has no forward declaration in this list.)
     649              :  */
     650              : 
     651              : static inline void pgstat_begin_changecount_write(uint32 *cc);
     652              : static inline void pgstat_end_changecount_write(uint32 *cc);
     653              : static inline uint32 pgstat_begin_changecount_read(uint32 *cc);
     654              : static inline bool pgstat_end_changecount_read(uint32 *cc, uint32 cc_before);   /* the definition names the second parameter before_cc */
     655              : 
     656              : static inline void pgstat_copy_changecounted_stats(void *dst, void *src, size_t len,
     657              :                                                    uint32 *cc);
     658              : 
     659              : static inline int pgstat_cmp_hash_key(const void *a, const void *b, size_t size, void *arg);
     660              : static inline uint32 pgstat_hash_hash_key(const void *d, size_t size, void *arg);
     661              : static inline size_t pgstat_get_entry_len(PgStat_Kind kind);
     662              : static inline void *pgstat_get_entry_data(PgStat_Kind kind, PgStatShared_Common *entry);
     663              : static inline void *pgstat_get_custom_shmem_data(PgStat_Kind kind);
     664              : static inline void *pgstat_get_custom_snapshot_data(PgStat_Kind kind);
     665              : 
     666              : 
     667              : /*
     668              :  * Functions in pgstat.c
     669              :  */
     670              : 
     671              : extern const PgStat_KindInfo *pgstat_get_kind_info(PgStat_Kind kind);   /* used by the inline accessors at the end of this header */
     672              : extern void pgstat_register_kind(PgStat_Kind kind,
     673              :                                  const PgStat_KindInfo *kind_info);
     674              : 
     675              : #ifdef USE_ASSERT_CHECKING
     676              : extern void pgstat_assert_is_up(void);
     677              : #else
     678              : #define pgstat_assert_is_up() ((void)true)  /* expands to a no-op expression when assertions are disabled */
     679              : #endif
     680              : 
     681              : extern void pgstat_delete_pending_entry(PgStat_EntryRef *entry_ref);
     682              : extern PgStat_EntryRef *pgstat_prep_pending_entry(PgStat_Kind kind, Oid dboid,
     683              :                                                   uint64 objid,
     684              :                                                   bool *created_entry);
     685              : extern PgStat_EntryRef *pgstat_fetch_pending_entry(PgStat_Kind kind,
     686              :                                                    Oid dboid, uint64 objid);
     687              : 
     688              : extern void *pgstat_fetch_entry(PgStat_Kind kind, Oid dboid, uint64 objid,
     689              :                                 bool *may_free);    /* NOTE(review): may_free presumably reports whether the caller may free the result -- confirm in pgstat.c */
     690              : extern void pgstat_snapshot_fixed(PgStat_Kind kind);
     691              : 
     692              : 
     693              : /*
     694              :  * Functions in pgstat_archiver.c (archiver is one of the fixed-numbered members of PgStat_ShmemControl)
     695              :  */
     696              : 
     697              : extern void pgstat_archiver_init_shmem_cb(void *stats);
     698              : extern void pgstat_archiver_reset_all_cb(TimestampTz ts);
     699              : extern void pgstat_archiver_snapshot_cb(void);
     700              : 
     701              : /*
     702              :  * Functions in pgstat_backend.c
     703              :  */
     704              : 
     705              : /* flags for pgstat_flush_backend(); bit values, combinable with | */
     706              : #define PGSTAT_BACKEND_FLUSH_IO     (1 << 0)  /* Flush I/O statistics */
     707              : #define PGSTAT_BACKEND_FLUSH_WAL   (1 << 1) /* Flush WAL statistics */
     708              : #define PGSTAT_BACKEND_FLUSH_ALL   (PGSTAT_BACKEND_FLUSH_IO | PGSTAT_BACKEND_FLUSH_WAL)    /* both of the above */
     709              : 
     710              : extern bool pgstat_flush_backend(bool nowait, uint32 flags);    /* flags: PGSTAT_BACKEND_FLUSH_* */
     711              : extern bool pgstat_backend_flush_cb(bool nowait);
     712              : extern void pgstat_backend_reset_timestamp_cb(PgStatShared_Common *header,
     713              :                                               TimestampTz ts);
     714              : 
     715              : /*
     716              :  * Functions in pgstat_bgwriter.c (bgwriter is one of the fixed-numbered members of PgStat_ShmemControl)
     717              :  */
     718              : 
     719              : extern void pgstat_bgwriter_init_shmem_cb(void *stats);
     720              : extern void pgstat_bgwriter_reset_all_cb(TimestampTz ts);
     721              : extern void pgstat_bgwriter_snapshot_cb(void);
     722              : 
     723              : 
     724              : /*
     725              :  * Functions in pgstat_checkpointer.c (checkpointer is one of the fixed-numbered members of PgStat_ShmemControl)
     726              :  */
     727              : 
     728              : extern void pgstat_checkpointer_init_shmem_cb(void *stats);
     729              : extern void pgstat_checkpointer_reset_all_cb(TimestampTz ts);
     730              : extern void pgstat_checkpointer_snapshot_cb(void);
     731              : 
     732              : 
     733              : /*
     734              :  * Functions in pgstat_database.c
     735              :  */
     736              : 
     737              : extern void pgstat_report_disconnect(Oid dboid);
     738              : extern void pgstat_update_dbstats(TimestampTz ts);
     739              : extern void AtEOXact_PgStat_Database(bool isCommit, bool parallel);
     740              : 
     741              : extern PgStat_StatDBEntry *pgstat_prep_database_pending(Oid dboid);
     742              : extern void pgstat_reset_database_timestamp(Oid dboid, TimestampTz ts);
     743              : extern bool pgstat_database_flush_cb(PgStat_EntryRef *entry_ref, bool nowait);  /* per-entry flush: operates on one entry reference */
     744              : extern void pgstat_database_reset_timestamp_cb(PgStatShared_Common *header, TimestampTz ts);
     745              : 
     746              : 
     747              : /*
     748              :  * Functions in pgstat_function.c
     749              :  */
     750              : 
     751              : extern bool pgstat_function_flush_cb(PgStat_EntryRef *entry_ref, bool nowait);  /* per-entry flush: operates on one entry reference */
     752              : extern void pgstat_function_reset_timestamp_cb(PgStatShared_Common *header, TimestampTz ts);
     753              : 
     754              : 
     755              : /*
     756              :  * Functions in pgstat_io.c (io is one of the fixed-numbered members of PgStat_ShmemControl)
     757              :  */
     758              : 
     759              : extern void pgstat_flush_io(bool nowait);
     760              : 
     761              : extern bool pgstat_io_flush_cb(bool nowait);    /* no entry reference argument, unlike the per-entry *_flush_cb functions */
     762              : extern void pgstat_io_init_shmem_cb(void *stats);
     763              : extern void pgstat_io_reset_all_cb(TimestampTz ts);
     764              : extern void pgstat_io_snapshot_cb(void);
     765              : 
     766              : /*
     767              :  * Functions in pgstat_lock.c (lock is one of the fixed-numbered members of PgStat_ShmemControl)
     768              :  */
     769              : 
     770              : extern bool pgstat_lock_flush_cb(bool nowait);
     771              : extern void pgstat_lock_init_shmem_cb(void *stats);
     772              : extern void pgstat_lock_reset_all_cb(TimestampTz ts);
     773              : extern void pgstat_lock_snapshot_cb(void);
     774              : 
     775              : /*
     776              :  * Functions in pgstat_relation.c.  The first four take a PgStat_SubXactStatus pointer; pgstat_get_xact_stack_level() (pgstat_xact.c) returns that type.
     777              :  */
     778              : 
     779              : extern void AtEOXact_PgStat_Relations(PgStat_SubXactStatus *xact_state, bool isCommit);
     780              : extern void AtEOSubXact_PgStat_Relations(PgStat_SubXactStatus *xact_state, bool isCommit, int nestDepth);
     781              : extern void AtPrepare_PgStat_Relations(PgStat_SubXactStatus *xact_state);
     782              : extern void PostPrepare_PgStat_Relations(PgStat_SubXactStatus *xact_state);
     783              : 
     784              : extern bool pgstat_relation_flush_cb(PgStat_EntryRef *entry_ref, bool nowait);  /* per-entry flush: operates on one entry reference */
     785              : extern void pgstat_relation_delete_pending_cb(PgStat_EntryRef *entry_ref);
     786              : extern void pgstat_relation_reset_timestamp_cb(PgStatShared_Common *header, TimestampTz ts);
     787              : 
     788              : 
     789              : /*
     790              :  * Functions in pgstat_replslot.c
     791              :  */
     792              : 
     793              : extern void pgstat_replslot_reset_timestamp_cb(PgStatShared_Common *header, TimestampTz ts);
     794              : extern void pgstat_replslot_to_serialized_name_cb(const PgStat_HashKey *key, const PgStatShared_Common *header, NameData *name);    /* writes to *name; key and header are const inputs */
     795              : extern bool pgstat_replslot_from_serialized_name_cb(const NameData *name, PgStat_HashKey *key); /* writes to *key; NOTE(review): presumably returns false when the name cannot be mapped -- confirm */
     796              : 
     797              : 
     798              : /*
     799              :  * Functions in pgstat_shmem.c
     800              :  */
     801              : 
     802              : extern void pgstat_attach_shmem(void);
     803              : extern void pgstat_detach_shmem(void);
     804              : 
     805              : extern PgStat_EntryRef *pgstat_get_entry_ref(PgStat_Kind kind, Oid dboid, uint64 objid,
     806              :                                              bool create, bool *created_entry);
     807              : extern bool pgstat_lock_entry(PgStat_EntryRef *entry_ref, bool nowait);    /* NOTE(review): presumably returns false if nowait is set and the lock is unavailable -- confirm */
     808              : extern bool pgstat_lock_entry_shared(PgStat_EntryRef *entry_ref, bool nowait);
     809              : extern void pgstat_unlock_entry(PgStat_EntryRef *entry_ref);
     810              : extern bool pgstat_drop_entry(PgStat_Kind kind, Oid dboid, uint64 objid);
     811              : extern void pgstat_drop_all_entries(void);
     812              : extern void pgstat_drop_matching_entries(bool (*do_drop) (PgStatShared_HashEntry *, Datum),
     813              :                                          Datum match_data);    /* do_drop: caller-supplied predicate taking a hash entry and a Datum (presumably match_data) */
     814              : extern PgStat_EntryRef *pgstat_get_entry_ref_locked(PgStat_Kind kind, Oid dboid, uint64 objid,
     815              :                                                     bool nowait);
     816              : extern void pgstat_reset_entry(PgStat_Kind kind, Oid dboid, uint64 objid, TimestampTz ts);
     817              : extern void pgstat_reset_entries_of_kind(PgStat_Kind kind, TimestampTz ts);
     818              : extern void pgstat_reset_matching_entries(bool (*do_reset) (PgStatShared_HashEntry *, Datum),
     819              :                                           Datum match_data,
     820              :                                           TimestampTz ts);  /* do_reset: same predicate shape as do_drop above */
     821              : 
     822              : extern void pgstat_request_entry_refs_gc(void);    /* see the gc_request_count comment in PgStat_ShmemControl */
     823              : extern PgStatShared_Common *pgstat_init_entry(PgStat_Kind kind,
     824              :                                               PgStatShared_HashEntry *shhashent);
     825              : 
     826              : 
     827              : /*
     828              :  * Functions in pgstat_slru.c (slru is one of the fixed-numbered members of PgStat_ShmemControl)
     829              :  */
     830              : 
     831              : extern bool pgstat_slru_flush_cb(bool nowait);
     832              : extern void pgstat_slru_init_shmem_cb(void *stats);
     833              : extern void pgstat_slru_reset_all_cb(TimestampTz ts);
     834              : extern void pgstat_slru_snapshot_cb(void);
     835              : 
     836              : 
     837              : /*
     838              :  * Functions in pgstat_wal.c (wal is one of the fixed-numbered members of PgStat_ShmemControl)
     839              :  */
     840              : 
     841              : extern void pgstat_wal_init_backend_cb(void);
     842              : extern bool pgstat_wal_flush_cb(bool nowait);
     843              : extern void pgstat_wal_init_shmem_cb(void *stats);
     844              : extern void pgstat_wal_reset_all_cb(TimestampTz ts);
     845              : extern void pgstat_wal_snapshot_cb(void);
     846              : 
     847              : 
     848              : /*
     849              :  * Functions in pgstat_subscription.c
     850              :  */
     851              : 
     852              : extern bool pgstat_subscription_flush_cb(PgStat_EntryRef *entry_ref, bool nowait);  /* per-entry flush: operates on one entry reference */
     853              : extern void pgstat_subscription_reset_timestamp_cb(PgStatShared_Common *header, TimestampTz ts);
     854              : 
     855              : 
     856              : /*
     857              :  * Functions in pgstat_xact.c
     858              :  */
     859              : 
     860              : extern PgStat_SubXactStatus *pgstat_get_xact_stack_level(int nest_level);
     861              : extern void pgstat_drop_transactional(PgStat_Kind kind, Oid dboid, uint64 objid);   /* NOTE(review): presumably the drop takes effect according to transaction outcome -- confirm in pgstat_xact.c */
     862              : extern void pgstat_create_transactional(PgStat_Kind kind, Oid dboid, uint64 objid);
     863              : 
     864              : 
     865              : /*
     866              :  * Variables in pgstat.c
     867              :  */
     868              : 
     869              : /*
     870              :  * Track if *any* pending fixed-numbered statistics should be flushed to
     871              :  * shared memory.
     872              :  *
     873              :  * This flag can be switched to true by fixed-numbered statistics to let
     874              :  * pgstat_report_stat() know if it needs to go through one round of
     875              :  * reports, calling flush_static_cb for each fixed-numbered statistics
     876              :  * kind.  When this flag is not set, pgstat_report_stat() is able to do
     877              :  * a fast exit, knowing that there are no pending fixed-numbered statistics.
     878              :  *
     879              :  * Statistics callbacks should never reset this flag; pgstat_report_stat()
     880              :  * is in charge of doing that.
     881              :  */
     882              : extern PGDLLIMPORT bool pgstat_report_fixed;
     883              : 
     884              : /* Backend-local stats state (shared control pointer plus the current snapshot, see PgStat_LocalState) */
     885              : extern PGDLLIMPORT PgStat_LocalState pgStatLocal;
     886              : 
     887              : /* Helper functions for reading and writing of on-disk stats file.  The _s macros pass sizeof(*ptr) as the length; ptr is expanded unparenthesized, so pass a simple pointer expression. */
     888              : extern void pgstat_write_chunk(FILE *fpout, void *ptr, size_t len);
     889              : extern bool pgstat_read_chunk(FILE *fpin, void *ptr, size_t len);
     890              : #define pgstat_read_chunk_s(fpin, ptr) pgstat_read_chunk(fpin, ptr, sizeof(*ptr))
     891              : #define pgstat_write_chunk_s(fpout, ptr) pgstat_write_chunk(fpout, ptr, sizeof(*ptr))
     892              : 
     893              : /*
     894              :  * Implementation of inline functions declared above.
     895              :  */
     896              : 
     897              : /*
     898              :  * Helpers for changecount manipulation. See comments around struct
     899              :  * PgBackendStatus for details.  pgstat_begin_changecount_write() opens a write: it enters a critical section and makes *cc odd.
     900              :  */
     901              : 
     902              : static inline void
     903        13923 : pgstat_begin_changecount_write(uint32 *cc)
     904              : {
     905              :     Assert((*cc & 1) == 0);     /* counter must be even, i.e. no write already open */
     906              : 
     907        13923 :     START_CRIT_SECTION();       /* closed by END_CRIT_SECTION() in pgstat_end_changecount_write() */
     908        13923 :     (*cc)++;                    /* now odd; pgstat_end_changecount_read() treats an odd starting value as "write in progress" */
     909        13923 :     pg_write_barrier();         /* keep the increment ordered before the data writes that follow */
     910        13923 : }
     911              : 
     912              : static inline void
     913        13923 : pgstat_end_changecount_write(uint32 *cc)   /* closes the write opened by pgstat_begin_changecount_write() */
     914              : {
     915              :     Assert((*cc & 1) == 1);     /* counter must be odd, i.e. a write is open */
     916              : 
     917        13923 :     pg_write_barrier();         /* keep the preceding data writes ordered before the increment */
     918              : 
     919        13923 :     (*cc)++;                    /* even again: write complete */
     920              : 
     921        13923 :     END_CRIT_SECTION();         /* pairs with START_CRIT_SECTION() in pgstat_begin_changecount_write() */
     922        13923 : }
     923              : 
     924              : static inline uint32
     925         3226 : pgstat_begin_changecount_read(uint32 *cc)  /* samples *cc before a read; pass the result to pgstat_end_changecount_read() */
     926              : {
     927         3226 :     uint32      before_cc = *cc;
     928              : 
     929         3226 :     CHECK_FOR_INTERRUPTS();     /* NOTE(review): presumably keeps the retry loop in pgstat_copy_changecounted_stats() interruptible -- confirm */
     930              : 
     931         3226 :     pg_read_barrier();          /* keep the counter read ordered before the data reads that follow */
     932              : 
     933         3226 :     return before_cc;
     934              : }
     935              : 
     936              : /*
     937              :  * Returns true if the read succeeded, false if it needs to be repeated.  before_cc is the value returned by pgstat_begin_changecount_read().
     938              :  */
     939              : static inline bool
     940         3226 : pgstat_end_changecount_read(uint32 *cc, uint32 before_cc)
     941              : {
     942              :     uint32      after_cc;
     943              : 
     944         3226 :     pg_read_barrier();          /* keep the preceding data reads ordered before re-reading the counter */
     945              : 
     946         3226 :     after_cc = *cc;
     947              : 
     948              :     /* was a write in progress when we started? (odd counter, see pgstat_begin_changecount_write()) */
     949         3226 :     if (before_cc & 1)
     950            0 :         return false;
     951              : 
     952              :     /* did writes start and complete while we read? If so the counter has changed and the read must be repeated. */
     953         3226 :     return before_cc == after_cc;
     954              : }
     955              : 
     956              : 
     957              : /*
     958              :  * helper function for PgStat_KindInfo->snapshot_cb and
     959              :  * PgStat_KindInfo->reset_all_cb callbacks.
     960              :  *
     961              :  * Copies out the specified memory area following change-count protocol: len bytes from src to dst, retried until cc shows no concurrent write.
     962              :  */
     963              : static inline void
     964         3226 : pgstat_copy_changecounted_stats(void *dst, void *src, size_t len,
     965              :                                 uint32 *cc)
     966              : {
     967              :     uint32      cc_before;
     968              : 
     969              :     do
     970              :     {
     971         3226 :         cc_before = pgstat_begin_changecount_read(cc);
     972              : 
     973         3226 :         memcpy(dst, src, len);  /* may copy a torn state; the loop condition detects that and retries */
     974              :     }
     975         3226 :     while (!pgstat_end_changecount_read(cc, cc_before));
     976         3226 : }
     977              : 
     978              : /* helpers for dshash / simplehash hashtables; this one compares two PgStat_HashKey values bytewise and returns the memcmp() result */
     979              : static inline int
     980      8177810 : pgstat_cmp_hash_key(const void *a, const void *b, size_t size, void *arg)
     981              : {
     982              :     Assert(size == sizeof(PgStat_HashKey) && arg == NULL);  /* size and arg are only checked, not otherwise used */
     983      8177810 :     return memcmp(a, b, sizeof(PgStat_HashKey));
     984              : }
     985              : 
     986              : static inline uint32
     987      9819914 : pgstat_hash_hash_key(const void *d, size_t size, void *arg)    /* hashes the size bytes at d with fasthash32(), seed 0 */
     988              : {
     989      9819914 :     const char *key = (const char *) d;
     990              : 
     991              :     Assert(size == sizeof(PgStat_HashKey) && arg == NULL);  /* only PgStat_HashKey-sized keys are expected; arg is unused */
     992      9819914 :     return fasthash32(key, size, 0);
     993              : }
     994              : 
     995              : /*
     996              :  * The length of the data portion of a shared memory stats entry (i.e. without
     997              :  * transient data such as refcounts, lwlocks, ...).  Taken from the kind's PgStat_KindInfo.
     998              :  */
     999              : static inline size_t
    1000       561814 : pgstat_get_entry_len(PgStat_Kind kind)
    1001              : {
    1002       561814 :     return pgstat_get_kind_info(kind)->shared_data_len;
    1003              : }
    1004              : 
    1005              : /*
    1006              :  * Returns a pointer to the data portion of a shared memory stats entry, i.e. entry plus the kind's shared_data_off bytes.
    1007              :  */
    1008              : static inline void *
    1009       813813 : pgstat_get_entry_data(PgStat_Kind kind, PgStatShared_Common *entry)
    1010              : {
    1011       813813 :     size_t      off = pgstat_get_kind_info(kind)->shared_data_off;
    1012              : 
    1013              :     Assert(off != 0 && off < PG_UINT32_MAX);    /* a zero offset would alias the common header itself */
    1014              : 
    1015       813813 :     return ((char *) (entry)) + off;    /* byte-wise pointer arithmetic */
    1016              : }
    1017              : 
    1018              : /*
    1019              :  * Returns the number of entries counted for a stats kind.  Only valid for kinds whose PgStat_KindInfo has track_entry_count set.
    1020              :  */
    1021              : static inline uint64
    1022              : pgstat_get_entry_count(PgStat_Kind kind)
    1023              : {
    1024              :     Assert(pgstat_get_kind_info(kind)->track_entry_count);
    1025              : 
    1026              :     return pg_atomic_read_u64(&pgStatLocal.shmem->entry_counts[kind - 1]);  /* slot is (kind - 1); the array has PGSTAT_KIND_MAX elements */
    1027              : }
    1028              : 
    1029              : /*
    1030              :  * Returns a pointer to the shared memory area of custom stats for
    1031              :  * fixed-numbered statistics.  kind must be a custom kind with fixed_amount set (both asserted).
    1032              :  */
    1033              : static inline void *
    1034           12 : pgstat_get_custom_shmem_data(PgStat_Kind kind)
    1035              : {
    1036           12 :     int         idx = kind - PGSTAT_KIND_CUSTOM_MIN;   /* custom_data[] is indexed relative to the first custom kind */
    1037              : 
    1038              :     Assert(pgstat_is_kind_custom(kind));
    1039              :     Assert(pgstat_get_kind_info(kind)->fixed_amount);
    1040              : 
    1041           12 :     return pgStatLocal.shmem->custom_data[idx];
    1042              : }
    1043              : 
    1044              : /*
    1045              :  * Returns a pointer to the portion of custom data for fixed-numbered
    1046              :  * statistics in the current snapshot.  kind must be a custom kind with fixed_amount set (both asserted).
    1047              :  */
    1048              : static inline void *
    1049            7 : pgstat_get_custom_snapshot_data(PgStat_Kind kind)
    1050              : {
    1051            7 :     int         idx = kind - PGSTAT_KIND_CUSTOM_MIN;   /* custom_data[] is indexed relative to the first custom kind */
    1052              : 
    1053              :     Assert(pgstat_is_kind_custom(kind));
    1054              :     Assert(pgstat_get_kind_info(kind)->fixed_amount);
    1055              : 
    1056            7 :     return pgStatLocal.snapshot.custom_data[idx];
    1057              : }
    1058              : 
    1059              : #endif                          /* PGSTAT_INTERNAL_H */
        

Generated by: LCOV version 2.0-1