LCOV - code coverage report
Current view: top level - src/include/storage - bufmgr.h (source / functions) Coverage Total Hit
Test: PostgreSQL 19devel Lines: 100.0 % 15 15
Test Date: 2026-03-04 15:14:37 Functions: 100.0 % 5 5
Legend: Lines:     hit not hit

            Line data    Source code
       1              : /*-------------------------------------------------------------------------
       2              :  *
       3              :  * bufmgr.h
       4              :  *    POSTGRES buffer manager definitions.
       5              :  *
       6              :  *
       7              :  * Portions Copyright (c) 1996-2026, PostgreSQL Global Development Group
       8              :  * Portions Copyright (c) 1994, Regents of the University of California
       9              :  *
      10              :  * src/include/storage/bufmgr.h
      11              :  *
      12              :  *-------------------------------------------------------------------------
      13              :  */
      14              : #ifndef BUFMGR_H
      15              : #define BUFMGR_H
      16              : 
      17              : #include "port/pg_iovec.h"
      18              : #include "storage/aio_types.h"
      19              : #include "storage/block.h"
      20              : #include "storage/buf.h"
      21              : #include "storage/bufpage.h"
      22              : #include "storage/relfilelocator.h"
      23              : #include "utils/relcache.h"
      24              : #include "utils/snapmgr.h"
      25              : 
      26              : typedef void *Block;
      27              : 
      28              : /*
      29              :  * Possible arguments for GetAccessStrategy().
      30              :  *
      31              :  * If adding a new BufferAccessStrategyType, also add a new IOContext so
      32              :  * IO statistics using this strategy are tracked.
      33              :  */
      34              : typedef enum BufferAccessStrategyType
      35              : {
      36              :     BAS_NORMAL,                 /* Normal random access */
      37              :     BAS_BULKREAD,               /* Large read-only scan (hint bit updates are
      38              :                                  * ok) */
      39              :     BAS_BULKWRITE,              /* Large multi-block write (e.g. COPY IN) */
      40              :     BAS_VACUUM,                 /* VACUUM */
      41              : } BufferAccessStrategyType;
      42              : 
      43              : /* Possible modes for ReadBufferExtended() */
      44              : typedef enum
      45              : {
      46              :     RBM_NORMAL,                 /* Normal read */
      47              :     RBM_ZERO_AND_LOCK,          /* Don't read from disk, caller will
      48              :                                  * initialize. Also locks the page. */
      49              :     RBM_ZERO_AND_CLEANUP_LOCK,  /* Like RBM_ZERO_AND_LOCK, but locks the page
      50              :                                  * in "cleanup" mode */
      51              :     RBM_ZERO_ON_ERROR,          /* Read, but return an all-zeros page on error */
      52              :     RBM_NORMAL_NO_LOG,          /* Don't log page as invalid during WAL
      53              :                                  * replay; otherwise same as RBM_NORMAL */
      54              : } ReadBufferMode;
      55              : 
      56              : /*
      57              :  * Type returned by PrefetchBuffer().
      58              :  */
      59              : typedef struct PrefetchBufferResult
      60              : {
      61              :     Buffer      recent_buffer;  /* If valid, a hit (recheck needed!) */
      62              :     bool        initiated_io;   /* If true, a miss resulting in async I/O */
      63              : } PrefetchBufferResult;
      64              : 
      65              : /*
      66              :  * Flags influencing the behaviour of ExtendBufferedRel*
      67              :  */
      68              : typedef enum ExtendBufferedFlags
      69              : {
      70              :     /*
      71              :      * Don't acquire extension lock. This is safe only if the relation isn't
      72              :      * shared, an access exclusive lock is held or if this is the startup
      73              :      * process.
      74              :      */
      75              :     EB_SKIP_EXTENSION_LOCK = (1 << 0),
      76              : 
      77              :     /* Is this extension part of recovery? */
      78              :     EB_PERFORMING_RECOVERY = (1 << 1),
      79              : 
      80              :     /*
      81              :      * Should the fork be created if it does not currently exist? This likely
      82              :      * only ever makes sense for relation forks.
      83              :      */
      84              :     EB_CREATE_FORK_IF_NEEDED = (1 << 2),
      85              : 
      86              :     /* Should the first (possibly only) return buffer be returned locked? */
      87              :     EB_LOCK_FIRST = (1 << 3),
      88              : 
      89              :     /* Should the smgr size cache be cleared? */
      90              :     EB_CLEAR_SIZE_CACHE = (1 << 4),
      91              : 
      92              :     /* internal flags follow */
      93              :     EB_LOCK_TARGET = (1 << 5),
      94              : }           ExtendBufferedFlags;
      95              : 
      96              : /* forward declared, to avoid including smgr.h here */
      97              : typedef struct SMgrRelationData *SMgrRelation;
      98              : 
      99              : /*
     100              :  * Some functions identify relations either by relation or smgr +
     101              :  * relpersistence, initialized via the BMR_REL()/BMR_SMGR() macros below.
     102              :  * This allows us to use the same function for both recovery and normal
     103              :  * operation.  When BMR_REL is used, it's not valid to cache its rd_smgr here,
     104              :  * because our pointer would be obsolete in case of relcache invalidation.
     105              :  * For simplicity, use BMR_GET_SMGR to read the smgr.
     106              :  */
     107              : typedef struct BufferManagerRelation
     108              : {
     109              :     Relation    rel;
     110              :     SMgrRelation smgr;
     111              :     char        relpersistence;
     112              : } BufferManagerRelation;
     113              : 
     114              : #define BMR_REL(p_rel) \
     115              :     ((BufferManagerRelation){.rel = p_rel})
     116              : #define BMR_SMGR(p_smgr, p_relpersistence) \
     117              :     ((BufferManagerRelation){.smgr = p_smgr, .relpersistence = p_relpersistence})
     118              : #define BMR_GET_SMGR(bmr) \
     119              :     (RelationIsValid((bmr).rel) ? RelationGetSmgr((bmr).rel) : (bmr).smgr)
     120              : 
     121              : /* Zero out page if reading fails. */
     122              : #define READ_BUFFERS_ZERO_ON_ERROR (1 << 0)
     123              : /* Call smgrprefetch() if I/O necessary. */
     124              : #define READ_BUFFERS_ISSUE_ADVICE (1 << 1)
     125              : /* Don't treat page as invalid due to checksum failures. */
     126              : #define READ_BUFFERS_IGNORE_CHECKSUM_FAILURES (1 << 2)
     127              : /* IO will immediately be waited for */
     128              : #define READ_BUFFERS_SYNCHRONOUSLY (1 << 3)
     129              : 
     130              : 
     131              : struct ReadBuffersOperation
     132              : {
     133              :     /* The following members should be set by the caller. */
     134              :     Relation    rel;            /* optional */
     135              :     SMgrRelation smgr;
     136              :     char        persistence;
     137              :     ForkNumber  forknum;
     138              :     BufferAccessStrategy strategy;
     139              : 
     140              :     /*
     141              :      * The following members are private state for communication between
     142              :      * StartReadBuffers() and WaitReadBuffers(), initialized only if an
     143              :      * actual read is required, and should not be modified.
     144              :      */
     145              :     Buffer     *buffers;
     146              :     BlockNumber blocknum;
     147              :     int         flags;
     148              :     int16       nblocks;
     149              :     int16       nblocks_done;
     150              :     PgAioWaitRef io_wref;
     151              :     PgAioReturn io_return;
     152              : };
     153              : 
     154              : typedef struct ReadBuffersOperation ReadBuffersOperation;
     155              : 
     156              : /* to avoid having to expose buf_internals.h here */
     157              : typedef struct WritebackContext WritebackContext;
     158              : 
     159              : /* in globals.c ... this duplicates miscadmin.h */
     160              : extern PGDLLIMPORT int NBuffers;
     161              : 
     162              : /* in bufmgr.c */
     163              : extern PGDLLIMPORT bool zero_damaged_pages;
     164              : extern PGDLLIMPORT int bgwriter_lru_maxpages;
     165              : extern PGDLLIMPORT double bgwriter_lru_multiplier;
     166              : extern PGDLLIMPORT bool track_io_timing;
     167              : 
     168              : #define DEFAULT_EFFECTIVE_IO_CONCURRENCY 16
     169              : #define DEFAULT_MAINTENANCE_IO_CONCURRENCY 16
     170              : extern PGDLLIMPORT int effective_io_concurrency;
     171              : extern PGDLLIMPORT int maintenance_io_concurrency;
     172              : 
     173              : #define MAX_IO_COMBINE_LIMIT PG_IOV_MAX
     174              : #define DEFAULT_IO_COMBINE_LIMIT Min(MAX_IO_COMBINE_LIMIT, (128 * 1024) / BLCKSZ)
     175              : extern PGDLLIMPORT int io_combine_limit;    /* min of the two GUCs below */
     176              : extern PGDLLIMPORT int io_combine_limit_guc;
     177              : extern PGDLLIMPORT int io_max_combine_limit;
     178              : 
     179              : extern PGDLLIMPORT int checkpoint_flush_after;
     180              : extern PGDLLIMPORT int backend_flush_after;
     181              : extern PGDLLIMPORT int bgwriter_flush_after;
     182              : 
     183              : extern PGDLLIMPORT const PgAioHandleCallbacks aio_shared_buffer_readv_cb;
     184              : extern PGDLLIMPORT const PgAioHandleCallbacks aio_local_buffer_readv_cb;
     185              : 
     186              : /* in buf_init.c */
     187              : extern PGDLLIMPORT char *BufferBlocks;
     188              : 
     189              : /* in localbuf.c */
     190              : extern PGDLLIMPORT int NLocBuffer;
     191              : extern PGDLLIMPORT Block *LocalBufferBlockPointers;
     192              : extern PGDLLIMPORT int32 *LocalRefCount;
     193              : 
     194              : /* upper limit for effective_io_concurrency */
     195              : #define MAX_IO_CONCURRENCY 1000
     196              : 
     197              : /* special block number for ReadBuffer() */
     198              : #define P_NEW   InvalidBlockNumber  /* grow the file to get a new page */
     199              : 
     200              : /*
     201              :  * Buffer content lock modes (mode argument for LockBuffer())
     202              :  */
     203              : typedef enum BufferLockMode
     204              : {
     205              :     BUFFER_LOCK_UNLOCK,
     206              : 
     207              :     /*
     208              :      * A share lock conflicts with exclusive locks.
     209              :      */
     210              :     BUFFER_LOCK_SHARE,
     211              : 
     212              :     /*
     213              :      * A share-exclusive lock conflicts with itself and exclusive locks.
     214              :      */
     215              :     BUFFER_LOCK_SHARE_EXCLUSIVE,
     216              : 
     217              :     /*
     218              :      * An exclusive lock conflicts with every other lock type.
     219              :      */
     220              :     BUFFER_LOCK_EXCLUSIVE,
     221              : } BufferLockMode;
     222              : 
     223              : 
     224              : /*
     225              :  * prototypes for functions in bufmgr.c
     226              :  */
     227              : extern PrefetchBufferResult PrefetchSharedBuffer(SMgrRelation smgr_reln,
     228              :                                                  ForkNumber forkNum,
     229              :                                                  BlockNumber blockNum);
     230              : extern PrefetchBufferResult PrefetchBuffer(Relation reln, ForkNumber forkNum,
     231              :                                            BlockNumber blockNum);
     232              : extern bool ReadRecentBuffer(RelFileLocator rlocator, ForkNumber forkNum,
     233              :                              BlockNumber blockNum, Buffer recent_buffer);
     234              : extern Buffer ReadBuffer(Relation reln, BlockNumber blockNum);
     235              : extern Buffer ReadBufferExtended(Relation reln, ForkNumber forkNum,
     236              :                                  BlockNumber blockNum, ReadBufferMode mode,
     237              :                                  BufferAccessStrategy strategy);
     238              : extern Buffer ReadBufferWithoutRelcache(RelFileLocator rlocator,
     239              :                                         ForkNumber forkNum, BlockNumber blockNum,
     240              :                                         ReadBufferMode mode, BufferAccessStrategy strategy,
     241              :                                         bool permanent);
     242              : 
     243              : extern bool StartReadBuffer(ReadBuffersOperation *operation,
     244              :                             Buffer *buffer,
     245              :                             BlockNumber blocknum,
     246              :                             int flags);
     247              : extern bool StartReadBuffers(ReadBuffersOperation *operation,
     248              :                              Buffer *buffers,
     249              :                              BlockNumber blockNum,
     250              :                              int *nblocks,
     251              :                              int flags);
     252              : extern void WaitReadBuffers(ReadBuffersOperation *operation);
     253              : 
     254              : extern void ReleaseBuffer(Buffer buffer);
     255              : extern void UnlockReleaseBuffer(Buffer buffer);
     256              : extern bool BufferIsLockedByMe(Buffer buffer);
     257              : extern bool BufferIsLockedByMeInMode(Buffer buffer, BufferLockMode mode);
     258              : extern bool BufferIsDirty(Buffer buffer);
     259              : extern void MarkBufferDirty(Buffer buffer);
     260              : extern void IncrBufferRefCount(Buffer buffer);
     261              : extern void CheckBufferIsPinnedOnce(Buffer buffer);
     262              : extern Buffer ReleaseAndReadBuffer(Buffer buffer, Relation relation,
     263              :                                    BlockNumber blockNum);
     264              : 
     265              : extern Buffer ExtendBufferedRel(BufferManagerRelation bmr,
     266              :                                 ForkNumber forkNum,
     267              :                                 BufferAccessStrategy strategy,
     268              :                                 uint32 flags);
     269              : extern BlockNumber ExtendBufferedRelBy(BufferManagerRelation bmr,
     270              :                                        ForkNumber fork,
     271              :                                        BufferAccessStrategy strategy,
     272              :                                        uint32 flags,
     273              :                                        uint32 extend_by,
     274              :                                        Buffer *buffers,
     275              :                                        uint32 *extended_by);
     276              : extern Buffer ExtendBufferedRelTo(BufferManagerRelation bmr,
     277              :                                   ForkNumber fork,
     278              :                                   BufferAccessStrategy strategy,
     279              :                                   uint32 flags,
     280              :                                   BlockNumber extend_to,
     281              :                                   ReadBufferMode mode);
     282              : 
     283              : extern void InitBufferManagerAccess(void);
     284              : extern void AtEOXact_Buffers(bool isCommit);
     285              : #ifdef USE_ASSERT_CHECKING
     286              : extern void AssertBufferLocksPermitCatalogRead(void);
     287              : #endif
     288              : extern char *DebugPrintBufferRefcount(Buffer buffer);
     289              : extern void CheckPointBuffers(int flags);
     290              : extern BlockNumber BufferGetBlockNumber(Buffer buffer);
     291              : extern BlockNumber RelationGetNumberOfBlocksInFork(Relation relation,
     292              :                                                    ForkNumber forkNum);
     293              : extern void FlushOneBuffer(Buffer buffer);
     294              : extern void FlushRelationBuffers(Relation rel);
     295              : extern void FlushRelationsAllBuffers(SMgrRelation *smgrs, int nrels);
     296              : extern void CreateAndCopyRelationData(RelFileLocator src_rlocator,
     297              :                                       RelFileLocator dst_rlocator,
     298              :                                       bool permanent);
     299              : extern void FlushDatabaseBuffers(Oid dbid);
     300              : extern void DropRelationBuffers(SMgrRelation smgr_reln,
     301              :                                 ForkNumber *forkNum,
     302              :                                 int nforks, BlockNumber *firstDelBlock);
     303              : extern void DropRelationsAllBuffers(SMgrRelation *smgr_reln,
     304              :                                     int nlocators);
     305              : extern void DropDatabaseBuffers(Oid dbid);
     306              : 
     307              : #define RelationGetNumberOfBlocks(reln) \
     308              :     RelationGetNumberOfBlocksInFork(reln, MAIN_FORKNUM)
     309              : 
     310              : extern bool BufferIsPermanent(Buffer buffer);
     311              : extern XLogRecPtr BufferGetLSNAtomic(Buffer buffer);
     312              : extern void BufferGetTag(Buffer buffer, RelFileLocator *rlocator,
     313              :                          ForkNumber *forknum, BlockNumber *blknum);
     314              : 
     315              : extern void MarkBufferDirtyHint(Buffer buffer, bool buffer_std);
     316              : 
     317              : extern void UnlockBuffers(void);
     318              : extern void UnlockBuffer(Buffer buffer);
     319              : extern void LockBufferInternal(Buffer buffer, BufferLockMode mode);
     320              : 
     321              : /*
     322              :  * Dispatch to UnlockBuffer() for BUFFER_LOCK_UNLOCK, otherwise to
     323              :  * LockBufferInternal().  Doing this test in bufmgr.c leads to sufficiently
     324              :  * worse branch prediction to impact performance; here `mode` is usually a
     325              :  * constant, so the compiler can optimize the test out.
     326              :  */
     327              : static inline void
     328    176289909 : LockBuffer(Buffer buffer, BufferLockMode mode)
     329              : {
     330    176289909 :     if (mode == BUFFER_LOCK_UNLOCK)
     331     89072007 :         UnlockBuffer(buffer);
     332              :     else
     333     87217902 :         LockBufferInternal(buffer, mode);
     334    176289909 : }
     335              : 
     336              : extern bool ConditionalLockBuffer(Buffer buffer);
     337              : extern void LockBufferForCleanup(Buffer buffer);
     338              : extern bool ConditionalLockBufferForCleanup(Buffer buffer);
     339              : extern bool IsBufferCleanupOK(Buffer buffer);
     340              : extern bool HoldingBufferPinThatDelaysRecovery(void);
     341              : 
     342              : extern bool BgBufferSync(WritebackContext *wb_context);
     343              : 
     344              : extern uint32 GetPinLimit(void);
     345              : extern uint32 GetLocalPinLimit(void);
     346              : extern uint32 GetAdditionalPinLimit(void);
     347              : extern uint32 GetAdditionalLocalPinLimit(void);
     348              : extern void LimitAdditionalPins(uint32 *additional_pins);
     349              : extern void LimitAdditionalLocalPins(uint32 *additional_pins);
     350              : 
     351              : extern bool EvictUnpinnedBuffer(Buffer buf, bool *buffer_flushed);
     352              : extern void EvictAllUnpinnedBuffers(int32 *buffers_evicted,
     353              :                                     int32 *buffers_flushed,
     354              :                                     int32 *buffers_skipped);
     355              : extern void EvictRelUnpinnedBuffers(Relation rel,
     356              :                                     int32 *buffers_evicted,
     357              :                                     int32 *buffers_flushed,
     358              :                                     int32 *buffers_skipped);
     359              : extern bool MarkDirtyUnpinnedBuffer(Buffer buf, bool *buffer_already_dirty);
     360              : extern void MarkDirtyRelUnpinnedBuffers(Relation rel,
     361              :                                         int32 *buffers_dirtied,
     362              :                                         int32 *buffers_already_dirty,
     363              :                                         int32 *buffers_skipped);
     364              : extern void MarkDirtyAllUnpinnedBuffers(int32 *buffers_dirtied,
     365              :                                         int32 *buffers_already_dirty,
     366              :                                         int32 *buffers_skipped);
     367              : 
     368              : /* in buf_init.c */
     369              : extern void BufferManagerShmemInit(void);
     370              : extern Size BufferManagerShmemSize(void);
     371              : 
     372              : /* in localbuf.c */
     373              : extern void AtProcExit_LocalBuffers(void);
     374              : 
     375              : /* in freelist.c */
     376              : 
     377              : extern BufferAccessStrategy GetAccessStrategy(BufferAccessStrategyType btype);
     378              : extern BufferAccessStrategy GetAccessStrategyWithSize(BufferAccessStrategyType btype,
     379              :                                                       int ring_size_kb);
     380              : extern int  GetAccessStrategyBufferCount(BufferAccessStrategy strategy);
     381              : extern int  GetAccessStrategyPinLimit(BufferAccessStrategy strategy);
     382              : 
     383              : extern void FreeAccessStrategy(BufferAccessStrategy strategy);
     384              : 
     385              : 
     386              : /* inline functions */
     387              : 
     388              : /*
     389              :  * Although this header file is nominally backend-only, certain frontend
     390              :  * programs like pg_waldump include it.  For compilers that emit static
     391              :  * inline functions even when they're unused, that leads to unsatisfied
     392              :  * external references; hence hide these with #ifndef FRONTEND.
     393              :  */
     394              : 
     395              : #ifndef FRONTEND
     396              : 
     397              : /*
     398              :  * BufferIsValid
     399              :  *      True iff the given buffer number is valid (either as a shared
     400              :  *      or local buffer).
     401              :  *
     402              :  * Note: For a long time this was defined the same as BufferIsPinned,
     403              :  * that is it would say False if you didn't hold a pin on the buffer.
     404              :  * I believe this was bogus and served only to mask logic errors.
     405              :  * Code should always know whether it has a buffer reference,
     406              :  * independently of the pin state.
     407              :  *
     408              :  * Note: For a further long time this was not quite the inverse of the
     409              :  * BufferIsInvalid() macro, in that it also did sanity checks to verify
     410              :  * that the buffer number was in range.  Most likely, it was originally
     411              :  * intended only to be used in assertions, but its use has since
     412              :  * expanded quite a bit, and the overhead of making those checks even
     413              :  * in non-assert-enabled builds can be significant.  Thus, we've now
     414              :  * demoted the range checks to assertions within the function itself.
     415              :  */
     416              : static inline bool
     417    333377083 : BufferIsValid(Buffer bufnum)
     418              : {
     419              :     Assert(bufnum <= NBuffers);
     420              :     Assert(bufnum >= -NLocBuffer);
     421              : 
     422    333377083 :     return bufnum != InvalidBuffer;
     423              : }
     424              : 
     425              : /*
     426              :  * BufferGetBlock
     427              :  *      Returns a reference to a disk page image associated with a buffer,
     428              :  *      from LocalBufferBlockPointers if local, else within BufferBlocks.
     429              :  * Note:
     430              :  *      Assumes buffer is valid (only checked by Assert).
     431              :  */
     432              : static inline Block
     433    381104680 : BufferGetBlock(Buffer buffer)
     434              : {
     435              :     Assert(BufferIsValid(buffer));
     436              : 
     437    381104680 :     if (BufferIsLocal(buffer))
     438     11740252 :         return LocalBufferBlockPointers[-buffer - 1];
     439              :     else
     440    369364428 :         return (Block) (BufferBlocks + ((Size) (buffer - 1)) * BLCKSZ);
     441              : }
     442              : 
     443              : /*
     444              :  * BufferGetPageSize
     445              :  *      Returns the page size within a buffer (currently always BLCKSZ).
     446              :  *
     447              :  * Notes:
     448              :  *      Assumes buffer is valid.
     449              :  *
     450              :  *      The buffer can be a raw disk block and need not contain a valid
     451              :  *      (formatted) disk page.
     452              :  */
     453              : /* XXX should dig out of buffer descriptor */
     454              : static inline Size
     455       230254 : BufferGetPageSize(Buffer buffer)
     456              : {
     457              :     Assert(BufferIsValid(buffer));
     458       230254 :     return (Size) BLCKSZ;
     459              : }
     460              : 
     461              : /*
     462              :  * BufferGetPage
     463              :  *      Returns the page associated with a buffer (BufferGetBlock() as a Page).
     464              :  */
     465              : static inline Page
     466    378101514 : BufferGetPage(Buffer buffer)
     467              : {
     468    378101514 :     return (Page) BufferGetBlock(buffer);
     469              : }
     470              : 
     471              : #endif                          /* FRONTEND */
     472              : 
     473              : #endif                          /* BUFMGR_H */
        

Generated by: LCOV version 2.0-1