LCOV - code coverage report
Current view: top level - src/backend/replication - walreceiverfuncs.c (source / functions) Coverage Total Hit
Test: PostgreSQL 19devel Lines: 83.4 % 151 126
Test Date: 2026-04-07 14:16:30 Functions: 90.9 % 11 10
Legend: Lines:     hit not hit

            Line data    Source code
       1              : /*-------------------------------------------------------------------------
       2              :  *
       3              :  * walreceiverfuncs.c
       4              :  *
       5              :  * This file contains functions used by the startup process to communicate
       6              :  * with the walreceiver process. Functions implementing walreceiver itself
       7              :  * are in walreceiver.c.
       8              :  *
       9              :  * Portions Copyright (c) 2010-2026, PostgreSQL Global Development Group
      10              :  *
      11              :  *
      12              :  * IDENTIFICATION
      13              :  *    src/backend/replication/walreceiverfuncs.c
      14              :  *
      15              :  *-------------------------------------------------------------------------
      16              :  */
      17              : #include "postgres.h"
      18              : 
      19              : #include <sys/stat.h>
      20              : #include <sys/time.h>
      21              : #include <time.h>
      22              : #include <unistd.h>
      23              : #include <signal.h>
      24              : 
      25              : #include "access/xlog_internal.h"
      26              : #include "access/xlogrecovery.h"
      27              : #include "pgstat.h"
      28              : #include "replication/walreceiver.h"
      29              : #include "storage/pmsignal.h"
      30              : #include "storage/proc.h"
      31              : #include "storage/shmem.h"
      32              : #include "storage/subsystems.h"
      33              : #include "utils/timestamp.h"
      34              : #include "utils/wait_event.h"
      35              : 
      36              : WalRcvData *WalRcv = NULL;
      37              : 
      38              : static void WalRcvShmemRequest(void *arg);
      39              : static void WalRcvShmemInit(void *arg);
      40              : 
      41              : const ShmemCallbacks WalRcvShmemCallbacks = {
      42              :     .request_fn = WalRcvShmemRequest,
      43              :     .init_fn = WalRcvShmemInit,
      44              : };
      45              : 
      46              : /*
      47              :  * How long to wait for walreceiver to start up after requesting
      48              :  * postmaster to launch it. In seconds.
      49              :  */
      50              : #define WALRCV_STARTUP_TIMEOUT 10
      51              : 
      52              : /* Register shared memory space needed by walreceiver */
      53              : static void
      54         1234 : WalRcvShmemRequest(void *arg)
      55              : {
      56         1234 :     ShmemRequestStruct(.name = "Wal Receiver Ctl",
      57              :                        .size = sizeof(WalRcvData),
      58              :                        .ptr = (void **) &WalRcv,
      59              :         );
      60         1234 : }
      61              : 
      62              : /* Initialize walreceiver-related shared memory */
      63              : static void
      64         1231 : WalRcvShmemInit(void *arg)
      65              : {
      66         1231 :     MemSet(WalRcv, 0, sizeof(WalRcvData));
      67         1231 :     WalRcv->walRcvState = WALRCV_STOPPED;
      68         1231 :     ConditionVariableInit(&WalRcv->walRcvStoppedCV);
      69         1231 :     SpinLockInit(&WalRcv->mutex);
      70         1231 :     pg_atomic_init_u64(&WalRcv->writtenUpto, 0);
      71         1231 :     WalRcv->procno = INVALID_PROC_NUMBER;
      72         1231 : }
      73              : 
      74              : /* Is walreceiver running (or starting up)? */
      75              : bool
      76         1116 : WalRcvRunning(void)
      77              : {
      78         1116 :     WalRcvData *walrcv = WalRcv;
      79              :     WalRcvState state;
      80              :     pg_time_t   startTime;
      81              : 
      82         1116 :     SpinLockAcquire(&walrcv->mutex);
      83              : 
      84         1116 :     state = walrcv->walRcvState;
      85         1116 :     startTime = walrcv->startTime;
      86              : 
      87         1116 :     SpinLockRelease(&walrcv->mutex);
      88              : 
      89              :     /*
      90              :      * If it has taken too long for walreceiver to start up, give up. Setting
      91              :      * the state to STOPPED ensures that if walreceiver later does start up
      92              :      * after all, it will see that it's not supposed to be running and die
      93              :      * without doing anything.
      94              :      */
      95         1116 :     if (state == WALRCV_STARTING)
      96              :     {
      97            0 :         pg_time_t   now = (pg_time_t) time(NULL);
      98              : 
      99            0 :         if ((now - startTime) > WALRCV_STARTUP_TIMEOUT)
     100              :         {
     101            0 :             bool        stopped = false;
     102              : 
     103            0 :             SpinLockAcquire(&walrcv->mutex);
     104            0 :             if (walrcv->walRcvState == WALRCV_STARTING)
     105              :             {
     106            0 :                 state = walrcv->walRcvState = WALRCV_STOPPED;
     107            0 :                 stopped = true;
     108              :             }
     109            0 :             SpinLockRelease(&walrcv->mutex);
     110              : 
     111            0 :             if (stopped)
     112            0 :                 ConditionVariableBroadcast(&walrcv->walRcvStoppedCV);
     113              :         }
     114              :     }
     115              : 
     116         1116 :     if (state != WALRCV_STOPPED)
     117           44 :         return true;
     118              :     else
     119         1072 :         return false;
     120              : }
     121              : 
     122              : /* Return the state of the walreceiver. */
     123              : WalRcvState
     124            0 : WalRcvGetState(void)
     125              : {
     126            0 :     WalRcvData *walrcv = WalRcv;
     127              :     WalRcvState state;
     128              : 
     129            0 :     SpinLockAcquire(&walrcv->mutex);
     130            0 :     state = walrcv->walRcvState;
     131            0 :     SpinLockRelease(&walrcv->mutex);
     132              : 
     133            0 :     return state;
     134              : }
     135              : 
     136              : /*
     137              :  * Is walreceiver running and streaming (or at least attempting to connect,
     138              :  * or starting up)?
     139              :  */
     140              : bool
     141        34660 : WalRcvStreaming(void)
     142              : {
     143        34660 :     WalRcvData *walrcv = WalRcv;
     144              :     WalRcvState state;
     145              :     pg_time_t   startTime;
     146              : 
     147        34660 :     SpinLockAcquire(&walrcv->mutex);
     148              : 
     149        34660 :     state = walrcv->walRcvState;
     150        34660 :     startTime = walrcv->startTime;
     151              : 
     152        34660 :     SpinLockRelease(&walrcv->mutex);
     153              : 
     154              :     /*
     155              :      * If it has taken too long for walreceiver to start up, give up. Setting
     156              :      * the state to STOPPED ensures that if walreceiver later does start up
     157              :      * after all, it will see that it's not supposed to be running and die
     158              :      * without doing anything.
     159              :      */
     160        34660 :     if (state == WALRCV_STARTING)
     161              :     {
     162          306 :         pg_time_t   now = (pg_time_t) time(NULL);
     163              : 
     164          306 :         if ((now - startTime) > WALRCV_STARTUP_TIMEOUT)
     165              :         {
     166            0 :             bool        stopped = false;
     167              : 
     168            0 :             SpinLockAcquire(&walrcv->mutex);
     169            0 :             if (walrcv->walRcvState == WALRCV_STARTING)
     170              :             {
     171            0 :                 state = walrcv->walRcvState = WALRCV_STOPPED;
     172            0 :                 stopped = true;
     173              :             }
     174            0 :             SpinLockRelease(&walrcv->mutex);
     175              : 
     176            0 :             if (stopped)
     177            0 :                 ConditionVariableBroadcast(&walrcv->walRcvStoppedCV);
     178              :         }
     179              :     }
     180              : 
     181        34660 :     if (state == WALRCV_STREAMING || state == WALRCV_STARTING ||
     182          313 :         state == WALRCV_CONNECTING || state == WALRCV_RESTARTING)
     183        34352 :         return true;
     184              :     else
     185          308 :         return false;
     186              : }
     187              : 
     188              : /*
     189              :  * Stop walreceiver (if running) and wait for it to die.
     190              :  * Executed by the Startup process.
     191              :  */
     192              : void
     193         1068 : ShutdownWalRcv(void)
     194              : {
     195         1068 :     WalRcvData *walrcv = WalRcv;
     196         1068 :     pid_t       walrcvpid = 0;
     197         1068 :     bool        stopped = false;
     198              : 
     199              :     /*
     200              :      * Request walreceiver to stop. Walreceiver will switch to WALRCV_STOPPED
     201              :      * mode once it's finished, and will also request postmaster to not
     202              :      * restart itself.
     203              :      */
     204         1068 :     SpinLockAcquire(&walrcv->mutex);
     205         1068 :     switch (walrcv->walRcvState)
     206              :     {
     207         1027 :         case WALRCV_STOPPED:
     208         1027 :             break;
     209            2 :         case WALRCV_STARTING:
     210            2 :             walrcv->walRcvState = WALRCV_STOPPED;
     211            2 :             stopped = true;
     212            2 :             break;
     213              : 
     214           39 :         case WALRCV_CONNECTING:
     215              :         case WALRCV_STREAMING:
     216              :         case WALRCV_WAITING:
     217              :         case WALRCV_RESTARTING:
     218           39 :             walrcv->walRcvState = WALRCV_STOPPING;
     219              :             pg_fallthrough;
     220           39 :         case WALRCV_STOPPING:
     221           39 :             walrcvpid = walrcv->pid;
     222           39 :             break;
     223              :     }
     224         1068 :     SpinLockRelease(&walrcv->mutex);
     225              : 
     226              :     /* Unnecessary but consistent. */
     227         1068 :     if (stopped)
     228            2 :         ConditionVariableBroadcast(&walrcv->walRcvStoppedCV);
     229              : 
     230              :     /*
     231              :      * Signal walreceiver process if it was still running.
     232              :      */
     233         1068 :     if (walrcvpid != 0)
     234           39 :         kill(walrcvpid, SIGTERM);
     235              : 
     236              :     /*
     237              :      * Wait for walreceiver to acknowledge its death by setting state to
     238              :      * WALRCV_STOPPED.
     239              :      */
     240         1068 :     ConditionVariablePrepareToSleep(&walrcv->walRcvStoppedCV);
     241         1105 :     while (WalRcvRunning())
     242           37 :         ConditionVariableSleep(&walrcv->walRcvStoppedCV,
     243              :                                WAIT_EVENT_WAL_RECEIVER_EXIT);
     244         1068 :     ConditionVariableCancelSleep();
     245         1068 : }
     246              : 
     247              : /*
     248              :  * Request postmaster to start walreceiver.
     249              :  *
     250              :  * "recptr" indicates the position where streaming should begin.  "conninfo"
     251              :  * is a libpq connection string to use.  "slotname" is, optionally, the name
     252              :  * of a replication slot to acquire.  "create_temp_slot" indicates to create
     253              :  * a temporary slot when no "slotname" is given.
     254              :  *
     255              :  * WAL receivers do not directly load GUC parameters used for the connection
     256              :  * to the primary, and rely on the values passed down by the caller of this
     257              :  * routine instead.  Hence, the addition of any new parameters should happen
     258              :  * through this code path.
     259              :  */
     260              : void
     261          198 : RequestXLogStreaming(TimeLineID tli, XLogRecPtr recptr, const char *conninfo,
     262              :                      const char *slotname, bool create_temp_slot)
     263              : {
     264          198 :     WalRcvData *walrcv = WalRcv;
     265          198 :     bool        launch = false;
     266          198 :     pg_time_t   now = (pg_time_t) time(NULL);
     267              :     ProcNumber  walrcv_proc;
     268              : 
     269              :     /*
     270              :      * We always start at the beginning of the segment. That prevents a broken
     271              :      * segment (i.e., with no records in the first half of a segment) from
     272              :      * being created by XLOG streaming, which might cause trouble later on if
     273              :      * the segment is e.g archived.
     274              :      */
     275          198 :     if (XLogSegmentOffset(recptr, wal_segment_size) != 0)
     276          198 :         recptr -= XLogSegmentOffset(recptr, wal_segment_size);
     277              : 
     278          198 :     SpinLockAcquire(&walrcv->mutex);
     279              : 
     280              :     /* It better be stopped if we try to restart it */
     281              :     Assert(walrcv->walRcvState == WALRCV_STOPPED ||
     282              :            walrcv->walRcvState == WALRCV_WAITING);
     283              : 
     284          198 :     if (conninfo != NULL)
     285          198 :         strlcpy(walrcv->conninfo, conninfo, MAXCONNINFO);
     286              :     else
     287            0 :         walrcv->conninfo[0] = '\0';
     288              : 
     289              :     /*
     290              :      * Use configured replication slot if present, and ignore the value of
     291              :      * create_temp_slot as the slot name should be persistent.  Otherwise, use
     292              :      * create_temp_slot to determine whether this WAL receiver should create a
     293              :      * temporary slot by itself and use it, or not.
     294              :      */
     295          198 :     if (slotname != NULL && slotname[0] != '\0')
     296              :     {
     297           58 :         strlcpy(walrcv->slotname, slotname, NAMEDATALEN);
     298           58 :         walrcv->is_temp_slot = false;
     299              :     }
     300              :     else
     301              :     {
     302          140 :         walrcv->slotname[0] = '\0';
     303          140 :         walrcv->is_temp_slot = create_temp_slot;
     304              :     }
     305              : 
     306          198 :     if (walrcv->walRcvState == WALRCV_STOPPED)
     307              :     {
     308          191 :         launch = true;
     309          191 :         walrcv->walRcvState = WALRCV_STARTING;
     310              :     }
     311              :     else
     312            7 :         walrcv->walRcvState = WALRCV_RESTARTING;
     313          198 :     walrcv->startTime = now;
     314              : 
     315              :     /*
     316              :      * If this is the first startup of walreceiver (on this timeline),
     317              :      * initialize flushedUpto and latestChunkStart to the starting point.
     318              :      */
     319          198 :     if (!XLogRecPtrIsValid(walrcv->receiveStart) || walrcv->receivedTLI != tli)
     320              :     {
     321          109 :         walrcv->flushedUpto = recptr;
     322          109 :         walrcv->receivedTLI = tli;
     323          109 :         walrcv->latestChunkStart = recptr;
     324          109 :         pg_atomic_write_u64(&walrcv->writtenUpto, recptr);
     325              :     }
     326          198 :     walrcv->receiveStart = recptr;
     327          198 :     walrcv->receiveStartTLI = tli;
     328              : 
     329          198 :     walrcv_proc = walrcv->procno;
     330              : 
     331          198 :     SpinLockRelease(&walrcv->mutex);
     332              : 
     333          198 :     if (launch)
     334          191 :         SendPostmasterSignal(PMSIGNAL_START_WALRECEIVER);
     335            7 :     else if (walrcv_proc != INVALID_PROC_NUMBER)
     336            7 :         SetLatch(&GetPGProcByNumber(walrcv_proc)->procLatch);
     337          198 : }
     338              : 
     339              : /*
     340              :  * Returns the last+1 byte position that walreceiver has flushed.
     341              :  *
     342              :  * Optionally, returns the previous chunk start, that is the first byte
     343              :  * written in the most recent walreceiver flush cycle.  Callers not
     344              :  * interested in that value may pass NULL for latestChunkStart. Same for
     345              :  * receiveTLI.
     346              :  */
     347              : XLogRecPtr
     348        33762 : GetWalRcvFlushRecPtr(XLogRecPtr *latestChunkStart, TimeLineID *receiveTLI)
     349              : {
     350        33762 :     WalRcvData *walrcv = WalRcv;
     351              :     XLogRecPtr  recptr;
     352              : 
     353        33762 :     SpinLockAcquire(&walrcv->mutex);
     354        33762 :     recptr = walrcv->flushedUpto;
     355        33762 :     if (latestChunkStart)
     356        32559 :         *latestChunkStart = walrcv->latestChunkStart;
     357        33762 :     if (receiveTLI)
     358        33520 :         *receiveTLI = walrcv->receivedTLI;
     359        33762 :     SpinLockRelease(&walrcv->mutex);
     360              : 
     361        33762 :     return recptr;
     362              : }
     363              : 
     364              : /*
     365              :  * Returns the last+1 byte position that walreceiver has written.
     366              :  * This returns a recently written value without taking a lock.
     367              :  */
     368              : XLogRecPtr
     369           43 : GetWalRcvWriteRecPtr(void)
     370              : {
     371           43 :     WalRcvData *walrcv = WalRcv;
     372              : 
     373           43 :     return pg_atomic_read_u64(&walrcv->writtenUpto);
     374              : }
     375              : 
     376              : /*
     377              :  * Returns the replication apply delay in ms or -1
     378              :  * if the apply delay info is not available
     379              :  */
     380              : int
     381          411 : GetReplicationApplyDelay(void)
     382              : {
     383          411 :     WalRcvData *walrcv = WalRcv;
     384              :     XLogRecPtr  receivePtr;
     385              :     XLogRecPtr  replayPtr;
     386              :     TimestampTz chunkReplayStartTime;
     387              : 
     388          411 :     SpinLockAcquire(&walrcv->mutex);
     389          411 :     receivePtr = walrcv->flushedUpto;
     390          411 :     SpinLockRelease(&walrcv->mutex);
     391              : 
     392          411 :     replayPtr = GetXLogReplayRecPtr(NULL);
     393              : 
     394          411 :     if (receivePtr == replayPtr)
     395          155 :         return 0;
     396              : 
     397          256 :     chunkReplayStartTime = GetCurrentChunkReplayStartTime();
     398              : 
     399          256 :     if (chunkReplayStartTime == 0)
     400            9 :         return -1;
     401              : 
     402          247 :     return TimestampDifferenceMilliseconds(chunkReplayStartTime,
     403              :                                            GetCurrentTimestamp());
     404              : }
     405              : 
     406              : /*
     407              :  * Returns the network latency in ms, note that this includes any
     408              :  * difference in clock settings between the servers, as well as timezone.
     409              :  */
     410              : int
     411          411 : GetReplicationTransferLatency(void)
     412              : {
     413          411 :     WalRcvData *walrcv = WalRcv;
     414              :     TimestampTz lastMsgSendTime;
     415              :     TimestampTz lastMsgReceiptTime;
     416              : 
     417          411 :     SpinLockAcquire(&walrcv->mutex);
     418          411 :     lastMsgSendTime = walrcv->lastMsgSendTime;
     419          411 :     lastMsgReceiptTime = walrcv->lastMsgReceiptTime;
     420          411 :     SpinLockRelease(&walrcv->mutex);
     421              : 
     422          411 :     return TimestampDifferenceMilliseconds(lastMsgSendTime,
     423              :                                            lastMsgReceiptTime);
     424              : }
        

Generated by: LCOV version 2.0-1