PostgreSQL Source Code git master
Loading...
Searching...
No Matches
walreceiverfuncs.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * walreceiverfuncs.c
4 *
5 * This file contains functions used by the startup process to communicate
6 * with the walreceiver process. Functions implementing walreceiver itself
7 * are in walreceiver.c.
8 *
9 * Portions Copyright (c) 2010-2026, PostgreSQL Global Development Group
10 *
11 *
12 * IDENTIFICATION
13 * src/backend/replication/walreceiverfuncs.c
14 *
15 *-------------------------------------------------------------------------
16 */
17#include "postgres.h"
18
19#include <sys/stat.h>
20#include <sys/time.h>
21#include <time.h>
22#include <unistd.h>
23#include <signal.h>
24
26#include "access/xlogrecovery.h"
27#include "pgstat.h"
29#include "storage/pmsignal.h"
30#include "storage/proc.h"
31#include "storage/shmem.h"
32#include "utils/timestamp.h"
33
35
36/*
37 * How long to wait for walreceiver to start up after requesting
38 * postmaster to launch it. In seconds.
39 */
40#define WALRCV_STARTUP_TIMEOUT 10
41
42/*
 * Report shared memory space needed by WalRcvShmemInit.
 *
 * The result is the size of one WalRcvData struct, accumulated through
 * add_size().
 *
 * NOTE(review): the listing line that carries the function name and
 * parameter list (line 44) is missing from this copy; presumably this is
 * WalRcvShmemSize(void) -- confirm against the upstream file.
 */
43Size
45{
46 Size size = 0;
47
48 size = add_size(size, sizeof(WalRcvData));
49
50 return size;
51}
52
53/*
 * Allocate and initialize walreceiver-related shared memory.
 *
 * Obtains the "Wal Receiver Ctl" structure, sized by WalRcvShmemSize(), from
 * ShmemInitStruct() and stores the pointer in the global WalRcv. The
 * initialization branch is taken only when ShmemInitStruct() reports the
 * structure as not found.
 *
 * NOTE(review): the function-name line (55) and the initialization
 * statements inside the !found branch (lines 65-70) are missing from this
 * copy of the listing -- confirm against the upstream file.
 */
54void
56{
57 bool found;
58
59 WalRcv = (WalRcvData *)
60 ShmemInitStruct("Wal Receiver Ctl", WalRcvShmemSize(), &found);
61
62 if (!found)
63 {
64 /* First time through, so initialize */
71 }
72}
73
74/*
 * Is walreceiver running (or starting up)?
 *
 * Returns true for every state other than WALRCV_STOPPED.
 *
 * Side effect: if more than WALRCV_STARTUP_TIMEOUT seconds have passed since
 * walrcv->startTime and the state is still WALRCV_STARTING when re-checked
 * under the spinlock, the state is set to WALRCV_STOPPED and waiters on
 * walRcvStoppedCV are woken.
 *
 * NOTE(review): listing lines 76, 78-79 and 95 are missing from this copy
 * (apparently the function name, the declarations of "walrcv" and "state",
 * and the test guarding the timeout block, presumably
 * "if (state == WALRCV_STARTING)") -- confirm against the upstream file.
 */
75bool
77{
80 pg_time_t startTime;
81
82 SpinLockAcquire(&walrcv->mutex);
83
84 state = walrcv->walRcvState;
85 startTime = walrcv->startTime;
86
87 SpinLockRelease(&walrcv->mutex);
88
89 /*
 90 * If it has taken too long for walreceiver to start up, give up. Setting
 91 * the state to STOPPED ensures that if walreceiver later does start up
 92 * after all, it will see that it's not supposed to be running and die
 93 * without doing anything.
 94 */
96 {
97 pg_time_t now = (pg_time_t) time(NULL);
98
99 if ((now - startTime) > WALRCV_STARTUP_TIMEOUT)
100 {
101 bool stopped = false;
102
103 SpinLockAcquire(&walrcv->mutex);
104 if (walrcv->walRcvState == WALRCV_STARTING) /* re-check: the lock was released since the first read */
105 {
106 state = walrcv->walRcvState = WALRCV_STOPPED;
107 stopped = true;
108 }
109 SpinLockRelease(&walrcv->mutex);
110
111 if (stopped) /* broadcast only after the spinlock has been released */
112 ConditionVariableBroadcast(&walrcv->walRcvStoppedCV);
113 }
114 }
115
116 if (state != WALRCV_STOPPED)
117 return true;
118 else
119 return false;
120}
121
122/*
 * Return the state of the walreceiver.
 *
 * The value is a snapshot of walrcv->walRcvState read while holding
 * walrcv->mutex; it may already be out of date by the time the caller
 * inspects it.
 *
 * NOTE(review): listing lines 123-124 and 126-127 are missing from this
 * copy (apparently the return type, the function name and the declarations
 * of "walrcv" and "state") -- confirm against the upstream file.
 */
125{
128
129 SpinLockAcquire(&walrcv->mutex);
130 state = walrcv->walRcvState;
131 SpinLockRelease(&walrcv->mutex);
132
133 return state;
134}
135
136/*
 137 * Is walreceiver running and streaming (or at least attempting to connect,
 138 * or starting up)?
 *
 * Side effect: if more than WALRCV_STARTUP_TIMEOUT seconds have passed since
 * walrcv->startTime and the state is still WALRCV_STARTING when re-checked
 * under the spinlock, the state is set to WALRCV_STOPPED and waiters on
 * walRcvStoppedCV are woken.
 *
 * NOTE(review): listing lines 141, 143-144 and 181-182 are missing from this
 * copy (apparently the function name, the declarations of "walrcv" and
 * "state", and the condition that selects between the final "return true"
 * and "return false"). Which states count as "streaming" therefore cannot
 * be read from this listing -- confirm against the upstream file.
 139 */
140bool
142{
145 pg_time_t startTime;
146
147 SpinLockAcquire(&walrcv->mutex);
148
149 state = walrcv->walRcvState;
150 startTime = walrcv->startTime;
151
152 SpinLockRelease(&walrcv->mutex);
153
154 /*
 155 * If it has taken too long for walreceiver to start up, give up. Setting
 156 * the state to STOPPED ensures that if walreceiver later does start up
 157 * after all, it will see that it's not supposed to be running and die
 158 * without doing anything.
 159 */
160 if (state == WALRCV_STARTING)
161 {
162 pg_time_t now = (pg_time_t) time(NULL);
163
164 if ((now - startTime) > WALRCV_STARTUP_TIMEOUT)
165 {
166 bool stopped = false;
167
168 SpinLockAcquire(&walrcv->mutex);
169 if (walrcv->walRcvState == WALRCV_STARTING) /* re-check: the lock was released since the first read */
170 {
171 state = walrcv->walRcvState = WALRCV_STOPPED;
172 stopped = true;
173 }
174 SpinLockRelease(&walrcv->mutex);
175
176 if (stopped) /* broadcast only after the spinlock has been released */
177 ConditionVariableBroadcast(&walrcv->walRcvStoppedCV);
178 }
179 }
180
183 return true;
184 else
185 return false;
186}
187
188/*
 189 * Stop walreceiver (if running) and wait for it to die.
 190 * Executed by the Startup process.
 *
 * Under walrcv->mutex the state is moved towards WALRCV_STOPPED: a
 * walreceiver in WALRCV_STARTING is marked stopped directly, while the
 * running states are switched to WALRCV_STOPPING and the process id is
 * captured. The function then waits on walRcvStoppedCV until WalRcvRunning()
 * reports false.
 *
 * NOTE(review): listing lines 193, 195, 214, 217, 234 and 243-244 are
 * missing from this copy (apparently the function name, the declaration of
 * "walrcv", two further case labels, the statement that signals walrcvpid,
 * and the remaining arguments / clean-up of the condition-variable sleep)
 * -- confirm against the upstream file.
 191 */
192void
194{
196 pid_t walrcvpid = 0;
197 bool stopped = false;
198
199 /*
 200 * Request walreceiver to stop. Walreceiver will switch to WALRCV_STOPPED
 201 * mode once it's finished, and will also request postmaster to not
 202 * restart itself.
 203 */
204 SpinLockAcquire(&walrcv->mutex);
205 switch (walrcv->walRcvState)
206 {
207 case WALRCV_STOPPED:
208 break;
209 case WALRCV_STARTING:
210 walrcv->walRcvState = WALRCV_STOPPED; /* walrcvpid stays 0, so no signal is sent below */
211 stopped = true;
212 break;
213
215 case WALRCV_STREAMING:
216 case WALRCV_WAITING:
218 walrcv->walRcvState = WALRCV_STOPPING;
219 /* fall through */
220 case WALRCV_STOPPING:
221 walrcvpid = walrcv->pid; /* remember whom to signal once the lock is released */
222 break;
223 }
224 SpinLockRelease(&walrcv->mutex);
225
226 /* Unnecessary but consistent. */
227 if (stopped)
228 ConditionVariableBroadcast(&walrcv->walRcvStoppedCV);
229
230 /*
 231 * Signal walreceiver process if it was still running.
 232 */
233 if (walrcvpid != 0)
235
236 /*
 237 * Wait for walreceiver to acknowledge its death by setting state to
 238 * WALRCV_STOPPED.
 239 */
240 ConditionVariablePrepareToSleep(&walrcv->walRcvStoppedCV);
241 while (WalRcvRunning())
242 ConditionVariableSleep(&walrcv->walRcvStoppedCV,
245}
246
247/*
 248 * Request postmaster to start walreceiver.
 249 *
 250 * "recptr" indicates the position where streaming should begin. "conninfo"
 251 * is a libpq connection string to use. "slotname" is, optionally, the name
 252 * of a replication slot to acquire. "create_temp_slot" indicates to create
 253 * a temporary slot when no "slotname" is given.
 254 *
 255 * WAL receivers do not directly load GUC parameters used for the connection
 256 * to the primary, and rely on the values passed down by the caller of this
 257 * routine instead. Hence, the addition of any new parameters should happen
 258 * through this code path.
 *
 * All request fields are written into the shared WalRcvData while holding
 * walrcv->mutex. A stopped walreceiver is moved to WALRCV_STARTING and
 * "launch" is set; otherwise (WALRCV_WAITING, per the assertion) the state
 * becomes WALRCV_RESTARTING.
 *
 * NOTE(review): listing lines 261, 264, 267, 275-276 and 333-335 are missing
 * from this copy (apparently the function name with its first parameters,
 * the declarations of "walrcv" and "walrcv_proc", the code that rounds
 * "recptr" down to a segment boundary, and the statements executed after
 * "if (launch)") -- confirm against the upstream file.
 259 */
260void
262 const char *slotname, bool create_temp_slot)
263{
265 bool launch = false;
266 pg_time_t now = (pg_time_t) time(NULL);
268
269 /*
 270 * We always start at the beginning of the segment. That prevents a broken
 271 * segment (i.e., with no records in the first half of a segment) from
 272 * being created by XLOG streaming, which might cause trouble later on if
 273 * the segment is e.g. archived.
 274 */
277
278 SpinLockAcquire(&walrcv->mutex);
279
280 /* It better be stopped if we try to restart it */
281 Assert(walrcv->walRcvState == WALRCV_STOPPED ||
282 walrcv->walRcvState == WALRCV_WAITING);
283
284 if (conninfo != NULL)
285 strlcpy(walrcv->conninfo, conninfo, MAXCONNINFO);
286 else
287 walrcv->conninfo[0] = '\0'; /* NULL conninfo is stored as an empty string */
288
289 /*
 290 * Use configured replication slot if present, and ignore the value of
 291 * create_temp_slot as the slot name should be persistent. Otherwise, use
 292 * create_temp_slot to determine whether this WAL receiver should create a
 293 * temporary slot by itself and use it, or not.
 294 */
295 if (slotname != NULL && slotname[0] != '\0')
296 {
297 strlcpy(walrcv->slotname, slotname, NAMEDATALEN);
298 walrcv->is_temp_slot = false;
299 }
300 else
301 {
302 walrcv->slotname[0] = '\0';
303 walrcv->is_temp_slot = create_temp_slot;
304 }
305
306 if (walrcv->walRcvState == WALRCV_STOPPED)
307 {
308 launch = true;
309 walrcv->walRcvState = WALRCV_STARTING;
310 }
311 else
312 walrcv->walRcvState = WALRCV_RESTARTING;
313 walrcv->startTime = now; /* the startup-timeout checks compare against this value */
314
315 /*
 316 * If this is the first startup of walreceiver (on this timeline),
 317 * initialize flushedUpto and latestChunkStart to the starting point.
 318 */
319 if (!XLogRecPtrIsValid(walrcv->receiveStart) || walrcv->receivedTLI != tli)
320 {
321 walrcv->flushedUpto = recptr;
322 walrcv->receivedTLI = tli;
323 walrcv->latestChunkStart = recptr;
324 }
325 walrcv->receiveStart = recptr;
326 walrcv->receiveStartTLI = tli;
327
328 walrcv_proc = walrcv->procno; /* copied out while the lock is still held */
329
330 SpinLockRelease(&walrcv->mutex);
331
332 if (launch)
336}
337
338/*
 339 * Returns the last+1 byte position that walreceiver has flushed.
 340 *
 341 * Optionally, returns the previous chunk start, that is the first byte
 342 * written in the most recent walreceiver flush cycle. Callers not
 343 * interested in that value may pass NULL for latestChunkStart. Same for
 344 * receiveTLI.
 *
 * All three values are read in a single critical section under
 * walrcv->mutex.
 *
 * NOTE(review): listing lines 346-347 and 349-350 are missing from this copy
 * (apparently the return type, the function name with its parameters, and
 * the declarations of "walrcv" and "recptr") -- confirm against the
 * upstream file.
 345 */
348{
351
352 SpinLockAcquire(&walrcv->mutex);
353 recptr = walrcv->flushedUpto;
354 if (latestChunkStart)
355 *latestChunkStart = walrcv->latestChunkStart;
356 if (receiveTLI)
357 *receiveTLI = walrcv->receivedTLI;
358 SpinLockRelease(&walrcv->mutex);
359
360 return recptr;
361}
362
363/*
 364 * Returns the last+1 byte position that walreceiver has written.
 365 * This returns a recently written value without taking a lock.
 *
 * The value is fetched with pg_atomic_read_u64() from walrcv->writtenUpto,
 * so walrcv->mutex is not acquired here.
 *
 * NOTE(review): listing lines 367-368 and 370 are missing from this copy
 * (apparently the return type, the function name and the declaration of
 * "walrcv") -- confirm against the upstream file.
 366 */
369{
371
372 return pg_atomic_read_u64(&walrcv->writtenUpto);
373}
374
375/*
376 * Returns the replication apply delay in ms or -1
377 * if the apply delay info is not available
378 */
379int
404
405/*
 * Returns the network latency in ms. Note that this includes any
 * difference in clock settings between the servers, as well as timezone.
 *
 * The latency is computed as the difference between walrcv->lastMsgSendTime
 * and walrcv->lastMsgReceiptTime, both read under walrcv->mutex. The
 * difference itself is computed after the lock is released.
 *
 * NOTE(review): TimestampDifferenceMilliseconds() is declared as returning
 * long, while this function returns int, so the result is implicitly
 * narrowed. Listing lines 410 and 412 are also missing from this copy
 * (apparently the function name and the declaration of "walrcv") -- confirm
 * against the upstream file.
 408 */
409int
411{
413 TimestampTz lastMsgSendTime;
414 TimestampTz lastMsgReceiptTime;
415
416 SpinLockAcquire(&walrcv->mutex);
417 lastMsgSendTime = walrcv->lastMsgSendTime;
418 lastMsgReceiptTime = walrcv->lastMsgReceiptTime;
419 SpinLockRelease(&walrcv->mutex);
420
421 return TimestampDifferenceMilliseconds(lastMsgSendTime,
422 lastMsgReceiptTime);
423}
static void pg_atomic_init_u64(volatile pg_atomic_uint64 *ptr, uint64 val)
Definition atomics.h:453
static uint64 pg_atomic_read_u64(volatile pg_atomic_uint64 *ptr)
Definition atomics.h:467
long TimestampDifferenceMilliseconds(TimestampTz start_time, TimestampTz stop_time)
Definition timestamp.c:1757
TimestampTz GetCurrentTimestamp(void)
Definition timestamp.c:1645
Datum now(PG_FUNCTION_ARGS)
Definition timestamp.c:1609
#define Assert(condition)
Definition c.h:873
#define MemSet(start, val, len)
Definition c.h:1013
size_t Size
Definition c.h:619
bool ConditionVariableCancelSleep(void)
void ConditionVariableBroadcast(ConditionVariable *cv)
void ConditionVariablePrepareToSleep(ConditionVariable *cv)
void ConditionVariableInit(ConditionVariable *cv)
void ConditionVariableSleep(ConditionVariable *cv, uint32 wait_event_info)
int64 TimestampTz
Definition timestamp.h:39
void SetLatch(Latch *latch)
Definition latch.c:290
#define NAMEDATALEN
int64 pg_time_t
Definition pgtime.h:23
void SendPostmasterSignal(PMSignalReason reason)
Definition pmsignal.c:165
@ PMSIGNAL_START_WALRECEIVER
Definition pmsignal.h:42
size_t strlcpy(char *dst, const char *src, size_t siz)
Definition strlcpy.c:45
static int fb(int x)
#define GetPGProcByNumber(n)
Definition proc.h:446
#define INVALID_PROC_NUMBER
Definition procnumber.h:26
int ProcNumber
Definition procnumber.h:24
Size add_size(Size s1, Size s2)
Definition shmem.c:495
void * ShmemInitStruct(const char *name, Size size, bool *foundPtr)
Definition shmem.c:389
#define SpinLockInit(lock)
Definition spin.h:57
#define SpinLockRelease(lock)
Definition spin.h:61
#define SpinLockAcquire(lock)
Definition spin.h:59
ProcNumber procno
Definition walreceiver.h:68
ConditionVariable walRcvStoppedCV
Definition walreceiver.h:73
pg_atomic_uint64 writtenUpto
WalRcvState walRcvState
Definition walreceiver.h:72
slock_t mutex
#define MAXCONNINFO
Definition walreceiver.h:37
WalRcvState
Definition walreceiver.h:46
@ WALRCV_STARTING
Definition walreceiver.h:48
@ WALRCV_STOPPED
Definition walreceiver.h:47
@ WALRCV_CONNECTING
Definition walreceiver.h:50
@ WALRCV_RESTARTING
Definition walreceiver.h:53
@ WALRCV_STREAMING
Definition walreceiver.h:51
@ WALRCV_WAITING
Definition walreceiver.h:52
@ WALRCV_STOPPING
Definition walreceiver.h:54
XLogRecPtr GetWalRcvFlushRecPtr(XLogRecPtr *latestChunkStart, TimeLineID *receiveTLI)
bool WalRcvStreaming(void)
void RequestXLogStreaming(TimeLineID tli, XLogRecPtr recptr, const char *conninfo, const char *slotname, bool create_temp_slot)
WalRcvData * WalRcv
XLogRecPtr GetWalRcvWriteRecPtr(void)
void ShutdownWalRcv(void)
#define WALRCV_STARTUP_TIMEOUT
WalRcvState WalRcvGetState(void)
bool WalRcvRunning(void)
int GetReplicationApplyDelay(void)
void WalRcvShmemInit(void)
Size WalRcvShmemSize(void)
int GetReplicationTransferLatency(void)
#define kill(pid, sig)
Definition win32_port.h:490
int wal_segment_size
Definition xlog.c:146
#define XLogSegmentOffset(xlogptr, wal_segsz_bytes)
#define XLogRecPtrIsValid(r)
Definition xlogdefs.h:29
uint64 XLogRecPtr
Definition xlogdefs.h:21
uint32 TimeLineID
Definition xlogdefs.h:63
static TimeLineID receiveTLI
TimestampTz GetCurrentChunkReplayStartTime(void)
XLogRecPtr GetXLogReplayRecPtr(TimeLineID *replayTLI)