PostgreSQL Source Code git master
Loading...
Searching...
No Matches
slotsync.h File Reference
#include <signal.h>
#include "replication/walreceiver.h"
Include dependency graph for slotsync.h:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Functions

char * CheckAndGetDbnameFromConninfo (void)
 
bool ValidateSlotSyncParams (int elevel)
 
pg_noreturn void ReplSlotSyncWorkerMain (const void *startup_data, size_t startup_data_len)
 
void ShutDownSlotSync (void)
 
bool SlotSyncWorkerCanRestart (void)
 
bool IsSyncingReplicationSlots (void)
 
void SyncReplicationSlots (WalReceiverConn *wrconn)
 
void HandleSlotSyncMessageInterrupt (void)
 
void ProcessSlotSyncMessage (void)
 

Variables

PGDLLIMPORT bool sync_replication_slots
 
PGDLLIMPORT volatile sig_atomic_t SlotSyncShutdownPending
 
PGDLLIMPORT char * PrimaryConnInfo
 
PGDLLIMPORT char * PrimarySlotName
 

Function Documentation

◆ CheckAndGetDbnameFromConninfo()

char * CheckAndGetDbnameFromConninfo ( void  )
extern

Definition at line 1139 of file slotsync.c.

1140{
1141 char *dbname;
1142
1143 /*
1144 * The slot synchronization needs a database connection for walrcv_exec to
1145 * work.
1146 */
1148 if (dbname == NULL)
1149 ereport(ERROR,
1151
1152 /*
1153 * translator: first %s is a connection option; second %s is a GUC
1154 * variable name
1155 */
1156 errmsg("replication slot synchronization requires \"%s\" to be specified in \"%s\"",
1157 "dbname", "primary_conninfo"));
1158 return dbname;
1159}
int errcode(int sqlerrcode)
Definition elog.c:874
#define ERROR
Definition elog.h:40
#define ereport(elevel,...)
Definition elog.h:152
static char * errmsg
static int fb(int x)
char * dbname
Definition streamutil.c:49
#define walrcv_get_dbname_from_conninfo(conninfo)
char * PrimaryConnInfo

References dbname, ereport, errcode(), errmsg, ERROR, fb(), PrimaryConnInfo, and walrcv_get_dbname_from_conninfo.

Referenced by pg_sync_replication_slots(), and ReplSlotSyncWorkerMain().

◆ HandleSlotSyncMessageInterrupt()

void HandleSlotSyncMessageInterrupt ( void  )
extern

Definition at line 1319 of file slotsync.c.

1320{
1321 InterruptPending = true;
1323 /* latch will be set by procsignal_sigusr1_handler */
1324}
volatile sig_atomic_t InterruptPending
Definition globals.c:32
volatile sig_atomic_t SlotSyncShutdownPending
Definition slotsync.c:159

References InterruptPending, and SlotSyncShutdownPending.

Referenced by procsignal_sigusr1_handler().

◆ IsSyncingReplicationSlots()

bool IsSyncingReplicationSlots ( void  )
extern

Definition at line 1897 of file slotsync.c.

1898{
1899 return syncing_slots;
1900}
static bool syncing_slots
Definition slotsync.c:152

References syncing_slots.

Referenced by CreateDecodingContext(), GetStandbyFlushRecPtr(), ProcessSlotSyncMessage(), and ReplicationSlotCreate().

◆ ProcessSlotSyncMessage()

void ProcessSlotSyncMessage ( void  )
extern

Definition at line 1335 of file slotsync.c.

1336{
1338
1340 {
1341 ereport(LOG,
1342 errmsg("replication slot synchronization worker will stop because promotion is triggered"));
1343 proc_exit(0);
1344 }
1345 else
1346 {
1347 /*
1348 * If sync has already completed, there is no need to interrupt the
1349 * caller with an error.
1350 */
1352 return;
1353
1354 ereport(ERROR,
1356 errmsg("replication slot synchronization will stop because promotion is triggered"));
1357 }
1358}
#define LOG
Definition elog.h:32
void proc_exit(int code)
Definition ipc.c:105
#define AmLogicalSlotSyncWorkerProcess()
Definition miscadmin.h:401
bool IsSyncingReplicationSlots(void)
Definition slotsync.c:1897

References AmLogicalSlotSyncWorkerProcess, ereport, errcode(), errmsg, ERROR, fb(), IsSyncingReplicationSlots(), LOG, proc_exit(), and SlotSyncShutdownPending.

Referenced by ProcessInterrupts().

◆ ReplSlotSyncWorkerMain()

pg_noreturn void ReplSlotSyncWorkerMain ( const void * startup_data,
size_t  startup_data_len 
)
extern

Definition at line 1540 of file slotsync.c.

1541{
1543 char *dbname;
1544 char *err;
1547
1549
1550 /* Release postmaster's working memory context */
1552 {
1555 }
1556
1558
1560
1561 /*
1562 * Create a per-backend PGPROC struct in shared memory. We must do this
1563 * before we access any shared memory.
1564 */
1565 InitProcess();
1566
1567 /*
1568 * Early initialization.
1569 */
1570 BaseInit();
1571
1573
1574 /*
1575 * If an exception is encountered, processing resumes here.
1576 *
1577 * We just need to clean up, report the error, and go away.
1578 *
1579 * If we do not have this handling here, then since this worker process
1580 * operates at the bottom of the exception stack, ERRORs turn into FATALs.
1581 * Therefore, we create our own exception handler to catch ERRORs.
1582 */
1583 if (sigsetjmp(local_sigjmp_buf, 1) != 0)
1584 {
1585 /* since not using PG_TRY, must reset error stack by hand */
1587
1588 /* Prevents interrupts while cleaning up */
1590
1591 /* Report the error to the server log */
1593
1594 /*
1595 * We can now go away. Note that because we called InitProcess, a
1596 * callback was registered to do ProcKill, which will clean up
1597 * necessary state.
1598 */
1599 proc_exit(0);
1600 }
1601
1602 /* We can now handle ereport(ERROR) */
1604
1605 /* Setup signal handling */
1614
1616
1617 ereport(LOG, errmsg("slot sync worker started"));
1618
1619 /* Register it as soon as SlotSyncCtx->pid is initialized. */
1621
1622 /*
1623 * Establishes SIGALRM handler and initialize timeout module. It is needed
1624 * by InitPostgres to register different timeouts.
1625 */
1627
1628 /* Load the libpq-specific functions */
1629 load_file("libpqwalreceiver", false);
1630
1631 /*
1632 * Unblock signals (they were blocked when the postmaster forked us)
1633 */
1635
1636 /*
1637 * Set always-secure search path, so malicious users can't redirect user
1638 * code (e.g. operators).
1639 *
1640 * It's not strictly necessary since we won't be scanning or writing to
1641 * any user table locally, but it's good to retain it here for added
1642 * precaution.
1643 */
1644 SetConfigOption("search_path", "", PGC_SUSET, PGC_S_OVERRIDE);
1645
1647
1648 /*
1649 * Connect to the database specified by the user in primary_conninfo. We
1650 * need a database connection for walrcv_exec to work which we use to
1651 * fetch slot information from the remote node. See comments atop
1652 * libpqrcv_exec.
1653 *
1654 * We do not specify a specific user here since the slot sync worker will
1655 * operate as a superuser. This is safe because the slot sync worker does
1656 * not interact with user tables, eliminating the risk of executing
1657 * arbitrary code within triggers.
1658 */
1660
1662
1664 if (cluster_name[0])
1665 appendStringInfo(&app_name, "%s_%s", cluster_name, "slotsync worker");
1666 else
1667 appendStringInfoString(&app_name, "slotsync worker");
1668
1669 /*
1670 * Establish the connection to the primary server for slot
1671 * synchronization.
1672 */
1673 wrconn = walrcv_connect(PrimaryConnInfo, false, false, false,
1674 app_name.data, &err);
1675
1676 if (!wrconn)
1677 ereport(ERROR,
1679 errmsg("synchronization worker \"%s\" could not connect to the primary server: %s",
1680 app_name.data, err));
1681
1682 pfree(app_name.data);
1683
1684 /*
1685 * Register the disconnection callback.
1686 *
1687 * XXX: This can be combined with previous cleanup registration of
1688 * slotsync_worker_onexit() but that will need the connection to be made
1689 * global and we want to avoid introducing global for this purpose.
1690 */
1692
1693 /*
1694 * Using the specified primary server connection, check that we are not a
1695 * cascading standby and slot configured in 'primary_slot_name' exists on
1696 * the primary server.
1697 */
1699
1700 /* Main loop to synchronize slots */
1701 for (;;)
1702 {
1703 bool some_slot_updated = false;
1704 bool started_tx = false;
1706
1708
1711
1712 /*
1713 * The syscache access in fetch_remote_slots() needs a transaction
1714 * env.
1715 */
1716 if (!IsTransactionState())
1717 {
1719 started_tx = true;
1720 }
1721
1725
1726 if (started_tx)
1728
1730 }
1731
1732 /*
1733 * The slot sync worker can't get here because it will only stop when it
1734 * receives a stop request from the startup process, or when there is an
1735 * error.
1736 */
1737 Assert(false);
1738}
sigset_t UnBlockSig
Definition pqsignal.c:22
#define Assert(condition)
Definition c.h:943
void load_file(const char *filename, bool restricted)
Definition dfmgr.c:149
void EmitErrorReport(void)
Definition elog.c:1882
ErrorContextCallback * error_context_stack
Definition elog.c:99
sigjmp_buf * PG_exception_stack
Definition elog.c:101
void err(int eval, const char *fmt,...)
Definition err.c:43
int MyProcPid
Definition globals.c:49
void SetConfigOption(const char *name, const char *value, GucContext context, GucSource source)
Definition guc.c:4234
@ PGC_S_OVERRIDE
Definition guc.h:123
@ PGC_SUSET
Definition guc.h:78
char * cluster_name
Definition guc_tables.c:582
volatile sig_atomic_t ConfigReloadPending
Definition interrupt.c:27
void SignalHandlerForConfigReload(SIGNAL_ARGS)
Definition interrupt.c:61
void before_shmem_exit(pg_on_exit_callback function, Datum arg)
Definition ipc.c:344
void list_free_deep(List *list)
Definition list.c:1560
void pfree(void *pointer)
Definition mcxt.c:1616
MemoryContext PostmasterContext
Definition mcxt.c:168
void MemoryContextDelete(MemoryContext context)
Definition mcxt.c:472
@ NormalProcessing
Definition miscadmin.h:490
@ InitProcessing
Definition miscadmin.h:489
#define GetProcessingMode()
Definition miscadmin.h:499
#define CHECK_FOR_INTERRUPTS()
Definition miscadmin.h:125
#define HOLD_INTERRUPTS()
Definition miscadmin.h:136
#define SetProcessingMode(mode)
Definition miscadmin.h:501
#define NIL
Definition pg_list.h:68
#define die(msg)
#define pqsignal
Definition port.h:547
void FloatExceptionHandler(SIGNAL_ARGS)
Definition postgres.c:3070
void StatementCancelHandler(SIGNAL_ARGS)
Definition postgres.c:3053
static Datum PointerGetDatum(const void *X)
Definition postgres.h:342
uint64_t Datum
Definition postgres.h:70
#define InvalidOid
void BaseInit(void)
Definition postinit.c:616
void InitPostgres(const char *in_dbname, Oid dboid, const char *username, Oid useroid, uint32 flags, char *out_dbname)
Definition postinit.c:719
void procsignal_sigusr1_handler(SIGNAL_ARGS)
Definition procsignal.c:688
void init_ps_display(const char *fixed_part)
Definition ps_status.c:286
static void slotsync_worker_disconnect(int code, Datum arg)
Definition slotsync.c:1366
static SlotSyncCtxStruct * SlotSyncCtx
Definition slotsync.c:121
char * CheckAndGetDbnameFromConninfo(void)
Definition slotsync.c:1139
static void wait_for_slot_activity(bool some_slot_updated)
Definition slotsync.c:1425
static void slotsync_reread_config(void)
Definition slotsync.c:1235
static void slotsync_worker_onexit(int code, Datum arg)
Definition slotsync.c:1379
static void validate_remote_info(WalReceiverConn *wrconn)
Definition slotsync.c:1061
static void check_and_set_sync_info(pid_t sync_process_pid)
Definition slotsync.c:1460
static List * fetch_remote_slots(WalReceiverConn *wrconn, List *slot_names)
Definition slotsync.c:883
static bool synchronize_slots(WalReceiverConn *wrconn, List *remote_slot_list, bool *slot_persistence_pending)
Definition slotsync.c:1025
void InitProcess(void)
Definition proc.c:392
void appendStringInfo(StringInfo str, const char *fmt,...)
Definition stringinfo.c:145
void appendStringInfoString(StringInfo str, const char *s)
Definition stringinfo.c:230
void initStringInfo(StringInfo str)
Definition stringinfo.c:97
Definition pg_list.h:54
void InitializeTimeouts(void)
Definition timeout.c:470
static WalReceiverConn * wrconn
Definition walreceiver.c:95
#define walrcv_connect(conninfo, replication, logical, must_use_password, appname, err)
#define SIGCHLD
Definition win32_port.h:168
#define SIGHUP
Definition win32_port.h:158
#define SIGPIPE
Definition win32_port.h:163
#define SIGUSR1
Definition win32_port.h:170
#define SIGUSR2
Definition win32_port.h:171
bool IsTransactionState(void)
Definition xact.c:389
void StartTransactionCommand(void)
Definition xact.c:3109
void CommitTransactionCommand(void)
Definition xact.c:3207

References appendStringInfo(), appendStringInfoString(), Assert, BaseInit(), before_shmem_exit(), check_and_set_sync_info(), CHECK_FOR_INTERRUPTS, CheckAndGetDbnameFromConninfo(), cluster_name, CommitTransactionCommand(), ConfigReloadPending, dbname, die, EmitErrorReport(), ereport, err(), errcode(), errmsg, ERROR, error_context_stack, fb(), fetch_remote_slots(), FloatExceptionHandler(), GetProcessingMode, HOLD_INTERRUPTS, init_ps_display(), InitializeTimeouts(), InitPostgres(), InitProcess(), InitProcessing, initStringInfo(), InvalidOid, IsTransactionState(), list_free_deep(), load_file(), LOG, MemoryContextDelete(), MyProcPid, NIL, NormalProcessing, pfree(), PG_exception_stack, PGC_S_OVERRIDE, PGC_SUSET, PointerGetDatum(), PostmasterContext, pqsignal, PrimaryConnInfo, proc_exit(), procsignal_sigusr1_handler(), SetConfigOption(), SetProcessingMode, SIGCHLD, SIGHUP, SignalHandlerForConfigReload(), SIGPIPE, SIGUSR1, SIGUSR2, slotsync_reread_config(), slotsync_worker_disconnect(), slotsync_worker_onexit(), SlotSyncCtx, StartTransactionCommand(), StatementCancelHandler(), synchronize_slots(), UnBlockSig, validate_remote_info(), wait_for_slot_activity(), walrcv_connect, and wrconn.

◆ ShutDownSlotSync()

void ShutDownSlotSync ( void  )
extern

Definition at line 1799 of file slotsync.c.

1800{
1802
1804
1805 SlotSyncCtx->stopSignaled = true;
1806
1807 /*
1808 * Return if neither the slot sync worker is running nor the function
1809 * pg_sync_replication_slots() is executing.
1810 */
1811 if (!SlotSyncCtx->syncing)
1812 {
1815 return;
1816 }
1817
1819
1821
1822 /*
1823 * Signal process doing slotsync, if any, asking it to stop.
1824 */
1828
1829 /* Wait for slot sync to end */
1830 for (;;)
1831 {
1832 int rc;
1833
1834 /* Wait a bit, we don't expect to have to wait long */
1835 rc = WaitLatch(MyLatch,
1838
1839 if (rc & WL_LATCH_SET)
1840 {
1843 }
1844
1846
1847 /* Ensure that no process is syncing the slots. */
1848 if (!SlotSyncCtx->syncing)
1849 break;
1850
1852 }
1853
1855
1857}
struct Latch * MyLatch
Definition globals.c:65
void ResetLatch(Latch *latch)
Definition latch.c:374
int WaitLatch(Latch *latch, int wakeEvents, long timeout, uint32 wait_event_info)
Definition latch.c:172
#define InvalidPid
Definition miscadmin.h:32
#define INVALID_PROC_NUMBER
Definition procnumber.h:26
int SendProcSignal(pid_t pid, ProcSignalReason reason, ProcNumber procNumber)
Definition procsignal.c:288
@ PROCSIG_SLOTSYNC_MESSAGE
Definition procsignal.h:39
static void update_synced_slots_inactive_since(void)
Definition slotsync.c:1747
static void SpinLockRelease(volatile slock_t *lock)
Definition spin.h:62
static void SpinLockAcquire(volatile slock_t *lock)
Definition spin.h:56
#define WL_TIMEOUT
#define WL_EXIT_ON_PM_DEATH
#define WL_LATCH_SET

References CHECK_FOR_INTERRUPTS, fb(), INVALID_PROC_NUMBER, InvalidPid, SlotSyncCtxStruct::mutex, MyLatch, SlotSyncCtxStruct::pid, PROCSIG_SLOTSYNC_MESSAGE, ResetLatch(), SendProcSignal(), SlotSyncCtx, SpinLockAcquire(), SpinLockRelease(), SlotSyncCtxStruct::stopSignaled, SlotSyncCtxStruct::syncing, update_synced_slots_inactive_since(), WaitLatch(), WL_EXIT_ON_PM_DEATH, WL_LATCH_SET, and WL_TIMEOUT.

Referenced by FinishWalRecovery().

◆ SlotSyncWorkerCanRestart()

bool SlotSyncWorkerCanRestart ( void  )
extern

Definition at line 1872 of file slotsync.c.

1873{
1874 time_t curtime = time(NULL);
1875
1876 /*
1877 * If first time through, or time somehow went backwards, always update
1878 * last_start_time to match the current clock and allow worker start.
1879 * Otherwise allow it only once enough time has elapsed.
1880 */
1881 if (SlotSyncCtx->last_start_time == 0 ||
1882 curtime < SlotSyncCtx->last_start_time ||
1884 {
1886 return true;
1887 }
1888 return false;
1889}
#define SLOTSYNC_RESTART_INTERVAL_SEC
Definition slotsync.c:145
time_t last_start_time
Definition slotsync.c:117

References fb(), SlotSyncCtxStruct::last_start_time, SLOTSYNC_RESTART_INTERVAL_SEC, and SlotSyncCtx.

Referenced by LaunchMissingBackgroundProcesses().

◆ SyncReplicationSlots()

void SyncReplicationSlots ( WalReceiverConn * wrconn)
extern

Definition at line 1991 of file slotsync.c.

1992{
1994 {
1996 List *slot_names = NIL; /* List of slot names to track */
1997
1999
2001
2002 /* Retry until all the slots are sync-ready */
2003 for (;;)
2004 {
2005 bool slot_persistence_pending = false;
2006 bool some_slot_updated = false;
2007
2008 /* Check for interrupts and config changes */
2010
2013
2014 /* We must be in a valid transaction state */
2016
2017 /*
2018 * Fetch remote slot info for the given slot_names. If slot_names
2019 * is NIL, fetch all failover-enabled slots. Note that we reuse
2020 * slot_names from the first iteration; re-fetching all failover
2021 * slots each time could cause an endless loop. Instead of
2022 * reprocessing only the pending slots in each iteration, it's
2023 * better to process all the slots received in the first
2024 * iteration. This ensures that by the time we're done, all slots
2025 * reflect the latest values.
2026 */
2027 remote_slots = fetch_remote_slots(wrconn, slot_names);
2028
2029 /* Attempt to synchronize slots */
2032
2033 /*
2034 * If slot_persistence_pending is true, extract slot names for
2035 * future iterations (only needed if we haven't done it yet)
2036 */
2037 if (slot_names == NIL && slot_persistence_pending)
2038 slot_names = extract_slot_names(remote_slots);
2039
2040 /* Free the current remote_slots list */
2042
2043 /* Done if all slots are persisted i.e are sync-ready */
2045 break;
2046
2047 /* wait before retrying again */
2049 }
2050
2051 if (slot_names)
2052 list_free_deep(slot_names);
2053
2054 /* Cleanup the synced temporary slots */
2056
2057 /* We are done with sync, so reset sync flag */
2059 }
2061}
#define PG_ENSURE_ERROR_CLEANUP(cleanup_function, arg)
Definition ipc.h:47
#define PG_END_ENSURE_ERROR_CLEANUP(cleanup_function, arg)
Definition ipc.h:52
void ReplicationSlotCleanup(bool synced_only)
Definition slot.c:868
static void slotsync_failure_callback(int code, Datum arg)
Definition slotsync.c:1929
static List * extract_slot_names(List *remote_slots)
Definition slotsync.c:1965
static void reset_syncing_flag(void)
Definition slotsync.c:1520

References Assert, check_and_set_sync_info(), CHECK_FOR_INTERRUPTS, ConfigReloadPending, extract_slot_names(), fb(), fetch_remote_slots(), IsTransactionState(), list_free_deep(), MyProcPid, NIL, PG_END_ENSURE_ERROR_CLEANUP, PG_ENSURE_ERROR_CLEANUP, PointerGetDatum(), ReplicationSlotCleanup(), reset_syncing_flag(), slotsync_failure_callback(), slotsync_reread_config(), synchronize_slots(), validate_remote_info(), wait_for_slot_activity(), and wrconn.

Referenced by pg_sync_replication_slots().

◆ ValidateSlotSyncParams()

bool ValidateSlotSyncParams ( int  elevel)
extern

Definition at line 1166 of file slotsync.c.

1167{
1168 /*
1169 * Logical slot sync/creation requires logical decoding to be enabled.
1170 */
1172 {
1173 ereport(elevel,
1175 errmsg("replication slot synchronization requires \"effective_wal_level\" >= \"logical\" on the primary"),
1176 errhint("To enable logical decoding on primary, set \"wal_level\" >= \"logical\" or create at least one logical slot when \"wal_level\" = \"replica\"."));
1177
1178 return false;
1179 }
1180
1181 /*
1182 * A physical replication slot(primary_slot_name) is required on the
1183 * primary to ensure that the rows needed by the standby are not removed
1184 * after restarting, so that the synchronized slot on the standby will not
1185 * be invalidated.
1186 */
1187 if (PrimarySlotName == NULL || *PrimarySlotName == '\0')
1188 {
1189 ereport(elevel,
1191 /* translator: %s is a GUC variable name */
1192 errmsg("replication slot synchronization requires \"%s\" to be set", "primary_slot_name"));
1193 return false;
1194 }
1195
1196 /*
1197 * hot_standby_feedback must be enabled to cooperate with the physical
1198 * replication slot, which allows informing the primary about the xmin and
1199 * catalog_xmin values on the standby.
1200 */
1202 {
1203 ereport(elevel,
1205 /* translator: %s is a GUC variable name */
1206 errmsg("replication slot synchronization requires \"%s\" to be enabled",
1207 "hot_standby_feedback"));
1208 return false;
1209 }
1210
1211 /*
1212 * The primary_conninfo is required to make connection to primary for
1213 * getting slots information.
1214 */
1215 if (PrimaryConnInfo == NULL || *PrimaryConnInfo == '\0')
1216 {
1217 ereport(elevel,
1219 /* translator: %s is a GUC variable name */
1220 errmsg("replication slot synchronization requires \"%s\" to be set",
1221 "primary_conninfo"));
1222 return false;
1223 }
1224
1225 return true;
1226}
int errhint(const char *fmt,...) pg_attribute_printf(1
bool IsLogicalDecodingEnabled(void)
Definition logicalctl.c:202
bool hot_standby_feedback
Definition walreceiver.c:92
char * PrimarySlotName

References ereport, errcode(), errhint(), errmsg, fb(), hot_standby_feedback, IsLogicalDecodingEnabled(), PrimaryConnInfo, and PrimarySlotName.

Referenced by LaunchMissingBackgroundProcesses(), and pg_sync_replication_slots().

Variable Documentation

◆ PrimaryConnInfo

PGDLLIMPORT char * PrimaryConnInfo
extern

◆ PrimarySlotName

PGDLLIMPORT char * PrimarySlotName
extern

◆ SlotSyncShutdownPending

PGDLLIMPORT volatile sig_atomic_t SlotSyncShutdownPending
extern

◆ sync_replication_slots

PGDLLIMPORT bool sync_replication_slots
extern