PostgreSQL Source Code git master
Loading...
Searching...
No Matches
slotsync.h File Reference
#include <signal.h>
#include "replication/walreceiver.h"
Include dependency graph for slotsync.h:
This graph shows which files directly or indirectly include this file:

Go to the source code of this file.

Functions

charCheckAndGetDbnameFromConninfo (void)
 
bool ValidateSlotSyncParams (int elevel)
 
pg_noreturn void ReplSlotSyncWorkerMain (const void *startup_data, size_t startup_data_len)
 
void ShutDownSlotSync (void)
 
bool SlotSyncWorkerCanRestart (void)
 
bool IsSyncingReplicationSlots (void)
 
void SyncReplicationSlots (WalReceiverConn *wrconn)
 
void HandleSlotSyncMessageInterrupt (void)
 
void ProcessSlotSyncMessage (void)
 

Variables

PGDLLIMPORT bool sync_replication_slots
 
PGDLLIMPORT volatile sig_atomic_t SlotSyncShutdownPending
 
PGDLLIMPORT charPrimaryConnInfo
 
PGDLLIMPORT charPrimarySlotName
 

Function Documentation

◆ CheckAndGetDbnameFromConninfo()

char * CheckAndGetDbnameFromConninfo ( void  )
extern

Definition at line 1151 of file slotsync.c.

1152{
1153 char *dbname;
1154
1155 /*
1156 * The slot synchronization needs a database connection for walrcv_exec to
1157 * work.
1158 */
1160 if (dbname == NULL)
1161 ereport(ERROR,
1163
1164 /*
1165 * translator: first %s is a connection option; second %s is a GUC
1166 * variable name
1167 */
1168 errmsg("replication slot synchronization requires \"%s\" to be specified in \"%s\"",
1169 "dbname", "primary_conninfo"));
1170 return dbname;
1171}
int errcode(int sqlerrcode)
Definition elog.c:875
#define ERROR
Definition elog.h:40
#define ereport(elevel,...)
Definition elog.h:152
static char * errmsg
static int fb(int x)
char * dbname
Definition streamutil.c:49
#define walrcv_get_dbname_from_conninfo(conninfo)
char * PrimaryConnInfo

References dbname, ereport, errcode(), errmsg, ERROR, fb(), PrimaryConnInfo, and walrcv_get_dbname_from_conninfo.

Referenced by pg_sync_replication_slots(), and ReplSlotSyncWorkerMain().

◆ HandleSlotSyncMessageInterrupt()

void HandleSlotSyncMessageInterrupt ( void  )
extern

Definition at line 1331 of file slotsync.c.

1332{
1333 InterruptPending = true;
1335 /* latch will be set by procsignal_sigusr1_handler */
1336}
volatile sig_atomic_t InterruptPending
Definition globals.c:32
volatile sig_atomic_t SlotSyncShutdownPending
Definition slotsync.c:159

References InterruptPending, and SlotSyncShutdownPending.

Referenced by procsignal_sigusr1_handler().

◆ IsSyncingReplicationSlots()

bool IsSyncingReplicationSlots ( void  )
extern

Definition at line 1909 of file slotsync.c.

1910{
1911 return syncing_slots;
1912}
static bool syncing_slots
Definition slotsync.c:152

References syncing_slots.

Referenced by CreateDecodingContext(), GetStandbyFlushRecPtr(), ProcessSlotSyncMessage(), and ReplicationSlotCreate().

◆ ProcessSlotSyncMessage()

void ProcessSlotSyncMessage ( void  )
extern

Definition at line 1347 of file slotsync.c.

1348{
1350
1352 {
1353 ereport(LOG,
1354 errmsg("replication slot synchronization worker will stop because promotion is triggered"));
1355 proc_exit(0);
1356 }
1357 else
1358 {
1359 /*
1360 * If sync has already completed, there is no need to interrupt the
1361 * caller with an error.
1362 */
1364 return;
1365
1366 ereport(ERROR,
1368 errmsg("replication slot synchronization will stop because promotion is triggered"));
1369 }
1370}
#define LOG
Definition elog.h:32
void proc_exit(int code)
Definition ipc.c:105
#define AmLogicalSlotSyncWorkerProcess()
Definition miscadmin.h:401
bool IsSyncingReplicationSlots(void)
Definition slotsync.c:1909

References AmLogicalSlotSyncWorkerProcess, ereport, errcode(), errmsg, ERROR, fb(), IsSyncingReplicationSlots(), LOG, proc_exit(), and SlotSyncShutdownPending.

Referenced by ProcessInterrupts().

◆ ReplSlotSyncWorkerMain()

pg_noreturn void ReplSlotSyncWorkerMain ( const void startup_data,
size_t  startup_data_len 
)
extern

Definition at line 1552 of file slotsync.c.

1553{
1555 char *dbname;
1556 char *err;
1559
1561
1562 /* Release postmaster's working memory context */
1564 {
1567 }
1568
1570
1572
1573 /*
1574 * Create a per-backend PGPROC struct in shared memory. We must do this
1575 * before we access any shared memory.
1576 */
1577 InitProcess();
1578
1579 /*
1580 * Early initialization.
1581 */
1582 BaseInit();
1583
1585
1586 /*
1587 * If an exception is encountered, processing resumes here.
1588 *
1589 * We just need to clean up, report the error, and go away.
1590 *
1591 * If we do not have this handling here, then since this worker process
1592 * operates at the bottom of the exception stack, ERRORs turn into FATALs.
1593 * Therefore, we create our own exception handler to catch ERRORs.
1594 */
1595 if (sigsetjmp(local_sigjmp_buf, 1) != 0)
1596 {
1597 /* since not using PG_TRY, must reset error stack by hand */
1599
1600 /* Prevents interrupts while cleaning up */
1602
1603 /* Report the error to the server log */
1605
1606 /*
1607 * We can now go away. Note that because we called InitProcess, a
1608 * callback was registered to do ProcKill, which will clean up
1609 * necessary state.
1610 */
1611 proc_exit(0);
1612 }
1613
1614 /* We can now handle ereport(ERROR) */
1616
1617 /* Setup signal handling */
1626
1628
1629 ereport(LOG, errmsg("slot sync worker started"));
1630
1631 /* Register it as soon as SlotSyncCtx->pid is initialized. */
1633
1634 /*
1635 * Establishes SIGALRM handler and initialize timeout module. It is needed
1636 * by InitPostgres to register different timeouts.
1637 */
1639
1640 /* Load the libpq-specific functions */
1641 load_file("libpqwalreceiver", false);
1642
1643 /*
1644 * Unblock signals (they were blocked when the postmaster forked us)
1645 */
1647
1648 /*
1649 * Set always-secure search path, so malicious users can't redirect user
1650 * code (e.g. operators).
1651 *
1652 * It's not strictly necessary since we won't be scanning or writing to
1653 * any user table locally, but it's good to retain it here for added
1654 * precaution.
1655 */
1656 SetConfigOption("search_path", "", PGC_SUSET, PGC_S_OVERRIDE);
1657
1659
1660 /*
1661 * Connect to the database specified by the user in primary_conninfo. We
1662 * need a database connection for walrcv_exec to work which we use to
1663 * fetch slot information from the remote node. See comments atop
1664 * libpqrcv_exec.
1665 *
1666 * We do not specify a specific user here since the slot sync worker will
1667 * operate as a superuser. This is safe because the slot sync worker does
1668 * not interact with user tables, eliminating the risk of executing
1669 * arbitrary code within triggers.
1670 */
1672
1674
1676 if (cluster_name[0])
1677 appendStringInfo(&app_name, "%s_%s", cluster_name, "slotsync worker");
1678 else
1679 appendStringInfoString(&app_name, "slotsync worker");
1680
1681 /*
1682 * Establish the connection to the primary server for slot
1683 * synchronization.
1684 */
1685 wrconn = walrcv_connect(PrimaryConnInfo, false, false, false,
1686 app_name.data, &err);
1687
1688 if (!wrconn)
1689 ereport(ERROR,
1691 errmsg("synchronization worker \"%s\" could not connect to the primary server: %s",
1692 app_name.data, err));
1693
1694 pfree(app_name.data);
1695
1696 /*
1697 * Register the disconnection callback.
1698 *
1699 * XXX: This can be combined with previous cleanup registration of
1700 * slotsync_worker_onexit() but that will need the connection to be made
1701 * global and we want to avoid introducing global for this purpose.
1702 */
1704
1705 /*
1706 * Using the specified primary server connection, check that we are not a
1707 * cascading standby and slot configured in 'primary_slot_name' exists on
1708 * the primary server.
1709 */
1711
1712 /* Main loop to synchronize slots */
1713 for (;;)
1714 {
1715 bool some_slot_updated = false;
1716 bool started_tx = false;
1718
1720
1723
1724 /*
1725 * The syscache access in fetch_remote_slots() needs a transaction
1726 * env.
1727 */
1728 if (!IsTransactionState())
1729 {
1731 started_tx = true;
1732 }
1733
1737
1738 if (started_tx)
1740
1742 }
1743
1744 /*
1745 * The slot sync worker can't get here because it will only stop when it
1746 * receives a stop request from the startup process, or when there is an
1747 * error.
1748 */
1749 Assert(false);
1750}
sigset_t UnBlockSig
Definition pqsignal.c:22
#define Assert(condition)
Definition c.h:943
void load_file(const char *filename, bool restricted)
Definition dfmgr.c:149
void EmitErrorReport(void)
Definition elog.c:1883
ErrorContextCallback * error_context_stack
Definition elog.c:100
sigjmp_buf * PG_exception_stack
Definition elog.c:102
void err(int eval, const char *fmt,...)
Definition err.c:43
int MyProcPid
Definition globals.c:49
void SetConfigOption(const char *name, const char *value, GucContext context, GucSource source)
Definition guc.c:4234
@ PGC_S_OVERRIDE
Definition guc.h:123
@ PGC_SUSET
Definition guc.h:78
char * cluster_name
Definition guc_tables.c:582
volatile sig_atomic_t ConfigReloadPending
Definition interrupt.c:27
void SignalHandlerForConfigReload(SIGNAL_ARGS)
Definition interrupt.c:61
void before_shmem_exit(pg_on_exit_callback function, Datum arg)
Definition ipc.c:344
void list_free_deep(List *list)
Definition list.c:1560
void pfree(void *pointer)
Definition mcxt.c:1616
MemoryContext PostmasterContext
Definition mcxt.c:168
void MemoryContextDelete(MemoryContext context)
Definition mcxt.c:472
@ NormalProcessing
Definition miscadmin.h:490
@ InitProcessing
Definition miscadmin.h:489
#define GetProcessingMode()
Definition miscadmin.h:499
#define CHECK_FOR_INTERRUPTS()
Definition miscadmin.h:125
#define HOLD_INTERRUPTS()
Definition miscadmin.h:136
#define SetProcessingMode(mode)
Definition miscadmin.h:501
#define NIL
Definition pg_list.h:68
#define die(msg)
#define pqsignal
Definition port.h:547
#define PG_SIG_IGN
Definition port.h:551
#define PG_SIG_DFL
Definition port.h:550
void FloatExceptionHandler(SIGNAL_ARGS)
Definition postgres.c:3081
void StatementCancelHandler(SIGNAL_ARGS)
Definition postgres.c:3064
uint64_t Datum
Definition postgres.h:70
#define PointerGetDatum(X)
Definition postgres.h:354
#define InvalidOid
void BaseInit(void)
Definition postinit.c:616
void InitPostgres(const char *in_dbname, Oid dboid, const char *username, Oid useroid, uint32 flags, char *out_dbname)
Definition postinit.c:719
void procsignal_sigusr1_handler(SIGNAL_ARGS)
Definition procsignal.c:688
void init_ps_display(const char *fixed_part)
Definition ps_status.c:286
static void slotsync_worker_disconnect(int code, Datum arg)
Definition slotsync.c:1378
static SlotSyncCtxStruct * SlotSyncCtx
Definition slotsync.c:121
char * CheckAndGetDbnameFromConninfo(void)
Definition slotsync.c:1151
static void wait_for_slot_activity(bool some_slot_updated)
Definition slotsync.c:1437
static void slotsync_reread_config(void)
Definition slotsync.c:1247
static void slotsync_worker_onexit(int code, Datum arg)
Definition slotsync.c:1391
static void validate_remote_info(WalReceiverConn *wrconn)
Definition slotsync.c:1073
static void check_and_set_sync_info(pid_t sync_process_pid)
Definition slotsync.c:1472
static List * fetch_remote_slots(WalReceiverConn *wrconn, List *slot_names)
Definition slotsync.c:895
static bool synchronize_slots(WalReceiverConn *wrconn, List *remote_slot_list, bool *slot_persistence_pending)
Definition slotsync.c:1037
void InitProcess(void)
Definition proc.c:392
void appendStringInfo(StringInfo str, const char *fmt,...)
Definition stringinfo.c:145
void appendStringInfoString(StringInfo str, const char *s)
Definition stringinfo.c:230
void initStringInfo(StringInfo str)
Definition stringinfo.c:97
Definition pg_list.h:54
void InitializeTimeouts(void)
Definition timeout.c:470
static WalReceiverConn * wrconn
Definition walreceiver.c:95
#define walrcv_connect(conninfo, replication, logical, must_use_password, appname, err)
#define SIGCHLD
Definition win32_port.h:168
#define SIGHUP
Definition win32_port.h:158
#define SIGPIPE
Definition win32_port.h:163
#define SIGUSR1
Definition win32_port.h:170
#define SIGUSR2
Definition win32_port.h:171
bool IsTransactionState(void)
Definition xact.c:389
void StartTransactionCommand(void)
Definition xact.c:3109
void CommitTransactionCommand(void)
Definition xact.c:3207

References appendStringInfo(), appendStringInfoString(), Assert, BaseInit(), before_shmem_exit(), check_and_set_sync_info(), CHECK_FOR_INTERRUPTS, CheckAndGetDbnameFromConninfo(), cluster_name, CommitTransactionCommand(), ConfigReloadPending, dbname, die, EmitErrorReport(), ereport, err(), errcode(), errmsg, ERROR, error_context_stack, fb(), fetch_remote_slots(), FloatExceptionHandler(), GetProcessingMode, HOLD_INTERRUPTS, init_ps_display(), InitializeTimeouts(), InitPostgres(), InitProcess(), InitProcessing, initStringInfo(), InvalidOid, IsTransactionState(), list_free_deep(), load_file(), LOG, MemoryContextDelete(), MyProcPid, NIL, NormalProcessing, pfree(), PG_exception_stack, PG_SIG_DFL, PG_SIG_IGN, PGC_S_OVERRIDE, PGC_SUSET, PointerGetDatum, PostmasterContext, pqsignal, PrimaryConnInfo, proc_exit(), procsignal_sigusr1_handler(), SetConfigOption(), SetProcessingMode, SIGCHLD, SIGHUP, SignalHandlerForConfigReload(), SIGPIPE, SIGUSR1, SIGUSR2, slotsync_reread_config(), slotsync_worker_disconnect(), slotsync_worker_onexit(), SlotSyncCtx, StartTransactionCommand(), StatementCancelHandler(), synchronize_slots(), UnBlockSig, validate_remote_info(), wait_for_slot_activity(), walrcv_connect, and wrconn.

◆ ShutDownSlotSync()

void ShutDownSlotSync ( void  )
extern

Definition at line 1811 of file slotsync.c.

1812{
1814
1816
1817 SlotSyncCtx->stopSignaled = true;
1818
1819 /*
1820 * Return if neither the slot sync worker is running nor the function
1821 * pg_sync_replication_slots() is executing.
1822 */
1823 if (!SlotSyncCtx->syncing)
1824 {
1827 return;
1828 }
1829
1831
1833
1834 /*
1835 * Signal process doing slotsync, if any, asking it to stop.
1836 */
1840
1841 /* Wait for slot sync to end */
1842 for (;;)
1843 {
1844 int rc;
1845
1846 /* Wait a bit, we don't expect to have to wait long */
1847 rc = WaitLatch(MyLatch,
1850
1851 if (rc & WL_LATCH_SET)
1852 {
1855 }
1856
1858
1859 /* Ensure that no process is syncing the slots. */
1860 if (!SlotSyncCtx->syncing)
1861 break;
1862
1864 }
1865
1867
1869}
struct Latch * MyLatch
Definition globals.c:65
void ResetLatch(Latch *latch)
Definition latch.c:374
int WaitLatch(Latch *latch, int wakeEvents, long timeout, uint32 wait_event_info)
Definition latch.c:172
#define InvalidPid
Definition miscadmin.h:32
#define INVALID_PROC_NUMBER
Definition procnumber.h:26
int SendProcSignal(pid_t pid, ProcSignalReason reason, ProcNumber procNumber)
Definition procsignal.c:288
@ PROCSIG_SLOTSYNC_MESSAGE
Definition procsignal.h:39
static void update_synced_slots_inactive_since(void)
Definition slotsync.c:1759
static void SpinLockRelease(volatile slock_t *lock)
Definition spin.h:62
static void SpinLockAcquire(volatile slock_t *lock)
Definition spin.h:56
#define WL_TIMEOUT
#define WL_EXIT_ON_PM_DEATH
#define WL_LATCH_SET

References CHECK_FOR_INTERRUPTS, fb(), INVALID_PROC_NUMBER, InvalidPid, SlotSyncCtxStruct::mutex, MyLatch, SlotSyncCtxStruct::pid, PROCSIG_SLOTSYNC_MESSAGE, ResetLatch(), SendProcSignal(), SlotSyncCtx, SpinLockAcquire(), SpinLockRelease(), SlotSyncCtxStruct::stopSignaled, SlotSyncCtxStruct::syncing, update_synced_slots_inactive_since(), WaitLatch(), WL_EXIT_ON_PM_DEATH, WL_LATCH_SET, and WL_TIMEOUT.

Referenced by FinishWalRecovery().

◆ SlotSyncWorkerCanRestart()

bool SlotSyncWorkerCanRestart ( void  )
extern

Definition at line 1884 of file slotsync.c.

1885{
1886 time_t curtime = time(NULL);
1887
1888 /*
1889 * If first time through, or time somehow went backwards, always update
1890 * last_start_time to match the current clock and allow worker start.
1891 * Otherwise allow it only once enough time has elapsed.
1892 */
1893 if (SlotSyncCtx->last_start_time == 0 ||
1894 curtime < SlotSyncCtx->last_start_time ||
1896 {
1898 return true;
1899 }
1900 return false;
1901}
#define SLOTSYNC_RESTART_INTERVAL_SEC
Definition slotsync.c:145
time_t last_start_time
Definition slotsync.c:117

References fb(), SlotSyncCtxStruct::last_start_time, SLOTSYNC_RESTART_INTERVAL_SEC, and SlotSyncCtx.

Referenced by LaunchMissingBackgroundProcesses().

◆ SyncReplicationSlots()

void SyncReplicationSlots ( WalReceiverConn wrconn)
extern

Definition at line 2003 of file slotsync.c.

2004{
2006 {
2008 List *slot_names = NIL; /* List of slot names to track */
2009
2011
2013
2014 /* Retry until all the slots are sync-ready */
2015 for (;;)
2016 {
2017 bool slot_persistence_pending = false;
2018 bool some_slot_updated = false;
2019
2020 /* Check for interrupts and config changes */
2022
2025
2026 /* We must be in a valid transaction state */
2028
2029 /*
2030 * Fetch remote slot info for the given slot_names. If slot_names
2031 * is NIL, fetch all failover-enabled slots. Note that we reuse
2032 * slot_names from the first iteration; re-fetching all failover
2033 * slots each time could cause an endless loop. Instead of
2034 * reprocessing only the pending slots in each iteration, it's
2035 * better to process all the slots received in the first
2036 * iteration. This ensures that by the time we're done, all slots
2037 * reflect the latest values.
2038 */
2039 remote_slots = fetch_remote_slots(wrconn, slot_names);
2040
2041 /* Attempt to synchronize slots */
2044
2045 /*
2046 * If slot_persistence_pending is true, extract slot names for
2047 * future iterations (only needed if we haven't done it yet)
2048 */
2049 if (slot_names == NIL && slot_persistence_pending)
2050 slot_names = extract_slot_names(remote_slots);
2051
2052 /* Free the current remote_slots list */
2054
2055 /* Done if all slots are persisted i.e are sync-ready */
2057 break;
2058
2059 /* wait before retrying again */
2061 }
2062
2063 if (slot_names)
2064 list_free_deep(slot_names);
2065
2066 /* Cleanup the synced temporary slots */
2068
2069 /* We are done with sync, so reset sync flag */
2071 }
2073}
#define PG_ENSURE_ERROR_CLEANUP(cleanup_function, arg)
Definition ipc.h:47
#define PG_END_ENSURE_ERROR_CLEANUP(cleanup_function, arg)
Definition ipc.h:52
void ReplicationSlotCleanup(bool synced_only)
Definition slot.c:868
static void slotsync_failure_callback(int code, Datum arg)
Definition slotsync.c:1941
static List * extract_slot_names(List *remote_slots)
Definition slotsync.c:1977
static void reset_syncing_flag(void)
Definition slotsync.c:1532

References Assert, check_and_set_sync_info(), CHECK_FOR_INTERRUPTS, ConfigReloadPending, extract_slot_names(), fb(), fetch_remote_slots(), IsTransactionState(), list_free_deep(), MyProcPid, NIL, PG_END_ENSURE_ERROR_CLEANUP, PG_ENSURE_ERROR_CLEANUP, PointerGetDatum, ReplicationSlotCleanup(), reset_syncing_flag(), slotsync_failure_callback(), slotsync_reread_config(), synchronize_slots(), validate_remote_info(), wait_for_slot_activity(), and wrconn.

Referenced by pg_sync_replication_slots().

◆ ValidateSlotSyncParams()

bool ValidateSlotSyncParams ( int  elevel)
extern

Definition at line 1178 of file slotsync.c.

1179{
1180 /*
1181 * Logical slot sync/creation requires logical decoding to be enabled.
1182 */
1184 {
1185 ereport(elevel,
1187 errmsg("replication slot synchronization requires \"effective_wal_level\" >= \"logical\" on the primary"),
1188 errhint("To enable logical decoding on primary, set \"wal_level\" >= \"logical\" or create at least one logical slot when \"wal_level\" = \"replica\"."));
1189
1190 return false;
1191 }
1192
1193 /*
1194 * A physical replication slot(primary_slot_name) is required on the
1195 * primary to ensure that the rows needed by the standby are not removed
1196 * after restarting, so that the synchronized slot on the standby will not
1197 * be invalidated.
1198 */
1199 if (PrimarySlotName == NULL || *PrimarySlotName == '\0')
1200 {
1201 ereport(elevel,
1203 /* translator: %s is a GUC variable name */
1204 errmsg("replication slot synchronization requires \"%s\" to be set", "primary_slot_name"));
1205 return false;
1206 }
1207
1208 /*
1209 * hot_standby_feedback must be enabled to cooperate with the physical
1210 * replication slot, which allows informing the primary about the xmin and
1211 * catalog_xmin values on the standby.
1212 */
1214 {
1215 ereport(elevel,
1217 /* translator: %s is a GUC variable name */
1218 errmsg("replication slot synchronization requires \"%s\" to be enabled",
1219 "hot_standby_feedback"));
1220 return false;
1221 }
1222
1223 /*
1224 * The primary_conninfo is required to make connection to primary for
1225 * getting slots information.
1226 */
1227 if (PrimaryConnInfo == NULL || *PrimaryConnInfo == '\0')
1228 {
1229 ereport(elevel,
1231 /* translator: %s is a GUC variable name */
1232 errmsg("replication slot synchronization requires \"%s\" to be set",
1233 "primary_conninfo"));
1234 return false;
1235 }
1236
1237 return true;
1238}
int errhint(const char *fmt,...) pg_attribute_printf(1
bool IsLogicalDecodingEnabled(void)
Definition logicalctl.c:202
bool hot_standby_feedback
Definition walreceiver.c:92
char * PrimarySlotName

References ereport, errcode(), errhint(), errmsg, fb(), hot_standby_feedback, IsLogicalDecodingEnabled(), PrimaryConnInfo, and PrimarySlotName.

Referenced by LaunchMissingBackgroundProcesses(), and pg_sync_replication_slots().

Variable Documentation

◆ PrimaryConnInfo

◆ PrimarySlotName

◆ SlotSyncShutdownPending

PGDLLIMPORT volatile sig_atomic_t SlotSyncShutdownPending
extern

◆ sync_replication_slots

PGDLLIMPORT bool sync_replication_slots
extern