PostgreSQL Source Code git master
slot.h
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 * slot.h
3 * Replication slot management.
4 *
5 * Copyright (c) 2012-2025, PostgreSQL Global Development Group
6 *
7 *-------------------------------------------------------------------------
8 */
9#ifndef SLOT_H
10#define SLOT_H
11
12#include "access/xlog.h"
13#include "access/xlogreader.h"
15#include "storage/lwlock.h"
16#include "storage/shmem.h"
17#include "storage/spin.h"
19
20/* directory to store replication slot data in */
21#define PG_REPLSLOT_DIR "pg_replslot"
22
23/*
24 * The reserved name for a replication slot used to retain dead tuples for
25 * conflict detection in logical replication. See
26 * maybe_advance_nonremovable_xid() for detail.
27 */
28#define CONFLICT_DETECTION_SLOT "pg_conflict_detection"
29
30/*
31 * Behaviour of replication slots, upon release or crash.
32 *
33 * Slots marked as PERSISTENT are crash-safe and will not be dropped when
34 * released. Slots marked as EPHEMERAL will be dropped when released or after
35 * restarts. Slots marked TEMPORARY will be dropped at the end of a session
36 * or on error.
37 *
38 * EPHEMERAL is used as a not-quite-ready state when creating persistent
39 * slots. EPHEMERAL slots can be made PERSISTENT by calling
40 * ReplicationSlotPersist(). For a slot that goes away at the end of a
41 * session, TEMPORARY is the appropriate choice.
42 */
44{
49
50/*
51 * Slots can be invalidated, e.g. due to max_slot_wal_keep_size. If so, the
52 * 'invalidated' field is set to a value other than _NONE.
53 *
54 * When adding a new invalidation cause here, the value must be powers of 2
55 * (e.g., 1, 2, 4...) for proper bitwise operations. Also, remember to update
56 * RS_INVAL_MAX_CAUSES below, and SlotInvalidationCauses in slot.c.
57 */
59{
61 /* required WAL has been removed */
63 /* required rows have been removed */
64 RS_INVAL_HORIZON = (1 << 1),
65 /* wal_level insufficient for slot */
67 /* idle slot timeout has occurred */
70
71/* Maximum number of invalidation causes */
72#define RS_INVAL_MAX_CAUSES 4
73
74/*
75 * When the slot synchronization worker is running, or when
76 * pg_sync_replication_slots is executed, slot synchronization may be
77 * skipped. This enum defines the possible reasons for skipping slot
78 * synchronization.
79 */
81{
82 SS_SKIP_NONE, /* No skip */
83 SS_SKIP_WAL_NOT_FLUSHED, /* Standby did not flush the wal corresponding
84 * to confirmed flush of remote slot */
85 SS_SKIP_WAL_OR_ROWS_REMOVED, /* Remote slot is behind; required WAL or
86 * rows may be removed or at risk */
87 SS_SKIP_NO_CONSISTENT_SNAPSHOT, /* Standby could not build a consistent
88 * snapshot */
89 SS_SKIP_INVALID /* Local slot is invalid */
91
92/*
93 * On-Disk data of a replication slot, preserved across restarts.
94 */
96{
97 /* The slot's identifier */
99
100 /* database the slot is active on */
102
103 /*
104 * The slot's behaviour when being dropped (or restored after a crash).
105 */
107
108 /*
109 * xmin horizon for data
110 *
111 * NB: This may represent a value that hasn't been written to disk yet;
112 * see notes for effective_xmin, below.
113 */
115
116 /*
117 * xmin horizon for catalog tuples
118 *
119 * NB: This may represent a value that hasn't been written to disk yet;
120 * see notes for effective_xmin, below.
121 */
123
124 /* oldest LSN that might be required by this replication slot */
126
127 /* RS_INVAL_NONE if valid, or the reason for having been invalidated */
129
130 /*
131 * Oldest LSN that the client has acked receipt for. This is used as the
132 * start_lsn point in case the client doesn't specify one, and also as a
133 * safety measure to jump forwards in case the client specifies a
134 * start_lsn that's further in the past than this value.
135 */
137
138 /*
139 * LSN at which we enabled two_phase commit for this slot or LSN at which
140 * we found a consistent point at the time of slot creation.
141 */
143
144 /*
145 * Allow decoding of prepared transactions?
146 */
148
149 /* plugin name */
151
152 /*
153 * Was this slot synchronized from the primary server?
154 */
155 bool synced;
156
157 /*
158 * Is this a failover slot (sync candidate for standbys)? Only relevant
159 * for logical slots on the primary server.
160 */
163
164/*
165 * Shared memory state of a single replication slot.
166 *
167 * The in-memory data of replication slots follows a locking model based
168 * on two linked concepts:
169 * - A replication slot's in_use flag is switched when added or discarded using
170 * the LWLock ReplicationSlotControlLock, which needs to be hold in exclusive
171 * mode when updating the flag by the backend owning the slot and doing the
172 * operation, while readers (concurrent backends not owning the slot) need
173 * to hold it in shared mode when looking at replication slot data.
174 * - Individual fields are protected by mutex where only the backend owning
175 * the slot is authorized to update the fields from its own slot. The
176 * backend owning the slot does not need to take this lock when reading its
177 * own fields, while concurrent backends not owning this slot should take the
178 * lock when reading this slot's data.
179 */
180typedef struct ReplicationSlot
181{
182 /* lock, on same cacheline as effective_xmin */
183 slock_t mutex;
184
185 /* is this slot defined */
186 bool in_use;
187
188 /* Who is streaming out changes for this slot? 0 in unused slots. */
190
191 /* any outstanding modifications? */
193 bool dirty;
194
195 /*
196 * For logical decoding, it's extremely important that we never remove any
197 * data that's still needed for decoding purposes, even after a crash;
198 * otherwise, decoding will produce wrong answers. Ordinary streaming
199 * replication also needs to prevent old row versions from being removed
200 * too soon, but the worst consequence we might encounter there is
201 * unwanted query cancellations on the standby. Thus, for logical
202 * decoding, this value represents the latest xmin that has actually been
203 * written to disk, whereas for streaming replication, it's just the same
204 * as the persistent value (data.xmin).
205 */
208
209 /* data surviving shutdowns and crashes */
211
212 /* is somebody performing io on this slot? */
214
215 /* Condition variable signaled when active_pid changes */
217
218 /* all the remaining data is only used for logical slots */
219
220 /*
221 * When the client has confirmed flushes >= candidate_xmin_lsn we can
222 * advance the catalog xmin. When restart_valid has been passed,
223 * restart_lsn can be increased.
224 */
229
230 /*
231 * This value tracks the last confirmed_flush LSN flushed which is used
232 * during a shutdown checkpoint to decide if logical's slot data should be
233 * forcibly flushed or not.
234 */
236
237 /*
238 * The time when the slot became inactive. For synced slots on a standby
239 * server, it represents the time when slot synchronization was most
240 * recently stopped.
241 */
243
244 /*
245 * Latest restart_lsn that has been flushed to disk. For persistent slots
246 * the flushed LSN should be taken into account when calculating the
247 * oldest LSN for WAL segments removal.
248 *
249 * Do not assume that restart_lsn will always move forward, i.e., that the
250 * previously flushed restart_lsn is always behind data.restart_lsn. In
251 * streaming replication using a physical slot, the restart_lsn is updated
252 * based on the flushed WAL position reported by the walreceiver.
253 *
254 * This replication mode allows duplicate WAL records to be received and
255 * overwritten. If the walreceiver receives older WAL records and then
256 * reports them as flushed to the walsender, the restart_lsn may appear to
257 * move backward.
258 *
259 * This typically occurs at the beginning of replication. One reason is
260 * that streaming replication starts at the beginning of a segment, so, if
261 * restart_lsn is in the middle of a segment, it will be updated to an
262 * earlier LSN, see RequestXLogStreaming. Another reason is that the
263 * walreceiver chooses its startpoint based on the replayed LSN, so, if
264 * some records have been received but not yet applied, they will be
265 * received again and leads to updating the restart_lsn to an earlier
266 * position.
267 */
269
270 /*
271 * Reason for the most recent slot synchronization skip.
272 *
273 * Slot sync skips can occur for both temporary and persistent replication
274 * slots. They are more common for temporary slots, but persistent slots
275 * may also skip synchronization in rare cases (e.g.,
276 * SS_SKIP_WAL_NOT_FLUSHED or SS_SKIP_WAL_OR_ROWS_REMOVED).
277 *
278 * Since, temporary slots are dropped after server restart, persisting
279 * slotsync_skip_reason provides no practical benefit.
280 */
283
284#define SlotIsPhysical(slot) ((slot)->data.database == InvalidOid)
285#define SlotIsLogical(slot) ((slot)->data.database != InvalidOid)
286
287/*
288 * Shared memory control area for all of replication slots.
289 */
291{
292 /*
293 * This array should be declared [FLEXIBLE_ARRAY_MEMBER], but for some
294 * reason you can't do that in an otherwise-empty struct.
295 */
298
299/*
300 * Set slot's inactive_since property unless it was previously invalidated.
301 */
302static inline void
304 bool acquire_lock)
305{
306 if (acquire_lock)
308
310 s->inactive_since = ts;
311
312 if (acquire_lock)
314}
315
316/*
317 * Pointers to shared memory
318 */
321
322/* GUCs */
326
327/* shmem initialization functions */
329extern void ReplicationSlotsShmemInit(void);
330
331/* management of individual slots */
332extern void ReplicationSlotCreate(const char *name, bool db_specific,
333 ReplicationSlotPersistency persistency,
334 bool two_phase, bool failover,
335 bool synced);
336extern void ReplicationSlotPersist(void);
337extern void ReplicationSlotDrop(const char *name, bool nowait);
338extern void ReplicationSlotDropAcquired(void);
339extern void ReplicationSlotAlter(const char *name, const bool *failover,
340 const bool *two_phase);
341
342extern void ReplicationSlotAcquire(const char *name, bool nowait,
343 bool error_if_invalid);
344extern void ReplicationSlotRelease(void);
345extern void ReplicationSlotCleanup(bool synced_only);
346extern void ReplicationSlotSave(void);
347extern void ReplicationSlotMarkDirty(void);
348
349/* misc stuff */
350extern void ReplicationSlotInitialize(void);
351extern bool ReplicationSlotValidateName(const char *name,
352 bool allow_reserved_name,
353 int elevel);
354extern bool ReplicationSlotValidateNameInternal(const char *name,
355 bool allow_reserved_name,
356 int *err_code, char **err_msg, char **err_hint);
357extern void ReplicationSlotReserveWal(void);
358extern void ReplicationSlotsComputeRequiredXmin(bool already_locked);
359extern void ReplicationSlotsComputeRequiredLSN(void);
361extern bool ReplicationSlotsCountDBSlots(Oid dboid, int *nslots, int *nactive);
362extern void ReplicationSlotsDropDBSlots(Oid dboid);
363extern bool InvalidateObsoleteReplicationSlots(uint32 possible_causes,
364 XLogSegNo oldestSegno,
365 Oid dboid,
366 TransactionId snapshotConflictHorizon);
367extern ReplicationSlot *SearchNamedReplicationSlot(const char *name, bool need_lock);
368extern int ReplicationSlotIndex(ReplicationSlot *slot);
369extern bool ReplicationSlotName(int index, Name name);
370extern void ReplicationSlotNameForTablesync(Oid suboid, Oid relid, char *syncslotname, Size szslot);
371extern void ReplicationSlotDropAtPubNode(WalReceiverConn *wrconn, char *slotname, bool missing_ok);
372
373extern void StartupReplicationSlots(void);
374extern void CheckPointReplicationSlots(bool is_shutdown);
375
376extern void CheckSlotRequirements(void);
377extern void CheckSlotPermissions(void);
379 GetSlotInvalidationCause(const char *cause_name);
381
382extern bool SlotExistsInSyncStandbySlots(const char *slot_name);
383extern bool StandbySlotsHaveCaughtup(XLogRecPtr wait_for_lsn, int elevel);
384extern void WaitForStandbyConfirmation(XLogRecPtr wait_for_lsn);
385
386#endif /* SLOT_H */
#define PGDLLIMPORT
Definition: c.h:1310
uint32_t uint32
Definition: c.h:543
uint32 TransactionId
Definition: c.h:662
size_t Size
Definition: c.h:615
int64 TimestampTz
Definition: timestamp.h:39
static bool two_phase
static bool failover
unsigned int Oid
Definition: postgres_ext.h:32
int ReplicationSlotIndex(ReplicationSlot *slot)
Definition: slot.c:579
struct ReplicationSlotCtlData ReplicationSlotCtlData
PGDLLIMPORT char * synchronized_standby_slots
Definition: slot.c:164
void ReplicationSlotAcquire(const char *name, bool nowait, bool error_if_invalid)
Definition: slot.c:626
PGDLLIMPORT ReplicationSlot * MyReplicationSlot
Definition: slot.c:148
void CheckPointReplicationSlots(bool is_shutdown)
Definition: slot.c:2126
void ReplicationSlotCreate(const char *name, bool db_specific, ReplicationSlotPersistency persistency, bool two_phase, bool failover, bool synced)
Definition: slot.c:384
void ReplicationSlotDropAcquired(void)
Definition: slot.c:997
void ReplicationSlotMarkDirty(void)
Definition: slot.c:1139
void ReplicationSlotReserveWal(void)
Definition: slot.c:1572
bool ReplicationSlotsCountDBSlots(Oid dboid, int *nslots, int *nactive)
Definition: slot.c:1383
bool ReplicationSlotValidateNameInternal(const char *name, bool allow_reserved_name, int *err_code, char **err_msg, char **err_hint)
Definition: slot.c:311
void ReplicationSlotsDropDBSlots(Oid dboid)
Definition: slot.c:1441
XLogRecPtr ReplicationSlotsComputeLogicalRestartLSN(void)
Definition: slot.c:1304
PGDLLIMPORT int idle_replication_slot_timeout_secs
Definition: slot.c:158
ReplicationSlotInvalidationCause GetSlotInvalidationCause(const char *cause_name)
Definition: slot.c:2725
void ReplicationSlotsComputeRequiredXmin(bool already_locked)
Definition: slot.c:1178
void ReplicationSlotPersist(void)
Definition: slot.c:1156
void ReplicationSlotDrop(const char *name, bool nowait)
Definition: slot.c:892
bool SlotExistsInSyncStandbySlots(const char *slot_name)
Definition: slot.c:2869
struct ReplicationSlotPersistentData ReplicationSlotPersistentData
ReplicationSlotPersistency
Definition: slot.h:44
@ RS_PERSISTENT
Definition: slot.h:45
@ RS_EPHEMERAL
Definition: slot.h:46
@ RS_TEMPORARY
Definition: slot.h:47
void ReplicationSlotSave(void)
Definition: slot.c:1121
ReplicationSlot * SearchNamedReplicationSlot(const char *name, bool need_lock)
Definition: slot.c:546
void ReplicationSlotNameForTablesync(Oid suboid, Oid relid, char *syncslotname, Size szslot)
Definition: tablesync.c:1203
void CheckSlotPermissions(void)
Definition: slot.c:1555
bool ReplicationSlotName(int index, Name name)
Definition: slot.c:595
void ReplicationSlotsShmemInit(void)
Definition: slot.c:206
bool ReplicationSlotValidateName(const char *name, bool allow_reserved_name, int elevel)
Definition: slot.c:266
void ReplicationSlotAlter(const char *name, const bool *failover, const bool *two_phase)
Definition: slot.c:915
void ReplicationSlotRelease(void)
Definition: slot.c:764
void WaitForStandbyConfirmation(XLogRecPtr wait_for_lsn)
Definition: slot.c:3050
PGDLLIMPORT ReplicationSlotCtlData * ReplicationSlotCtl
Definition: slot.c:145
bool StandbySlotsHaveCaughtup(XLogRecPtr wait_for_lsn, int elevel)
Definition: slot.c:2902
ReplicationSlotInvalidationCause
Definition: slot.h:59
@ RS_INVAL_WAL_REMOVED
Definition: slot.h:62
@ RS_INVAL_IDLE_TIMEOUT
Definition: slot.h:68
@ RS_INVAL_HORIZON
Definition: slot.h:64
@ RS_INVAL_WAL_LEVEL
Definition: slot.h:66
@ RS_INVAL_NONE
Definition: slot.h:60
void ReplicationSlotsComputeRequiredLSN(void)
Definition: slot.c:1234
void ReplicationSlotCleanup(bool synced_only)
Definition: slot.c:853
void ReplicationSlotInitialize(void)
Definition: slot.c:241
PGDLLIMPORT int max_replication_slots
Definition: slot.c:151
struct ReplicationSlot ReplicationSlot
void StartupReplicationSlots(void)
Definition: slot.c:2198
void ReplicationSlotDropAtPubNode(WalReceiverConn *wrconn, char *slotname, bool missing_ok)
void CheckSlotRequirements(void)
Definition: slot.c:1533
bool InvalidateObsoleteReplicationSlots(uint32 possible_causes, XLogSegNo oldestSegno, Oid dboid, TransactionId snapshotConflictHorizon)
Definition: slot.c:2066
static void ReplicationSlotSetInactiveSince(ReplicationSlot *s, TimestampTz ts, bool acquire_lock)
Definition: slot.h:303
SlotSyncSkipReason
Definition: slot.h:81
@ SS_SKIP_WAL_NOT_FLUSHED
Definition: slot.h:83
@ SS_SKIP_NO_CONSISTENT_SNAPSHOT
Definition: slot.h:87
@ SS_SKIP_NONE
Definition: slot.h:82
@ SS_SKIP_INVALID
Definition: slot.h:89
@ SS_SKIP_WAL_OR_ROWS_REMOVED
Definition: slot.h:85
Size ReplicationSlotsShmemSize(void)
Definition: slot.c:188
const char * GetSlotInvalidationCauseName(ReplicationSlotInvalidationCause cause)
Definition: slot.c:2745
#define SpinLockRelease(lock)
Definition: spin.h:61
#define SpinLockAcquire(lock)
Definition: spin.h:59
Definition: lwlock.h:42
ReplicationSlot replication_slots[1]
Definition: slot.h:296
TransactionId xmin
Definition: slot.h:114
TransactionId catalog_xmin
Definition: slot.h:122
XLogRecPtr confirmed_flush
Definition: slot.h:136
ReplicationSlotPersistency persistency
Definition: slot.h:106
ReplicationSlotInvalidationCause invalidated
Definition: slot.h:128
XLogRecPtr candidate_xmin_lsn
Definition: slot.h:226
TransactionId effective_catalog_xmin
Definition: slot.h:207
slock_t mutex
Definition: slot.h:183
XLogRecPtr candidate_restart_valid
Definition: slot.h:227
XLogRecPtr last_saved_confirmed_flush
Definition: slot.h:235
pid_t active_pid
Definition: slot.h:189
SlotSyncSkipReason slotsync_skip_reason
Definition: slot.h:281
bool in_use
Definition: slot.h:186
TransactionId effective_xmin
Definition: slot.h:206
bool just_dirtied
Definition: slot.h:192
XLogRecPtr last_saved_restart_lsn
Definition: slot.h:268
XLogRecPtr candidate_restart_lsn
Definition: slot.h:228
LWLock io_in_progress_lock
Definition: slot.h:213
ConditionVariable active_cv
Definition: slot.h:216
TransactionId candidate_catalog_xmin
Definition: slot.h:225
bool dirty
Definition: slot.h:193
ReplicationSlotPersistentData data
Definition: slot.h:210
TimestampTz inactive_since
Definition: slot.h:242
Definition: type.h:96
Definition: c.h:751
const char * name
static WalReceiverConn * wrconn
Definition: walreceiver.c:93
uint64 XLogRecPtr
Definition: xlogdefs.h:21
uint64 XLogSegNo
Definition: xlogdefs.h:52