PostgreSQL Source Code git master
Loading...
Searching...
No Matches
pgoutput.c
Go to the documentation of this file.
1/*-------------------------------------------------------------------------
2 *
3 * pgoutput.c
4 * Logical Replication output plugin
5 *
6 * Copyright (c) 2012-2026, PostgreSQL Global Development Group
7 *
8 * IDENTIFICATION
9 * src/backend/replication/pgoutput/pgoutput.c
10 *
11 *-------------------------------------------------------------------------
12 */
13#include "postgres.h"
14
15#include "access/tupconvert.h"
16#include "catalog/partition.h"
20#include "commands/defrem.h"
22#include "executor/executor.h"
23#include "fmgr.h"
24#include "nodes/makefuncs.h"
26#include "replication/logical.h"
28#include "replication/origin.h"
31#include "utils/builtins.h"
32#include "utils/inval.h"
33#include "utils/lsyscache.h"
34#include "utils/memutils.h"
35#include "utils/rel.h"
36#include "utils/syscache.h"
37#include "utils/varlena.h"
38
40 .name = "pgoutput",
41 .version = PG_VERSION
42);
43
45 OutputPluginOptions *opt, bool is_init);
48 ReorderBufferTXN *txn);
50 ReorderBufferTXN *txn, XLogRecPtr commit_lsn);
52 ReorderBufferTXN *txn, Relation relation,
53 ReorderBufferChange *change);
55 ReorderBufferTXN *txn, int nrelations, Relation relations[],
56 ReorderBufferChange *change);
59 bool transactional, const char *prefix,
60 Size sz, const char *message);
62 ReplOriginId origin_id);
64 ReorderBufferTXN *txn);
66 ReorderBufferTXN *txn, XLogRecPtr prepare_lsn);
68 ReorderBufferTXN *txn, XLogRecPtr commit_lsn);
71 XLogRecPtr prepare_end_lsn,
72 TimestampTz prepare_time);
73static void pgoutput_stream_start(struct LogicalDecodingContext *ctx,
74 ReorderBufferTXN *txn);
75static void pgoutput_stream_stop(struct LogicalDecodingContext *ctx,
76 ReorderBufferTXN *txn);
77static void pgoutput_stream_abort(struct LogicalDecodingContext *ctx,
79 XLogRecPtr abort_lsn);
82 XLogRecPtr commit_lsn);
84 ReorderBufferTXN *txn, XLogRecPtr prepare_lsn);
85
87
90 uint32 hashvalue);
92 ReplOriginId origin_id, XLogRecPtr origin_lsn,
93 bool send_origin);
94
95/*
96 * Only 3 publication actions are used for row filtering ("insert", "update",
97 * "delete"). See RelationSyncEntry.exprstate[].
98 */
105
106#define NUM_ROWFILTER_PUBACTIONS (PUBACTION_DELETE+1)
107
108/*
109 * Entry in the map used to remember which relation schemas we sent.
110 *
111 * The schema_sent flag determines if the current schema record for the
112 * relation (and for its ancestor if publish_as_relid is set) was already
113 * sent to the subscriber (in which case we don't need to send it again).
114 *
115 * The schema cache on downstream is however updated only at commit time,
116 * and with streamed transactions the commit order may be different from
117 * the order the transactions are sent in. Also, the (sub) transactions
118 * might get aborted so we need to send the schema for each (sub) transaction
119 * so that we don't lose the schema information on abort. For handling this,
120 * we maintain the list of xids (streamed_txns) for those we have already sent
121 * the schema.
122 *
123 * For partitions, 'pubactions' considers not only the table's own
124 * publications, but also those of all of its ancestors.
125 */
126typedef struct RelationSyncEntry
127{
128 Oid relid; /* relation oid */
129
130 bool replicate_valid; /* overall validity flag for entry */
131
133
134 /*
135 * This will be PUBLISH_GENCOLS_STORED if the relation contains generated
136 * columns and the 'publish_generated_columns' parameter is set to
137 * PUBLISH_GENCOLS_STORED. Otherwise, it will be PUBLISH_GENCOLS_NONE,
138 * indicating that no generated columns should be published, unless
139 * explicitly specified in the column list.
140 */
142 List *streamed_txns; /* streamed toplevel transactions with this
143 * schema */
144
145 /* are we publishing this rel? */
147
148 /*
149 * ExprState array for row filter. Different publication actions don't
150 * allow multiple expressions to always be combined into one, because
151 * updates or deletes restrict the column in expression to be part of the
152 * replica identity index whereas inserts do not have this restriction, so
153 * there is one ExprState per publication action.
154 */
156 EState *estate; /* executor state used for row filter */
157 TupleTableSlot *new_slot; /* slot for storing new tuple */
158 TupleTableSlot *old_slot; /* slot for storing old tuple */
159
160 /*
161 * OID of the relation to publish changes as. For a partition, this may
162 * be set to one of its ancestors whose schema will be used when
163 * replicating changes, if publish_via_partition_root is set for the
164 * publication.
165 */
167
168 /*
169 * Map used when replicating using an ancestor's schema to convert tuples
170 * from partition's type to the ancestor's; NULL if publish_as_relid is
171 * same as 'relid' or if unnecessary due to partition and the ancestor
172 * having identical TupleDesc.
173 */
175
176 /*
177 * Columns included in the publication, or NULL if all columns are
178 * included implicitly. Note that the attnums in this bitmap are not
179 * shifted by FirstLowInvalidHeapAttributeNumber.
180 */
182
183 /*
184 * Private context to store additional data for this entry - state for the
185 * row filter expressions, column list, etc.
186 */
189
190/*
191 * Maintain a per-transaction level variable to track whether the transaction
192 * has sent BEGIN. BEGIN is only sent when the first change in a transaction
193 * is processed. This makes it possible to skip sending a pair of BEGIN/COMMIT
194 * messages for empty transactions which saves network bandwidth.
195 *
196 * This optimization is not used for prepared transactions because if the
197 * WALSender restarts after prepare of a transaction and before commit prepared
198 * of the same transaction then we won't be able to figure out if we have
199 * skipped sending BEGIN/PREPARE of a transaction as it was empty. This is
200 * because we would have lost the in-memory txndata information that was
201 * present prior to the restart. This will result in sending a spurious
202 * COMMIT PREPARED without a corresponding prepared transaction at the
203 * downstream which would lead to an error when it tries to process it.
204 *
205 * XXX We could achieve this optimization by changing protocol to send
206 * additional information so that downstream can detect that the corresponding
207 * prepare has not been sent. However, adding such a check for every
208 * transaction in the downstream could be costly so we might want to do it
209 * optionally.
210 *
211 * We also don't have this optimization for streamed transactions because
212 * they can contain prepared transactions.
213 */
214typedef struct PGOutputTxnData
215{
216 bool sent_begin_txn; /* flag indicating whether BEGIN has been sent */
218
219/* Map used to remember which relation schemas we sent. */
221
222static void init_rel_sync_cache(MemoryContext cachectx);
223static void cleanup_rel_sync_cache(TransactionId xid, bool is_commit);
225 Relation relation);
226static void send_relation_and_attrs(Relation relation, TransactionId xid,
229static void rel_sync_cache_relation_cb(Datum arg, Oid relid);
231 uint32 hashvalue);
233 TransactionId xid);
235 TransactionId xid);
236static void init_tuple_slot(PGOutputData *data, Relation relation,
237 RelationSyncEntry *entry);
238static void pgoutput_memory_context_reset(void *arg);
239
240/* row filter routines */
243 List *publications,
244 RelationSyncEntry *entry);
246 ExprContext *econtext);
247static bool pgoutput_row_filter(Relation relation, TupleTableSlot *old_slot,
249 RelationSyncEntry *entry,
251
252/* column list routines */
254 List *publications,
255 RelationSyncEntry *entry);
256
257/*
258 * Specify output plugin callbacks
259 */
260void
288
/*
 * Parse the option list supplied by the client into *data.
 *
 * The optional settings (binary, streaming, messages, two_phase and
 * publish_no_origin) are first reset to their defaults.  Each DefElem in
 * 'options' is then matched by name:
 *   "proto_version"      parsed with strtoul() and stored as uint32
 *   "publication_names"  split on ',' into data->publication_names
 *   "binary", "messages", "two_phase"  read with defGetBoolean()
 *   "streaming"          read with defGetStreamingMode()
 *   "origin"             must equal LOGICALREP_ORIGIN_NONE or
 *                        LOGICALREP_ORIGIN_ANY, compared case-insensitively
 * Any other option name is reported with elog(ERROR).
 *
 * NOTE(review): in this listing the function's name/parameter line and the
 * conditions guarding most of the errmsg() calls are not visible; the
 * *_given flags presumably drive the "conflicting or redundant options"
 * checks -- confirm against the full file.
 */
289static void
291{
292 ListCell *lc;
293 bool protocol_version_given = false;
294 bool publication_names_given = false;
295 bool binary_option_given = false;
296 bool messages_option_given = false;
297 bool streaming_given = false;
298 bool two_phase_option_given = false;
299 bool origin_option_given = false;
300
301 /* Initialize optional parameters to defaults */
302 data->binary = false;
303 data->streaming = LOGICALREP_STREAM_OFF;
304 data->messages = false;
305 data->two_phase = false;
306 data->publish_no_origin = false;
307
308 foreach(lc, options)
309 {
310 DefElem *defel = (DefElem *) lfirst(lc);
311
312 Assert(defel->arg == NULL || IsA(defel->arg, String));
313
314 /* Check each param, whether or not we recognize it */
315 if (strcmp(defel->defname, "proto_version") == 0)
316 {
317 unsigned long parsed;
318 char *endptr;
319
323 errmsg("conflicting or redundant options")));
325
 /* Reset errno so the check after strtoul() only sees this call's error. */
326 errno = 0;
327 parsed = strtoul(strVal(defel->arg), &endptr, 10);
328 if (errno != 0 || *endptr != '\0')
331 errmsg("invalid proto_version")));
332
 /* The value is narrowed to uint32 below, so larger values are rejected. */
333 if (parsed > PG_UINT32_MAX)
336 errmsg("proto_version \"%s\" out of range",
337 strVal(defel->arg))));
338
339 data->protocol_version = (uint32) parsed;
340 }
341 else if (strcmp(defel->defname, "publication_names") == 0)
342 {
346 errmsg("conflicting or redundant options")));
348
349 /*
350 * Pass a copy of the DefElem->arg since SplitIdentifierString
351 * modifies its input.
352 */
353 if (!SplitIdentifierString(pstrdup(strVal(defel->arg)), ',',
354 &data->publication_names))
357 errmsg("invalid publication_names syntax")));
358 }
359 else if (strcmp(defel->defname, "binary") == 0)
360 {
364 errmsg("conflicting or redundant options")));
365 binary_option_given = true;
366
367 data->binary = defGetBoolean(defel);
368 }
369 else if (strcmp(defel->defname, "messages") == 0)
370 {
374 errmsg("conflicting or redundant options")));
376
377 data->messages = defGetBoolean(defel);
378 }
379 else if (strcmp(defel->defname, "streaming") == 0)
380 {
381 if (streaming_given)
384 errmsg("conflicting or redundant options")));
385 streaming_given = true;
386
387 data->streaming = defGetStreamingMode(defel);
388 }
389 else if (strcmp(defel->defname, "two_phase") == 0)
390 {
394 errmsg("conflicting or redundant options")));
396
397 data->two_phase = defGetBoolean(defel);
398 }
399 else if (strcmp(defel->defname, "origin") == 0)
400 {
401 char *origin;
402
406 errmsg("conflicting or redundant options"));
407 origin_option_given = true;
408
 /* The origin keyword is matched without regard to letter case. */
409 origin = defGetString(defel);
410 if (pg_strcasecmp(origin, LOGICALREP_ORIGIN_NONE) == 0)
411 data->publish_no_origin = true;
412 else if (pg_strcasecmp(origin, LOGICALREP_ORIGIN_ANY) == 0)
413 data->publish_no_origin = false;
414 else
417 errmsg("unrecognized origin value: \"%s\"", origin));
418 }
419 else
420 elog(ERROR, "unrecognized pgoutput option: %s", defel->defname);
421 }
422
423 /* Check required options */
427 errmsg("option \"%s\" missing", "proto_version"));
431 errmsg("option \"%s\" missing", "publication_names"));
432}
433
434/*
435 * Memory context reset callback of PGOutputData->context.
436 */
437static void
446
447/*
448 * Initialize this plugin
 *
 * Creates the plugin's private memory contexts (data->context,
 * data->cachectx and data->pubctx) as children of ctx->context.
 *
 * When is_init is false (replication start, not slot initialization) the
 * requested protocol version is checked against
 * LOGICALREP_PROTO_MIN_VERSION_NUM / LOGICALREP_PROTO_MAX_VERSION_NUM, and
 * streaming and two-phase are accepted only if both the requested protocol
 * version and the decoding context allow them.  The publication list is
 * then reset.  When is_init is true, ctx->streaming and ctx->twophase are
 * simply switched off.
 *
 * NOTE(review): the signature, the ereport() heads, the option-parsing
 * call and the callback registration calls are not visible in this listing.
449 */
450static void
452 bool is_init)
453{
455 static bool publication_callback_registered = false;
457
458 /* Create our memory context for private allocations. */
459 data->context = AllocSetContextCreate(ctx->context,
460 "logical replication output context",
462
463 data->cachectx = AllocSetContextCreate(ctx->context,
464 "logical replication cache context",
466
467 data->pubctx = AllocSetContextCreate(ctx->context,
468 "logical replication publication list context",
470
471 /*
472 * Make sure RelationSyncCache is cleaned up even when logical decoding
473 * invoked via the SQL interface ends with an error.
474 */
478
480
481 /* This plugin uses binary protocol. */
483
484 /*
485 * This is replication start and not slot initialization.
486 *
487 * Parse and validate options passed by the client.
488 */
489 if (!is_init)
490 {
491 /* Parse the params and ERROR if we see any we don't recognize */
493
494 /* Check if we support requested protocol */
 /*
  * NOTE(review): protocol_version is assigned from a (uint32) cast where
  * the options are parsed, but is formatted with %d in the messages
  * below -- confirm the field's declared type matches the format.
  */
495 if (data->protocol_version > LOGICALREP_PROTO_MAX_VERSION_NUM)
498 errmsg("client sent proto_version=%d but server only supports protocol %d or lower",
499 data->protocol_version, LOGICALREP_PROTO_MAX_VERSION_NUM)));
500
501 if (data->protocol_version < LOGICALREP_PROTO_MIN_VERSION_NUM)
504 errmsg("client sent proto_version=%d but server only supports protocol %d or higher",
505 data->protocol_version, LOGICALREP_PROTO_MIN_VERSION_NUM)));
506
507 /*
508 * Decide whether to enable streaming. It is disabled by default, in
509 * which case we just update the flag in decoding context. Otherwise
510 * we only allow it with sufficient version of the protocol, and when
511 * the output plugin supports it.
512 */
513 if (data->streaming == LOGICALREP_STREAM_OFF)
514 ctx->streaming = false;
515 else if (data->streaming == LOGICALREP_STREAM_ON &&
516 data->protocol_version < LOGICALREP_PROTO_STREAM_VERSION_NUM)
519 errmsg("requested proto_version=%d does not support streaming, need %d or higher",
520 data->protocol_version, LOGICALREP_PROTO_STREAM_VERSION_NUM)));
521 else if (data->streaming == LOGICALREP_STREAM_PARALLEL &&
525 errmsg("requested proto_version=%d does not support parallel streaming, need %d or higher",
527 else if (!ctx->streaming)
530 errmsg("streaming requested, but not supported by output plugin")));
531
532 /*
533 * Here, we just check whether the two-phase option is passed by
534 * plugin and decide whether to enable it at later point of time. It
535 * remains enabled if the previous start-up has done so. But we only
536 * allow the option to be passed in with sufficient version of the
537 * protocol, and when the output plugin supports it.
538 */
539 if (!data->two_phase)
540 ctx->twophase_opt_given = false;
541 else if (data->protocol_version < LOGICALREP_PROTO_TWOPHASE_VERSION_NUM)
544 errmsg("requested proto_version=%d does not support two-phase commit, need %d or higher",
545 data->protocol_version, LOGICALREP_PROTO_TWOPHASE_VERSION_NUM)));
546 else if (!ctx->twophase)
549 errmsg("two-phase commit requested, but not supported by output plugin")));
550 else
551 ctx->twophase_opt_given = true;
552
553 /* Init publication state. */
554 data->publications = NIL;
555 publications_valid = false;
556
557 /*
558 * Register callback for pg_publication if we didn't already do that
559 * during some previous call in this process.
560 */
562 {
565 (Datum) 0);
567 (Datum) 0);
569 }
570
571 /* Initialize relation schema cache. */
573 }
574 else
575 {
576 /*
577 * Disable the streaming and prepared transactions during the slot
578 * initialization mode.
579 */
580 ctx->streaming = false;
581 ctx->twophase = false;
582 }
583}
584
585/*
586 * BEGIN callback.
587 *
588 * Don't send the BEGIN message here; instead, postpone it until the first
589 * change. In logical replication, a common scenario is to replicate a set of
590 * tables (instead of all tables) and transactions whose changes were on
591 * the table(s) that are not published will produce empty transactions. These
592 * empty transactions will send BEGIN and COMMIT messages to subscribers,
593 * using bandwidth on something with little/no use for logical replication.
594 */
595static void
603
604/*
605 * Send BEGIN.
606 *
607 * This is called while processing the first change of the transaction.
608 */
609static void
627
628/*
629 * COMMIT callback
 *
 * Reports progress, frees the per-transaction data, and writes the COMMIT
 * message only when BEGIN was sent for this transaction.  Otherwise the
 * transaction is logged at DEBUG1 as skipped and nothing is written.
 *
 * NOTE(review): the declaration and initialization of 'txndata' are not
 * visible in this listing.
630 */
631static void
633 XLogRecPtr commit_lsn)
634{
636 bool sent_begin_txn;
637
639
640 /*
641 * We don't need to send the commit message unless some relevant change
642 * from this transaction has been sent to the downstream.
643 */
 /* Copy the flag to a local first: txndata is freed just below. */
644 sent_begin_txn = txndata->sent_begin_txn;
645 OutputPluginUpdateProgress(ctx, !sent_begin_txn);
646 pfree(txndata);
648
649 if (!sent_begin_txn)
650 {
651 elog(DEBUG1, "skipped replication of an empty transaction with XID: %u", txn->xid);
652 return;
653 }
654
655 OutputPluginPrepareWrite(ctx, true);
656 logicalrep_write_commit(ctx->out, txn, commit_lsn);
657 OutputPluginWrite(ctx, true);
658}
659
660/*
661 * BEGIN PREPARE callback
662 */
663static void
676
677/*
678 * PREPARE callback
 *
 * Reports progress, then writes the PREPARE message for 'txn' at
 * 'prepare_lsn' to ctx->out.  Unlike the COMMIT callback, the write is
 * unconditional.
679 */
680static void
682 XLogRecPtr prepare_lsn)
683{
684 OutputPluginUpdateProgress(ctx, false);
685
686 OutputPluginPrepareWrite(ctx, true);
687 logicalrep_write_prepare(ctx->out, txn, prepare_lsn);
688 OutputPluginWrite(ctx, true);
689}
690
691/*
692 * COMMIT PREPARED callback
 *
 * Reports progress, then unconditionally writes the COMMIT PREPARED
 * message for 'txn' at 'commit_lsn' to ctx->out.
693 */
694static void
696 XLogRecPtr commit_lsn)
697{
698 OutputPluginUpdateProgress(ctx, false);
699
700 OutputPluginPrepareWrite(ctx, true);
701 logicalrep_write_commit_prepared(ctx->out, txn, commit_lsn);
702 OutputPluginWrite(ctx, true);
703}
704
705/*
706 * ROLLBACK PREPARED callback
 *
 * Reports progress, then unconditionally writes the ROLLBACK PREPARED
 * message for 'txn' to ctx->out, passing through 'prepare_end_lsn' and
 * 'prepare_time'.
707 */
708static void
710 ReorderBufferTXN *txn,
711 XLogRecPtr prepare_end_lsn,
712 TimestampTz prepare_time)
713{
714 OutputPluginUpdateProgress(ctx, false);
715
716 OutputPluginPrepareWrite(ctx, true);
717 logicalrep_write_rollback_prepared(ctx->out, txn, prepare_end_lsn,
718 prepare_time);
719 OutputPluginWrite(ctx, true);
720}
721
722/*
723 * Write the current schema of the relation and its ancestor (if any) if not
724 * done yet.
 *
 * Outside a streaming block the decision is based on, and recorded in,
 * relentry->schema_sent.  Inside a streaming block a separate per-transaction
 * check is used instead.
 *
 * NOTE(review): the parameter list, the declarations of 'xid' and 'topxid',
 * and the streaming-side check/record statements are not visible in this
 * listing; 'topxid' is presumably the key for the streaming case.
725 */
726static void
728 ReorderBufferChange *change,
730{
732 bool schema_sent;
735
736 /*
737 * Remember XID of the (sub)transaction for the change. We don't care if
738 * it's top-level transaction or not (we have already sent that XID in
739 * start of the current streaming block).
740 *
741 * If we're not in a streaming block, just use InvalidTransactionId and
742 * the write methods will not include it.
743 */
744 if (data->in_streaming)
745 xid = change->txn->xid;
746
 /* For a subtransaction, look up the XID of its top-level transaction. */
747 if (rbtxn_is_subtxn(change->txn))
748 topxid = rbtxn_get_toptxn(change->txn)->xid;
749 else
750 topxid = xid;
751
752 /*
753 * Do we need to send the schema? We do track streamed transactions
754 * separately, because those may be applied later (and the regular
755 * transactions won't see their effects until then) and in an order that
756 * we don't know at this point.
757 *
758 * XXX There is scope for optimization here. Currently, we always send
759 * the schema first time in a streaming transaction but we can probably
760 * avoid that by checking 'relentry->schema_sent' flag. However, before
761 * doing that we need to study its impact on the case where we have a mix
762 * of streaming and non-streaming transactions.
763 */
764 if (data->in_streaming)
766 else
767 schema_sent = relentry->schema_sent;
768
769 /* Nothing to do if we already sent the schema. */
770 if (schema_sent)
771 return;
772
773 /*
774 * Send the schema. If the changes will be published using an ancestor's
775 * schema, not the relation's own, send that ancestor's schema before
776 * sending relation's own (XXX - maybe sending only the former suffices?).
777 */
778 if (relentry->publish_as_relid != RelationGetRelid(relation))
779 {
780 Relation ancestor = RelationIdGetRelation(relentry->publish_as_relid);
781
784 }
785
786 send_relation_and_attrs(relation, xid, ctx, relentry);
787
 /* Record that the schema went out, so the next change can skip it. */
788 if (data->in_streaming)
790 else
791 relentry->schema_sent = true;
792}
793
794/*
795 * Sends a relation
 *
 * First walks the relation's tuple descriptor and writes a type message for
 * each attribute that is not skipped by the column check and whose type OID
 * is at or above FirstGenbkiObjectId.  Then writes the relation message
 * itself, passing the entry's column bitmap and generated-column setting.
 *
 * NOTE(review): the parameter list, the declaration of 'att' and the head of
 * the column check are not visible in this listing.
796 */
797static void
801{
802 TupleDesc desc = RelationGetDescr(relation);
803 Bitmapset *columns = relentry->columns;
804 PublishGencolsType include_gencols_type = relentry->include_gencols_type;
805 int i;
806
807 /*
808 * Write out type info if needed. We do that only for user-created types.
809 * We use FirstGenbkiObjectId as the cutoff, so that we only consider
810 * objects with hand-assigned OIDs to be "built in", not for instance any
811 * function or type defined in the information_schema. This is important
812 * because only hand-assigned OIDs can be expected to remain stable across
813 * major versions.
814 */
815 for (i = 0; i < desc->natts; i++)
816 {
818
820 include_gencols_type))
821 continue;
822
 /* Types below the cutoff are treated as built in; no message needed. */
823 if (att->atttypid < FirstGenbkiObjectId)
824 continue;
825
826 OutputPluginPrepareWrite(ctx, false);
827 logicalrep_write_typ(ctx->out, xid, att->atttypid);
828 OutputPluginWrite(ctx, false);
829 }
830
831 OutputPluginPrepareWrite(ctx, false);
832 logicalrep_write_rel(ctx->out, xid, relation, columns,
833 include_gencols_type);
834 OutputPluginWrite(ctx, false);
835}
836
837/*
838 * Executor state preparation for evaluation of row filter expressions for the
839 * specified relation.
 *
 * Creates a fresh EState, fills in a range-table entry that describes 'rel'
 * as an RTE_RELATION with AccessShareLock as its lock mode, sets the
 * state's output command id, and returns the EState to the caller.
 *
 * NOTE(review): the allocation of 'rte' and the statements that attach it
 * (and 'perminfos') to the EState are not visible in this listing.
840 */
841static EState *
843{
844 EState *estate;
846 List *perminfos = NIL;
847
848 estate = CreateExecutorState();
849
851 rte->rtekind = RTE_RELATION;
852 rte->relid = RelationGetRelid(rel);
853 rte->relkind = rel->rd_rel->relkind;
854 rte->rellockmode = AccessShareLock;
855
857
860
861 estate->es_output_cid = GetCurrentCommandId(false);
862
863 return estate;
864}
865
866/*
867 * Evaluates row filter.
868 *
869 * If the row filter evaluates to NULL, it is taken as false i.e. the change
870 * isn't replicated.
 *
 * 'state' must not be NULL (asserted).  Returns the boolean value of the
 * expression evaluated with 'econtext', or false when the result is NULL.
 * The outcome is also logged at DEBUG3.
871 */
872static bool
874{
875 Datum ret;
876 bool isnull;
877
878 Assert(state != NULL);
879
880 ret = ExecEvalExprSwitchContext(state, econtext, &isnull);
881
 /* A NULL result is reported as "false", matching the value returned below. */
882 elog(DEBUG3, "row filter evaluates to %s (isnull: %s)",
883 isnull ? "false" : DatumGetBool(ret) ? "true" : "false",
884 isnull ? "true" : "false");
885
886 if (isnull)
887 return false;
888
889 return DatumGetBool(ret);
890}
891
892/*
893 * Make sure the per-entry memory context exists.
 *
 * Does nothing when entry->entry_cxt is already set.  Otherwise creates the
 * context as a child of data->cachectx; the name of the relation identified
 * by entry->publish_as_relid is used in a follow-up call whose head is not
 * visible in this listing (presumably to label the context).
 *
 * NOTE(review): the relation obtained from RelationIdGetRelation() has no
 * visible matching RelationClose() in this function -- confirm whether the
 * reference is released elsewhere.
894 */
895static void
897{
898 Relation relation;
899
900 /* The context may already exist, in which case bail out. */
901 if (entry->entry_cxt)
902 return;
903
904 relation = RelationIdGetRelation(entry->publish_as_relid);
905
906 entry->entry_cxt = AllocSetContextCreate(data->cachectx,
907 "entry private context",
909
911 RelationGetRelationName(relation));
912}
913
914/*
915 * Initialize the row filter.
 *
 * Walks 'publications' and collects row filter nodes into one list per
 * publication action (rfnodes[]), while no_filter[] marks actions that some
 * publication publishes without a filter.  If filters remain afterwards,
 * an executor state is created for the relation and one prepared ExprState
 * per action is cached in entry->exprstate[].
 *
 * NOTE(review): the signature, several declarations (e.g. 'rftuple',
 * 'relation'), the syscache lookups and the list-building statements are
 * not visible in this listing.
916 */
917static void
919 RelationSyncEntry *entry)
920{
921 ListCell *lc;
922 List *rfnodes[] = {NIL, NIL, NIL}; /* One per pubaction */
923 bool no_filter[] = {false, false, false}; /* One per pubaction */
925 int idx;
926 bool has_filter = true;
928
929 /*
930 * Find if there are any row filters for this relation. If there are, then
931 * prepare the necessary ExprState and cache it in entry->exprstate. To
932 * build an expression state, we need to ensure the following:
933 *
934 * All the given publication-table mappings must be checked.
935 *
936 * Multiple publications might have multiple row filters for this
937 * relation. Since row filter usage depends on the DML operation, there
938 * are multiple lists (one for each operation) to which row filters will
939 * be appended.
940 *
941 * FOR ALL TABLES and FOR TABLES IN SCHEMA implies "don't use row filter
942 * expression" so it takes precedence.
943 */
944 foreach(lc, publications)
945 {
946 Publication *pub = lfirst(lc);
948 Datum rfdatum = 0;
949 bool pub_no_filter = true;
950
951 /*
952 * If the publication is FOR ALL TABLES, or the publication includes a
953 * FOR TABLES IN SCHEMA where the table belongs to the referred
954 * schema, then it is treated the same as if there are no row filters
955 * (even if other publications have a row filter).
956 */
957 if (!pub->alltables &&
960 ObjectIdGetDatum(pub->oid)))
961 {
962 /*
963 * Check for the presence of a row filter in this publication.
964 */
967 ObjectIdGetDatum(pub->oid));
968
970 {
971 /* Null indicates no filter. */
975 }
976 }
977
978 if (pub_no_filter)
979 {
980 if (rftuple)
982
986
987 /*
988 * Quick exit if all the DML actions are published via this
989 * publication.
990 */
994 {
995 has_filter = false;
996 break;
997 }
998
999 /* No additional work for this publication. Next one. */
1000 continue;
1001 }
1002
1003 /* Form the per pubaction row filter lists. */
1013
1015 } /* loop all subscribed publications */
1016
1017 /* Drop the collected filters for every pubaction flagged in no_filter[] */
1018 for (idx = 0; idx < NUM_ROWFILTER_PUBACTIONS; idx++)
1019 {
1020 if (no_filter[idx])
1021 {
1023 rfnodes[idx] = NIL;
1024 }
1025 }
1026
1027 if (has_filter)
1028 {
1030
1032
1033 /*
1034 * Now all the filters for all pubactions are known. Combine them when
1035 * their pubactions are the same.
1036 */
1038 entry->estate = create_estate_for_relation(relation);
1039 for (idx = 0; idx < NUM_ROWFILTER_PUBACTIONS; idx++)
1040 {
1041 List *filters = NIL;
1042 Expr *rfnode;
1043
 /* No filter collected for this action: leave its exprstate untouched. */
1044 if (rfnodes[idx] == NIL)
1045 continue;
1046
1047 foreach(lc, rfnodes[idx])
1049
1050 /* combine the row filter and cache the ExprState */
1052 entry->exprstate[idx] = ExecPrepareExpr(rfnode, entry->estate);
1053 } /* for each pubaction */
1055
1056 RelationClose(relation);
1057 }
1058}
1059
1060/*
1061 * If the table contains a generated column, check for any conflicting
1062 * values of 'publish_generated_columns' parameter in the publications.
 *
 * Returns early when the relation's tuple descriptor has no generated
 * attribute.  Otherwise entry->include_gencols_type is taken from the first
 * publication that is not skipped, and an ERROR is raised if a later one
 * carries a different pubgencols_type.
 *
 * NOTE(review): the signature, the declaration of 'att', the statement
 * executed in the no-generated-column branch and the condition that skips
 * column-list publications are not visible in this listing.
1063 */
1064static void
1066 RelationSyncEntry *entry)
1067{
1069 TupleDesc desc = RelationGetDescr(relation);
1070 bool gencolpresent = false;
1071 bool first = true;
1072
1073 /* Check if there is any generated column present. */
1074 for (int i = 0; i < desc->natts; i++)
1075 {
1077
1078 if (att->attgenerated)
1079 {
1080 gencolpresent = true;
1081 break;
1082 }
1083 }
1084
1085 /* There are no generated columns to be published. */
1086 if (!gencolpresent)
1087 {
1089 return;
1090 }
1091
1092 /*
1093 * There may be a conflicting value for 'publish_generated_columns'
1094 * parameter in the publications.
1095 */
1096 foreach_ptr(Publication, pub, publications)
1097 {
1098 /*
1099 * The column list takes precedence over the
1100 * 'publish_generated_columns' parameter. Those will be checked later,
1101 * see pgoutput_column_list_init.
1102 */
1104 continue;
1105
 /* The first publication sets the value; later ones must agree with it. */
1106 if (first)
1107 {
1108 entry->include_gencols_type = pub->pubgencols_type;
1109 first = false;
1110 }
1111 else if (entry->include_gencols_type != pub->pubgencols_type)
1112 ereport(ERROR,
1114 errmsg("cannot use different values of publish_generated_columns for table \"%s.%s\" in different publications",
1116 RelationGetRelationName(relation)));
1117 }
1118}
1119
1120/*
1121 * Initialize the column list.
 *
 * For each publication a column bitmap is obtained; a publication without a
 * column list falls back to 'relcols'.  The first bitmap is stored in
 * entry->columns and every later one must be bms_equal() to it, otherwise
 * an ERROR is raised.  If no publication had a column list,
 * entry->columns is reset to NULL at the end.
 *
 * NOTE(review): the signature, the declarations of 'relation' and
 * 'relcols', the head of the column-list lookup call and the statements
 * that set 'found_pub_collist' are not visible in this listing.
1122 */
1123static void
1125 RelationSyncEntry *entry)
1126{
1127 ListCell *lc;
1128 bool first = true;
1130 bool found_pub_collist = false;
1132
1134
1135 /*
1136 * Find if there are any column lists for this relation. If there are,
1137 * build a bitmap using the column lists.
1138 *
1139 * Multiple publications might have multiple column lists for this
1140 * relation.
1141 *
1142 * Note that we don't support the case where the column list is different
1143 * for the same table when combining publications. See comments atop
1144 * fetch_relation_list. But one can later change the publication so we
1145 * still need to check all the given publication-table mappings and report
1146 * an error if any publications have a different column list.
1147 */
1148 foreach(lc, publications)
1149 {
1150 Publication *pub = lfirst(lc);
1151 Bitmapset *cols = NULL;
1152
1153 /* Retrieve the bitmap of columns for a column list publication. */
1155 entry->publish_as_relid,
1156 entry->entry_cxt, &cols);
1157
1158 /*
1159 * For non-column list publications — e.g. TABLE (without a column
1160 * list), ALL TABLES, or ALL TABLES IN SCHEMA, we consider all columns
1161 * of the table (including generated columns when
1162 * 'publish_generated_columns' parameter is true).
1163 */
1164 if (!cols)
1165 {
1166 /*
1167 * Cache the table columns for the first publication with no
1168 * specified column list to detect publication with a different
1169 * column list.
1170 */
 /* With a single publication there is nothing to compare against. */
1171 if (!relcols && (list_length(publications) > 1))
1172 {
1174
1175 relcols = pub_form_cols_map(relation,
1176 entry->include_gencols_type);
1178 }
1179
1180 cols = relcols;
1181 }
1182
1183 if (first)
1184 {
1185 entry->columns = cols;
1186 first = false;
1187 }
1188 else if (!bms_equal(entry->columns, cols))
1189 ereport(ERROR,
1191 errmsg("cannot use different column lists for table \"%s.%s\" in different publications",
1193 RelationGetRelationName(relation)));
1194 } /* loop all subscribed publications */
1195
1196 /*
1197 * If no column list publications exist, columns to be published will be
1198 * computed later according to the 'publish_generated_columns' parameter.
1199 */
1200 if (!found_pub_collist)
1201 entry->columns = NULL;
1202
1203 RelationClose(relation);
1204}
1205
1206/*
1207 * Initialize the slot for storing new and old tuples, and build the map that
1208 * will be used to convert the relation's tuples into the ancestor's format.
 *
 * Allocations are made after switching to data->cachectx.  The attribute
 * map is built only when entry->publish_as_relid differs from the
 * relation's own OID; build_attrmap_by_name_if_req() is given the
 * relation's descriptor as input and 'outdesc' as output.
 *
 * NOTE(review): the declarations of 'oldctx' and 'outdesc', the slot
 * creation statements and the switches back to the previous memory context
 * are not visible in this listing.
1209 */
1210static void
1212 RelationSyncEntry *entry)
1213{
1217
1218 oldctx = MemoryContextSwitchTo(data->cachectx);
1219
1220 /*
1221 * Create tuple table slots. Create a copy of the TupleDesc as it needs to
1222 * live as long as the cache remains.
1223 */
1226
1229
1231
1232 /*
1233 * Cache the map that will be used to convert the relation's tuples into
1234 * the ancestor's format, if needed.
1235 */
1236 if (entry->publish_as_relid != RelationGetRelid(relation))
1237 {
1239 TupleDesc indesc = RelationGetDescr(relation);
1241
1242 /* Map must live as long as the logical decoding context. */
1243 oldctx = MemoryContextSwitchTo(data->cachectx);
1244
1245 entry->attrmap = build_attrmap_by_name_if_req(indesc, outdesc, false);
1246
1249 }
1250}
1251
1252/*
1253 * Change is checked against the row filter if any.
1254 *
1255 * Returns true if the change is to be replicated, else false.
1256 *
1257 * For inserts, evaluate the row filter for new tuple.
1258 * For deletes, evaluate the row filter for old tuple.
1259 * For updates, evaluate the row filter for old and new tuple.
1260 *
1261 * For updates, if both evaluations are true, we allow sending the UPDATE and
1262 * if both the evaluations are false, it doesn't replicate the UPDATE. Now, if
1263 * only one of the tuples matches the row filter expression, we transform
1264 * UPDATE to DELETE or INSERT to avoid any data inconsistency based on the
1265 * following rules:
1266 *
1267 * Case 1: old-row (no match) new-row (no match) -> (drop change)
1268 * Case 2: old-row (no match) new row (match) -> INSERT
1269 * Case 3: old-row (match) new-row (no match) -> DELETE
1270 * Case 4: old-row (match) new row (match) -> UPDATE
1271 *
1272 * The new action is updated in the action parameter.
1273 *
1274 * The new slot could be updated when transforming the UPDATE into INSERT,
1275 * because the original new tuple might not have column values from the replica
1276 * identity.
1277 *
1278 * Examples:
1279 * Let's say the old tuple satisfies the row filter but the new tuple doesn't.
1280 * Since the old tuple satisfies, the initial table synchronization copied this
1281 * row (or another method was used to guarantee that there is data
1282 * consistency). However, after the UPDATE the new tuple doesn't satisfy the
1283 * row filter, so from a data consistency perspective, that row should be
1284 * removed on the subscriber. The UPDATE should be transformed into a DELETE
1285 * statement and be sent to the subscriber. Keeping this row on the subscriber
1286 * is undesirable because it doesn't reflect what was defined in the row filter
1287 * expression on the publisher. This row on the subscriber would likely not be
1288 * modified by replication again. If someone inserted a new row with the same
1289 * old identifier, replication could stop due to a constraint violation.
1290 *
1291 * Let's say the old tuple doesn't match the row filter but the new tuple does.
1292 * Since the old tuple doesn't satisfy, the initial table synchronization
1293 * probably didn't copy this row. However, after the UPDATE the new tuple does
1294 * satisfy the row filter, so from a data consistency perspective, that row
1295 * should be inserted on the subscriber. Otherwise, subsequent UPDATE or DELETE
1296 * statements have no effect (it matches no row -- see
1297 * apply_handle_update_internal()). So, the UPDATE should be transformed into an
1298 * INSERT statement and be sent to the subscriber. However, this might surprise
1299 * someone who expects the data set to satisfy the row filter expression on the
1300 * provider.
1301 */
1302static bool
1306{
1307 TupleDesc desc;
1308 int i;
1309 bool old_matched,
1311 result;
1313 TupleTableSlot *new_slot = *new_slot_ptr;
1316
1317 /*
1318 * We need this map to avoid relying on ReorderBufferChangeType enums
1319 * having specific values.
1320 */
1321 static const int map_changetype_pubaction[] = {
1325 };
1326
1328 *action == REORDER_BUFFER_CHANGE_UPDATE ||
1329 *action == REORDER_BUFFER_CHANGE_DELETE);
1330
1331 Assert(new_slot || old_slot);
1332
1333 /* Get the corresponding row filter */
1335
1336 /* Bail out if there is no row filter */
1337 if (!filter_exprstate)
1338 return true;
1339
1340 elog(DEBUG3, "table \"%s.%s\" has row filter",
1342 RelationGetRelationName(relation));
1343
1345
1347
1348 /*
1349 * For the following occasions where there is only one tuple, we can
1350 * evaluate the row filter for that tuple and return.
1351 *
1352 * For inserts, we only have the new tuple.
1353 *
1354 * For updates, we can have only a new tuple when none of the replica
1355 * identity columns changed and none of those columns have external data
1356 * but we still need to evaluate the row filter for the new tuple as the
1357 * existing values of those columns might not match the filter. Also,
1358 * users can use constant expressions in the row filter, so we anyway need
1359 * to evaluate it for the new tuple.
1360 *
1361 * For deletes, we only have the old tuple.
1362 */
1363 if (!new_slot || !old_slot)
1364 {
1365 ecxt->ecxt_scantuple = new_slot ? new_slot : old_slot;
1367
1368 return result;
1369 }
1370
1371 /*
1372 * Both an old and a new tuple are present only for updates, and each needs
1373 * to be checked against the row filter.
1374 */
1376
1377 slot_getallattrs(new_slot);
1378 slot_getallattrs(old_slot);
1379
1381 desc = RelationGetDescr(relation);
1382
1383 /*
1384 * The new tuple might not have all the replica identity columns, in which
1385 * case it needs to be copied over from the old tuple.
1386 */
1387 for (i = 0; i < desc->natts; i++)
1388 {
1390
1391 /*
1392 * if the column in the new tuple or old tuple is null, nothing to do
1393 */
1394 if (new_slot->tts_isnull[i] || old_slot->tts_isnull[i])
1395 continue;
1396
1397 /*
1398 * Unchanged toasted replica identity columns are only logged in the
1399 * old tuple. Copy this over to the new tuple. The changed (or WAL
1400 * Logged) toast values are always assembled in memory and set as
1401 * VARTAG_INDIRECT. See ReorderBufferToastReplace.
1402 */
1403 if (att->attlen == -1 &&
1406 {
1407 if (!tmp_new_slot)
1408 {
1411
1412 memcpy(tmp_new_slot->tts_values, new_slot->tts_values,
1413 desc->natts * sizeof(Datum));
1414 memcpy(tmp_new_slot->tts_isnull, new_slot->tts_isnull,
1415 desc->natts * sizeof(bool));
1416 }
1417
1418 tmp_new_slot->tts_values[i] = old_slot->tts_values[i];
1419 tmp_new_slot->tts_isnull[i] = old_slot->tts_isnull[i];
1420 }
1421 }
1422
1423 ecxt->ecxt_scantuple = old_slot;
1425
1426 if (tmp_new_slot)
1427 {
1429 ecxt->ecxt_scantuple = tmp_new_slot;
1430 }
1431 else
1432 ecxt->ecxt_scantuple = new_slot;
1433
1435
1436 /*
1437 * Case 1: if both tuples don't match the row filter, bailout. Send
1438 * nothing.
1439 */
1440 if (!old_matched && !new_matched)
1441 return false;
1442
1443 /*
1444 * Case 2: if the old tuple doesn't satisfy the row filter but the new
1445 * tuple does, transform the UPDATE into INSERT.
1446 *
1447 * Use the newly transformed tuple that must contain the column values for
1448 * all the replica identity columns. This is required to ensure that, while
1449 * inserting the tuple in the downstream node, we have all the required
1450 * column values.
1451 */
1452 if (!old_matched && new_matched)
1453 {
1455
1456 if (tmp_new_slot)
1458 }
1459
1460 /*
1461 * Case 3: if the old tuple satisfies the row filter but the new tuple
1462 * doesn't, transform the UPDATE into DELETE.
1463 *
1464 * This transformation does not require another tuple. The Old tuple will
1465 * be used for DELETE.
1466 */
1467 else if (old_matched && !new_matched)
1469
1470 /*
1471 * Case 4: if both tuples match the row filter, transformation isn't
1472 * required. (*action is default UPDATE).
1473 */
1474
1475 return true;
1476}
1477
1478/*
1479 * Sends the decoded DML over wire.
1480 *
1481 * This is called both in streaming and non-streaming modes.
1482 */
1483static void
1485 Relation relation, ReorderBufferChange *change)
1486{
1493 Relation targetrel = relation;
1494 ReorderBufferChangeType action = change->action;
1495 TupleTableSlot *old_slot = NULL;
1496 TupleTableSlot *new_slot = NULL;
1497
1498 if (!is_publishable_relation(relation))
1499 return;
1500
1501 /*
1502 * Remember the xid for the change in streaming mode. We need to send the
1503 * xid with each change in streaming mode so that the subscriber can
1504 * associate the change with its transaction and, on abort, discard the
1505 * corresponding changes.
1506 */
1507 if (data->in_streaming)
1508 xid = change->txn->xid;
1509
1510 relentry = get_rel_sync_entry(data, relation);
1511
1512 /* First check the table filter */
1513 switch (action)
1514 {
1516 if (!relentry->pubactions.pubinsert)
1517 return;
1518 break;
1520 if (!relentry->pubactions.pubupdate)
1521 return;
1522 break;
1524 if (!relentry->pubactions.pubdelete)
1525 return;
1526
1527 /*
1528 * This is only possible if deletes are allowed even when replica
1529 * identity is not defined for a table. Since the DELETE action
1530 * can't be published, we simply return.
1531 */
1532 if (!change->data.tp.oldtuple)
1533 {
1534 elog(DEBUG1, "didn't send DELETE change because of missing oldtuple");
1535 return;
1536 }
1537 break;
1538 default:
1539 Assert(false);
1540 }
1541
1542 /* Avoid leaking memory by using and resetting our own context */
1543 old = MemoryContextSwitchTo(data->context);
1544
1545 /* Switch relation if publishing via root. */
1546 if (relentry->publish_as_relid != RelationGetRelid(relation))
1547 {
1548 Assert(relation->rd_rel->relispartition);
1549 ancestor = RelationIdGetRelation(relentry->publish_as_relid);
1551 }
1552
1553 if (change->data.tp.oldtuple)
1554 {
1555 old_slot = relentry->old_slot;
1556 ExecStoreHeapTuple(change->data.tp.oldtuple, old_slot, false);
1557
1558 /* Convert tuple if needed. */
1559 if (relentry->attrmap)
1560 {
1562 &TTSOpsVirtual);
1563
1564 old_slot = execute_attr_map_slot(relentry->attrmap, old_slot, slot);
1565 }
1566 }
1567
1568 if (change->data.tp.newtuple)
1569 {
1570 new_slot = relentry->new_slot;
1571 ExecStoreHeapTuple(change->data.tp.newtuple, new_slot, false);
1572
1573 /* Convert tuple if needed. */
1574 if (relentry->attrmap)
1575 {
1577 &TTSOpsVirtual);
1578
1579 new_slot = execute_attr_map_slot(relentry->attrmap, new_slot, slot);
1580 }
1581 }
1582
1583 /*
1584 * Check row filter.
1585 *
1586 * Updates could be transformed to inserts or deletes based on the results
1587 * of the row filter for old and new tuple.
1588 */
1589 if (!pgoutput_row_filter(targetrel, old_slot, &new_slot, relentry, &action))
1590 goto cleanup;
1591
1592 /*
1593 * Send BEGIN if we haven't yet.
1594 *
1595 * We send the BEGIN message after ensuring that we will actually send the
1596 * change. This avoids sending a pair of BEGIN/COMMIT messages for empty
1597 * transactions.
1598 */
1599 if (txndata && !txndata->sent_begin_txn)
1600 pgoutput_send_begin(ctx, txn);
1601
1602 /*
1603 * Schema should be sent using the original relation because it also sends
1604 * the ancestor's relation.
1605 */
1606 maybe_send_schema(ctx, change, relation, relentry);
1607
1608 OutputPluginPrepareWrite(ctx, true);
1609
1610 /* Send the data */
1611 switch (action)
1612 {
1614 logicalrep_write_insert(ctx->out, xid, targetrel, new_slot,
1615 data->binary, relentry->columns,
1616 relentry->include_gencols_type);
1617 break;
1619 logicalrep_write_update(ctx->out, xid, targetrel, old_slot,
1620 new_slot, data->binary, relentry->columns,
1621 relentry->include_gencols_type);
1622 break;
1624 logicalrep_write_delete(ctx->out, xid, targetrel, old_slot,
1625 data->binary, relentry->columns,
1626 relentry->include_gencols_type);
1627 break;
1628 default:
1629 Assert(false);
1630 }
1631
1632 OutputPluginWrite(ctx, true);
1633
1634cleanup:
1636 {
1638 ancestor = NULL;
1639 }
1640
1641 /* Drop the new slots that were used to store the converted tuples. */
1642 if (relentry->attrmap)
1643 {
1644 if (old_slot)
1646
1647 if (new_slot)
1649 }
1650
1652 MemoryContextReset(data->context);
1653}
1654
/*
 * Publish a TRUNCATE of one or more relations.
 *
 * Walks relations[0 .. nrelations-1] and keeps the OID of each relation that
 * is publishable, whose sync entry has pubactions.pubtruncate set, and that
 * is not a partition being published under a different relid. For every
 * relation kept, BEGIN is sent first if it has not been sent yet, and
 * maybe_send_schema() is called for it.
 *
 * If at least one relation was kept, one write is prepared that carries the
 * xid, the collected OIDs and the cascade / restart_seqs flags of the change.
 * If none was kept, nothing is written.
 *
 * Allocations made here (including relids) happen in data->context, which is
 * reset before returning.
 */
1655static void
1657 int nrelations, Relation relations[], ReorderBufferChange *change)
1658{
1663 int i;
1664 int nrelids;
1665 Oid *relids;
1667
1668 /* Remember the xid for the change in streaming mode. See pgoutput_change. */
1669 if (data->in_streaming)
1670 xid = change->txn->xid;
1671
1672 old = MemoryContextSwitchTo(data->context);
1673
 /* Sized for the worst case: every relation passed in gets published. */
1674 relids = palloc0(nrelations * sizeof(Oid));
1675 nrelids = 0;
1676
1677 for (i = 0; i < nrelations; i++)
1678 {
1679 Relation relation = relations[i];
1680 Oid relid = RelationGetRelid(relation);
1681
1682 if (!is_publishable_relation(relation))
1683 continue;
1684
1685 relentry = get_rel_sync_entry(data, relation);
1686
1687 if (!relentry->pubactions.pubtruncate)
1688 continue;
1689
1690 /*
1691 * Don't send partitions if the publication wants to send only the
1692 * root tables through it.
1693 */
1694 if (relation->rd_rel->relispartition &&
1695 relentry->publish_as_relid != relid)
1696 continue;
1697
1698 relids[nrelids++] = relid;
1699
1700 /* Send BEGIN if we haven't yet */
1701 if (txndata && !txndata->sent_begin_txn)
1702 pgoutput_send_begin(ctx, txn);
1703
1704 maybe_send_schema(ctx, change, relation, relentry);
1705 }
1706
 /* Only emit a message when at least one relation survived the filters. */
1707 if (nrelids > 0)
1708 {
1709 OutputPluginPrepareWrite(ctx, true);
1711 xid,
1712 nrelids,
1713 relids,
1714 change->data.truncate.cascade,
1715 change->data.truncate.restart_seqs);
1716 OutputPluginWrite(ctx, true);
1717 }
1718
1720 MemoryContextReset(data->context);
1721}
1722
/*
 * Write a decoded message (prefix, sz, message) to the output.
 *
 * Does nothing unless data->messages is set. In streaming mode the xid of
 * txn is sent along with the message. For a transactional message, BEGIN is
 * sent first if it has not been sent yet; a non-transactional message is
 * written without one.
 */
1723static void
1725 XLogRecPtr message_lsn, bool transactional, const char *prefix, Size sz,
1726 const char *message)
1727{
1730
 /* Messages are only forwarded when enabled in the plugin data. */
1731 if (!data->messages)
1732 return;
1733
1734 /*
1735 * Remember the xid for the message in streaming mode. See
1736 * pgoutput_change.
1737 */
1738 if (data->in_streaming)
1739 xid = txn->xid;
1740
1741 /*
1742 * Output BEGIN if we haven't yet. Avoid for non-transactional messages.
1743 */
1744 if (transactional)
1745 {
1747
1748 /* Send BEGIN if we haven't yet */
1749 if (txndata && !txndata->sent_begin_txn)
1750 pgoutput_send_begin(ctx, txn);
1751 }
1752
1753 OutputPluginPrepareWrite(ctx, true);
1755 xid,
1757 transactional,
1758 prefix,
1759 sz,
1760 message);
1761 OutputPluginWrite(ctx, true);
1762}
1763
1764/*
1765 * Return true if the data is associated with an origin and the user has
1766 * requested the changes that don't have an origin, false otherwise.
1767 */
1768static bool
1770 ReplOriginId origin_id)
1771{
1773
1774 if (data->publish_no_origin && origin_id != InvalidReplOriginId)
1775 return true;
1776
1777 return false;
1778}
1779
1780/*
1781 * Shutdown the output plugin.
1782 *
1783 * Note, we don't need to clean the data->context, data->cachectx, and
1784 * data->pubctx as they are child contexts of the ctx->context so they
1785 * will be cleaned up by logical decoding machinery.
1786 */
1787static void
1792
1793/*
1794 * Load publications from the list of publication names.
1795 *
1796 * Here, we skip the publications that don't exist yet. This allows us to
1797 * continue the replication even when a requested publication is missing; a
1798 * message is reported for each publication that is skipped. This is required
1799 * because we allow the users to create publications after they have specified
 * the required publications at the time of replication start.
 *
 * Returns a list of the Publication objects that were found, in the same
 * order as their names appear in pubnames. The result is NIL when none of
 * the names could be resolved (or pubnames is empty).
1800 */
1801static List *
1803{
1804 List *result = NIL;
1805 ListCell *lc;
1806
1807 foreach(lc, pubnames)
1808 {
1809 char *pubname = (char *) lfirst(lc);
 /* A NULL result is handled below rather than treated as an error. */
1810 Publication *pub = GetPublicationByName(pubname, true);
1811
1812 if (pub)
1813 result = lappend(result, pub);
1814 else
1817 errmsg("skipped loading publication \"%s\"", pubname),
1818 errdetail("The publication does not exist at this point in the WAL."),
1819 errhint("Create the publication if it does not exist."));
1820 }
1821
1822 return result;
1823}
1824
1825/*
1826 * Publication syscache invalidation callback.
1827 *
1828 * Called for invalidations on pg_publication.
1829 */
1830static void
1836
1837/*
1838 * START STREAM callback
1839 */
1840static void
1842 ReorderBufferTXN *txn)
1843{
1846
1847 /* we can't nest streaming of transactions */
1848 Assert(!data->in_streaming);
1849
1850 /*
1851 * If we already sent the first stream for this transaction then don't
1852 * send the origin id in the subsequent streams.
1853 */
1854 if (rbtxn_is_streamed(txn))
1856
1859
1862
1863 OutputPluginWrite(ctx, true);
1864
1865 /* we're streaming a chunk of transaction now */
1866 data->in_streaming = true;
1867}
1868
1869/*
1870 * STOP STREAM callback
1871 */
1872static void
1874 ReorderBufferTXN *txn)
1875{
1877
1878 /* we should be streaming a transaction */
1879 Assert(data->in_streaming);
1880
1881 OutputPluginPrepareWrite(ctx, true);
1883 OutputPluginWrite(ctx, true);
1884
1885 /* we've stopped streaming a transaction */
1886 data->in_streaming = false;
1887}
1888
1889/*
1890 * Notify downstream to discard the streamed transaction (along with all
1891 * its subtransactions, if it's a toplevel transaction).
1892 */
1893static void
1895 ReorderBufferTXN *txn,
1896 XLogRecPtr abort_lsn)
1897{
1898 ReorderBufferTXN *toptxn;
1900 bool write_abort_info = (data->streaming == LOGICALREP_STREAM_PARALLEL);
1901
1902 /*
1903 * The abort should happen outside streaming block, even for streamed
1904 * transactions. The transaction has to be marked as streamed, though.
1905 */
1906 Assert(!data->in_streaming);
1907
1908 /* determine the toplevel transaction */
1909 toptxn = rbtxn_get_toptxn(txn);
1910
1911 Assert(rbtxn_is_streamed(toptxn));
1912
1913 OutputPluginPrepareWrite(ctx, true);
1914 logicalrep_write_stream_abort(ctx->out, toptxn->xid, txn->xid, abort_lsn,
1916
1917 OutputPluginWrite(ctx, true);
1918
1919 cleanup_rel_sync_cache(toptxn->xid, false);
1920}
1921
1922/*
1923 * Notify downstream to apply the streamed transaction (along with all
1924 * its subtransactions).
1925 */
1926static void
1928 ReorderBufferTXN *txn,
1929 XLogRecPtr commit_lsn)
1930{
1932
1933 /*
1934 * The commit should happen outside streaming block, even for streamed
1935 * transactions. The transaction has to be marked as streamed, though.
1936 */
1937 Assert(!data->in_streaming);
1939
1940 OutputPluginUpdateProgress(ctx, false);
1941
1942 OutputPluginPrepareWrite(ctx, true);
1943 logicalrep_write_stream_commit(ctx->out, txn, commit_lsn);
1944 OutputPluginWrite(ctx, true);
1945
1946 cleanup_rel_sync_cache(txn->xid, true);
1947}
1948
1949/*
1950 * PREPARE callback (for streaming two-phase commit).
1951 *
1952 * Notify the downstream to prepare the transaction.
1953 */
1954static void
1956 ReorderBufferTXN *txn,
1957 XLogRecPtr prepare_lsn)
1958{
1960
1961 OutputPluginUpdateProgress(ctx, false);
1962 OutputPluginPrepareWrite(ctx, true);
1963 logicalrep_write_stream_prepare(ctx->out, txn, prepare_lsn);
1964 OutputPluginWrite(ctx, true);
1965}
1966
1967/*
1968 * Initialize the relation schema sync cache for a decoding session.
1969 *
1970 * The hash table is destroyed at the end of a decoding session. While
1971 * relcache invalidations still exist and will still be invoked, they
1972 * will just see the null hash table global and take no action.
1973 */
1974static void
1976{
1977 HASHCTL ctl;
1978 static bool relation_callbacks_registered = false;
1979
1980 /* Nothing to do if hash table already exists */
1981 if (RelationSyncCache != NULL)
1982 return;
1983
1984 /* Make a new hash table for the cache */
1985 ctl.keysize = sizeof(Oid);
1986 ctl.entrysize = sizeof(RelationSyncEntry);
1987 ctl.hcxt = cachectx;
1988
1989 RelationSyncCache = hash_create("logical replication output relation cache",
1990 128, &ctl,
1992
1994
1995 /* No more to do if we already registered callbacks */
1997 return;
1998
1999 /* We must update the cache entry for a relation after a relcache flush */
2001
2002 /*
2003 * Flush all cache entries after a pg_namespace change, in case it was a
2004 * schema rename affecting a relation being replicated.
2005 *
2006 * XXX: It is not a good idea to invalidate all the relation entries in
2007 * RelationSyncCache on schema rename. We can optimize it to invalidate
2008 * only the required relations by either having a specific invalidation
2009 * message containing impacted relations or by having schema information
2010 * in each RelationSyncCache entry and using hashvalue of pg_namespace.oid
2011 * passed to the callback.
2012 */
2015 (Datum) 0);
2016
2018}
2019
2020/*
2021 * We expect a relatively small number of streamed transactions.
2022 */
2023static bool
2028
2029/*
2030 * Add the xid in the rel sync entry for which we have already sent the schema
2031 * of the relation.
2032 */
2033static void
2044
2045/*
2046 * Find or create entry in the relation schema cache.
2047 *
2048 * This looks up publications that the given relation is directly or
2049 * indirectly part of (the latter if it's really the relation's ancestor that
2050 * is part of a publication) and fills up the found entry with the information
2051 * about which operations to publish and whether to use an ancestor's schema
2052 * when publishing.
2053 */
2054static RelationSyncEntry *
2056{
2057 RelationSyncEntry *entry;
2058 bool found;
2060 Oid relid = RelationGetRelid(relation);
2061
2063
2064 /* Find cached relation info, creating if not found */
2066 &relid,
2067 HASH_ENTER, &found);
2068 Assert(entry != NULL);
2069
2070 /* initialize entry, if it's new */
2071 if (!found)
2072 {
2073 entry->replicate_valid = false;
2074 entry->schema_sent = false;
2076 entry->streamed_txns = NIL;
2077 entry->pubactions.pubinsert = entry->pubactions.pubupdate =
2078 entry->pubactions.pubdelete = entry->pubactions.pubtruncate = false;
2079 entry->new_slot = NULL;
2080 entry->old_slot = NULL;
2081 memset(entry->exprstate, 0, sizeof(entry->exprstate));
2082 entry->entry_cxt = NULL;
2084 entry->columns = NULL;
2085 entry->attrmap = NULL;
2086 }
2087
2088 /* Validate the entry */
2089 if (!entry->replicate_valid)
2090 {
2093
2094 /*
2095 * We don't acquire a lock on the namespace system table as we build
2096 * the cache entry using a historic snapshot and all the later changes
2097 * are absorbed while decoding WAL.
2098 */
2100 ListCell *lc;
2101 Oid publish_as_relid = relid;
2102 int publish_ancestor_level = 0;
2104 char relkind = get_rel_relkind(relid);
2106
2107 /* Reload publications if needed before use. */
2108 if (!publications_valid)
2109 {
2110 MemoryContextReset(data->pubctx);
2111
2113 data->publications = LoadPublications(data->publication_names);
2115 publications_valid = true;
2116 }
2117
2118 /*
2119 * Reset schema_sent status as the relation definition may have
2120 * changed. Also reset pubactions to empty in case rel was dropped
2121 * from a publication. Also free any objects that depended on the
2122 * earlier definition.
2123 */
2124 entry->schema_sent = false;
2126 list_free(entry->streamed_txns);
2127 entry->streamed_txns = NIL;
2128 bms_free(entry->columns);
2129 entry->columns = NULL;
2130 entry->pubactions.pubinsert = false;
2131 entry->pubactions.pubupdate = false;
2132 entry->pubactions.pubdelete = false;
2133 entry->pubactions.pubtruncate = false;
2134
2135 /*
2136 * Tuple slots cleanups. (Will be rebuilt later if needed).
2137 */
2138 if (entry->old_slot)
2139 {
2140 TupleDesc desc = entry->old_slot->tts_tupleDescriptor;
2141
2142 Assert(desc->tdrefcount == -1);
2143
2145
2146 /*
2147 * ExecDropSingleTupleTableSlot() would not free the TupleDesc, so
2148 * do it now to avoid any leaks.
2149 */
2150 FreeTupleDesc(desc);
2151 }
2152 if (entry->new_slot)
2153 {
2154 TupleDesc desc = entry->new_slot->tts_tupleDescriptor;
2155
2156 Assert(desc->tdrefcount == -1);
2157
2159
2160 /*
2161 * ExecDropSingleTupleTableSlot() would not free the TupleDesc, so
2162 * do it now to avoid any leaks.
2163 */
2164 FreeTupleDesc(desc);
2165 }
2166
2167 entry->old_slot = NULL;
2168 entry->new_slot = NULL;
2169
2170 if (entry->attrmap)
2171 free_attrmap(entry->attrmap);
2172 entry->attrmap = NULL;
2173
2174 /*
2175 * Row filter cache cleanups.
2176 */
2177 if (entry->entry_cxt)
2179
2180 entry->entry_cxt = NULL;
2181 entry->estate = NULL;
2182 memset(entry->exprstate, 0, sizeof(entry->exprstate));
2183
2184 /*
2185 * Build publication cache. We can't use one provided by relcache as
2186 * relcache considers all publications that the given relation is in,
2187 * but here we only need to consider ones that the subscriber
2188 * requested.
2189 */
2190 foreach(lc, data->publications)
2191 {
2192 Publication *pub = lfirst(lc);
2193 bool publish = false;
2194
2195 /*
2196 * Under what relid should we publish changes in this publication?
2197 * We'll use the top-most relid across all publications. Also
2198 * track the ancestor level for this publication.
2199 */
2200 Oid pub_relid = relid;
2201 int ancestor_level = 0;
2202
2203 /*
2204 * If this is a FOR ALL TABLES publication, pick the partition
2205 * root and set the ancestor level accordingly.
2206 */
2207 if (pub->alltables)
2208 {
2209 publish = true;
2210 if (pub->pubviaroot && am_partition)
2211 {
2212 List *ancestors = get_partition_ancestors(relid);
2213
2214 pub_relid = llast_oid(ancestors);
2215 ancestor_level = list_length(ancestors);
2216 }
2217 }
2218
2219 if (!publish)
2220 {
2221 bool ancestor_published = false;
2222
2223 /*
2224 * For a partition, check if any of the ancestors are
2225 * published. If so, note down the topmost ancestor that is
2226 * published via this publication, which will be used as the
2227 * relation via which to publish the partition's changes.
2228 */
2229 if (am_partition)
2230 {
2231 Oid ancestor;
2232 int level;
2233 List *ancestors = get_partition_ancestors(relid);
2234
2236 ancestors,
2237 &level);
2238
2239 if (ancestor != InvalidOid)
2240 {
2241 ancestor_published = true;
2242 if (pub->pubviaroot)
2243 {
2245 ancestor_level = level;
2246 }
2247 }
2248 }
2249
2250 if (list_member_oid(pubids, pub->oid) ||
2253 publish = true;
2254 }
2255
2256 /*
2257 * If the relation is to be published, determine actions to
2258 * publish, and list of columns, if appropriate.
2259 *
2260 * Don't publish changes for partitioned tables, because
2261 * publishing those of its partitions suffices, unless partition
2262 * changes won't be published due to pubviaroot being set.
2263 */
2264 if (publish &&
2265 (relkind != RELKIND_PARTITIONED_TABLE || pub->pubviaroot))
2266 {
2271
2272 /*
2273 * We want to publish the changes as the top-most ancestor
2274 * across all publications. So we need to check if the already
2275 * calculated level is higher than the new one. If yes, we can
2276 * ignore the new value (as it's a child). Otherwise the new
2277 * value is an ancestor, so we keep it.
2278 */
2280 continue;
2281
2282 /*
2283 * If we found an ancestor higher up in the tree, discard the
2284 * list of publications through which we replicate it, and use
2285 * the new ancestor.
2286 */
2288 {
2289 publish_as_relid = pub_relid;
2291
2292 /* reset the publication list for this relation */
2294 }
2295 else
2296 {
2297 /* Same ancestor level, has to be the same OID. */
2298 Assert(publish_as_relid == pub_relid);
2299 }
2300
2301 /* Track publications for this ancestor. */
2303 }
2304 }
2305
2306 entry->publish_as_relid = publish_as_relid;
2307
2308 /*
2309 * Initialize the tuple slot, map, and row filter. These are only used
2310 * when publishing inserts, updates, or deletes.
2311 */
2312 if (entry->pubactions.pubinsert || entry->pubactions.pubupdate ||
2313 entry->pubactions.pubdelete)
2314 {
2315 /* Initialize the tuple slot and map */
2316 init_tuple_slot(data, relation, entry);
2317
2318 /* Initialize the row filter */
2320
2321 /* Check whether to publish generated columns. */
2323
2324 /* Initialize the column list */
2326 }
2327
2331
2332 entry->replicate_valid = true;
2333 }
2334
2335 return entry;
2336}
2337
2338/*
2339 * Cleanup list of streamed transactions and update the schema_sent flag.
2340 *
2341 * When a streamed transaction commits or aborts, we need to remove the
2342 * toplevel XID from the schema cache. If the transaction aborted, the
2343 * subscriber will simply throw away the schema records we streamed, so
2344 * we don't need to do anything else.
2345 *
2346 * If the transaction is committed, the subscriber will update the relation
2347 * cache - so tweak the schema_sent flag accordingly.
2348 */
2349static void
2351{
2353 RelationSyncEntry *entry;
2354
2356
2358 while ((entry = hash_seq_search(&hash_seq)) != NULL)
2359 {
2360 /*
2361 * We can set the schema_sent flag for an entry that has committed xid
2362 * in the list as that ensures that the subscriber would have the
2363 * corresponding schema and we don't need to send it unless there is
2364 * any invalidation for that relation.
2365 */
2367 {
2368 if (xid == streamed_txn)
2369 {
2370 if (is_commit)
2371 entry->schema_sent = true;
2372
2373 entry->streamed_txns =
2375 break;
2376 }
2377 }
2378 }
2379}
2380
2381/*
2382 * Relcache invalidation callback
 *
 * Marks the RelationSyncCache entry for relid as no longer valid by clearing
 * its replicate_valid flag. If relid is not a valid OID, every entry in the
 * cache is marked instead. Entries are only flagged here; nothing is freed
 * or rebuilt (see the comment in the body for why).
 *
 * Does nothing when RelationSyncCache does not exist.
2383 */
2384static void
2386{
2387 RelationSyncEntry *entry;
2388
2389 /*
2390 * We can get here if the plugin was used in SQL interface as the
2391 * RelationSyncCache is destroyed when the decoding finishes, but there is
2392 * no way to unregister the relcache invalidation callback.
2393 */
2394 if (RelationSyncCache == NULL)
2395 return;
2396
2397 /*
2398 * Nobody keeps pointers to entries in this hash table around outside
2399 * logical decoding callback calls - but invalidation events can come in
2400 * *during* a callback if we do any syscache access in the callback.
2401 * Because of that we must mark the cache entry as invalid but not damage
2402 * any of its substructure here. The next get_rel_sync_entry() call will
2403 * rebuild it all.
2404 */
2405 if (OidIsValid(relid))
2406 {
2407 /*
2408 * Getting invalidations for relations that aren't in the table is
2409 * entirely normal. So we don't care if it's found or not.
2410 */
2412 HASH_FIND, NULL);
2413 if (entry != NULL)
2414 entry->replicate_valid = false;
2415 }
2416 else
2417 {
2418 /* Whole cache must be flushed. */
2419 HASH_SEQ_STATUS status;
2420
2422 while ((entry = (RelationSyncEntry *) hash_seq_search(&status)) != NULL)
2423 {
2424 entry->replicate_valid = false;
2425 }
2426 }
2427}
2428
2429/*
2430 * Publication relation/schema map syscache invalidation callback
2431 *
2432 * Called for invalidations on pg_namespace.
2433 */
2434static void
2436 uint32 hashvalue)
2437{
2438 HASH_SEQ_STATUS status;
2439 RelationSyncEntry *entry;
2440
2441 /*
2442 * We can get here if the plugin was used in SQL interface as the
2443 * RelationSyncCache is destroyed when the decoding finishes, but there is
2444 * no way to unregister the invalidation callbacks.
2445 */
2446 if (RelationSyncCache == NULL)
2447 return;
2448
2449 /*
2450 * We have no easy way to identify which cache entries this invalidation
2451 * event might have affected, so just mark them all invalid.
2452 */
2454 while ((entry = (RelationSyncEntry *) hash_seq_search(&status)) != NULL)
2455 {
2456 entry->replicate_valid = false;
2457 }
2458}
2459
2460/*
 * Send Replication origin
 *
 * No-op unless send_origin is true and origin_id can be resolved to an
 * origin name. The lookup is done with missing_ok = true, so an unknown
 * origin is skipped rather than raising an error.
 *
 * When an origin message is written, the write already in progress is ended
 * first and a new one is prepared for the origin. That new write is still
 * open on return (this function does not call OutputPluginWrite() after
 * logicalrep_write_origin()), so the caller is presumably expected to finish
 * it -- NOTE(review): confirm against the call sites.
 */
2461static void
2463 XLogRecPtr origin_lsn, bool send_origin)
2464{
2465 if (send_origin)
2466 {
2467 char *origin;
2468
2469 /*----------
2470 * XXX: which behaviour do we want here?
2471 *
2472 * Alternatives:
2473 * - don't send origin message if origin name not found
2474 * (that's what we do now)
2475 * - throw error - that will break replication, not good
2476 * - send some special "unknown" origin
2477 *----------
2478 */
2479 if (replorigin_by_oid(origin_id, true, &origin))
2480 {
2481 /* Message boundary: end the current write, then start a new one */
2482 OutputPluginWrite(ctx, false);
2483 OutputPluginPrepareWrite(ctx, true);
2484
2485 logicalrep_write_origin(ctx->out, origin, origin_lsn);
2486 }
2487 }
2488}
Datum idx(PG_FUNCTION_ARGS)
Definition _int_op.c:262
void free_attrmap(AttrMap *map)
Definition attmap.c:56
AttrMap * build_attrmap_by_name_if_req(TupleDesc indesc, TupleDesc outdesc, bool missing_ok)
Definition attmap.c:261
Bitmapset * bms_make_singleton(int x)
Definition bitmapset.c:216
bool bms_equal(const Bitmapset *a, const Bitmapset *b)
Definition bitmapset.c:142
void bms_free(Bitmapset *a)
Definition bitmapset.c:239
static void cleanup(void)
Definition bootstrap.c:838
#define TextDatumGetCString(d)
Definition builtins.h:99
#define PG_UINT32_MAX
Definition c.h:616
#define PG_USED_FOR_ASSERTS_ONLY
Definition c.h:235
#define Assert(condition)
Definition c.h:885
uint32_t uint32
Definition c.h:558
uint32 TransactionId
Definition c.h:678
#define OidIsValid(objectId)
Definition c.h:800
size_t Size
Definition c.h:631
int64 TimestampTz
Definition timestamp.h:39
char * defGetString(DefElem *def)
Definition define.c:34
bool defGetBoolean(DefElem *def)
Definition define.c:93
void * hash_search(HTAB *hashp, const void *keyPtr, HASHACTION action, bool *foundPtr)
Definition dynahash.c:952
HTAB * hash_create(const char *tabname, int64 nelem, const HASHCTL *info, int flags)
Definition dynahash.c:358
void hash_destroy(HTAB *hashp)
Definition dynahash.c:865
void * hash_seq_search(HASH_SEQ_STATUS *status)
Definition dynahash.c:1415
void hash_seq_init(HASH_SEQ_STATUS *status, HTAB *hashp)
Definition dynahash.c:1380
Datum arg
Definition elog.c:1322
int errcode(int sqlerrcode)
Definition elog.c:874
int errmsg(const char *fmt,...)
Definition elog.c:1093
int errhint(const char *fmt,...) pg_attribute_printf(1
#define DEBUG3
Definition elog.h:28
int errdetail(const char *fmt,...) pg_attribute_printf(1
#define WARNING
Definition elog.h:36
#define DEBUG1
Definition elog.h:30
#define ERROR
Definition elog.h:39
#define elog(elevel,...)
Definition elog.h:226
#define ereport(elevel,...)
Definition elog.h:150
ExprState * ExecPrepareExpr(Expr *node, EState *estate)
Definition execExpr.c:765
TupleTableSlot * MakeSingleTupleTableSlot(TupleDesc tupdesc, const TupleTableSlotOps *tts_ops)
const TupleTableSlotOps TTSOpsVirtual
Definition execTuples.c:84
void ExecDropSingleTupleTableSlot(TupleTableSlot *slot)
TupleTableSlot * ExecStoreVirtualTuple(TupleTableSlot *slot)
const TupleTableSlotOps TTSOpsHeapTuple
Definition execTuples.c:85
TupleTableSlot * MakeTupleTableSlot(TupleDesc tupleDesc, const TupleTableSlotOps *tts_ops)
TupleTableSlot * ExecStoreHeapTuple(HeapTuple tuple, TupleTableSlot *slot, bool shouldFree)
void ExecInitRangeTable(EState *estate, List *rangeTable, List *permInfos, Bitmapset *unpruned_relids)
Definition execUtils.c:773
EState * CreateExecutorState(void)
Definition execUtils.c:88
#define ResetPerTupleExprContext(estate)
Definition executor.h:665
#define GetPerTupleExprContext(estate)
Definition executor.h:656
static Datum ExecEvalExprSwitchContext(ExprState *state, ExprContext *econtext, bool *isNull)
Definition executor.h:436
#define palloc0_object(type)
Definition fe_memutils.h:75
#define PG_MODULE_MAGIC_EXT(...)
Definition fmgr.h:540
@ HASH_FIND
Definition hsearch.h:113
@ HASH_ENTER
Definition hsearch.h:114
#define HASH_CONTEXT
Definition hsearch.h:102
#define HASH_ELEM
Definition hsearch.h:95
#define HASH_BLOBS
Definition hsearch.h:97
#define HeapTupleIsValid(tuple)
Definition htup.h:78
void CacheRegisterSyscacheCallback(SysCacheIdentifier cacheid, SyscacheCallbackFunction func, Datum arg)
Definition inval.c:1816
void CacheRegisterRelcacheCallback(RelcacheCallbackFunction func, Datum arg)
Definition inval.c:1858
void CacheRegisterRelSyncCallback(RelSyncCallbackFunction func, Datum arg)
Definition inval.c:1879
int i
Definition isn.c:77
List * lappend(List *list, void *datum)
Definition list.c:339
List * lappend_xid(List *list, TransactionId datum)
Definition list.c:393
bool list_member_xid(const List *list, TransactionId datum)
Definition list.c:742
void list_free(List *list)
Definition list.c:1546
bool list_member_oid(const List *list, Oid datum)
Definition list.c:722
void list_free_deep(List *list)
Definition list.c:1560
#define AccessShareLock
Definition lockdefs.h:36
void OutputPluginWrite(struct LogicalDecodingContext *ctx, bool last_write)
Definition logical.c:696
void OutputPluginUpdateProgress(struct LogicalDecodingContext *ctx, bool skipped_xact)
Definition logical.c:709
void OutputPluginPrepareWrite(struct LogicalDecodingContext *ctx, bool last_write)
Definition logical.c:683
#define LOGICALREP_PROTO_STREAM_PARALLEL_VERSION_NUM
#define LOGICALREP_PROTO_MIN_VERSION_NUM
#define LOGICALREP_PROTO_STREAM_VERSION_NUM
#define LOGICALREP_PROTO_TWOPHASE_VERSION_NUM
#define LOGICALREP_PROTO_MAX_VERSION_NUM
bool get_rel_relispartition(Oid relid)
Definition lsyscache.c:2177
char get_rel_relkind(Oid relid)
Definition lsyscache.c:2153
Oid get_rel_namespace(Oid relid)
Definition lsyscache.c:2102
char * get_namespace_name(Oid nspid)
Definition lsyscache.c:3518
Expr * make_orclause(List *orclauses)
Definition makefuncs.c:743
void MemoryContextReset(MemoryContext context)
Definition mcxt.c:403
void * MemoryContextAllocZero(MemoryContext context, Size size)
Definition mcxt.c:1266
char * pstrdup(const char *in)
Definition mcxt.c:1781
void MemoryContextRegisterResetCallback(MemoryContext context, MemoryContextCallback *cb)
Definition mcxt.c:582
void pfree(void *pointer)
Definition mcxt.c:1616
void * palloc0(Size size)
Definition mcxt.c:1417
MemoryContext CacheMemoryContext
Definition mcxt.c:169
void MemoryContextDelete(MemoryContext context)
Definition mcxt.c:472
#define AllocSetContextCreate
Definition memutils.h:129
#define ALLOCSET_DEFAULT_SIZES
Definition memutils.h:160
#define ALLOCSET_SMALL_SIZES
Definition memutils.h:170
#define MemoryContextCopyAndSetIdentifier(cxt, id)
Definition memutils.h:101
#define IsA(nodeptr, _type_)
Definition nodes.h:164
#define makeNode(_type_)
Definition nodes.h:161
bool replorigin_by_oid(ReplOriginId roident, bool missing_ok, char **roname)
Definition origin.c:501
#define InvalidReplOriginId
Definition origin.h:33
@ OUTPUT_PLUGIN_BINARY_OUTPUT
static MemoryContext MemoryContextSwitchTo(MemoryContext context)
Definition palloc.h:124
RTEPermissionInfo * addRTEPermissionInfo(List **rteperminfos, RangeTblEntry *rte)
@ RTE_RELATION
List * get_partition_ancestors(Oid relid)
Definition partition.c:134
FormData_pg_attribute * Form_pg_attribute
const void * data
#define lfirst(lc)
Definition pg_list.h:172
static int list_length(const List *l)
Definition pg_list.h:152
#define NIL
Definition pg_list.h:68
#define foreach_delete_current(lst, var_or_cell)
Definition pg_list.h:391
#define foreach_xid(var, lst)
Definition pg_list.h:472
#define list_make1(x1)
Definition pg_list.h:212
#define foreach_ptr(type, var, lst)
Definition pg_list.h:469
#define llast_oid(l)
Definition pg_list.h:200
List * GetRelationPublications(Oid relid)
Publication * GetPublicationByName(const char *pubname, bool missing_ok)
List * GetSchemaPublications(Oid schemaid)
Oid GetTopMostAncestorInPublication(Oid puboid, List *ancestors, int *ancestor_level)
Bitmapset * pub_form_cols_map(Relation relation, PublishGencolsType include_gencols_type)
bool check_and_fetch_column_list(Publication *pub, Oid relid, MemoryContext mcxt, Bitmapset **cols)
bool is_publishable_relation(Relation rel)
static List * LoadPublications(List *pubnames)
Definition pgoutput.c:1802
static void pgoutput_send_begin(LogicalDecodingContext *ctx, ReorderBufferTXN *txn)
Definition pgoutput.c:610
static void pgoutput_ensure_entry_cxt(PGOutputData *data, RelationSyncEntry *entry)
Definition pgoutput.c:896
static void parse_output_parameters(List *options, PGOutputData *data)
Definition pgoutput.c:290
static void init_tuple_slot(PGOutputData *data, Relation relation, RelationSyncEntry *entry)
Definition pgoutput.c:1211
static bool pgoutput_row_filter_exec_expr(ExprState *state, ExprContext *econtext)
Definition pgoutput.c:873
static void pgoutput_change(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, Relation relation, ReorderBufferChange *change)
Definition pgoutput.c:1484
#define NUM_ROWFILTER_PUBACTIONS
Definition pgoutput.c:106
static void pgoutput_begin_prepare_txn(LogicalDecodingContext *ctx, ReorderBufferTXN *txn)
Definition pgoutput.c:664
static void pgoutput_memory_context_reset(void *arg)
Definition pgoutput.c:438
static void send_relation_and_attrs(Relation relation, TransactionId xid, LogicalDecodingContext *ctx, RelationSyncEntry *relentry)
Definition pgoutput.c:798
static void pgoutput_startup(LogicalDecodingContext *ctx, OutputPluginOptions *opt, bool is_init)
Definition pgoutput.c:451
static void pgoutput_truncate(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, int nrelations, Relation relations[], ReorderBufferChange *change)
Definition pgoutput.c:1656
static void init_rel_sync_cache(MemoryContext cachectx)
Definition pgoutput.c:1975
RowFilterPubAction
Definition pgoutput.c:100
@ PUBACTION_INSERT
Definition pgoutput.c:101
@ PUBACTION_UPDATE
Definition pgoutput.c:102
@ PUBACTION_DELETE
Definition pgoutput.c:103
static void rel_sync_cache_relation_cb(Datum arg, Oid relid)
Definition pgoutput.c:2385
static void pgoutput_prepare_txn(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr prepare_lsn)
Definition pgoutput.c:681
static RelationSyncEntry * get_rel_sync_entry(PGOutputData *data, Relation relation)
Definition pgoutput.c:2055
static void pgoutput_rollback_prepared_txn(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr prepare_end_lsn, TimestampTz prepare_time)
Definition pgoutput.c:709
static void pgoutput_shutdown(LogicalDecodingContext *ctx)
Definition pgoutput.c:1788
static bool pgoutput_origin_filter(LogicalDecodingContext *ctx, ReplOriginId origin_id)
Definition pgoutput.c:1769
static void cleanup_rel_sync_cache(TransactionId xid, bool is_commit)
Definition pgoutput.c:2350
static void pgoutput_stream_abort(struct LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr abort_lsn)
Definition pgoutput.c:1894
static void pgoutput_stream_prepare_txn(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr prepare_lsn)
Definition pgoutput.c:1955
static void maybe_send_schema(LogicalDecodingContext *ctx, ReorderBufferChange *change, Relation relation, RelationSyncEntry *relentry)
Definition pgoutput.c:727
static void pgoutput_begin_txn(LogicalDecodingContext *ctx, ReorderBufferTXN *txn)
Definition pgoutput.c:596
static HTAB * RelationSyncCache
Definition pgoutput.c:220
static void pgoutput_row_filter_init(PGOutputData *data, List *publications, RelationSyncEntry *entry)
Definition pgoutput.c:918
static void pgoutput_stream_commit(struct LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr commit_lsn)
Definition pgoutput.c:1927
static void publication_invalidation_cb(Datum arg, SysCacheIdentifier cacheid, uint32 hashvalue)
Definition pgoutput.c:1831
static void check_and_init_gencol(PGOutputData *data, List *publications, RelationSyncEntry *entry)
Definition pgoutput.c:1065
static void pgoutput_commit_prepared_txn(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr commit_lsn)
Definition pgoutput.c:695
static bool pgoutput_row_filter(Relation relation, TupleTableSlot *old_slot, TupleTableSlot **new_slot_ptr, RelationSyncEntry *entry, ReorderBufferChangeType *action)
Definition pgoutput.c:1303
static void set_schema_sent_in_streamed_txn(RelationSyncEntry *entry, TransactionId xid)
Definition pgoutput.c:2034
static void pgoutput_column_list_init(PGOutputData *data, List *publications, RelationSyncEntry *entry)
Definition pgoutput.c:1124
static void pgoutput_stream_stop(struct LogicalDecodingContext *ctx, ReorderBufferTXN *txn)
Definition pgoutput.c:1873
static void rel_sync_cache_publication_cb(Datum arg, SysCacheIdentifier cacheid, uint32 hashvalue)
Definition pgoutput.c:2435
static void pgoutput_stream_start(struct LogicalDecodingContext *ctx, ReorderBufferTXN *txn)
Definition pgoutput.c:1841
static void send_repl_origin(LogicalDecodingContext *ctx, ReplOriginId origin_id, XLogRecPtr origin_lsn, bool send_origin)
Definition pgoutput.c:2462
void _PG_output_plugin_init(OutputPluginCallbacks *cb)
Definition pgoutput.c:261
static void pgoutput_message(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr message_lsn, bool transactional, const char *prefix, Size sz, const char *message)
Definition pgoutput.c:1724
static void pgoutput_commit_txn(LogicalDecodingContext *ctx, ReorderBufferTXN *txn, XLogRecPtr commit_lsn)
Definition pgoutput.c:632
static bool publications_valid
Definition pgoutput.c:86
static bool get_schema_sent_in_streamed_txn(RelationSyncEntry *entry, TransactionId xid)
Definition pgoutput.c:2024
static EState * create_estate_for_relation(Relation rel)
Definition pgoutput.c:842
int pg_strcasecmp(const char *s1, const char *s2)
static bool DatumGetBool(Datum X)
Definition postgres.h:100
static Datum ObjectIdGetDatum(Oid X)
Definition postgres.h:262
uint64_t Datum
Definition postgres.h:70
static Pointer DatumGetPointer(Datum X)
Definition postgres.h:342
#define InvalidOid
unsigned int Oid
static int fb(int x)
void logicalrep_write_commit(StringInfo out, ReorderBufferTXN *txn, XLogRecPtr commit_lsn)
Definition proto.c:78
void logicalrep_write_rollback_prepared(StringInfo out, ReorderBufferTXN *txn, XLogRecPtr prepare_end_lsn, TimestampTz prepare_time)
Definition proto.c:293
void logicalrep_write_insert(StringInfo out, TransactionId xid, Relation rel, TupleTableSlot *newslot, bool binary, Bitmapset *columns, PublishGencolsType include_gencols_type)
Definition proto.c:403
void logicalrep_write_origin(StringInfo out, const char *origin, XLogRecPtr origin_lsn)
Definition proto.c:374
void logicalrep_write_rel(StringInfo out, TransactionId xid, Relation rel, Bitmapset *columns, PublishGencolsType include_gencols_type)
Definition proto.c:667
void logicalrep_write_stream_abort(StringInfo out, TransactionId xid, TransactionId subxid, XLogRecPtr abort_lsn, TimestampTz abort_time, bool write_abort_info)
Definition proto.c:1161
void logicalrep_write_message(StringInfo out, TransactionId xid, XLogRecPtr lsn, bool transactional, const char *prefix, Size sz, const char *message)
Definition proto.c:640
void logicalrep_write_prepare(StringInfo out, ReorderBufferTXN *txn, XLogRecPtr prepare_lsn)
Definition proto.c:187
void logicalrep_write_typ(StringInfo out, TransactionId xid, Oid typoid)
Definition proto.c:726
void logicalrep_write_delete(StringInfo out, TransactionId xid, Relation rel, TupleTableSlot *oldslot, bool binary, Bitmapset *columns, PublishGencolsType include_gencols_type)
Definition proto.c:528
void logicalrep_write_truncate(StringInfo out, TransactionId xid, int nrelids, Oid relids[], bool cascade, bool restart_seqs)
Definition proto.c:583
void logicalrep_write_begin(StringInfo out, ReorderBufferTXN *txn)
Definition proto.c:49
void logicalrep_write_commit_prepared(StringInfo out, ReorderBufferTXN *txn, XLogRecPtr commit_lsn)
Definition proto.c:237
void logicalrep_write_stream_commit(StringInfo out, ReorderBufferTXN *txn, XLogRecPtr commit_lsn)
Definition proto.c:1107
void logicalrep_write_stream_prepare(StringInfo out, ReorderBufferTXN *txn, XLogRecPtr prepare_lsn)
Definition proto.c:353
void logicalrep_write_begin_prepare(StringInfo out, ReorderBufferTXN *txn)
Definition proto.c:116
bool logicalrep_should_publish_column(Form_pg_attribute att, Bitmapset *columns, PublishGencolsType include_gencols_type)
Definition proto.c:1282
void logicalrep_write_stream_start(StringInfo out, TransactionId xid, bool first_segment)
Definition proto.c:1064
void logicalrep_write_update(StringInfo out, TransactionId xid, Relation rel, TupleTableSlot *oldslot, TupleTableSlot *newslot, bool binary, Bitmapset *columns, PublishGencolsType include_gencols_type)
Definition proto.c:450
void logicalrep_write_stream_stop(StringInfo out)
Definition proto.c:1098
tree ctl
Definition radixtree.h:1838
void * stringToNode(const char *str)
Definition read.c:90
#define RelationGetRelid(relation)
Definition rel.h:514
#define RelationGetDescr(relation)
Definition rel.h:540
#define RelationGetRelationName(relation)
Definition rel.h:548
#define RelationIsValid(relation)
Definition rel.h:489
#define RelationGetNamespace(relation)
Definition rel.h:555
Relation RelationIdGetRelation(Oid relationId)
Definition relcache.c:2094
void RelationClose(Relation relation)
Definition relcache.c:2215
#define rbtxn_is_streamed(txn)
#define rbtxn_get_toptxn(txn)
#define rbtxn_is_subtxn(txn)
ReorderBufferChangeType
@ REORDER_BUFFER_CHANGE_INSERT
@ REORDER_BUFFER_CHANGE_DELETE
@ REORDER_BUFFER_CHANGE_UPDATE
Node * expand_generated_columns_in_expr(Node *node, Relation rel, int rt_index)
CommandId es_output_cid
Definition execnodes.h:685
Size keysize
Definition hsearch.h:75
Definition pg_list.h:54
MemoryContext context
Definition logical.h:36
void * output_plugin_private
Definition logical.h:76
List * output_plugin_options
Definition logical.h:59
LogicalDecodeStreamChangeCB stream_change_cb
LogicalDecodeMessageCB message_cb
LogicalDecodeStreamTruncateCB stream_truncate_cb
LogicalDecodeStreamMessageCB stream_message_cb
LogicalDecodeFilterByOriginCB filter_by_origin_cb
LogicalDecodeTruncateCB truncate_cb
LogicalDecodeStreamStopCB stream_stop_cb
LogicalDecodeStreamCommitCB stream_commit_cb
LogicalDecodeRollbackPreparedCB rollback_prepared_cb
LogicalDecodeStreamPrepareCB stream_prepare_cb
LogicalDecodeCommitPreparedCB commit_prepared_cb
LogicalDecodeStreamStartCB stream_start_cb
LogicalDecodePrepareCB prepare_cb
LogicalDecodeStartupCB startup_cb
LogicalDecodeCommitCB commit_cb
LogicalDecodeBeginCB begin_cb
LogicalDecodeStreamAbortCB stream_abort_cb
LogicalDecodeBeginPrepareCB begin_prepare_cb
LogicalDecodeChangeCB change_cb
LogicalDecodeShutdownCB shutdown_cb
OutputPluginOutputType output_type
bool sent_begin_txn
Definition pgoutput.c:216
PublicationActions pubactions
Form_pg_class rd_rel
Definition rel.h:111
ExprState * exprstate[NUM_ROWFILTER_PUBACTIONS]
Definition pgoutput.c:155
Bitmapset * columns
Definition pgoutput.c:181
PublicationActions pubactions
Definition pgoutput.c:146
TupleTableSlot * old_slot
Definition pgoutput.c:158
PublishGencolsType include_gencols_type
Definition pgoutput.c:141
MemoryContext entry_cxt
Definition pgoutput.c:187
EState * estate
Definition pgoutput.c:156
TupleTableSlot * new_slot
Definition pgoutput.c:157
List * streamed_txns
Definition pgoutput.c:142
AttrMap * attrmap
Definition pgoutput.c:174
struct ReorderBufferChange::@115::@116 tp
ReorderBufferChangeType action
struct ReorderBufferChange::@115::@117 truncate
struct ReorderBufferTXN * txn
union ReorderBufferChange::@115 data
TimestampTz abort_time
void * output_plugin_private
XLogRecPtr origin_lsn
TransactionId xid
ReplOriginId origin_id
Definition value.h:64
TupleDesc tts_tupleDescriptor
Definition tuptable.h:122
bool * tts_isnull
Definition tuptable.h:126
Datum * tts_values
Definition tuptable.h:124
char defGetStreamingMode(DefElem *def)
void ReleaseSysCache(HeapTuple tuple)
Definition syscache.c:264
HeapTuple SearchSysCache2(SysCacheIdentifier cacheId, Datum key1, Datum key2)
Definition syscache.c:230
Datum SysCacheGetAttr(SysCacheIdentifier cacheId, HeapTuple tup, AttrNumber attributeNumber, bool *isNull)
Definition syscache.c:595
#define SearchSysCacheExists2(cacheId, key1, key2)
Definition syscache.h:102
#define InvalidTransactionId
Definition transam.h:31
#define FirstGenbkiObjectId
Definition transam.h:195
TupleTableSlot * execute_attr_map_slot(AttrMap *attrMap, TupleTableSlot *in_slot, TupleTableSlot *out_slot)
Definition tupconvert.c:193
TupleDesc CreateTupleDescCopyConstr(TupleDesc tupdesc)
Definition tupdesc.c:323
void FreeTupleDesc(TupleDesc tupdesc)
Definition tupdesc.c:485
static FormData_pg_attribute * TupleDescAttr(TupleDesc tupdesc, int i)
Definition tupdesc.h:160
static CompactAttribute * TupleDescCompactAttr(TupleDesc tupdesc, int i)
Definition tupdesc.h:175
static TupleTableSlot * ExecClearTuple(TupleTableSlot *slot)
Definition tuptable.h:457
static void slot_getallattrs(TupleTableSlot *slot)
Definition tuptable.h:371
#define strVal(v)
Definition value.h:82
static bool VARATT_IS_EXTERNAL_ONDISK(const void *PTR)
Definition varatt.h:361
bool SplitIdentifierString(char *rawstring, char separator, List **namelist)
Definition varlena.c:2775
const char * name
CommandId GetCurrentCommandId(bool used)
Definition xact.c:830
uint16 ReplOriginId
Definition xlogdefs.h:69
uint64 XLogRecPtr
Definition xlogdefs.h:21
#define InvalidXLogRecPtr
Definition xlogdefs.h:28