Skip to content

Commit 36148b2

Browse files
author
Amit Kapila
committed
Fix xmin advancement during fast_forward decoding.
During logical decoding, we advance the catalog_xmin of the logical slot too early in fast_forward mode, resulting in required catalog data being removed by vacuum. This mode is normally used to advance the slot without processing the changes, but we still can't let the slot's xmin advance to an incorrect value. Commit f49a80c fixed a similar issue where the logical slot's catalog_xmin was getting advanced prematurely during non-fast-forward mode. During xl_running_xacts processing, instead of directly advancing the slot's xmin to the oldest running xid in the record, it allowed the xmin to be held back for snapshots that can be used for not-yet-replayed transactions, as those might consider older txns as running too. However, it missed the fact that the same problem can happen during fast_forward mode decoding, as we won't build a base snapshot in that mode, and the future call to get_changes from the same slot can miss seeing the required catalog changes leading to incorrect results. This commit allows building the base snapshot even in fast_forward mode to prevent the early advancement of xmin. Reported-by: Amit Kapila <amit.kapila16@gmail.com> Author: Zhijie Hou <houzj.fnst@fujitsu.com> Reviewed-by: Masahiko Sawada <sawada.mshk@gmail.com> Reviewed-by: shveta malik <shveta.malik@gmail.com> Reviewed-by: Amit Kapila <amit.kapila16@gmail.com> Backpatch-through: 13 Discussion: https://postgr.es/m/CAA4eK1LqWncUOqKijiafe+Ypt1gQAQRjctKLMY953J79xDBgAg@mail.gmail.com Discussion: https://postgr.es/m/OS0PR01MB57163087F86621D44D9A72BF94BB2@OS0PR01MB5716.jpnprd01.prod.outlook.com
1 parent d96206f commit 36148b2

File tree

3 files changed

+71
-12
lines changed

3 files changed

+71
-12
lines changed

contrib/test_decoding/expected/oldest_xmin.out

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -38,3 +38,44 @@ COMMIT
3838
stop
3939
(1 row)
4040

41+
42+
starting permutation: s0_begin s0_getxid s1_begin s1_insert s0_alter s0_commit s0_checkpoint s0_advance_slot s0_advance_slot s1_commit s0_vacuum s0_get_changes
43+
step s0_begin: BEGIN;
44+
step s0_getxid: SELECT pg_current_xact_id() IS NULL;
45+
?column?
46+
--------
47+
f
48+
(1 row)
49+
50+
step s1_begin: BEGIN;
51+
step s1_insert: INSERT INTO harvest VALUES ((1, 2, 3));
52+
step s0_alter: ALTER TYPE basket DROP ATTRIBUTE mangos;
53+
step s0_commit: COMMIT;
54+
step s0_checkpoint: CHECKPOINT;
55+
step s0_advance_slot: SELECT slot_name FROM pg_replication_slot_advance('isolation_slot', pg_current_wal_lsn());
56+
slot_name
57+
--------------
58+
isolation_slot
59+
(1 row)
60+
61+
step s0_advance_slot: SELECT slot_name FROM pg_replication_slot_advance('isolation_slot', pg_current_wal_lsn());
62+
slot_name
63+
--------------
64+
isolation_slot
65+
(1 row)
66+
67+
step s1_commit: COMMIT;
68+
step s0_vacuum: VACUUM pg_attribute;
69+
step s0_get_changes: SELECT data FROM pg_logical_slot_get_changes('isolation_slot', NULL, NULL, 'include-xids', '0', 'skip-empty-xacts', '1');
70+
data
71+
------------------------------------------------------
72+
BEGIN
73+
table public.harvest: INSERT: fruits[basket]:'(1,2,3)'
74+
COMMIT
75+
(3 rows)
76+
77+
?column?
78+
--------
79+
stop
80+
(1 row)
81+

contrib/test_decoding/specs/oldest_xmin.spec

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -25,6 +25,7 @@ step "s0_commit" { COMMIT; }
2525
step "s0_checkpoint" { CHECKPOINT; }
2626
step "s0_vacuum" { VACUUM pg_attribute; }
2727
step "s0_get_changes" { SELECT data FROM pg_logical_slot_get_changes('isolation_slot', NULL, NULL, 'include-xids', '0', 'skip-empty-xacts', '1'); }
28+
step "s0_advance_slot" { SELECT slot_name FROM pg_replication_slot_advance('isolation_slot', pg_current_wal_lsn()); }
2829

2930
session "s1"
3031
setup { SET synchronous_commit=on; }
@@ -40,3 +41,7 @@ step "s1_commit" { COMMIT; }
4041
# will be removed (xmax set) before T1 commits. That is, interlocking doesn't
4142
# forbid modifying catalog after someone read it (and didn't commit yet).
4243
permutation "s0_begin" "s0_getxid" "s1_begin" "s1_insert" "s0_alter" "s0_commit" "s0_checkpoint" "s0_get_changes" "s0_get_changes" "s1_commit" "s0_vacuum" "s0_get_changes"
44+
45+
# Perform the same testing process as described above, but use advance_slot to
46+
# force xmin advancement during fast-forward decoding.
47+
permutation "s0_begin" "s0_getxid" "s1_begin" "s1_insert" "s0_alter" "s0_commit" "s0_checkpoint" "s0_advance_slot" "s0_advance_slot" "s1_commit" "s0_vacuum" "s0_get_changes"

src/backend/replication/logical/decode.c

Lines changed: 25 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -411,19 +411,24 @@ heap2_decode(LogicalDecodingContext *ctx, XLogRecordBuffer *buf)
411411

412412
/*
413413
* If we don't have snapshot or we are just fast-forwarding, there is no
414-
* point in decoding changes.
414+
* point in decoding data changes. However, it's crucial to build the base
415+
* snapshot during fast-forward mode (as is done in
416+
* SnapBuildProcessChange()) because we require the snapshot's xmin when
417+
* determining the candidate catalog_xmin for the replication slot. See
418+
* SnapBuildProcessRunningXacts().
415419
*/
416-
if (SnapBuildCurrentState(builder) < SNAPBUILD_FULL_SNAPSHOT ||
417-
ctx->fast_forward)
420+
if (SnapBuildCurrentState(builder) < SNAPBUILD_FULL_SNAPSHOT)
418421
return;
419422

420423
switch (info)
421424
{
422425
case XLOG_HEAP2_MULTI_INSERT:
423-
if (SnapBuildProcessChange(builder, xid, buf->origptr))
426+
if (SnapBuildProcessChange(builder, xid, buf->origptr) &&
427+
!ctx->fast_forward)
424428
DecodeMultiInsert(ctx, buf);
425429
break;
426430
case XLOG_HEAP2_NEW_CID:
431+
if (!ctx->fast_forward)
427432
{
428433
xl_heap_new_cid *xlrec;
429434

@@ -470,16 +475,20 @@ heap_decode(LogicalDecodingContext *ctx, XLogRecordBuffer *buf)
470475

471476
/*
472477
* If we don't have snapshot or we are just fast-forwarding, there is no
473-
* point in decoding data changes.
478+
* point in decoding data changes. However, it's crucial to build the base
479+
* snapshot during fast-forward mode (as is done in
480+
* SnapBuildProcessChange()) because we require the snapshot's xmin when
481+
* determining the candidate catalog_xmin for the replication slot. See
482+
* SnapBuildProcessRunningXacts().
474483
*/
475-
if (SnapBuildCurrentState(builder) < SNAPBUILD_FULL_SNAPSHOT ||
476-
ctx->fast_forward)
484+
if (SnapBuildCurrentState(builder) < SNAPBUILD_FULL_SNAPSHOT)
477485
return;
478486

479487
switch (info)
480488
{
481489
case XLOG_HEAP_INSERT:
482-
if (SnapBuildProcessChange(builder, xid, buf->origptr))
490+
if (SnapBuildProcessChange(builder, xid, buf->origptr) &&
491+
!ctx->fast_forward)
483492
DecodeInsert(ctx, buf);
484493
break;
485494

@@ -490,17 +499,20 @@ heap_decode(LogicalDecodingContext *ctx, XLogRecordBuffer *buf)
490499
*/
491500
case XLOG_HEAP_HOT_UPDATE:
492501
case XLOG_HEAP_UPDATE:
493-
if (SnapBuildProcessChange(builder, xid, buf->origptr))
502+
if (SnapBuildProcessChange(builder, xid, buf->origptr) &&
503+
!ctx->fast_forward)
494504
DecodeUpdate(ctx, buf);
495505
break;
496506

497507
case XLOG_HEAP_DELETE:
498-
if (SnapBuildProcessChange(builder, xid, buf->origptr))
508+
if (SnapBuildProcessChange(builder, xid, buf->origptr) &&
509+
!ctx->fast_forward)
499510
DecodeDelete(ctx, buf);
500511
break;
501512

502513
case XLOG_HEAP_TRUNCATE:
503-
if (SnapBuildProcessChange(builder, xid, buf->origptr))
514+
if (SnapBuildProcessChange(builder, xid, buf->origptr) &&
515+
!ctx->fast_forward)
504516
DecodeTruncate(ctx, buf);
505517
break;
506518

@@ -528,7 +540,8 @@ heap_decode(LogicalDecodingContext *ctx, XLogRecordBuffer *buf)
528540
break;
529541

530542
case XLOG_HEAP_CONFIRM:
531-
if (SnapBuildProcessChange(builder, xid, buf->origptr))
543+
if (SnapBuildProcessChange(builder, xid, buf->origptr) &&
544+
!ctx->fast_forward)
532545
DecodeSpecConfirm(ctx, buf);
533546
break;
534547

0 commit comments

Comments
 (0)