Commitd29666d

knizhnik

authored and

kelvich

committed

some fixes in recovery

1 parent aface56, commit d29666d (Copy full SHA for d29666d)

File tree

4 files changed

+49

-32

lines changed

4 files changed

+49

-32

lines changed

`‎multimaster.c`

Lines changed: 40 additions & 26 deletions

Original file line number	Diff line number	Diff line change
`@@ -635,9 +635,11 @@ MtmBeginTransaction(MtmCurrentTrans* x)`
`635`	`635`	`x->isDistributed=MtmIsUserTransaction();`
`636`	`636`	`x->isPrepared= false;`
`637`	`637`	`x->isTransactionBlock=IsTransactionBlock();`
`638`		`-/* Application name can becahnged usnig PGAPPNAME environment variable */`
	`638`	`+/* Application name can be changed using PGAPPNAME environment variable */`
`639`	`639`	`if (!IsBackgroundWorker&&x->isDistributed&&Mtm->status!=MTM_ONLINE&&strcmp(application_name,MULTIMASTER_ADMIN)!=0) {`
`640`		`-/* reject all user's transactions at offline cluster */`
	`640`	`+/* Reject all user's transactions at offline cluster.`
	`641`	`+ * Allow execution of transaction by bg-workers to make it possible to perform recovery.`
	`642`	`+ */`
`641`	`643`	`MtmUnlock();`
`642`	`644`	`elog(ERROR,"Multimaster node is not online: current status %s",MtmNodeStatusMnem[Mtm->status]);`
`643`	`645`	`}`
`@@ -673,14 +675,17 @@ MtmPrePrepareTransaction(MtmCurrentTrans* x)`
`673`	`675`	`if (Mtm->disabledNodeMask!=0) {`
`674`	`676`	`MtmRefreshClusterStatus(true);`
`675`	`677`	`if (!IsBackgroundWorker&&Mtm->status!=MTM_ONLINE) {`
`676`		`-elog(ERROR,"Abort current transaction because this cluster node is not online");`
	`678`	`+/* Do not take into account bg-workers which are performing recovery */`
	`679`	`+elog(ERROR,"Abort current transaction because this cluster node is in %s status",MtmNodeStatusMnem[Mtm->status]);`
`677`	`680`	`}`
`678`	`681`	`}`
`679`	`682`
`680`	`683`	`MtmLock(LW_EXCLUSIVE);`
`681`	`684`
`682`	`685`	`/*`
`683`		`- * Check if there is global multimaster lock preventing new transaction from commit to make a chance to wal-senders to catch-up`
	`686`	`+ * Check if there is global multimaster lock preventing new transaction from commit to make a chance to wal-senders to catch-up.`
	`687`	`+ * Only "own" transactions are blocked. Transactions replicated from other nodes (including recovered transactions) should proceed`
	`688`	`+ * and should not cause cluster status change.`
`684`	`689`	`*/`
`685`	`690`	`if (!x->isReplicated) {`
`686`	`691`	`MtmCheckClusterLock();`
`@@ -716,7 +721,8 @@ MtmPrePrepareTransaction(MtmCurrentTrans* x)`
`716`	`721`	`}`
`717`	`722`	`MtmTransactionListAppend(ts);`
`718`	`723`	`MtmAddSubtransactions(ts,subxids,ts->nSubxids);`
`719`		`-MTM_TRACE("%d: MtmPrePrepareTransaction prepare commit of %d CSN=%ld\n",MyProcPid,x->xid,ts->csn);`
	`724`	`+MTM_TRACE("%d: MtmPrePrepareTransaction prepare commit of %d (gtid.xid=%d, gtid.node=%d, CSN=%ld)\n",`
	`725`	`+MyProcPid,x->xid,ts->gtid.xid,ts->gtid.node,ts->csn);`
`720`	`726`	`MtmUnlock();`
`721`	`727`
`722`	`728`	`}`
`@@ -842,14 +848,6 @@ void MtmSendNotificationMessage(MtmTransState* ts, MtmMessageCode cmd)`
`842`	`848`	`}`
`843`	`849`	`}`
`844`	`850`
`845`		`-voidMtmRecoveryCompleted(void)`
`846`		`-{`
`847`		`-elog(WARNING,"Recovery of node %d is completed",MtmNodeId);`
`848`		`-Mtm->recoverySlot=0;`
`849`		`-BIT_CLEAR(Mtm->disabledNodeMask,MtmNodeId-1);`
`850`		`-MtmSwitchClusterMode(MTM_ONLINE);`
`851`		`-}`
`852`		`-`
`853`	`851`	`voidMtmJoinTransaction(GlobalTransactionId*gtid,csn_tglobalSnapshot)`
`854`	`852`	`{`
`855`	`853`	`MtmLock(LW_EXCLUSIVE);`
`@@ -933,6 +931,18 @@ csn_t MtmGetTransactionCSN(TransactionId xid)`
`933`	`931`	`* -------------------------------------------`
`934`	`932`	`*/`
`935`	`933`
	`934`	`+voidMtmRecoveryCompleted(void)`
	`935`	`+{`
	`936`	`+elog(WARNING,"Recovery of node %d is completed",MtmNodeId);`
	`937`	`+MtmLock(LW_EXCLUSIVE);`
	`938`	`+Mtm->recoverySlot=0;`
	`939`	`+BIT_CLEAR(Mtm->disabledNodeMask,MtmNodeId-1);`
	`940`	`+/* Mode will be changed to online once all logical receivers are connected */`
	`941`	`+MtmSwitchClusterMode(MTM_CONNECTED);`
	`942`	`+MtmUnlock();`
	`943`	`+}`
	`944`	`+`
	`945`	`+`
`936`	`946`
`937`	`947`	`/**`
`938`	`948`	`* Check state of replication slots. If some of them are too much lag behind wal, then drop this slots to avoid`
`@@ -993,10 +1003,10 @@ bool MtmIsRecoveredNode(int nodeId)`
`993`	`1003`	`boolMtmRecoveryCaughtUp(intnodeId,XLogRecPtrslotLSN)`
`994`	`1004`	`{`
`995`	`1005`	`boolcaughtUp= false;`
	`1006`	`+MtmLock(LW_EXCLUSIVE);`
`996`	`1007`	`if (MtmIsRecoveredNode(nodeId)) {`
`997`	`1008`	`XLogRecPtrwalLSN=GetXLogInsertRecPtr();`
`998`		`-MtmLock(LW_EXCLUSIVE);`
`999`		`-if (slotLSN==walLSN) {`
	`1009`	`+if (slotLSN==walLSN&&Mtm->nActiveTransactions==0) {`
`1000`	`1010`	`if (BIT_CHECK(Mtm->nodeLockerMask,nodeId-1)) {`
`1001`	`1011`	`elog(WARNING,"Node %d is caught-up",nodeId);`
`1002`	`1012`	`BIT_CLEAR(Mtm->walSenderLockerMask,MyWalSnd-WalSndCtl->walsnds);`
`@@ -1018,18 +1028,17 @@ bool MtmRecoveryCaughtUp(int nodeId, XLogRecPtr slotLSN)`
`1018`	`1028`	`* We have to maintain two bitmasks: one is marking wal sender, another - correspondent nodes.`
`1019`	`1029`	`* Is there some better way to establish mapping between nodes and WAL-senders?`
`1020`	`1030`	`*/`
`1021`		`-elog(WARNING,"Node %d is almost caught-up: lock cluster",nodeId);`
	`1031`	`+elog(WARNING,"Node %d is almost caught-up: slot position %lx, WAL position %lx, active transactions %d",`
	`1032`	`+nodeId,slotLSN,walLSN,Mtm->nActiveTransactions);`
`1022`	`1033`	`Assert(MyWalSnd!=NULL);/* This function is called by WAL-sender, so it should not be NULL */`
`1023`	`1034`	`BIT_SET(Mtm->nodeLockerMask,nodeId-1);`
`1024`	`1035`	`BIT_SET(Mtm->walSenderLockerMask,MyWalSnd-WalSndCtl->walsnds);`
`1025`	`1036`	`Mtm->nLockers+=1;`
`1026`	`1037`	`}else {`
`1027`	`1038`	`MTM_INFO("Continue recovery of node %d, slot position %lx, WAL position %lx, WAL sender position %lx, lockers %d, active transactions %d\n",nodeId,slotLSN,walLSN,MyWalSnd->sentPtr,Mtm->nLockers,Mtm->nActiveTransactions);`
`1028`	`1039`	`}`
`1029`		`-MtmUnlock();`
`1030`		`-}else {`
`1031`		`-MTM_INFO("Node %d is not in recovery mode\n",nodeId);`
`1032`	`1040`	`}`
	`1041`	`+MtmUnlock();`
`1033`	`1042`	`returncaughtUp;`
`1034`	`1043`	`}`
`1035`	`1044`
`@@ -1044,7 +1053,7 @@ void MtmSwitchClusterMode(MtmNodeStatus mode)`
`1044`	`1053`	`/*`
`1045`	`1054`	`* If there are recovering nodes which are catching-up WAL, check the status and prevent new transaction from commit to give`
`1046`	`1055`	`* WAL-sender a chance to catch-up WAL, completely synchronize replica and switch it to normal mode.`
`1047`		`- * This function is calledat transactionstart with multimaster lock set`
	`1056`	`+ * This function is called before transaction prepare with multimaster lock set.`
`1048`	`1057`	`*/`
`1049`	`1058`	`staticvoid`
`1050`	`1059`	`MtmCheckClusterLock()`
`@@ -1071,8 +1080,8 @@ MtmCheckClusterLock()`
`1071`	`1080`	`}`
`1072`	`1081`	`}`
`1073`	`1082`	`if (mask!=0) {`
`1074`		`-/* some "almost catch-up" wal-senders are still working */`
`1075`		`-/* Do not start new transactions until themcomplete */`
	`1083`	`+/* some "almost catch-up" wal-senders are still working. */`
	`1084`	`+/* Do not start new transactions until they are completed. */`
`1076`	`1085`	`MtmUnlock();`
`1077`	`1086`	`MtmSleep(delay);`
`1078`	`1087`	`if (delay*2 <=MAX_WAIT_TIMEOUT) {`
`@@ -1215,6 +1224,7 @@ void MtmOnNodeDisconnect(int nodeId)`
`1215`	`1224`	`voidMtmOnNodeConnect(intnodeId)`
`1216`	`1225`	`{`
`1217`	`1226`	`BIT_CLEAR(Mtm->connectivityMask,nodeId-1);`
	`1227`	`+elog(NOTICE,"Reconnect node %d",nodeId);`
`1218`	`1228`	`RaftableSet(psprintf("node-mask-%d",MtmNodeId),&Mtm->connectivityMask,sizeofMtm->connectivityMask, false);`
`1219`	`1229`	`}`
`1220`	`1230`
`@@ -1645,19 +1655,23 @@ _PG_fini(void)`
`1645`	`1655`	`}`
`1646`	`1656`
`1647`	`1657`
`1648`		`-`
	`1658`	`+/*`
	`1659`	`+ * This function is called by pglogical receiver main function when receiver background worker is started.`
	`1660`	`+ * We switch to ONLINE mode when all receivers are connected.`
	`1661`	`+ * As far as background worker can be restarted multiple times, use node bitmask.`
	`1662`	`+ */`
`1649`	`1663`	`voidMtmReceiverStarted(intnodeId)`
`1650`	`1664`	`{`
`1651`		`-SpinLockAcquire(&Mtm->spinlock);`
	`1665`	`+MtmLock(LW_EXCLUSIVE);`
`1652`	`1666`	`if (!BIT_CHECK(Mtm->pglogicalNodeMask,nodeId-1)) {`
`1653`	`1667`	`BIT_SET(Mtm->pglogicalNodeMask,nodeId-1);`
`1654`	`1668`	`if (++Mtm->nReceivers==Mtm->nNodes-1) {`
`1655`	`1669`	`if (Mtm->status==MTM_CONNECTED) {`
`1656`	`1670`	`MtmSwitchClusterMode(MTM_ONLINE);`
`1657`	`1671`	`}`
`1658`	`1672`	`}`
`1659`		`-}`
`1660`		`-SpinLockRelease(&Mtm->spinlock);`
	`1673`	`+}`
	`1674`	`+MtmUnlock();`
`1661`	`1675`	`}`
`1662`	`1676`
`1663`	`1677`	`/*`

`‎multimaster.h`

Lines changed: 3 additions & 0 deletions

Original file line number	Diff line number	Diff line change
`@@ -45,6 +45,9 @@ typedef uint64 csn_t; /* commit serial number */`
`45`	`45`
`46`	`46`	`#definePGLOGICAL_XACT_EVENT(flags)(flags & 0x03)`
`47`	`47`
	`48`	`+#definePGLOGICAL_CAUGHT_UP 0x04`
	`49`	`+`
	`50`	`+`
`48`	`51`	`typedefuint64timestamp_t;`
`49`	`52`
`50`	`53`	`/* Identifier of global transaction */`

`‎pglogical_apply.c`

Lines changed: 1 addition & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -497,12 +497,10 @@ process_remote_commit(StringInfo in)`
`497`	`497`	`uint8flags;`
`498`	`498`	`csn_tcsn;`
`499`	`499`	`constchar*gid=NULL;`
`500`		`-boolcaughtUp;`
`501`	`500`
`502`	`501`	`/* read flags */`
`503`	`502`	`flags=pq_getmsgbyte(in);`
`504`	`503`	`MtmReplicationNode=pq_getmsgbyte(in);`
`505`		`-caughtUp=pq_getmsgbyte(in)!=0;`
`506`	`504`
`507`	`505`	`/* read fields */`
`508`	`506`	`replorigin_session_origin_lsn=pq_getmsgint64(in);/* commit_lsn */`
`@@ -571,7 +569,7 @@ process_remote_commit(StringInfo in)`
`571`	`569`	`Assert(false);`
`572`	`570`	`}`
`573`	`571`	`MtmEndSession(true);`
`574`		`-if (caughtUp) {`
	`572`	`+if (flags&PGLOGICAL_CAUGHT_UP) {`
`575`	`573`	`MtmRecoveryCompleted();`
`576`	`574`	`}`
`577`	`575`	`}`

`‎pglogical_proto.c`

Lines changed: 5 additions & 3 deletions

Original file line number	Diff line number	Diff line change
`@@ -103,7 +103,7 @@ pglogical_write_begin(StringInfo out, PGLogicalOutputData *data,`
`103`	`103`	`{`
`104`	`104`	`boolisRecovery=MtmIsRecoveredNode(MtmReplicationNodeId);`
`105`	`105`	`csn_tcsn=MtmTransactionSnapshot(txn->xid);`
`106`		`-MTM_INFO("%d: pglogical_write_begin %d CSN=%ld\n",MyProcPid,txn->xid,csn);`
	`106`	`+MTM_INFO("%d: pglogical_write_beginXID=%dnode=%dCSN=%ld recovery=%d\n",MyProcPid,txn->xid,MtmReplicationNodeId,csn,isRecovery);`
`107`	`107`
`108`	`108`	`if (csn==INVALID_CSN&& !isRecovery) {`
`109`	`109`	`MtmIsFilteredTxn= true;`
`@@ -124,7 +124,7 @@ pglogical_write_commit(StringInfo out, PGLogicalOutputData *data,`
`124`	`124`	`ReorderBufferTXN*txn,XLogRecPtrcommit_lsn)`
`125`	`125`	`{`
`126`	`126`	`uint8flags=0;`
`127`		`-`
	`127`	`+`
`128`	`128`	`if (txn->xact_action==XLOG_XACT_COMMIT)`
`129`	`129`	`flags=PGLOGICAL_COMMIT;`
`130`	`130`	`elseif (txn->xact_action==XLOG_XACT_PREPARE)`
`@@ -146,6 +146,9 @@ pglogical_write_commit(StringInfo out, PGLogicalOutputData *data,`
`146`	`146`	`if (csn==INVALID_CSN&& !isRecovery) {`
`147`	`147`	`return;`
`148`	`148`	`}`
	`149`	`+if (MtmRecoveryCaughtUp(MtmReplicationNodeId,txn->end_lsn)) {`
	`150`	`+flags \|=PGLOGICAL_CAUGHT_UP;`
	`151`	`+}`
`149`	`152`	`}`
`150`	`153`	`pq_sendbyte(out,'C');/* sending COMMIT */`
`151`	`154`
`@@ -154,7 +157,6 @@ pglogical_write_commit(StringInfo out, PGLogicalOutputData *data,`
`154`	`157`	`/* send the flags field */`
`155`	`158`	`pq_sendbyte(out,flags);`
`156`	`159`	`pq_sendbyte(out,MtmNodeId);`
`157`		`-pq_sendbyte(out,MtmRecoveryCaughtUp(MtmReplicationNodeId,txn->end_lsn));`
`158`	`160`
`159`	`161`	`/* send fixed fields */`
`160`	`162`	`pq_sendint64(out,commit_lsn);`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commitd29666d

File tree

4 files changed

4 files changed

`‎multimaster.c`

`‎multimaster.h`

`‎pglogical_apply.c`

`‎pglogical_proto.c`

0 commit comments