Commit 3db89c9

Merge pull request sorintlab#268 from sgotti/handle_max_standby_lag
sentinel: don't choose keepers with db behind a defined lag as masters.
2 parents 2397b58 + 5587b86, commit 3db89c9

File tree: 6 files changed, 116 additions and 3 deletions


cmd/sentinel/sentinel.go

Lines changed: 31 additions & 0 deletions
@@ -350,6 +350,19 @@ func (s *Sentinel) isDifferentTimelineBranch(followedDB *cluster.DB, db *cluster
 	return false
 }
 
+// isLagBelowMax checks if the db reported lag is below MaxStandbyLag from the
+// master reported lag
+func (s *Sentinel) isLagBelowMax(cd *cluster.ClusterData, curMasterDB, db *cluster.DB) bool {
+	if !*cd.Cluster.DefSpec().SynchronousReplication {
+		log.Debug(fmt.Sprintf("curMasterDB.Status.XLogPos: %d, db.Status.XLogPos: %d, lag: %d", curMasterDB.Status.XLogPos, db.Status.XLogPos, int64(curMasterDB.Status.XLogPos-db.Status.XLogPos)))
+		if int64(curMasterDB.Status.XLogPos-db.Status.XLogPos) > int64(*cd.Cluster.DefSpec().MaxStandbyLag) {
+			log.Debug("ignoring keeper since its behind that maximum xlog position", zap.String("db", db.UID), zap.Uint64("dbXLogPos", db.Status.XLogPos), zap.Uint64("masterXLogPos", curMasterDB.Status.XLogPos))
+			return false
+		}
+	}
+	return true
+}
+
 func (s *Sentinel) freeKeepers(cd *cluster.ClusterData) []*cluster.Keeper {
 	freeKeepers := []*cluster.Keeper{}
 K:
@@ -548,6 +561,15 @@ func (s *Sentinel) findBestStandbys(cd *cluster.ClusterData, masterDB *cluster.D
 			log.Debug("ignoring keeper since its pg timeline is different than master timeline", zap.String("db", db.UID), zap.Uint64("dbTimeline", db.Status.TimelineID), zap.Uint64("masterTimeline", masterDB.Status.TimelineID))
 			continue
 		}
+		// do this only when not using synchronous replication since in sync repl we
+		// have to ignore the last reported xlogpos or valid sync standby will be
+		// skipped
+		if !*cd.Cluster.DefSpec().SynchronousReplication {
+			if !s.isLagBelowMax(cd, masterDB, db) {
+				log.Debug("ignoring keeper since its lag is above the max configured lag", zap.String("db", db.UID), zap.Uint64("dbXLogPos", db.Status.XLogPos), zap.Uint64("masterXLogPos", masterDB.Status.XLogPos))
+				continue
+			}
+		}
 		bestDBs = append(bestDBs, db)
 	}
 	// Sort by XLogPos
@@ -569,6 +591,15 @@ func (s *Sentinel) findBestNewMasters(cd *cluster.ClusterData, masterDB *cluster
 			log.Debug("ignoring keeper since its pg timeline is different than master timeline", zap.String("db", db.UID), zap.Uint64("dbTimeline", db.Status.TimelineID), zap.Uint64("masterTimeline", masterDB.Status.TimelineID))
 			continue
 		}
+		// do this only when not using synchronous replication since in sync repl we
+		// have to ignore the last reported xlogpos or valid sync standby will be
+		// skipped
+		if !*cd.Cluster.DefSpec().SynchronousReplication {
+			if !s.isLagBelowMax(cd, masterDB, db) {
+				log.Debug("ignoring keeper since its lag is above the max configured lag", zap.String("db", db.UID), zap.Uint64("dbXLogPos", db.Status.XLogPos), zap.Uint64("masterXLogPos", masterDB.Status.XLogPos))
+				continue
+			}
+		}
 		bestNewMasters = append(bestNewMasters, db)
 	}
 	// Sort by XLogPos
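
The election filter above reduces to one comparison between the master's and the standby's reported WAL byte positions. The following standalone Go sketch is not part of the commit; the XLogPos values and the 1MiB limit are invented for illustration, and lagBelowMax only mirrors the arithmetic of isLagBelowMax without the cluster spec plumbing.

package main

import "fmt"

// lagBelowMax mirrors the comparison used by isLagBelowMax: the lag is the
// difference between the master's and the standby's reported WAL positions,
// and a standby stays eligible only while that lag does not exceed the limit.
func lagBelowMax(masterXLogPos, dbXLogPos, maxStandbyLag uint64) bool {
	return int64(masterXLogPos-dbXLogPos) <= int64(maxStandbyLag)
}

func main() {
	const maxStandbyLag = 1024 * 1024 // hypothetical 1MiB limit

	// A standby about 100kiB behind the master remains a failover candidate.
	fmt.Println(lagBelowMax(5000000, 4900000, maxStandbyLag)) // true

	// A standby about 3MB behind is skipped by findBestStandbys/findBestNewMasters.
	fmt.Println(lagBelowMax(5000000, 2000000, maxStandbyLag)) // false
}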

cmd/sentinel/sentinel_test.go

Lines changed: 1 addition & 1 deletion
@@ -183,8 +183,8 @@ func TestUpdateCluster(t *testing.T) {
 			Proxy: &cluster.Proxy{},
 		},
 	},
+	// #2 cluster initialization, more than one keeper, the first will be choosen to be the new master.
 	{
-		// #2 cluster initialization, more than one keeper, the first will be choosen to be the new master.
 		cd: &cluster.ClusterData{
 			Cluster: &cluster.Cluster{
 				UID: "cluster1",

doc/cluster_spec.md

Lines changed: 1 addition & 0 deletions
@@ -19,6 +19,7 @@ Some options in a running cluster specification can be changed to update the des
 | failInterval | interval after the first fail to declare a keeper as not healthy. | no | string (duration) | 20s |
 | maxStandbys | max number of standbys. This needs to be greater enough to cover both standby managed by stolon and additional standbys configured by the user. Its value affect different postgres parameters like max_replication_slots and max_wal_senders. Setting this to a number lower than the sum of stolon managed standbys and user managed standbys will have unpredicatable effects due to problems creating replication slots or replication problems due to exhausted wal senders. | no | uint16 | 20 |
 | maxStandbysPerSender | max number of standbys for every sender. A sender can be a master or another standby (with cascading replication). | no | uint16 | 3 |
+| maxStandbyLag | maximum lag (from the last reported master state, in bytes) that an asynchronous standby can have to be elected in place of a failed master. | no | uint32 | 1MiB |
 | synchronousReplication | use synchronous replication between the master and its standbys | no | bool | false |
 | minSynchronousStandbys | minimum number of required synchronous standbys when synchronous replication is enabled (only set this to a value > 1 when using PostgreSQL >= 9.6) | no | int16 | 1 |
 | maxSynchronousStandbys | maximum number of required synchronous standbys when synchronous replication is enabled (only set this to a value > 1 when using PostgreSQL >= 9.6) | no | int16 | 1 |
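
In Go terms the documented option is the optional MaxStandbyLag field of the cluster spec, expressed in bytes. Below is a hedged sketch of setting it, mirroring the 50kiB value used by the integration test in this commit; the import path is assumed from the repository layout, and the FailInterval field is included only for context.

package main

import (
	"fmt"
	"time"

	"github.com/sorintlab/stolon/pkg/cluster"
)

func main() {
	// Fragment of a cluster spec that lowers the allowed standby lag from the
	// 1MiB default to 50kiB, as the integration test setup in this commit does.
	spec := &cluster.ClusterSpec{
		FailInterval:  &cluster.Duration{Duration: 5 * time.Second},
		MaxStandbyLag: cluster.Uint32P(50 * 1024),
	}
	fmt.Printf("failInterval=%s maxStandbyLag=%d bytes\n", spec.FailInterval.Duration, *spec.MaxStandbyLag)
}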

pkg/cluster/cluster.go

Lines changed: 10 additions & 0 deletions
@@ -31,6 +31,9 @@ import (
 func Uint16P(u uint16) *uint16 {
 	return &u
 }
+func Uint32P(u uint32) *uint32 {
+	return &u
+}
 
 func BoolP(b bool) *bool {
 	return &b
@@ -51,6 +54,7 @@ const (
 	DefaultFailInterval = 20 * time.Second
 	DefaultMaxStandbys uint16 = 20
 	DefaultMaxStandbysPerSender uint16 = 3
+	DefaultMaxStandbyLag = 1024 * 1204
 	DefaultSynchronousReplication = false
 	DefaultMaxSynchronousStandbys uint16 = 1
 	DefaultMinSynchronousStandbys uint16 = 1
@@ -184,6 +188,9 @@ type ClusterSpec struct {
 	// Max number of standbys for every sender. A sender can be a master or
 	// another standby (if/when implementing cascading replication).
 	MaxStandbysPerSender *uint16 `json:"maxStandbysPerSender,omitempty"`
+	// Max lag in bytes that an asynchronous standy can have to be elected in
+	// place of a failed master
+	MaxStandbyLag *uint32 `json:"maxStandbyLage,omitempty"`
 	// Use Synchronous replication between master and its standbys
 	SynchronousReplication *bool `json:"synchronousReplication,omitempty"`
 	// MinSynchronousStandbys is the mininum number if synchronous standbys
@@ -287,6 +294,9 @@ func (os *ClusterSpec) WithDefaults() *ClusterSpec {
 	if s.MaxStandbysPerSender == nil {
 		s.MaxStandbysPerSender = Uint16P(DefaultMaxStandbysPerSender)
 	}
+	if s.MaxStandbyLag == nil {
+		s.MaxStandbyLag = Uint32P(DefaultMaxStandbyLag)
+	}
 	if s.SynchronousReplication == nil {
 		s.SynchronousReplication = BoolP(DefaultSynchronousReplication)
 	}
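
Like the other spec options, the new field is a pointer so that "unset" can be told apart from an explicit zero; the nil check added to WithDefaults then fills it with DefaultMaxStandbyLag. Here is a small sketch of that fallback, written outside the commit and assuming the repository's pkg/cluster import path.

package main

import (
	"fmt"

	"github.com/sorintlab/stolon/pkg/cluster"
)

func main() {
	// A spec that never mentions maxStandbyLag leaves the pointer nil.
	spec := &cluster.ClusterSpec{}

	// Mirror of the nil check added to WithDefaults in this commit: an unset
	// field falls back to the package-level default.
	if spec.MaxStandbyLag == nil {
		spec.MaxStandbyLag = cluster.Uint32P(cluster.DefaultMaxStandbyLag)
	}
	fmt.Println("maxStandbyLag defaults to", *spec.MaxStandbyLag, "bytes")
}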

tests/integration/ha_test.go

Lines changed: 71 additions & 0 deletions
@@ -125,6 +125,7 @@ func setupServers(t *testing.T, clusterName, dir string, numKeepers, numSentinel
 		SleepInterval: &cluster.Duration{Duration: 2 * time.Second},
 		FailInterval: &cluster.Duration{Duration: 5 * time.Second},
 		ConvergenceTimeout: &cluster.Duration{Duration: 30 * time.Second},
+		MaxStandbyLag: cluster.Uint32P(50 * 1024), // limit lag to 50kiB
 		SynchronousReplication: cluster.BoolP(syncRepl),
 		UsePgrewind: cluster.BoolP(usePgrewind),
 		PGParameters: make(cluster.PGParameters),
@@ -339,6 +340,9 @@ func testFailover(t *testing.T, syncRepl bool) {
 		t.Fatalf("unexpected err: %v", err)
 	}
 
+	// wait for the keepers to have reported their state (needed to know the instance XLogPos)
+	time.Sleep(5 * time.Second)
+
 	// Stop the keeper process on master, should also stop the database
 	t.Logf("Stopping current master keeper: %s", master.uid)
 	master.Stop()
@@ -399,6 +403,9 @@ func testFailoverFailed(t *testing.T, syncRepl bool) {
 		t.Fatalf("unexpected err: %v", err)
 	}
 
+	// wait for the keepers to have reported their state (needed to know the instance XLogPos)
+	time.Sleep(5 * time.Second)
+
 	// Stop the keeper process on master, should also stop the database
 	t.Logf("Stopping current master keeper: %s", master.uid)
 	master.Stop()
@@ -437,6 +444,58 @@ func TestFailoverFailedSyncRepl(t *testing.T) {
 	testFailoverFailed(t, true)
 }
 
+// test that a standby with a lag (reported) greater than MaxStandbyLag from the
+// master (reported) xlogpos won't be elected as the new master. This test is
+// valid only for asynchronous replication
+func TestFailoverTooMuchLag(t *testing.T) {
+	t.Parallel()
+
+	dir, err := ioutil.TempDir("", "stolon")
+	if err != nil {
+		t.Fatalf("unexpected err: %v", err)
+	}
+	defer os.RemoveAll(dir)
+
+	clusterName := uuid.NewV4().String()
+
+	tks, tss, tstore := setupServers(t, clusterName, dir, 2, 1, false, false)
+	defer shutdown(tks, tss, tstore)
+
+	storePath := filepath.Join(common.StoreBasePath, clusterName)
+	sm := store.NewStoreManager(tstore.store, storePath)
+
+	master, standbys := waitMasterStandbysReady(t, sm, tks)
+	standby := standbys[0]
+
+	if err := populate(t, master); err != nil {
+		t.Fatalf("unexpected err: %v", err)
+	}
+
+	// stop the standby and write more than MaxStandbyLag data to the master
+	t.Logf("Stopping current standby keeper: %s", standby.uid)
+	standby.Stop()
+	for i := 1; i < 1000; i++ {
+		if err := write(t, master, i, i); err != nil {
+			t.Fatalf("unexpected err: %v", err)
+		}
+	}
+
+	// wait for the master to have reported its state
+	time.Sleep(5 * time.Second)
+
+	// Stop the keeper process on master, should also stop the database
+	t.Logf("Stopping current master keeper: %s", master.uid)
+	master.Stop()
+	// start the standby
+	t.Logf("Starting current standby keeper: %s", standby.uid)
+	standby.Start()
+
+	// standby shouldn't be elected as master since its lag is greater than MaxStandbyLag
+	if err := standby.WaitRole(common.RoleMaster, 30*time.Second); err == nil {
+		t.Fatalf("standby shouldn't be elected as master")
+	}
+}
+
 func testOldMasterRestart(t *testing.T, syncRepl, usePgrewind bool) {
 	dir, err := ioutil.TempDir("", "stolon")
 	if err != nil {
@@ -468,6 +527,9 @@ func testOldMasterRestart(t *testing.T, syncRepl, usePgrewind bool) {
 		t.Fatalf("unexpected err: %v", err)
 	}
 
+	// wait for the keepers to have reported their state (needed to know the instance XLogPos)
+	time.Sleep(5 * time.Second)
+
 	// Stop the keeper process on master, should also stop the database
 	t.Logf("Stopping current master keeper: %s", master.uid)
 	master.Stop()
@@ -573,6 +635,9 @@ func testPartition1(t *testing.T, syncRepl, usePgrewind bool) {
 		t.Fatalf("unexpected err: %v", err)
 	}
 
+	// wait for the keepers to have reported their state (needed to know the instance XLogPos)
+	time.Sleep(5 * time.Second)
+
 	// Freeze the keeper and postgres processes on the master
 	t.Logf("SIGSTOPping current master keeper: %s", master.uid)
 	if err := master.Signal(syscall.SIGSTOP); err != nil {
@@ -687,6 +752,9 @@ func testTimelineFork(t *testing.T, syncRepl, usePgrewind bool) {
 		t.Fatalf("unexpected err: %v", err)
 	}
 
+	// wait for the keepers to have reported their state (needed to know the instance XLogPos)
+	time.Sleep(5 * time.Second)
+
 	// Wait replicated data to standby
 	if err := waitLines(t, standbys[0], 1, 10*time.Second); err != nil {
 		t.Fatalf("unexpected err: %v", err)
@@ -827,6 +895,9 @@ func TestMasterChangedAddress(t *testing.T) {
 		t.Fatalf("unexpected err: %v", err)
 	}
 
+	// wait for the keepers to have reported their state (needed to know the instance XLogPos)
+	time.Sleep(5 * time.Second)
+
 	// Wait standby synced with master
 	if err := waitLines(t, master, 1, 60*time.Second); err != nil {
 		t.Fatalf("unexpected err: %v", err)

tests/integration/utils.go

Lines changed: 2 additions & 2 deletions
@@ -749,8 +749,8 @@ func WaitClusterDataKeeperInitialized(keeperUID string, e *store.StoreManager, t
 }
 
 // WaitClusterDataSynchronousStandbys waits for:
-// *synchrnous standby defined in masterdb spec
-// *synchrnous standby reported from masterdb status
+// *synchronous standby defined in masterdb spec
+// *synchronous standby reported from masterdb status
 func WaitClusterDataSynchronousStandbys(synchronousStandbys []string, e *store.StoreManager, timeout time.Duration) error {
 	sort.Sort(sort.StringSlice(synchronousStandbys))
 	start := time.Now()
