@@ -14,9 +14,14 @@ import (
 )
 
 const (
-	flushInterval     = time.Second
-	logOutputMaxBytes = 1 << 20 // 1MiB
-	overheadPerLog    = 21      // found by testing
+	flushInterval    = time.Second
+	maxBytesPerBatch = 1 << 20 // 1MiB
+	overheadPerLog   = 21      // found by testing
+
+	// maxBytesQueued is the maximum length of logs we will queue in memory. The number is taken
+	// from dump.sql `max_logs_length` constraint, as there is no point queuing more logs than we'll
+	// accept in the database.
+	maxBytesQueued = 1048576
 )
 
 type logQueue struct {
@@ -30,8 +35,9 @@ type logQueue struct {
 // the agent calls sendLoop to send pending logs.
 type logSender struct {
 	*sync.Cond
-	queues map[uuid.UUID]*logQueue
-	logger slog.Logger
+	queues    map[uuid.UUID]*logQueue
+	logger    slog.Logger
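+	// outputLen tracks the total size, in bytes, of queued log output across all
+	// sources; enqueue increases it and sendLoop decreases it once logs are sent.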
+	outputLen int
 }
 
 type logDest interface {
@@ -46,6 +52,8 @@ func newLogSender(logger slog.Logger) *logSender {
 	}
 }
 
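+// MaxQueueExceededError is returned by enqueue when the total size of queued logs
+// exceeds maxBytesQueued; logs that do not fit are dropped rather than queued.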
+var MaxQueueExceededError = xerrors.New("maximum queued logs exceeded")
+
 func (l *logSender) enqueue(src uuid.UUID, logs ...agentsdk.Log) error {
 	logger := l.logger.With(slog.F("log_source_id", src))
 	if len(logs) == 0 {
@@ -60,12 +68,25 @@ func (l *logSender) enqueue(src uuid.UUID, logs ...agentsdk.Log) error {
 		q = &logQueue{}
 		l.queues[src] = q
 	}
-	for _, log := range logs {
+	for k, log := range logs {
+		// Here we check the queue size before adding a log because we want to queue up slightly
+		// more logs than the database would store to ensure we trigger "logs truncated" at the
+		// database layer. Otherwise, the end user wouldn't know logs are truncated unless they
+		// examined the Coder agent logs.
+		if l.outputLen > maxBytesQueued {
+			logger.Warn(context.Background(), "log queue full; truncating new logs", slog.F("new_logs", k), slog.F("queued_logs", len(q.logs)))
+			return MaxQueueExceededError
+		}
 		pl, err := agentsdk.ProtoFromLog(log)
 		if err != nil {
 			return xerrors.Errorf("failed to convert log: %w", err)
 		}
+		if len(pl.Output) > maxBytesPerBatch {
+			logger.Warn(context.Background(), "dropping log line that exceeds our limit")
+			continue
+		}
 		q.logs = append(q.logs, pl)
+		l.outputLen += len(pl.Output)
 	}
 	logger.Debug(context.Background(), "enqueued agent logs", slog.F("new_logs", len(logs)), slog.F("queued_logs", len(q.logs)))
 	return nil
@@ -126,21 +147,22 @@ func (l *logSender) sendLoop(ctx context.Context, dest logDest) error {
 		req := &proto.BatchCreateLogsRequest{
 			LogSourceId: src[:],
 		}
-		o := 0
+
+		// outputToSend keeps track of the size of the protobuf message we send, while
+		// outputToRemove keeps track of the size of the output we'll remove from the queues on
+		// success. They are different because outputToSend also counts protocol message overheads.
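+		// For example, a 100-byte log line counts as 121 bytes (100 + overheadPerLog)
+		// towards outputToSend, but only 100 bytes towards outputToRemove.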
+		outputToSend := 0
+		outputToRemove := 0
 		n := 0
 		for n < len(q.logs) {
 			log := q.logs[n]
-			if len(log.Output) > logOutputMaxBytes {
-				logger.Warn(ctx, "dropping log line that exceeds our limit")
-				n++
-				continue
-			}
-			o += len(log.Output) + overheadPerLog
-			if o > logOutputMaxBytes {
+			outputToSend += len(log.Output) + overheadPerLog
+			if outputToSend > maxBytesPerBatch {
 				break
 			}
 			req.Logs = append(req.Logs, log)
 			n++
+			outputToRemove += len(log.Output)
 		}
 
 		l.L.Unlock()
@@ -154,6 +176,7 @@ func (l *logSender) sendLoop(ctx context.Context, dest logDest) error {
 		// since elsewhere we only append to the logs, here we can remove them
 		// since we successfully sent them
 		q.logs = q.logs[n:]
+		l.outputLen -= outputToRemove
 		if len(q.logs) == 0 {
 			// no empty queues
 			delete(l.queues, src)
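
Below is a minimal sketch of an in-package test for the new queue limit; it is not part of the diff above. It assumes the code lives in the same package as logSender, that agentsdk.Log exposes Output and Level fields, and the usual coder test helpers (slogtest, codersdk.LogLevelInfo); the import paths and the test name are assumptions based on the surrounding codebase.

// logs_queue_limit_sketch_test.go (hypothetical file name)
package agent

import (
	"strings"
	"testing"

	"cdr.dev/slog/sloggers/slogtest"
	"github.com/google/uuid"
	"golang.org/x/xerrors"

	"github.com/coder/coder/v2/codersdk"
	"github.com/coder/coder/v2/codersdk/agentsdk"
)

func TestLogSender_QueueLimit_Sketch(t *testing.T) {
	t.Parallel()

	l := newLogSender(slogtest.Make(t, nil))
	src := uuid.New()

	// Each line carries 1 KiB of output, so a little over 1024 of them push
	// outputLen past maxBytesQueued (1 MiB) and enqueue starts rejecting logs.
	line := agentsdk.Log{
		Output: strings.Repeat("x", 1024),
		Level:  codersdk.LogLevelInfo,
	}

	var err error
	for i := 0; i < 2048; i++ {
		if err = l.enqueue(src, line); err != nil {
			break
		}
	}
	// Once the limit is hit, enqueue returns the sentinel error and drops the
	// remaining logs instead of queuing them.
	if !xerrors.Is(err, MaxQueueExceededError) {
		t.Fatalf("expected MaxQueueExceededError, got: %v", err)
	}
}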