Notifications: You must be signed in to change notification settings
Fork: 929
Star: 10.1k

Commit b6e86a2

committed

Refactoring

Signed-off-by: Danny Kopping <danny@coder.com>

1 parent fcbffe0 · commit b6e86a2 · Copy full SHA for b6e86a2

File tree

2 files changed

+122

-41

lines changed

coderd/prometheusmetrics
- aggregator.go
- aggregator_test.go

2 files changed

+122

-41

lines changed

`‎coderd/prometheusmetrics/aggregator.go`

Lines changed: 38 additions & 31 deletions

Original file line number	Diff line number	Diff line change
`@@ -9,6 +9,7 @@ import (`
`9`	`9`
`10`	`10`	`"github.com/coder/coder/v2/coderd/agentmetrics"`
`11`	`11`	`"github.com/prometheus/client_golang/prometheus"`
	`12`	`+"github.com/prometheus/common/model"`
`12`	`13`	`"golang.org/x/xerrors"`
`13`	`14`
`14`	`15`	`"cdr.dev/slog"`
`@@ -107,8 +108,9 @@ var _ prometheus.Collector = new(MetricsAggregator)`
`107`	`108`
`108`	`109`	`func (am*annotatedMetric)asPrometheus() (prometheus.Metric,error) {`
`109`	`110`	`var (`
`110`		`-baseLabelNames[]string=am.aggregateByLabels`
	`111`	`+baseLabelNames=am.aggregateByLabels`
`111`	`112`	`baseLabelValues []string`
	`113`	`+extraLabels=am.Labels`
`112`	`114`	`)`
`113`	`115`
`114`	`116`	`for_,label:=rangeam.aggregateByLabels {`
`@@ -120,19 +122,17 @@ func (am *annotatedMetric) asPrometheus() (prometheus.Metric, error) {`
`120`	`122`	`baseLabelValues=append(baseLabelValues,val)`
`121`	`123`	`}`
`122`	`124`
`123`		`-labels:=make([]string,0,len(baseLabelNames)+len(am.Labels))`
`124`		`-labelValues:=make([]string,0,len(baseLabelNames)+len(am.Labels))`
	`125`	`+labels:=make([]string,0,len(baseLabelNames)+len(extraLabels))`
	`126`	`+labelValues:=make([]string,0,len(baseLabelNames)+len(extraLabels))`
`125`	`127`
`126`	`128`	`labels=append(labels,baseLabelNames...)`
`127`	`129`	`labelValues=append(labelValues,baseLabelValues...)`
`128`	`130`
`129`		`-for_,l:=rangeam.Labels {`
	`131`	`+for_,l:=rangeextraLabels {`
`130`	`132`	`labels=append(labels,l.Name)`
`131`	`133`	`labelValues=append(labelValues,l.Value)`
`132`	`134`	`}`
`133`	`135`
`134`		`-//fmt.Printf(">>>>[%s] [%s] %s [%q] [%q]: %v\n", time.Now().Format(time.RFC3339Nano), am.Type, am.Name, labels, labelValues, am.Value)`
`135`		`-`
`136`	`136`	`desc:=prometheus.NewDesc(am.Name,metricHelpForAgent,labels,nil)`
`137`	`137`	`valueType,err:=asPrometheusValueType(am.Type)`
`138`	`138`	`iferr!=nil {`
`@@ -237,50 +237,56 @@ func NewMetricsAggregator(logger slog.Logger, registerer prometheus.Registerer,`
`237`	`237`	`},nil`
`238`	`238`	`}`
`239`	`239`
`240`		`-typeMetricAggregatorstruct {`
	`240`	`+// labelAggregator is used to control cardinality of collected Prometheus metrics by pre-aggregating series based on given labels.`
	`241`	`+typelabelAggregatorstruct {`
`241`	`242`	`aggregationsmap[string]float64`
`242`	`243`	`metricsmap[string]annotatedMetric`
`243`	`244`	`}`
`244`	`245`
`245`		`-funcNewMetricAggregator(sizeint)*MetricAggregator {`
`246`		`-return&MetricAggregator{`
	`246`	`+funcnewLabelAggregator(sizeint)*labelAggregator {`
	`247`	`+return&labelAggregator{`
`247`	`248`	`aggregations:make(map[string]float64,size),`
`248`	`249`	`metrics:make(map[string]annotatedMetric,size),`
`249`	`250`	`}`
`250`	`251`	`}`
`251`	`252`
`252`		`-func (a*MetricAggregator)Aggregate(amannotatedMetric,labels []string)error {`
`253`		`-// if we already have an entry for this key, don't clone this am afresh - rather use the existing one`
`254`		`-// this will be a bit more memory efficient`
`255`		`-// ...do this after unit-test is written`
`256`		`-`
`257`		`-clone:=am.clone()`
`258`		`-`
`259`		`-fields:=make(map[string]string,len(labels))`
	`253`	`+func (a*labelAggregator)aggregate(amannotatedMetric,labels []string)error {`
	`254`	`+// Use a LabelSet because it can give deterministic fingerprints of label combinations regardless of map ordering.`
	`255`	`+labelSet:=make(model.LabelSet,len(labels))`
`260`	`256`	`labelValues:=make([]string,0,len(labels))`
`261`	`257`
`262`	`258`	`for_,label:=rangelabels {`
`263`		`-val,err:=clone.getFieldByLabel(label)`
	`259`	`+val,err:=am.getFieldByLabel(label)`
`264`	`260`	`iferr!=nil {`
`265`	`261`	`returnerr`
`266`	`262`	`}`
`267`	`263`
`268`		`-fields[label]=val`
	`264`	`+labelSet[model.LabelName(label)]=model.LabelValue(val)`
`269`	`265`	`labelValues=append(labelValues,val)`
`270`	`266`	`}`
`271`	`267`
`272`		`-key:=fmt.Sprintf("%s:%v",clone.Stats_Metric.Name,fields)`
	`268`	`+// Memoize based on the metric name & the unique combination of labels.`
	`269`	`+key:=fmt.Sprintf("%s:%v",am.Stats_Metric.Name,labelSet.FastFingerprint())`
	`270`	`+`
	`271`	`+// Aggregate the value based on the key.`
	`272`	`+a.aggregations[key]+=am.Value`
	`273`	`+`
	`274`	`+metric,found:=a.metrics[key]`
	`275`	`+if!found {`
	`276`	`+// Take a copy of the given annotatedMetric because it may be manipulated later and contains pointers.`
	`277`	`+metric=am.clone()`
	`278`	`+}`
`273`	`279`
`274`		`-clone.aggregateByLabels=labels`
`275`		`-a.aggregations[key]+=clone.Value`
	`280`	`+// Store the metric.`
	`281`	`+metric.aggregateByLabels=labels`
	`282`	`+metric.Value=a.aggregations[key]`
`276`	`283`
`277`		`-clone.Value=a.aggregations[key]`
`278`		`-a.metrics[key]=clone`
	`284`	`+a.metrics[key]=metric`
`279`	`285`
`280`	`286`	`returnnil`
`281`	`287`	`}`
`282`	`288`
`283`		`-func (a*MetricAggregator)asMetrics() (out []annotatedMetric) {`
	`289`	`+func (a*labelAggregator)toMetrics() (out []annotatedMetric) {`
`284`	`290`	`for_,am:=rangea.metrics {`
`285`	`291`	`out=append(out,am)`
`286`	`292`	`}`
`@@ -331,24 +337,25 @@ func (ma *MetricsAggregator) Run(ctx context.Context) func() {`
`331`	`337`
`332`	`338`	`// If custom aggregation labels have not been chosen, generate Prometheus metrics without any pre-aggregation.`
`333`	`339`	`// This results in higher cardinality, but may be desirable in larger deployments.`
	`340`	`+// Default behaviour.`
`334`	`341`	`iflen(ma.aggregateByLabels)==0 {`
`335`	`342`	`for_,m:=rangema.store {`
`336`		`-// Aggregate by high cardinality labels.`
`337`		`-m.aggregateByLabels=agentMetricsLabels`
	`343`	`+// Aggregate by all available metrics.`
	`344`	`+m.aggregateByLabels=defaultAgentMetricsLabels`
`338`	`345`	`input=append(input,m)`
`339`	`346`	`}`
`340`	`347`	`}else {`
`341`	`348`	`// However, if custom aggregations have been chosen, we need to aggregate the values from the annotated`
`342`	`349`	`// metrics because we cannot register multiple metric series with the same labels.`
`343`		`-aggregator:=NewMetricAggregator(len(ma.store)*len(ma.aggregateByLabels))`
	`350`	`+la:=newLabelAggregator(len(ma.store))`
`344`	`351`
`345`	`352`	`for_,m:=rangema.store {`
`346`		`-iferr:=aggregator.Aggregate(m,ma.aggregateByLabels);err!=nil {`
	`353`	`+iferr:=la.aggregate(m,ma.aggregateByLabels);err!=nil {`
`347`	`354`	`ma.log.Error(ctx,"can't aggregate labels",slog.F("labels",strings.Join(ma.aggregateByLabels,",")),slog.Error(err))`
`348`	`355`	`}`
`349`	`356`	`}`
`350`	`357`
`351`		`-input=aggregator.asMetrics()`
	`358`	`+input=la.toMetrics()`
`352`	`359`	`}`
`353`	`360`
`354`	`361`	`for_,m:=rangeinput {`
`@@ -395,7 +402,7 @@ func (ma *MetricsAggregator) Run(ctx context.Context) func() {`
`395`	`402`	`func (MetricsAggregator)Describe(_chan<-prometheus.Desc) {`
`396`	`403`	`}`
`397`	`404`
`398`		`-varagentMetricsLabels= []string{agentmetrics.UsernameLabel,agentmetrics.WorkspaceNameLabel,agentmetrics.AgentNameLabel,agentmetrics.TemplateNameLabel}`
	`405`	`+vardefaultAgentMetricsLabels= []string{agentmetrics.UsernameLabel,agentmetrics.WorkspaceNameLabel,agentmetrics.AgentNameLabel,agentmetrics.TemplateNameLabel}`
`399`	`406`
`400`	`407`	`// AgentMetricLabels are the labels used to decorate an agent's metrics.`
`401`	`408`	`// This list should match the list of labels in agentMetricsLabels.`

`‎coderd/prometheusmetrics/aggregator_test.go`

Lines changed: 84 additions & 10 deletions

Original file line number	Diff line number	Diff line change
`@@ -8,14 +8,13 @@ import (`
`8`	`8`	`"testing"`
`9`	`9`	`"time"`
`10`	`10`
	`11`	`+"cdr.dev/slog/sloggers/slogtest"`
`11`	`12`	`"github.com/coder/coder/v2/coderd/agentmetrics"`
`12`	`13`	`"github.com/prometheus/client_golang/prometheus"`
`13`	`14`	`dto"github.com/prometheus/client_model/go"`
`14`	`15`	`"github.com/stretchr/testify/assert"`
`15`	`16`	`"github.com/stretchr/testify/require"`
`16`	`17`
`17`		`-"cdr.dev/slog/sloggers/slogtest"`
`18`		`-`
`19`	`18`	`agentproto"github.com/coder/coder/v2/agent/proto"`
`20`	`19`	`"github.com/coder/coder/v2/coderd/prometheusmetrics"`
`21`	`20`	`"github.com/coder/coder/v2/cryptorand"`
`@@ -324,23 +323,19 @@ func TestLabelsAggregation(t *testing.T) {`
`324`	`323`	`{`
`325`	`324`	`labels:testLabels,`
`326`	`325`	`metrics: []*agentproto.Stats_Metric{`
`327`		`-{Name:"no_extra_labels",Type:agentproto.Stats_Metric_COUNTER,Value:1},`
	`326`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:1},`
`328`	`327`	`},`
`329`	`328`	`},`
`330`	`329`	`{`
`331`	`330`	`labels:testLabels,`
`332`	`331`	`metrics: []*agentproto.Stats_Metric{`
`333`		`-{Name:"extra_label",Type:agentproto.Stats_Metric_COUNTER,Value:27,Labels: []*agentproto.Stats_Metric_Label{`
`334`		`-{Name:"lizz",Value:"rizz"},`
`335`		`-}},`
	`332`	`+{Name:"active_conns",Type:agentproto.Stats_Metric_GAUGE,Value:4},`
`336`	`333`	`},`
`337`	`334`	`},`
`338`	`335`	`},`
`339`	`336`	`expected: []*agentproto.Stats_Metric{`
`340`		`-{Name:"no_extra_labels",Type:agentproto.Stats_Metric_COUNTER,Value:1,Labels:commonLabels},`
`341`		`-{Name:"extra_label",Type:agentproto.Stats_Metric_COUNTER,Value:27,Labels:append([]*agentproto.Stats_Metric_Label{`
`342`		`-{Name:"lizz",Value:"rizz"},`
`343`		`-},commonLabels...)},`
	`337`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:1,Labels:commonLabels},`
	`338`	`+{Name:"active_conns",Type:agentproto.Stats_Metric_GAUGE,Value:4,Labels:commonLabels},`
`344`	`339`	`},`
`345`	`340`	`},`
`346`	`341`	`{`
`@@ -484,6 +479,85 @@ func TestLabelsAggregation(t *testing.T) {`
`484`	`479`	`}},`
`485`	`480`	`},`
`486`	`481`	`},`
	`482`	`+{`
	`483`	`+name:"extra labels are retained, even with label aggregations",`
	`484`	`+aggregateOn: []string{agentmetrics.UsernameLabel},`
	`485`	`+given: []statCollection{`
	`486`	`+{`
	`487`	`+labels:testLabels,`
	`488`	`+metrics: []*agentproto.Stats_Metric{`
	`489`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:1},`
	`490`	`+},`
	`491`	`+},`
	`492`	`+{`
	`493`	`+labels:testLabels,`
	`494`	`+metrics: []*agentproto.Stats_Metric{`
	`495`	`+{Name:"extra_label",Type:agentproto.Stats_Metric_COUNTER,Value:27,Labels: []*agentproto.Stats_Metric_Label{`
	`496`	`+{Name:"lizz",Value:"rizz"},`
	`497`	`+}},`
	`498`	`+},`
	`499`	`+},`
	`500`	`+},`
	`501`	`+expected: []*agentproto.Stats_Metric{`
	`502`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:1,Labels: []*agentproto.Stats_Metric_Label{`
	`503`	`+{Name:agentmetrics.UsernameLabel,Value:testUsername},`
	`504`	`+}},`
	`505`	`+{Name:"extra_label",Type:agentproto.Stats_Metric_COUNTER,Value:27,Labels: []*agentproto.Stats_Metric_Label{`
	`506`	`+{Name:"lizz",Value:"rizz"},`
	`507`	`+{Name:agentmetrics.UsernameLabel,Value:testUsername},`
	`508`	`+}},`
	`509`	`+},`
	`510`	`+},`
	`511`	`+{`
	`512`	`+// Both counters and gauges should have all their values summed to produce the correct output.`
	`513`	`+name:"counters & gauges behave identically",`
	`514`	`+aggregateOn: []string{agentmetrics.TemplateNameLabel},`
	`515`	`+given: []statCollection{`
	`516`	`+{`
	`517`	`+labels: prometheusmetrics.AgentMetricLabels{`
	`518`	`+Username:"username1",`
	`519`	`+TemplateName:"template1",`
	`520`	`+},`
	`521`	`+metrics: []*agentproto.Stats_Metric{`
	`522`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:1},`
	`523`	`+{Name:"active_conns",Type:agentproto.Stats_Metric_GAUGE,Value:3},`
	`524`	`+},`
	`525`	`+},`
	`526`	`+{`
	`527`	`+labels: prometheusmetrics.AgentMetricLabels{`
	`528`	`+Username:"username2",`
	`529`	`+TemplateName:"template1",`
	`530`	`+},`
	`531`	`+metrics: []*agentproto.Stats_Metric{`
	`532`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:2},`
	`533`	`+{Name:"active_conns",Type:agentproto.Stats_Metric_GAUGE,Value:4},`
	`534`	`+},`
	`535`	`+},`
	`536`	`+},`
	`537`	`+expected: []*agentproto.Stats_Metric{`
	`538`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:3,Labels: []*agentproto.Stats_Metric_Label{`
	`539`	`+{Name:agentmetrics.TemplateNameLabel,Value:"template1"},`
	`540`	`+}},`
	`541`	`+{Name:"active_conns",Type:agentproto.Stats_Metric_GAUGE,Value:7,Labels: []*agentproto.Stats_Metric_Label{`
	`542`	`+{Name:agentmetrics.TemplateNameLabel,Value:"template1"},`
	`543`	`+}},`
	`544`	`+},`
	`545`	`+},`
	`546`	`+{`
	`547`	`+// Scenario: validation fails and an invalid label is selected for aggregation.`
	`548`	`+name:"invalid label aggregation",`
	`549`	`+aggregateOn: []string{"nonsense"},`
	`550`	`+given: []statCollection{`
	`551`	`+{`
	`552`	`+labels:testLabels,`
	`553`	`+metrics: []*agentproto.Stats_Metric{`
	`554`	`+{Name:"user_counter",Type:agentproto.Stats_Metric_COUNTER,Value:1},`
	`555`	`+},`
	`556`	`+},`
	`557`	`+},`
	`558`	`+// Nothing will be returned.`
	`559`	`+expected: []*agentproto.Stats_Metric{},`
	`560`	`+},`
`487`	`561`	`}`
`488`	`562`
`489`	`563`	`for_,tc:=rangetests {`

0 commit comments

Comments

(0)

Movatterモバイル変換

Navigation Menu

Search code, repositories, users, issues, pull requests...

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Commit b6e86a2

File tree

2 files changed

2 files changed

`‎coderd/prometheusmetrics/aggregator.go`

`‎coderd/prometheusmetrics/aggregator_test.go`

0 commit comments