Alerting: refactor state tracker (#33292)

* set processing time * merge labels and set on response * use state cache for adding alerts to rules * minor cleanup * add support for NoData and Error results * rename test * bring in changes from other PRs that have been merged * pr feedback * add integration test * close state tracker cleanup on context.Done * fixup test * rename state tracker * set EvaluationDuration on Result * default labels set as constants * separate cache and state from manager * use RWMutex in cache
2025-02-25 18:55:37 -06:00 · 2021-04-23 12:32:25 -07:00
parent ca79206498
commit 788bc2a793
13 changed files with 564 additions and 475 deletions
--- a/pkg/services/ngalert/state/cache.go
+++ b/pkg/services/ngalert/state/cache.go
@@ -0,0 +1,135 @@
+package state
+
+import (
+	"fmt"
+	"sync"
+
+	"github.com/grafana/grafana-plugin-sdk-go/data"
+
+	"github.com/grafana/grafana/pkg/services/ngalert/eval"
+	ngModels "github.com/grafana/grafana/pkg/services/ngalert/models"
+	prometheusModel "github.com/prometheus/common/model"
+)
+
+// cache is an in-memory store of alert states keyed by State.CacheId.
+// Every method in this file acquires mtxStates before touching states.
+type cache struct {
+	states    map[string]*State
+	mtxStates sync.RWMutex
+}
+
+// newCache returns an empty cache whose states map is initialized and ready
+// for writes.
+func newCache() *cache {
+	c := new(cache)
+	c.states = map[string]*State{}
+	return c
+}
+
+func (c *cache) getOrCreate(alertRule *ngModels.AlertRule, result eval.Result) *State {
+	c.mtxStates.Lock()
+	defer c.mtxStates.Unlock()
+
+	// if duplicate labels exist, alertRule label will take precedence
+	lbs := mergeLabels(alertRule.Labels, result.Instance)
+	lbs[ngModels.UIDLabel] = alertRule.UID
+	lbs[ngModels.NamespaceUIDLabel] = alertRule.NamespaceUID
+	lbs[prometheusModel.AlertNameLabel] = alertRule.Title
+
+	id := fmt.Sprintf("%s", map[string]string(lbs))
+	if state, ok := c.states[id]; ok {
+		return state
+	}
+
+	annotations := map[string]string{}
+	if len(alertRule.Annotations) > 0 {
+		annotations = alertRule.Annotations
+	}
+
+	// If the first result we get is alerting, set StartsAt to EvaluatedAt because we
+	// do not have data for determining StartsAt otherwise
+	newState := &State{
+		AlertRuleUID:       alertRule.UID,
+		OrgID:              alertRule.OrgID,
+		CacheId:            id,
+		Labels:             lbs,
+		State:              result.State,
+		Annotations:        annotations,
+		EvaluationDuration: result.EvaluationDuration,
+	}
+	if result.State == eval.Alerting {
+		newState.StartsAt = result.EvaluatedAt
+	}
+	c.states[id] = newState
+	return newState
+}
+
+// set stores entry under its CacheId, replacing any state already cached
+// under that key.
+func (c *cache) set(entry *State) {
+	c.mtxStates.Lock()
+	defer c.mtxStates.Unlock()
+
+	key := entry.CacheId
+	c.states[key] = entry
+}
+
+// get returns the state cached under id, or an error when no entry exists
+// for that id.
+func (c *cache) get(id string) (*State, error) {
+	// Lookup is read-only, so a shared lock is enough and lets concurrent
+	// readers proceed in parallel.
+	c.mtxStates.RLock()
+	defer c.mtxStates.RUnlock()
+
+	state, ok := c.states[id]
+	if !ok {
+		return nil, fmt.Errorf("no entry for id: %s", id)
+	}
+	return state, nil
+}
+
+// getAll returns every cached state in unspecified (map iteration) order.
+// The result is nil when the cache is empty.
+func (c *cache) getAll() []*State {
+	// Read-only traversal: take the shared lock so readers do not serialize.
+	c.mtxStates.RLock()
+	defer c.mtxStates.RUnlock()
+
+	var states []*State
+	// Pre-size only when there is something to return, so an empty cache
+	// still yields a nil slice as before.
+	if n := len(c.states); n > 0 {
+		states = make([]*State, 0, n)
+	}
+	for _, v := range c.states {
+		states = append(states, v)
+	}
+	return states
+}
+
+// getStatesByRuleUID groups all cached states by their AlertRuleUID.
+// The returned map is freshly allocated; the states it references are the
+// same pointers held by the cache.
+func (c *cache) getStatesByRuleUID() map[string][]*State {
+	ruleMap := make(map[string][]*State)
+
+	// Read-only traversal: take the shared lock so readers do not serialize.
+	c.mtxStates.RLock()
+	defer c.mtxStates.RUnlock()
+
+	for _, state := range c.states {
+		// append on the nil slice of a missing key creates the slice, so no
+		// separate "first element" branch is needed.
+		ruleMap[state.AlertRuleUID] = append(ruleMap[state.AlertRuleUID], state)
+	}
+	return ruleMap
+}
+
+// reset discards every cached state by swapping in a fresh, empty map.
+func (c *cache) reset() {
+	c.mtxStates.Lock()
+	defer c.mtxStates.Unlock()
+
+	c.states = map[string]*State{}
+}
+
+// trim bounds the evaluation history of every cached state: any state with
+// more than 100 Results keeps only its 100 most recent ones.
+func (c *cache) trim() {
+	c.mtxStates.Lock()
+	defer c.mtxStates.Unlock()
+	for _, v := range c.states {
+		if n := len(v.Results); n > 100 {
+			// Copy the tail into a fresh slice so the old, larger backing
+			// array can be garbage collected.
+			newResults := make([]Evaluation, 100)
+			copy(newResults, v.Results[n-100:])
+			// v is the pointer stored in the map, so assigning through it
+			// updates the cached state in place. Calling c.set here would
+			// re-acquire mtxStates, which this goroutine already holds, and
+			// deadlock.
+			v.Results = newResults
+		}
+	}
+}
+
+// mergeLabels returns a new label set containing every key from a and b.
+// When a key is present in both, the value from a (the first set) is kept.
+// Neither input is modified.
+func mergeLabels(a, b data.Labels) data.Labels {
+	merged := data.Labels{}
+	// Seed with b first, then let a overwrite, so a wins on duplicates.
+	for name, value := range b {
+		merged[name] = value
+	}
+	for name, value := range a {
+		merged[name] = value
+	}
+	return merged
+}