mirror of
https://github.com/grafana/grafana.git
synced 2025-02-25 18:55:37 -06:00
134 lines
5.4 KiB
Go
134 lines
5.4 KiB
Go
// Package instrumentation contains backend plugin instrumentation logic.
|
|
package instrumentation
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"time"
|
|
|
|
"github.com/grafana/grafana-plugin-sdk-go/backend"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/prometheus/client_golang/prometheus/promauto"
|
|
|
|
"github.com/grafana/grafana/pkg/infra/log"
|
|
"github.com/grafana/grafana/pkg/infra/tracing"
|
|
"github.com/grafana/grafana/pkg/plugins/backendplugin"
|
|
)
|
|
|
|
var (
|
|
pluginRequestCounter = promauto.NewCounterVec(prometheus.CounterOpts{
|
|
Namespace: "grafana",
|
|
Name: "plugin_request_total",
|
|
Help: "The total amount of plugin requests",
|
|
}, []string{"plugin_id", "endpoint", "status", "target"})
|
|
|
|
pluginRequestDuration = promauto.NewHistogramVec(prometheus.HistogramOpts{
|
|
Namespace: "grafana",
|
|
Name: "plugin_request_duration_milliseconds",
|
|
Help: "Plugin request duration",
|
|
Buckets: []float64{.005, .01, .025, .05, .1, .25, .5, 1, 2.5, 5, 10, 25, 50, 100},
|
|
}, []string{"plugin_id", "endpoint", "target"})
|
|
|
|
pluginRequestSizeHistogram = promauto.NewHistogramVec(
|
|
prometheus.HistogramOpts{
|
|
Namespace: "grafana",
|
|
Name: "plugin_request_size_bytes",
|
|
Help: "histogram of plugin request sizes returned",
|
|
Buckets: []float64{128, 256, 512, 1024, 2048, 4096, 8192, 16384, 32768, 65536, 131072, 262144, 524288, 1048576},
|
|
}, []string{"source", "plugin_id", "endpoint", "target"},
|
|
)
|
|
|
|
PluginRequestDurationSeconds = promauto.NewHistogramVec(prometheus.HistogramOpts{
|
|
Namespace: "grafana",
|
|
Name: "plugin_request_duration_seconds",
|
|
Help: "Plugin request duration in seconds",
|
|
Buckets: []float64{.005, .01, .025, .05, .1, .25, .5, 1, 2.5, 5, 10, 25},
|
|
}, []string{"source", "plugin_id", "endpoint", "status", "target"})
|
|
)
|
|
|
|
// Values used for the "status" metric label.
const (
	statusOK        = "ok"
	statusError     = "error"
	statusCancelled = "cancelled"
)

// Values used for the "endpoint" metric label, one per instrumented plugin
// endpoint.
const (
	endpointCallResource   = "callResource"
	endpointCheckHealth    = "checkHealth"
	endpointCollectMetrics = "collectMetrics"
	endpointQueryData      = "queryData"
)
|
|
|
|
// instrumentPluginRequest instruments success rate and latency of `fn`
|
|
func instrumentPluginRequest(ctx context.Context, cfg Cfg, pluginCtx *backend.PluginContext, endpoint string, fn func(ctx context.Context) error) error {
|
|
status := statusOK
|
|
start := time.Now()
|
|
|
|
ctx = instrumentContext(ctx, endpoint, *pluginCtx)
|
|
err := fn(ctx)
|
|
if err != nil {
|
|
status = statusError
|
|
if errors.Is(err, context.Canceled) {
|
|
status = statusCancelled
|
|
}
|
|
}
|
|
|
|
elapsed := time.Since(start)
|
|
|
|
pluginRequestDurationWithLabels := pluginRequestDuration.WithLabelValues(pluginCtx.PluginID, endpoint, string(cfg.Target))
|
|
pluginRequestCounterWithLabels := pluginRequestCounter.WithLabelValues(pluginCtx.PluginID, endpoint, status, string(cfg.Target))
|
|
pluginRequestDurationSecondsWithLabels := PluginRequestDurationSeconds.WithLabelValues("grafana-backend", pluginCtx.PluginID, endpoint, status, string(cfg.Target))
|
|
|
|
if traceID := tracing.TraceIDFromContext(ctx, true); traceID != "" {
|
|
pluginRequestDurationWithLabels.(prometheus.ExemplarObserver).ObserveWithExemplar(
|
|
float64(elapsed/time.Millisecond), prometheus.Labels{"traceID": traceID},
|
|
)
|
|
pluginRequestCounterWithLabels.(prometheus.ExemplarAdder).AddWithExemplar(1, prometheus.Labels{"traceID": traceID})
|
|
pluginRequestDurationSecondsWithLabels.(prometheus.ExemplarObserver).ObserveWithExemplar(
|
|
elapsed.Seconds(), prometheus.Labels{"traceID": traceID},
|
|
)
|
|
} else {
|
|
pluginRequestDurationWithLabels.Observe(float64(elapsed / time.Millisecond))
|
|
pluginRequestCounterWithLabels.Inc()
|
|
pluginRequestDurationSecondsWithLabels.Observe(elapsed.Seconds())
|
|
}
|
|
|
|
return err
|
|
}
|
|
|
|
func instrumentContext(ctx context.Context, endpoint string, pCtx backend.PluginContext) context.Context {
|
|
p := []any{"endpoint", endpoint, "pluginId", pCtx.PluginID}
|
|
if pCtx.DataSourceInstanceSettings != nil {
|
|
p = append(p, "dsName", pCtx.DataSourceInstanceSettings.Name)
|
|
p = append(p, "dsUID", pCtx.DataSourceInstanceSettings.UID)
|
|
}
|
|
return log.WithContextualAttributes(ctx, p)
|
|
}
|
|
|
|
type Cfg struct {
|
|
Target backendplugin.Target
|
|
}
|
|
|
|
// InstrumentCollectMetrics instruments collectMetrics.
|
|
func InstrumentCollectMetrics(ctx context.Context, req *backend.PluginContext, cfg Cfg, fn func(ctx context.Context) error) error {
|
|
return instrumentPluginRequest(ctx, cfg, req, endpointCollectMetrics, fn)
|
|
}
|
|
|
|
// InstrumentCheckHealthRequest instruments checkHealth.
|
|
func InstrumentCheckHealthRequest(ctx context.Context, req *backend.PluginContext, cfg Cfg, fn func(ctx context.Context) error) error {
|
|
return instrumentPluginRequest(ctx, cfg, req, endpointCheckHealth, fn)
|
|
}
|
|
|
|
// InstrumentCallResourceRequest instruments callResource.
|
|
func InstrumentCallResourceRequest(ctx context.Context, req *backend.PluginContext, cfg Cfg, requestSize float64, fn func(ctx context.Context) error) error {
|
|
pluginRequestSizeHistogram.WithLabelValues("grafana-backend", req.PluginID, endpointCallResource,
|
|
string(cfg.Target)).Observe(requestSize)
|
|
return instrumentPluginRequest(ctx, cfg, req, endpointCallResource, fn)
|
|
}
|
|
|
|
// InstrumentQueryDataRequest instruments success rate and latency of query data requests.
|
|
func InstrumentQueryDataRequest(ctx context.Context, req *backend.PluginContext, cfg Cfg,
|
|
requestSize float64, fn func(ctx context.Context) error) error {
|
|
pluginRequestSizeHistogram.WithLabelValues("grafana-backend", req.PluginID, endpointQueryData,
|
|
string(cfg.Target)).Observe(requestSize)
|
|
return instrumentPluginRequest(ctx, cfg, req, endpointQueryData, fn)
|
|
}
|