mirror of
https://github.com/grafana/grafana.git
synced 2025-02-14 17:43:35 -06:00
309 lines
7.5 KiB
Go
309 lines
7.5 KiB
Go
package tracing
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"net/http"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/go-kit/log/level"
|
|
"go.etcd.io/etcd/api/v3/version"
|
|
jaegerpropagator "go.opentelemetry.io/contrib/propagators/jaeger"
|
|
"go.opentelemetry.io/otel"
|
|
"go.opentelemetry.io/otel/attribute"
|
|
"go.opentelemetry.io/otel/codes"
|
|
"go.opentelemetry.io/otel/exporters/jaeger"
|
|
"go.opentelemetry.io/otel/exporters/otlp/otlptrace"
|
|
"go.opentelemetry.io/otel/exporters/otlp/otlptrace/otlptracegrpc"
|
|
"go.opentelemetry.io/otel/propagation"
|
|
"go.opentelemetry.io/otel/sdk/resource"
|
|
tracesdk "go.opentelemetry.io/otel/sdk/trace"
|
|
semconv "go.opentelemetry.io/otel/semconv/v1.4.0"
|
|
trace "go.opentelemetry.io/otel/trace"
|
|
|
|
"github.com/grafana/grafana/pkg/infra/log"
|
|
"github.com/grafana/grafana/pkg/setting"
|
|
)
|
|
|
|
const (
|
|
jaegerExporter string = "jaeger"
|
|
otlpExporter string = "otlp"
|
|
noopExporter string = "noop"
|
|
|
|
jaegerPropagator string = "jaeger"
|
|
w3cPropagator string = "w3c"
|
|
)
|
|
|
|
type Opentelemetry struct {
|
|
enabled string
|
|
address string
|
|
propagation string
|
|
customAttribs []attribute.KeyValue
|
|
log log.Logger
|
|
|
|
tracerProvider tracerProvider
|
|
tracer trace.Tracer
|
|
|
|
Cfg *setting.Cfg
|
|
}
|
|
|
|
type tracerProvider interface {
|
|
trace.TracerProvider
|
|
|
|
Shutdown(ctx context.Context) error
|
|
}
|
|
|
|
type OpentelemetrySpan struct {
|
|
span trace.Span
|
|
}
|
|
|
|
type EventValue struct {
|
|
Str string
|
|
Num int64
|
|
}
|
|
|
|
type otelErrHandler func(err error)
|
|
|
|
func (o otelErrHandler) Handle(err error) {
|
|
o(err)
|
|
}
|
|
|
|
type noopTracerProvider struct {
|
|
trace.TracerProvider
|
|
}
|
|
|
|
func (noopTracerProvider) Shutdown(ctx context.Context) error {
|
|
return nil
|
|
}
|
|
|
|
func (ots *Opentelemetry) parseSettingsOpentelemetry() error {
|
|
section, err := ots.Cfg.Raw.GetSection("tracing.opentelemetry")
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
ots.customAttribs, err = splitCustomAttribs(section.Key("custom_attributes").MustString(""))
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
section, err = ots.Cfg.Raw.GetSection("tracing.opentelemetry.jaeger")
|
|
if err != nil {
|
|
return err
|
|
}
|
|
ots.enabled = noopExporter
|
|
|
|
ots.address = section.Key("address").MustString("")
|
|
ots.propagation = section.Key("propagation").MustString("")
|
|
if ots.address != "" {
|
|
ots.enabled = jaegerExporter
|
|
return nil
|
|
}
|
|
|
|
section, err = ots.Cfg.Raw.GetSection("tracing.opentelemetry.otlp")
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
ots.address = section.Key("address").MustString("")
|
|
if ots.address != "" {
|
|
ots.enabled = otlpExporter
|
|
}
|
|
ots.propagation = section.Key("propagation").MustString("")
|
|
return nil
|
|
}
|
|
|
|
func splitCustomAttribs(s string) ([]attribute.KeyValue, error) {
|
|
res := []attribute.KeyValue{}
|
|
|
|
attribs := strings.Split(s, ",")
|
|
for _, v := range attribs {
|
|
parts := strings.SplitN(v, ":", 2)
|
|
if len(parts) > 1 {
|
|
res = append(res, attribute.String(parts[0], parts[1]))
|
|
} else if v != "" {
|
|
return nil, fmt.Errorf("custom attribute malformed - must be in 'key:value' form: %q", v)
|
|
}
|
|
}
|
|
|
|
return res, nil
|
|
}
|
|
|
|
func (ots *Opentelemetry) initJaegerTracerProvider() (*tracesdk.TracerProvider, error) {
|
|
// Create the Jaeger exporter
|
|
exp, err := jaeger.New(jaeger.WithCollectorEndpoint(jaeger.WithEndpoint(ots.address)))
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
res, err := resource.New(
|
|
context.Background(),
|
|
resource.WithAttributes(
|
|
// TODO: why are these attributes different from ones added to the
|
|
// OTLP provider?
|
|
semconv.ServiceNameKey.String("grafana"),
|
|
attribute.String("environment", "production"),
|
|
),
|
|
resource.WithAttributes(ots.customAttribs...),
|
|
)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
tp := tracesdk.NewTracerProvider(
|
|
tracesdk.WithBatcher(exp),
|
|
tracesdk.WithResource(res),
|
|
)
|
|
|
|
return tp, nil
|
|
}
|
|
|
|
func (ots *Opentelemetry) initOTLPTracerProvider() (*tracesdk.TracerProvider, error) {
|
|
client := otlptracegrpc.NewClient(otlptracegrpc.WithEndpoint(ots.address), otlptracegrpc.WithInsecure())
|
|
exp, err := otlptrace.New(context.Background(), client)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
res, err := resource.New(
|
|
context.Background(),
|
|
resource.WithAttributes(
|
|
semconv.ServiceNameKey.String("grafana"),
|
|
semconv.ServiceVersionKey.String(version.Version),
|
|
),
|
|
resource.WithAttributes(ots.customAttribs...),
|
|
resource.WithProcessRuntimeDescription(),
|
|
resource.WithTelemetrySDK(),
|
|
)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
tp := tracesdk.NewTracerProvider(
|
|
tracesdk.WithBatcher(exp),
|
|
tracesdk.WithSampler(tracesdk.ParentBased(
|
|
tracesdk.AlwaysSample(),
|
|
)),
|
|
tracesdk.WithResource(res),
|
|
)
|
|
return tp, nil
|
|
}
|
|
|
|
func (ots *Opentelemetry) initNoopTracerProvider() (tracerProvider, error) {
|
|
return &noopTracerProvider{TracerProvider: trace.NewNoopTracerProvider()}, nil
|
|
}
|
|
|
|
func (ots *Opentelemetry) initOpentelemetryTracer() error {
|
|
var tp tracerProvider
|
|
var err error
|
|
switch ots.enabled {
|
|
case jaegerExporter:
|
|
tp, err = ots.initJaegerTracerProvider()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
case otlpExporter:
|
|
tp, err = ots.initOTLPTracerProvider()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
default:
|
|
tp, err = ots.initNoopTracerProvider()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
// Register our TracerProvider as the global so any imported
|
|
// instrumentation in the future will default to using it
|
|
// only if tracing is enabled
|
|
if ots.enabled != "" {
|
|
otel.SetTracerProvider(tp)
|
|
}
|
|
|
|
switch ots.propagation {
|
|
case w3cPropagator:
|
|
otel.SetTextMapPropagator(propagation.TraceContext{})
|
|
case jaegerPropagator:
|
|
otel.SetTextMapPropagator(jaegerpropagator.Jaeger{})
|
|
default:
|
|
otel.SetTextMapPropagator(propagation.TraceContext{})
|
|
}
|
|
ots.tracerProvider = tp
|
|
ots.tracer = otel.GetTracerProvider().Tracer("component-main")
|
|
|
|
return nil
|
|
}
|
|
|
|
func (ots *Opentelemetry) Run(ctx context.Context) error {
|
|
otel.SetErrorHandler(otelErrHandler(func(err error) {
|
|
err = level.Error(ots.log).Log("msg", "OpenTelemetry handler returned an error", "err", err)
|
|
if err != nil {
|
|
ots.log.Error("OpenTelemetry log returning error", err)
|
|
}
|
|
}))
|
|
<-ctx.Done()
|
|
|
|
ots.log.Info("Closing tracing")
|
|
if ots.tracerProvider == nil {
|
|
return nil
|
|
}
|
|
ctxShutdown, cancel := context.WithTimeout(ctx, time.Second*5)
|
|
defer cancel()
|
|
|
|
if err := ots.tracerProvider.Shutdown(ctxShutdown); err != nil {
|
|
return err
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
func (ots *Opentelemetry) Start(ctx context.Context, spanName string, opts ...trace.SpanStartOption) (context.Context, Span) {
|
|
ctx, span := ots.tracer.Start(ctx, spanName, opts...)
|
|
opentelemetrySpan := OpentelemetrySpan{
|
|
span: span,
|
|
}
|
|
|
|
if traceID := span.SpanContext().TraceID(); traceID.IsValid() {
|
|
ctx = context.WithValue(ctx, traceKey{}, traceValue{traceID.String(), span.SpanContext().IsSampled()})
|
|
}
|
|
|
|
return ctx, opentelemetrySpan
|
|
}
|
|
|
|
func (ots *Opentelemetry) Inject(ctx context.Context, header http.Header, _ Span) {
|
|
otel.GetTextMapPropagator().Inject(ctx, propagation.HeaderCarrier(header))
|
|
}
|
|
|
|
func (s OpentelemetrySpan) End() {
|
|
s.span.End()
|
|
}
|
|
|
|
func (s OpentelemetrySpan) SetAttributes(key string, value interface{}, kv attribute.KeyValue) {
|
|
s.span.SetAttributes(kv)
|
|
}
|
|
|
|
func (s OpentelemetrySpan) SetName(name string) {
|
|
s.span.SetName(name)
|
|
}
|
|
|
|
func (s OpentelemetrySpan) SetStatus(code codes.Code, description string) {
|
|
s.span.SetStatus(code, description)
|
|
}
|
|
|
|
func (s OpentelemetrySpan) RecordError(err error, options ...trace.EventOption) {
|
|
s.span.RecordError(err, options...)
|
|
}
|
|
|
|
func (s OpentelemetrySpan) AddEvents(keys []string, values []EventValue) {
|
|
for i, v := range values {
|
|
if v.Str != "" {
|
|
s.span.AddEvent(keys[i], trace.WithAttributes(attribute.Key(keys[i]).String(v.Str)))
|
|
}
|
|
if v.Num != 0 {
|
|
s.span.AddEvent(keys[i], trace.WithAttributes(attribute.Key(keys[i]).Int64(v.Num)))
|
|
}
|
|
}
|
|
}
|