2017-04-03 07:50:40 -05:00
|
|
|
package cloudwatch
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2020-04-25 15:48:20 -05:00
|
|
|
"fmt"
|
2017-04-03 07:50:40 -05:00
|
|
|
"regexp"
|
2020-04-25 15:48:20 -05:00
|
|
|
"sync"
|
|
|
|
"time"
|
2017-04-03 07:50:40 -05:00
|
|
|
|
2020-06-09 06:13:06 -05:00
|
|
|
"github.com/grafana/grafana-plugin-sdk-go/data"
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
"github.com/aws/aws-sdk-go/aws"
|
|
|
|
"github.com/aws/aws-sdk-go/aws/client"
|
2020-07-14 01:23:23 -05:00
|
|
|
"github.com/aws/aws-sdk-go/aws/request"
|
2020-07-23 11:52:22 -05:00
|
|
|
"github.com/aws/aws-sdk-go/aws/session"
|
2020-07-14 01:23:23 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/cloudwatch"
|
2020-07-23 11:52:22 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/cloudwatch/cloudwatchiface"
|
2020-04-25 15:48:20 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/cloudwatchlogs"
|
2020-07-23 01:17:20 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/cloudwatchlogs/cloudwatchlogsiface"
|
2020-07-23 11:52:22 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/ec2"
|
2019-04-15 10:55:07 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/ec2/ec2iface"
|
2020-07-23 11:52:22 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/resourcegroupstaggingapi"
|
2019-04-15 10:55:07 -05:00
|
|
|
"github.com/aws/aws-sdk-go/service/resourcegroupstaggingapi/resourcegroupstaggingapiiface"
|
2020-04-25 15:48:20 -05:00
|
|
|
"github.com/grafana/grafana/pkg/components/simplejson"
|
2019-05-13 01:45:54 -05:00
|
|
|
"github.com/grafana/grafana/pkg/infra/log"
|
2017-04-03 07:50:40 -05:00
|
|
|
"github.com/grafana/grafana/pkg/models"
|
2020-07-14 01:23:23 -05:00
|
|
|
"github.com/grafana/grafana/pkg/setting"
|
2017-04-03 07:50:40 -05:00
|
|
|
"github.com/grafana/grafana/pkg/tsdb"
|
|
|
|
)
|
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
// datasourceInfo holds the per-request connection and authentication
// settings read from a CloudWatch data source (see getDSInfo).
type datasourceInfo struct {
	// Profile is the "profile" JSON setting; getDSInfo falls back to the
	// data source's Database field when the setting is empty.
	Profile string
	// Region is the AWS region used when building the session config.
	Region string
	// AuthType is the "authType" JSON setting.
	AuthType string
	// AssumeRoleArn is the "assumeRoleArn" JSON setting.
	AssumeRoleArn string
	// ExternalID is the "externalId" JSON setting.
	ExternalID string
	// Namespace is not populated by getDSInfo in this file.
	Namespace string

	// AccessKey and SecretKey come from the data source's decrypted values.
	AccessKey string
	SecretKey string
}
|
|
|
|
|
2020-05-13 14:17:06 -05:00
|
|
|
const (
	// cloudWatchTSFormat is a Go time layout with millisecond precision.
	cloudWatchTSFormat = "2006-01-02 15:04:05.000"

	// defaultRegion is the placeholder region name that is replaced by the
	// data source's "defaultRegion" setting.
	defaultRegion = "default"
)

// Constants also defined in datasource/cloudwatch/datasource.ts
const (
	logIdentifierInternal       = "__log__grafana_internal__"
	logStreamIdentifierInternal = "__logstream__grafana_internal__"
)
|
2020-05-13 08:34:23 -05:00
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
var plog = log.New("tsdb.cloudwatch")
|
|
|
|
var aliasFormat = regexp.MustCompile(`\{\{\s*(.+?)\s*\}\}`)
|
2020-04-25 15:48:20 -05:00
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
func init() {
|
2020-07-23 11:52:22 -05:00
|
|
|
tsdb.RegisterTsdbQueryEndpoint("cloudwatch", func(ds *models.DataSource) (tsdb.TsdbQueryEndpoint, error) {
|
|
|
|
return newExecutor(), nil
|
|
|
|
})
|
2020-07-14 01:23:23 -05:00
|
|
|
}
|
2020-04-25 15:48:20 -05:00
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
func newExecutor() *cloudWatchExecutor {
|
|
|
|
return &cloudWatchExecutor{
|
|
|
|
logsClientsByRegion: map[string]cloudwatchlogsiface.CloudWatchLogsAPI{},
|
2020-07-14 01:23:23 -05:00
|
|
|
}
|
|
|
|
}
|
2020-04-25 15:48:20 -05:00
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
// cloudWatchExecutor executes CloudWatch requests.
|
|
|
|
type cloudWatchExecutor struct {
|
|
|
|
*models.DataSource
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
ec2Client ec2iface.EC2API
|
|
|
|
rgtaClient resourcegroupstaggingapiiface.ResourceGroupsTaggingAPIAPI
|
|
|
|
logsClientsByRegion map[string]cloudwatchlogsiface.CloudWatchLogsAPI
|
|
|
|
mtx sync.Mutex
|
2020-04-25 15:48:20 -05:00
|
|
|
}
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
func (e *cloudWatchExecutor) newSession(region string) (*session.Session, error) {
|
|
|
|
dsInfo := e.getDSInfo(region)
|
|
|
|
creds, err := getCredentials(dsInfo)
|
2020-07-14 01:23:23 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2020-04-25 15:48:20 -05:00
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
cfg := &aws.Config{
|
|
|
|
Region: aws.String(dsInfo.Region),
|
|
|
|
Credentials: creds,
|
|
|
|
}
|
|
|
|
return newSession(cfg)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (e *cloudWatchExecutor) getCWClient(region string) (cloudwatchiface.CloudWatchAPI, error) {
|
|
|
|
sess, err := e.newSession(region)
|
2020-04-25 15:48:20 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2020-07-23 11:52:22 -05:00
|
|
|
return newCWClient(sess), nil
|
2017-04-03 07:50:40 -05:00
|
|
|
}
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
func (e *cloudWatchExecutor) getCWLogsClient(region string) (cloudwatchlogsiface.CloudWatchLogsAPI, error) {
|
|
|
|
e.mtx.Lock()
|
|
|
|
defer e.mtx.Unlock()
|
2017-04-03 07:50:40 -05:00
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
if logsClient, ok := e.logsClientsByRegion[region]; ok {
|
|
|
|
return logsClient, nil
|
|
|
|
}
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
sess, err := e.newSession(region)
|
2020-07-14 01:23:23 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
logsClient := newCWLogsClient(sess)
|
|
|
|
e.logsClientsByRegion[region] = logsClient
|
|
|
|
|
|
|
|
return logsClient, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (e *cloudWatchExecutor) getEC2Client(region string) (ec2iface.EC2API, error) {
|
|
|
|
if e.ec2Client != nil {
|
|
|
|
return e.ec2Client, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
sess, err := e.newSession(region)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
e.ec2Client = newEC2Client(sess)
|
2020-07-14 01:23:23 -05:00
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
return e.ec2Client, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (e *cloudWatchExecutor) getRGTAClient(region string) (resourcegroupstaggingapiiface.ResourceGroupsTaggingAPIAPI,
|
|
|
|
error) {
|
|
|
|
if e.rgtaClient != nil {
|
|
|
|
return e.rgtaClient, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
sess, err := e.newSession(region)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
e.rgtaClient = newRGTAClient(sess)
|
|
|
|
|
|
|
|
return e.rgtaClient, nil
|
2017-04-03 07:50:40 -05:00
|
|
|
}
|
|
|
|
|
2020-07-23 01:17:20 -05:00
|
|
|
func (e *cloudWatchExecutor) alertQuery(ctx context.Context, logsClient cloudwatchlogsiface.CloudWatchLogsAPI,
|
|
|
|
queryContext *tsdb.TsdbQuery) (*cloudwatchlogs.GetQueryResultsOutput, error) {
|
2020-04-25 15:48:20 -05:00
|
|
|
const maxAttempts = 8
|
|
|
|
const pollPeriod = 1000 * time.Millisecond
|
|
|
|
|
|
|
|
queryParams := queryContext.Queries[0].Model
|
|
|
|
startQueryOutput, err := e.executeStartQuery(ctx, logsClient, queryParams, queryContext.TimeRange)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
requestParams := simplejson.NewFromAny(map[string]interface{}{
|
|
|
|
"region": queryParams.Get("region").MustString(""),
|
|
|
|
"queryId": *startQueryOutput.QueryId,
|
|
|
|
})
|
|
|
|
|
|
|
|
ticker := time.NewTicker(pollPeriod)
|
|
|
|
defer ticker.Stop()
|
|
|
|
|
|
|
|
attemptCount := 1
|
|
|
|
for range ticker.C {
|
2020-06-29 07:08:32 -05:00
|
|
|
res, err := e.executeGetQueryResults(ctx, logsClient, requestParams)
|
|
|
|
if err != nil {
|
2020-04-25 15:48:20 -05:00
|
|
|
return nil, err
|
2020-06-29 07:08:32 -05:00
|
|
|
}
|
|
|
|
if isTerminated(*res.Status) {
|
2020-04-25 15:48:20 -05:00
|
|
|
return res, err
|
2020-06-29 07:08:32 -05:00
|
|
|
}
|
|
|
|
if attemptCount >= maxAttempts {
|
2020-04-25 15:48:20 -05:00
|
|
|
return res, fmt.Errorf("fetching of query results exceeded max number of attempts")
|
|
|
|
}
|
|
|
|
|
|
|
|
attemptCount++
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
// Query executes a CloudWatch query.
|
|
|
|
func (e *cloudWatchExecutor) Query(ctx context.Context, dsInfo *models.DataSource, queryContext *tsdb.TsdbQuery) (*tsdb.Response, error) {
|
2017-09-22 04:07:10 -05:00
|
|
|
e.DataSource = dsInfo
|
2020-04-25 15:48:20 -05:00
|
|
|
|
|
|
|
/*
|
|
|
|
Unlike many other data sources, with Cloudwatch Logs query requests don't receive the results as the response to the query, but rather
|
|
|
|
an ID is first returned. Following this, a client is expected to send requests along with the ID until the status of the query is complete,
|
|
|
|
receiving (possibly partial) results each time. For queries made via dashboards and Explore, the logic of making these repeated queries is handled on
|
|
|
|
the frontend, but because alerts are executed on the backend the logic needs to be reimplemented here.
|
|
|
|
*/
|
|
|
|
queryParams := queryContext.Queries[0].Model
|
|
|
|
_, fromAlert := queryContext.Headers["FromAlert"]
|
2020-05-21 09:18:09 -05:00
|
|
|
isLogAlertQuery := fromAlert && queryParams.Get("queryMode").MustString("") == "Logs"
|
2020-04-25 15:48:20 -05:00
|
|
|
|
|
|
|
if isLogAlertQuery {
|
|
|
|
return e.executeLogAlertQuery(ctx, queryContext)
|
|
|
|
}
|
|
|
|
|
|
|
|
queryType := queryParams.Get("type").MustString("")
|
2017-09-22 04:07:10 -05:00
|
|
|
|
2020-05-18 05:25:58 -05:00
|
|
|
var err error
|
|
|
|
var result *tsdb.Response
|
2017-09-09 14:24:39 -05:00
|
|
|
switch queryType {
|
|
|
|
case "metricFindQuery":
|
2017-09-22 04:07:10 -05:00
|
|
|
result, err = e.executeMetricFindQuery(ctx, queryContext)
|
2017-09-25 04:16:40 -05:00
|
|
|
case "annotationQuery":
|
|
|
|
result, err = e.executeAnnotationQuery(ctx, queryContext)
|
2020-04-25 15:48:20 -05:00
|
|
|
case "logAction":
|
|
|
|
result, err = e.executeLogActions(ctx, queryContext)
|
2017-09-23 22:30:34 -05:00
|
|
|
case "timeSeriesQuery":
|
|
|
|
fallthrough
|
2017-09-22 04:07:10 -05:00
|
|
|
default:
|
2017-09-23 22:30:34 -05:00
|
|
|
result, err = e.executeTimeSeriesQuery(ctx, queryContext)
|
2017-09-09 14:24:39 -05:00
|
|
|
}
|
2017-09-22 04:07:10 -05:00
|
|
|
|
|
|
|
return result, err
|
2017-09-09 14:24:39 -05:00
|
|
|
}
|
2020-04-25 15:48:20 -05:00
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
func (e *cloudWatchExecutor) executeLogAlertQuery(ctx context.Context, queryContext *tsdb.TsdbQuery) (*tsdb.Response, error) {
|
2020-04-25 15:48:20 -05:00
|
|
|
queryParams := queryContext.Queries[0].Model
|
|
|
|
queryParams.Set("subtype", "StartQuery")
|
|
|
|
queryParams.Set("queryString", queryParams.Get("expression").MustString(""))
|
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
region := queryParams.Get("region").MustString(defaultRegion)
|
|
|
|
if region == defaultRegion {
|
2020-04-25 15:48:20 -05:00
|
|
|
region = e.DataSource.JsonData.Get("defaultRegion").MustString()
|
|
|
|
queryParams.Set("region", region)
|
|
|
|
}
|
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
logsClient, err := e.getCWLogsClient(region)
|
2020-04-25 15:48:20 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
result, err := e.executeStartQuery(ctx, logsClient, queryParams, queryContext.TimeRange)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
queryParams.Set("queryId", *result.QueryId)
|
|
|
|
|
2020-05-18 05:25:58 -05:00
|
|
|
// Get query results
|
2020-04-25 15:48:20 -05:00
|
|
|
getQueryResultsOutput, err := e.alertQuery(ctx, logsClient, queryContext)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-05-21 09:18:09 -05:00
|
|
|
dataframe, err := logsResultsToDataframes(getQueryResultsOutput)
|
2020-04-25 15:48:20 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-05-21 09:18:09 -05:00
|
|
|
statsGroups := queryParams.Get("statsGroups").MustStringArray()
|
|
|
|
if len(statsGroups) > 0 && len(dataframe.Fields) > 0 {
|
|
|
|
groupedFrames, err := groupResults(dataframe, statsGroups)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
response := &tsdb.Response{
|
|
|
|
Results: make(map[string]*tsdb.QueryResult),
|
|
|
|
}
|
|
|
|
|
|
|
|
response.Results["A"] = &tsdb.QueryResult{
|
|
|
|
RefId: "A",
|
2020-06-09 06:13:06 -05:00
|
|
|
Dataframes: tsdb.NewDecodedDataFrames(groupedFrames),
|
2020-05-21 09:18:09 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
return response, nil
|
|
|
|
}
|
|
|
|
|
2020-04-25 15:48:20 -05:00
|
|
|
response := &tsdb.Response{
|
2020-05-18 05:25:58 -05:00
|
|
|
Results: map[string]*tsdb.QueryResult{
|
|
|
|
"A": {
|
|
|
|
RefId: "A",
|
2020-06-09 06:13:06 -05:00
|
|
|
Dataframes: tsdb.NewDecodedDataFrames(data.Frames{dataframe}),
|
2020-05-18 05:25:58 -05:00
|
|
|
},
|
|
|
|
},
|
2020-04-25 15:48:20 -05:00
|
|
|
}
|
|
|
|
return response, nil
|
|
|
|
}
|
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
func (e *cloudWatchExecutor) getDSInfo(region string) *datasourceInfo {
|
|
|
|
if region == defaultRegion {
|
|
|
|
region = e.DataSource.JsonData.Get("defaultRegion").MustString()
|
|
|
|
}
|
|
|
|
|
|
|
|
authType := e.DataSource.JsonData.Get("authType").MustString()
|
|
|
|
assumeRoleArn := e.DataSource.JsonData.Get("assumeRoleArn").MustString()
|
|
|
|
externalID := e.DataSource.JsonData.Get("externalId").MustString()
|
|
|
|
decrypted := e.DataSource.DecryptedValues()
|
|
|
|
accessKey := decrypted["accessKey"]
|
|
|
|
secretKey := decrypted["secretKey"]
|
|
|
|
|
2020-09-24 11:21:17 -05:00
|
|
|
profile := e.DataSource.JsonData.Get("profile").MustString()
|
|
|
|
if profile == "" {
|
|
|
|
profile = e.DataSource.Database // legacy support
|
|
|
|
}
|
|
|
|
|
2020-07-14 01:23:23 -05:00
|
|
|
return &datasourceInfo{
|
|
|
|
Region: region,
|
2020-09-24 11:21:17 -05:00
|
|
|
Profile: profile,
|
2020-07-14 01:23:23 -05:00
|
|
|
AuthType: authType,
|
|
|
|
AssumeRoleArn: assumeRoleArn,
|
|
|
|
ExternalID: externalID,
|
|
|
|
AccessKey: accessKey,
|
|
|
|
SecretKey: secretKey,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
// isTerminated reports whether queryStatus is one of the statuses after
// which polling stops: "Complete", "Cancelled", "Failed" or "Timeout".
// The comparison is case-sensitive.
func isTerminated(queryStatus string) bool {
	switch queryStatus {
	case "Complete", "Cancelled", "Failed", "Timeout":
		return true
	default:
		return false
	}
}
|
2020-07-14 01:23:23 -05:00
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
// CloudWatch client factory.
|
|
|
|
//
|
|
|
|
// Stubbable by tests.
|
|
|
|
var newCWClient = func(sess *session.Session) cloudwatchiface.CloudWatchAPI {
|
|
|
|
client := cloudwatch.New(sess)
|
|
|
|
client.Handlers.Send.PushFront(func(r *request.Request) {
|
|
|
|
r.HTTPRequest.Header.Set("User-Agent", fmt.Sprintf("Grafana/%s", setting.BuildVersion))
|
|
|
|
})
|
2020-07-14 01:23:23 -05:00
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
return client
|
|
|
|
}
|
2020-07-14 01:23:23 -05:00
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
// CloudWatch logs client factory.
|
|
|
|
//
|
|
|
|
// Stubbable by tests.
|
|
|
|
var newCWLogsClient = func(sess *session.Session) cloudwatchlogsiface.CloudWatchLogsAPI {
|
|
|
|
client := cloudwatchlogs.New(sess)
|
2020-07-14 01:23:23 -05:00
|
|
|
client.Handlers.Send.PushFront(func(r *request.Request) {
|
|
|
|
r.HTTPRequest.Header.Set("User-Agent", fmt.Sprintf("Grafana/%s", setting.BuildVersion))
|
|
|
|
})
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
return client
|
2020-07-14 01:23:23 -05:00
|
|
|
}
|
|
|
|
|
2020-07-23 11:52:22 -05:00
|
|
|
// EC2 client factory.
|
|
|
|
//
|
|
|
|
// Stubbable by tests.
|
|
|
|
var newEC2Client = func(provider client.ConfigProvider) ec2iface.EC2API {
|
|
|
|
return ec2.New(provider)
|
|
|
|
}
|
|
|
|
|
|
|
|
// RGTA client factory.
|
|
|
|
//
|
|
|
|
// Stubbable by tests.
|
|
|
|
var newRGTAClient = func(provider client.ConfigProvider) resourcegroupstaggingapiiface.ResourceGroupsTaggingAPIAPI {
|
|
|
|
return resourcegroupstaggingapi.New(provider)
|
2020-04-25 15:48:20 -05:00
|
|
|
}
|