metric_find_query.go 50 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800
  1. package cloudwatch
  2. import (
  3. "context"
  4. "errors"
  5. "fmt"
  6. "reflect"
  7. "sort"
  8. "strings"
  9. "sync"
  10. "time"
  11. "github.com/aws/aws-sdk-go/aws"
  12. "github.com/aws/aws-sdk-go/aws/awsutil"
  13. "github.com/aws/aws-sdk-go/aws/session"
  14. "github.com/aws/aws-sdk-go/service/cloudwatch"
  15. "github.com/aws/aws-sdk-go/service/ec2"
  16. "github.com/aws/aws-sdk-go/service/resourcegroupstaggingapi"
  17. "github.com/grafana/grafana/pkg/components/simplejson"
  18. "github.com/grafana/grafana/pkg/infra/metrics"
  19. "github.com/grafana/grafana/pkg/tsdb"
  20. )
  21. var metricsMap map[string][]string
  22. var dimensionsMap map[string][]string
  23. type suggestData struct {
  24. Text string
  25. Value string
  26. }
  27. type CustomMetricsCache struct {
  28. Expire time.Time
  29. Cache []string
  30. }
  31. var customMetricsMetricsMap map[string]map[string]map[string]*CustomMetricsCache
  32. var customMetricsDimensionsMap map[string]map[string]map[string]*CustomMetricsCache
  33. var regionCache sync.Map
  34. func init() {
  35. metricsMap = map[string][]string{
  36. "AWS/AmazonMQ": {"ConsumerCount", "CpuCreditBalance", "CpuUtilization", "CurrentConnectionsCount", "DequeueCount", "DispatchCount", "EnqueueCount", "EnqueueTime", "ExpiredCount", "HeapUsage", "InflightCount", "JournalFilesForFastRecovery", "JournalFilesForFullRecovery", "MemoryUsage", "NetworkIn", "NetworkOut", "OpenTransactionsCount", "ProducerCount", "QueueSize", "StorePercentUsage", "TotalConsumerCount", "TotalMessageCount", "TotalProducerCount"},
  37. "AWS/ApiGateway": {"4XXError", "5XXError", "CacheHitCount", "CacheMissCount", "Count", "IntegrationLatency", "Latency"},
  38. "AWS/AppStream": {"ActualCapacity", "AvailableCapacity", "CapacityUtilization", "DesiredCapacity", "InUseCapacity", "InsufficientCapacityError", "PendingCapacity", "RunningCapacity"},
  39. "AWS/AppSync": {"4XXError", "5XXError", "Latency"},
  40. "AWS/ApplicationELB": {"ActiveConnectionCount", "ClientTLSNegotiationErrorCount", "ConsumedLCUs", "ELBAuthError", "ELBAuthFailure", "ELBAuthLatency", "ELBAuthRefreshTokenSuccess", "ELBAuthSuccess", "ELBAuthUserClaimsSizeExceeded", "HTTPCode_ELB_3XX_Count", "HTTPCode_ELB_4XX_Count", "HTTPCode_ELB_5XX_Count", "HTTPCode_Target_2XX_Count", "HTTPCode_Target_3XX_Count", "HTTPCode_Target_4XX_Count", "HTTPCode_Target_5XX_Count", "HTTP_Fixed_Response_Count", "HTTP_Redirect_Count", "HTTP_Redirect_Url_Limit_Exceeded_Count", "HealthyHostCount", "IPv6ProcessedBytes", "IPv6RequestCount", "LambdaInternalError", "LambdaTargetProcessedBytes", "LambdaUserError", "NewConnectionCount", "NonStickyRequestCount", "ProcessedBytes", "RejectedConnectionCount", "RequestCount", "RequestCountPerTarget", "RuleEvaluations", "StandardProcessedBytes", "TargetConnectionErrorCount", "TargetResponseTime", "TargetTLSNegotiationErrorCount", "UnHealthyHostCount"},
  41. "AWS/AutoScaling": {"GroupDesiredCapacity", "GroupInServiceInstances", "GroupMaxSize", "GroupMinSize", "GroupPendingInstances", "GroupStandbyInstances", "GroupTerminatingInstances", "GroupTotalInstances"},
  42. "AWS/Billing": {"EstimatedCharges"},
  43. "AWS/CloudFront": {"4xxErrorRate", "5xxErrorRate", "BytesDownloaded", "BytesUploaded", "Requests", "TotalErrorRate"},
  44. "AWS/CloudHSM": {"HsmKeysSessionOccupied", "HsmKeysTokenOccupied", "HsmSessionCount", "HsmSslCtxsOccupied", "HsmTemperature", "HsmUnhealthy", "HsmUsersAvailable", "HsmUsersMax", "InterfaceEth2OctetsInput", "InterfaceEth2OctetsOutput"},
  45. "AWS/CloudSearch": {"IndexUtilization", "Partitions", "SearchableDocuments", "SuccessfulRequests"},
  46. "AWS/CodeBuild": {"BuildDuration", "Builds", "DownloadSourceDuration", "Duration", "FailedBuilds", "FinalizingDuration", "InstallDuration", "PostBuildDuration", "PreBuildDuration", "ProvisioningDuration", "QueuedDuration", "SubmittedDuration", "SucceededBuilds", "UploadArtifactsDuration"},
  47. "AWS/Connect": {"CallBackNotDialableNumber", "CallRecordingUploadError", "CallsBreachingConcurrencyQuota", "CallsPerInterval", "ConcurrentCalls", "ConcurrentCallsPercentage", "ContactFlowErrors", "ContactFlowFatalErrors", "LongestQueueWaitTime", "MisconfiguredPhoneNumbers", "MissedCalls", "PublicSigningKeyUsage", "QueueCapacityExceededError", "QueueSize", "ThrottledCalls", "ToInstancePacketLossRate"},
  48. "AWS/DDoSProtection": {"AllowedRequests", "BlockedRequests", "CountedRequests", "DDoSAttackBitsPerSecond", "DDoSAttackPacketsPerSecond", "DDoSAttackRequestsPerSecond", "DDoSDetected", "PassedRequests"},
  49. "AWS/DMS": {"CDCChangesDiskSource", "CDCChangesDiskTarget", "CDCChangesMemorySource", "CDCChangesMemoryTarget", "CDCIncomingChanges", "CDCLatencySource", "CDCLatencyTarget", "CDCThroughputBandwidthTarget", "CDCThroughputRowsSource", "CDCThroughputRowsTarget", "FreeableMemory", "FullLoadThroughputBandwidthSource", "FullLoadThroughputBandwidthTarget", "FullLoadThroughputRowsSource", "FullLoadThroughputRowsTarget", "NetworkReceiveThroughput", "NetworkTransmitThroughput", "ReadIOPS", "ReadLatency", "ReadThroughput", "SwapUsage", "WriteIOPS", "WriteLatency", "WriteThroughput"},
  50. "AWS/DX": {"ConnectionBpsEgress", "ConnectionBpsIngress", "ConnectionCRCErrorCount", "ConnectionLightLevelRx", "ConnectionLightLevelTx", "ConnectionPpsEgress", "ConnectionPpsIngress", "ConnectionState"},
  51. "AWS/DynamoDB": {"ConditionalCheckFailedRequests", "ConsumedReadCapacityUnits", "ConsumedWriteCapacityUnits", "OnlineIndexConsumedWriteCapacity", "OnlineIndexPercentageProgress", "OnlineIndexThrottleEvents", "PendingReplicationCount", "ProvisionedReadCapacityUnits", "ProvisionedWriteCapacityUnits", "ReadThrottleEvents", "ReplicationLatency", "ReturnedBytes", "ReturnedItemCount", "ReturnedRecordsCount", "SuccessfulRequestLatency", "SystemErrors", "ThrottledRequests", "TimeToLiveDeletedItemCount", "UserErrors", "WriteThrottleEvents"},
  52. "AWS/EBS": {"BurstBalance", "VolumeConsumedReadWriteOps", "VolumeIdleTime", "VolumeQueueLength", "VolumeReadBytes", "VolumeReadOps", "VolumeThroughputPercentage", "VolumeTotalReadTime", "VolumeTotalWriteTime", "VolumeWriteBytes", "VolumeWriteOps"},
  53. "AWS/EC2": {"CPUCreditBalance", "CPUCreditUsage", "CPUSurplusCreditBalance", "CPUSurplusCreditsCharged", "CPUUtilization", "DiskReadBytes", "DiskReadOps", "DiskWriteBytes", "DiskWriteOps", "EBSByteBalance%", "EBSIOBalance%", "EBSReadBytes", "EBSReadOps", "EBSWriteBytes", "EBSWriteOps", "NetworkIn", "NetworkOut", "NetworkPacketsIn", "NetworkPacketsOut", "StatusCheckFailed", "StatusCheckFailed_Instance", "StatusCheckFailed_System"},
  54. "AWS/EC2/API": {"ClientErrors", "RequestLimitExceeded", "ServerErrors", "SuccessfulCalls"},
  55. "AWS/EC2Spot": {"AvailableInstancePoolsCount", "BidsSubmittedForCapacity", "EligibleInstancePoolCount", "FulfilledCapacity", "MaxPercentCapacityAllocation", "PendingCapacity", "PercentCapacityAllocation", "TargetCapacity", "TerminatingCapacity"},
  56. "AWS/ECS": {"CPUReservation", "CPUUtilization", "GPUReservation", "MemoryReservation", "MemoryUtilization"},
  57. "AWS/EFS": {"BurstCreditBalance", "ClientConnections", "DataReadIOBytes", "DataWriteIOBytes", "MetadataIOBytes", "PercentIOLimit", "PermittedThroughput", "TotalIOBytes"},
  58. "AWS/ELB": {"BackendConnectionErrors", "EstimatedALBActiveConnectionCount", "EstimatedALBConsumedLCUs", "EstimatedALBNewConnectionCount", "EstimatedProcessedBytes", "HTTPCode_Backend_2XX", "HTTPCode_Backend_3XX", "HTTPCode_Backend_4XX", "HTTPCode_Backend_5XX", "HTTPCode_ELB_4XX", "HTTPCode_ELB_5XX", "HealthyHostCount", "Latency", "RequestCount", "SpilloverCount", "SurgeQueueLength", "UnHealthyHostCount"},
  59. "AWS/ES": {"AutomatedSnapshotFailure", "CPUCreditBalance", "CPUUtilization", "ClusterIndexWritesBlocked", "ClusterStatus.green", "ClusterStatus.red", "ClusterStatus.yellow", "ClusterUsedSpace", "DeletedDocuments", "DiskQueueDepth", "ElasticsearchRequests", "FreeStorageSpace", "IndexingLatency", "IndexingRate", "InvalidHostHeaderRequests", "JVMGCOldCollectionCount", "JVMGCOldCollectionTime", "JVMGCYoungCollectionCount", "JVMGCYoungCollectionTime", "JVMMemoryPressure", "KMSKeyError", "KMSKeyInaccessible", "KibanaHealthyNodes", "MasterCPUCreditBalance", "MasterCPUUtilization", "MasterFreeStorageSpace", "MasterJVMMemoryPressure", "MasterReachableFromNode", "Nodes", "ReadIOPS", "ReadLatency", "ReadThroughput", "RequestCount", "SearchLatency", "SearchRate", "SearchableDocuments", "SysMemoryUtilization", "ThreadpoolBulkQueue", "ThreadpoolBulkRejected", "ThreadpoolBulkThreads", "ThreadpoolForce_mergeQueue", "ThreadpoolForce_mergeRejected", "ThreadpoolForce_mergeThreads", "ThreadpoolIndexQueue", "ThreadpoolIndexRejected", "ThreadpoolIndexThreads", "ThreadpoolSearchQueue", "ThreadpoolSearchRejected", "ThreadpoolSearchThreads", "WriteIOPS", "WriteLatency", "WriteThroughput"},
  60. "AWS/ElastiCache": {"ActiveDefragHits", "BytesReadIntoMemcached", "BytesUsedForCache", "BytesUsedForCacheItems", "BytesUsedForHash", "BytesWrittenOutFromMemcached", "CPUUtilization", "CacheHits", "CacheMisses", "CasBadval", "CasHits", "CasMisses", "CmdConfigGet", "CmdConfigSet", "CmdFlush", "CmdGet", "CmdSet", "CmdTouch", "CurrConfig", "CurrConnections", "CurrItems", "DecrHits", "DecrMisses", "DeleteHits", "DeleteMisses", "EngineCPUUtilization", "EvictedUnfetched", "Evictions", "ExpiredUnfetched", "FreeableMemory", "GetHits", "GetMisses", "GetTypeCmds", "HashBasedCmds", "HyperLogLogBasedCmds", "IncrHits", "IncrMisses", "KeyBasedCmds", "ListBasedCmds", "NetworkBytesIn", "NetworkBytesOut", "NewConnections", "NewItems", "Reclaimed", "ReplicationBytes", "ReplicationLag", "SaveInProgress", "SetBasedCmds", "SetTypeCmds", "SlabsMoved", "SortedSetBasedCmds", "StringBasedCmds", "SwapUsage", "TouchHits", "TouchMisses", "UnusedMemory"},
  61. "AWS/ElasticBeanstalk": {"ApplicationLatencyP10", "ApplicationLatencyP50", "ApplicationLatencyP75", "ApplicationLatencyP85", "ApplicationLatencyP90", "ApplicationLatencyP95", "ApplicationLatencyP99", "ApplicationLatencyP99.9", "ApplicationRequests2xx", "ApplicationRequests3xx", "ApplicationRequests4xx", "ApplicationRequests5xx", "ApplicationRequestsTotal", "CPUIdle", "CPUIowait", "CPUIrq", "CPUNice", "CPUSoftirq", "CPUSystem", "CPUUser", "EnvironmentHealth", "InstanceHealth", "InstancesDegraded", "InstancesInfo", "InstancesNoData", "InstancesOk", "InstancesPending", "InstancesSevere", "InstancesUnknown", "InstancesWarning", "LoadAverage1min", "LoadAverage5min", "RootFilesystemUtil"},
  62. "AWS/ElasticMapReduce": {"AppsCompleted", "AppsFailed", "AppsKilled", "AppsPending", "AppsRunning", "AppsSubmitted", "BackupFailed", "CapacityRemainingGB", "Cluster Status", "ContainerAllocated", "ContainerPending", "ContainerPendingRatio", "ContainerReserved", "CoreNodesPending", "CoreNodesRunning", "CorruptBlocks", "DfsPendingReplicationBlocks", "HBase", "HDFSBytesRead", "HDFSBytesWritten", "HDFSUtilization", "HbaseBackupFailed", "IO", "IsIdle", "JobsFailed", "JobsRunning", "LiveDataNodes", "LiveTaskTrackers", "MRActiveNodes", "MRDecommissionedNodes", "MRLostNodes", "MRRebootedNodes", "MRTotalNodes", "MRUnhealthyNodes", "Map/Reduce", "MapSlotsOpen", "MapTasksRemaining", "MapTasksRunning", "MemoryAllocatedMB", "MemoryAvailableMB", "MemoryReservedMB", "MemoryTotalMB", "MissingBlocks", "MostRecentBackupDuration", "Node Status", "PendingDeletionBlocks", "ReduceSlotsOpen", "ReduceTasksRemaining", "ReduceTasksRunning", "RemainingMapTasksPerSlot", "S3BytesRead", "S3BytesWritten", "TaskNodesPending", "TaskNodesRunning", "TimeSinceLastSuccessfulBackup", "TotalLoad", "UnderReplicatedBlocks", "YARNMemoryAvailablePercentage"},
  63. "AWS/ElasticTranscoder": {"Billed Audio Output", "Billed HD Output", "Billed SD Output", "Errors", "Jobs Completed", "Jobs Errored", "Outputs per Job", "Standby Time", "Throttles"},
  64. "AWS/Events": {"DeadLetterInvocations", "FailedInvocations", "Invocations", "MatchedEvents", "ThrottledRules", "TriggeredRules"},
  65. "AWS/FSx": {"DataReadBytes", "DataReadOperations", "DataWriteBytes", "DataWriteOperations", "FreeDataStorageCapacity", "MetadataOperations"},
  66. "AWS/Firehose": {"BackupToS3.Bytes", "BackupToS3.DataFreshness", "BackupToS3.Records", "BackupToS3.Success", "DataReadFromKinesisStream.Bytes", "DataReadFromKinesisStream.Records", "DeliveryToElasticsearch.Bytes", "DeliveryToElasticsearch.Records", "DeliveryToElasticsearch.Success", "DeliveryToRedshift.Bytes", "DeliveryToRedshift.Records", "DeliveryToRedshift.Success", "DeliveryToS3.Bytes", "DeliveryToS3.DataFreshness", "DeliveryToS3.Records", "DeliveryToS3.Success", "DeliveryToSplunk.Bytes", "DeliveryToSplunk.DataFreshness", "DeliveryToSplunk.Records", "DeliveryToSplunk.Success", "DescribeDeliveryStream.Latency", "DescribeDeliveryStream.Requests", "ExecuteProcessing.Duration", "ExecuteProcessing.Success", "FailedConversion.Bytes", "FailedConversion.Records", "IncomingBytes", "IncomingRecords", "KinesisMillisBehindLatest", "ListDeliveryStreams.Latency", "ListDeliveryStreams.Requests", "PutRecord.Bytes", "PutRecord.Latency", "PutRecord.Requests", "PutRecordBatch.Bytes", "PutRecordBatch.Latency", "PutRecordBatch.Records", "PutRecordBatch.Requests", "SucceedConversion.Bytes", "SucceedConversion.Records", "SucceedProcessing.Bytes", "SucceedProcessing.Records", "ThrottledDescribeStream", "ThrottledGetRecords", "ThrottledGetShardIterator", "UpdateDeliveryStream.Latency", "UpdateDeliveryStream.Requests"},
  67. "AWS/Glue": {"glue.driver.BlockManager.disk.diskSpaceUsed_MB", "glue.driver.ExecutorAllocationManager.executors.numberAllExecutors", "glue.driver.ExecutorAllocationManager.executors.numberMaxNeededExecutors", "glue.driver.aggregate.bytesRead", "glue.driver.aggregate.elapsedTime", "glue.driver.aggregate.numCompletedStages", "glue.driver.aggregate.numCompletedTasks", "glue.driver.aggregate.numFailedTasks", "glue.driver.aggregate.numKilledTasks", "glue.driver.aggregate.recordsRead", "glue.driver.aggregate.shuffleBytesWritten", "glue.driver.aggregate.shuffleLocalBytesRead", "glue.driver.jvm.heap.usage glue.executorId.jvm.heap.usage glue.ALL.jvm.heap.usage", "glue.driver.jvm.heap.used glue.executorId.jvm.heap.used glue.ALL.jvm.heap.used", "glue.driver.s3.filesystem.read_bytes glue.executorId.s3.filesystem.read_bytes glue.ALL.s3.filesystem.read_bytes", "glue.driver.s3.filesystem.write_bytes glue.executorId.s3.filesystem.write_bytes glue.ALL.s3.filesystem.write_bytes", "glue.driver.system.cpuSystemLoad glue.executorId.system.cpuSystemLoad glue.ALL.system.cpuSystemLoad"},
  68. "AWS/Inspector": {"TotalAssessmentRunFindings", "TotalAssessmentRuns", "TotalHealthyAgents", "TotalMatchingAgents"},
  69. "AWS/IoT": {"Connect.Success", "GetThingShadow.Accepted", "Ping.Success", "PublishIn.Success", "PublishOut.Success", "Subscribe.Success"},
  70. "AWS/KMS": {"SecondsUntilKeyMaterialExpiration"},
  71. "AWS/Kinesis": {"GetRecords.Bytes", "GetRecords.IteratorAge", "GetRecords.IteratorAgeMilliseconds", "GetRecords.Latency", "GetRecords.Records", "GetRecords.Success", "IncomingBytes", "IncomingRecords", "IteratorAgeMilliseconds", "OutgoingBytes", "OutgoingRecords", "PutRecord.Bytes", "PutRecord.Latency", "PutRecord.Success", "PutRecords.Bytes", "PutRecords.Latency", "PutRecords.Records", "PutRecords.Success", "ReadProvisionedThroughputExceeded", "SubscribeToShard.RateExceeded", "SubscribeToShard.Success", "SubscribeToShardEvent.Bytes", "SubscribeToShardEvent.MillisBehindLatest", "SubscribeToShardEvent.Records", "SubscribeToShardEvent.Success", "WriteProvisionedThroughputExceeded"},
  72. "AWS/KinesisAnalytics": {"Bytes", "InputProcessing.DroppedRecords", "InputProcessing.Duration", "InputProcessing.OkBytes", "InputProcessing.OkRecords", "InputProcessing.ProcessingFailedRecords", "InputProcessing.Success", "KPUs", "LambdaDelivery.DeliveryFailedRecords", "LambdaDelivery.Duration", "LambdaDelivery.OkRecords", "MillisBehindLatest", "Records", "Success"},
  73. "AWS/KinesisVideo": {"GetHLSMasterPlaylist.Latency", "GetHLSMasterPlaylist.Requests", "GetHLSMasterPlaylist.Success", "GetHLSMediaPlaylist.Latency", "GetHLSMediaPlaylist.Requests", "GetHLSMediaPlaylist.Success", "GetHLSStreamingSessionURL.Latency", "GetHLSStreamingSessionURL.Requests", "GetHLSStreamingSessionURL.Success", "GetMP4InitFragment.Latency", "GetMP4InitFragment.Requests", "GetMP4InitFragment.Success", "GetMP4MediaFragment.Latency", "GetMP4MediaFragment.OutgoingBytes", "GetMP4MediaFragment.Requests", "GetMP4MediaFragment.Success", "GetMedia.ConnectionErrors", "GetMedia.MillisBehindNow", "GetMedia.OutgoingBytes", "GetMedia.OutgoingFragments", "GetMedia.OutgoingFrames", "GetMedia.Requests", "GetMedia.Success", "GetMediaForFragmentList.OutgoingBytes", "GetMediaForFragmentList.OutgoingFragments", "GetMediaForFragmentList.OutgoingFrames", "GetMediaForFragmentList.Requests", "GetMediaForFragmentList.Success", "GetTSFragment.Latency", "GetTSFragment.OutgoingBytes", "GetTSFragment.Requests", "GetTSFragment.Success", "ListFragments.Latency", "PutMedia.ActiveConnections", "PutMedia.BufferingAckLatency", "PutMedia.ConnectionErrors", "PutMedia.ErrorAckCount", "PutMedia.FragmentIngestionLatency", "PutMedia.FragmentPersistLatency", "PutMedia.IncomingBytes", "PutMedia.IncomingFragments", "PutMedia.IncomingFrames", "PutMedia.Latency", "PutMedia.PersistedAckLatency", "PutMedia.ReceivedAckLatency", "PutMedia.Requests", "PutMedia.Success"},
  74. "AWS/Lambda": {"ConcurrentExecutions", "DeadLetterErrors", "Duration", "Errors", "Invocations", "IteratorAge", "Throttles", "UnreservedConcurrentExecutions"},
  75. "AWS/Lex": {"BotChannelAuthErrors", "BotChannelConfigurationErrors", "BotChannelInboundThrottledEvents", "BotChannelOutboundThrottledEvents", "BotChannelRequestCount", "BotChannelResponseCardErrors", "BotChannelSystemErrors", "MissedUtteranceCount", "RuntimeInvalidLambdaResponses", "RuntimeLambdaErrors", "RuntimePollyErrors", "RuntimeRequestCount", "RuntimeSucessfulRequestLatency", "RuntimeSystemErrors", "RuntimeThrottledEvents", "RuntimeUserErrors"},
  76. "AWS/Logs": {"DeliveryErrors", "DeliveryThrottling", "ForwardedBytes", "ForwardedLogEvents", "IncomingBytes", "IncomingLogEvents"},
  77. "AWS/ML": {"PredictCount", "PredictFailureCount"},
  78. "AWS/MediaConvert": {"AudioOutputSeconds", "Errors", "HDOutputSeconds", "JobsCompletedCount", "JobsErroredCount", "SDOutputSeconds", "StandbyTime", "TranscodingTime", "UHDOutputSeconds"},
  79. "AWS/MediaPackage": {"ActiveInput", "EgressBytes", "EgressRequestCount", "EgressResponseTime", "IngressBytes", "IngressResponseTime"},
  80. "AWS/MediaTailor": {"AdDecisionServer.Ads", "AdDecisionServer.Duration", "AdDecisionServer.Errors", "AdDecisionServer.FillRate", "AdDecisionServer.Timeouts", "AdNotReady", "Avails.Duration", "Avails.FillRate", "Avails.FilledDuration", "GetManifest.Errors", "Origin.Errors", "Origin.Timeouts"},
  81. "AWS/NATGateway": {"ActiveConnectionCount", "BytesInFromDestination", "BytesInFromSource", "BytesOutToDestination", "BytesOutToSource", "ConnectionAttemptCount", "ConnectionEstablishedCount", "ErrorPortAllocation", "IdleTimeoutCount", "PacketsDropCount", "PacketsInFromDestination", "PacketsInFromSource", "PacketsOutToDestination", "PacketsOutToSource"},
  82. "AWS/Neptune": {"CPUUtilization", "ClusterReplicaLag", "ClusterReplicaLagMaximum", "ClusterReplicaLagMinimum", "EngineUptime", "FreeLocalStorage", "FreeableMemory", "GremlinErrors", "GremlinHttp1xx", "GremlinHttp2xx", "GremlinHttp4xx", "GremlinHttp5xx", "GremlinRequests", "GremlinRequestsPerSec", "GremlinWebSocketAvailableConnections", "GremlinWebSocketClientErrors", "GremlinWebSocketServerErrors", "GremlinWebSocketSuccess", "Http100", "Http101", "Http1xx", "Http200", "Http2xx", "Http400", "Http403", "Http405", "Http413", "Http429", "Http4xx", "Http500", "Http501", "Http5xx", "LoaderErrors", "LoaderRequests", "NetworkReceiveThroughput", "NetworkThroughput", "NetworkTransmitThroughput", "SparqlErrors", "SparqlHttp1xx", "SparqlHttp2xx", "SparqlHttp4xx", "SparqlHttp5xx", "SparqlRequests", "SparqlRequestsPerSec", "StatusErrors", "StatusRequests", "VolumeBytesUsed", "VolumeReadIOPs", "VolumeWriteIOPs"},
  83. "AWS/NetworkELB": {"ActiveFlowCount", "ActiveFlowCount_TLS", "ClientTLSNegotiationErrorCount", "ConsumedLCUs", "HealthyHostCount", "NewFlowCount", "NewFlowCount_TLS", "ProcessedBytes", "ProcessedBytes_TLS", "TCP_Client_Reset_Count", "TCP_ELB_Reset_Count", "TCP_Target_Reset_Count", "TargetTLSNegotiationErrorCount", "UnHealthyHostCount"},
  84. "AWS/OpsWorks": {"cpu_idle", "cpu_nice", "cpu_steal", "cpu_system", "cpu_user", "cpu_waitio", "load_1", "load_15", "load_5", "memory_buffers", "memory_cached", "memory_free", "memory_swap", "memory_total", "memory_used", "procs"},
  85. "AWS/Polly": {"2XXCount", "4XXCount", "5XXCount", "RequestCharacters", "ResponseLatency"},
  86. "AWS/RDS": {"ActiveTransactions", "AuroraBinlogReplicaLag", "AuroraReplicaLag", "AuroraReplicaLagMaximum", "AuroraReplicaLagMinimum", "BinLogDiskUsage", "BlockedTransactions", "BufferCacheHitRatio", "BurstBalance", "CPUCreditBalance", "CPUCreditUsage", "CPUUtilization", "CommitLatency", "CommitThroughput", "DDLLatency", "DDLThroughput", "DMLLatency", "DMLThroughput", "DatabaseConnections", "Deadlocks", "DeleteLatency", "DeleteThroughput", "DiskQueueDepth", "EngineUptime", "FailedSQLServerAgentJobsCount", "FailedSqlStatements", "FreeLocalStorage", "FreeStorageSpace", "FreeableMemory", "InsertLatency", "InsertThroughput", "LoginFailures", "MaximumUsedTransactionIDs", "NetworkReceiveThroughput", "NetworkThroughput", "NetworkTransmitThroughput", "OldestReplicationSlotLag", "Queries", "ReadIOPS", "ReadLatency", "ReadThroughput", "ReplicaLag", "ReplicationSlotDiskUsage", "ResultSetCacheHitRatio", "SelectLatency", "SelectThroughput", "ServerlessDatabaseCapacity", "SwapUsage", "TotalConnections", "TransactionLogsDiskUsage", "TransactionLogsGeneration", "UpdateLatency", "UpdateThroughput", "VolumeBytesUsed", "VolumeReadIOPS", "VolumeWriteIOPS", "WriteIOPS", "WriteLatency", "WriteThroughput"},
  87. "AWS/Redshift": {"CPUUtilization", "DatabaseConnections", "HealthStatus", "MaintenanceMode", "NetworkReceiveThroughput", "NetworkTransmitThroughput", "PercentageDiskSpaceUsed", "QueriesCompletedPerSecond", "QueryDuration", "QueryRuntimeBreakdown", "ReadIOPS", "ReadLatency", "ReadThroughput", "TotalTableCount", "WLMQueriesCompletedPerSecond", "WLMQueryDuration", "WLMQueueLength", "WriteIOPS", "WriteLatency", "WriteThroughput"},
  88. "AWS/Route53": {"ChildHealthCheckHealthyCount", "ConnectionTime", "HealthCheckPercentageHealthy", "HealthCheckStatus", "SSLHandshakeTime", "TimeToFirstByte"},
  89. "AWS/S3": {"4xxErrors", "5xxErrors", "AllRequests", "BucketSizeBytes", "BytesDownloaded", "BytesUploaded", "DeleteRequests", "FirstByteLatency", "GetRequests", "HeadRequests", "ListRequests", "NumberOfObjects", "PostRequests", "PutRequests", "SelectRequests", "SelectReturnedBytes", "SelectScannedBytes", "TotalRequestLatency"},
  90. "AWS/SES": {"Bounce", "Complaint", "Delivery", "Reject", "Reputation.BounceRate", "Reputation.ComplaintRate", "Send"},
  91. "AWS/SNS": {"NumberOfMessagesPublished", "NumberOfNotificationsDelivered", "NumberOfNotificationsFailed", "PublishSize"},
  92. "AWS/SQS": {"ApproximateAgeOfOldestMessage", "ApproximateNumberOfMessagesDelayed", "ApproximateNumberOfMessagesNotVisible", "ApproximateNumberOfMessagesVisible", "NumberOfEmptyReceives", "NumberOfMessagesDeleted", "NumberOfMessagesReceived", "NumberOfMessagesSent", "SentMessageSize"},
  93. "AWS/SWF": {"ActivityTaskScheduleToCloseTime", "ActivityTaskScheduleToStartTime", "ActivityTaskStartToCloseTime", "ActivityTasksCanceled", "ActivityTasksCompleted", "ActivityTasksFailed", "DecisionTaskScheduleToStartTime", "DecisionTaskStartToCloseTime", "DecisionTasksCompleted", "ScheduledActivityTasksTimedOutOnClose", "ScheduledActivityTasksTimedOutOnStart", "StartedActivityTasksTimedOutOnClose", "StartedActivityTasksTimedOutOnHeartbeat", "StartedDecisionTasksTimedOutOnClose", "WorkflowStartToCloseTime", "WorkflowsCanceled", "WorkflowsCompleted", "WorkflowsContinuedAsNew", "WorkflowsFailed", "WorkflowsTerminated", "WorkflowsTimedOut"},
  94. "AWS/SageMaker": {"CPUUtilization", "DatasetObjectsAutoAnnotated", "DatasetObjectsHumanAnnotated", "DatasetObjectsLabelingFailed", "DiskUtilization", "GPUMemoryUtilization", "GPUUtilization", "Invocation4XXErrors", "Invocation5XXErrors", "Invocations", "InvocationsPerInstance", "JobsFailed", "JobsStopped", "JobsSucceeded", "MemoryUtilization", "ModelLatency", "OverheadLatency", "TotalDatasetObjectsLabeled"},
  95. "AWS/States": {"ActivitiesFailed", "ActivitiesHeartbeatTimedOut", "ActivitiesScheduled", "ActivitiesStarted", "ActivitiesSucceeded", "ActivitiesTimedOut", "ActivityRunTime", "ActivityScheduleTime", "ActivityTime", "ConsumedCapacity", "ExecutionThrottled", "ExecutionTime", "ExecutionsAborted", "ExecutionsFailed", "ExecutionsStarted", "ExecutionsSucceeded", "ExecutionsTimedOut", "LambdaFunctionRunTime", "LambdaFunctionScheduleTime", "LambdaFunctionTime", "LambdaFunctionsFailed", "LambdaFunctionsHeartbeatTimedOut", "LambdaFunctionsScheduled", "LambdaFunctionsStarted", "LambdaFunctionsSucceeded", "LambdaFunctionsTimedOut", "ProvisionedBucketSize", "ProvisionedRefillRate", "ThrottledEvents"},
  96. "AWS/StorageGateway": {"CacheFree", "CacheHitPercent", "CachePercentDirty", "CachePercentUsed", "CacheUsed", "CloudBytesDownloaded", "CloudBytesUploaded", "CloudDownloadLatency", "QueuedWrites", "ReadBytes", "ReadTime", "TimeSinceLastRecoveryPoint", "TotalCacheSize", "UploadBufferFree", "UploadBufferPercentUsed", "UploadBufferUsed", "WorkingStorageFree", "WorkingStoragePercentUsed", "WorkingStorageUsed", "WriteBytes", "WriteTime"},
  97. "AWS/TransitGateway": {"BytesIn", "BytesOut", "PacketDropCountBlackhole", "PacketDropCountNoRoute", "PacketsIn", "PacketsOut"},
  98. "AWS/Translate": {"CharacterCount", "ResponseTime", "ServerErrorCount", "SuccessfulRequestCount", "ThrottledCount", "UserErrorCount"},
  99. "AWS/VPN": {"TunnelDataIn", "TunnelDataOut", "TunnelState"},
  100. "AWS/WorkSpaces": {"Available", "ConnectionAttempt", "ConnectionFailure", "ConnectionSuccess", "InSessionLatency", "Maintenance", "SessionDisconnect", "SessionLaunchTime", "Stopped", "Unhealthy", "UserConnected"},
  101. "Rekognition": {"DetectedFaceCount", "DetectedLabelCount", "ResponseTime", "ServerErrorCount", "SuccessfulRequestCount", "ThrottledCount", "UserErrorCount"},
  102. "WAF": {"AllowedRequests", "BlockedRequests", "CountedRequests", "DDoSAttackBitsPerSecond", "DDoSAttackPacketsPerSecond", "DDoSAttackRequestsPerSecond", "DDoSDetected", "PassedRequests"},
  103. }
  104. dimensionsMap = map[string][]string{
  105. "AWS/AmazonMQ": {"Broker", "Queue", "Topic"},
  106. "AWS/ApiGateway": {"ApiName", "Method", "Resource", "Stage"},
  107. "AWS/AppStream": {"Fleet"},
  108. "AWS/AppSync": {"GraphQLAPIId"},
  109. "AWS/ApplicationELB": {"AvailabilityZone", "LoadBalancer", "TargetGroup"},
  110. "AWS/AutoScaling": {"AutoScalingGroupName"},
  111. "AWS/Billing": {"Currency", "LinkedAccount", "ServiceName"},
  112. "AWS/CloudFront": {"DistributionId", "Region"},
  113. "AWS/CloudHSM": {"ClusterId", "HsmId", "Region"},
  114. "AWS/CloudSearch": {"ClientId", "DomainName"},
  115. "AWS/CodeBuild": {"ProjectName"},
  116. "AWS/Connect": {"InstanceId", "MetricGroup", "Participant", "QueueName", "Stream Type", "Type of Connection"},
  117. "AWS/DDoSProtection": {"Region", "Rule", "RuleGroup", "WebACL"},
  118. "AWS/DMS": {"ReplicationInstanceIdentifier", "ReplicationTaskIdentifier"},
  119. "AWS/DX": {"ConnectionId"},
  120. "AWS/DynamoDB": {"GlobalSecondaryIndexName", "Operation", "ReceivingRegion", "StreamLabel", "TableName"},
  121. "AWS/EBS": {"VolumeId"},
  122. "AWS/EC2": {"AutoScalingGroupName", "ImageId", "InstanceId", "InstanceType"},
  123. "AWS/EC2/API": {},
  124. "AWS/EC2Spot": {"AvailabilityZone", "FleetRequestId", "InstanceType"},
  125. "AWS/ECS": {"ClusterName", "ServiceName"},
  126. "AWS/EFS": {"FileSystemId"},
  127. "AWS/ELB": {"AvailabilityZone", "LoadBalancerName"},
  128. "AWS/ES": {"ClientId", "DomainName"},
  129. "AWS/ElastiCache": {"CacheClusterId", "CacheNodeId"},
  130. "AWS/ElasticBeanstalk": {"EnvironmentName", "InstanceId"},
  131. "AWS/ElasticMapReduce": {"ClusterId", "JobFlowId", "JobId"},
  132. "AWS/ElasticTranscoder": {"Operation", "PipelineId"},
  133. "AWS/Events": {"RuleName"},
  134. "AWS/FSx": {},
  135. "AWS/Firehose": {"DeliveryStreamName"},
  136. "AWS/Glue": {"JobName", "JobRunId", "Type"},
  137. "AWS/Inspector": {},
  138. "AWS/IoT": {"Protocol"},
  139. "AWS/KMS": {"KeyId"},
  140. "AWS/Kinesis": {"ShardId", "StreamName"},
  141. "AWS/KinesisAnalytics": {"Application", "Flow", "Id"},
  142. "AWS/KinesisVideo": {},
  143. "AWS/Lambda": {"Alias", "ExecutedVersion", "FunctionName", "Resource"},
  144. "AWS/Lex": {"BotAlias", "BotChannelName", "BotName", "BotVersion", "InputMode", "Operation", "Source"},
  145. "AWS/Logs": {"DestinationType", "FilterName", "LogGroupName"},
  146. "AWS/ML": {"MLModelId", "RequestMode"},
  147. "AWS/MediaConvert": {"Job", "Operation", "Queue"},
  148. "AWS/MediaPackage": {"Channel", "No Dimension", "OriginEndpoint", "StatusCodeRange"},
  149. "AWS/MediaTailor": {"Configuration Name"},
  150. "AWS/NATGateway": {"NatGatewayId"},
  151. "AWS/Neptune": {"DBClusterIdentifier", "DatabaseClass", "EngineName", "Role"},
  152. "AWS/NetworkELB": {"AvailabilityZone", "LoadBalancer", "TargetGroup"},
  153. "AWS/OpsWorks": {"InstanceId", "LayerId", "StackId"},
  154. "AWS/Polly": {"Operation"},
  155. "AWS/RDS": {"DBClusterIdentifier", "DBInstanceIdentifier", "DatabaseClass", "DbClusterIdentifier", "EngineName", "Role", "SourceRegion"},
  156. "AWS/Redshift": {"ClusterIdentifier", "NodeID", "Service class", "Stage", "latency", "wmlid"},
  157. "AWS/Route53": {"HealthCheckId", "Region"},
  158. "AWS/S3": {"BucketName", "FilterId", "StorageType"},
  159. "AWS/SES": {},
  160. "AWS/SNS": {"Application", "Platform", "TopicName"},
  161. "AWS/SQS": {"QueueName"},
  162. "AWS/SWF": {"ActivityTypeName", "ActivityTypeVersion", "Domain", "WorkflowTypeName", "WorkflowTypeVersion"},
  163. "AWS/SageMaker": {"EndpointName", "Host", "LabelingJobName", "VariantName"},
  164. "AWS/States": {"APIName", "ActivityArn", "LambdaFunctionArn", "StateMachineArn", "StateTransition"},
  165. "AWS/StorageGateway": {"GatewayId", "GatewayName", "VolumeId"},
  166. "AWS/TransitGateway": {"TransitGateway"},
  167. "AWS/Translate": {"LanguagePair", "Operation"},
  168. "AWS/VPN": {"TunnelIpAddress", "VpnId"},
  169. "AWS/WorkSpaces": {"DirectoryId", "WorkspaceId"},
  170. "Rekognition": {},
  171. "WAF": {"Region", "Rule", "RuleGroup", "WebACL"},
  172. }
  173. customMetricsMetricsMap = make(map[string]map[string]map[string]*CustomMetricsCache)
  174. customMetricsDimensionsMap = make(map[string]map[string]map[string]*CustomMetricsCache)
  175. }
  176. func (e *CloudWatchExecutor) executeMetricFindQuery(ctx context.Context, queryContext *tsdb.TsdbQuery) (*tsdb.Response, error) {
  177. result := &tsdb.Response{
  178. Results: make(map[string]*tsdb.QueryResult),
  179. }
  180. firstQuery := queryContext.Queries[0]
  181. queryResult := &tsdb.QueryResult{Meta: simplejson.New(), RefId: firstQuery.RefId}
  182. parameters := firstQuery.Model
  183. subType := firstQuery.Model.Get("subtype").MustString()
  184. var data []suggestData
  185. var err error
  186. switch subType {
  187. case "regions":
  188. data, err = e.handleGetRegions(ctx, parameters, queryContext)
  189. case "namespaces":
  190. data, err = e.handleGetNamespaces(ctx, parameters, queryContext)
  191. case "metrics":
  192. data, err = e.handleGetMetrics(ctx, parameters, queryContext)
  193. case "dimension_keys":
  194. data, err = e.handleGetDimensions(ctx, parameters, queryContext)
  195. case "dimension_values":
  196. data, err = e.handleGetDimensionValues(ctx, parameters, queryContext)
  197. case "ebs_volume_ids":
  198. data, err = e.handleGetEbsVolumeIds(ctx, parameters, queryContext)
  199. case "ec2_instance_attribute":
  200. data, err = e.handleGetEc2InstanceAttribute(ctx, parameters, queryContext)
  201. case "resource_arns":
  202. data, err = e.handleGetResourceArns(ctx, parameters, queryContext)
  203. }
  204. transformToTable(data, queryResult)
  205. result.Results[firstQuery.RefId] = queryResult
  206. return result, err
  207. }
  208. func transformToTable(data []suggestData, result *tsdb.QueryResult) {
  209. table := &tsdb.Table{
  210. Columns: make([]tsdb.TableColumn, 2),
  211. Rows: make([]tsdb.RowValues, 0),
  212. }
  213. table.Columns[0].Text = "text"
  214. table.Columns[1].Text = "value"
  215. for _, r := range data {
  216. values := make([]interface{}, 2)
  217. values[0] = r.Text
  218. values[1] = r.Value
  219. table.Rows = append(table.Rows, values)
  220. }
  221. result.Tables = append(result.Tables, table)
  222. result.Meta.Set("rowCount", len(data))
  223. }
  224. func parseMultiSelectValue(input string) []string {
  225. trimmedInput := strings.TrimSpace(input)
  226. if strings.HasPrefix(trimmedInput, "{") {
  227. values := strings.Split(strings.TrimRight(strings.TrimLeft(trimmedInput, "{"), "}"), ",")
  228. trimValues := make([]string, len(values))
  229. for i, v := range values {
  230. trimValues[i] = strings.TrimSpace(v)
  231. }
  232. return trimValues
  233. }
  234. return []string{trimmedInput}
  235. }
  236. // Whenever this list is updated, frontend list should also be updated.
  237. // Please update the region list in public/app/plugins/datasource/cloudwatch/partials/config.html
  238. func (e *CloudWatchExecutor) handleGetRegions(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  239. dsInfo := e.getDsInfo("default")
  240. profile := dsInfo.Profile
  241. if cache, ok := regionCache.Load(profile); ok {
  242. if cache2, ok2 := cache.([]suggestData); ok2 {
  243. return cache2, nil
  244. }
  245. }
  246. regions := []string{
  247. "ap-northeast-1", "ap-northeast-2", "ap-northeast-3", "ap-south-1", "ap-southeast-1", "ap-southeast-2", "ca-central-1",
  248. "eu-central-1", "eu-north-1", "eu-west-1", "eu-west-2", "eu-west-3", "me-south-1", "sa-east-1", "us-east-1", "us-east-2", "us-west-1", "us-west-2",
  249. "cn-north-1", "cn-northwest-1", "us-gov-east-1", "us-gov-west-1", "us-isob-east-1", "us-iso-east-1",
  250. }
  251. err := e.ensureClientSession("default")
  252. if err != nil {
  253. return nil, err
  254. }
  255. r, err := e.ec2Svc.DescribeRegions(&ec2.DescribeRegionsInput{})
  256. if err != nil {
  257. // ignore error for backward compatibility
  258. plog.Error("Failed to get regions", "error", err)
  259. } else {
  260. for _, region := range r.Regions {
  261. exists := false
  262. for _, existingRegion := range regions {
  263. if existingRegion == *region.RegionName {
  264. exists = true
  265. break
  266. }
  267. }
  268. if !exists {
  269. regions = append(regions, *region.RegionName)
  270. }
  271. }
  272. }
  273. sort.Strings(regions)
  274. result := make([]suggestData, 0)
  275. for _, region := range regions {
  276. result = append(result, suggestData{Text: region, Value: region})
  277. }
  278. regionCache.Store(profile, result)
  279. return result, nil
  280. }
  281. func (e *CloudWatchExecutor) handleGetNamespaces(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  282. keys := []string{}
  283. for key := range metricsMap {
  284. keys = append(keys, key)
  285. }
  286. customNamespaces := e.DataSource.JsonData.Get("customMetricsNamespaces").MustString()
  287. if customNamespaces != "" {
  288. keys = append(keys, strings.Split(customNamespaces, ",")...)
  289. }
  290. sort.Strings(keys)
  291. result := make([]suggestData, 0)
  292. for _, key := range keys {
  293. result = append(result, suggestData{Text: key, Value: key})
  294. }
  295. return result, nil
  296. }
  297. func (e *CloudWatchExecutor) handleGetMetrics(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  298. region := parameters.Get("region").MustString()
  299. namespace := parameters.Get("namespace").MustString()
  300. var namespaceMetrics []string
  301. if !isCustomMetrics(namespace) {
  302. var exists bool
  303. if namespaceMetrics, exists = metricsMap[namespace]; !exists {
  304. return nil, errors.New("Unable to find namespace " + namespace)
  305. }
  306. } else {
  307. var err error
  308. dsInfo := e.getDsInfo(region)
  309. dsInfo.Namespace = namespace
  310. if namespaceMetrics, err = getMetricsForCustomMetrics(dsInfo, getAllMetrics); err != nil {
  311. return nil, errors.New("Unable to call AWS API")
  312. }
  313. }
  314. sort.Strings(namespaceMetrics)
  315. result := make([]suggestData, 0)
  316. for _, name := range namespaceMetrics {
  317. result = append(result, suggestData{Text: name, Value: name})
  318. }
  319. return result, nil
  320. }
  321. func (e *CloudWatchExecutor) handleGetDimensions(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  322. region := parameters.Get("region").MustString()
  323. namespace := parameters.Get("namespace").MustString()
  324. var dimensionValues []string
  325. if !isCustomMetrics(namespace) {
  326. var exists bool
  327. if dimensionValues, exists = dimensionsMap[namespace]; !exists {
  328. return nil, errors.New("Unable to find dimension " + namespace)
  329. }
  330. } else {
  331. var err error
  332. dsInfo := e.getDsInfo(region)
  333. dsInfo.Namespace = namespace
  334. if dimensionValues, err = getDimensionsForCustomMetrics(dsInfo, getAllMetrics); err != nil {
  335. return nil, errors.New("Unable to call AWS API")
  336. }
  337. }
  338. sort.Strings(dimensionValues)
  339. result := make([]suggestData, 0)
  340. for _, name := range dimensionValues {
  341. result = append(result, suggestData{Text: name, Value: name})
  342. }
  343. return result, nil
  344. }
  345. func (e *CloudWatchExecutor) handleGetDimensionValues(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  346. region := parameters.Get("region").MustString()
  347. namespace := parameters.Get("namespace").MustString()
  348. metricName := parameters.Get("metricName").MustString()
  349. dimensionKey := parameters.Get("dimensionKey").MustString()
  350. dimensionsJson := parameters.Get("dimensions").MustMap()
  351. var dimensions []*cloudwatch.DimensionFilter
  352. for k, v := range dimensionsJson {
  353. if vv, ok := v.(string); ok {
  354. dimensions = append(dimensions, &cloudwatch.DimensionFilter{
  355. Name: aws.String(k),
  356. Value: aws.String(vv),
  357. })
  358. }
  359. }
  360. metrics, err := e.cloudwatchListMetrics(region, namespace, metricName, dimensions)
  361. if err != nil {
  362. return nil, err
  363. }
  364. result := make([]suggestData, 0)
  365. dupCheck := make(map[string]bool)
  366. for _, metric := range metrics.Metrics {
  367. for _, dim := range metric.Dimensions {
  368. if *dim.Name == dimensionKey {
  369. if _, exists := dupCheck[*dim.Value]; exists {
  370. continue
  371. }
  372. dupCheck[*dim.Value] = true
  373. result = append(result, suggestData{Text: *dim.Value, Value: *dim.Value})
  374. }
  375. }
  376. }
  377. sort.Slice(result, func(i, j int) bool {
  378. return result[i].Text < result[j].Text
  379. })
  380. return result, nil
  381. }
  382. func (e *CloudWatchExecutor) ensureClientSession(region string) error {
  383. if e.ec2Svc == nil {
  384. dsInfo := e.getDsInfo(region)
  385. cfg, err := e.getAwsConfig(dsInfo)
  386. if err != nil {
  387. return fmt.Errorf("Failed to call ec2:getAwsConfig, %v", err)
  388. }
  389. sess, err := session.NewSession(cfg)
  390. if err != nil {
  391. return fmt.Errorf("Failed to call ec2:NewSession, %v", err)
  392. }
  393. e.ec2Svc = ec2.New(sess, cfg)
  394. }
  395. return nil
  396. }
  397. func (e *CloudWatchExecutor) handleGetEbsVolumeIds(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  398. region := parameters.Get("region").MustString()
  399. instanceId := parameters.Get("instanceId").MustString()
  400. err := e.ensureClientSession(region)
  401. if err != nil {
  402. return nil, err
  403. }
  404. instanceIds := aws.StringSlice(parseMultiSelectValue(instanceId))
  405. instances, err := e.ec2DescribeInstances(region, nil, instanceIds)
  406. if err != nil {
  407. return nil, err
  408. }
  409. result := make([]suggestData, 0)
  410. for _, reservation := range instances.Reservations {
  411. for _, instance := range reservation.Instances {
  412. for _, mapping := range instance.BlockDeviceMappings {
  413. result = append(result, suggestData{Text: *mapping.Ebs.VolumeId, Value: *mapping.Ebs.VolumeId})
  414. }
  415. }
  416. }
  417. return result, nil
  418. }
  419. func (e *CloudWatchExecutor) handleGetEc2InstanceAttribute(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  420. region := parameters.Get("region").MustString()
  421. attributeName := parameters.Get("attributeName").MustString()
  422. filterJson := parameters.Get("filters").MustMap()
  423. var filters []*ec2.Filter
  424. for k, v := range filterJson {
  425. if vv, ok := v.([]interface{}); ok {
  426. var vvvvv []*string
  427. for _, vvv := range vv {
  428. if vvvv, ok := vvv.(string); ok {
  429. vvvvv = append(vvvvv, &vvvv)
  430. }
  431. }
  432. filters = append(filters, &ec2.Filter{
  433. Name: aws.String(k),
  434. Values: vvvvv,
  435. })
  436. }
  437. }
  438. err := e.ensureClientSession(region)
  439. if err != nil {
  440. return nil, err
  441. }
  442. instances, err := e.ec2DescribeInstances(region, filters, nil)
  443. if err != nil {
  444. return nil, err
  445. }
  446. result := make([]suggestData, 0)
  447. dupCheck := make(map[string]bool)
  448. for _, reservation := range instances.Reservations {
  449. for _, instance := range reservation.Instances {
  450. tags := make(map[string]string)
  451. for _, tag := range instance.Tags {
  452. tags[*tag.Key] = *tag.Value
  453. }
  454. var data string
  455. if strings.Index(attributeName, "Tags.") == 0 {
  456. tagName := attributeName[5:]
  457. data = tags[tagName]
  458. } else {
  459. attributePath := strings.Split(attributeName, ".")
  460. v := reflect.ValueOf(instance)
  461. for _, key := range attributePath {
  462. if v.Kind() == reflect.Ptr {
  463. v = v.Elem()
  464. }
  465. if v.Kind() != reflect.Struct {
  466. return nil, errors.New("invalid attribute path")
  467. }
  468. v = v.FieldByName(key)
  469. if !v.IsValid() {
  470. return nil, errors.New("invalid attribute path")
  471. }
  472. }
  473. if attr, ok := v.Interface().(*string); ok {
  474. data = *attr
  475. } else {
  476. return nil, errors.New("invalid attribute path")
  477. }
  478. }
  479. if _, exists := dupCheck[data]; exists {
  480. continue
  481. }
  482. dupCheck[data] = true
  483. result = append(result, suggestData{Text: data, Value: data})
  484. }
  485. }
  486. sort.Slice(result, func(i, j int) bool {
  487. return result[i].Text < result[j].Text
  488. })
  489. return result, nil
  490. }
  491. func (e *CloudWatchExecutor) ensureRGTAClientSession(region string) error {
  492. if e.rgtaSvc == nil {
  493. dsInfo := e.getDsInfo(region)
  494. cfg, err := e.getAwsConfig(dsInfo)
  495. if err != nil {
  496. return fmt.Errorf("Failed to call ec2:getAwsConfig, %v", err)
  497. }
  498. sess, err := session.NewSession(cfg)
  499. if err != nil {
  500. return fmt.Errorf("Failed to call ec2:NewSession, %v", err)
  501. }
  502. e.rgtaSvc = resourcegroupstaggingapi.New(sess, cfg)
  503. }
  504. return nil
  505. }
  506. func (e *CloudWatchExecutor) handleGetResourceArns(ctx context.Context, parameters *simplejson.Json, queryContext *tsdb.TsdbQuery) ([]suggestData, error) {
  507. region := parameters.Get("region").MustString()
  508. resourceType := parameters.Get("resourceType").MustString()
  509. filterJson := parameters.Get("tags").MustMap()
  510. err := e.ensureRGTAClientSession(region)
  511. if err != nil {
  512. return nil, err
  513. }
  514. var filters []*resourcegroupstaggingapi.TagFilter
  515. for k, v := range filterJson {
  516. if vv, ok := v.([]interface{}); ok {
  517. var vvvvv []*string
  518. for _, vvv := range vv {
  519. if vvvv, ok := vvv.(string); ok {
  520. vvvvv = append(vvvvv, &vvvv)
  521. }
  522. }
  523. filters = append(filters, &resourcegroupstaggingapi.TagFilter{
  524. Key: aws.String(k),
  525. Values: vvvvv,
  526. })
  527. }
  528. }
  529. var resourceTypes []*string
  530. resourceTypes = append(resourceTypes, &resourceType)
  531. resources, err := e.resourceGroupsGetResources(region, filters, resourceTypes)
  532. if err != nil {
  533. return nil, err
  534. }
  535. result := make([]suggestData, 0)
  536. for _, resource := range resources.ResourceTagMappingList {
  537. data := *resource.ResourceARN
  538. result = append(result, suggestData{Text: data, Value: data})
  539. }
  540. return result, nil
  541. }
  542. func (e *CloudWatchExecutor) cloudwatchListMetrics(region string, namespace string, metricName string, dimensions []*cloudwatch.DimensionFilter) (*cloudwatch.ListMetricsOutput, error) {
  543. svc, err := e.getClient(region)
  544. if err != nil {
  545. return nil, err
  546. }
  547. params := &cloudwatch.ListMetricsInput{
  548. Namespace: aws.String(namespace),
  549. MetricName: aws.String(metricName),
  550. Dimensions: dimensions,
  551. }
  552. var resp cloudwatch.ListMetricsOutput
  553. err = svc.ListMetricsPages(params,
  554. func(page *cloudwatch.ListMetricsOutput, lastPage bool) bool {
  555. metrics.M_Aws_CloudWatch_ListMetrics.Inc()
  556. metrics, _ := awsutil.ValuesAtPath(page, "Metrics")
  557. for _, metric := range metrics {
  558. resp.Metrics = append(resp.Metrics, metric.(*cloudwatch.Metric))
  559. }
  560. return !lastPage
  561. })
  562. if err != nil {
  563. return nil, fmt.Errorf("Failed to call cloudwatch:ListMetrics, %v", err)
  564. }
  565. return &resp, nil
  566. }
  567. func (e *CloudWatchExecutor) ec2DescribeInstances(region string, filters []*ec2.Filter, instanceIds []*string) (*ec2.DescribeInstancesOutput, error) {
  568. params := &ec2.DescribeInstancesInput{
  569. Filters: filters,
  570. InstanceIds: instanceIds,
  571. }
  572. var resp ec2.DescribeInstancesOutput
  573. err := e.ec2Svc.DescribeInstancesPages(params,
  574. func(page *ec2.DescribeInstancesOutput, lastPage bool) bool {
  575. reservations, _ := awsutil.ValuesAtPath(page, "Reservations")
  576. for _, reservation := range reservations {
  577. resp.Reservations = append(resp.Reservations, reservation.(*ec2.Reservation))
  578. }
  579. return !lastPage
  580. })
  581. if err != nil {
  582. return nil, errors.New("Failed to call ec2:DescribeInstances")
  583. }
  584. return &resp, nil
  585. }
  586. func (e *CloudWatchExecutor) resourceGroupsGetResources(region string, filters []*resourcegroupstaggingapi.TagFilter, resourceTypes []*string) (*resourcegroupstaggingapi.GetResourcesOutput, error) {
  587. params := &resourcegroupstaggingapi.GetResourcesInput{
  588. ResourceTypeFilters: resourceTypes,
  589. TagFilters: filters,
  590. }
  591. var resp resourcegroupstaggingapi.GetResourcesOutput
  592. err := e.rgtaSvc.GetResourcesPages(params,
  593. func(page *resourcegroupstaggingapi.GetResourcesOutput, lastPage bool) bool {
  594. resources, _ := awsutil.ValuesAtPath(page, "ResourceTagMappingList")
  595. for _, resource := range resources {
  596. resp.ResourceTagMappingList = append(resp.ResourceTagMappingList, resource.(*resourcegroupstaggingapi.ResourceTagMapping))
  597. }
  598. return !lastPage
  599. })
  600. if err != nil {
  601. return nil, errors.New("Failed to call tags:GetResources")
  602. }
  603. return &resp, nil
  604. }
  605. func getAllMetrics(cwData *DatasourceInfo) (cloudwatch.ListMetricsOutput, error) {
  606. creds, err := GetCredentials(cwData)
  607. if err != nil {
  608. return cloudwatch.ListMetricsOutput{}, err
  609. }
  610. cfg := &aws.Config{
  611. Region: aws.String(cwData.Region),
  612. Credentials: creds,
  613. }
  614. sess, err := session.NewSession(cfg)
  615. if err != nil {
  616. return cloudwatch.ListMetricsOutput{}, err
  617. }
  618. svc := cloudwatch.New(sess, cfg)
  619. params := &cloudwatch.ListMetricsInput{
  620. Namespace: aws.String(cwData.Namespace),
  621. }
  622. var resp cloudwatch.ListMetricsOutput
  623. err = svc.ListMetricsPages(params,
  624. func(page *cloudwatch.ListMetricsOutput, lastPage bool) bool {
  625. metrics.M_Aws_CloudWatch_ListMetrics.Inc()
  626. metrics, _ := awsutil.ValuesAtPath(page, "Metrics")
  627. for _, metric := range metrics {
  628. resp.Metrics = append(resp.Metrics, metric.(*cloudwatch.Metric))
  629. }
  630. return !lastPage
  631. })
  632. return resp, err
  633. }
  634. var metricsCacheLock sync.Mutex
  635. func getMetricsForCustomMetrics(dsInfo *DatasourceInfo, getAllMetrics func(*DatasourceInfo) (cloudwatch.ListMetricsOutput, error)) ([]string, error) {
  636. metricsCacheLock.Lock()
  637. defer metricsCacheLock.Unlock()
  638. if _, ok := customMetricsMetricsMap[dsInfo.Profile]; !ok {
  639. customMetricsMetricsMap[dsInfo.Profile] = make(map[string]map[string]*CustomMetricsCache)
  640. }
  641. if _, ok := customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region]; !ok {
  642. customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region] = make(map[string]*CustomMetricsCache)
  643. }
  644. if _, ok := customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace]; !ok {
  645. customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace] = &CustomMetricsCache{}
  646. customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache = make([]string, 0)
  647. }
  648. if customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Expire.After(time.Now()) {
  649. return customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, nil
  650. }
  651. result, err := getAllMetrics(dsInfo)
  652. if err != nil {
  653. return []string{}, err
  654. }
  655. customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache = make([]string, 0)
  656. customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Expire = time.Now().Add(5 * time.Minute)
  657. for _, metric := range result.Metrics {
  658. if isDuplicate(customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, *metric.MetricName) {
  659. continue
  660. }
  661. customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache = append(customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, *metric.MetricName)
  662. }
  663. return customMetricsMetricsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, nil
  664. }
  665. var dimensionsCacheLock sync.Mutex
  666. func getDimensionsForCustomMetrics(dsInfo *DatasourceInfo, getAllMetrics func(*DatasourceInfo) (cloudwatch.ListMetricsOutput, error)) ([]string, error) {
  667. dimensionsCacheLock.Lock()
  668. defer dimensionsCacheLock.Unlock()
  669. if _, ok := customMetricsDimensionsMap[dsInfo.Profile]; !ok {
  670. customMetricsDimensionsMap[dsInfo.Profile] = make(map[string]map[string]*CustomMetricsCache)
  671. }
  672. if _, ok := customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region]; !ok {
  673. customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region] = make(map[string]*CustomMetricsCache)
  674. }
  675. if _, ok := customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace]; !ok {
  676. customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace] = &CustomMetricsCache{}
  677. customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache = make([]string, 0)
  678. }
  679. if customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Expire.After(time.Now()) {
  680. return customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, nil
  681. }
  682. result, err := getAllMetrics(dsInfo)
  683. if err != nil {
  684. return []string{}, err
  685. }
  686. customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache = make([]string, 0)
  687. customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Expire = time.Now().Add(5 * time.Minute)
  688. for _, metric := range result.Metrics {
  689. for _, dimension := range metric.Dimensions {
  690. if isDuplicate(customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, *dimension.Name) {
  691. continue
  692. }
  693. customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache = append(customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, *dimension.Name)
  694. }
  695. }
  696. return customMetricsDimensionsMap[dsInfo.Profile][dsInfo.Region][dsInfo.Namespace].Cache, nil
  697. }
  698. func isDuplicate(nameList []string, target string) bool {
  699. for _, name := range nameList {
  700. if name == target {
  701. return true
  702. }
  703. }
  704. return false
  705. }
  706. func isCustomMetrics(namespace string) bool {
  707. return strings.Index(namespace, "AWS/") != 0
  708. }