// metrics.go (12 KB)

  1. package metrics
  2. import (
  3. "bytes"
  4. "encoding/json"
  5. "net/http"
  6. "runtime"
  7. "strings"
  8. "time"
  9. "github.com/grafana/grafana/pkg/bus"
  10. "github.com/grafana/grafana/pkg/models"
  11. "github.com/grafana/grafana/pkg/plugins"
  12. "github.com/grafana/grafana/pkg/setting"
  13. "github.com/prometheus/client_golang/prometheus"
  14. )
  15. const exporterName = "grafana"
  16. var (
  17. M_Instance_Start prometheus.Counter
  18. M_Page_Status *prometheus.CounterVec
  19. M_Api_Status *prometheus.CounterVec
  20. M_Proxy_Status *prometheus.CounterVec
  21. M_Http_Request_Total *prometheus.CounterVec
  22. M_Http_Request_Summary *prometheus.SummaryVec
  23. M_Api_User_SignUpStarted prometheus.Counter
  24. M_Api_User_SignUpCompleted prometheus.Counter
  25. M_Api_User_SignUpInvite prometheus.Counter
  26. M_Api_Dashboard_Save prometheus.Summary
  27. M_Api_Dashboard_Get prometheus.Summary
  28. M_Api_Dashboard_Search prometheus.Summary
  29. M_Api_Admin_User_Create prometheus.Counter
  30. M_Api_Login_Post prometheus.Counter
  31. M_Api_Login_OAuth prometheus.Counter
  32. M_Api_Org_Create prometheus.Counter
  33. M_Api_Dashboard_Snapshot_Create prometheus.Counter
  34. M_Api_Dashboard_Snapshot_External prometheus.Counter
  35. M_Api_Dashboard_Snapshot_Get prometheus.Counter
  36. M_Api_Dashboard_Insert prometheus.Counter
  37. M_Alerting_Result_State *prometheus.CounterVec
  38. M_Alerting_Notification_Sent *prometheus.CounterVec
  39. M_Aws_CloudWatch_GetMetricStatistics prometheus.Counter
  40. M_Aws_CloudWatch_ListMetrics prometheus.Counter
  41. M_DB_DataSource_QueryById prometheus.Counter
  42. // Timers
  43. M_DataSource_ProxyReq_Timer prometheus.Summary
  44. M_Alerting_Execution_Time prometheus.Summary
  45. // StatTotals
  46. M_Alerting_Active_Alerts prometheus.Gauge
  47. M_StatTotal_Dashboards prometheus.Gauge
  48. M_StatTotal_Users prometheus.Gauge
  49. M_StatTotal_Orgs prometheus.Gauge
  50. M_StatTotal_Playlists prometheus.Gauge
  51. )
  52. func init() {
  53. M_Instance_Start = prometheus.NewCounter(prometheus.CounterOpts{
  54. Name: "instance_start_total",
  55. Help: "counter for started instances",
  56. Namespace: exporterName,
  57. })
  58. M_Page_Status = prometheus.NewCounterVec(
  59. prometheus.CounterOpts{
  60. Name: "page_response_status_total",
  61. Help: "page http response status",
  62. Namespace: exporterName,
  63. },
  64. []string{"code"},
  65. )
  66. M_Api_Status = prometheus.NewCounterVec(
  67. prometheus.CounterOpts{
  68. Name: "api_response_status_total",
  69. Help: "api http response status",
  70. Namespace: exporterName,
  71. },
  72. []string{"code"},
  73. )
  74. M_Proxy_Status = prometheus.NewCounterVec(
  75. prometheus.CounterOpts{
  76. Name: "proxy_response_status_total",
  77. Help: "proxy http response status",
  78. Namespace: exporterName,
  79. },
  80. []string{"code"},
  81. )
  82. M_Http_Request_Total = prometheus.NewCounterVec(
  83. prometheus.CounterOpts{
  84. Name: "http_request_total",
  85. Help: "http request counter",
  86. },
  87. []string{"handler", "statuscode", "method"},
  88. )
  89. M_Http_Request_Summary = prometheus.NewSummaryVec(
  90. prometheus.SummaryOpts{
  91. Name: "http_request_duration_milleseconds",
  92. Help: "http request summary",
  93. },
  94. []string{"handler", "statuscode", "method"},
  95. )
  96. M_Api_User_SignUpStarted = prometheus.NewCounter(prometheus.CounterOpts{
  97. Name: "api_user_signup_started_total",
  98. Help: "amount of users who started the signup flow",
  99. Namespace: exporterName,
  100. })
  101. M_Api_User_SignUpCompleted = prometheus.NewCounter(prometheus.CounterOpts{
  102. Name: "api_user_signup_completed_total",
  103. Help: "amount of users who completed the signup flow",
  104. Namespace: exporterName,
  105. })
  106. M_Api_User_SignUpInvite = prometheus.NewCounter(prometheus.CounterOpts{
  107. Name: "api_user_signup_invite_total",
  108. Help: "amount of users who have been invited",
  109. Namespace: exporterName,
  110. })
  111. M_Api_Dashboard_Save = prometheus.NewSummary(prometheus.SummaryOpts{
  112. Name: "api_dashboard_save_milleseconds",
  113. Help: "summary for dashboard save duration",
  114. Namespace: exporterName,
  115. })
  116. M_Api_Dashboard_Get = prometheus.NewSummary(prometheus.SummaryOpts{
  117. Name: "api_dashboard_get_milleseconds",
  118. Help: "summary for dashboard get duration",
  119. Namespace: exporterName,
  120. })
  121. M_Api_Dashboard_Search = prometheus.NewSummary(prometheus.SummaryOpts{
  122. Name: "api_dashboard_search_milleseconds",
  123. Help: "summary for dashboard search duration",
  124. Namespace: exporterName,
  125. })
  126. M_Api_Admin_User_Create = prometheus.NewCounter(prometheus.CounterOpts{
  127. Name: "api_admin_user_created_total",
  128. Help: "api admin user created counter",
  129. Namespace: exporterName,
  130. })
  131. M_Api_Login_Post = prometheus.NewCounter(prometheus.CounterOpts{
  132. Name: "api_login_post_total",
  133. Help: "api login post counter",
  134. Namespace: exporterName,
  135. })
  136. M_Api_Login_OAuth = prometheus.NewCounter(prometheus.CounterOpts{
  137. Name: "api_login_oauth_total",
  138. Help: "api login oauth counter",
  139. Namespace: exporterName,
  140. })
  141. M_Api_Org_Create = prometheus.NewCounter(prometheus.CounterOpts{
  142. Name: "api_org_create_total",
  143. Help: "api org created counter",
  144. Namespace: exporterName,
  145. })
  146. M_Api_Dashboard_Snapshot_Create = prometheus.NewCounter(prometheus.CounterOpts{
  147. Name: "api_dashboard_snapshot_create_total",
  148. Help: "dashboard snapshots created",
  149. Namespace: exporterName,
  150. })
  151. M_Api_Dashboard_Snapshot_External = prometheus.NewCounter(prometheus.CounterOpts{
  152. Name: "api_dashboard_snapshot_external_total",
  153. Help: "external dashboard snapshots created",
  154. Namespace: exporterName,
  155. })
  156. M_Api_Dashboard_Snapshot_Get = prometheus.NewCounter(prometheus.CounterOpts{
  157. Name: "api_dashboard_snapshot_get_total",
  158. Help: "loaded dashboards",
  159. Namespace: exporterName,
  160. })
  161. M_Api_Dashboard_Insert = prometheus.NewCounter(prometheus.CounterOpts{
  162. Name: "api_models_dashboard_insert_total",
  163. Help: "dashboards inserted ",
  164. Namespace: exporterName,
  165. })
  166. M_Alerting_Result_State = prometheus.NewCounterVec(prometheus.CounterOpts{
  167. Name: "alerting_result_total",
  168. Help: "alert execution result counter",
  169. Namespace: exporterName,
  170. }, []string{"state"})
  171. M_Alerting_Notification_Sent = prometheus.NewCounterVec(prometheus.CounterOpts{
  172. Name: "alerting_notification_sent_total",
  173. Help: "counter for how many alert notifications been sent",
  174. Namespace: exporterName,
  175. }, []string{"type"})
  176. M_Aws_CloudWatch_GetMetricStatistics = prometheus.NewCounter(prometheus.CounterOpts{
  177. Name: "aws_cloudwatch_get_metric_statistics_total",
  178. Help: "counter for getting metric statistics from aws",
  179. Namespace: exporterName,
  180. })
  181. M_Aws_CloudWatch_ListMetrics = prometheus.NewCounter(prometheus.CounterOpts{
  182. Name: "aws_cloudwatch_list_metrics_total",
  183. Help: "counter for getting list of metrics from aws",
  184. Namespace: exporterName,
  185. })
  186. M_DB_DataSource_QueryById = prometheus.NewCounter(prometheus.CounterOpts{
  187. Name: "db_datasource_query_by_id_total",
  188. Help: "counter for getting datasource by id",
  189. Namespace: exporterName,
  190. })
  191. M_DataSource_ProxyReq_Timer = prometheus.NewSummary(prometheus.SummaryOpts{
  192. Name: "api_dataproxy_request_all_milleseconds",
  193. Help: "summary for dashboard search duration",
  194. Namespace: exporterName,
  195. })
  196. M_Alerting_Execution_Time = prometheus.NewSummary(prometheus.SummaryOpts{
  197. Name: "alerting_execution_time_milliseconds",
  198. Help: "summary of alert exeuction duration",
  199. Namespace: exporterName,
  200. })
  201. M_Alerting_Active_Alerts = prometheus.NewGauge(prometheus.GaugeOpts{
  202. Name: "alerting_active_alerts",
  203. Help: "amount of active alerts",
  204. Namespace: exporterName,
  205. })
  206. M_StatTotal_Dashboards = prometheus.NewGauge(prometheus.GaugeOpts{
  207. Name: "stat_totals_dashboard",
  208. Help: "total amount of dashboards",
  209. Namespace: exporterName,
  210. })
  211. M_StatTotal_Users = prometheus.NewGauge(prometheus.GaugeOpts{
  212. Name: "stat_total_users",
  213. Help: "total amount of users",
  214. Namespace: exporterName,
  215. })
  216. M_StatTotal_Orgs = prometheus.NewGauge(prometheus.GaugeOpts{
  217. Name: "stat_total_orgs",
  218. Help: "total amount of orgs",
  219. Namespace: exporterName,
  220. })
  221. M_StatTotal_Playlists = prometheus.NewGauge(prometheus.GaugeOpts{
  222. Name: "stat_total_playlists",
  223. Help: "total amount of playlists",
  224. Namespace: exporterName,
  225. })
  226. }
  227. func initMetricVars(settings *MetricSettings) {
  228. prometheus.MustRegister(
  229. M_Instance_Start,
  230. M_Page_Status,
  231. M_Api_Status,
  232. M_Proxy_Status,
  233. M_Http_Request_Total,
  234. M_Http_Request_Summary,
  235. M_Api_User_SignUpStarted,
  236. M_Api_User_SignUpCompleted,
  237. M_Api_User_SignUpInvite,
  238. M_Api_Dashboard_Save,
  239. M_Api_Dashboard_Get,
  240. M_Api_Dashboard_Search,
  241. M_DataSource_ProxyReq_Timer,
  242. M_Alerting_Execution_Time,
  243. M_Api_Admin_User_Create,
  244. M_Api_Login_Post,
  245. M_Api_Login_OAuth,
  246. M_Api_Org_Create,
  247. M_Api_Dashboard_Snapshot_Create,
  248. M_Api_Dashboard_Snapshot_External,
  249. M_Api_Dashboard_Snapshot_Get,
  250. M_Api_Dashboard_Insert,
  251. M_Alerting_Result_State,
  252. M_Alerting_Notification_Sent,
  253. M_Aws_CloudWatch_GetMetricStatistics,
  254. M_Aws_CloudWatch_ListMetrics,
  255. M_DB_DataSource_QueryById,
  256. M_Alerting_Active_Alerts,
  257. M_StatTotal_Dashboards,
  258. M_StatTotal_Users,
  259. M_StatTotal_Orgs,
  260. M_StatTotal_Playlists)
  261. go instrumentationLoop(settings)
  262. }
  263. func instrumentationLoop(settings *MetricSettings) chan struct{} {
  264. M_Instance_Start.Inc()
  265. onceEveryDayTick := time.NewTicker(time.Hour * 24)
  266. secondTicker := time.NewTicker(time.Second * time.Duration(settings.IntervalSeconds))
  267. for {
  268. select {
  269. case <-onceEveryDayTick.C:
  270. sendUsageStats()
  271. case <-secondTicker.C:
  272. updateTotalStats()
  273. }
  274. }
  275. }
  276. var metricPublishCounter int64 = 0
  277. func updateTotalStats() {
  278. metricPublishCounter++
  279. if metricPublishCounter == 1 || metricPublishCounter%10 == 0 {
  280. statsQuery := models.GetSystemStatsQuery{}
  281. if err := bus.Dispatch(&statsQuery); err != nil {
  282. metricsLogger.Error("Failed to get system stats", "error", err)
  283. return
  284. }
  285. M_StatTotal_Dashboards.Set(float64(statsQuery.Result.Dashboards))
  286. M_StatTotal_Users.Set(float64(statsQuery.Result.Users))
  287. M_StatTotal_Playlists.Set(float64(statsQuery.Result.Playlists))
  288. M_StatTotal_Orgs.Set(float64(statsQuery.Result.Orgs))
  289. }
  290. }
  291. func sendUsageStats() {
  292. if !setting.ReportingEnabled {
  293. return
  294. }
  295. metricsLogger.Debug("Sending anonymous usage stats to stats.grafana.org")
  296. version := strings.Replace(setting.BuildVersion, ".", "_", -1)
  297. metrics := map[string]interface{}{}
  298. report := map[string]interface{}{
  299. "version": version,
  300. "metrics": metrics,
  301. "os": runtime.GOOS,
  302. "arch": runtime.GOARCH,
  303. }
  304. statsQuery := models.GetSystemStatsQuery{}
  305. if err := bus.Dispatch(&statsQuery); err != nil {
  306. metricsLogger.Error("Failed to get system stats", "error", err)
  307. return
  308. }
  309. metrics["stats.dashboards.count"] = statsQuery.Result.Dashboards
  310. metrics["stats.users.count"] = statsQuery.Result.Users
  311. metrics["stats.orgs.count"] = statsQuery.Result.Orgs
  312. metrics["stats.playlist.count"] = statsQuery.Result.Playlists
  313. metrics["stats.plugins.apps.count"] = len(plugins.Apps)
  314. metrics["stats.plugins.panels.count"] = len(plugins.Panels)
  315. metrics["stats.plugins.datasources.count"] = len(plugins.DataSources)
  316. metrics["stats.alerts.count"] = statsQuery.Result.Alerts
  317. metrics["stats.active_users.count"] = statsQuery.Result.ActiveUsers
  318. metrics["stats.datasources.count"] = statsQuery.Result.Datasources
  319. dsStats := models.GetDataSourceStatsQuery{}
  320. if err := bus.Dispatch(&dsStats); err != nil {
  321. metricsLogger.Error("Failed to get datasource stats", "error", err)
  322. return
  323. }
  324. // send counters for each data source
  325. // but ignore any custom data sources
  326. // as sending that name could be sensitive information
  327. dsOtherCount := 0
  328. for _, dsStat := range dsStats.Result {
  329. if models.IsKnownDataSourcePlugin(dsStat.Type) {
  330. metrics["stats.ds."+dsStat.Type+".count"] = dsStat.Count
  331. } else {
  332. dsOtherCount += dsStat.Count
  333. }
  334. }
  335. metrics["stats.ds.other.count"] = dsOtherCount
  336. out, _ := json.MarshalIndent(report, "", " ")
  337. data := bytes.NewBuffer(out)
  338. client := http.Client{Timeout: time.Duration(5 * time.Second)}
  339. go client.Post("https://stats.grafana.org/grafana-usage-report", "application/json", data)
  340. }