2019-11-15 11:25:21 -08:00
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
2019-11-21 15:30:19 -08:00
|
|
|
"net/http"
|
|
|
|
|
2019-11-15 11:25:21 -08:00
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
|
|
"github.com/prometheus/client_golang/prometheus/promhttp"
|
|
|
|
)
|
|
|
|
|
|
|
|
// TODO: Not sure if this is the best way to handle. A global instance for
|
|
|
|
// metrics isn't bad, but it might be nice to curry versions of the metrics
|
|
|
|
// for each monitor. Especially since every monitor has it's own. Perhaps
|
|
|
|
// another new function that essentially curries each metric for a given
|
|
|
|
// monitor name would do. This could be run when validating monitors and
|
|
|
|
// initializing alert templates.
|
|
|
|
|
|
|
|
// MinitorMetrics contains all counters and metrics that Minitor will need to access
|
|
|
|
type MinitorMetrics struct {
|
|
|
|
alertCount *prometheus.CounterVec
|
|
|
|
checkCount *prometheus.CounterVec
|
2021-05-11 10:41:22 -07:00
|
|
|
checkTime *prometheus.GaugeVec
|
2019-11-15 11:25:21 -08:00
|
|
|
monitorStatus *prometheus.GaugeVec
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewMetrics creates and initializes all metrics
|
|
|
|
func NewMetrics() *MinitorMetrics {
|
|
|
|
// Initialize all metrics
|
|
|
|
metrics := &MinitorMetrics{
|
|
|
|
alertCount: prometheus.NewCounterVec(
|
|
|
|
prometheus.CounterOpts{
|
|
|
|
Name: "minitor_alert_total",
|
|
|
|
Help: "Number of Minitor alerts",
|
|
|
|
},
|
|
|
|
[]string{"alert", "monitor"},
|
|
|
|
),
|
|
|
|
checkCount: prometheus.NewCounterVec(
|
|
|
|
prometheus.CounterOpts{
|
|
|
|
Name: "minitor_check_total",
|
|
|
|
Help: "Number of Minitor checks",
|
|
|
|
},
|
|
|
|
[]string{"monitor", "status", "is_alert"},
|
|
|
|
),
|
2021-05-11 10:41:22 -07:00
|
|
|
checkTime: prometheus.NewGaugeVec(
|
|
|
|
prometheus.GaugeOpts{
|
|
|
|
Name: "minitor_check_milliseconds",
|
|
|
|
Help: "Time in miliseconds that a check ran for",
|
|
|
|
},
|
|
|
|
[]string{"monitor", "status"},
|
|
|
|
),
|
2019-11-15 11:25:21 -08:00
|
|
|
monitorStatus: prometheus.NewGaugeVec(
|
|
|
|
prometheus.GaugeOpts{
|
|
|
|
Name: "minitor_monitor_up_count",
|
|
|
|
Help: "Status of currently responsive monitors",
|
|
|
|
},
|
|
|
|
[]string{"monitor"},
|
|
|
|
),
|
|
|
|
}
|
|
|
|
|
|
|
|
// Register newly created metrics
|
|
|
|
prometheus.MustRegister(metrics.alertCount)
|
|
|
|
prometheus.MustRegister(metrics.checkCount)
|
2021-05-11 10:41:22 -07:00
|
|
|
prometheus.MustRegister(metrics.checkTime)
|
2019-11-15 11:25:21 -08:00
|
|
|
prometheus.MustRegister(metrics.monitorStatus)
|
|
|
|
|
|
|
|
return metrics
|
|
|
|
}
|
|
|
|
|
|
|
|
// SetMonitorStatus sets the current status of Monitor
|
|
|
|
func (metrics *MinitorMetrics) SetMonitorStatus(monitor string, isUp bool) {
|
|
|
|
val := 0.0
|
|
|
|
if isUp {
|
|
|
|
val = 1.0
|
|
|
|
}
|
2021-05-10 21:00:58 -07:00
|
|
|
|
2019-11-15 11:25:21 -08:00
|
|
|
metrics.monitorStatus.With(prometheus.Labels{"monitor": monitor}).Set(val)
|
|
|
|
}
|
|
|
|
|
|
|
|
// CountCheck counts the result of a particular Monitor check
|
2021-05-11 10:41:22 -07:00
|
|
|
func (metrics *MinitorMetrics) CountCheck(monitor string, isSuccess bool, ms int64, isAlert bool) {
|
2019-11-15 11:25:21 -08:00
|
|
|
status := "failure"
|
|
|
|
if isSuccess {
|
|
|
|
status = "success"
|
|
|
|
}
|
|
|
|
|
|
|
|
alertVal := "false"
|
|
|
|
if isAlert {
|
|
|
|
alertVal = "true"
|
|
|
|
}
|
|
|
|
|
|
|
|
metrics.checkCount.With(
|
|
|
|
prometheus.Labels{"monitor": monitor, "status": status, "is_alert": alertVal},
|
|
|
|
).Inc()
|
2021-05-11 10:41:22 -07:00
|
|
|
|
|
|
|
metrics.checkTime.With(
|
|
|
|
prometheus.Labels{"monitor": monitor, "status": status},
|
|
|
|
).Set(float64(ms))
|
2019-11-15 11:25:21 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// CountAlert counts an alert
|
|
|
|
func (metrics *MinitorMetrics) CountAlert(monitor string, alert string) {
|
|
|
|
metrics.alertCount.With(
|
|
|
|
prometheus.Labels{
|
|
|
|
"alert": alert,
|
|
|
|
"monitor": monitor,
|
|
|
|
},
|
|
|
|
).Inc()
|
|
|
|
}
|
|
|
|
|
|
|
|
// ServeMetrics starts an http server with a Prometheus metrics handler
|
|
|
|
func ServeMetrics() {
|
|
|
|
http.Handle("/metrics", promhttp.Handler())
|
2021-05-10 21:00:58 -07:00
|
|
|
|
2019-11-15 11:25:21 -08:00
|
|
|
host := fmt.Sprintf(":%d", MetricsPort)
|
2021-05-10 21:00:58 -07:00
|
|
|
|
2019-11-15 11:25:21 -08:00
|
|
|
_ = http.ListenAndServe(host, nil)
|
|
|
|
}
|