2017-08-23 18:46:03 +00:00
|
|
|
package metrics
|
|
|
|
|
|
|
|
import (
|
2020-03-05 14:10:07 +00:00
|
|
|
"errors"
|
|
|
|
"time"
|
|
|
|
|
2017-08-23 18:46:03 +00:00
|
|
|
"github.com/go-kit/kit/metrics"
|
|
|
|
"github.com/go-kit/kit/metrics/multi"
|
|
|
|
)
|
|
|
|
|
|
|
|
// Registry has to implemented by any system that wants to monitor and expose metrics.
|
|
|
|
type Registry interface {
|
2019-07-18 19:36:05 +00:00
|
|
|
// IsEpEnabled shows whether metrics instrumentation is enabled on entry points.
|
|
|
|
IsEpEnabled() bool
|
|
|
|
// IsSvcEnabled shows whether metrics instrumentation is enabled on services.
|
|
|
|
IsSvcEnabled() bool
|
2018-07-03 08:02:03 +00:00
|
|
|
|
2018-01-26 10:58:03 +00:00
|
|
|
// server metrics
|
|
|
|
ConfigReloadsCounter() metrics.Counter
|
|
|
|
ConfigReloadsFailureCounter() metrics.Counter
|
|
|
|
LastConfigReloadSuccessGauge() metrics.Gauge
|
|
|
|
LastConfigReloadFailureGauge() metrics.Gauge
|
|
|
|
|
2020-12-18 17:44:03 +00:00
|
|
|
// TLS
|
|
|
|
TLSCertsNotAfterTimestampGauge() metrics.Gauge
|
|
|
|
|
2018-01-26 10:58:03 +00:00
|
|
|
// entry point metrics
|
2019-07-18 19:36:05 +00:00
|
|
|
EntryPointReqsCounter() metrics.Counter
|
2020-03-05 12:30:05 +00:00
|
|
|
EntryPointReqsTLSCounter() metrics.Counter
|
2020-03-05 14:10:07 +00:00
|
|
|
EntryPointReqDurationHistogram() ScalableHistogram
|
2019-07-18 19:36:05 +00:00
|
|
|
EntryPointOpenConnsGauge() metrics.Gauge
|
2018-01-26 10:58:03 +00:00
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
// service metrics
|
|
|
|
ServiceReqsCounter() metrics.Counter
|
2020-03-05 12:30:05 +00:00
|
|
|
ServiceReqsTLSCounter() metrics.Counter
|
2020-03-05 14:10:07 +00:00
|
|
|
ServiceReqDurationHistogram() ScalableHistogram
|
2019-07-18 19:36:05 +00:00
|
|
|
ServiceOpenConnsGauge() metrics.Gauge
|
|
|
|
ServiceRetriesCounter() metrics.Counter
|
|
|
|
ServiceServerUpGauge() metrics.Gauge
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// NewVoidRegistry is a noop implementation of metrics.Registry.
|
|
|
|
// It is used to avoid nil checking in components that do metric collections.
|
|
|
|
func NewVoidRegistry() Registry {
|
|
|
|
return NewMultiRegistry([]Registry{})
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
2018-01-26 10:58:03 +00:00
|
|
|
// NewMultiRegistry is an implementation of metrics.Registry that wraps multiple registries.
|
|
|
|
// It handles the case when a registry hasn't registered some metric and returns nil.
|
|
|
|
// This allows for feature imparity between the different metric implementations.
|
2017-08-23 18:46:03 +00:00
|
|
|
func NewMultiRegistry(registries []Registry) Registry {
|
2018-07-03 08:02:03 +00:00
|
|
|
var configReloadsCounter []metrics.Counter
|
|
|
|
var configReloadsFailureCounter []metrics.Counter
|
|
|
|
var lastConfigReloadSuccessGauge []metrics.Gauge
|
|
|
|
var lastConfigReloadFailureGauge []metrics.Gauge
|
2020-12-18 17:44:03 +00:00
|
|
|
var tlsCertsNotAfterTimestampGauge []metrics.Gauge
|
2019-07-18 19:36:05 +00:00
|
|
|
var entryPointReqsCounter []metrics.Counter
|
2020-03-05 12:30:05 +00:00
|
|
|
var entryPointReqsTLSCounter []metrics.Counter
|
2020-03-05 14:10:07 +00:00
|
|
|
var entryPointReqDurationHistogram []ScalableHistogram
|
2019-07-18 19:36:05 +00:00
|
|
|
var entryPointOpenConnsGauge []metrics.Gauge
|
|
|
|
var serviceReqsCounter []metrics.Counter
|
2020-03-05 12:30:05 +00:00
|
|
|
var serviceReqsTLSCounter []metrics.Counter
|
2020-03-05 14:10:07 +00:00
|
|
|
var serviceReqDurationHistogram []ScalableHistogram
|
2019-07-18 19:36:05 +00:00
|
|
|
var serviceOpenConnsGauge []metrics.Gauge
|
|
|
|
var serviceRetriesCounter []metrics.Counter
|
|
|
|
var serviceServerUpGauge []metrics.Gauge
|
2017-08-23 18:46:03 +00:00
|
|
|
|
|
|
|
for _, r := range registries {
|
2018-01-26 10:58:03 +00:00
|
|
|
if r.ConfigReloadsCounter() != nil {
|
|
|
|
configReloadsCounter = append(configReloadsCounter, r.ConfigReloadsCounter())
|
|
|
|
}
|
|
|
|
if r.ConfigReloadsFailureCounter() != nil {
|
|
|
|
configReloadsFailureCounter = append(configReloadsFailureCounter, r.ConfigReloadsFailureCounter())
|
|
|
|
}
|
|
|
|
if r.LastConfigReloadSuccessGauge() != nil {
|
|
|
|
lastConfigReloadSuccessGauge = append(lastConfigReloadSuccessGauge, r.LastConfigReloadSuccessGauge())
|
|
|
|
}
|
|
|
|
if r.LastConfigReloadFailureGauge() != nil {
|
|
|
|
lastConfigReloadFailureGauge = append(lastConfigReloadFailureGauge, r.LastConfigReloadFailureGauge())
|
|
|
|
}
|
2020-12-18 17:44:03 +00:00
|
|
|
if r.TLSCertsNotAfterTimestampGauge() != nil {
|
|
|
|
tlsCertsNotAfterTimestampGauge = append(tlsCertsNotAfterTimestampGauge, r.TLSCertsNotAfterTimestampGauge())
|
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.EntryPointReqsCounter() != nil {
|
|
|
|
entryPointReqsCounter = append(entryPointReqsCounter, r.EntryPointReqsCounter())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2020-03-05 12:30:05 +00:00
|
|
|
if r.EntryPointReqsTLSCounter() != nil {
|
|
|
|
entryPointReqsTLSCounter = append(entryPointReqsTLSCounter, r.EntryPointReqsTLSCounter())
|
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.EntryPointReqDurationHistogram() != nil {
|
|
|
|
entryPointReqDurationHistogram = append(entryPointReqDurationHistogram, r.EntryPointReqDurationHistogram())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.EntryPointOpenConnsGauge() != nil {
|
|
|
|
entryPointOpenConnsGauge = append(entryPointOpenConnsGauge, r.EntryPointOpenConnsGauge())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.ServiceReqsCounter() != nil {
|
|
|
|
serviceReqsCounter = append(serviceReqsCounter, r.ServiceReqsCounter())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2020-03-05 12:30:05 +00:00
|
|
|
if r.ServiceReqsTLSCounter() != nil {
|
|
|
|
serviceReqsTLSCounter = append(serviceReqsTLSCounter, r.ServiceReqsTLSCounter())
|
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.ServiceReqDurationHistogram() != nil {
|
|
|
|
serviceReqDurationHistogram = append(serviceReqDurationHistogram, r.ServiceReqDurationHistogram())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.ServiceOpenConnsGauge() != nil {
|
|
|
|
serviceOpenConnsGauge = append(serviceOpenConnsGauge, r.ServiceOpenConnsGauge())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.ServiceRetriesCounter() != nil {
|
|
|
|
serviceRetriesCounter = append(serviceRetriesCounter, r.ServiceRetriesCounter())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2019-07-18 19:36:05 +00:00
|
|
|
if r.ServiceServerUpGauge() != nil {
|
|
|
|
serviceServerUpGauge = append(serviceServerUpGauge, r.ServiceServerUpGauge())
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return &standardRegistry{
|
2019-07-18 19:36:05 +00:00
|
|
|
epEnabled: len(entryPointReqsCounter) > 0 || len(entryPointReqDurationHistogram) > 0 || len(entryPointOpenConnsGauge) > 0,
|
|
|
|
svcEnabled: len(serviceReqsCounter) > 0 || len(serviceReqDurationHistogram) > 0 || len(serviceOpenConnsGauge) > 0 || len(serviceRetriesCounter) > 0 || len(serviceServerUpGauge) > 0,
|
2018-01-26 10:58:03 +00:00
|
|
|
configReloadsCounter: multi.NewCounter(configReloadsCounter...),
|
|
|
|
configReloadsFailureCounter: multi.NewCounter(configReloadsFailureCounter...),
|
|
|
|
lastConfigReloadSuccessGauge: multi.NewGauge(lastConfigReloadSuccessGauge...),
|
|
|
|
lastConfigReloadFailureGauge: multi.NewGauge(lastConfigReloadFailureGauge...),
|
2020-12-18 17:44:03 +00:00
|
|
|
tlsCertsNotAfterTimestampGauge: multi.NewGauge(tlsCertsNotAfterTimestampGauge...),
|
2019-07-18 19:36:05 +00:00
|
|
|
entryPointReqsCounter: multi.NewCounter(entryPointReqsCounter...),
|
2020-03-05 12:30:05 +00:00
|
|
|
entryPointReqsTLSCounter: multi.NewCounter(entryPointReqsTLSCounter...),
|
2020-03-05 14:10:07 +00:00
|
|
|
entryPointReqDurationHistogram: NewMultiHistogram(entryPointReqDurationHistogram...),
|
2019-07-18 19:36:05 +00:00
|
|
|
entryPointOpenConnsGauge: multi.NewGauge(entryPointOpenConnsGauge...),
|
|
|
|
serviceReqsCounter: multi.NewCounter(serviceReqsCounter...),
|
2020-03-05 12:30:05 +00:00
|
|
|
serviceReqsTLSCounter: multi.NewCounter(serviceReqsTLSCounter...),
|
2020-03-05 14:10:07 +00:00
|
|
|
serviceReqDurationHistogram: NewMultiHistogram(serviceReqDurationHistogram...),
|
2019-07-18 19:36:05 +00:00
|
|
|
serviceOpenConnsGauge: multi.NewGauge(serviceOpenConnsGauge...),
|
|
|
|
serviceRetriesCounter: multi.NewCounter(serviceRetriesCounter...),
|
|
|
|
serviceServerUpGauge: multi.NewGauge(serviceServerUpGauge...),
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type standardRegistry struct {
|
2019-07-18 19:36:05 +00:00
|
|
|
epEnabled bool
|
|
|
|
svcEnabled bool
|
2018-01-26 10:58:03 +00:00
|
|
|
configReloadsCounter metrics.Counter
|
|
|
|
configReloadsFailureCounter metrics.Counter
|
|
|
|
lastConfigReloadSuccessGauge metrics.Gauge
|
|
|
|
lastConfigReloadFailureGauge metrics.Gauge
|
2020-12-18 17:44:03 +00:00
|
|
|
tlsCertsNotAfterTimestampGauge metrics.Gauge
|
2019-07-18 19:36:05 +00:00
|
|
|
entryPointReqsCounter metrics.Counter
|
2020-03-05 12:30:05 +00:00
|
|
|
entryPointReqsTLSCounter metrics.Counter
|
2020-03-05 14:10:07 +00:00
|
|
|
entryPointReqDurationHistogram ScalableHistogram
|
2019-07-18 19:36:05 +00:00
|
|
|
entryPointOpenConnsGauge metrics.Gauge
|
|
|
|
serviceReqsCounter metrics.Counter
|
2020-03-05 12:30:05 +00:00
|
|
|
serviceReqsTLSCounter metrics.Counter
|
2020-03-05 14:10:07 +00:00
|
|
|
serviceReqDurationHistogram ScalableHistogram
|
2019-07-18 19:36:05 +00:00
|
|
|
serviceOpenConnsGauge metrics.Gauge
|
|
|
|
serviceRetriesCounter metrics.Counter
|
|
|
|
serviceServerUpGauge metrics.Gauge
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
func (r *standardRegistry) IsEpEnabled() bool {
|
|
|
|
return r.epEnabled
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *standardRegistry) IsSvcEnabled() bool {
|
|
|
|
return r.svcEnabled
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
2018-01-26 10:58:03 +00:00
|
|
|
func (r *standardRegistry) ConfigReloadsCounter() metrics.Counter {
|
|
|
|
return r.configReloadsCounter
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
2018-01-26 10:58:03 +00:00
|
|
|
func (r *standardRegistry) ConfigReloadsFailureCounter() metrics.Counter {
|
|
|
|
return r.configReloadsFailureCounter
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
2018-01-26 10:58:03 +00:00
|
|
|
func (r *standardRegistry) LastConfigReloadSuccessGauge() metrics.Gauge {
|
|
|
|
return r.lastConfigReloadSuccessGauge
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
2018-01-26 10:58:03 +00:00
|
|
|
func (r *standardRegistry) LastConfigReloadFailureGauge() metrics.Gauge {
|
|
|
|
return r.lastConfigReloadFailureGauge
|
2017-08-23 18:46:03 +00:00
|
|
|
}
|
|
|
|
|
2020-12-18 17:44:03 +00:00
|
|
|
func (r *standardRegistry) TLSCertsNotAfterTimestampGauge() metrics.Gauge {
|
|
|
|
return r.tlsCertsNotAfterTimestampGauge
|
|
|
|
}
|
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
func (r *standardRegistry) EntryPointReqsCounter() metrics.Counter {
|
|
|
|
return r.entryPointReqsCounter
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
|
|
|
|
2020-03-05 12:30:05 +00:00
|
|
|
func (r *standardRegistry) EntryPointReqsTLSCounter() metrics.Counter {
|
|
|
|
return r.entryPointReqsTLSCounter
|
|
|
|
}
|
|
|
|
|
2020-03-05 14:10:07 +00:00
|
|
|
func (r *standardRegistry) EntryPointReqDurationHistogram() ScalableHistogram {
|
2019-07-18 19:36:05 +00:00
|
|
|
return r.entryPointReqDurationHistogram
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
func (r *standardRegistry) EntryPointOpenConnsGauge() metrics.Gauge {
|
|
|
|
return r.entryPointOpenConnsGauge
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
func (r *standardRegistry) ServiceReqsCounter() metrics.Counter {
|
|
|
|
return r.serviceReqsCounter
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
|
|
|
|
2020-03-05 12:30:05 +00:00
|
|
|
func (r *standardRegistry) ServiceReqsTLSCounter() metrics.Counter {
|
|
|
|
return r.serviceReqsTLSCounter
|
|
|
|
}
|
|
|
|
|
2020-03-05 14:10:07 +00:00
|
|
|
func (r *standardRegistry) ServiceReqDurationHistogram() ScalableHistogram {
|
2019-07-18 19:36:05 +00:00
|
|
|
return r.serviceReqDurationHistogram
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2017-08-23 18:46:03 +00:00
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
func (r *standardRegistry) ServiceOpenConnsGauge() metrics.Gauge {
|
|
|
|
return r.serviceOpenConnsGauge
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2017-08-23 18:46:03 +00:00
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
func (r *standardRegistry) ServiceRetriesCounter() metrics.Counter {
|
|
|
|
return r.serviceRetriesCounter
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2017-08-23 18:46:03 +00:00
|
|
|
|
2019-07-18 19:36:05 +00:00
|
|
|
func (r *standardRegistry) ServiceServerUpGauge() metrics.Gauge {
|
|
|
|
return r.serviceServerUpGauge
|
2018-01-26 10:58:03 +00:00
|
|
|
}
|
2020-03-05 14:10:07 +00:00
|
|
|
|
|
|
|
// ScalableHistogram is a Histogram with a predefined time unit,
// used when producing observations without explicitly setting the observed value.
type ScalableHistogram interface {
	// With returns a ScalableHistogram bound to the given label values.
	With(labelValues ...string) ScalableHistogram
	// Observe records the value v as given.
	Observe(v float64)
	// ObserveFromStart records an observation derived from the given start time
	// instead of an explicit value.
	ObserveFromStart(start time.Time)
}
|
|
|
|
|
|
|
|
// HistogramWithScale is a histogram that will convert its observed value to the specified unit.
|
|
|
|
type HistogramWithScale struct {
|
|
|
|
histogram metrics.Histogram
|
|
|
|
unit time.Duration
|
|
|
|
}
|
|
|
|
|
|
|
|
// With implements ScalableHistogram.
|
|
|
|
func (s *HistogramWithScale) With(labelValues ...string) ScalableHistogram {
|
2020-03-19 12:48:04 +00:00
|
|
|
h, _ := NewHistogramWithScale(s.histogram.With(labelValues...), s.unit)
|
|
|
|
return h
|
2020-03-05 14:10:07 +00:00
|
|
|
}
|
|
|
|
|
2020-03-19 12:48:04 +00:00
|
|
|
// ObserveFromStart implements ScalableHistogram.
|
|
|
|
func (s *HistogramWithScale) ObserveFromStart(start time.Time) {
|
2020-03-05 14:10:07 +00:00
|
|
|
if s.unit <= 0 {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2020-03-19 12:48:04 +00:00
|
|
|
d := float64(time.Since(start).Nanoseconds()) / float64(s.unit)
|
2020-03-05 14:10:07 +00:00
|
|
|
if d < 0 {
|
|
|
|
d = 0
|
|
|
|
}
|
|
|
|
s.histogram.Observe(d)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Observe implements ScalableHistogram.
|
|
|
|
func (s *HistogramWithScale) Observe(v float64) {
|
|
|
|
s.histogram.Observe(v)
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewHistogramWithScale returns a ScalableHistogram. It returns an error if the given unit is <= 0.
|
|
|
|
func NewHistogramWithScale(histogram metrics.Histogram, unit time.Duration) (ScalableHistogram, error) {
|
|
|
|
if unit <= 0 {
|
|
|
|
return nil, errors.New("invalid time unit")
|
|
|
|
}
|
|
|
|
return &HistogramWithScale{
|
|
|
|
histogram: histogram,
|
|
|
|
unit: unit,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// MultiHistogram collects multiple individual histograms and treats them as a unit.
|
|
|
|
type MultiHistogram []ScalableHistogram
|
|
|
|
|
|
|
|
// NewMultiHistogram returns a multi-histogram, wrapping the passed histograms.
|
|
|
|
func NewMultiHistogram(h ...ScalableHistogram) MultiHistogram {
|
|
|
|
return MultiHistogram(h)
|
|
|
|
}
|
|
|
|
|
2020-03-19 12:48:04 +00:00
|
|
|
// ObserveFromStart implements ScalableHistogram.
|
|
|
|
func (h MultiHistogram) ObserveFromStart(start time.Time) {
|
2020-03-05 14:10:07 +00:00
|
|
|
for _, histogram := range h {
|
2020-03-19 12:48:04 +00:00
|
|
|
histogram.ObserveFromStart(start)
|
2020-03-05 14:10:07 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Observe implements ScalableHistogram.
|
|
|
|
func (h MultiHistogram) Observe(v float64) {
|
|
|
|
for _, histogram := range h {
|
|
|
|
histogram.Observe(v)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// With implements ScalableHistogram.
|
|
|
|
func (h MultiHistogram) With(labelValues ...string) ScalableHistogram {
|
|
|
|
next := make(MultiHistogram, len(h))
|
|
|
|
for i := range h {
|
|
|
|
next[i] = h[i].With(labelValues...)
|
|
|
|
}
|
|
|
|
return next
|
|
|
|
}
|