To combat label cardinality explosions remove the type from metrics. This was most severe in the histogram for request duration, remove it there. It's also highlighted difference between grpc and forward code, where forward did use type and grpc didn't; getting rid of all that "fixes" that discrepancy Move monitor.go back into the vars directory and make it private again. Also name it slightly better Fixes: #4507 Signed-off-by: Miek Gieben <miek@miek.nl>
67 lines
2.4 KiB
Go
67 lines
2.4 KiB
Go
package forward
|
|
|
|
import (
|
|
"github.com/coredns/coredns/plugin"
|
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/prometheus/client_golang/prometheus/promauto"
|
|
)
|
|
|
|
// Variables declared for monitoring.
|
|
var (
|
|
RequestCount = promauto.NewCounterVec(prometheus.CounterOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "requests_total",
|
|
Help: "Counter of requests made per upstream.",
|
|
}, []string{"to"})
|
|
RcodeCount = promauto.NewCounterVec(prometheus.CounterOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "responses_total",
|
|
Help: "Counter of responses received per upstream.",
|
|
}, []string{"rcode", "to"})
|
|
RequestDuration = promauto.NewHistogramVec(prometheus.HistogramOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "request_duration_seconds",
|
|
Buckets: plugin.TimeBuckets,
|
|
Help: "Histogram of the time each request took.",
|
|
}, []string{"to", "rcode"})
|
|
HealthcheckFailureCount = promauto.NewCounterVec(prometheus.CounterOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "healthcheck_failures_total",
|
|
Help: "Counter of the number of failed healthchecks.",
|
|
}, []string{"to"})
|
|
HealthcheckBrokenCount = promauto.NewCounter(prometheus.CounterOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "healthcheck_broken_total",
|
|
Help: "Counter of the number of complete failures of the healthchecks.",
|
|
})
|
|
SocketGauge = promauto.NewGaugeVec(prometheus.GaugeOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "sockets_open",
|
|
Help: "Gauge of open sockets per upstream.",
|
|
}, []string{"to"})
|
|
MaxConcurrentRejectCount = promauto.NewCounter(prometheus.CounterOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "max_concurrent_rejects_total",
|
|
Help: "Counter of the number of queries rejected because the concurrent queries were at maximum.",
|
|
})
|
|
ConnCacheHitsCount = promauto.NewCounterVec(prometheus.CounterOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "conn_cache_hits_total",
|
|
Help: "Counter of connection cache hits per upstream and protocol.",
|
|
}, []string{"to", "proto"})
|
|
ConnCacheMissesCount = promauto.NewCounterVec(prometheus.CounterOpts{
|
|
Namespace: plugin.Namespace,
|
|
Subsystem: "forward",
|
|
Name: "conn_cache_misses_total",
|
|
Help: "Counter of connection cache misses per upstream and protocol.",
|
|
}, []string{"to", "proto"})
|
|
)
|