ir: Add health status #87
3 changed files with 21 additions and 4 deletions
|
@ -925,7 +925,7 @@ func New(ctx context.Context, log *logger.Logger, cfg *viper.Viper, errChan chan
|
||||||
queueSize: cfg.GetUint32("workers.subnet"),
|
queueSize: cfg.GetUint32("workers.subnet"),
|
||||||
})
|
})
|
||||||
|
|
||||||
if cfg.GetString("metrics.address") != "" {
|
if cfg.GetString("prometheus.address") != "" {
|
||||||
fyrchik marked this conversation as resolved
Outdated
|
|||||||
m := metrics.NewInnerRingMetrics()
|
m := metrics.NewInnerRingMetrics()
|
||||||
server.metrics = &m
|
server.metrics = &m
|
||||||
}
|
}
|
||||||
|
|
|
@ -167,6 +167,9 @@ func (s *Server) ResetEpochTimer(h uint32) error {
|
||||||
|
|
||||||
func (s *Server) setHealthStatus(hs control.HealthStatus) {
|
func (s *Server) setHealthStatus(hs control.HealthStatus) {
|
||||||
s.healthStatus.Store(hs)
|
s.healthStatus.Store(hs)
|
||||||
|
if s.metrics != nil {
|
||||||
|
s.metrics.SetHealth(int32(hs))
|
||||||
fyrchik
commented
Does the number means the same for other services? Like 0 == HEALTHY? Does the number means the same for other services? Like 0 == HEALTHY?
acid-ant
commented
We have two enums for HealthStatus - one in We have two enums for HealthStatus - one in `control` and one in `ir`. But they have the same numbers for statuses. Can we move HealthStatus in `common` proto file, one for both packages?
|
|||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// HealthStatus returns the current health status of the IR application.
|
// HealthStatus returns the current health status of the IR application.
|
||||||
|
|
|
@ -2,11 +2,12 @@ package metrics
|
||||||
|
|
||||||
import "github.com/prometheus/client_golang/prometheus"
|
import "github.com/prometheus/client_golang/prometheus"
|
||||||
|
|
||||||
const innerRingSubsystem = "object"
|
const innerRingSubsystem = "ir"
|
||||||
|
|
||||||
// InnerRingServiceMetrics contains metrics collected by inner ring.
|
// InnerRingServiceMetrics contains metrics collected by inner ring.
|
||||||
type InnerRingServiceMetrics struct {
|
type InnerRingServiceMetrics struct {
|
||||||
epoch prometheus.Gauge
|
epoch prometheus.Gauge
|
||||||
|
health prometheus.Gauge
|
||||||
}
|
}
|
||||||
|
|
||||||
// NewInnerRingMetrics returns new instance of metrics collectors for inner ring.
|
// NewInnerRingMetrics returns new instance of metrics collectors for inner ring.
|
||||||
|
@ -18,12 +19,20 @@ func NewInnerRingMetrics() InnerRingServiceMetrics {
|
||||||
Name: "epoch",
|
Name: "epoch",
|
||||||
Help: "Current epoch as seen by inner-ring node.",
|
Help: "Current epoch as seen by inner-ring node.",
|
||||||
})
|
})
|
||||||
|
health = prometheus.NewGauge(prometheus.GaugeOpts{
|
||||||
|
Namespace: namespace,
|
||||||
|
Subsystem: innerRingSubsystem,
|
||||||
|
Name: "health",
|
||||||
|
Help: "Current inner-ring node state.",
|
||||||
|
})
|
||||||
)
|
)
|
||||||
|
|
||||||
prometheus.MustRegister(epoch)
|
prometheus.MustRegister(epoch)
|
||||||
|
prometheus.MustRegister(health)
|
||||||
|
|
||||||
return InnerRingServiceMetrics{
|
return InnerRingServiceMetrics{
|
||||||
epoch: epoch,
|
epoch: epoch,
|
||||||
|
health: health,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -31,3 +40,8 @@ func NewInnerRingMetrics() InnerRingServiceMetrics {
|
||||||
func (m InnerRingServiceMetrics) SetEpoch(epoch uint64) {
|
func (m InnerRingServiceMetrics) SetEpoch(epoch uint64) {
|
||||||
m.epoch.Set(float64(epoch))
|
m.epoch.Set(float64(epoch))
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// SetHealth updates health metrics.
|
||||||
|
func (m InnerRingServiceMetrics) SetHealth(s int32) {
|
||||||
|
m.health.Set(float64(s))
|
||||||
|
}
|
||||||
|
|
Loading…
Reference in a new issue
Worth a separate commit.
Agree, moved in separate commit.