Skip to content

Commit

Permalink
reloader: Expose metrics to give info about last operation result/time
Browse files Browse the repository at this point in the history
Signed-off-by: Philip Gough <philip.p.gough@gmail.com>
  • Loading branch information
philipgough committed Aug 24, 2021
1 parent ce1c4fe commit 8090288
Show file tree
Hide file tree
Showing 2 changed files with 41 additions and 5 deletions.
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,7 @@ We use *breaking :warning:* to mark changes that are not backward compatible (re
- [#4462](https://github.com/thanos-io/thanos/pull/4462) UI: Add find overlap block UI.
- [#4469](https://github.com/thanos-io/thanos/pull/4469) Compact: Add flag `compact.skip-block-with-out-of-order-chunks` to skip blocks with out-of-order chunks during compaction instead of halting
- [#4552](https://github.com/thanos-io/thanos/pull/4552) Compact: Adds `thanos_compact_downsample_duration_seconds` histogram.
- [#4594](https://github.com/thanos-io/thanos/pull/4594) reloader: Expose metrics in config reloader to give info on the last operation.

### Fixed

Expand Down
45 changes: 40 additions & 5 deletions pkg/reloader/reloader.go
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
// Reloader type is useful when you want to:
//
// * Watch on changes against certain file e.g (`cfgFile`).
// * Optionally, specify different different output file for watched `cfgFile` (`cfgOutputFile`).
// * Optionally, specify different output file for watched `cfgFile` (`cfgOutputFile`).
// This will also try decompress the `cfgFile` if needed and substitute ALL the envvars using Kubernetes substitution format: (`$(var)`)
// * Watch on changes against certain directories (`watchedDirs`).
//
Expand Down Expand Up @@ -95,10 +95,14 @@ type Reloader struct {
lastCfgHash []byte
lastWatchedDirsHash []byte

reloads prometheus.Counter
reloadErrors prometheus.Counter
configApplyErrors prometheus.Counter
configApply prometheus.Counter
reloads prometheus.Counter
reloadErrors prometheus.Counter
lastReloadSuccess prometheus.Gauge
lastReloadSuccessTimestamp prometheus.Gauge
configApplyErrors prometheus.Counter
configApply prometheus.Counter
lastConfigApplySuccess prometheus.Gauge
lastConfigApplySuccessTimestamp prometheus.Gauge
}

// Options bundles options for the Reloader.
Expand Down Expand Up @@ -154,6 +158,18 @@ func New(logger log.Logger, reg prometheus.Registerer, o *Options) *Reloader {
Help: "Total number of reload requests that failed.",
},
),
lastReloadSuccess: promauto.With(reg).NewGauge(
prometheus.GaugeOpts{
Name: "reloader_last_reload_successful",
Help: "Whether the last reload attempt was successful",
},
),
lastReloadSuccessTimestamp: promauto.With(reg).NewGauge(
prometheus.GaugeOpts{
Name: "reloader_last_reload_success_timestamp_seconds",
Help: "Timestamp of the last successful reload",
},
),
configApply: promauto.With(reg).NewCounter(
prometheus.CounterOpts{
Name: "reloader_config_apply_operations_total",
Expand All @@ -166,6 +182,18 @@ func New(logger log.Logger, reg prometheus.Registerer, o *Options) *Reloader {
Help: "Total number of config apply operations that failed.",
},
),
lastConfigApplySuccess: promauto.With(reg).NewGauge(
prometheus.GaugeOpts{
Name: "reloader_last_config_apply_successful",
Help: "Whether the last config apply operation attempt was successful",
},
),
lastConfigApplySuccessTimestamp: promauto.With(reg).NewGauge(
prometheus.GaugeOpts{
Name: "reloader_config_apply_last_success_timestamp_seconds",
Help: "Timestamp of the last successful config apply operation",
},
),
}
return r
}
Expand Down Expand Up @@ -243,7 +271,11 @@ func (r *Reloader) Watch(ctx context.Context) error {
if err := r.apply(applyCtx); err != nil {
r.configApplyErrors.Inc()
level.Error(r.logger).Log("msg", "apply error", "err", err)
r.lastConfigApplySuccess.Set(0)
continue
}
r.lastConfigApplySuccess.Set(1)
r.lastConfigApplySuccessTimestamp.SetToCurrentTime()
}
}

Expand Down Expand Up @@ -347,6 +379,7 @@ func (r *Reloader) apply(ctx context.Context) error {
r.reloads.Inc()
if err := r.triggerReload(ctx); err != nil {
r.reloadErrors.Inc()
r.lastReloadSuccess.Set(0)
return errors.Wrap(err, "trigger reload")
}

Expand All @@ -357,6 +390,8 @@ func (r *Reloader) apply(ctx context.Context) error {
"cfg_in", r.cfgFile,
"cfg_out", r.cfgOutputFile,
"watched_dirs", strings.Join(r.watchedDirs, ", "))
r.lastReloadSuccess.Set(1)
r.lastReloadSuccessTimestamp.SetToCurrentTime()
return nil
}); err != nil {
level.Error(r.logger).Log("msg", "Failed to trigger reload. Retrying.", "err", err)
Expand Down

0 comments on commit 8090288

Please sign in to comment.