Merge pull request #2542 from gianrubio/instrument-configreload
Instrument controller to show configReload metrics
This commit is contained in:
commit
d95facd15e
2 changed files with 47 additions and 6 deletions
|
@ -169,13 +169,15 @@ func (n *NGINXController) syncIngress(interface{}) error {
|
||||||
|
|
||||||
err := n.OnUpdate(pcfg)
|
err := n.OnUpdate(pcfg)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
incReloadErrorCount()
|
IncReloadErrorCount()
|
||||||
|
ConfigSuccess(false)
|
||||||
glog.Errorf("unexpected failure restarting the backend: \n%v", err)
|
glog.Errorf("unexpected failure restarting the backend: \n%v", err)
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
glog.Infof("ingress backend successfully reloaded...")
|
glog.Infof("ingress backend successfully reloaded...")
|
||||||
incReloadCount()
|
ConfigSuccess(true)
|
||||||
|
IncReloadCount()
|
||||||
setSSLExpireTime(servers)
|
setSSLExpireTime(servers)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -17,6 +17,8 @@ limitations under the License.
|
||||||
package controller
|
package controller
|
||||||
|
|
||||||
import (
|
import (
|
||||||
|
"time"
|
||||||
|
|
||||||
"github.com/prometheus/client_golang/prometheus"
|
"github.com/prometheus/client_golang/prometheus"
|
||||||
|
|
||||||
"k8s.io/ingress-nginx/internal/ingress"
|
"k8s.io/ingress-nginx/internal/ingress"
|
||||||
|
@ -34,22 +36,42 @@ func init() {
|
||||||
prometheus.MustRegister(reloadOperation)
|
prometheus.MustRegister(reloadOperation)
|
||||||
prometheus.MustRegister(reloadOperationErrors)
|
prometheus.MustRegister(reloadOperationErrors)
|
||||||
prometheus.MustRegister(sslExpireTime)
|
prometheus.MustRegister(sslExpireTime)
|
||||||
|
prometheus.MustRegister(configSuccess)
|
||||||
|
prometheus.MustRegister(configSuccessTime)
|
||||||
}
|
}
|
||||||
|
|
||||||
var (
|
var (
|
||||||
|
configSuccess = prometheus.NewGauge(prometheus.GaugeOpts{
|
||||||
|
Namespace: ns,
|
||||||
|
Name: "config_last_reload_successfull",
|
||||||
|
Help: `Whether the last configuration reload attemp was successfull.
|
||||||
|
Prometheus alert example:
|
||||||
|
alert: IngressControllerFailedReload
|
||||||
|
expr: ingress_controller_config_last_reload_successfull == 0
|
||||||
|
for: 10m`,
|
||||||
|
})
|
||||||
|
configSuccessTime = prometheus.NewGauge(prometheus.GaugeOpts{
|
||||||
|
Namespace: ns,
|
||||||
|
Name: "config_last_reload_successfull_timestamp_seconds",
|
||||||
|
Help: "Timestamp of the last successfull configuration reload.",
|
||||||
|
})
|
||||||
|
// TODO depreciate this metrics in favor of ingress_controller_config_last_reload_successfull_timestamp_seconds
|
||||||
reloadOperation = prometheus.NewCounterVec(
|
reloadOperation = prometheus.NewCounterVec(
|
||||||
prometheus.CounterOpts{
|
prometheus.CounterOpts{
|
||||||
Namespace: ns,
|
Namespace: ns,
|
||||||
Name: "success",
|
Name: "success",
|
||||||
Help: "Cumulative number of Ingress controller reload operations",
|
Help: `DEPRECATED: use ingress_controller_config_last_reload_successfull_timestamp_seconds or ingress_controller_config_last_reload_successfull instead.
|
||||||
|
Cumulative number of Ingress controller reload operations`,
|
||||||
},
|
},
|
||||||
[]string{operation},
|
[]string{operation},
|
||||||
)
|
)
|
||||||
|
// TODO depreciate this metrics in favor of ingress_controller_config_last_reload_successfull_timestamp_seconds
|
||||||
reloadOperationErrors = prometheus.NewCounterVec(
|
reloadOperationErrors = prometheus.NewCounterVec(
|
||||||
prometheus.CounterOpts{
|
prometheus.CounterOpts{
|
||||||
Namespace: ns,
|
Namespace: ns,
|
||||||
Name: "errors",
|
Name: "errors",
|
||||||
Help: "Cumulative number of Ingress controller errors during reload operations",
|
Help: `DEPRECATED: use ingress_controller_config_last_reload_successfull_timestamp_seconds or ingress_controller_config_last_reload_successfull instead.
|
||||||
|
Cumulative number of Ingress controller errors during reload operations`,
|
||||||
},
|
},
|
||||||
[]string{operation},
|
[]string{operation},
|
||||||
)
|
)
|
||||||
|
@ -64,14 +86,31 @@ var (
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
|
|
||||||
func incReloadCount() {
|
// IncReloadCount increment the reload counter
|
||||||
|
func IncReloadCount() {
|
||||||
reloadOperation.WithLabelValues(reloadLabel).Inc()
|
reloadOperation.WithLabelValues(reloadLabel).Inc()
|
||||||
}
|
}
|
||||||
|
|
||||||
func incReloadErrorCount() {
|
// IncReloadErrorCount increment the reload error counter
|
||||||
|
func IncReloadErrorCount() {
|
||||||
reloadOperationErrors.WithLabelValues(reloadLabel).Inc()
|
reloadOperationErrors.WithLabelValues(reloadLabel).Inc()
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// ConfigSuccess set a boolean flag according to the output of the controller configuration reload
|
||||||
|
func ConfigSuccess(success bool) {
|
||||||
|
if success {
|
||||||
|
ConfigSuccessTime()
|
||||||
|
configSuccess.Set(1)
|
||||||
|
} else {
|
||||||
|
configSuccess.Set(0)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// ConfigSuccessTime set the current timestamp when the controller is successfully reloaded
|
||||||
|
func ConfigSuccessTime() {
|
||||||
|
configSuccessTime.Set(float64(time.Now().Unix()))
|
||||||
|
}
|
||||||
|
|
||||||
func setSSLExpireTime(servers []*ingress.Server) {
|
func setSSLExpireTime(servers []*ingress.Server) {
|
||||||
for _, s := range servers {
|
for _, s := range servers {
|
||||||
if s.Hostname != defServerName {
|
if s.Hostname != defServerName {
|
||||||
|
|
Loading…
Reference in a new issue