kube-prometheus: add alerting rules
This commit is contained in:
10
assets/prometheus/rules/kube-controller-manager.rules
Normal file
10
assets/prometheus/rules/kube-controller-manager.rules
Normal file
@@ -0,0 +1,10 @@
|
||||
# Fires when no Kubernetes controller manager is running.
#
# The expression has two arms:
#   1. absent(up{...})           - no controller-manager target is known at all
#                                  (no `up` series exists for the job).
#   2. sum by(cluster) (up) == 0 - targets exist for a cluster, but every one
#                                  of them reports up == 0.
#
# Arm 2 deliberately sums the raw `up` values instead of counting the series
# filtered by `== 1`: when nothing is up, that filter yields an empty vector,
# the aggregation over it yields no series, and a `== 0` comparison can then
# never match, so the alert would stay silent while every instance is down.
ALERT K8SControllerManagerDown
  IF absent(up{job="kube-controller-manager"}) or (sum by(cluster) (up{job="kube-controller-manager"}) == 0)
  # Require the condition to hold for 5 minutes before the alert fires.
  FOR 5m
  LABELS {
    severity = "critical",
  }
  ANNOTATIONS {
    summary = "Controller manager is down",
    description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
  }
|
||||
Reference in New Issue
Block a user