kube-prometheus: ensure triggering alerts on down targets

This commit is contained in:
Frederic Branczyk
2017-06-28 10:50:17 +02:00
parent 4c42ab4fcc
commit a5533a4f6c
7 changed files with 32 additions and 28 deletions

View File

@@ -1,14 +1,14 @@
### Up Alerting ###
Alert TargetDown
-IF 100 * (count(up == 0) / count(up)) > 3
+IF 100 * (count by(job) (up == 0) / count by(job) (up)) > 10
FOR 10m
LABELS {
severity = "warning"
}
ANNOTATIONS {
summary = "Targets are down",
-description = "More than {{ $value }}% of targets are down."
+description = "{{ $value }}% or more of {{ $labels.job }} targets are down."
}
### Dead man's switch ###