Add AlertmanagerMembersInconsistent alerting rule
This commit is contained in:
@@ -30,6 +30,21 @@
|
|||||||
severity: 'warning',
|
severity: 'warning',
|
||||||
},
|
},
|
||||||
},
|
},
|
||||||
|
{
  // Fires when an Alertmanager instance reports a cluster size that differs
  // from the number of instances exporting alertmanager_cluster_members for
  // the same service.
  alert: 'AlertmanagerMembersInconsistent',
  annotations: {
    message: 'Alertmanager has not found all other members of the cluster.',
  },
  // The left-hand side yields one series per instance, the right-hand side
  // one series per service, so the comparison is many-to-one and has to say
  // so with group_left(). Without it the query fails with "many-to-one
  // matching must be explicit" as soon as more than one instance of a
  // service disagrees with the count.
  // The outer count by (service) collapses the mismatching instances back to
  // a single series per service, so the alert keeps carrying only the
  // `service` label (plus the static labels below).
  expr: |||
    count by (service) (
      alertmanager_cluster_members{%(alertmanagerSelector)s}
        != on (service) group_left()
      count by (service) (alertmanager_cluster_members{%(alertmanagerSelector)s})
    )
  ||| % $._config,
  // The mismatch must persist for five minutes before the alert fires.
  'for': '5m',
  labels: {
    severity: 'critical',
  },
},
|
||||||
],
|
],
|
||||||
},
|
},
|
||||||
],
|
],
|
||||||
|
44
jsonnet/kube-prometheus/alerts/tests.yaml
Normal file
44
jsonnet/kube-prometheus/alerts/tests.yaml
Normal file
@@ -0,0 +1,44 @@
|
|||||||
|
# TODO(metalmatze): This file is temporarily saved here for later reference
|
||||||
|
# until we find out how to integrate the tests into our jsonnet stack.
|
||||||
|
|
||||||
|
rule_files:
  - rules.yaml

evaluation_interval: 1m

tests:
  # Three Alertmanager replicas behind the same service. Replica 0 gradually
  # loses sight of its peers while replicas 1 and 2 keep reporting 3 members.
  - interval: 1m
    input_series:
      # Replica 0: reports 3 members until 4m, then 2 from 5m, 1 from 11m
      # and 0 from 17m onwards.
      - series: 'alertmanager_cluster_members{job="alertmanager-main",instance="10.10.10.0",namespace="monitoring",pod="alertmanager-main-0",service="alertmanager-main"}'
        values: '3 3 3 3 3 2 2 2 2 2 2 1 1 1 1 1 1 0 0 0 0 0 0'
      # Replica 1: constantly reports 3 members.
      - series: 'alertmanager_cluster_members{job="alertmanager-main",instance="10.10.10.1",namespace="monitoring",pod="alertmanager-main-1",service="alertmanager-main"}'
        values: '3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3'
      # Replica 2: constantly reports 3 members.
      - series: 'alertmanager_cluster_members{job="alertmanager-main",instance="10.10.10.2",namespace="monitoring",pod="alertmanager-main-2",service="alertmanager-main"}'
        values: '3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3'
    alert_rule_test:
      # The mismatch only starts at 5m, so no alert is listed as expected here.
      - eval_time: 5m
        alertname: AlertmanagerMembersInconsistent
      # Replica 0 reports 1 member; the mismatch has lasted longer than 5m.
      - eval_time: 11m
        alertname: AlertmanagerMembersInconsistent
        exp_alerts:
          - exp_labels:
              service: alertmanager-main
              severity: critical
            exp_annotations:
              message: 'Alertmanager has not found all other members of the cluster.'
      # Replica 0 reports 0 members; the alert is still expected.
      - eval_time: 17m
        alertname: AlertmanagerMembersInconsistent
        exp_alerts:
          - exp_labels:
              service: alertmanager-main
              severity: critical
            exp_annotations:
              message: 'Alertmanager has not found all other members of the cluster.'
      # One step past the last input sample; the alert is still expected.
      - eval_time: 23m
        alertname: AlertmanagerMembersInconsistent
        exp_alerts:
          - exp_labels:
              service: alertmanager-main
              severity: critical
            exp_annotations:
              message: 'Alertmanager has not found all other members of the cluster.'
|
Reference in New Issue
Block a user