Merge pull request #22 from brancz/update-configs

Update configs/alerts
This commit is contained in:
Frederic Branczyk
2016-12-14 18:17:05 -08:00
committed by GitHub
3 changed files with 19 additions and 24 deletions

View File

@@ -1,3 +1,22 @@
# Alertmanager discovery: find Alertmanager instances through the Kubernetes
# endpoints API and keep only the targets that match all three filters below.
alerting:
  alertmanagers:
  - kubernetes_sd_configs:
    - role: endpoints
    relabel_configs:
    # Keep only endpoints that belong to the `alertmanager-main` service.
    - action: keep
      regex: alertmanager-main
      source_labels:
      - __meta_kubernetes_service_name
    # Keep only endpoints in the `monitoring` namespace.
    - action: keep
      regex: monitoring
      source_labels:
      - __meta_kubernetes_namespace
    # Keep only the endpoint port named `web`.
    - action: keep
      regex: web
      source_labels:
      - __meta_kubernetes_endpoint_port_name
    scheme: http
# Global defaults: scrape targets and evaluate rules every 15 seconds.
global:
  scrape_interval: 15s
  evaluation_interval: 15s

View File

@@ -286,18 +286,6 @@ ALERT K8SControllerManagerDown
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
}
# Fires when, for 5 minutes, more than one `up` series exists per
# (job, cluster) for the kube-scheduler or kube-controller-manager jobs.
# NOTE(review): `count` counts series regardless of their value, so targets
# reporting up == 0 are included as well -- confirm this is intended.
ALERT K8SMoreThanOneController
  IF count(up{job=~"kube-scheduler|kube-controller-manager"}) by (job, cluster) > 1
  FOR 5m
  LABELS {
    service = "k8s",
    severity = "critical",
  }
  ANNOTATIONS {
    summary = "More than one controller node is active",
    description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.",
  }
ALERT K8SConntrackTableFull
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
FOR 10m

View File

@@ -341,18 +341,6 @@ data:
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
}
# Fires when, for 5 minutes, more than one `up` series exists per
# (job, cluster) for the kube-scheduler or kube-controller-manager jobs.
# NOTE(review): `count` counts series regardless of their value, so targets
# reporting up == 0 are included as well -- confirm this is intended.
ALERT K8SMoreThanOneController
IF count by (job,cluster) (up{job=~"kube-scheduler|kube-controller-manager"}) > 1
FOR 5m
LABELS {
service = "k8s",
severity = "critical",
}
ANNOTATIONS {
summary = "More than one controller node is active",
description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.",
}
ALERT K8SConntrackTableFull
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
FOR 10m