kubernetes alerts: don't alert on multiple scheduler/controller-manager replicas
bootkube starts two replicas of the scheduler and the controller manager.
This commit is contained in:
@@ -286,18 +286,6 @@ ALERT K8SControllerManagerDown
|
|||||||
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
|
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
|
||||||
}
|
}
|
||||||
|
|
||||||
ALERT K8SMoreThanOneController
|
|
||||||
IF count by (job,cluster) (up{job=~"kube-scheduler|kube-controller-manager"}) > 1
|
|
||||||
FOR 5m
|
|
||||||
LABELS {
|
|
||||||
service = "k8s",
|
|
||||||
severity = "critical",
|
|
||||||
}
|
|
||||||
ANNOTATIONS {
|
|
||||||
summary = "More than one controller node is active",
|
|
||||||
description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.",
|
|
||||||
}
|
|
||||||
|
|
||||||
ALERT K8SConntrackTableFull
|
ALERT K8SConntrackTableFull
|
||||||
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
|
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
|
||||||
FOR 10m
|
FOR 10m
|
||||||
|
@@ -341,18 +341,6 @@ data:
|
|||||||
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
|
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
|
||||||
}
|
}
|
||||||
|
|
||||||
ALERT K8SMoreThanOneController
|
|
||||||
IF count by (job,cluster) (up{job=~"kube-scheduler|kube-controller-manager"}) > 1
|
|
||||||
FOR 5m
|
|
||||||
LABELS {
|
|
||||||
service = "k8s",
|
|
||||||
severity = "critical",
|
|
||||||
}
|
|
||||||
ANNOTATIONS {
|
|
||||||
summary = "More than one controller node is active",
|
|
||||||
description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.",
|
|
||||||
}
|
|
||||||
|
|
||||||
ALERT K8SConntrackTableFull
|
ALERT K8SConntrackTableFull
|
||||||
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
|
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
|
||||||
FOR 10m
|
FOR 10m
|
||||||
|
Reference in New Issue
Block a user