From 1c6bc7a387763ba2c7448a96c91d05f8b0138ebf Mon Sep 17 00:00:00 2001 From: Frederic Branczyk <fbranczyk@gmail.com> Date: Wed, 14 Dec 2016 18:10:50 -0800 Subject: [PATCH] kubernetes alerts: don't alert on multiple bootkube starts two replicas of the scheduler and controllers manager --- assets/prometheus/rules/kubernetes.rules | 12 ------------ manifests/prometheus/prometheus-k8s-rules.yaml | 12 ------------ 2 files changed, 24 deletions(-) diff --git a/assets/prometheus/rules/kubernetes.rules b/assets/prometheus/rules/kubernetes.rules index 216c0ccd..c0dddb92 100644 --- a/assets/prometheus/rules/kubernetes.rules +++ b/assets/prometheus/rules/kubernetes.rules @@ -286,18 +286,6 @@ ALERT K8SControllerManagerDown description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.", } -ALERT K8SMoreThanOneController - IF count by (job,cluster) (up{job=~"kube-scheduler|kube-controller-manager"}) > 1 - FOR 5m - LABELS { - service = "k8s", - severity = "critical", - } - ANNOTATIONS { - summary = "More than one controller node is active", - description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.", - } - ALERT K8SConntrackTableFull IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50 FOR 10m diff --git a/manifests/prometheus/prometheus-k8s-rules.yaml b/manifests/prometheus/prometheus-k8s-rules.yaml index c01a7f3e..6e83500e 100644 --- a/manifests/prometheus/prometheus-k8s-rules.yaml +++ b/manifests/prometheus/prometheus-k8s-rules.yaml @@ -341,18 +341,6 @@ data: description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.", } - ALERT K8SMoreThanOneController - IF count by (job,cluster) (up{job=~"kube-scheduler|kube-controller-manager"}) > 1 - FOR 5m - LABELS { - service = "k8s", - severity = "critical", - } - ANNOTATIONS { - summary = "More than one controller node is active", - description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.", - } - ALERT K8SConntrackTableFull IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50 FOR 10m -- GitLab