Skip to content
Snippets Groups Projects
Commit 7516052d authored by Frederic Branczyk's avatar Frederic Branczyk Committed by GitHub
Browse files

Merge pull request #22 from brancz/update-configs

Update configs/alerts
parents 417e3feb dca2c152
No related branches found
No related tags found
No related merge requests found
alerting:
alertmanagers:
- kubernetes_sd_configs:
- role: endpoints
relabel_configs:
- action: keep
regex: alertmanager-main
source_labels:
- __meta_kubernetes_service_name
- action: keep
regex: monitoring
source_labels:
- __meta_kubernetes_namespace
- action: keep
regex: web
source_labels:
- __meta_kubernetes_endpoint_port_name
scheme: http
global:
scrape_interval: 15s
evaluation_interval: 15s
......
...@@ -286,18 +286,6 @@ ALERT K8SControllerManagerDown
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
}
ALERT K8SMoreThanOneController
IF count by (job,cluster) (up{job=~"kube-scheduler|kube-controller-manager"}) > 1
FOR 5m
LABELS {
service = "k8s",
severity = "critical",
}
ANNOTATIONS {
summary = "More than one controller node is active",
description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.",
}
ALERT K8SConntrackTableFull
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
FOR 10m
......
...@@ -341,18 +341,6 @@ data:
description = "There is no running K8S controller manager. Deployments and replication controllers are not making progress.",
}
ALERT K8SMoreThanOneController
IF count by (job,cluster) (up{job=~"kube-scheduler|kube-controller-manager"}) > 1
FOR 5m
LABELS {
service = "k8s",
severity = "critical",
}
ANNOTATIONS {
summary = "More than one controller node is active",
description = "There is more than one {{ $labels.job }} managing the cluster. Cluster behaviour is undefined.",
}
ALERT K8SConntrackTableFull
IF 100*node_nf_conntrack_entries / node_nf_conntrack_entries_limit > 50
FOR 10m
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment