diff --git a/docs/developing-prometheus-rules-and-grafana-dashboards.md b/docs/developing-prometheus-rules-and-grafana-dashboards.md index b9ae2b9b548f91196371a2eb9dbc5f45490b5f90..a0a41c5ead83b08660e7a20a97fcfb135eafdd55 100644 --- a/docs/developing-prometheus-rules-and-grafana-dashboards.md +++ b/docs/developing-prometheus-rules-and-grafana-dashboards.md @@ -300,11 +300,11 @@ local kp = (import 'kube-prometheus/kube-prometheus.libsonnet') + { _config+:: { namespace: 'monitoring', }, - grafanaDashboards+:: { // monitoring-mixin compatibility + grafanaDashboards+:: { // monitoring-mixin compatibility 'my-dashboard.json': (import 'example-grafana-dashboard.json'), }, grafana+:: { - dashboards+:: { // use this method to import your dashboards to Grafana + dashboards+:: { // use this method to import your dashboards to Grafana 'my-dashboard.json': (import 'example-grafana-dashboard.json'), }, }, diff --git a/examples/grafana-additional-rendered-dashboard-example.jsonnet b/examples/grafana-additional-rendered-dashboard-example.jsonnet index f55eab8ae1345692421f41dfbd66fc9040ac1453..883c609700a8e9c6ccdf19ad6d068d9a55c778a5 100644 --- a/examples/grafana-additional-rendered-dashboard-example.jsonnet +++ b/examples/grafana-additional-rendered-dashboard-example.jsonnet @@ -2,11 +2,11 @@ local kp = (import 'kube-prometheus/kube-prometheus.libsonnet') + { _config+:: { namespace: 'monitoring', }, - grafanaDashboards+:: { // monitoring-mixin compatibility + grafanaDashboards+:: { // monitoring-mixin compatibility 'my-dashboard.json': (import 'example-grafana-dashboard.json'), }, grafana+:: { - dashboards+:: { // use this method to import your dashboards to Grafana + dashboards+:: { // use this method to import your dashboards to Grafana 'my-dashboard.json': (import 'example-grafana-dashboard.json'), }, }, diff --git a/jsonnetfile.lock.json b/jsonnetfile.lock.json index c210c4948aeb757719cbdd26eedede8f4e95573d..934ee99710ad76c6eb137dd84a92dcc8747596c8 100644 --- a/jsonnetfile.lock.json +++ b/jsonnetfile.lock.json @@ -69,8 +69,8 @@ "subdir": "" } }, - "version": "b61c5a34051f8f57284a08fe78ad8a45b430252b", - "sum": "7Hx/5eNm7ubLTsdrpk3b2+e/FLR3XOa4HCukmbRUCAY=" + "version": "fba82a1c0bc225127b084e91bd142c99b1792cb6", + "sum": "hJ5n6OeumIpKYuZQHwxL/rtpAJaW/qTFE9oOA8RWd7w=" }, { "source": { diff --git a/manifests/prometheus-rules.yaml b/manifests/prometheus-rules.yaml index ef5a4dae66928d1903710b684f2f4f60af37b962..aefacdf1e2497f77d9a5f458d626d7f9dbe01f94 100644 --- a/manifests/prometheus-rules.yaml +++ b/manifests/prometheus-rules.yaml @@ -1129,16 +1129,6 @@ spec: for: 15m labels: severity: warning - - alert: KubeCronJobRunning - annotations: - message: CronJob {{ $labels.namespace }}/{{ $labels.cronjob }} is taking more - than 1h to complete. - runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubecronjobrunning - expr: | - time() - kube_cronjob_next_schedule_time{job="kube-state-metrics"} > 3600 - for: 1h - labels: - severity: warning - alert: KubeJobCompletion annotations: message: Job {{ $labels.namespace }}/{{ $labels.job_name }} is taking more @@ -1240,19 +1230,19 @@ spec: for: 5m labels: severity: warning - - alert: KubeQuotaExceeded + - alert: KubeQuotaFullyUsed annotations: message: Namespace {{ $labels.namespace }} is using {{ $value | humanizePercentage }} of its {{ $labels.resource }} quota. - runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubequotaexceeded + runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubequotafullyused expr: | kube_resourcequota{job="kube-state-metrics", type="used"} / ignoring(instance, job, type) (kube_resourcequota{job="kube-state-metrics", type="hard"} > 0) - > 0.90 + >= 1 for: 15m labels: - severity: warning + severity: info - alert: CPUThrottlingHigh annotations: message: '{{ $value | humanizePercentage }} throttling of CPU in namespace @@ -1391,43 +1381,6 @@ spec: short: 6h - name: kubernetes-system-apiserver rules: - - alert: KubeAPILatencyHigh - annotations: - message: The API server has an abnormal latency of {{ $value }} seconds for - {{ $labels.verb }} {{ $labels.resource }}. - runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapilatencyhigh - expr: | - cluster_quantile:apiserver_request_duration_seconds:histogram_quantile{job="apiserver",quantile="0.99"} - > - 1 - and on (verb,resource) - ( - cluster:apiserver_request_duration_seconds:mean5m{job="apiserver"} - > - on (verb) group_left() - ( - avg by (verb) (cluster:apiserver_request_duration_seconds:mean5m{job="apiserver"} >= 0) - + - 2*stddev by (verb) (cluster:apiserver_request_duration_seconds:mean5m{job="apiserver"} >= 0) - ) - ) > on (verb) group_left() - 1.2 * avg by (verb) (cluster:apiserver_request_duration_seconds:mean5m{job="apiserver"} >= 0) - for: 5m - labels: - severity: warning - - alert: KubeAPIErrorsHigh - annotations: - message: API server is returning errors for {{ $value | humanizePercentage - }} of requests for {{ $labels.verb }} {{ $labels.resource }} {{ $labels.subresource - }}. - runbook_url: https://github.com/kubernetes-monitoring/kubernetes-mixin/tree/master/runbook.md#alert-name-kubeapierrorshigh - expr: | - sum(rate(apiserver_request_total{job="apiserver",code=~"5.."}[5m])) by (resource,subresource,verb) - / - sum(rate(apiserver_request_total{job="apiserver"}[5m])) by (resource,subresource,verb) > 0.05 - for: 10m - labels: - severity: warning - alert: KubeClientCertificateExpiration annotations: message: A client certificate used to authenticate to the apiserver is expiring