diff --git a/jsonnet/kube-prometheus/alerts/prometheus-operator.libsonnet b/jsonnet/kube-prometheus/alerts/prometheus-operator.libsonnet
index 580aa866d246234fe515d9bf67eac70f502cdac3..a8ddd13affe7800b470e03e5412ce2b709d3e1d3 100644
--- a/jsonnet/kube-prometheus/alerts/prometheus-operator.libsonnet
+++ b/jsonnet/kube-prometheus/alerts/prometheus-operator.libsonnet
@@ -4,16 +4,29 @@
       {
         name: 'prometheus-operator',
         rules: [
+          {
+            alert: 'PrometheusOperatorListErrors',
+            expr: |||
+              (sum by (controller,namespace) (rate(prometheus_operator_list_operations_failed_total{%(prometheusOperatorSelector)s}[1h])) / sum by (controller,namespace) (rate(prometheus_operator_list_operations_total{%(prometheusOperatorSelector)s}[1h]))) > 0.4
+            ||| % $._config,
+            labels: {
+              severity: 'warning',
+            },
+            annotations: {
+              message: 'Errors while performing List operations in controller {{$labels.controller}} in {{$labels.namespace}} namespace.',
+            },
+            'for': '15m',
+          },
           {
             alert: 'PrometheusOperatorWatchErrors',
             expr: |||
-              (sum by (controller,namespace) (rate(prometheus_operator_watch_operations_failed_total{%(prometheusOperatorSelector)s}[1h])) / sum by (controller,namespace) (rate(prometheus_operator_watch_operations_total{%(prometheusOperatorSelector)s}[1h]))) > 0.1
+              (sum by (controller,namespace) (rate(prometheus_operator_watch_operations_failed_total{%(prometheusOperatorSelector)s}[1h])) / sum by (controller,namespace) (rate(prometheus_operator_watch_operations_total{%(prometheusOperatorSelector)s}[1h]))) > 0.4
             ||| % $._config,
             labels: {
               severity: 'warning',
             },
             annotations: {
-              message: 'Errors while performing watch operations in controller {{$labels.controller}} in {{$labels.namespace}} namespace.',
+              message: 'Errors while performing Watch operations in controller {{$labels.controller}} in {{$labels.namespace}} namespace.',
             },
             'for': '15m',
           },