From 486c84d53244e44ff72a3c2db42ee12afdb083e8 Mon Sep 17 00:00:00 2001
From: Christian Pointner
Date: Thu, 23 Sep 2021 20:37:20 +0200
Subject: add some more prometheus rules for blackbox exporter

---
 .../server/defaults/main/rules_blackbox__https.yml | 19 ++++++++++++++++++-
 1 file changed, 18 insertions(+), 1 deletion(-)

(limited to 'roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml')

diff --git a/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml b/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml
index cfdc10bd..140e3b4f 100644
--- a/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml
+++ b/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml
@@ -1,3 +1,20 @@
 ---
 prometheus_server_rules_blackbox__https_extra: []
-prometheus_server_rules_blackbox__https: []
+prometheus_server_rules_blackbox__https:
+  - alert: BlackboxProbeHttpFailure
+    expr: probe_http_status_code <= 199 OR probe_http_status_code >= 400
+    for: 0m
+    labels:
+      severity: critical
+    annotations:
+      summary: Blackbox probe HTTP failure (instance {{ '{{' }} $labels.instance {{ '}}' }})
+      description: "HTTP status code is not 200-399\n VALUE = {{ '{{' }} $value {{ '}}' }}\n LABELS = {{ '{{' }} $labels {{ '}}' }}"
+
+  - alert: BlackboxProbeSlowHttp
+    expr: avg_over_time(probe_http_duration_seconds[1m]) > 1
+    for: 1m
+    labels:
+      severity: warning
+    annotations:
+      summary: Blackbox probe slow HTTP (instance {{ '{{' }} $labels.instance {{ '}}' }})
+      description: "HTTP request took more than 1s\n VALUE = {{ '{{' }} $value {{ '}}' }}\n LABELS = {{ '{{' }} $labels {{ '}}' }}"
--
cgit v1.2.3