summary refs log tree commit diff
path: root/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml
diff options
context:
space:
mode:
Diffstat (limited to 'roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml')
-rw-r--r-- roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml 19
1 files changed, 18 insertions, 1 deletions
diff --git a/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml b/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml
index cfdc10bd..140e3b4f 100644
--- a/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml
+++ b/roles/monitoring/prometheus/server/defaults/main/rules_blackbox__https.yml
@@ -1,3 +1,20 @@
---
prometheus_server_rules_blackbox__https_extra: []
-prometheus_server_rules_blackbox__https: []
+prometheus_server_rules_blackbox__https:  # default alert rules (this list was empty before this change)
+  - alert: BlackboxProbeHttpFailure  # probed HTTP status code is outside 200-399
+    expr: probe_http_status_code <= 199 OR probe_http_status_code >= 400
+    for: 0m  # no pending period: fires on the first matching evaluation
+    labels:
+      severity: critical
+    annotations:  # {{ '{{' }} and {{ '}}' }} yield literal braces when rendered by Jinja2
+      summary: Blackbox probe HTTP failure (instance {{ '{{' }} $labels.instance {{ '}}' }})
+      description: "HTTP status code is not 200-399\n VALUE = {{ '{{' }} $value {{ '}}' }}\n LABELS = {{ '{{' }} $labels {{ '}}' }}"
+
+  - alert: BlackboxProbeSlowHttp  # 1-minute average of the HTTP probe duration exceeds 1s
+    expr: avg_over_time(probe_http_duration_seconds[1m]) > 1
+    for: 1m  # the condition must hold for 1 minute before the alert fires
+    labels:
+      severity: warning
+    annotations:  # {{ '{{' }} and {{ '}}' }} yield literal braces when rendered by Jinja2
+      summary: Blackbox probe slow HTTP (instance {{ '{{' }} $labels.instance {{ '}}' }})
+      description: "HTTP request took more than 1s\n VALUE = {{ '{{' }} $value {{ '}}' }}\n LABELS = {{ '{{' }} $labels {{ '}}' }}"