summaryrefslogtreecommitdiff
path: root/inventory/group_vars/promzone-chaos-at-home/vars.yml
blob: b8b785e3a231f48d93c7748cb536eba918567d64 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
---
# "address:port" string built from the address part of network.primary.address
# and the fixed port 9999.
# NOTE(review): presumably the endpoint the Prometheus server scrapes on each
# host in this zone - confirm against the consuming role.
prometheus_scrape_endpoint: "{{ network.primary.address | ansible.utils.ipaddr('address') }}:9999"

# Exporter selection for this zone: no extra exporters are set at this level,
# and "node" is the only default exporter.
# NOTE(review): presumably hosts or sub-groups override
# prometheus_exporters_extra to add more - confirm.
prometheus_exporters_extra: []
prometheus_exporters_default:
  - node

# Pinned versions of the individual Prometheus exporters.
# The values are quoted so they always load as strings: a future two-component
# version such as 1.10 would otherwise be parsed as the float 1.1.
prometheus_exporter_node_version: "1.8.1"
prometheus_exporter_ipmi_version: "1.8.0"
prometheus_exporter_ssl_version: "2.4.3"
prometheus_exporter_blackbox_version: "0.25.0"
prometheus_exporter_nut_version: "3.1.1"
prometheus_exporter_smokeping_version: "0.8.1"
prometheus_exporter_bind_version: "0.7.0"
prometheus_exporter_chrony_version: "0.10.0"
# Boolean flag for the chrony exporter, written as canonical true instead of
# the YAML 1.1 truthy literal "yes" (same loaded value).
prometheus_exporter_chrony_disable_dns_lookups: true
prometheus_exporter_mosquitto_version: "0.7.2"

# Pinned versions of the Prometheus server and the Alertmanager.
prometheus_server_version: "2.52.0"
prometheus_alertmanager_version: "0.27.0"

# Name of the Prometheus server for this zone.
# NOTE(review): presumably an inventory hostname - confirm.
prometheus_server: ch-mon
# Jobs enabled on the server. The nut/ups entry is commented out, i.e.
# currently disabled.
# NOTE(review): entries of the form "<job>/<sub>" look like sub-jobs of the
# job before the slash - confirm against the consuming role.
prometheus_server_jobs:
  - node
  - openwrt
  - chrony
  - nut
#  - nut/ups
  - blackbox
  - blackbox/probe
  - ipmi
  - ssl
  - ssl/probe
  - smokeping
  - bind
  - standalone-kubelet
  - whawty-nginx-sso
  - mosquitto

# Name of this Prometheus zone.
prometheus_zone_name: chaos@home

## TODO:
## potential extra alert rule: (bind_zone_serial{instance="ch-mimas"} == bool on(job, view, zone_name) bind_zone_serial{instance="ch-pan"}) != 1


# Additional Prometheus alerting rules for the whawty-nginx-sso job.
#
# The Jinja string expressions that evaluate to literal double curly braces
# make Ansible emit Prometheus' own template delimiters, so $labels and $value
# are left for Prometheus to expand rather than being templated by Ansible.
prometheus_server_rules_whawty_nginx_sso_extra:
  # Fires when whawty_auth_store_sync_run lies more than 3600 seconds (one
  # hour) before the current time. "for: 0m" means there is no pending period.
  - alert: WhawtyAuthStoreSyncTooLongAgo
    expr: time() - whawty_auth_store_sync_run > 3600
    for: 0m
    labels:
      severity: warning
    annotations:
      summary: "The last whawty-auth store sync was too long ago (instance {{ '{{' }} $labels.instance {{ '}}' }})"
      description: "The last whawty-auth store sync of {{ '{{' }} $labels.name {{ '}}' }} on {{ '{{' }} $labels.instance {{ '}}' }} ran more than an hour ago.\n  VALUE = {{ '{{' }} $value {{ '}}' }}\n  LABELS = {{ '{{' }} $labels {{ '}}' }}"

  # Fires when whawty_auth_store_sync_exit_code is non-zero, again without a
  # pending period.
  - alert: WhawtyAuthStoreSyncFailed
    expr: whawty_auth_store_sync_exit_code != 0
    for: 0m
    labels:
      severity: warning
    annotations:
      summary: "The last whawty-auth sync failed (instance {{ '{{' }} $labels.instance {{ '}}' }})"
      description: "The last whawty-auth store sync of {{ '{{' }} $labels.name {{ '}}' }} on {{ '{{' }} $labels.instance {{ '}}' }} has failed.\n  VALUE = {{ '{{' }} $value {{ '}}' }}\n  LABELS = {{ '{{' }} $labels {{ '}}' }}"