Compare commits

..

1 commit

Author SHA1 Message Date
83b1f2cba9
grafana: make alerts better for fux
Some checks failed
/ Ansible Lint (push) Has been cancelled
/ Ansible Lint (pull_request) Failing after 47s
2025-09-09 18:44:50 +02:00

View file

@ -1,5 +1,5 @@
groups:
- name: Generic
- name: Fux-Generic
rules:
- alert: HostJobFlaky
expr: group by(host, job) (changes(up{org="fux", job!="integrations/unix"}[24h]) > 5)
@ -8,8 +8,8 @@ groups:
severity: info
annotations:
summary: Job {{ $labels.job }} flaky on (host {{ $labels.instance }})
description: "The job {{ $labels.job }} on target: {{ labels.host }} has been flaky over the last 24 hours.\n VALUE = {{ $value }}"
- name: SNMP
description: "The job {{ $labels.job }} on target: {{ $labels.host }} has been flaky over the last 24 hours.\n VALUE = {{ $value }}"
- name: Fux-SNMP
rules:
- alert: SnmpTargetMissing
expr: up{job=~".*snmp|SNMP.*"} == 0
@ -19,7 +19,7 @@ groups:
annotations:
summary: SNMP target missing (instance {{ $labels.instance }})
description: "A SNMP target has disappeared for more than 15 min.\n VALUE = {{ $value }}"
- name: DHCP
- name: Fux-DHCP
rules:
- alert: DhcpFuxSharedFailed
expr: script_success{script="check_dhcp_fux_shared"} == 0