Some checks failed
/ Ansible Lint (push) Failing after 49s
so that service restarts don't create an alert
41 lines
1.5 KiB
YAML
41 lines
1.5 KiB
YAML
groups:
# Generic rules evaluated against the `up` series labelled org="fux".
- name: Fux-Generic
  rules:
  # Informational alert: the `up` value of an (instance, job) pair changed
  # more than 7 times within the trailing 24h window. `for: 0m` means the
  # alert fires on the first evaluation where the expression matches.
  - alert: HostJobFlaky
    expr: 'group by(instance, job) (changes(up{org="fux"}[24h]) > 7)'
    for: 0m
    labels:
      severity: info
      org: fux
    annotations:
      summary: 'Job {{ $labels.job }} flaky on (instance {{ $labels.instance }})'
      description: >-
        The job {{ $labels.job }} on target: {{ $labels.instance }} has been
        flaky over the last 24 hours.
# SNMP reachability rules for targets labelled org="fux".
- name: Fux-SNMP
  rules:
  # Critical alert: a target of any job whose name contains "snmp" has
  # reported up == 0 continuously for 15 minutes.
  - alert: SnmpTargetMissing
    expr: 'up{job=~".*snmp.*", org="fux"} == 0'
    for: 15m
    labels:
      severity: critical
      org: fux
    annotations:
      summary: 'SNMP target missing (instance {{ $labels.instance }})'
      description: "SNMP target: {{ $labels.instance }} has disappeared for more than 15 min."
# DHCP health rules. Each rule watches the `script_success` series of one
# check script and fires once it has been 0 for 2 minutes.
# NOTE(review): unlike the other groups in this file, these rules set no
# `org` label - confirm whether alert routing depends on it.
- name: Fux-DHCP
  rules:
  # Critical alert: the check_dhcp_fux_shared script reports failure.
  - alert: DhcpFuxSharedFailed
    expr: 'script_success{script="check_dhcp_fux_shared"} == 0'
    for: 2m
    labels:
      severity: critical
    annotations:
      summary: DHCP for Fux Shared stopped working
      description: "No DHCP lease for the Fux Shared range was received"
  # Critical alert: the check_dhcp_fux_admin script reports failure.
  - alert: DhcpFuxAdminFailed
    # The series is selected by its `script` label, the same label the
    # DhcpFuxSharedFailed rule matches on.
    expr: 'script_success{script="check_dhcp_fux_admin"} == 0'
    for: 2m
    labels:
      severity: critical
    annotations:
      summary: DHCP for Fux Admin stopped working
      description: "No DHCP lease for the Fux Admin range was received"