---
# Alerting rule groups for org "fux": generic, SNMP and DHCP checks.
groups:
- name: Fux-Generic
  # Checks applied to every series selected with org="fux".
  rules:
  # Fires when `up` changed value more than 7 times within the last 24h for
  # an instance/job pair. `for: 0m` means there is no pending period.
  - alert: HostJobFlaky
    expr: 'group by(instance, job) (changes(up{org="fux"}[24h]) > 7)'
    for: 0m
    labels:
      severity: info
      org: fux
    annotations:
      summary: 'Job {{ $labels.job }} flaky on (instance {{ $labels.instance }})'
      description: >-
        The job {{ $labels.job }} on target: {{ $labels.instance }} has been
        flaky over the last 24 hours.
  # Fires when `probe_success` stays at 0 for one minute; the result is
  # grouped by instance, job and ip.
  - alert: ProbeFailed
    expr: 'group by(instance, job, ip) (probe_success{org="fux"} == 0)'
    for: 1m
    labels:
      severity: critical
      org: fux
    annotations:
      summary: 'Probe failed for {{ $labels.instance }} (job: {{ $labels.job }})'
      description: >-
        The Probe: {{ $labels.job }} can not complete its job for
        {{ $labels.instance }}, this most likely means that the instance is
        unreachable.
- name: Fux-SNMP
  rules:
  # Fires when `up` has been 0 for 15 minutes on any org="fux" job whose
  # name contains "snmp".
  - alert: SnmpTargetMissing
    expr: up{job=~".*snmp.*", org="fux"} == 0
    for: 15m
    labels:
      severity: critical
      org: fux
    annotations:
      summary: SNMP target missing (instance {{ $labels.instance }})
      description: "SNMP target: {{ $labels.instance }} has disappeared for more than 15 min."
- name: Fux-DHCP
  # Both alerts fire when the named check script has reported
  # script_success == 0 for two minutes.
  # NOTE(review): unlike the other groups, these alerts set no `org` label;
  # confirm whether alert routing depends on it.
  rules:
  - alert: DhcpFuxSharedFailed
    expr: script_success{script="check_dhcp_fux_shared"} == 0
    for: 2m
    labels:
      severity: critical
    annotations:
      summary: DHCP for Fux Shared stopped working
      # The trailing " \n V" fragment was dropped: it looked like a truncated
      # template remnant and rendered as a stray second line.
      description: "No DHCP lease for the Fux Shared range was received"
  - alert: DhcpFuxAdminFailed
    # Select the series by its `script` label, the same way the Shared rule
    # does; matching on a `script_success` label would select nothing.
    expr: script_success{script="check_dhcp_fux_admin"} == 0
    for: 2m
    labels:
      severity: critical
    annotations:
      summary: DHCP for Fux Admin stopped working
      description: "No DHCP lease for the Fux Admin range was received"