---
# Prometheus alerting rules for targets labelled org="fux".
# Three rule groups: generic scrape health, SNMP target availability,
# and DHCP probe-script results.
groups:
  - name: Fux-Generic
    rules:
      # Fires as soon as (for: 0m) the `up` series of a target has changed
      # value more than 7 times within the last 24 hours.
      - alert: HostJobFlaky
        # `group by(instance, job)` keeps only those two labels on the
        # result, so `org` is re-attached through `labels` below.
        expr: group by(instance, job) (changes(up{org="fux"}[24h]) > 7)
        for: 0m
        labels:
          severity: info
          org: fux
        annotations:
          summary: "Job {{ $labels.job }} flaky on (instance {{ $labels.instance }})"
          description: "The job {{ $labels.job }} on target: {{ $labels.instance }} has been flaky over the last 24 hours."

  - name: Fux-SNMP
    rules:
      # Fires when any job whose name contains "snmp" has reported
      # up == 0 continuously for 15 minutes.
      - alert: SnmpTargetMissing
        expr: up{job=~".*snmp.*", org="fux"} == 0
        for: 15m
        labels:
          severity: critical
          org: fux
        annotations:
          summary: "SNMP target missing (instance {{ $labels.instance }})"
          description: "SNMP target: {{ $labels.instance }} has disappeared for more than 15 min."

  - name: Fux-DHCP
    rules:
      # Both rules fire when the named check script has reported
      # script_success == 0 for 2 minutes.
      # NOTE(review): unlike the groups above, these alerts carry no
      # `org: fux` label - confirm whether alert routing relies on it.
      - alert: DhcpFuxSharedFailed
        expr: script_success{script="check_dhcp_fux_shared"} == 0
        for: 2m
        labels:
          severity: critical
        annotations:
          summary: "DHCP for Fux Shared stopped working"
          description: "No DHCP lease for the Fux Shared range was received"

      - alert: DhcpFuxAdminFailed
        # The script is selected via the `script` label, same as the
        # Shared rule above (the matcher previously used the metric name
        # as the label name and therefore could not select the series).
        expr: script_success{script="check_dhcp_fux_admin"} == 0
        for: 2m
        labels:
          severity: critical
        annotations:
          summary: "DHCP for Fux Admin stopped working"
          description: "No DHCP lease for the Fux Admin range was received"