Make Prometheus Alert Rules Work Better and Organize Them Better #19
1 changed file with 2 additions and 2 deletions
|
@@ -166,7 +166,7 @@ groups:
|
|||
# Longer intervals to account for disk intensive hypervisor tasks (backups, moving VMs, etc.).
|
||||
- alert: HypervisorHostUnusualDiskReadRate
|
||||
expr: (sum by (instance) (rate(node_disk_read_bytes_total[2m])) / 1024 / 1024 > 50) * on(instance) group_left (nodename) node_uname_info{nodename="chaosknoten"}
|
||||
for: 30m
|
||||
for: 60m
|
||||
labels:
|
||||
severity: warning
|
||||
annotations:
|
||||
|
@@ -174,7 +174,7 @@ groups:
|
|||
description: "Disk is probably reading too much data (> 50 MB/s)\n VALUE = {{ $value }}"
|
||||
- alert: HypervisorHostUnusualDiskWriteRate
|
||||
expr: (sum by (instance) (rate(node_disk_written_bytes_total[2m])) / 1024 / 1024 > 50) * on(instance) group_left (nodename) node_uname_info{nodename="chaosknoten"}
|
||||
for: 20m
|
||||
for: 60m
|
||||
labels:
|
||||
severity: warning
|
||||
annotations:
|
||||
|
|
Loading…
Add table
Reference in a new issue