# Patch for rules/md.yml (alerting rules built on the node_md_* metrics).
#
# What this hunk changes:
#   * First alert in the hunk (its `alert:` name lies above the hunk; the
#     expression is node_md_state{state="inactive"} > 0):
#       severity label  error   -> page
#   * HostRaidDiskFailure:
#       expr selector   node_md_disks{state="fail"} -> node_md_disks{state="failed"}
#       severity label  warning -> page
#   All `for:` durations and annotation strings are unchanged context.
#
# NOTE(review): the hunk header declares 16 lines on each side, yet the patch
#   text below sits on a single physical line. Line breaks and leading
#   whitespace appear to have been lost -- restore them from the original
#   patch before attempting to apply it.
# NOTE(review): the first alert's description interpolates
#   {{ $labels.device }}, whereas HostRaidDiskFailure's description
#   interpolates {{ $labels.md_device }}. Confirm which label node_md_disks
#   actually exposes; if the label is missing, the array name will not be
#   filled in in the notification text.
# NOTE(review): the first alert matches state="inactive" while its description
#   says "degraded state" -- confirm the wording is intended.
# NOTE(review): both alerts now carry severity "page"; presumably the
#   Alertmanager routing tree has a matching route -- verify.
diff --git a/rules/md.yml b/rules/md.yml index cea819f..6f6a208 100644 --- a/rules/md.yml +++ b/rules/md.yml @@ -15,16 +15,16 @@ groups: expr: node_md_state{state="inactive"} > 0 for: 5m labels: - severity: error + severity: page annotations: summary: "Host RAID array got inactive (instance {{ $labels.instance }})" description: "RAID array {{ $labels.device }} is in degraded state due to one or more disks failures. Number of spare drives is insufficient to fix issue automatically.\n VALUE = {{ $value }}\n LABELS: {{ $labels }}" - alert: HostRaidDiskFailure - expr: node_md_disks{state="fail"} > 0 + expr: node_md_disks{state="failed"} > 0 for: 5m labels: - severity: warning + severity: page annotations: summary: "Host RAID disk failure (instance {{ $labels.instance }})" description: "At least one device in RAID array on {{ $labels.instance }} failed. Array {{ $labels.md_device }} needs attention and possibly a disk swap\n VALUE = {{ $value }}\n LABELS: {{ $labels }}"