# Patch for salt/files/prometheus/alerts/raid.yml -- one hunk, 6 old lines -> 26 new lines.
# After the `for: 0m` of the rule that precedes the hunk, it adds that rule's own
# labels/annotations (inactive-array wording) and then inserts a new alert,
# "RAID Array Degraded", which is positive when node_md_disks_required exceeds
# node_md_disks{state="active"} for the same (device, instance) pair.
# The three trailing context lines follow the new alert's `for: 0m`.
# NOTE(review): indentation inside the hunk was reconstructed (2-space YAML,
# indented sequences) -- confirm against the target file before applying.
diff --git a/salt/files/prometheus/alerts/raid.yml b/salt/files/prometheus/alerts/raid.yml
index 20b27794..c68c73e7 100644
--- a/salt/files/prometheus/alerts/raid.yml
+++ b/salt/files/prometheus/alerts/raid.yml
@@ -17,6 +17,26 @@ groups:
           group_left (nodename)
           node_uname_info{nodename=~".+"}
         for: 0m
+        labels:
+          severity: critical
+        annotations:
+          summary: >-
+            Inactive RAID array on {{ $labels.instance }}
+          description: |
+            RAID array {{ $labels.device }} on {{ $labels.instance }} is in an inactive state.
+            VALUE = {{ $value }}
+            LABELS = {{ $labels }}
+
+      - alert: RAID Array Degraded
+        expr: >-
+          (
+            (
+              node_md_disks_required - on(device, instance)
+              node_md_disks{state="active"}
+            )
+            > 0
+          )
+        for: 0m
         labels:
           severity: critical
         annotations: