From: Tom Hughes
Date: Thu, 6 Apr 2023 20:27:48 +0000 (+0100)
Subject: Alert for RAID batteries that have been recharging for too long
X-Git-Url: https://git.openstreetmap.org./chef.git/commitdiff_plain/b602bd1e89b1d4de6f776db8a23a3ae778b2edbe?ds=sidebyside

Alert for RAID batteries that have been recharging for too long
---

diff --git a/cookbooks/prometheus/templates/default/alert_rules.yml.erb b/cookbooks/prometheus/templates/default/alert_rules.yml.erb
index 8f2986e6a..9a3c52920 100644
--- a/cookbooks/prometheus/templates/default/alert_rules.yml.erb
+++ b/cookbooks/prometheus/templates/default/alert_rules.yml.erb
@@ -558,6 +558,11 @@ groups:
         for: 5m
         labels:
           alertgroup: "{{ $labels.instance }}"
+      - alert: raid controller battery recharging
+        expr: ohai_controller_info{battery_status="recharging"} > 0
+        for: 4h
+        labels:
+          alertgroup: "{{ $labels.instance }}"
       - alert: raid array degraded
         expr: ohai_array_info{status="degraded"} > 0
         for: 5m