X-Git-Url: https://git.openstreetmap.org./chef.git/blobdiff_plain/bbbe7474976e33c5471f7ecdabd4cf2a44c25ee2..50aea11082eaa90bd37593b9c987d38a082f4e1b:/cookbooks/prometheus/templates/default/alert_rules.yml.erb

Adds two Prometheus alert groups to the alert rules template:

  * load: alert "load average" fires when sum(node_load5) divided by
    count(node_cpu_frequency_max_hertz), both grouped by instance, stays
    above 2 for 5m. The ratio is reported through the "load" annotation,
    formatted with humanizePercentage.
  * resolved: alert "dnssec validation failures" fires when the 1m rate of
    resolved_dnssec_verdicts_total{result="bogus"} stays above 1 for 5m.

NOTE(review): the line breaks and YAML indentation below were reconstructed
from a copy of this patch that had been collapsed onto a single line. The
2-space, indented-sequence layout is an assumption; confirm it against the
repository before applying.

diff --git a/cookbooks/prometheus/templates/default/alert_rules.yml.erb b/cookbooks/prometheus/templates/default/alert_rules.yml.erb
index b78bbaddd..6751fe744 100644
--- a/cookbooks/prometheus/templates/default/alert_rules.yml.erb
+++ b/cookbooks/prometheus/templates/default/alert_rules.yml.erb
@@ -331,6 +331,15 @@ groups:
           alertgroup: "{{ $labels.site }}"
         annotations:
           power: "{{ $value }} dBm"
+  - name: load
+    rules:
+      - alert: load average
+        expr: sum(node_load5) by (instance) / count(node_cpu_frequency_max_hertz) by (instance) > 2
+        for: 5m
+        labels:
+          alertgroup: "{{ $labels.instance }}"
+        annotations:
+          load: "{{ $value | humanizePercentage }}"
   - name: mail
     rules:
       - alert: exim down
@@ -660,6 +669,13 @@ groups:
           alertgroup: "{{ $labels.instance }}"
         annotations:
           new_errors: "{{ $value }}"
+  - name: resolved
+    rules:
+      - alert: dnssec validation failures
+        expr: rate(resolved_dnssec_verdicts_total{result="bogus"}[1m]) > 1
+        for: 5m
+        labels:
+          alertgroup: "{{ $labels.instance }}"
   - name: smart
     rules:
       - alert: smart failure