From: Tom Hughes
Date: Thu, 21 Jul 2022 23:30:17 +0000 (+0100)
Subject: Reduce sensitivity of alert for wireguard interface transmit errors
X-Git-Url: https://git.openstreetmap.org./chef.git/commitdiff_plain/4db790494ec42b0f418c28b7dde4c6dda99e7715

Reduce sensitivity of alert for wireguard interface transmit errors
---

diff --git a/cookbooks/prometheus/templates/default/alert_rules.yml.erb b/cookbooks/prometheus/templates/default/alert_rules.yml.erb
index 94a2323d3..78f72e2a1 100644
--- a/cookbooks/prometheus/templates/default/alert_rules.yml.erb
+++ b/cookbooks/prometheus/templates/default/alert_rules.yml.erb
@@ -311,12 +311,19 @@ groups:
         annotations:
           bandwidth_used: "{{ $value | humanizePercentage }}"
       - alert: interface transmit errors
-        expr: rate(node_network_transmit_errs_total[1m]) / rate(node_network_transmit_packets_total[1m]) > 0.01
+        expr: rate(node_network_transmit_errs_total{device!~"wg.*"}[1m]) / rate(node_network_transmit_packets_total{device!~"wg.*"}[1m]) > 0.01
         for: 5m
         labels:
           alertgroup: "{{ $labels.instance }}"
         annotations:
           error_rate: "{{ $value | humanizePercentage }}"
+      - alert: interface transmit errors
+        expr: rate(node_network_transmit_errs_total{device=~"wg.*"}[1m]) / rate(node_network_transmit_packets_total{device=~"wg.*"}[1m]) > 0.05
+        for: 1h
+        labels:
+          alertgroup: "{{ $labels.instance }}"
+        annotations:
+          error_rate: "{{ $value | humanizePercentage }}"
       - alert: interface receive errors
         expr: rate(node_network_receive_errs_total[1m]) / rate(node_network_receive_packets_total[1m]) > 0.01
         for: 5m