git.openstreetmap.org Git - chef.git/commitdiff
Add alerts for equinix uplink interfaces
author Tom Hughes <tom@compton.nu>
Wed, 18 Dec 2024 09:10:26 +0000 (09:10 +0000)
committer Tom Hughes <tom@compton.nu>
Wed, 18 Dec 2024 09:10:26 +0000 (09:10 +0000)
cookbooks/prometheus/templates/default/alert_rules.yml.erb

index 6751fe74423f2b386e78dd82176cc0c400c19d2a..305afbd903a44e3745ce3d3eb5dc62d51895a2b7 100644 (file)
@@ -3,13 +3,20 @@
 groups:
   - name: amsterdam
     rules:
-      - alert: uplink
+      - alert: he uplink
         expr: junos_interface_up{site="amsterdam",name=~"ge-[01]/2/2"} != 1
         for: 6m
         labels:
           alertgroup: "amsterdam"
         annotations:
           status: "{{ $value }}"
+      - alert: equinix uplink
+        expr: junos_interface_up{site="amsterdam",name=~"xe-[01]/2/0"} != 1
+        for: 6m
+        labels:
+          alertgroup: "amsterdam"
+        annotations:
+          status: "{{ $value }}"
       - alert: pdu current draw
         expr: rPDU2PhaseStatusCurrent{site="amsterdam",rPDU2PhaseStatusIndex="1"} / 10 > 28
         for: 6m
@@ -130,13 +137,20 @@ groups:
           failure_rate: "{{ $value }} jobs/s"
   - name: dublin
     rules:
-      - alert: uplink
+      - alert: he uplink
         expr: junos_interface_up{site="dublin",name=~"ge-[01]/2/2"} != 1
         for: 6m
         labels:
           alertgroup: "dublin"
         annotations:
           status: "{{ $value }}"
+      - alert: equinix uplink
+        expr: junos_interface_up{site="dublin",name=~"xe-[01]/2/0"} != 1
+        for: 6m
+        labels:
+          alertgroup: "dublin"
+        annotations:
+          status: "{{ $value }}"
       - alert: pdu current draw
         expr: rPDU2PhaseStatusCurrent{site="dublin",rPDU2PhaseStatusIndex="1"} / 10 > 28
         for: 6m