various fixes
[distro-setup] / filesystem / etc / prometheus / rules / iank.yml
index 75b5cbcfc760925b79d51fd6c3262de7a6186a97..40fc4040c11efc719a9b164b447c117da141b2d2 100644 (file)
@@ -85,11 +85,19 @@ groups:
       severity: warn
 
   - alert: sysd_result_fail
+    # Not sure the 30m window is really needed; presumably it keeps the
+    # alert from flapping.
     expr: |-
       rate(node_systemd_unit_result_fail_count[30m]) > 0
     labels:
       severity: day
 
+  - alert: exim_paniclog
+    expr: |-
+      exim_paniclog > 0
+    labels:
+      severity: warn
+
   - alert: mailtest_check_vps
     expr: |-
       time() - mailtest_check_last_usec{job="tlsnode"} >= 60 * 12