iankelling.org
/
git
/
distro-setup
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
big fix switch-mail-host plus minor improvements
[distro-setup]
/
filesystem
/
etc
/
prometheus
/
rules
/
iank.yml
diff --git a/filesystem/etc/prometheus/rules/iank.yml b/filesystem/etc/prometheus/rules/iank.yml
index f64322b2c98ef4f48755daec9fe81f185b8c9488..47012ccbcb74b20f517f825d1cc327fd70fe2c0d 100644
(file)
--- a/filesystem/etc/prometheus/rules/iank.yml
+++ b/filesystem/etc/prometheus/rules/iank.yml
@@ -199,7 +199,7 @@ groups:
# 19 for 19 minutes, but I make it 18 just to give a bit of slack.
- alert: historical_missing_metric
expr: |-
# 19 for 19 minutes, but I make it 18 just to give a bit of slack.
- alert: historical_missing_metric
expr: |-
- count_over_time(up{job="prometheus"}[19m]) <= 18 unless on() present_over_time(ALERTS[19m]) unless on() time() - node_boot_time_seconds{instance="kdwg:9101"} <= 60 * 17
+ count_over_time(up{job="prometheus"}[19m]) <= 18 unless on() present_over_time(ALERTS[19m]) unless on() time() - node_boot_time_seconds{instance="kd"} <= 60 * 17
labels:
severity: warn
labels:
severity: warn
@@ -274,7 +274,7 @@ groups:
description: "A Prometheus job has disappeared\n VALUE = {{ $value }}"
- alert: lowpri_target_down
description: "A Prometheus job has disappeared\n VALUE = {{ $value }}"
- alert: lowpri_target_down
- expr: up{instance!~"kdwg:9101|bkex.b8.nz:9101|liex.b8.nz:9101|10.2.0.1:9100"} == 0
+ expr: up{instance!~"kdwg:9101|bkex.b8.nz:9101|liex.b8.nz:9101|10.2.0.1:9100|kwwg:9101"} == 0
for: 30m
labels:
severity: warn
for: 30m
labels:
severity: warn