summary | refs | log | tree | commit | diff | stats
path: root/Prometheus/alerts/tripsit
diff options
context:
space:
mode:
Diffstat (limited to 'Prometheus/alerts/tripsit')
-rw-r--r-- Prometheus/alerts/tripsit/blackbox.yml 21
-rw-r--r-- Prometheus/alerts/tripsit/node_exporters.yml 13
2 files changed, 34 insertions, 0 deletions
diff --git a/Prometheus/alerts/tripsit/blackbox.yml b/Prometheus/alerts/tripsit/blackbox.yml
new file mode 100644
index 0000000..0390718
--- /dev/null
+++ b/Prometheus/alerts/tripsit/blackbox.yml
@@ -0,0 +1,21 @@
+groups:  # Availability alerts driven by blackbox probe results (probe_success).
+- name: tripsit-blackbox_exporters
+  rules:  # =~ is fully anchored; dots are escaped (\\.) so they match a literal "." only
+  - alert: TRIPSIT.ME-WEB-INCIDENT  # critical: any listed tripsit.me URL fails its probe
+    expr: 'probe_success{instance=~"https://tripsit\\.me|https://chat\\.tripsit\\.me|https://chat\\.tripsit\\.me/chat|https://drugs\\.tripsit\\.me|https://benzo\\.tripsit\\.me|https://dxm\\.tripsit\\.me|https://combo\\.tripsit\\.me|https://wiki\\.tripsit\\.me|https://tripbot\\.tripsit\\.me"} == 0'
+    for: 15s  # keep in sync with the duration quoted in the description
+    labels:
+      severity: critical
+      project: TRIPSIT
+    annotations:
+      title: Endpoint {{ $labels.instance }} is down
+      description: Probe ({{ $labels.job }}) of {{ $labels.instance }} has been failing for more than 15 seconds. Endpoint seems down.
+  - alert: TRIPSIT.DEV-WEB-INCIDENT  # warning: any listed tripsit.dev URL fails its probe
+    expr: 'probe_success{instance=~"https://mail\\.tripsit\\.dev|https://dopamine\\.tripsit\\.dev"} == 0'
+    for: 1m  # keep in sync with the duration quoted in the description
+    labels:
+      severity: warning
+      project: TRIPSIT
+    annotations:
+      title: Endpoint {{ $labels.instance }} is down
+      description: Probe ({{ $labels.job }}) of {{ $labels.instance }} has been failing for more than 1 minute. Endpoint seems down.
diff --git a/Prometheus/alerts/tripsit/node_exporters.yml b/Prometheus/alerts/tripsit/node_exporters.yml
new file mode 100644
index 0000000..ee82367
--- /dev/null
+++ b/Prometheus/alerts/tripsit/node_exporters.yml
@@ -0,0 +1,13 @@
+groups:  # Host alerts based on scrape health (the `up` metric) of node_exporters targets.
+- name: tripsit-node_exporters
+  rules:
+  - alert: TRIPSIT-NODE-INCIDENT  # fires when a TRIPSIT node_exporters target reports up == 0
+    expr: 'up{project="TRIPSIT", job="node_exporters"} == 0'
+    for: 30s  # keep in sync with the duration quoted in the description
+    labels:
+      severity: warning
+      job: node_exporters
+      project: TRIPSIT
+    annotations:
+      title: Node {{ $labels.instance }} is down
+      description: Failed to scrape {{ $labels.job }} on {{ $labels.instance}} for more than 30 seconds. Node seems down.