---
# PrometheusRule defining availability alerts for the workloads in the
# `matrix` namespace: the Tuwunel Matrix homeserver and Sol.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  name: tuwunel-alerts
  namespace: matrix
  labels:
    # NOTE(review): presumably these labels are what the Prometheus
    # operator's rule selector matches on — confirm against the
    # kube-prometheus-stack values in use.
    role: alert-rules
    release: kube-prometheus-stack
spec:
  groups:
    - name: tuwunel
      rules:
        # Critical: the `tuwunel` Deployment has reported zero available
        # replicas for 2 minutes.
        # NOTE(review): the comparison returns no series when the metric
        # itself is missing, so this alert stays silent in that case;
        # consider an `absent(...)` companion if that matters here.
        # NOTE(review): the description says alertbot delivery is affected
        # when Tuwunel is down — confirm this alert is also routed through
        # a receiver that does not depend on Matrix.
        - alert: TuwunelDown
          expr: |
            kube_deployment_status_replicas_available{namespace="matrix", deployment="tuwunel"} == 0
          for: 2m
          labels:
            severity: critical
          annotations:
            summary: "Matrix homeserver (Tuwunel) is down"
            description: "Tuwunel is down — Matrix messaging, alertbot delivery, and Sol are all affected."

        # Warning: the `sol` Deployment has reported zero available
        # replicas for 5 minutes.
        - alert: SolDown
          expr: |
            kube_deployment_status_replicas_available{namespace="matrix", deployment="sol"} == 0
          for: 5m
          labels:
            severity: warning
          annotations:
            summary: "Sol is down"
            description: "Sol virtual librarian is not running."