# sbbb/base/media/livekit-alertrules.yaml
#
# PrometheusRule (monitoring.coreos.com/v1) that declares the alerting rules
# for LiveKit in the `media` namespace. All rules live in the single rule
# group `livekit`.
---
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  name: livekit-alerts
  namespace: media
  labels:
    # NOTE(review): presumably these labels are what the Prometheus
    # ruleSelector matches on to load this rule — confirm against the
    # Prometheus resource of the monitoring stack.
    role: alert-rules
    release: kube-prometheus-stack
spec:
  groups:
    - name: livekit
      rules:
        # Critical alert: a scrape target whose `job` label contains "livekit"
        # has reported `up == 0` continuously for 2 minutes.
        # NOTE(review): `up == 0` returns no series when the target is missing
        # from scraping altogether, so that situation does not trigger this
        # rule — confirm whether a separate absence alert is wanted.
        - alert: LiveKitDown
          annotations:
            description: 'LiveKit instance {{ $labels.namespace }}/{{ $labels.pod }} is down.'
            summary: 'LiveKit is down'
          labels:
            severity: critical
          for: 2m
          expr: 'up{job=~".*livekit.*"} == 0'

        # Warning alert: the per-second rate of `livekit_nack_total` (5m window),
        # summed over every series, has stayed above 100 for 5 minutes.
        # Because of the `sum()`, the firing alert carries no per-instance
        # labels; only the aggregate value is available to the annotations.
        - alert: LiveKitHighNACKRate
          expr: sum(rate(livekit_nack_total[5m])) > 100
          for: 5m
          labels:
            severity: warning
          annotations:
            summary: "LiveKit NACK rate is high"
            # Format the value to one decimal place: a bare `$value` renders the
            # full float (e.g. 134.56666666666666) in the notification text.
            # Folded block scalar so the double quotes inside the template need
            # no YAML escaping; `>-` keeps the text on one line without a
            # trailing newline.
            description: >-
              LiveKit NACK rate is {{ printf "%.1f" $value }}/s,
              indicating potential media quality issues.