diff --git a/argo/cluster/monitoring/kube-prometheus-stack/chart/rules/misc.yaml b/argo/cluster/monitoring/kube-prometheus-stack/chart/rules/misc.yaml
index 14a8b14c5..5918d3c59 100644
--- a/argo/cluster/monitoring/kube-prometheus-stack/chart/rules/misc.yaml
+++ b/argo/cluster/monitoring/kube-prometheus-stack/chart/rules/misc.yaml
@@ -4,6 +4,15 @@ metadata:
   name: misc
 spec:
   groups:
+    - name: longhorn  # Rule group holding the Longhorn backup alert.
+      rules:
+        - alert: BackupFailed  # One alert instance per (backup, volume) pair.
+          # Counts series whose longhorn_backup_state is above 3, grouped by backup and volume. NOTE(review): presumably 4=Error and 5=Unknown per the Longhorn metrics reference - confirm.
+          expr: count by (backup, volume) (longhorn_backup_state > 3) > 0
+          for: 1m  # The expression must stay true for one minute before the alert fires.
+          labels:
+            severity: critical
+          annotations:
+            summary: Backup {{ $labels.backup }} failed for {{ $labels.volume }}
     - name: vms
       rules:
         - alert: VMDown