feat(observability): Introduced alert for failed S3 backup jobs

This commit is contained in:
Patrick Sy 2025-08-12 14:07:38 +02:00
parent e0f6cc77dd
commit 975bb6b982
Signed by untrusted user: Patrick.Sy
GPG key ID: DDDC8EC51823195E

View file

@ -16,3 +16,14 @@ spec:
annotations:
value: "{{ $value }}"
description: 'forgejo is down in cluster environment {{ $labels.cluster_environment }}'
# Rule group holding the alerts for the forgejo S3 backup jobs.
- name: forgejo-backup
  rules:
    # Fires once any Job whose name matches forgejo-s3-backup-.* has reported
    # a non-zero kube_job_status_failed value for at least 30s.
    - alert: forgejo s3 backup job failed
      # `job` is grouped alongside cluster_environment: `max by(...)` discards
      # every label that is not listed, and the `job` label below is rendered
      # from {{ $labels.job }}, which would otherwise always be empty.
      expr: max by(cluster_environment, job) (kube_job_status_failed{job_name=~"forgejo-s3-backup-.*"}) != 0
      for: 30s
      labels:
        severity: major
        job: "{{ $labels.job }}"
      annotations:
        # Raw result of the expression at evaluation time.
        value: "{{ $value }}"
        description: 'forgejo s3 backup job failed in cluster environment {{ $labels.cluster_environment }}'