feat(observability): Introduced alert for failed s3 backup jobs
This commit is contained in:
parent
e0f6cc77dd
commit
975bb6b982
1 changed files with 11 additions and 0 deletions
|
|
@@ -16,3 +16,14 @@ spec:
|
||||||
annotations:
|
annotations:
|
||||||
value: "{{ $value }}"
|
value: "{{ $value }}"
|
||||||
description: 'forgejo is down in cluster environment {{ $labels.cluster_environment }}'
|
description: 'forgejo is down in cluster environment {{ $labels.cluster_environment }}'
|
||||||
|
# Rule group: alerting on failed forgejo S3 backup Jobs.
- name: forgejo-backup
  rules:
    # Fires once kube_job_status_failed has been non-zero for 30s for any Job
    # whose name matches forgejo-s3-backup-.*.
    # NOTE(review): presumably the metric stays non-zero for as long as the
    # failed Job object is retained — confirm the Job history limits so the
    # alert can resolve after a later successful backup.
    - alert: forgejo s3 backup job failed
      # `job` is listed in by(...) because the aggregation discards every
      # label that is not named there; without it the {{ $labels.job }}
      # template below renders empty and the label is dropped from the alert.
      expr: max by(cluster_environment, job) (kube_job_status_failed{job_name=~"forgejo-s3-backup-.*"}) != 0
      for: 30s
      labels:
        severity: major
        job: "{{ $labels.job }}"
      annotations:
        value: "{{ $value }}"
        description: 'forgejo s3 backup job failed in cluster environment {{ $labels.cluster_environment }}'
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue