-
Notifications
You must be signed in to change notification settings - Fork 0
/
prometheus-alerts.yaml
86 lines (78 loc) · 2.78 KB
/
prometheus-alerts.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
- name: Backups
rules:
- alert: KumonoboruFailure
expr: |
up{job="systemd", unit="Kumonoboru", state="failed"} == 1
for: 5m
labels:
severity: warning
annotations:
summary: "Service failure detected in {{ $labels.instance }}"
description: "The service '{{ $labels.instance }}' has a failed status"
source: 'https://monitor.your-domain.com'
- alert: KumonoboruTimerFailure
expr: |
up{job="systemd", unit="Kumonoboru", state="failed"} == 1
for: 5m
labels:
severity: warning
annotations:
summary: "Timer failure detected in {{ $labels.instance }}"
description: "The timer '{{ $labels.instance }}' has a failed status"
source: 'https://monitor.your-domain.com'
- alert: SystemBackupFailed
expr: |
system_backup == 1
labels:
severity: critical
annotations:
summary: "System Backup has failed"
description: "The repository {{ $labels.instance }} has failed the backup process"
- alert: SystemBackupUnlockFailed
expr: |
system_backup == -1
labels:
severity: critical
annotations:
summary: "System Backup cannot proceed"
description: "The repository {{ $labels.instance }} has failed to unlock. Backup cannot be performed"
- alert: SystemBackupIntegrityFailed
expr: |
system_backup == -2
labels:
severity: critical
annotations:
summary: "System Backup containes error"
description: "The repository {{ $labels.instance }} has failed an integrity check. Backup data may be corrupted"
- alert: SystemBackupCleaningFailed
expr: |
system_backup == -3
labels:
severity: critical
annotations:
summary: "System Backup cannot be cleaned"
description: "The repository {{ $labels.instance }} has failed the cleanup process. Backup may contain excess data"
- alert: SystemBackupSucceeded
expr: |
system_backup == 0
labels:
severity: info
annotations:
summary: "System Backup has succeeded"
description: "The repository {{ $labels.instance }} has succesfully completed the backup process"
- alert: SystemBackupIntegritySucceeded
expr: |
system_backup == 2
labels:
severity: info
annotations:
summary: "System Backup has no errors"
description: "The repository {{ $labels.instance }} passed the integrity check"
- alert: SystemBackupCleaningSucceeded
expr: |
system_backup == 3
labels:
severity: info
annotations:
summary: "System Backup has been cleaned"
description: "The repository {{ $labels.instance }} has completed the cleanup process"