add etcdbackup alerts
This commit is contained in:
parent
d75cb6b7b6
commit
fd6cc7ef3d
1 changed file with 16 additions and 0 deletions
|
@@ -89,6 +89,22 @@ spec:
|
|||
annotations:
|
||||
summary: "SMARTcheck not running"
|
||||
description: 'The last SMARTcheck on server {{ $labels.node }} was more than 3h ago. Plox fix.'
|
||||
# Rule group for the etcd backup job. It holds two warning-level alerts:
# one for stale backups and one for a failing backup script.
- name: etcdbackup
  rules:
    # Staleness check: true once the current time is more than 10800 s (3 h)
    # past the value of `etcdbackup_time`.
    # NOTE(review): presumably `etcdbackup_time` is the Unix timestamp of the
    # last backup run — confirm against the exporter that publishes it.
    # No `for:` is set, so the alert is raised without a pending period.
    - alert: 'etcdbackup too old'
      expr: '(time() - etcdbackup_time) > 10800'
      labels:
        severity: warning
      annotations:
        summary: 'etcd backup not running'
        description: 'The last etcd backup on node {{ $labels.node }} was more than 3h ago. Plox fix.'

    # Failure check: true for any series where `etcdbackup_result` is above 0.
    # NOTE(review): presumably the metric carries the backup script's exit
    # status (0 = success) — verify against the script.
    - alert: 'etcdbackup failed'
      expr: 'etcdbackup_result > 0'
      labels:
        severity: warning
      annotations:
        summary: 'etcdbackup failed'
        description: 'The backup script for etcd failed on node {{ $labels.node }}. Plox fix.'
|
||||
- name: kubernetes
|
||||
rules:
|
||||
- alert: KubernetesUnhealthyPod
|
||||
|
|
Loading…
Reference in a new issue