-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathRHACSFleetshardOperatorContainerFrequentlyRestarting.yaml
39 lines (37 loc) · 2.12 KB
/
RHACSFleetshardOperatorContainerFrequentlyRestarting.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
# promtool unit test for the
# RHACSFleetshardOperatorContainerFrequentlyRestarting alert.
#
# The rule under test is loaded from the path in `rule_files`; it is not
# defined in this file.
rule_files:
  - /tmp/prometheus-rules-test.yaml

evaluation_interval: 1m

tests:
  - interval: 1m
    # Both operator containers get the same restart-counter samples, one
    # sample per `interval` (1m). Expanding notation `a+bxn` yields
    # a, a+b, ..., a+n*b, so:
    #   0+0x30 -> 31 samples of 0        (0m..30m, no restarts)
    #   1+1x10 -> 1, 2, ..., 11          (31m..41m)
    #   4+1x20 -> 4, 5, ..., 24          (42m..62m)
    # NOTE(review): the drop from 11 to 4 at 42m looks like a counter
    # reset; confirm it is intentional for the rule expression.
    input_series:
      - series: kube_pod_container_status_restarts_total{namespace="rhacs", pod="rhacs-operator-1234", container="manager"}
        values: "0+0x30 1+1x10 4+1x20"
      - series: kube_pod_container_status_restarts_total{namespace="rhacs", pod="rhacs-operator-1234", container="kube-rbac-proxy"}
        values: "0+0x30 1+1x10 4+1x20"

    alert_rule_test:
      # Every sample up to 30m is 0, so nothing is expected to fire.
      - eval_time: 30m
        alertname: RHACSFleetshardOperatorContainerFrequentlyRestarting
        exp_alerts: []

      # By 60m both counters have been rising since 31m; one alert per
      # container is expected.
      - eval_time: 60m
        alertname: RHACSFleetshardOperatorContainerFrequentlyRestarting
        exp_alerts:
          - exp_labels:
              alertname: RHACSFleetshardOperatorContainerFrequentlyRestarting
              container: manager
              namespace: rhacs
              pod: rhacs-operator-1234
              severity: critical
            exp_annotations:
              summary: "Fleetshard operator container `rhacs-operator-1234/manager` in namespace `rhacs` restarted more than 3 times."
              description: "Fleetshard operator container `rhacs-operator-1234/manager` in namespace `rhacs` has restarted more than 3 times during the last 30 minutes."
              sop_url: "https://gitlab.cee.redhat.com/stackrox/acs-managed-service-runbooks/blob/master/sops/dp-011-rhacs-operator-unavailable.md"
          - exp_labels:
              alertname: RHACSFleetshardOperatorContainerFrequentlyRestarting
              container: kube-rbac-proxy
              namespace: rhacs
              pod: rhacs-operator-1234
              severity: critical
            exp_annotations:
              summary: "Fleetshard operator container `rhacs-operator-1234/kube-rbac-proxy` in namespace `rhacs` restarted more than 3 times."
              description: "Fleetshard operator container `rhacs-operator-1234/kube-rbac-proxy` in namespace `rhacs` has restarted more than 3 times during the last 30 minutes."
              sop_url: "https://gitlab.cee.redhat.com/stackrox/acs-managed-service-runbooks/blob/master/sops/dp-011-rhacs-operator-unavailable.md"