Skip to content
Snippets Groups Projects
Verified commit 6f128f7a authored by David Hoese
Browse files

Remove KubernetesPodNotHealthy alert because it has false positives

parent 5eba678f
No related branches found
No related tags found
No related merge requests found
@@ -434,15 +434,15 @@ spec:
 summary: "Kubernetes StatefulSet down (instance {{ $labels.instance }})"
 description: "A StatefulSet went down\n VALUE = {{ $value }}\n LABELS: {{ $labels }}"
-- alert: KubernetesPodNotHealthy
-expr: min_over_time(sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[1h:5m]) > 0
-for: 5m
-labels:
-severity: critical
-ruleGroup: geosphere-kubernetes
-annotations:
-summary: "Kubernetes Pod not healthy (instance {{ $labels.instance }})"
-description: "Pod has been in a non-ready state for longer than an hour.\n VALUE = {{ $value }}\n LABELS: {{ $labels }}"
+# - alert: KubernetesPodNotHealthy
+# expr: min_over_time(sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[1h:5m]) > 0
+# for: 5m
+# labels:
+# severity: critical
+# ruleGroup: geosphere-kubernetes
+# annotations:
+# summary: "Kubernetes Pod not healthy (instance {{ $labels.instance }})"
+# description: "Pod has been in a non-ready state for longer than an hour.\n VALUE = {{ $value }}\n LABELS: {{ $labels }}"
 - alert: KubernetesPodCrashLooping
 expr: rate(kube_pod_container_status_restarts_total[15m]) * 60 * 5 > 5
 for: 5m
...
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment