Merge pull request #97 from samber/fix-kubernetes-pod-not-health

Fix Kubernetes pod not healthy alert
This commit is contained in:
Samuel Berthe 2020-03-26 16:22:56 +01:00 committed by GitHub
commit cf9df92d61
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@@ -961,7 +961,7 @@ groups:
severity: warning
- name: Kubernetes Pod not healthy
description: Pod has been in a non-ready state for longer than an hour.
-query: 'min_over_time(sum by (namespace, pod, env, stage) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[1h]) > 0'
+query: 'min_over_time(sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[1h:])'
severity: error
- name: Kubernetes pod crash looping
description: Pod {{ $labels.pod }} is crash looping