fix(data): for KubernetesPodNotHealthy, set an explicit subquery step (1m) and shorten the window from 1h to 15m

This commit is contained in:
Samuel Berthe 2021-05-01 20:30:23 +02:00
parent 54b1e674b2
commit 135d4b7c1a
No known key found for this signature in database
GPG key ID: 64863511FFBD0E3C

View file

@@ -1551,8 +1551,8 @@ groups:
severity: info
for: 2m
- name: Kubernetes Pod not healthy
- description: Pod has been in a non-ready state for longer than an hour.
- query: 'min_over_time(sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[1h:]) > 0'
+ description: Pod has been in a non-ready state for longer than 15 minutes.
+ query: 'min_over_time(sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[15m:1m]) > 0'
severity: critical
- name: Kubernetes pod crash looping
description: Pod {{ $labels.pod }} is crash looping