mirror of
https://github.com/samber/awesome-prometheus-alerts.git
synced 2026-06-25 02:46:59 +08:00
fix(data): for KubernetesPodNotHealthy, insert a step of subquery execution time
This commit is contained in:
parent
54b1e674b2
commit
135d4b7c1a
1 changed file with 2 additions and 2 deletions
|
|
@@ -1551,8 +1551,8 @@ groups:
|
||||||
severity: info
|
severity: info
|
||||||
for: 2m
|
for: 2m
|
||||||
- name: Kubernetes Pod not healthy
|
- name: Kubernetes Pod not healthy
|
||||||
description: Pod has been in a non-ready state for longer than an hour.
|
description: Pod has been in a non-ready state for longer than 15 minutes.
|
||||||
query: 'min_over_time(sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[1h:]) > 0'
|
query: 'min_over_time(sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"})[15m:1m]) > 0'
|
||||||
severity: critical
|
severity: critical
|
||||||
- name: Kubernetes pod crash looping
|
- name: Kubernetes pod crash looping
|
||||||
description: Pod {{ $labels.pod }} is crash looping
|
description: Pod {{ $labels.pod }} is crash looping
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue