mirror of
https://github.com/samber/awesome-prometheus-alerts.git
synced 2026-06-24 18:36:59 +08:00
Update rules.yml
This commit is contained in:
parent
e98e4d0516
commit
5e84329360
1 changed file with 1 addition and 2 deletions
|
|
@@ -1709,10 +1709,9 @@ groups:
|
||||||
severity: info
|
severity: info
|
||||||
for: 2m
|
for: 2m
|
||||||
- name: Kubernetes HPA underutilized
|
- name: Kubernetes HPA underutilized
|
||||||
description: HPA is constantly at minimum replicas for 50% of the time
|
description: HPA is constantly at minimum replicas for 50% of the time. Potential cost saving here.
|
||||||
query: 'max(quantile_over_time(0.5, kube_horizontalpodautoscaler_status_desired_replicas[1d]) == kube_horizontalpodautoscaler_spec_min_replicas) by (horizontalpodautoscaler) > 3' # allow minimum 3 replicas running
|
query: 'max(quantile_over_time(0.5, kube_horizontalpodautoscaler_status_desired_replicas[1d]) == kube_horizontalpodautoscaler_spec_min_replicas) by (horizontalpodautoscaler) > 3' # allow minimum 3 replicas running
|
||||||
severity: info
|
severity: info
|
||||||
for: 5m
|
|
||||||
- name: Kubernetes Pod not healthy
|
- name: Kubernetes Pod not healthy
|
||||||
description: Pod has been in a non-ready state for longer than 15 minutes.
|
description: Pod has been in a non-ready state for longer than 15 minutes.
|
||||||
query: 'sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"}) > 0'
|
query: 'sum by (namespace, pod) (kube_pod_status_phase{phase=~"Pending|Unknown|Failed"}) > 0'
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue