mirror of
https://github.com/samber/awesome-prometheus-alerts.git
synced 2026-06-23 09:58:16 +08:00
fix: some kube api alert lint (#416)
* fix: apiserver regexp matchers are automatically fully anchored
  Signed-off-by: R.Sicart <roger.sicart@gmail.com>
* fix: apiserver errors alert is using label but the query removes it
  Signed-off-by: R.Sicart <roger.sicart@gmail.com>
* fix: apiserver latency alert is using label but the query removes it
  Signed-off-by: R.Sicart <roger.sicart@gmail.com>
---------
Signed-off-by: R.Sicart <roger.sicart@gmail.com>
This commit is contained in:
parent
4963331101
commit
8460f9008e
1 changed file with 2 additions and 2 deletions
|
|
@@ -2071,7 +2071,7 @@ groups:
|
||||||
for: 12h
|
for: 12h
|
||||||
- name: Kubernetes API server errors
|
- name: Kubernetes API server errors
|
||||||
description: Kubernetes API server is experiencing high error rate
|
description: Kubernetes API server is experiencing high error rate
|
||||||
query: 'sum(rate(apiserver_request_total{job="apiserver",code=~"^(?:5..)$"}[1m])) / sum(rate(apiserver_request_total{job="apiserver"}[1m])) * 100 > 3'
|
query: 'sum(rate(apiserver_request_total{job="apiserver",code=~"(?:5..)"}[1m])) by (instance, job) / sum(rate(apiserver_request_total{job="apiserver"}[1m])) by (instance, job) * 100 > 3'
|
||||||
severity: critical
|
severity: critical
|
||||||
for: 2m
|
for: 2m
|
||||||
- name: Kubernetes API client errors
|
- name: Kubernetes API client errors
|
||||||
|
|
@@ -2089,7 +2089,7 @@ groups:
|
||||||
severity: critical
|
severity: critical
|
||||||
- name: Kubernetes API server latency
|
- name: Kubernetes API server latency
|
||||||
description: "Kubernetes API server has a 99th percentile latency of {{ $value }} seconds for {{ $labels.verb }} {{ $labels.resource }}."
|
description: "Kubernetes API server has a 99th percentile latency of {{ $value }} seconds for {{ $labels.verb }} {{ $labels.resource }}."
|
||||||
query: 'histogram_quantile(0.99, sum(rate(apiserver_request_duration_seconds_bucket{subresource!="log",verb!~"^(?:CONNECT|WATCHLIST|WATCH|PROXY)$"} [10m])) WITHOUT (instance, resource)) > 1'
|
query: 'histogram_quantile(0.99, sum(rate(apiserver_request_duration_seconds_bucket{verb!~"(?:CONNECT|WATCHLIST|WATCH|PROXY)"} [10m])) WITHOUT (subresource)) > 1'
|
||||||
severity: warning
|
severity: warning
|
||||||
for: 2m
|
for: 2m
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue