mirror of
https://github.com/samber/awesome-prometheus-alerts.git
synced 2026-06-22 09:27:26 +08:00
25 lines
1.1 KiB
YAML
25 lines
1.1 KiB
YAML
groups:
|
|
|
|
- name: ThanosSidecar
|
|
|
|
|
|
rules:
|
|
|
|
# Threshold of 0.05/s avoids firing on transient single-event spikes.
|
|
- alert: ThanosSidecarBucketOperationsFailed
|
|
expr: 'sum by (job, instance) (rate(thanos_objstore_bucket_operation_failures_total{job=~".*thanos-sidecar.*"}[5m])) > 0.05'
|
|
for: 5m
|
|
labels:
|
|
severity: critical
|
|
annotations:
|
|
summary: Thanos Sidecar Bucket Operations Failed (instance {{ $labels.instance }})
|
|
description: "Thanos Sidecar {{$labels.instance}} bucket operations are failing ({{ $value | humanize }}/s).\n VALUE = {{ $value }}\n LABELS = {{ $labels }}"
|
|
|
|
- alert: ThanosSidecarNoConnectionToStartedPrometheus
|
|
expr: 'thanos_sidecar_prometheus_up == 0 and on (namespace, pod) prometheus_tsdb_data_replay_duration_seconds != 0'
|
|
for: 5m
|
|
labels:
|
|
severity: critical
|
|
annotations:
|
|
summary: Thanos Sidecar No Connection To Started Prometheus (instance {{ $labels.instance }})
|
|
description: "Thanos Sidecar {{$labels.instance}} is unhealthy.\n VALUE = {{ $value }}\n LABELS = {{ $labels }}"
|