mirror of
https://github.com/samber/awesome-prometheus-alerts.git
synced 2026-06-22 01:17:19 +08:00
36 lines
1.8 KiB
YAML
36 lines
1.8 KiB
YAML
# Prometheus alerting rules for GitLab Workhorse.
# One rule group named "Workhorse"; its alert definitions follow under `rules`.
groups:
- name: Workhorse
  rules:
|
|
|
|
# Workhorse sits in front of Puma and handles Git HTTP, file uploads, and proxying.
# Threshold from GitLab Omnibus default rules: 10% for high-traffic instances.
#
# Fires when more than 10% of requests handled over the last 5 minutes ended in
# an HTTP 5xx status, sustained for 5 minutes.
#
# Every aggregation is grouped `by (instance)`: a bare sum() discards all labels,
# which would leave {{ $labels.instance }} empty in the annotations below. As a
# consequence the ratio is evaluated per Workhorse instance, not fleet-wide.
#
# The trailing `and ... > 0` clause only lets the alert fire for instances that
# are actually receiving traffic.
- alert: GitlabWorkhorseHighErrorRate
  expr: 'sum by (instance) (rate(gitlab_workhorse_http_request_duration_seconds_count{code=~"5.."}[5m])) / sum by (instance) (rate(gitlab_workhorse_http_request_duration_seconds_count[5m])) * 100 > 10 and sum by (instance) (rate(gitlab_workhorse_http_request_duration_seconds_count[5m])) > 0'
  for: 5m
  labels:
    severity: critical
  annotations:
    summary: GitLab Workhorse high error rate (instance {{ $labels.instance }})
    description: "GitLab Workhorse on {{ $labels.instance }} is returning more than 10% HTTP 5xx errors.\n  VALUE = {{ $value }}\n  LABELS = {{ $labels }}"
|
|
|
|
# Fires when the 95th-percentile request duration, computed from the request
# duration histogram over a 5-minute rate window, stays above 10 seconds for
# 5 minutes.
#
# Buckets are summed `by (le, instance)`: `le` is required by
# histogram_quantile(), and `instance` must be preserved so that
# {{ $labels.instance }} in the annotations is populated. Aggregating by `le`
# alone would yield a single fleet-wide series with no instance label.
- alert: GitlabWorkhorseHighLatency
  expr: 'histogram_quantile(0.95, sum by (le, instance) (rate(gitlab_workhorse_http_request_duration_seconds_bucket[5m]))) > 10'
  for: 5m
  labels:
    severity: warning
  annotations:
    summary: GitLab Workhorse high latency (instance {{ $labels.instance }})
    description: "GitLab Workhorse on {{ $labels.instance }} p95 request latency is above 10 seconds.\n  VALUE = {{ $value }}\n  LABELS = {{ $labels }}"
|
|
|
|
# Warns when the in-flight request gauge stays above 100 for 5 minutes.
# The threshold of 100 may need adjustment based on instance size.
# NOTE(review): the alert name contains a hyphen, unlike the sibling alerts'
# CamelCase names; it is kept unchanged because the name may be matched
# elsewhere (e.g. in routing or silences).
- alert: GitlabWorkhorseHighIn-flightRequests
  expr: gitlab_workhorse_http_in_flight_requests > 100
  for: 5m
  labels:
    severity: warning
  annotations:
    summary: "GitLab Workhorse high in-flight requests (instance {{ $labels.instance }})"
    description: "GitLab Workhorse on {{ $labels.instance }} has {{ $value }} in-flight requests.\n  VALUE = {{ $value }}\n  LABELS = {{ $labels }}"
|