mirror of
https://github.com/samber/awesome-prometheus-alerts.git
synced 2026-06-23 09:58:16 +08:00
some random changes on rules
This commit is contained in:
parent
8f515ceae2
commit
77eccab0e9
1 changed files with 10 additions and 6 deletions
|
|
@ -6,7 +6,7 @@ services:
|
||||||
description: Prometheus configuration reload error
|
description: Prometheus configuration reload error
|
||||||
query: "prometheus_config_last_reload_successful != 1"
|
query: "prometheus_config_last_reload_successful != 1"
|
||||||
severity: warning
|
severity: warning
|
||||||
- name: AlertManager configuration reload failure
|
- name: Prometheus AlertManager configuration reload failure
|
||||||
description: AlertManager configuration reload error
|
description: AlertManager configuration reload error
|
||||||
query: "alertmanager_config_last_reload_successful != 1"
|
query: "alertmanager_config_last_reload_successful != 1"
|
||||||
severity: warning
|
severity: warning
|
||||||
|
|
@ -14,7 +14,7 @@ services:
|
||||||
description: Prometheus cannot connect the alertmanager
|
description: Prometheus cannot connect the alertmanager
|
||||||
query: "prometheus_notifications_alertmanagers_discovered < 1"
|
query: "prometheus_notifications_alertmanagers_discovered < 1"
|
||||||
severity: error
|
severity: error
|
||||||
- name: Exporter down
|
- name: Prometheus Exporter down
|
||||||
description: Prometheus exporter down
|
description: Prometheus exporter down
|
||||||
query: "up == 0"
|
query: "up == 0"
|
||||||
severity: error
|
severity: error
|
||||||
|
|
@ -228,7 +228,7 @@ services:
|
||||||
- name: wrouesnel/postgres_exporter
|
- name: wrouesnel/postgres_exporter
|
||||||
doc_url: https://github.com/wrouesnel/postgres_exporter/
|
doc_url: https://github.com/wrouesnel/postgres_exporter/
|
||||||
rules:
|
rules:
|
||||||
- name: PostgreSQL down
|
- name: Postgresql down
|
||||||
description: PostgreSQL instance is down
|
description: PostgreSQL instance is down
|
||||||
query: "pg_up == 0"
|
query: "pg_up == 0"
|
||||||
severity: error
|
severity: error
|
||||||
|
|
@ -653,8 +653,12 @@ services:
|
||||||
query: "consul_catalog_service_node_healthy == 0"
|
query: "consul_catalog_service_node_healthy == 0"
|
||||||
severity: error
|
severity: error
|
||||||
- name: Consul missing master node
|
- name: Consul missing master node
|
||||||
description: Numbers of consul raft peers less then expected <https://example.ru/ui/{{ $labels.dc }}/services/consul|Consul masters>
|
description: Numbers of consul raft peers should be 3, in order to preserve quorum.
|
||||||
query: "consul_raft_peers < number_of_consul_master"
|
query: "consul_raft_peers < 3"
|
||||||
|
severity: error
|
||||||
|
- name: Consul agent unhealthy
|
||||||
|
description: A Consul agent is down
|
||||||
|
query: 'consul_health_node_status{status="critical"} == 1'
|
||||||
severity: error
|
severity: error
|
||||||
|
|
||||||
- name: Etcd
|
- name: Etcd
|
||||||
|
|
@ -724,7 +728,7 @@ services:
|
||||||
- name: danielqsj/kafka_exporter
|
- name: danielqsj/kafka_exporter
|
||||||
doc_url: https://github.com/danielqsj/kafka_exporter
|
doc_url: https://github.com/danielqsj/kafka_exporter
|
||||||
rules:
|
rules:
|
||||||
- name: Kafka Topics
|
- name: Kafka topics replicas
|
||||||
description: Kafka topic in-sync partition
|
description: Kafka topic in-sync partition
|
||||||
query: "sum(kafka_topic_partition_in_sync_replica) by (topic) < 3"
|
query: "sum(kafka_topic_partition_in_sync_replica) by (topic) < 3"
|
||||||
severity: error
|
severity: error
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue