From e6113ff2dbbc481d5772cec3057ee29b7914cdc7 Mon Sep 17 00:00:00 2001
From: Liudmyla Derkach
Date: Fri, 30 Oct 2020 19:07:48 +0200
Subject: [PATCH] feat: adding few useful rabbitmq alerts

Add three alert rules next to the existing RabbitMQ rules in
_data/rules.yml:

- "Rabbitmq node not distributed" (critical): fires when
  erlang_vm_dist_node_state is below 3, i.e. the distribution link
  state is not 'up'.
- "Rabbitmq file descriptors usage" (warning): fires when
  rabbitmq_process_open_fds exceeds 90% of rabbitmq_process_max_fds.
- "Rabbitmq unroutable messages" (warning): fires when either the
  unroutable-returned or the unroutable-dropped channel counter
  increased during the last 5 minutes.
---
Review note: this patch was re-wrapped from a whitespace-collapsed copy.
The YAML indentation inside the hunks is reconstructed (2-space nesting)
and must be checked against _data/rules.yml before applying. Two added
description strings were reworded, so the post-image blob id on the
"index" line no longer matches the resulting file.

 _data/rules.yml | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/_data/rules.yml b/_data/rules.yml
index 0b1f20f..bae003b 100644
--- a/_data/rules.yml
+++ b/_data/rules.yml
@@ -622,6 +622,10 @@ groups:
                 description: Less than 3 nodes running in RabbitMQ cluster
                 query: "sum(rabbitmq_build_info) < 3"
                 severity: critical
+              - name: Rabbitmq node not distributed
+                description: Distribution link state is not 'up'
+                query: "erlang_vm_dist_node_state < 3"
+                severity: critical
               - name: Rabbitmq instances different versions
                 description: Running different version of Rabbitmq in the same cluster, can lead to failure.
                 query: "count(count(rabbitmq_build_info) by (rabbitmq_version)) > 1"
@@ -630,6 +634,10 @@ groups:
                 description: A node use more than 90% of allocated RAM
                 query: "rabbitmq_process_resident_memory_bytes / rabbitmq_resident_memory_limit_bytes * 100 > 90"
                 severity: warning
+              - name: Rabbitmq file descriptors usage
+                description: A node uses more than 90% of file descriptors
+                query: "rabbitmq_process_open_fds / rabbitmq_process_max_fds * 100 > 90"
+                severity: warning
               - name: Rabbitmq too much unack
                 description: Too much unacknowledged messages
                 query: "sum(rabbitmq_queue_messages_unacked) BY (queue) > 1000"
@@ -642,6 +650,10 @@ groups:
                 description: A queue has less than 1 consumer
                 query: "rabbitmq_queue_consumers < 1"
                 severity: warning
+              - name: Rabbitmq unroutable messages
+                description: Messages were published that could not be routed to any queue
+                query: "increase(rabbitmq_channel_messages_unroutable_returned_total[5m]) > 0 or increase(rabbitmq_channel_messages_unroutable_dropped_total[5m]) > 0"
+                severity: warning
           - name: kbudde/rabbitmq-exporter
             doc_url: https://github.com/kbudde/rabbitmq_exporter
             rules: