From 447bb94c4d49d573596033c9018fc78478eebe0a Mon Sep 17 00:00:00 2001 From: michaelact <86778470+michaelact@users.noreply.github.com> Date: Tue, 6 Dec 2022 16:26:50 +0700 Subject: [PATCH] Add under-utilized host and hardware alerts (#320) * chore: add under-utilized alerts * docs: add under-utilized alerts * chore: add alert consideration times * chore: delete generated alert rules file * chore: not using for, instead in rule --- _data/rules.yml | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/_data/rules.yml b/_data/rules.yml index 89efb9e..82cd938 100644 --- a/_data/rules.yml +++ b/_data/rules.yml @@ -309,6 +309,19 @@ groups: severity: info for: 4h + # These rules evaluate a 1-week window, so their state changes slowly. You may want to increase the Alertmanager 'repeat_interval' for this type of alert to daily or weekly + - name: node-exporter + slug: node-exporter-under-utilized + doc_url: https://github.com/prometheus/node_exporter + rules: + - name: Host Memory is under utilized + description: 'Node memory is not fully used (> 80% free) for 1 week. Consider reducing memory space.' + query: 'min_over_time(node_memory_MemAvailable_bytes[1w]) / node_memory_MemTotal_bytes * 100 > 80' + severity: info + - name: Host Cpu is under utilized + description: 'CPU load is < 20% for 1 week. Consider reducing the number of CPUs.' + query: '100 - (avg by(instance) (rate(node_cpu_seconds_total{mode="idle"}[1w])) * 100) < 20' + severity: info - name: Docker containers exporters: