diff --git a/_data/rules.yml b/_data/rules.yml
index a6f46d4..b603b1d 100644
--- a/_data/rules.yml
+++ b/_data/rules.yml
@@ -373,6 +373,15 @@ groups:
                 query: 'rate(container_cpu_cfs_throttled_seconds_total[3m]) > 1'
                 severity: warning
                 for: 2m
+              - name: Container high low change CPU usage
+                description: This alert rule monitors the absolute change in CPU usage within a time window and triggers an alert when the change exceeds 25%.
+                # Compares the current 1m CPU usage rate (x100, summed by
+                # instance and name) with the 1m rate and the 5m rate as of one
+                # minute ago. Each comparison carries its own `> 25` because
+                # PromQL `or` keeps the left-hand series whenever label sets
+                # match, so `(A or B) > 25` would skip the 5m comparison.
+                query: '(abs((sum by (instance, name) (rate(container_cpu_usage_seconds_total{name!=""}[1m])) * 100) - (sum by (instance, name) (rate(container_cpu_usage_seconds_total{name!=""}[1m] offset 1m)) * 100)) > 25) or (abs((sum by (instance, name) (rate(container_cpu_usage_seconds_total{name!=""}[1m])) * 100) - (sum by (instance, name) (rate(container_cpu_usage_seconds_total{name!=""}[5m] offset 1m)) * 100)) > 25)'
+                severity: warning
               - name: Container Low CPU utilization
                 description: Container CPU utilization is under 20% for 1 week. Consider reducing the allocated CPU.
                 query: '(sum(rate(container_cpu_usage_seconds_total{name!=""}[3m])) BY (instance, name) * 100) < 20'