diff --git a/_data/rules.yml b/_data/rules.yml
index 209ac3b..dd82f1f 100644
--- a/_data/rules.yml
+++ b/_data/rules.yml
@@ -202,6 +202,10 @@ groups:
                 description: CPU steal is > 10%. A noisy neighbor is killing VM performances or a spot instance may be out of credit.
                 query: 'avg by(instance) (rate(node_cpu_seconds_total{mode="steal"}[5m])) * 100 > 10'
                 severity: warning
+              - name: Host CPU high iowait
+                description: CPU iowait > 5%. A high iowait means that you are disk or network bound.
+                query: 'avg by (instance) (rate(node_cpu_seconds_total{mode="iowait"}[5m])) * 100 > 5'
+                severity: warning
               - name: Host context switching
                 description: Context switching is growing on node (> 1000 / s)
                 query: '(rate(node_context_switches_total[5m])) / (count without(cpu, mode) (node_cpu_seconds_total{mode="idle"})) > 1000'