Add _bytes and _total suffixes to metric names

This commit is contained in:
Sofrony Pavel 2019-02-14 22:52:41 +03:00
parent ff7ef5f6bd
commit 8136b239be
No known key found for this signature in database
GPG key ID: 680D71F08DDA644F

View file

@ -18,23 +18,23 @@ services:
severity: warning
# Alert rule: warns when the per-instance sum of the network receive rate exceeds 100.
- name: Unusual network throughput in
description: Host network interfaces are probably receiving too much data (> 100 MB/s)
# Two variants of the query are listed; they differ only in the metric name
# (node_network_receive_bytes vs. node_network_receive_bytes_total).
# The two "/ 1024" divisions scale the irate() result before the "> 100" check
# (presumably bytes/s to MiB/s, matching the description -- confirm units).
query: 'sum by (instance) (irate(node_network_receive_bytes[2m])) / 1024 / 1024 > 100'
query: 'sum by (instance) (irate(node_network_receive_bytes_total[2m])) / 1024 / 1024 > 100'
severity: warning
# Alert rule: warns when the per-instance sum of the network transmit rate exceeds 100.
- name: Unusual network throughput out
description: Host network interfaces are probably sending too much data (> 100 MB/s)
# Two variants of the query are listed; they differ only in the metric name
# (node_network_transmit_bytes vs. node_network_transmit_bytes_total).
# The two "/ 1024" divisions scale the irate() result before the "> 100" check
# (presumably bytes/s to MiB/s, matching the description -- confirm units).
query: 'sum by (instance) (irate(node_network_transmit_bytes[2m])) / 1024 / 1024 > 100'
query: 'sum by (instance) (irate(node_network_transmit_bytes_total[2m])) / 1024 / 1024 > 100'
severity: warning
# Alert rule: warns when the per-instance sum of the disk read rate exceeds 50.
- name: Unusual disk read rate
description: Disk is probably reading too much data (> 50 MB/s)
# Two variants of the query are listed; they differ only in the metric name.
# Note the word order changes as well as the suffix:
# node_disk_bytes_read vs. node_disk_read_bytes_total.
# The two "/ 1024" divisions scale the irate() result before the "> 50" check
# (presumably bytes/s to MiB/s, matching the description -- confirm units).
query: 'sum by (instance) (irate(node_disk_bytes_read[2m])) / 1024 / 1024 > 50'
query: 'sum by (instance) (irate(node_disk_read_bytes_total[2m])) / 1024 / 1024 > 50'
severity: warning
# Alert rule: warns when the per-instance sum of the disk write rate exceeds 50.
- name: Unusual disk write rate
description: Disk is probably writing too much data (> 50 MB/s)
# Two variants of the query are listed; they differ only in the metric name.
# Note the word order changes as well as the suffix:
# node_disk_bytes_written vs. node_disk_written_bytes_total.
# The two "/ 1024" divisions scale the irate() result before the "> 50" check
# (presumably bytes/s to MiB/s, matching the description -- confirm units).
query: 'sum by (instance) (irate(node_disk_bytes_written[2m])) / 1024 / 1024 > 50'
query: 'sum by (instance) (irate(node_disk_written_bytes_total[2m])) / 1024 / 1024 > 50'
severity: warning
# Alert rule: warns when free space divided by total size, times 100, drops below 10.
- name: Out of disk space
description: Disk is almost full (< 10% left)
# Two variants of the query are listed; they differ only in the metric names
# (node_filesystem_free / node_filesystem_size vs. the same names with a _bytes suffix).
# Both sides of the division are restricted to series labelled mountpoint="/rootfs",
# so other mountpoints are not covered by this rule.
query: 'node_filesystem_free{mountpoint ="/rootfs"} / node_filesystem_size{mountpoint ="/rootfs"} * 100 < 10'
query: 'node_filesystem_free_bytes{mountpoint ="/rootfs"} / node_filesystem_size_bytes{mountpoint ="/rootfs"} * 100 < 10'
severity: warning
- name: Out of inodes
description: Disk is almost running out of available inodes (< 10% left)
@ -42,11 +42,11 @@ services:
severity: warning
# Alert rule: warns when the average time per completed read exceeds 100ms.
- name: Unusual disk read latency
description: Disk latency is growing (read operations > 100ms)
# Two variants of the query are listed. The first divides a millisecond
# counter (node_disk_read_time_ms) by the completed-reads counter, so its
# threshold of 100 means 100ms per read.
query: 'rate(node_disk_read_time_ms[1m]) / rate(node_disk_reads_completed[1m]) > 100'
# The second uses node_disk_read_time_seconds_total, so the ratio is in
# seconds per read: 100ms must be written as 0.1, not 100.
query: 'rate(node_disk_read_time_seconds_total[1m]) / rate(node_disk_reads_completed_total[1m]) > 0.1'
severity: warning
# Alert rule: warns when the average time per completed write exceeds 100ms.
- name: Unusual disk write latency
description: Disk latency is growing (write operations > 100ms)
# Two variants of the query are listed. The first divides a millisecond
# counter (node_disk_write_time_ms) by the completed-writes counter, so its
# threshold of 100 means 100ms per write.
query: 'rate(node_disk_write_time_ms[1m]) / rate(node_disk_writes_completed[1m]) > 100'
# The second uses node_disk_write_time_seconds_total, so the ratio is in
# seconds per write: 100ms must be written as 0.1, not 100.
query: 'rate(node_disk_write_time_seconds_total[1m]) / rate(node_disk_writes_completed_total[1m]) > 0.1'
severity: warning
- name: CPU load
description: CPU load (15m) is high
@ -54,7 +54,7 @@ services:
severity: warning
# Alert rule: warns when the 5-minute rate of the context-switch counter exceeds 1000.
- name: Context switching
description: Context switching is growing on node (> 1000 / s)
# Two variants of the query are listed; they differ only in the metric name
# (node_context_switches vs. node_context_switches_total).
# No aggregation is applied, so each returned series is compared to 1000 on its own.
query: 'rate(node_context_switches[5m]) > 1000'
query: 'rate(node_context_switches_total[5m]) > 1000'
severity: warning
- name: Node has swap
description: Node has swap