Netdata Alert configs
This commit is contained in:
parent
010397002b
commit
c1613be214
4 changed files with 53 additions and 0 deletions
32
home/dot_config/netdata/health.d/cpu.conf
Normal file
32
home/dot_config/netdata/health.d/cpu.conf
Normal file
|
@ -0,0 +1,32 @@
|
|||
alarm: cpu_usage
|
||||
on: system.cpu
|
||||
lookup: average -1m percentage foreach user,system
|
||||
units: %
|
||||
every: 5m
|
||||
warn: $this > 50
|
||||
crit: $this > 70
|
||||
info: CPU utilization of users or the system
|
||||
|
||||
template: ml_5min_cpu_dims
|
||||
on: system.cpu
|
||||
os: linux
|
||||
hosts: *
|
||||
lookup: average -5m anomaly-bit foreach *
|
||||
calc: $this
|
||||
units: %
|
||||
every: 30s
|
||||
warn: $this > (($status >= $WARNING) ? (5) : (20))
|
||||
crit: $this > (($status == $CRITICAL) ? (20) : (100))
|
||||
info: Rolling 5min anomaly rate for each system.cpu dimension
|
||||
|
||||
template: ml_5min_cpu_chart
|
||||
on: system.cpu
|
||||
os: linux
|
||||
hosts: *
|
||||
lookup: average -5m anomaly-bit of *
|
||||
calc: $this
|
||||
units: %
|
||||
every: 30s
|
||||
warn: $this > (($status >= $WARNING) ? (5) : (20))
|
||||
crit: $this > (($status == $CRITICAL) ? (20) : (100))
|
||||
info: Rolling 5min anomaly rate for system.cpu chart
|
7
home/dot_config/netdata/health.d/disks.conf
Normal file
7
home/dot_config/netdata/health.d/disks.conf
Normal file
|
@ -0,0 +1,7 @@
|
|||
template: disk_full_percent
|
||||
on: disk.space
|
||||
calc: $used * 100 / ($avail + $used)
|
||||
every: 60m
|
||||
warn: $this > 70
|
||||
crit: $this > 85
|
||||
info: Disk usage on the system
|
6
home/dot_config/netdata/health.d/network.conf
Normal file
6
home/dot_config/netdata/health.d/network.conf
Normal file
|
@ -0,0 +1,6 @@
|
|||
template: 30min_packet_drops
|
||||
on: net.drops
|
||||
lookup: sum -30m unaligned absolute
|
||||
every: 10s
|
||||
crit: $this > 0
|
||||
info: Dropped network packets
|
8
home/dot_config/netdata/health.d/ram.conf
Normal file
8
home/dot_config/netdata/health.d/ram.conf
Normal file
|
@ -0,0 +1,8 @@
|
|||
alarm: ram_usage
|
||||
on: system.ram
|
||||
lookup: average -1m percentage of used
|
||||
units: %
|
||||
every: 5m
|
||||
warn: $this > 50
|
||||
crit: $this > 90
|
||||
info: RAM utilization of the system
|
Loading…
Reference in a new issue