blob: ce9839ef1d5a3c4eca0f42debad725d8f2bc7a3f (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
|
# you can disable an alarm notification by setting the 'to' line to: silent
# Alarm on file-system errors reported by the database engine.
# Watches the "FS errors" dimension of the netdata.dbengine_global_errors chart.
alarm: 10min_dbengine_global_fs_errors
on: netdata.dbengine_global_errors
os: linux freebsd macos
hosts: *
# Sum the dimension over the trailing 10 minutes.
lookup: sum -10m unaligned of FS errors
units: errors
every: 10s
# Any error inside the window makes the alarm critical.
crit: $this > 0
# Hold back the "recovered" notification: 15m at first, scaled by 1.5, capped at 1h.
delay: down 15m multiplier 1.5 max 1h
info: number of File-System errors dbengine came across the last 10 minutes (too many open files, wrong permissions etc)
to: sysadmin
# Alarm on I/O errors reported by the database engine.
# Watches the "I/O errors" dimension of the netdata.dbengine_global_errors chart.
alarm: 10min_dbengine_global_io_errors
on: netdata.dbengine_global_errors
os: linux freebsd macos
hosts: *
# Sum the dimension over the trailing 10 minutes.
lookup: sum -10m unaligned of I/O errors
units: errors
every: 10s
# Any error inside the window makes the alarm critical.
crit: $this > 0
# Hold back the "recovered" notification: 1h at first, scaled by 1.5, capped at 3h.
delay: down 1h multiplier 1.5 max 3h
info: number of IO errors dbengine came across the last 10 minutes (CRC errors, out of space, bad disk etc)
to: sysadmin
# Alarm on failures of the database engine to fully flush data to disk.
# Watches the "flushing errors" dimension of the netdata.dbengine_global_errors chart.
alarm: 10min_dbengine_global_flushing_errors
on: netdata.dbengine_global_errors
os: linux freebsd macos
hosts: *
# Sum the dimension over the trailing 10 minutes.
lookup: sum -10m unaligned of flushing errors
units: errors
# Evaluate on the same 10s cadence as the other dbengine error alarms in this
# file; re-running a 10-minute lookup more often adds query load without
# changing what the alarm can detect.
every: 10s
# Any error inside the window makes the alarm critical.
crit: $this > 0
# Hold back the "recovered" notification: 1h at first, scaled by 1.5, capped at 3h.
delay: down 1h multiplier 1.5 max 3h
info: number of times in the last 10 minutes that the dbengine failed to completely flush data to disk, metric data will not be stored in the database, please reduce disk load or use a faster disk
to: sysadmin
|