# path: root/health/health.d/btrfs.conf
# blob: b2a50682b4cddd3a1a41c861a11e20104ceb02b2
#
# Health alarm templates for BTRFS: space allocation/utilization and
# per-device error counters.

 # Percentage of the physical disk space that BTRFS has already allocated to
 # data, metadata and system chunks, evaluated on btrfs.disk charts every 10s.
 #
 # calc: 100 minus the unallocated share of the total, where the total is
 #       unallocated + used/free data + used/free metadata + used/free system.
 # warn: raised above 98%; once the alarm is in WARNING it is held until the
 #       value drops to 95% or below (hysteresis). The status test must be
 #       ">= $WARNING": this template has no crit line, so a test against
 #       $CRITICAL could never be true and the 95% branch would be dead.
 # to:   silent. The value is also referenced by the btrfs_data,
 #       btrfs_metadata and btrfs_system templates as $btrfs_allocated.
 template: btrfs_allocated
       on: btrfs.disk
    class: Utilization
     type: System
component: File system
       os: *
    hosts: *
     calc: 100 - ($unallocated * 100 / ($unallocated + $data_used + $data_free + $meta_used + $meta_free + $sys_used + $sys_free))
    units: %
    every: 10s
     warn: $this > (($status >= $WARNING) ? (95) : (98))
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: percentage of allocated BTRFS physical disk space
       to: silent

 # Utilization of the space BTRFS has allocated for data, evaluated on
 # btrfs.data charts every 10s.
 #
 # calc: used as a percentage of (used + free).
 # warn: above 95%, or above 90% while the alarm is already WARNING or worse.
 # crit: above 98%, or above 95% while the alarm is already CRITICAL.
 # Both levels additionally require $btrfs_allocated > 98, i.e. the value of
 # the btrfs_allocated template (allocated physical disk space) must also be
 # above 98%.
 template: btrfs_data
       on: btrfs.data
    class: Utilization
     type: System
component: File system
       os: *
    hosts: *
     calc: $used * 100 / ($used + $free)
    units: %
    every: 10s
     warn: $this > (($status >= $WARNING)  ? (90) : (95)) && $btrfs_allocated > 98
     crit: $this > (($status == $CRITICAL) ? (95) : (98)) && $btrfs_allocated > 98
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: utilization of BTRFS data space
       to: sysadmin

 # Utilization of the space BTRFS has allocated for metadata, evaluated on
 # btrfs.metadata charts every 10s.
 #
 # calc: (used + reserved) as a percentage of (used + free + reserved); unlike
 #       the data and system templates, reserved space is counted as consumed.
 # warn: above 95%, or above 90% while the alarm is already WARNING or worse.
 # crit: above 98%, or above 95% while the alarm is already CRITICAL.
 # Both levels additionally require $btrfs_allocated > 98, i.e. the value of
 # the btrfs_allocated template (allocated physical disk space) must also be
 # above 98%.
 template: btrfs_metadata
       on: btrfs.metadata
    class: Utilization
     type: System
component: File system
       os: *
    hosts: *
     calc: ($used + $reserved) * 100 / ($used + $free + $reserved)
    units: %
    every: 10s
     warn: $this > (($status >= $WARNING)  ? (90) : (95)) && $btrfs_allocated > 98
     crit: $this > (($status == $CRITICAL) ? (95) : (98)) && $btrfs_allocated > 98
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: utilization of BTRFS metadata space
       to: sysadmin

 # Utilization of the space BTRFS has allocated for system chunks, evaluated
 # on btrfs.system charts every 10s.
 #
 # calc: used as a percentage of (used + free).
 # warn: above 95%, or above 90% while the alarm is already WARNING or worse.
 # crit: above 98%, or above 95% while the alarm is already CRITICAL.
 # Both levels additionally require $btrfs_allocated > 98, i.e. the value of
 # the btrfs_allocated template (allocated physical disk space) must also be
 # above 98%.
 template: btrfs_system
       on: btrfs.system
    class: Utilization
     type: System
component: File system
       os: *
    hosts: *
     calc: $used * 100 / ($used + $free)
    units: %
    every: 10s
     warn: $this > (($status >= $WARNING)  ? (90) : (95)) && $btrfs_allocated > 98
     crit: $this > (($status == $CRITICAL) ? (95) : (98)) && $btrfs_allocated > 98
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: utilization of BTRFS system space
       to: sysadmin

 # Read errors reported on btrfs.device_errors charts.
 #
 # lookup: maximum of the read_errs dimension over the last 10 minutes,
 #         refreshed every minute.
 # warn:   any non-zero value raises WARNING (this template defines no crit).
 template: btrfs_device_read_errors
       on: btrfs.device_errors
    class: Errors
     type: System
component: File system
       os: *
    hosts: *
    units: errors
   lookup: max -10m every 1m of read_errs
     warn: $this > 0
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: number of encountered BTRFS read errors
       to: sysadmin

 # Write errors reported on btrfs.device_errors charts.
 #
 # lookup: maximum of the write_errs dimension over the last 10 minutes,
 #         refreshed every minute.
 # crit:   any non-zero value raises CRITICAL directly (no warn level).
 template: btrfs_device_write_errors
       on: btrfs.device_errors
    class: Errors
     type: System
component: File system
       os: *
    hosts: *
    units: errors
   lookup: max -10m every 1m of write_errs
     crit: $this > 0
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: number of encountered BTRFS write errors
       to: sysadmin

 # Flush errors reported on btrfs.device_errors charts.
 #
 # lookup: maximum of the flush_errs dimension over the last 10 minutes,
 #         refreshed every minute.
 # crit:   any non-zero value raises CRITICAL directly (no warn level).
 template: btrfs_device_flush_errors
       on: btrfs.device_errors
    class: Errors
     type: System
component: File system
       os: *
    hosts: *
    units: errors
   lookup: max -10m every 1m of flush_errs
     crit: $this > 0
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: number of encountered BTRFS flush errors
       to: sysadmin

 # Corruption errors reported on btrfs.device_errors charts.
 #
 # lookup: maximum of the corruption_errs dimension over the last 10 minutes,
 #         refreshed every minute.
 # warn:   any non-zero value raises WARNING (this template defines no crit).
 # NOTE(review): write/flush errors in this file use crit while corruption
 # only warns - confirm this severity is intentional.
 template: btrfs_device_corruption_errors
       on: btrfs.device_errors
    class: Errors
     type: System
component: File system
       os: *
    hosts: *
    units: errors
   lookup: max -10m every 1m of corruption_errs
     warn: $this > 0
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: number of encountered BTRFS corruption errors
       to: sysadmin

 # Generation errors reported on btrfs.device_errors charts.
 #
 # lookup: maximum of the generation_errs dimension over the last 10 minutes,
 #         refreshed every minute.
 # warn:   any non-zero value raises WARNING (this template defines no crit).
 template: btrfs_device_generation_errors
       on: btrfs.device_errors
    class: Errors
     type: System
component: File system
       os: *
    hosts: *
    units: errors
   lookup: max -10m every 1m of generation_errs
     warn: $this > 0
    delay: up 1m down 15m multiplier 1.5 max 1h
     info: number of encountered BTRFS generation errors
       to: sysadmin