summaryrefslogtreecommitdiffstats
path: root/src/health/health.d/zfs.conf
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-07-24 09:54:23 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-07-24 09:54:44 +0000
commit836b47cb7e99a977c5a23b059ca1d0b5065d310e (patch)
tree1604da8f482d02effa033c94a84be42bc0c848c3 /src/health/health.d/zfs.conf
parentReleasing debian version 1.44.3-2. (diff)
downloadnetdata-836b47cb7e99a977c5a23b059ca1d0b5065d310e.tar.xz
netdata-836b47cb7e99a977c5a23b059ca1d0b5065d310e.zip
Merging upstream version 1.46.3.
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to '')
-rw-r--r--src/health/health.d/zfs.conf90
1 files changed, 90 insertions, 0 deletions
diff --git a/src/health/health.d/zfs.conf b/src/health/health.d/zfs.conf
new file mode 100644
index 000000000..9c1f0018b
--- /dev/null
+++ b/src/health/health.d/zfs.conf
@@ -0,0 +1,90 @@
+
+ alarm: zfs_memory_throttle
+ on: zfs.memory_ops
+ class: Utilization
+ type: System
+component: File system
+ lookup: sum -10m unaligned absolute of throttled
+ units: events
+ every: 1m
+ warn: $this > 0
+ delay: down 1h multiplier 1.5 max 2h
+ summary: ZFS ARC growth throttling
+ info: number of times ZFS had to limit the ARC growth in the last 10 minutes
+ to: silent
+
+# ZFS pool state (templates attached to the zfspool.state chart)
+
+ template: zfs_pool_state_warn
+ on: zfspool.state
+ class: Errors
+ type: System
+component: File system
+ calc: $degraded
+ units: boolean
+ every: 10s
+ warn: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is degraded
+ to: sysadmin
+
+ template: zfs_pool_state_crit
+ on: zfspool.state
+ class: Errors
+ type: System
+component: File system
+ calc: $faulted + $unavail
+ units: boolean
+ every: 10s
+ crit: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: Critical ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is faulted or unavail
+ to: sysadmin
+
+
+# go.d/zfspool: pool space utilization and pool health state
+
+ template: zfs_pool_space_utilization
+ on: zfspool.pool_space_utilization
+ class: Utilization
+ type: System
+component: File system
+ calc: $utilization
+ units: %
+ every: 1m
+ warn: $this > (($status >= $WARNING ) ? (85) : (90))
+ crit: $this > (($status == $CRITICAL) ? (90) : (98))
+ delay: down 1m multiplier 1.5 max 1h
+ summary: ZFS pool ${label:pool} space utilization
+ info: ZFS pool ${label:pool} is nearing capacity. Current space usage is above the threshold.
+ to: sysadmin
+
+ template: zfs_pool_health_state_warn
+ on: zfspool.pool_health_state
+ class: Errors
+ type: System
+component: File system
+ calc: $degraded
+ units: boolean
+ every: 10s
+ warn: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is degraded
+ to: sysadmin
+
+ template: zfs_pool_health_state_crit
+ on: zfspool.pool_health_state
+ class: Errors
+ type: System
+component: File system
+ calc: $faulted + $unavail
+ units: boolean
+ every: 10s
+ crit: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: Critical ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is faulted or unavail
+ to: sysadmin