summaryrefslogtreecommitdiffstats
path: root/src/health/health.d/zfs.conf
diff options
context:
space:
mode:
Diffstat (limited to 'src/health/health.d/zfs.conf')
-rw-r--r--src/health/health.d/zfs.conf90
1 files changed, 90 insertions, 0 deletions
diff --git a/src/health/health.d/zfs.conf b/src/health/health.d/zfs.conf
new file mode 100644
index 000000000..9c1f0018b
--- /dev/null
+++ b/src/health/health.d/zfs.conf
@@ -0,0 +1,90 @@
+
+ alarm: zfs_memory_throttle
+ on: zfs.memory_ops
+ class: Utilization
+ type: System
+component: File system
+ lookup: sum -10m unaligned absolute of throttled
+ units: events
+ every: 1m
+ warn: $this > 0
+ delay: down 1h multiplier 1.5 max 2h
+ summary: ZFS ARC growth throttling
+ info: number of times ZFS had to limit the ARC growth in the last 10 minutes
+ to: silent
+
+# ZFS pool state
+
+ template: zfs_pool_state_warn
+ on: zfspool.state
+ class: Errors
+ type: System
+component: File system
+ calc: $degraded
+ units: boolean
+ every: 10s
+ warn: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is degraded
+ to: sysadmin
+
+ template: zfs_pool_state_crit
+ on: zfspool.state
+ class: Errors
+ type: System
+component: File system
+ calc: $faulted + $unavail
+ units: boolean
+ every: 10s
+ crit: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: Critical ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is faulted or unavail
+ to: sysadmin
+
+
+## go.d/zfspool
+
+ template: zfs_pool_space_utilization
+ on: zfspool.pool_space_utilization
+ class: Utilization
+ type: System
+component: File system
+ calc: $utilization
+ units: %
+ every: 1m
+ warn: $this > (($status >= $WARNING ) ? (85) : (90))
+ crit: $this > (($status >= $WARNING ) ? (90) : (98))
+ delay: down 1m multiplier 1.5 max 1h
+ summary: ZFS pool ${label:pool} space utilization
+ info: ZFS pool ${label:pool} is nearing capacity. Current space usage is above the threshold.
+ to: sysadmin
+
+ template: zfs_pool_health_state_warn
+ on: zfspool.pool_health_state
+ class: Errors
+ type: System
+component: File system
+ calc: $degraded
+ units: boolean
+ every: 10s
+ warn: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is degraded
+ to: sysadmin
+
+ template: zfs_pool_health_state_crit
+ on: zfspool.pool_health_state
+ class: Errors
+ type: System
+component: File system
+ calc: $faulted + $unavail
+ units: boolean
+ every: 10s
+ crit: $this > 0
+ delay: down 1m multiplier 1.5 max 1h
+ summary: Critical ZFS pool ${label:pool} state
+ info: ZFS pool ${label:pool} state is faulted or unavail
+ to: sysadmin