# path: root/health/health.d/upsd.conf
# blob: 703a648812997b1e8bbc6ee860fe8b68567afb5a
# you can disable an alarm notification by setting the 'to' line to: silent

 # UPS load alert: evaluated once a minute on the 10-minute average of the
 # `load` dimension of upsd.ups_load charts (value is a percentage).
 #
 # warn/crit use hysteresis driven by the alert's current $status:
 #   - WARNING  is raised above 80% and is kept until the value is no longer above 70%.
 #   - CRITICAL is raised above 95% and is kept until the value is no longer above 85%.
 #
 # The `delay: down ...` line postpones notifications when the alert status
 # de-escalates (see the Netdata health reference for the exact
 # multiplier/max semantics).
 template: upsd_10min_ups_load
       on: upsd.ups_load
    class: Utilization
     type: Power Supply
component: UPS
       os: *
    hosts: *
   lookup: average -10m unaligned of load
    units: %
    every: 1m
     warn: $this > (($status >= $WARNING)  ? (70) : (80))
     crit: $this > (($status == $CRITICAL) ? (85) : (95))
    delay: down 10m multiplier 1.5 max 1h
  summary: UPS ${label:ups_name} load
     info: UPS ${label:ups_name} average load over the last 10 minutes
       to: sitemgr

 # UPS battery charge alert: evaluated every 60 seconds on the 60-second
 # average of the `charge` dimension of upsd.ups_battery_charge charts
 # (value is a percentage).
 #
 # Fixed thresholds, no hysteresis:
 #   - WARNING  when the average charge is below 75%.
 #   - CRITICAL when the average charge is below 40%.
 #
 # The `delay: down ...` line postpones notifications when the alert status
 # de-escalates (see the Netdata health reference for the exact
 # multiplier/max semantics).
 template: upsd_ups_battery_charge
       on: upsd.ups_battery_charge
    class: Errors
     type: Power Supply
component: UPS
       os: *
    hosts: *
   lookup: average -60s unaligned of charge
    units: %
    every: 60s
     warn: $this < 75
     crit: $this < 40
    delay: down 10m multiplier 1.5 max 1h
  summary: UPS ${label:ups_name} battery charge
     info: UPS ${label:ups_name} average battery charge over the last minute
       to: sitemgr

 # Data-collection staleness alert: every 10 seconds computes the number of
 # seconds between now and the last collection time ($now - $last_collected_t)
 # for upsd.ups_load charts.
 #
 # warn/crit use hysteresis driven by the alert's current $status:
 #   - WARNING  is raised when the gap exceeds  5 * $update_every and is kept
 #     until the gap is no longer above $update_every.
 #   - CRITICAL is raised when the gap exceeds 60 * $update_every and is kept
 #     until the gap is no longer above $update_every.
 #
 # The `delay: down ...` line postpones notifications when the alert status
 # de-escalates (see the Netdata health reference for the exact
 # multiplier/max semantics).
 template: upsd_ups_last_collected_secs
       on: upsd.ups_load
    class: Latency
     type: Power Supply
component: UPS device
     calc: $now - $last_collected_t
    every: 10s
    units: seconds ago
     warn: $this > (($status >= $WARNING)  ? ($update_every) : ( 5 * $update_every))
     crit: $this > (($status == $CRITICAL) ? ($update_every) : (60 * $update_every))
    delay: down 5m multiplier 1.5 max 1h
  summary: UPS ${label:ups_name} last collected
     info: UPS ${label:ups_name} number of seconds since the last successful data collection
       to: sitemgr