summaryrefslogtreecommitdiffstats
path: root/health/health.d/systemdunits.conf
blob: 38213a8dbe6f069bb82d205829a05dac900ba1f7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
## Check if there are any systemd units in the failed state (crashed).
## States: 1 - active, 2 - inactive, 3 - activating, 4 - deactivating, 5 - failed.

## Service units
## Warns when the value looked up on the attached chart equals 5, which the
## state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
## NOTE(review): this template attaches to "systemd.service_units_state" (plural
## "units"), while the other templates in this file use "<type>_unit_state".
## Confirm this matches the chart context exported by the collector; if it does
## not, this template never attaches to any chart.
 template: systemd_service_units_state
       on: systemd.service_units_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd service units are in the failed state
       to: sysadmin

## Socket units
## Warns when the value looked up on systemd.socket_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_socket_units_state
       on: systemd.socket_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd socket units are in the failed state
       to: sysadmin

## Target units
## Warns when the value looked up on systemd.target_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_target_units_state
       on: systemd.target_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd target units are in the failed state
       to: sysadmin

## Path units
## Warns when the value looked up on systemd.path_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_path_units_state
       on: systemd.path_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd path units are in the failed state
       to: sysadmin

## Device units
## Warns when the value looked up on systemd.device_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_device_units_state
       on: systemd.device_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd device units are in the failed state
       to: sysadmin

## Mount units
## Warns when the value looked up on systemd.mount_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_mount_units_state
       on: systemd.mount_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd mount units are in the failed state
       to: sysadmin

## Automount units
## Warns when the value looked up on systemd.automount_unit_state equals 5,
## which the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_automount_units_state
       on: systemd.automount_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd automount units are in the failed state
       to: sysadmin

## Swap units
## Warns when the value looked up on systemd.swap_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_swap_units_state
       on: systemd.swap_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd swap units are in the failed state
       to: sysadmin

## Scope units
## Warns when the value looked up on systemd.scope_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_scope_units_state
       on: systemd.scope_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd scope units are in the failed state
       to: sysadmin

## Slice units
## Warns when the value looked up on systemd.slice_unit_state equals 5, which
## the state list at the top of this file maps to "failed".
## Evaluated every 10s using the max over the last 1s of data (min2max option);
## notifications go to sysadmin. The "down" (recovery) notification is held back
## 5m, scaled by 1.5 on repeated state changes, capped at 1h.
 template: systemd_slice_units_state
       on: systemd.slice_unit_state
    class: Errors
     type: Linux
component: Systemd units
   lookup: max -1s min2max
    units: ok/failed
    every: 10s
     warn: $this != nan AND $this == 5
    delay: down 5m multiplier 1.5 max 1h
     info: one or more systemd slice units are in the failed state
       to: sysadmin