collectors/python.d.plugin/zscores/metadata.yaml


1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187

plugin_name: python.d.plugin
modules:
  - meta:
      plugin_name: python.d.plugin
      module_name: zscores
      monitored_instance:
        name: python.d zscores
        link: https://en.wikipedia.org/wiki/Standard_score
        categories:
          - data-collection.other
        icon_filename: ""
      related_resources:
        integrations:
          list: []
      info_provided_to_referring_integrations:
        description: ""
      keywords:
        - zscore
        - z-score
        - standard score
        - standard deviation
        - anomaly detection
        - statistical anomaly detection
      most_popular: false
    overview:
      data_collection:
        metrics_description: |
          By using smoothed, rolling [Z-Scores](https://en.wikipedia.org/wiki/Standard_score) for selected metrics or charts you can narrow down your focus and shorten root cause analysis.
        method_description: |
          This collector uses the [Netdata rest api](https://github.com/netdata/netdata/blob/master/web/api/README.md) to get the `mean` and `stddev`
          for each dimension on specified charts over a time range (defined by `train_secs` and `offset_secs`).
          
          For each dimension it will calculate a Z-Score as `z = (x - mean) / stddev` (clipped at `z_clip`). Scores are then smoothed over
          time (`z_smooth_n`) and, if `mode: 'per_chart'`, aggregated across dimensions to a smoothed, rolling chart level Z-Score at each time step.
      supported_platforms:
        include: []
        exclude: []
      multi_instance: true
      additional_permissions:
        description: ""
      default_behavior:
        auto_detection:
          description: ""
        limits:
          description: ""
        performance_impact:
          description: ""
    setup:
      prerequisites:
        list:
          - title: Python Requirements
            description: |
              This collector will only work with Python 3 and requires the below packages be installed.
              
              ```bash
              # become netdata user
              sudo su -s /bin/bash netdata
              # install required packages
              pip3 install numpy pandas requests netdata-pandas==0.0.38
              ```
      configuration:
        file:
          name: python.d/zscores.conf
          description: ""
        options:
          description: |
            There are 2 sections:
            
            * Global variables
            * One or more JOBS that can define multiple different instances to monitor.
            
            The following options can be defined globally: priority, penalty, autodetection_retry, update_every, but can also be defined per JOB to override the global values.
            
            Additionally, the following collapsed table contains all the options that can be configured inside a JOB definition.
            
            Every configuration JOB starts with a `job_name` value which will appear in the dashboard, unless a `name` parameter is specified.
          folding:
            title: "Config options"
            enabled: true
          list:
            - name: charts_regex
              description: what charts to pull data for - A regex like `system\..*|` or `system\..*|apps.cpu|apps.mem` etc.
              default_value: "system\\..*"
              required: true
            - name: train_secs
              description: length of time (in seconds) to base calculations off for mean and stddev.
              default_value: 14400
              required: true
            - name: offset_secs
              description: offset (in seconds) preceding latest data to ignore when calculating mean and stddev.
              default_value: 300
              required: true
            - name: train_every_n
              description: recalculate the mean and stddev every n steps of the collector.
              default_value: 900
              required: true
            - name: z_smooth_n
              description: smooth the z score (to reduce sensitivity to spikes) by averaging it over last n values.
              default_value: 15
              required: true
            - name: z_clip
              description: cap absolute value of zscore (before smoothing) for better stability.
              default_value: 10
              required: true
            - name: z_abs
              description: "set z_abs: 'true' to make all zscores be absolute values only."
              default_value: "true"
              required: true
            - name: burn_in
              description: burn in period in which to initially calculate mean and stddev on every step.
              default_value: 2
              required: true
            - name: mode
              description: mode can be to get a zscore 'per_dim' or 'per_chart'.
              default_value: per_chart
              required: true
            - name: per_chart_agg
              description: per_chart_agg is how you aggregate from dimension to chart when mode='per_chart'.
              default_value: mean
              required: true
            - name: update_every
              description: Sets the default data collection frequency.
              default_value: 5
              required: false
            - name: priority
              description: Controls the order of charts at the netdata dashboard.
              default_value: 60000
              required: false
            - name: autodetection_retry
              description: Sets the job re-check interval in seconds.
              default_value: 0
              required: false
            - name: penalty
              description: Indicates whether to apply penalty to update_every in case of failures.
              default_value: yes
              required: false
        examples:
          folding:
            enabled: true
            title: "Config"
          list:
            - name: Default
              description: Default configuration.
              folding:
                enabled: false
              config: |
                local:
                  name: 'local'
                  host: '127.0.0.1:19999'
                  charts_regex: 'system\..*'
                  charts_to_exclude: 'system.uptime'
                  train_secs: 14400
                  offset_secs: 300
                  train_every_n: 900
                  z_smooth_n: 15
                  z_clip: 10
                  z_abs: 'true'
                  burn_in: 2
                  mode: 'per_chart'
                  per_chart_agg: 'mean'
    troubleshooting:
      problems:
        list: []
    alerts: []
    metrics:
      folding:
        title: Metrics
        enabled: false
      description: ""
      availability: []
      scopes:
        - name: global
          description: "These metrics refer to the entire monitored application."
          labels: []
          metrics:
            - name: zscores.z
              description: Z Score
              unit: "z"
              chart_type: line
              dimensions:
                - name: a dimension per chart or dimension
            - name: zscores.3stddev
              description: Z Score >3
              unit: "count"
              chart_type: stacked
              dimensions:
                - name: a dimension per chart or dimension