// SPDX-License-Identifier: GPL-3.0-or-later
var netdataDashboard = window.netdataDashboard || {};
// Informational content for the various sections of the GUI (menus, sections, charts, etc.)
// ----------------------------------------------------------------------------
// Menus
netdataDashboard.menu = {
'system': {
title: 'System Overview',
icon: '',
info: 'Overview of the key system metrics.'
},
'services': {
title: 'systemd Services',
icon: '',
info: 'Resources utilization of systemd services. netdata monitors all systemd services via CGROUPS ' +
'(the resources accounting used by containers). '
},
'ap': {
title: 'Access Points',
icon: '',
info: 'Performance metrics for the access points (i.e. wireless interfaces in AP mode) found on the system.'
},
'tc': {
title: 'Quality of Service',
icon: '',
info: 'Netdata collects and visualizes tc
class utilization using its ' +
'tc-helper plugin. ' +
'If you also use FireQOS for setting up QoS, ' +
'netdata automatically collects interface and class names. If your QoS configuration includes overheads ' +
'calculation, the values shown here will include these overheads (the total bandwidth for the same ' +
'interface as reported in the Network Interfaces section, will be lower than the total bandwidth ' +
'reported here). QoS data collection may have a slight time difference compared to the interface ' +
'(QoS data collection uses a BASH script, so a shift in data collection of a few milliseconds ' +
'should be justified).'
},
'net': {
title: 'Network Interfaces',
icon: '',
info: 'Performance metrics for network interfaces.'
},
'ip': {
title: 'Networking Stack',
icon: '',
info: function (os) {
if(os === "linux")
return 'Metrics for the networking stack of the system. These metrics are collected from /proc/net/netstat
, apply to both IPv4 and IPv6 traffic and are related to operation of the kernel networking stack.';
else
return 'Metrics for the networking stack of the system.';
}
},
'ipv4': {
title: 'IPv4 Networking',
icon: '',
info: 'Metrics for the IPv4 stack of the system. ' +
'Internet Protocol version 4 (IPv4) is ' +
'the fourth version of the Internet Protocol (IP). It is one of the core protocols of standards-based ' +
'internetworking methods in the Internet. IPv4 is a connectionless protocol for use on packet-switched ' +
'networks. It operates on a best effort delivery model, in that it does not guarantee delivery, nor does ' +
'it assure proper sequencing or avoidance of duplicate delivery. These aspects, including data integrity, ' +
'are addressed by an upper layer transport protocol, such as the Transmission Control Protocol (TCP).'
},
'ipv6': {
title: 'IPv6 Networking',
icon: '',
info: 'Metrics for the IPv6 stack of the system. Internet Protocol version 6 (IPv6) is the most recent version of the Internet Protocol (IP), the communications protocol that provides an identification and location system for computers on networks and routes traffic across the Internet. IPv6 was developed by the Internet Engineering Task Force (IETF) to deal with the long-anticipated problem of IPv4 address exhaustion. IPv6 is intended to replace IPv4.'
},
'sctp': {
title: 'SCTP Networking',
icon: '',
info: 'Stream Control Transmission Protocol (SCTP) is a computer network protocol which operates at the transport layer and serves a role similar to the popular protocols TCP and UDP. SCTP provides some of the features of both UDP and TCP: it is message-oriented like UDP and ensures reliable, in-sequence transport of messages with congestion control like TCP. It differs from those protocols by providing multi-homing and redundant paths to increase resilience and reliability.'
},
'ipvs': {
title: 'IP Virtual Server',
icon: '',
info: 'IPVS (IP Virtual Server) implements transport-layer load balancing inside the Linux kernel, so called Layer-4 switching. IPVS running on a host acts as a load balancer at the front of a cluster of real servers, it can direct requests for TCP/UDP based services to the real servers, and makes services of the real servers to appear as a virtual service on a single IP address.'
},
'netfilter': {
title: 'Firewall (netfilter)',
icon: '',
info: 'Performance metrics of the netfilter components.'
},
'ipfw': {
title: 'Firewall (ipfw)',
icon: '',
info: 'Counters and memory usage for the ipfw rules.'
},
'cpu': {
title: 'CPUs',
icon: '',
info: 'Detailed information for each CPU of the system. A summary of the system for all CPUs can be found at the System Overview section.'
},
'mem': {
title: 'Memory',
icon: '',
info: 'Detailed information about the memory management of the system.'
},
'disk': {
title: 'Disks',
icon: '',
info: 'Charts with performance information for all the system disks. Special care has been given to present disk performance metrics in a way compatible with iostat -x
. netdata by default prevents rendering performance charts for individual partitions and unmounted virtual disks. Disabled charts can still be enabled by configuring the relative settings in the netdata configuration file.'
},
'sensors': {
title: 'Sensors',
icon: '',
info: 'Readings of the configured system sensors.'
},
'ipmi': {
title: 'IPMI',
icon: '',
info: 'The Intelligent Platform Management Interface (IPMI) is a set of computer interface specifications for an autonomous computer subsystem that provides management and monitoring capabilities independently of the host system\'s CPU, firmware (BIOS or UEFI) and operating system.'
},
'samba': {
title: 'Samba',
icon: '',
info: 'Performance metrics of the Samba file share operations of this system. Samba is a implementation of Windows services, including Windows SMB protocol file shares.'
},
'nfsd': {
title: 'NFS Server',
icon: '',
info: 'Performance metrics of the Network File Server. NFS is a distributed file system protocol, allowing a user on a client computer to access files over a network, much like local storage is accessed. NFS, like many other protocols, builds on the Open Network Computing Remote Procedure Call (ONC RPC) system. The NFS is an open standard defined in Request for Comments (RFC).'
},
'nfs': {
title: 'NFS Client',
icon: '',
info: 'Performance metrics of the NFS operations of this system, acting as an NFS client.'
},
'zfs': {
title: 'ZFS filesystem',
icon: '',
info: 'Performance metrics of the ZFS filesystem. The following charts visualize all metrics reported by arcstat.py and arc_summary.py.'
},
'btrfs': {
title: 'BTRFS filesystem',
icon: '',
info: 'Disk space metrics for the BTRFS filesystem.'
},
'apps': {
title: 'Applications',
icon: '',
info: 'Per application statistics are collected using netdata\'s apps.plugin
. This plugin walks through all processes and aggregates statistics for applications of interest, defined in /etc/netdata/apps_groups.conf
, which can be edited by running $ /etc/netdata/edit-config apps_groups.conf
(the default is here). The plugin internally builds a process tree (much like ps fax
does), and groups processes together (evaluating both child and parent processes) so that the result is always a chart with a predefined set of dimensions (of course, only application groups found running are reported). The reported values are compatible with top
, although the netdata plugin counts also the resources of exited children (unlike top
which shows only the resources of the currently running processes). So for processes like shell scripts, the reported values include the resources used by the commands these scripts run within each timeframe.',
height: 1.5
},
'users': {
title: 'Users',
icon: '',
info: 'Per user statistics are collected using netdata\'s apps.plugin
. This plugin walks through all processes and aggregates statistics per user. The reported values are compatible with top
, although the netdata plugin counts also the resources of exited children (unlike top
which shows only the resources of the currently running processes). So for processes like shell scripts, the reported values include the resources used by the commands these scripts run within each timeframe.',
height: 1.5
},
'groups': {
title: 'User Groups',
icon: '',
info: 'Per user group statistics are collected using netdata\'s apps.plugin
. This plugin walks through all processes and aggregates statistics per user group. The reported values are compatible with top
, although the netdata plugin counts also the resources of exited children (unlike top
which shows only the resources of the currently running processes). So for processes like shell scripts, the reported values include the resources used by the commands these scripts run within each timeframe.',
height: 1.5
},
'netdata': {
title: 'Netdata Monitoring',
icon: '',
info: 'Performance metrics for the operation of netdata itself and its plugins.'
},
'example': {
title: 'Example Charts',
info: 'Example charts, demonstrating the external plugin architecture.'
},
'cgroup': {
title: '',
icon: '',
info: 'Container resource utilization metrics. Netdata reads this information from cgroups (abbreviated from control groups), a Linux kernel feature that limits and accounts resource usage (CPU, memory, disk I/O, network, etc.) of a collection of processes. cgroups together with namespaces (that offer isolation between processes) provide what we usually call: containers.'
},
'cgqemu': {
title: '',
icon: '',
info: 'QEMU virtual machine resource utilization metrics. QEMU (short for Quick Emulator) is a free and open-source hosted hypervisor that performs hardware virtualization.'
},
'fping': {
title: 'fping',
icon: '',
info: 'Network latency statistics, via fping. fping is a program to send ICMP echo probes to network hosts, similar to ping
, but much better performing when pinging multiple hosts. fping versions after 3.15 can be directly used as netdata plugins.'
},
'httpcheck': {
title: 'Http Check',
icon: '',
info: 'Web Service availability and latency monitoring using HTTP checks. This plugin is a specialized version of the port check plugin.'
},
'memcached': {
title: 'memcached',
icon: '',
info: 'Performance metrics for memcached. Memcached is a general-purpose distributed memory caching system. It is often used to speed up dynamic database-driven websites by caching data and objects in RAM to reduce the number of times an external data source (such as a database or API) must be read.'
},
'monit': {
title: 'monit',
icon: '',
info: 'Statuses of checks in monit. Monit is a utility for managing and monitoring processes, programs, files, directories and filesystems on a Unix system. Monit conducts automatic maintenance and repair and can execute meaningful causal actions in error situations.'
},
'mysql': {
title: 'MySQL',
icon: '',
info: 'Performance metrics for mysql, the open-source relational database management system (RDBMS).'
},
'postgres': {
title: 'Postgres',
icon: '',
info: 'Performance metrics for PostgresSQL, the object-relational database (ORDBMS).'
},
'redis': {
title: 'Redis',
icon: '',
info: 'Performance metrics for redis. Redis (REmote DIctionary Server) is a software project that implements data structure servers. It is open-source, networked, in-memory, and stores keys with optional durability.'
},
'rethinkdbs': {
title: 'RethinkDB',
icon: '',
info: 'Performance metrics for rethinkdb. RethinkDB is the first open-source scalable database built for realtime applications'
},
'retroshare': {
title: 'RetroShare',
icon: '',
info: 'Performance metrics for RetroShare. RetroShare is open source software for encrypted filesharing, serverless email, instant messaging, online chat, and BBS, based on a friend-to-friend network built on GNU Privacy Guard (GPG).'
},
'ipfs': {
title: 'IPFS',
icon: '',
info: 'Performance metrics for the InterPlanetary File System (IPFS), a content-addressable, peer-to-peer hypermedia distribution protocol.'
},
'phpfpm': {
title: 'PHP-FPM',
icon: '',
info: 'Performance metrics for PHP-FPM, an alternative FastCGI implementation for PHP.'
},
'portcheck': {
title: 'Port Check',
icon: '',
info: 'Service availability and latency monitoring using port checks.'
},
'postfix': {
title: 'postfix',
icon: '',
info: undefined
},
'dovecot': {
title: 'Dovecot',
icon: '',
info: undefined
},
'hddtemp': {
title: 'HDD Temp',
icon: '',
info: undefined
},
'nginx': {
title: 'nginx',
icon: '',
info: undefined
},
'apache': {
title: 'Apache',
icon: '',
info: undefined
},
'lighttpd': {
title: 'Lighttpd',
icon: '',
info: undefined
},
'web_log': {
title: undefined,
icon: '',
info: 'Information extracted from a server log file. web_log
plugin incrementally parses the server log file to provide, in real-time, a break down of key server performance metrics. For web servers, an extended log file format may optionally be used (for nginx
and apache
) offering timing information and bandwidth for both requests and responses. web_log
plugin may also be configured to provide a break down of requests per URL pattern (check /etc/netdata/python.d/web_log.conf
).'
},
'named': {
title: 'named',
icon: '',
info: undefined
},
'squid': {
title: 'squid',
icon: '',
info: undefined
},
'nut': {
title: 'UPS',
icon: '',
info: undefined
},
'apcupsd': {
title: 'UPS',
icon: '',
info: undefined
},
'smawebbox': {
title: 'Solar Power',
icon: '',
info: undefined
},
'fronius': {
title: 'Fronius',
icon: '',
info: undefined
},
'stiebeleltron': {
title: 'Stiebel Eltron',
icon: '',
info: undefined
},
'snmp': {
title: 'SNMP',
icon: '',
info: undefined
},
'go_expvar': {
title: 'Go - expvars',
icon: '',
info: 'Statistics about running Go applications exposed by the expvar package.'
},
'chrony': {
icon: '',
info: 'chronyd parameters about the system’s clock performance.'
},
'couchdb': {
icon: '',
info: 'Performance metrics for CouchDB, the open-source, JSON document-based database with an HTTP API and multi-master replication.'
},
'beanstalk': {
title: 'Beanstalkd',
icon: '',
info: 'Provides statistics on the beanstalkd server and any tubes available on that server using data pulled from beanstalkc'
},
'rabbitmq': {
title: 'RabbitMQ',
icon: '',
info: 'Performance data for the RabbitMQ open-source message broker.'
},
'ceph': {
title: 'Ceph',
icon: '',
info: 'Provides statistics on the ceph cluster server, the open-source distributed storage system.'
},
'ntpd': {
title: 'ntpd',
icon: '',
info: 'Provides statistics for the internal variables of the Network Time Protocol daemon ntpd and optional including the configured peers (if enabled in the module configuration). The module presents the performance metrics as shown by ntpq (the standard NTP query program) using NTP mode 6 UDP packets to communicate with the NTP server.'
},
'spigotmc': {
title: 'Spigot MC',
icon: '',
info: 'Provides basic performance statistics for the Spigot Minecraft server.'
},
'unbound': {
title: 'Unbound',
icon: '',
info: undefined
},
'boinc': {
title: 'BOINC',
icon: '',
info: 'Provides task counts for BOINC distributed computing clients.'
},
'w1sensor': {
title: '1-Wire Sensors',
icon: '',
info: 'Data derived from 1-Wire sensors. Currently temperature sensors are automatically detected.'
},
'logind': {
title: 'Logind',
icon: '',
info: undefined
},
'linux_power_supply': {
title: 'Power Supply',
icon: '',
info: 'Statistics for the various system power supplies.'
}
};
// ----------------------------------------------------------------------------
// submenus
// information to be shown, just below each submenu
// information about the submenus
netdataDashboard.submenu = {
'web_log.squid_bandwidth': {
title: 'bandwidth',
info: 'Bandwidth of responses (sent
) by squid. This chart may present unusual spikes, since the bandwidth is accounted at the time the log line is saved by the server, even if the time needed to serve it spans across a longer duration. We suggest to use QoS (e.g. FireQOS) for accurate accounting of the server bandwidth.'
},
'web_log.squid_responses': {
title: 'responses',
info: 'Information related to the responses sent by squid.'
},
'web_log.squid_requests': {
title: 'requests',
info: 'Information related to the requests squid has received.'
},
'web_log.squid_hierarchy': {
title: 'hierarchy',
info: 'Performance metrics for the squid hierarchy used to serve the requests.'
},
'web_log.squid_squid_transport': {
title: 'transport'
},
'web_log.squid_squid_cache': {
title: 'cache',
info: 'Performance metrics for the performance of the squid cache.'
},
'web_log.squid_timings': {
title: 'timings',
info: 'Duration of squid requests. Unrealistic spikes may be reported, since squid logs the total time of the requests, when they complete. Especially for HTTPS, the clients get a tunnel from the proxy and exchange requests directly with the upstream servers, so squid cannot evaluate the individual requests and reports the total time the tunnel was open.'
},
'web_log.squid_clients': {
title: 'clients'
},
'web_log.bandwidth': {
info: 'Bandwidth of requests (received
) and responses (sent
). received
requires an extended log format (without it, the web server log does not have this information). This chart may present unusual spikes, since the bandwidth is accounted at the time the log line is saved by the web server, even if the time needed to serve it spans across a longer duration. We suggest to use QoS (e.g. FireQOS) for accurate accounting of the web server bandwidth.'
},
'web_log.urls': {
info: 'Number of requests for each URL pattern
defined in /etc/netdata/python.d/web_log.conf
. This chart counts all requests matching the URL patterns defined, independently of the web server response codes (i.e. both successful and unsuccessful).'
},
'web_log.clients': {
info: 'Charts showing the number of unique client IPs, accessing the web server.'
},
'web_log.timings': {
info: 'Web server response timings - the time the web server needed to prepare and respond to requests. This requires an extended log format and its meaning is web server specific. For most web servers this accounts the time from the reception of a complete request, to the dispatch of the last byte of the response. So, it includes the network delays of responses, but it does not include the network delays of requests.'
},
'mem.ksm': {
title: 'deduper (ksm)',
info: 'Kernel Same-page Merging (KSM) performance monitoring, read from several files in /sys/kernel/mm/ksm/
. KSM is a memory-saving de-duplication feature in the Linux kernel (since version 2.6.32). The KSM daemon ksmd periodically scans those areas of user memory which have been registered with it, looking for pages of identical content which can be replaced by a single write-protected page (which is automatically copied if a process later wants to update its content). KSM was originally developed for use with KVM (where it was known as Kernel Shared Memory), to fit more virtual machines into physical memory, by sharing the data common between them. But it can be useful to any application which generates many instances of the same data.'
},
'mem.hugepages': {
info: 'Hugepages is a feature that allows the kernel to utilize the multiple page size capabilities of modern hardware architectures. The kernel creates multiple pages of virtual memory, mapped from both physical RAM and swap. There is a mechanism in the CPU architecture called "Translation Lookaside Buffers" (TLB) to manage the mapping of virtual memory pages to actual physical memory addresses. The TLB is a limited hardware resource, so utilizing a large amount of physical memory with the default page size consumes the TLB and adds processing overhead. By utilizing Huge Pages, the kernel is able to create pages of much larger sizes, each page consuming a single resource in the TLB. Huge Pages are pinned to physical RAM and cannot be swapped/paged out.'
},
'mem.numa': {
info: 'Non-Uniform Memory Access (NUMA) is a hierarchical memory design the memory access time is dependent on locality. Under NUMA, a processor can access its own local memory faster than non-local memory (memory local to another processor or memory shared between processors). The individual metrics are described in the Linux kernel documentation.'
},
'ip.ecn': {
info: 'Explicit Congestion Notification (ECN) is a TCP extension that allows end-to-end notification of network congestion without dropping packets. ECN is an optional feature that may be used between two ECN-enabled endpoints when the underlying network infrastructure also supports it.'
},
'netfilter.conntrack': {
title: 'connection tracker',
info: 'Netfilter Connection Tracker performance metrics. The connection tracker keeps track of all connections of the machine, inbound and outbound. It works by keeping a database with all open connections, tracking network and address translation and connection expectations.'
},
'netfilter.nfacct': {
title: 'bandwidth accounting',
info: 'The following information is read using the nfacct.plugin
.'
},
'netfilter.synproxy': {
title: 'DDoS protection',
info: 'DDoS protection performance metrics. SYNPROXY is a TCP SYN packets proxy. It is used to protect any TCP server (like a web server) from SYN floods and similar DDoS attacks. It is a netfilter module, in the Linux kernel (since version 3.12). It is optimized to handle millions of packets per second utilizing all CPUs available without any concurrency locking between the connections. It can be used for any kind of TCP traffic (even encrypted), since it does not interfere with the content itself.'
},
'ipfw.dynamic_rules': {
title: 'dynamic rules',
info: 'Number of dynamic rules, created by correspondent stateful firewall rules.'
},
'system.softnet_stat': {
title: 'softnet',
info: function (os) {
if (os === 'linux')
return 'Statistics for CPUs SoftIRQs related to network receive work. Break down per CPU core can be found at CPU / softnet statistics. processed states the number of packets processed, dropped is the number packets dropped because the network device backlog was full (to fix them on Linux use sysctl
to increase net.core.netdev_max_backlog
), squeezed is the number of packets dropped because the network device budget ran out (to fix them on Linux use sysctl
to increase net.core.netdev_budget
and/or net.core.netdev_budget_usecs
). More information about identifying and troubleshooting network driver related issues can be found at Red Hat Enterprise Linux Network Performance Tuning Guide.';
else
return 'Statistics for CPUs SoftIRQs related to network receive work.';
}
},
'cpu.softnet_stat': {
title: 'softnet',
info: function (os) {
if (os === 'linux')
return 'Statistics for per CPUs core SoftIRQs related to network receive work. Total for all CPU cores can be found at System / softnet statistics. processed states the number of packets processed, dropped is the number packets dropped because the network device backlog was full (to fix them on Linux use sysctl
to increase net.core.netdev_max_backlog
), squeezed is the number of packets dropped because the network device budget ran out (to fix them on Linux use sysctl
to increase net.core.netdev_budget
and/or net.core.netdev_budget_usecs
). More information about identifying and troubleshooting network driver related issues can be found at Red Hat Enterprise Linux Network Performance Tuning Guide.';
else
return 'Statistics for per CPUs core SoftIRQs related to network receive work. Total for all CPU cores can be found at System / softnet statistics.';
}
},
'go_expvar.memstats': {
title: 'memory statistics',
info: 'Go runtime memory statistics. See runtime.MemStats documentation for more info about each chart and the values.'
},
'couchdb.dbactivity': {
title: 'db activity',
info: 'Overall database reads and writes for the entire server. This includes any external HTTP traffic, as well as internal replication traffic performed in a cluster to ensure node consistency.'
},
'couchdb.httptraffic': {
title: 'http traffic breakdown',
info: 'All HTTP traffic, broken down by type of request (GET, PUT, POST, etc.) and response status code (200, 201, 4xx, etc.)
Any 5xx errors here indicate a likely CouchDB bug; check the logfile for further information.'
},
'couchdb.ops': {
title: 'server operations'
},
'couchdb.perdbstats': {
title: 'per db statistics',
info: 'Statistics per database. This includes 3 size graphs per database: active (the size of live data in the database), external (the uncompressed size of the database contents), and file (the size of the file on disk, exclusive of any views and indexes). It also includes the number of documents and number of deleted documents per database.'
},
'couchdb.erlang': {
title: 'erlang statistics',
info: 'Detailed information about the status of the Erlang VM that hosts CouchDB. These are intended for advanced users only. High values of the peak message queue (>10e6) generally indicate an overload condition.'
},
'ntpd.system': {
title: 'system',
info: 'Statistics of the system variables as shown by the readlist billboard ntpq -c rl
. System variables are assigned an association ID of zero and can also be shown in the readvar billboard ntpq -c "rv 0"
. These variables are used in the Clock Discipline Algorithm, to calculate the lowest and most stable offset.'
},
'ntpd.peers': {
title: 'peers',
info: 'Statistics of the peer variables for each peer configured in /etc/ntp.conf
as shown by the readvar billboard ntpq -c "rv <association>"
, while each peer is assigned a nonzero association ID as shown by ntpq -c "apeers"
. The module periodically scans for new/changed peers (default: every 60s). ntpd selects the best possible peer from the available peers to synchronize the clock. A minimum of at least 3 peers is required to properly identify the best possible peer.'
}
};
// ----------------------------------------------------------------------------
// chart
// information works on the context of a chart
// Its purpose is to set:
//
// info: the text above the charts
// heads: the representation of the chart at the top the subsection (second level menu)
// mainheads: the representation of the chart at the top of the section (first level menu)
// colors: the dimension colors of the chart (the default colors are appended)
// height: the ratio of the chart height relative to the default
//
netdataDashboard.context = {
'system.cpu': {
info: function (os) {
void(os);
return 'Total CPU utilization (all cores). 100% here means there is no CPU idle time at all. You can get per core usage at the CPUs section and per application usage at the Applications Monitoring section.'
+ netdataDashboard.sparkline('
Keep an eye on iowait ', 'system.cpu', 'iowait', '%', '. If it is constantly high, your disks are a bottleneck and they slow your system down.')
+ netdataDashboard.sparkline('
An important metric worth monitoring, is softirq ', 'system.cpu', 'softirq', '%', '. A constantly high percentage of softirq may indicate network driver issues.');
},
valueRange: "[0, 100]"
},
'system.load': {
info: 'Current system load, i.e. the number of processes using CPU or waiting for system resources (usually CPU and disk). The 3 metrics refer to 1, 5 and 15 minute averages. The system calculates this once every 5 seconds. For more information check this wikipedia article',
height: 0.7
},
'system.io': {
info: function (os) {
var s = 'Total Disk I/O, for all physical disks. You can get detailed information about each disk at the Disks section and per application Disk usage at the Applications Monitoring section.';
if (os === 'linux')
return s + ' Physical are all the disks that are listed in /sys/block
, but do not exist in /sys/devices/virtual/block
.';
else
return s;
}
},
'system.pgpgio': {
info: 'Memory paged from/to disk. This is usually the total disk I/O of the system.'
},
'system.swapio': {
info: 'Total Swap I/O. (netdata measures both in
and out
. If either of them is not shown in the chart, it is because it is zero - you can change the page settings to always render all the available dimensions on all charts).'
},
'system.pgfaults': {
info: 'Total page faults. Major page faults indicates that the system is using its swap. You can find which applications use the swap at the Applications Monitoring section.'
},
'system.entropy': {
colors: '#CC22AA',
info: 'Entropy, is a pool of random numbers (/dev/random) that is mainly used in cryptography. If the pool of entropy gets empty, processes requiring random numbers may run a lot slower (it depends on the interface each program uses), waiting for the pool to be replenished. Ideally a system with high entropy demands should have a hardware device for that purpose (TPM is one such device). There are also several software-only options you may install, like haveged
, although these are generally useful only in servers.'
},
'system.forks': {
colors: '#5555DD',
info: 'Number of new processes created.'
},
'system.intr': {
colors: '#DD5555',
info: 'Total number of CPU interrupts. Check system.interrupts
that gives more detail about each interrupt and also the CPUs section where interrupts are analyzed per CPU core.'
},
'system.interrupts': {
info: 'CPU interrupts in detail. At the CPUs section, interrupts are analyzed per CPU core.'
},
'system.softirqs': {
info: 'CPU softirqs in detail. At the CPUs section, softirqs are analyzed per CPU core.'
},
'system.processes': {
info: 'System processes. Running are the processes in the CPU. Blocked are processes that are willing to enter the CPU, but they cannot, e.g. because they wait for disk activity.'
},
'system.active_processes': {
info: 'All system processes.'
},
'system.ctxt': {
info: 'Context Switches, is the switching of the CPU from one process, task or thread to another. If there are many processes or threads willing to execute and very few CPU cores available to handle them, the system is making more context switching to balance the CPU resources among them. The whole process is computationally intensive. The more the context switches, the slower the system gets.'
},
'system.idlejitter': {
info: 'Idle jitter is calculated by netdata. A thread is spawned that requests to sleep for a few microseconds. When the system wakes it up, it measures how many microseconds have passed. The difference between the requested and the actual duration of the sleep, is the idle jitter. This number is useful in real-time environments, where CPU jitter can affect the quality of the service (like VoIP media gateways).'
},
'system.net': {
info: function (os) {
var s = 'Total bandwidth of all physical network interfaces. This does not include lo
, VPNs, network bridges, IFB devices, bond interfaces, etc. Only the bandwidth of physical network interfaces is aggregated.';
if (os === 'linux')
return s + ' Physical are all the network interfaces that are listed in /proc/net/dev
, but do not exist in /sys/devices/virtual/net
.';
else
return s;
}
},
'system.ip': {
info: 'Total IP traffic in the system.'
},
'system.ipv4': {
info: 'Total IPv4 Traffic.'
},
'system.ipv6': {
info: 'Total IPv6 Traffic.'
},
'system.ram': {
info: 'System Random Access Memory (i.e. physical memory) usage.'
},
'system.swap': {
info: 'System swap memory usage. Swap space is used when the amount of physical memory (RAM) is full. When the system needs more memory resources and the RAM is full, inactive pages in memory are moved to the swap space (usually a disk, a disk partition or a file).'
},
// ------------------------------------------------------------------------
// CPU charts
'cpu.cpu': {
commonMin: true,
commonMax: true,
valueRange: "[0, 100]"
},
'cpu.interrupts': {
commonMin: true,
commonMax: true
},
'cpu.softirqs': {
commonMin: true,
commonMax: true
},
'cpu.softnet_stat': {
commonMin: true,
commonMax: true
},
// ------------------------------------------------------------------------
// MEMORY
'mem.ksm_savings': {
heads: [
netdataDashboard.gaugeChart('Saved', '12%', 'savings', '#0099CC')
]
},
'mem.ksm_ratios': {
heads: [
function (os, id) {
void(os);
return '
ifconfig
as RX dropped
(inbound) and TX dropped
(outbound). inbound packets can be dropped at the network interface level due to softnet backlog overflow, bad / unintented VLAN tags, unknown or unregistered protocols, IPv6 frames when the server is not configured for IPv6. Check this document for more information.'
},
// ------------------------------------------------------------------------
// IP
'ip.inerrors': {
info: 'Errors encountered during the reception of IP packets. ' +
'noroutes
(InNoRoutes
) counts packets that were dropped because there was no route to send them. ' +
'truncated
(InTruncatedPkts
) counts packets which is being discarded because the datagram frame didn\'t carry enough data. ' +
'checksum
(InCsumErrors
) counts packets that were dropped because they had wrong checksum. '
},
'ip.tcpmemorypressures': {
info: 'Number of times a socket was put in memory pressure due to a non fatal memory allocation failure (the kernel attempts to work around this situation by reducing the send buffers, etc).'
},
'ip.tcpconnaborts': {
info: 'TCP connection aborts. baddata (TCPAbortOnData
) happens while the connection is on FIN_WAIT1
and the kernel receives a packet with a sequence number beyond the last one for this connection - the kernel responds with RST
(closes the connection). userclosed (TCPAbortOnClose
) happens when the kernel receives data on an already closed connection and responds with RST
. nomemory (TCPAbortOnMemory
happens when there are too many orphaned sockets (not attached to an fd) and the kernel has to drop a connection - sometimes it will send an RST
, sometimes it won\'t. timeout (TCPAbortOnTimeout
) happens when a connection times out. linger (TCPAbortOnLinger
) happens when the kernel killed a socket that was already closed by the application and lingered around for long enough. failed (TCPAbortFailed
) happens when the kernel attempted to send an RST
but failed because there was no memory available.'
},
'ip.tcp_syn_queue': {
info: 'The SYN queue of the kernel tracks TCP handshakes until connections get fully established. ' +
'It overflows when too many incoming TCP connection requests hang in the half-open state and the server ' +
'is not configured to fall back to SYN cookies*. Overflows are usually caused by SYN flood DoS attacks ' +
'(i.e. someone sends lots of SYN packets and never completes the handshakes). ' +
'drops (or TcpExtTCPReqQFullDrop
) is the number of connections dropped because the ' +
'SYN queue was full and SYN cookies were disabled. ' +
'cookies (or TcpExtTCPReqQFullDoCookies
) is the number of SYN cookies sent because the ' +
'SYN queue was full.'
},
'ip.tcp_accept_queue': {
info: 'The accept queue of the kernel holds the fully established TCP connections, waiting to be handled ' +
'by the listening application. overflows (or ListenOverflows
) is the number of ' +
'established connections that could not be handled because the receive queue of the listening application ' +
'was full. drops (or ListenDrops
) is the number of incoming ' +
'connections that could not be handled, including SYN floods, overflows, out of memory, security issues, ' +
'no route to destination, reception of related ICMP messages, socket is broadcast or multicast.'
},
// ------------------------------------------------------------------------
// IPv4
'ipv4.tcpsock': {
info: 'The number of established TCP connections (known as CurrEstab
). This is a snapshot of the established connections at the time of measurement (i.e. a connection established and a connection disconnected within the same iteration will not affect this metric).'
},
'ipv4.tcpopens': {
info: 'active or ActiveOpens
is the number of outgoing TCP connections attempted by this host.'
+ ' passive or PassiveOpens
is the number of incoming TCP connections accepted by this host.'
},
'ipv4.tcperrors': {
info: 'InErrs
is the number of TCP segments received in error (including header too small, checksum errors, sequence errors, bad packets - for both IPv4 and IPv6).'
+ ' InCsumErrors
is the number of TCP segments received with checksum errors (for both IPv4 and IPv6).'
+ ' RetransSegs
is the number of TCP segments retransmitted.'
},
'ipv4.tcphandshake': {
info: 'EstabResets
is the number of established connections resets (i.e. connections that made a direct transition from ESTABLISHED
or CLOSE_WAIT
to CLOSED
).'
+ ' OutRsts
is the number of TCP segments sent, with the RST
flag set (for both IPv4 and IPv6).'
+ ' AttemptFails
is the number of times TCP connections made a direct transition from either SYN_SENT
or SYN_RECV
to CLOSED
, plus the number of times TCP connections made a direct transition from the SYN_RECV
to LISTEN
.'
+ ' TCPSynRetrans
shows retries for new outbound TCP connections, which can indicate general connectivity issues or backlog on the remote host.'
},
// ------------------------------------------------------------------------
// APPS
'apps.cpu': {
height: 2.0
},
'apps.mem': {
info: 'Real memory (RAM) used by applications. This does not include shared memory.'
},
'apps.vmem': {
info: 'Virtual memory allocated by applications. Please check this article for more information.'
},
'apps.preads': {
height: 2.0
},
'apps.pwrites': {
height: 2.0
},
// ------------------------------------------------------------------------
// USERS
'users.cpu': {
height: 2.0
},
'users.mem': {
info: 'Real memory (RAM) used per user. This does not include shared memory.'
},
'users.vmem': {
info: 'Virtual memory allocated per user. Please check this article for more information.'
},
'users.preads': {
height: 2.0
},
'users.pwrites': {
height: 2.0
},
// ------------------------------------------------------------------------
// GROUPS
'groups.cpu': {
height: 2.0
},
'groups.mem': {
info: 'Real memory (RAM) used per user group. This does not include shared memory.'
},
'groups.vmem': {
info: 'Virtual memory allocated per user group. Please check this article for more information.'
},
'groups.preads': {
height: 2.0
},
'groups.pwrites': {
height: 2.0
},
// ------------------------------------------------------------------------
// NETWORK QoS
'tc.qos': {
heads: [
function (os, id) {
void(os);
if (id.match(/.*-ifb$/))
return netdataDashboard.gaugeChart('Inbound', '12%', '', '#5555AA');
else
return netdataDashboard.gaugeChart('Outbound', '12%', '', '#AA9900');
}
]
},
// ------------------------------------------------------------------------
// NETWORK INTERFACES
'net.net': {
mainheads: [
function (os, id) {
void(os);
if (id.match(/^cgroup_.*/)) {
var iface;
try {
iface = ' ' + id.substring(id.lastIndexOf('.net_') + 5, id.length);
}
catch (e) {
iface = '';
}
return netdataDashboard.gaugeChart('Received' + iface, '12%', 'received');
}
else
return '';
},
function (os, id) {
void(os);
if (id.match(/^cgroup_.*/)) {
var iface;
try {
iface = ' ' + id.substring(id.lastIndexOf('.net_') + 5, id.length);
}
catch (e) {
iface = '';
}
return netdataDashboard.gaugeChart('Sent' + iface, '12%', 'sent');
}
else
return '';
}
],
heads: [
function (os, id) {
void(os);
if (!id.match(/^cgroup_.*/))
return netdataDashboard.gaugeChart('Received', '12%', 'received');
else
return '';
},
function (os, id) {
void(os);
if (!id.match(/^cgroup_.*/))
return netdataDashboard.gaugeChart('Sent', '12%', 'sent');
else
return '';
}
]
},
// ------------------------------------------------------------------------
// NETFILTER
'netfilter.sockets': {
colors: '#88AA00',
heads: [
netdataDashboard.gaugeChart('Active Connections', '12%', '', '#88AA00')
]
},
'netfilter.new': {
heads: [
netdataDashboard.gaugeChart('New Connections', '12%', 'new', '#5555AA')
]
},
// ------------------------------------------------------------------------
// DISKS
'disk.util': {
colors: '#FF5588',
heads: [
netdataDashboard.gaugeChart('Utilization', '12%', '', '#FF5588')
],
info: 'Disk Utilization measures the amount of time the disk was busy with something. This is not related to its performance. 100% means that the system always had an outstanding operation on the disk. Keep in mind that depending on the underlying technology of the disk, 100% here may or may not be an indication of congestion.'
},
'disk.backlog': {
colors: '#0099CC',
info: 'Backlog is an indication of the duration of pending disk operations. On every I/O event the system is multiplying the time spent doing I/O since the last update of this field with the number of pending operations. While not accurate, this metric can provide an indication of the expected completion time of the operations in progress.'
},
'disk.io': {
heads: [
netdataDashboard.gaugeChart('Read', '12%', 'reads'),
netdataDashboard.gaugeChart('Write', '12%', 'writes')
],
info: 'Amount of data transferred to and from disk.'
},
'disk.ops': {
info: 'Completed disk I/O operations. Keep in mind the number of operations requested might be higher, since the system is able to merge adjacent to each other (see merged operations chart).'
},
'disk.qops': {
info: 'I/O operations currently in progress. This metric is a snapshot - it is not an average over the last interval.'
},
'disk.iotime': {
height: 0.5,
info: 'The sum of the duration of all completed I/O operations. This number can exceed the interval if the disk is able to execute I/O operations in parallel.'
},
'disk.mops': {
height: 0.5,
info: 'The number of merged disk operations. The system is able to merge adjacent I/O operations, for example two 4KB reads can become one 8KB read before given to disk.'
},
'disk.svctm': {
height: 0.5,
info: 'The average service time for completed I/O operations. This metric is calculated using the total busy time of the disk and the number of completed operations. If the disk is able to execute multiple parallel operations the reporting average service time will be misleading.'
},
'disk.avgsz': {
height: 0.5,
info: 'The average I/O operation size.'
},
'disk.await': {
height: 0.5,
info: 'The average time for I/O requests issued to the device to be served. This includes the time spent by the requests in queue and the time spent servicing them.'
},
'disk.space': {
info: 'Disk space utilization. reserved for root is automatically reserved by the system to prevent the root user from getting out of space.'
},
'disk.inodes': {
info: 'inodes (or index nodes) are filesystem objects (e.g. files and directories). On many types of file system implementations, the maximum number of inodes is fixed at filesystem creation, limiting the maximum number of files the filesystem can hold. It is possible for a device to run out of inodes. When this happens, new files cannot be created on the device, even though there may be free space available.'
},
'mysql.net': {
info: 'The amount of data sent to mysql clients (out) and received from mysql clients (in).'
},
// ------------------------------------------------------------------------
// MYSQL
'mysql.queries': {
info: 'The number of statements executed by the server.response time
describes the time passed between request and response. ' +
'Currently, the accuracy of the response time is low and should be used as reference only.'
},
'httpcheck.responselength': {
info: 'The response length
counts the number of characters in the response body. For static pages, this should be mostly constant.'
},
'httpcheck.status': {
valueRange: "[0, 1]",
info: 'This chart verifies the response of the webserver. Each status dimension will have a value of 1
if triggered. ' +
'Dimension success
is 1
only if all constraints are satisfied. ' +
'This chart is most useful for alarms or third-party apps.'
},
// ------------------------------------------------------------------------
// NETDATA
'netdata.response_time': {
info: 'The netdata API response time measures the time netdata needed to serve requests. This time includes everything, from the reception of the first byte of a request, to the dispatch of the last byte of its reply, therefore it includes all network latencies involved (i.e. a client over a slow network will influence these metrics).'
},
// ------------------------------------------------------------------------
// RETROSHARE
'retroshare.bandwidth': {
info: 'RetroShare inbound and outbound traffic.',
mainheads: [
netdataDashboard.gaugeChart('Received', '12%', 'bandwidth_down_kb'),
netdataDashboard.gaugeChart('Sent', '12%', 'bandwidth_up_kb')
]
},
'retroshare.peers': {
info: 'Number of (connected) RetroShare friends.',
mainheads: [
function (os, id) {
void(os);
return '';
}
]
},
'retroshare.dht': {
info: 'Statistics about RetroShare\'s DHT. These values are estimated!'
},
// ------------------------------------------------------------------------
// fping
'fping.quality': {
colors: NETDATA.colors[10],
height: 0.5
},
'fping.packets': {
height: 0.5
},
// ------------------------------------------------------------------------
// containers
'cgroup.cpu': {
mainheads: [
function (os, id) {
void(os);
return '';
}
]
},
'cgroup.mem_usage': {
mainheads: [
function (os, id) {
void(os);
return '';
}
]
},
'cgroup.throttle_io': {
mainheads: [
function (os, id) {
void(os);
return '';
},
function (os, id) {
void(os);
return '';
}
]
},
// ------------------------------------------------------------------------
// beanstalkd
// system charts
'beanstalk.cpu_usage': {
info: 'Amount of CPU Time for user and system used by beanstalkd.'
},
// This is also a per-tube stat
'beanstalk.jobs_rate': {
info: 'The rate of jobs processed by the beanstalkd served.'
},
'beanstalk.connections_rate': {
info: 'Tthe rate of connections opened to beanstalkd.'
},
'beanstalk.commands_rate': {
info: 'The rate of commands received by beanstalkd.'
},
'beanstalk.current_tubes': {
info: 'Total number of current tubes on the server including the default tube (which always exists).'
},
'beanstalk.current_jobs': {
info: 'Current number of jobs in all tubes grouped by status: urgent, ready, reserved, delayed and buried.'
},
'beanstalk.current_connections': {
info: 'Current number of connections group by connection type: written, producers, workers, waiting.'
},
'beanstalk.binlog': {
info: 'The rate of records written
to binlog and migrated
as part of compaction.'
},
'beanstalk.uptime': {
info: 'Total time beanstalkd server has been up for.'
},
// tube charts
'beanstalk.jobs': {
info: 'Number of jobs currently in the tube grouped by status: urgent, ready, reserved, delayed and buried.'
},
'beanstalk.connections': {
info: 'The current number of connections to this tube grouped by connection type; using, waiting and watching.'
},
'beanstalk.commands': {
info: 'The rate of delete
and pause
commands executed by beanstalkd.'
},
'beanstalk.pause': {
info: 'Shows info on how long the tube has been paused for, and how long is left remaining on the pause.'
},
// ------------------------------------------------------------------------
// ceph
'ceph.general_usage': {
info: 'The usage and available space in all ceph cluster.'
},
'ceph.general_objects': {
info: 'Total number of objects storage on ceph cluster.'
},
'ceph.general_bytes': {
info: 'Cluster read and write data per second.'
},
'ceph.general_operations': {
info: 'Number of read and write operations per second.'
},
'ceph.general_latency': {
info: 'Total of apply and commit latency in all OSDs. The apply latency is the total time taken to flush an update to disk. The commit latency is the total time taken to commit an operation to the journal.'
},
'ceph.pool_usage': {
info: 'The usage space in each pool.'
},
'ceph.pool_objects': {
info: 'Number of objects presents in each pool.'
},
'ceph.pool_read_bytes': {
info: 'The rate of read data per second in each pool.'
},
'ceph.pool_write_bytes': {
info: 'The rate of write data per second in each pool.'
},
'ceph.pool_read_objects': {
info: 'Number of read objects per second in each pool.'
},
'ceph.pool_write_objects': {
info: 'Number of write objects per second in each pool.'
},
'ceph.osd_usage': {
info: 'The usage space in each OSD.'
},
'ceph.apply_latency': {
info: 'Time taken to flush an update in each OSD.'
},
'ceph.commit_latency': {
info: 'Time taken to commit an operation to the journal in each OSD.'
},
// ------------------------------------------------------------------------
// web_log
'web_log.response_statuses': {
info: 'Web server responses by type. success
includes 1xx, 2xx and 304, error
includes 5xx, redirect
includes 3xx except 304, bad
includes 4xx, other
are all the other responses.',
mainheads: [
function (os, id) {
void(os);
return '';
},
function (os, id) {
void(os);
return '';
},
function (os, id) {
void(os);
return '';
},
function (os, id) {
void(os);
return '';
}
]
},
'web_log.response_codes': {
info: 'Web server responses by code family. ' +
'According to the standards 1xx
are informational responses, ' +
'2xx
are successful responses, ' +
'3xx
are redirects (although they include 304 which is used as "not modified"), ' +
'4xx
are bad requests, ' +
'5xx
are internal server errors, ' +
'other
are non-standard responses, ' +
'unmatched
counts the lines in the log file that are not matched by the plugin (let us know if you have any unmatched).'
},
'web_log.response_time': {
mainheads: [
function (os, id) {
void(os);
return '';
}
]
},
'web_log.detailed_response_codes': {
info: 'Number of responses for each response code individually.'
},
'web_log.requests_per_ipproto': {
info: 'Web server requests received per IP protocol version.'
},
'web_log.clients': {
info: 'Unique client IPs accessing the web server, within each data collection iteration. If data collection is per second, this chart shows unique client IPs per second.'
},
'web_log.clients_all': {
info: 'Unique client IPs accessing the web server since the last restart of netdata. This plugin keeps in memory all the unique IPs that have accessed the web server. On very busy web servers (several millions of unique IPs) you may want to disable this chart (check /etc/netdata/python.d/web_log.conf
).'
},
// ------------------------------------------------------------------------
// web_log for squid
'web_log.squid_response_statuses': {
info: 'Squid responses by type. ' +
'success
includes 1xx, 2xx, 000, 304, ' +
'error
includes 5xx and 6xx, ' +
'redirect
includes 3xx except 304, ' +
'bad
includes 4xx, ' +
'other
are all the other responses.',
mainheads: [
function (os, id) {
void(os);
return '';
},
function (os, id) {
void(os);
return '';
},
function (os, id) {
void(os);
return '';
},
function (os, id) {
void(os);
return '';
}
]
},
'web_log.squid_response_codes': {
info: 'Web server responses by code family. ' +
'According to HTTP standards 1xx
are informational responses, ' +
'2xx
are successful responses, ' +
'3xx
are redirects (although they include 304 which is used as "not modified"), ' +
'4xx
are bad requests, ' +
'5xx
are internal server errors. ' +
'Squid also defines 000
mostly for UDP requests, and ' +
'6xx
for broken upstream servers sending wrong headers. ' +
'Finally, other
are non-standard responses, and ' +
'unmatched
counts the lines in the log file that are not matched by the plugin (let us know if you have any unmatched).'
},
'web_log.squid_duration': {
mainheads: [
function (os, id) {
void(os);
return '';
}
]
},
'web_log.squid_detailed_response_codes': {
info: 'Number of responses for each response code individually.'
},
'web_log.squid_clients': {
info: 'Unique client IPs accessing squid, within each data collection iteration. If data collection is per second, this chart shows unique client IPs per second.'
},
'web_log.squid_clients_all': {
info: 'Unique client IPs accessing squid since the last restart of netdata. This plugin keeps in memory all the unique IPs that have accessed the server. On very busy squid servers (several millions of unique IPs) you may want to disable this chart (check /etc/netdata/python.d/web_log.conf
).'
},
'web_log.squid_transport_methods': {
info: 'Break down per delivery method: TCP
are requests on the HTTP port (usually 3128), ' +
'UDP
are requests on the ICP port (usually 3130), or HTCP port (usually 4128). ' +
'If ICP logging was disabled using the log_icp_queries option, no ICP replies will be logged. ' +
'NONE
are used to state that squid delivered an unusual response or no response at all. ' +
'Seen with cachemgr requests and errors, usually when the transaction fails before being classified into one of the above outcomes. ' +
'Also seen with responses to CONNECT
requests.'
},
'web_log.squid_code': {
info: 'These are combined squid result status codes. A break down per component is given in the following charts. ' +
'Check the squid documentation about them.'
},
'web_log.squid_handling_opts': {
info: 'These tags are optional and describe why the particular handling was performed or where the request came from. ' +
'CLIENT
means that the client request placed limits affecting the response. Usually seen with client issued a no-cache, or analogous cache control command along with the request. Thus, the cache has to validate the object.' +
'IMS
states that the client sent a revalidation (conditional) request. ' +
'ASYNC
, is used when the request was generated internally by Squid. Usually this is background fetches for cache information exchanges, background revalidation from stale-while-revalidate cache controls, or ESI sub-objects being loaded. ' +
'SWAPFAIL
is assigned when the object was believed to be in the cache, but could not be accessed. A new copy was requested from the server. ' +
'REFRESH
when a revalidation (conditional) request was sent to the server. ' +
'SHARED
when this request was combined with an existing transaction by collapsed forwarding. NOTE: the existing request is not marked as SHARED. ' +
'REPLY
when particular handling was requested in the HTTP reply from server or peer. Usually seen on DENIED due to http_reply_access ACLs preventing delivery of servers response object to the client.'
},
'web_log.squid_object_types': {
info: 'These tags are optional and describe what type of object was produced. ' +
'NEGATIVE
is only seen on HIT responses, indicating the response was a cached error response. e.g. 404 not found. ' +
'STALE
means the object was cached and served stale. This is usually caused by stale-while-revalidate or stale-if-error cache controls. ' +
'OFFLINE
when the requested object was retrieved from the cache during offline_mode. The offline mode never validates any object. ' +
'INVALID
when an invalid request was received. An error response was delivered indicating what the problem was. ' +
'FAIL
is only seen on REFRESH
to indicate the revalidation request failed. The response object may be the server provided network error or the stale object which was being revalidated depending on stale-if-error cache control. ' +
'MODIFIED
is only seen on REFRESH
responses to indicate revalidation produced a new modified object. ' +
'UNMODIFIED
is only seen on REFRESH
responses to indicate revalidation produced a 304 (Not Modified) status, which was relayed to the client. ' +
'REDIRECT
when squid generated an HTTP redirect response to this request.'
},
'web_log.squid_cache_events': {
info: 'These tags are optional and describe whether the response was loaded from cache, network, or otherwise. ' +
'HIT
when the response object delivered was the local cache object. ' +
'MEM
when the response object came from memory cache, avoiding disk accesses. Only seen on HIT responses. ' +
'MISS
when the response object delivered was the network response object. ' +
'DENIED
when the request was denied by access controls. ' +
'NOFETCH
an ICP specific type, indicating service is alive, but not to be used for this request (sent during "-Y" startup, or during frequent failures, a cache in hit only mode will return either UDP_HIT or UDP_MISS_NOFETCH. Neighbours will thus only fetch hits). ' +
'TUNNEL
when a binary tunnel was established for this transaction.'
},
'web_log.squid_transport_errors': {
info: 'These tags are optional and describe some error conditions which occured during response delivery (if any). ' +
'ABORTED
when the response was not completed due to the connection being aborted (usually by the client). ' +
'TIMEOUT
, when the response was not completed due to a connection timeout.'
},
// ------------------------------------------------------------------------
// Fronius Solar Power
'fronius.power': {
info: 'Positive Grid
values mean that power is coming from the grid. Negative values are excess power that is going back into the grid, possibly selling it. ' +
'Photovoltaics
is the power generated from the solar panels. ' +
'Accumulator
is the stored power in the accumulator, if one is present.'
},
'fronius.autonomy': {
commonMin: true,
commonMax: true,
valueRange: "[0, 100]",
info: 'The Autonomy
is the percentage of how autonomous the installation is. An autonomy of 100 % means that the installation is producing more energy than it is needed. ' +
'The Self consumption
indicates the ratio between the current power generated and the current load. When it reaches 100 %, the Autonomy
declines, since the solar panels can not produce enough energy and need support from the grid.'
},
'fronius.energy.today': {
commonMin: true,
commonMax: true,
valueRange: "[0, null]"
},
// ------------------------------------------------------------------------
// Stiebel Eltron Heat pump installation
'stiebeleltron.system.roomtemp': {
commonMin: true,
commonMax: true,
valueRange: "[0, null]"
},
// ------------------------------------------------------------------------
// Port check
'portcheck.latency': {
info: 'The latency
describes the time spent connecting to a TCP port. No data is sent or received. ' +
'Currently, the accuracy of the latency is low and should be used as reference only.'
},
'portcheck.status': {
valueRange: "[0, 1]",
info: 'The status
chart verifies the availability of the service. ' +
'Each status dimension will have a value of 1
if triggered. Dimension success
is 1
only if connection could be established. ' +
'This chart is most useful for alarms and third-party apps.'
},
// ------------------------------------------------------------------------
'chrony.system': {
info: 'In normal operation, chronyd never steps the system clock, because any jump in the timescale can have adverse consequences for certain application programs. Instead, any error in the system clock is corrected by slightly speeding up or slowing down the system clock until the error has been removed, and then returning to the system clock’s normal speed. A consequence of this is that there will be a period when the system clock (as read by other programs using the gettimeofday()
system call, or by the date
command in the shell) will be different from chronyd\'s estimate of the current true time (which it reports to NTP clients when it is operating in server mode). The value reported on this line is the difference due to this effect.',
colors: NETDATA.colors[3]
},
'chrony.offsets': {
info: 'last offset
is the estimated local offset on the last clock update. RMS offset
is a long-term average of the offset value.',
height: 0.5
},
'chrony.stratum': {
info: 'The stratum
indicates how many hops away from a computer with an attached reference clock we are. Such a computer is a stratum-1 computer.',
decimalDigits: 0,
height: 0.5
},
'chrony.root': {
info: 'Estimated delays against the root time server this system is synchronized with. delay
is the total of the network path delays to the stratum-1 computer from which the computer is ultimately synchronised. dispersion
is the total dispersion accumulated through all the computers back to the stratum-1 computer from which the computer is ultimately synchronised. Dispersion is due to system clock resolution, statistical measurement variations etc.'
},
'chrony.frequency': {
info: 'The frequency
is the rate by which the system\'s clock would be would be wrong if chronyd was not correcting it. It is expressed in ppm (parts per million). For example, a value of 1ppm would mean that when the system\'s clock thinks it has advanced 1 second, it has actually advanced by 1.000001 seconds relative to true time.',
colors: NETDATA.colors[0]
},
'chrony.residualfreq': {
info: 'This shows the residual frequency
for the currently selected reference source. ' +
'It reflects any difference between what the measurements from the reference source indicate the ' +
'frequency should be and the frequency currently being used. The reason this is not always zero is ' +
'that a smoothing procedure is applied to the frequency. Each time a measurement from the reference ' +
'source is obtained and a new residual frequency computed, the estimated accuracy of this residual ' +
'is compared with the estimated accuracy (see skew
) of the existing frequency value. ' +
'A weighted average is computed for the new frequency, with weights depending on these accuracies. ' +
'If the measurements from the reference source follow a consistent trend, the residual will be ' +
'driven to zero over time.',
height: 0.5,
colors: NETDATA.colors[3]
},
'chrony.skew': {
info: 'The estimated error bound on the frequency.',
height: 0.5,
colors: NETDATA.colors[5]
},
'couchdb.active_tasks': {
info: 'Active tasks running on this CouchDB cluster. Four types of tasks currently exist: indexer (view building), replication, database compaction and view compaction.'
},
'couchdb.replicator_jobs': {
info: 'Detailed breakdown of any replication jobs in progress on this node. For more information, see the replicator documentation.'
},
'couchdb.open_files': {
info: 'Count of all files held open by CouchDB. If this value seems pegged at 1024 or 4096, your server process is probably hitting the open file handle limit and needs to be increased.'
},
'btrfs.disk': {
info: 'Physical disk usage of BTRFS. The disk space reported here is the raw physical disk space assigned to the BTRFS volume (i.e. before any RAID levels). BTRFS uses a two-stage allocator, first allocating large regions of disk space for one type of block (data, metadata, or system), and then using a regular block allocator inside those regions. unallocated
is the physical disk space that is not allocated yet and is available to become data, metdata or system on demand. When unallocated
is zero, all available disk space has been allocated to a specific function. Healthy volumes should ideally have at least five percent of their total space unallocated
. You can keep your volume healthy by running the btrfs balance
command on it regularly (check man btrfs-balance
for more info). Note that some of the space listed as unallocated
may not actually be usable if the volume uses devices of different sizes.',
colors: [NETDATA.colors[12]]
},
'btrfs.data': {
info: 'Logical disk usage for BTRFS data. Data chunks are used to store the actual file data (file contents). The disk space reported here is the usable allocation (i.e. after any striping or replication). Healthy volumes should ideally have no more than a few GB of free space reported here persistently. Running btrfs balance
can help here.'
},
'btrfs.metadata': {
info: 'Logical disk usage for BTRFS metadata. Metadata chunks store most of the filesystem interal structures, as well as information like directory structure and file names. The disk space reported here is the usable allocation (i.e. after any striping or replication). Healthy volumes should ideally have no more than a few GB of free space reported here persistently. Running btrfs balance
can help here.'
},
'btrfs.system': {
info: 'Logical disk usage for BTRFS system. System chunks store information about the allocation of other chunks. The disk space reported here is the usable allocation (i.e. after any striping or replication). The values reported here should be relatively small compared to Data and Metadata, and will scale with the volume size and overall space usage.'
},
// ------------------------------------------------------------------------
// RabbitMQ
// info: the text above the charts
// heads: the representation of the chart at the top the subsection (second level menu)
// mainheads: the representation of the chart at the top of the section (first level menu)
// colors: the dimension colors of the chart (the default colors are appended)
// height: the ratio of the chart height relative to the default
'rabbitmq.queued_messages': {
info: 'Overall total of ready and unacknowledged queued messages. Messages that are delivered immediately are not counted here.'
},
'rabbitmq.message_rates': {
info: 'Overall messaging rates including acknowledgements, delieveries, redeliveries, and publishes.'
},
'rabbitmq.global_counts': {
info: 'Overall totals for channels, consumers, connections, queues and exchanges.'
},
'rabbitmq.file_descriptors': {
info: 'Total number of used filed descriptors. See Open File Limits
for further details.',
colors: NETDATA.colors[3]
},
'rabbitmq.sockets': {
info: 'Total number of used socket descriptors. Each used socket also counts as a used file descriptor. See Open File Limits
for further details.',
colors: NETDATA.colors[3]
},
'rabbitmq.processes': {
info: 'Total number of processes running within the Erlang VM. This is not the same as the number of processes running on the host.',
colors: NETDATA.colors[3]
},
'rabbitmq.erlang_run_queue': {
info: 'Number of Erlang processes the Erlang schedulers have queued to run.',
colors: NETDATA.colors[3]
},
'rabbitmq.memory': {
info: 'Total amount of memory used by the RabbitMQ. This is a complex statistic that can be further analyzed in the management UI. See Memory
for further details.',
colors: NETDATA.colors[3]
},
'rabbitmq.disk_space': {
info: 'Total amount of disk space consumed by the message store(s). See Disk Space Limits
for further details.',
colors: NETDATA.colors[3]
},
// ------------------------------------------------------------------------
// ntpd
'ntpd.sys_offset': {
info: 'For hosts without any time critical services an offset of < 100 ms should be acceptable even with high network latencies. For hosts with time critical services an offset of about 0.01 ms or less can be achieved by using peers with low delays and configuring optimal poll exponent values.',
colors: NETDATA.colors[4]
},
'ntpd.sys_jitter': {
info: 'The jitter statistics are exponentially-weighted RMS averages. The system jitter is defined in the NTPv4 specification; the clock jitter statistic is computed by the clock discipline module.'
},
'ntpd.sys_frequency': {
info: 'The frequency offset is shown in ppm (parts per million) relative to the frequency of the system. The frequency correction needed for the clock can vary significantly between boots and also due to external influences like temperature or radiation.',
colors: NETDATA.colors[2],
height: 0.6
},
'ntpd.sys_wander': {
info: 'The wander statistics are exponentially-weighted RMS averages.',
colors: NETDATA.colors[3],
height: 0.6
},
'ntpd.sys_rootdelay': {
info: 'The rootdelay is the round-trip delay to the primary reference clock, similar to the delay shown by the ping
command. A lower delay should result in a lower clock offset.',
colors: NETDATA.colors[1]
},
'ntpd.sys_stratum': {
info: 'The distance in "hops" to the primary reference clock',
colors: NETDATA.colors[5],
height: 0.3
},
'ntpd.sys_tc': {
info: 'Time constants and poll intervals are expressed as exponents of 2. The default poll exponent of 6 corresponds to a poll interval of 64 s. For typical Internet paths, the optimum poll interval is about 64 s. For fast LANs with modern computers, a poll exponent of 4 (16 s) is appropriate. The poll process sends NTP packets at intervals determined by the clock discipline algorithm.',
height: 0.5
},
'ntpd.sys_precision': {
colors: NETDATA.colors[6],
height: 0.2
},
'ntpd.peer_offset': {
info: 'The offset of the peer clock relative to the system clock in milliseconds. Smaller values here weight peers more heavily for selection after the initial synchronization of the local clock. For a system providing time service to other systems, these should be as low as possible.'
},
'ntpd.peer_delay': {
info: 'The round-trip time (RTT) for communication with the peer, similar to the delay shown by the ping
command. Not as critical as either the offset or jitter, but still factored into the selection algorithm (because as a general rule, lower delay means more accurate time). In most cases, it should be below 100ms.'
},
'ntpd.peer_dispersion': {
info: 'This is a measure of the estimated error between the peer and the local system. Lower values here are better.'
},
'ntpd.peer_jitter': {
info: 'This is essentially a remote estimate of the peer\'s system_jitter
value. Lower values here weight highly in favor of peer selection, and this is a good indicator of overall quality of a given time server (good servers will have values not exceeding single digit milliseconds here, with high quality stratum one servers regularly having sub-millisecond jitter).'
},
'ntpd.peer_xleave': {
info: 'This variable is used in interleaved mode (used only in NTP symmetric and broadcast modes). See NTP Interleaved Modes.'
},
'ntpd.peer_rootdelay': {
info: 'For a stratum 1 server, this is the access latency for the reference clock. For lower stratum servers, it is the sum of the peer_delay
and peer_rootdelay
for the system they are syncing off of. Similarly to peer_delay
, lower values here are technically better, but have limited influence in peer selection.'
},
'ntpd.peer_rootdisp': {
info: 'Is the same as peer_rootdelay
, but measures accumulated peer_dispersion
instead of accumulated peer_delay
.'
},
'ntpd.peer_hmode': {
info: 'The peer_hmode
and peer_pmode
variables give info about what mode the packets being sent to and received from a given peer are. Mode 1 is symmetric active (both the local system and the remote peer have each other declared as peers in /etc/ntp.conf
), Mode 2 is symmetric passive (only one side has the other declared as a peer), Mode 3 is client, Mode 4 is server, and Mode 5 is broadcast (also used for multicast and manycast operation).',
height: 0.2
},
'ntpd.peer_pmode': {
height: 0.2
},
'ntpd.peer_hpoll': {
info: 'The peer_hpoll
and peer_ppoll
variables are log2 representations of the polling interval in seconds.',
height: 0.5
},
'ntpd.peer_ppoll': {
height: 0.5
},
'ntpd.peer_precision': {
height: 0.2
},
'spigotmc.tps': {
info: 'The running 1, 5, and 15 minute average number of server ticks per second. An idealized server will show 20.0 for all values, but in practice this almost never happens. Typical servers should show approximately 19.98-20.0 here. Lower values indicate progressively more server-side lag (and thus that you need better hardware for your server or a lower user limit). For every 0.05 ticks below 20, redstone clocks will lag behind by approximately 0.25%. Values below approximately 19.50 may interfere with complex free-running redstone circuits and will noticeably slow down growth.'
},
'spigotmc.users': {
info: 'THe number of currently connect users on the monitored Spigot server.'
},
'unbound.queries': {
info: 'Shows the number of queries being processed of each type. Note that Recursive
queries are also accounted as cache misses.'
},
'unbound.reqlist': {
info: 'Shows various stats about Unbound\'s internal request list.'
},
'unbound.recursion': {
info: 'Average and median time to complete recursive name resolution.'
},
'unbound.cache': {
info: 'The number of items in each of the various caches.'
},
'unbound.threads.queries': {
height: 0.2
},
'unbound.threads.reqlist': {
height: 0.2
},
'unbound.threads.recursion': {
height: 0.2
},
'boinc.tasks': {
info: 'The total number of tasks and the number of active tasks. Active tasks are those which are either currently being processed, or are partialy processed but suspended.'
},
'boinc.states': {
info: 'Counts of tasks in each task state. The normal sequence of states is New
, Downloading
, Ready to Run
, Uploading
, Uploaded
. Tasks which are marked Ready to Run
may be actively running, or may be waiting to be scheduled. Compute Errors
are tasks which failed for some reason during execution. Aborted
tasks were manually cancelled, and will not be processed. Failed Uploads
are otherwise finished tasks which failed to upload to the server, and usually indicate networking issues.'
},
'boinc.sched': {
info: 'Counts of active tasks in each scheduling state. Scheduled
tasks are the ones which will run if the system is permitted to process tasks. Preempted
tasks are on standby, and will run if a Scheduled
task stops running for some reason. Uninitialized
tasks should never be present, and indicate tha the scheduler has not tried to schedule them yet.'
},
'boinc.process': {
info: 'Counts of active tasks in each process state. Executing
tasks are running right now. Suspended
tasks have an associated process, but are not currently running (either because the system isn\'t processing any tasks right now, or because they have been preempted by higher priority tasks). Quit
tasks are exiting gracefully. Aborted
tasks exceeded some resource limit, and are being shut down. Copy Pending
tasks are waiting on a background file transfer to finish. Uninitialized
tasks do not have an associated process yet.'
},
'w1sensor.temp': {
info: 'Temperature derived from 1-Wire temperature sensors.'
},
'logind.sessions': {
info: 'Shows the number of active sessions of each type tracked by logind.'
},
'logind.users': {
info: 'Shows the number of active users of each type tracked by logind.'
},
'logind.seats': {
info: 'Shows the number of active seats tracked by logind. Each seat corresponds to a combination of a display device and input device providing a physical presence for the system.'
},
// ------------------------------------------------------------------------
// ProxySQL
'proxysql.pool_status': {
info: 'The status of the backend servers. ' +
'1=ONLINE
backend server is fully operational, ' +
'2=SHUNNED
backend sever is temporarily taken out of use because of either too many connection errors in a time that was too short, or replication lag exceeded the allowed threshold, ' +
'3=OFFLINE_SOFT
when a server is put into OFFLINE_SOFT mode, new incoming connections aren\'t accepted anymore, while the existing connections are kept until they became inactive. In other words, connections are kept in use until the current transaction is completed. This allows to gracefully detach a backend, ' +
'4=OFFLINE_HARD
when a server is put into OFFLINE_HARD mode, the existing connections are dropped, while new incoming connections aren\'t accepted either. This is equivalent to deleting the server from a hostgroup, or temporarily taking it out of the hostgroup for maintenance work, ' +
'-1
Unknown status.'
},
'proxysql.pool_net': {
info: 'The amount of data sent to/received from the backend ' +
'(This does not include metadata (packets\' headers, OK/ERR packets, fields\' description, etc).'
},
'proxysql.pool_overall_net': {
info: 'The amount of data sent to/received from the all backends ' +
'(This does not include metadata (packets\' headers, OK/ERR packets, fields\' description, etc).'
},
'proxysql.questions': {
info: 'questions
total number of queries sent from frontends, ' +
'slow_queries
number of queries that ran for longer than the threshold in milliseconds defined in global variable mysql-long_query_time
. '
},
'proxysql.connections': {
info: 'aborted
number of frontend connections aborted due to invalid credential or max_connections reached, ' +
'connected
number of frontend connections currently connected, ' +
'created
number of frontend connections created, ' +
'non_idle
number of frontend connections that are not currently idle. '
},
'proxysql.pool_latency': {
info: 'The currently ping time in microseconds, as reported from Monitor.'
},
'proxysql.queries': {
info: 'The number of queries routed towards this particular backend server.'
},
'proxysql.pool_used_connections': {
info: 'The number of connections are currently used by ProxySQL for sending queries to the backend server.'
},
'proxysql.pool_free_connections': {
info: 'The number of connections are currently free. They are kept open in order to minimize the time cost of sending a query to the backend server.'
},
'proxysql.pool_ok_connections': {
info: 'The number of connections were established successfully.'
},
'proxysql.pool_error_connections': {
info: 'The number of connections weren\'t established successfully.'
},
'proxysql.commands_count': {
info: 'The total number of commands of that type executed'
},
'proxysql.commands_duration': {
info: 'The total time spent executing commands of that type, in ms'
}
// ------------------------------------------------------------------------
};