arthur.barton.de Git - netdata.git/commitdiff
added alarms for common UDP buffer errors
author Costa Tsaousis (ktsaou) <costa@tsaousis.gr>
Sat, 14 Jan 2017 00:41:01 +0000 (02:41 +0200)
committer Costa Tsaousis (ktsaou) <costa@tsaousis.gr>
Sat, 14 Jan 2017 00:41:01 +0000 (02:41 +0200)
conf.d/Makefile.am
conf.d/health.d/udp_errors.conf [new file with mode: 0644]

index fbffc0f82bf8314aba41d8d3e2cecf7867638f93..7ab660f0d96dfbeec8e1b6dbc9f504a7cf24a3d9 100644 (file)
@@ -79,6 +79,7 @@ dist_healthconfig_DATA = \
     health.d/squid.conf \
     health.d/swap.conf \
     health.d/tcp_resets.conf \
+    health.d/udp_errors.conf \
     $(NULL)
 
 chartsconfigdir=$(configdir)/charts.d
diff --git a/conf.d/health.d/udp_errors.conf b/conf.d/health.d/udp_errors.conf
new file mode 100644 (file)
index 0000000..98e955c
--- /dev/null
@@ -0,0 +1,40 @@
+# -----------------------------------------------------------------------------
+
+   alarm: ipv4_udperrors_last_collected_secs
+      on: ipv4.udperrors
+    calc: $now - $last_collected_t
+   units: seconds ago
+   every: 10s
+    warn: $this > (($status >= $WARNING)  ? ($update_every) : ( 5 * $update_every))
+    crit: $this > (($status == $CRITICAL) ? ($update_every) : (60 * $update_every))
+   delay: up 0 down 5m multiplier 1.5 max 1h
+    info: number of seconds since the last successful data collection
+      to: sysadmin
+
+# -----------------------------------------------------------------------------
+# UDP receive buffer errors
+
+   alarm: 1m_ipv4_udp_receive_buffer_errors
+      on: ipv4.udperrors
+  lookup: sum -1m unaligned absolute of RcvbufErrors
+   units: errors
+   every: 10s
+    warn: $this > 0
+    crit: $this > 100
+    info: number of UDP receive buffer errors during the last minute
+   delay: up 0 down 60m multiplier 1.2 max 2h
+      to: sysadmin
+
+# -----------------------------------------------------------------------------
+# UDP send buffer errors
+
+   alarm: 1m_ipv4_udp_send_buffer_errors
+      on: ipv4.udperrors
+  lookup: sum -1m unaligned absolute of SndbufErrors
+   units: errors
+   every: 10s
+    warn: $this > 0
+    crit: $this > 100
+    info: number of UDP send buffer errors during the last minute
+   delay: up 0 down 60m multiplier 1.2 max 2h
+      to: sysadmin