summary refs log tree commit diff stats
path: root/health/health.d/net.conf
diff options
context:
space:
mode:
Diffstat (limited to 'health/health.d/net.conf')
-rw-r--r-- health/health.d/net.conf 44
1 files changed, 33 insertions, 11 deletions
diff --git a/health/health.d/net.conf b/health/health.d/net.conf
index 028ca7b81b..89eb758a46 100644
--- a/health/health.d/net.conf
+++ b/health/health.d/net.conf
@@ -31,7 +31,9 @@ component: Network
every: 10s
warn: $this > (($status >= $WARNING) ? (85) : (90))
delay: up 1m down 1m multiplier 1.5 max 1h
- info: average inbound utilization for the network interface $family over the last minute
+ info: Average inbound utilization for the network interface $family over the last minute. \
+ High inbound utilization. \
+ Network delays and packet drops are expected when you are getting closer to 100%.
to: sysadmin
template: 1m_sent_traffic_overflow
@@ -48,7 +50,9 @@ component: Network
every: 10s
warn: $this > (($status >= $WARNING) ? (85) : (90))
delay: up 1m down 1m multiplier 1.5 max 1h
- info: average outbound utilization for the network interface $family over the last minute
+ info: Average outbound utilization for the network interface $family over the last minute. \
+ High outbound utilization. \
+ Network delays and packet drops are expected when you are getting closer to 100%.
to: sysadmin
# -----------------------------------------------------------------------------
@@ -101,7 +105,9 @@ component: Network
every: 1m
warn: $this >= 2
delay: up 1m down 1h multiplier 1.5 max 2h
- info: ratio of inbound dropped packets for the network interface $family over the last 10 minutes
+ info: Ratio of inbound dropped packets for the network interface $family over the last 10 minutes. \
+ Network interface $family dropped many packets. \
+ It means packets were received but not processed, e.g. due to lack of resources or unsupported protocol.
to: sysadmin
template: outbound_packets_dropped_ratio
@@ -118,7 +124,9 @@ component: Network
every: 1m
warn: $this >= 2
delay: up 1m down 1h multiplier 1.5 max 2h
- info: ratio of outbound dropped packets for the network interface $family over the last 10 minutes
+ info: Ratio of outbound dropped packets for the network interface $family over the last 10 minutes. \
+ Network interface $family dropped many packets. \
+ It means packets were dropped on their way to transmission, e.g. due to lack of resources.
to: sysadmin
template: wifi_inbound_packets_dropped_ratio
@@ -135,7 +143,9 @@ component: Network
every: 1m
warn: $this >= 10
delay: up 1m down 1h multiplier 1.5 max 2h
- info: ratio of inbound dropped packets for the network interface $family over the last 10 minutes
+ info: Ratio of inbound dropped packets for the network interface $family over the last 10 minutes. \
+ Network interface $family dropped many packets. \
+ It means packets were received but not processed, e.g. due to lack of resources or unsupported protocol.
to: sysadmin
template: wifi_outbound_packets_dropped_ratio
@@ -152,7 +162,9 @@ component: Network
every: 1m
warn: $this >= 10
delay: up 1m down 1h multiplier 1.5 max 2h
- info: ratio of outbound dropped packets for the network interface $family over the last 10 minutes
+ info: Ratio of outbound dropped packets for the network interface $family over the last 10 minutes. \
+ Network interface $family dropped many packets. \
+ It means packets were dropped on their way to transmission, e.g. due to lack of resources.
to: sysadmin
# -----------------------------------------------------------------------------
@@ -171,7 +183,9 @@ component: Network
every: 1m
warn: $this >= 5
delay: down 1h multiplier 1.5 max 2h
- info: number of inbound errors for the network interface $family in the last 10 minutes
+ info: Number of inbound errors for the network interface $family in the last 10 minutes. \
+ Network interface $family received many bad packets. \
+ It includes length, CRC, frame errors, etc.
to: sysadmin
template: interface_outbound_errors
@@ -187,7 +201,9 @@ component: Network
every: 1m
warn: $this >= 5
delay: down 1h multiplier 1.5 max 2h
- info: number of outbound errors for the network interface $family in the last 10 minutes
+ info: Number of outbound errors for the network interface $family in the last 10 minutes. \
+ Network interface $family experienced many transmit problems. \
+ It includes aborted, carrier, FIFO, heartbeat, window errors, etc.
to: sysadmin
# -----------------------------------------------------------------------------
@@ -211,7 +227,11 @@ component: Network
every: 1m
warn: $this > 0
delay: down 1h multiplier 1.5 max 2h
- info: number of FIFO errors for the network interface $family in the last 10 minutes
+ info: Number of FIFO errors for the network interface $family in the last 10 minutes. \
+ Network interface $family experienced FIFO errors. \
+ It indicates that the NIC is not able to handle the peak load of \
+ incoming/outgoing packets with the current ring buffer size. \
+ In case of a high packet drop rate, increasing the appropriate ring buffer can fix the issue.
to: sysadmin
# -----------------------------------------------------------------------------
@@ -251,6 +271,8 @@ component: Network
warn: $this > (($status >= $WARNING)?(200):(5000))
crit: $this > (($status == $CRITICAL)?(5000):(6000))
options: no-clear-notification
- info: ratio of average number of received packets for the network interface $family over the last 10 seconds, \
- compared to the rate over the last minute
+ info: Ratio of an average number of received packets for the network interface $family over the last 10 seconds, \
+ compared to the rate over the last minute. \
+ The number of received packets has increased significantly. \
+ It may indicate a broadcast/multicast storm or DoS attack.
to: sysadmin