summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorCosta Tsaousis <costa@tsaousis.gr>2018-07-08 02:44:22 +0300
committerGitHub <noreply@github.com>2018-07-08 02:44:22 +0300
commit07f25d0ae94c7e4fd1fd8c4463c62d31f6a0be42 (patch)
tree3959ad0b23e20f90043340e6812c89012cc3ca98
parent5a3b44d8d56b1179085767e93bdebea19a580005 (diff)
parent454d5182ae6fe804cd2e5ee583f82edc1c08a9d4 (diff)
Merge pull request #3928 from ccremer/apcupsd
Add basic apcupsd alarm templates
-rw-r--r--conf.d/Makefile.am1
-rw-r--r--conf.d/health.d/apcupsd.conf40
2 files changed, 41 insertions, 0 deletions
diff --git a/conf.d/Makefile.am b/conf.d/Makefile.am
index 72807b6804..7bd3622f65 100644
--- a/conf.d/Makefile.am
+++ b/conf.d/Makefile.am
@@ -88,6 +88,7 @@ healthconfigdir=$(configdir)/health.d
dist_healthconfig_DATA = \
health.d/apache.conf \
+ health.d/apcupsd.conf \
health.d/backend.conf \
health.d/bcache.conf \
health.d/beanstalkd.conf \
diff --git a/conf.d/health.d/apcupsd.conf b/conf.d/health.d/apcupsd.conf
new file mode 100644
index 0000000000..214974e230
--- /dev/null
+++ b/conf.d/health.d/apcupsd.conf
@@ -0,0 +1,40 @@
+# you can disable an alarm notification by setting the 'to' line to: silent
+
+template: 10min_ups_load
+ on: apcupsd.load
+ os: *
+ hosts: *
+ lookup: average -10m unaligned of percentage
+ units: %
+ every: 1m
+ warn: $this > (($status >= $WARNING) ? (70) : (80))
+ crit: $this > (($status == $CRITICAL) ? (85) : (95))
+ delay: down 10m multiplier 1.5 max 1h
+ info: average UPS load for the last 10 minutes
+ to: sitemgr
+
+# Discussion in https://github.com/firehol/netdata/pull/3928:
+# Raise the warning as soon as the UPS goes on battery (average charge drops below 100%) and clear it only when fully charged again.
+template: ups_charge
+ on: apcupsd.charge
+ os: *
+ hosts: *
+ lookup: average -60s unaligned of charge
+ units: %
+ every: 60s
+ warn: $this < 100
+ crit: $this < (($status == $CRITICAL) ? (60) : (50))
+ delay: down 10m multiplier 1.5 max 1h
+ info: current UPS charge, averaged over the last 60 seconds to reduce measurement errors
+ to: sitemgr
+
+template: apcupsd_last_collected_secs
+ on: apcupsd.load
+ calc: $now - $last_collected_t
+ every: 10s
+ units: seconds ago
+ warn: $this > (($status >= $WARNING) ? ($update_every) : ( 5 * $update_every))
+ crit: $this > (($status == $CRITICAL) ? ($update_every) : (60 * $update_every))
+ delay: down 5m multiplier 1.5 max 1h
+ info: number of seconds since the last successful data collection
+ to: sitemgr