diff options
author | Ilya Mashchenko <ilya@netdata.cloud> | 2024-07-05 11:33:18 +0300 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-07-05 11:33:18 +0300 |
commit | 943c4fac92964f4164680a9245d46a1adf620d1b (patch) | |
tree | 2b3ce1e36ad042cc7aab13cfb103216e5a850b1b | |
parent | 1c62a5668824ce94c438cb8dc8cce2dfa80d97e9 (diff) |
health add alarm docker container down (#18075)
-rw-r--r-- | src/health/health.d/docker.conf | 23 |
1 file changed, 22 insertions, 1 deletion
diff --git a/src/health/health.d/docker.conf b/src/health/health.d/docker.conf
index 668614d4dc..edb63a08ca 100644
--- a/src/health/health.d/docker.conf
+++ b/src/health/health.d/docker.conf
@@ -1,4 +1,6 @@
- template: docker_container_unhealthy
+# you can disable an alarm notification by setting the 'to' line to: silent
+
+template: docker_container_unhealthy
 on: docker.container_health_status
 class: Errors
 type: Containers
@@ -10,3 +12,22 @@ component: Docker
 summary: Docker container ${label:container_name} health
 info: ${label:container_name} docker container health status is unhealthy
 to: sysadmin
+
+# This alert monitors the status of Docker containers and triggers if any container is exited (down).
+# To enable this alert for specific containers, you need to modify the "chart labels" filter.
+# This filter uses Netdata's simple pattern matching syntax.
+
+ template: docker_container_down
+ on: docker.container_state
+ class: Errors
+ type: Containers
+ component: Docker
+chart labels: container_name=!*
+ units: status
+ every: 10s
+ lookup: average -10s of exited
+ warn: $this > 0
+ delay: down 1m multiplier 1.5 max 2h
+ summary: Docker container ${label:container_name} down
+ info: Docker container ${label:container_name} is currently not running
+ to: sysadmin