From afe52ca6af107b255f6e5aa00bc9c7a8fc1f1236 Mon Sep 17 00:00:00 2001 From: teutat3s Date: Wed, 6 Nov 2024 21:28:28 +0100 Subject: [PATCH] alertmanager: alert on high load only after 20m --- modules/prometheus/alert-rules.nix | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/modules/prometheus/alert-rules.nix b/modules/prometheus/alert-rules.nix index 866709b7..3c1b601a 100644 --- a/modules/prometheus/alert-rules.nix +++ b/modules/prometheus/alert-rules.nix @@ -142,8 +142,8 @@ lib.mapAttrsToList cpu_using_90percent = { condition = ''100 - (avg by (instance) (irate(node_cpu_seconds_total{mode="idle"}[5m])) * 100) >= 90''; - time = "10m"; - description = "{{$labels.instance}} is running with cpu usage > 90% for at least 10 minutes: {{$value}}"; + time = "20m"; + description = "{{$labels.instance}} is running with cpu usage > 90% for at least 20 minutes: {{$value}}"; }; reboot = {