From 0159266889f51875ad33f0a551af7d0dd4e7f992 Mon Sep 17 00:00:00 2001 From: "lucas.mathieu" Date: Mon, 5 Jan 2026 10:42:43 +0100 Subject: [PATCH] feat(monitoring): Remove the HostCpuIsUnderutilized alert --- monitoring/prometheus/alerts/node-exporter.yml | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/monitoring/prometheus/alerts/node-exporter.yml b/monitoring/prometheus/alerts/node-exporter.yml index 9a4c93f..1a7fb12 100644 --- a/monitoring/prometheus/alerts/node-exporter.yml +++ b/monitoring/prometheus/alerts/node-exporter.yml @@ -139,14 +139,14 @@ groups: description: "CPU load is > 80%\n VALUE = {{ $value }}\n LABELS = {{ $labels }}" # You may want to increase the alert manager 'repeat_interval' for this type of alert to daily or weekly - - alert: HostCpuIsUnderutilized - expr: '(min by (instance) (rate(node_cpu_seconds_total{mode="idle"}[1h]))) > 0.8' - for: 1w - labels: - severity: info - annotations: - summary: Host CPU is underutilized (instance {{ $labels.instance }}) - description: "CPU load has been < 20% for 1 week. Consider reducing the number of CPUs.\n VALUE = {{ $value }}\n LABELS = {{ $labels }}" + # - alert: HostCpuIsUnderutilized + # expr: '(min by (instance) (rate(node_cpu_seconds_total{mode="idle"}[1h]))) > 0.8' + # for: 1w + # labels: + # severity: info + # annotations: + # summary: Host CPU is underutilized (instance {{ $labels.instance }}) + # description: "CPU load has been < 20% for 1 week. Consider reducing the number of CPUs.\n VALUE = {{ $value }}\n LABELS = {{ $labels }}" - alert: HostCpuStealNoisyNeighbor expr: 'avg by(instance) (rate(node_cpu_seconds_total{mode="steal"}[5m])) * 100 > 10'