From 776754ef7203a15bdd413c1ab55e29435fd52620 Mon Sep 17 00:00:00 2001
From: Johannes Christ
Date: Fri, 17 May 2024 20:13:00 +0200
Subject: [PATCH] Disable alerts for known problematic services

---
NOTE(review): this patch was recovered from a copy in which all lines had
been joined into one. The line structure below is restored from the patch
syntax; the leading indentation of the hunk lines is reconstructed and must
be confirmed against ansible/host_vars/lovelace/prometheus.yml before
applying. The From: header carries no e-mail address in the recovered copy.

 ansible/host_vars/lovelace/prometheus.yml | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/ansible/host_vars/lovelace/prometheus.yml b/ansible/host_vars/lovelace/prometheus.yml
index 6f8db3c1..5d114a10 100644
--- a/ansible/host_vars/lovelace/prometheus.yml
+++ b/ansible/host_vars/lovelace/prometheus.yml
@@ -81,8 +81,7 @@ prometheus_rules: |
     - name: node
       rules:
         - alert: node/systemd-unit-failed
-          # expr: node_systemd_unit_state{state="failed", name!="openipmi.service", name!="nvmf-autoconnect.service"} != 0
-          expr: node_systemd_unit_state{state="failed"} != 0
+          expr: node_systemd_unit_state{state="failed", name!="openipmi.service", name!="nvmf-autoconnect.service"} != 0
           for: 15m
           labels:
             severity: warning