From 7064e7733ebb26f3b3d4eddcfcf30c8ff97c68cf Mon Sep 17 00:00:00 2001
From: Tariq Mahmood
Date: Wed, 22 Jan 2025 11:03:40 +0000
Subject: [PATCH 1/2] new alert added for Node NotReady State

---
 resources/prometheusrule-alerts/node-alerts.yaml | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/resources/prometheusrule-alerts/node-alerts.yaml b/resources/prometheusrule-alerts/node-alerts.yaml
index 7f549d1..bbd35db 100644
--- a/resources/prometheusrule-alerts/node-alerts.yaml
+++ b/resources/prometheusrule-alerts/node-alerts.yaml
@@ -95,3 +95,11 @@ spec:
       for: 15s
       labels:
         severity: info-warning
+    - alert: NodeNotReadyState
+      annotations:
+        message: 'The Node is in a state of NotReady, investigate further'
+        runbook_url: https://github.com/ministryofjustice/cloud-platform-terraform-monitoring/blob/main/resources/prometheusrule-alerts/README.md
+      expr: (kube_node_status_condition{condition="Ready", status="true"})
+      for: 15m
+      labels:
+        severity: warning

From 4b1d363f364046576a9f8cac9fbe3dd0f5572ca5 Mon Sep 17 00:00:00 2001
From: Tariq Mahmood
Date: Wed, 22 Jan 2025 12:26:20 +0000
Subject: [PATCH 2/2] changed condition to NotReady

---
 resources/prometheusrule-alerts/node-alerts.yaml | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/resources/prometheusrule-alerts/node-alerts.yaml b/resources/prometheusrule-alerts/node-alerts.yaml
index bbd35db..7a1ab9b 100644
--- a/resources/prometheusrule-alerts/node-alerts.yaml
+++ b/resources/prometheusrule-alerts/node-alerts.yaml
@@ -99,7 +99,8 @@ spec:
       annotations:
         message: 'The Node is in a state of NotReady, investigate further'
         runbook_url: https://github.com/ministryofjustice/cloud-platform-terraform-monitoring/blob/main/resources/prometheusrule-alerts/README.md
-      expr: (kube_node_status_condition{condition="Ready", status="true"})
+      # Ready/status="true" is 1 while a node is Ready; "== 0" selects NotReady or Unknown nodes.
+      expr: kube_node_status_condition{condition="Ready", status="true"} == 0
       for: 15m
       labels:
         severity: warning