Skip to content

Commit

Permalink
ci: 🎡 add ingress alerts
Browse files Browse the repository at this point in the history
  • Loading branch information
jaskaransarkaria committed Feb 28, 2024
1 parent 7dcf8b3 commit 4ce71be
Show file tree
Hide file tree
Showing 2 changed files with 39 additions and 0 deletions.
9 changes: 9 additions & 0 deletions main.tf
Original file line number Diff line number Diff line change
Expand Up @@ -101,3 +101,12 @@ resource "kubectl_manifest" "nginx_ingress_default_certificate" {
kubernetes_namespace.ingress_controllers
]
}

# -----------------------------------------------------------------------------
# Prometheus alerting rules for the ingress controllers
#
# Applies the manifest stored in resources/alerts.yaml through the kubectl
# provider.
# -----------------------------------------------------------------------------
resource "kubectl_manifest" "prometheus_rule_alert" {
  # Create the manifest only when this module instance is the "default"
  # controller; any other controller_name yields zero instances.
  # NOTE(review): presumably this avoids applying the same rule once per
  # controller instance - confirm.
  count = var.controller_name == "default" ? 1 : 0

  # Manifest body is read verbatim from the module's resources directory.
  yaml_body = file("${path.module}/resources/alerts.yaml")

  # Apply only after the nginx ingress Helm release has been created.
  depends_on = [
    helm_release.nginx_ingress,
  ]
}
30 changes: 30 additions & 0 deletions resources/alerts.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,30 @@
---
# PrometheusRule defining alerts for pods in the ingress-controllers namespace.
apiVersion: monitoring.coreos.com/v1
kind: PrometheusRule
metadata:
  name: ingress-controller-errors
  namespace: ingress-controllers
  labels:
    # NOTE(review): presumably the label the Prometheus rule selector matches
    # on - confirm against the Prometheus resource.
    prometheus: cloud-platform
spec:
  groups:
    - name: ingress-controllers
      rules:
        # Container restarts: the per-second restart rate over the last 15
        # minutes, scaled by 60 * 15 to a 15-minute window, must stay above
        # zero for 10 minutes before the alert fires.
        - alert: IngressControllerIsCrashLoopBackoffing
          expr: rate(kube_pod_container_status_restarts_total{job="kube-state-metrics",namespace="ingress-controllers"}[15m]) * 60 * 15 > 0
          for: 10m
          labels:
            severity: warning
          annotations:
            message: An Ingress Controller pod is CrashLoopBackOff'ing
        # OOM kills: the "controller" container's last termination reason is
        # OOMKilled AND its restart counter increased within the last 5
        # minutes, joined on container, namespace and pod.
        # NOTE(review): `for: 15m` is longer than the 5m increase() window, so
        # a single restart looks unable to keep the expression true long
        # enough to fire; it appears to need repeated restarts - confirm this
        # is intended.
        - alert: IngressControllerIsOOMKilled
          expr: |-
            kube_pod_container_status_last_terminated_reason{container="controller",namespace="ingress-controllers",reason="OOMKilled"} == 1
            and on(container, namespace, pod) increase(kube_pod_container_status_restarts_total{container="controller",namespace="ingress-controllers"}[5m]) > 0
          for: 15m
          labels:
            severity: warning
          annotations:
            message: |
              An Ingress Controller pod has restarted because of OOMKilled. This alert works by watching for a pod that has been restarted within 5 minutes and the last termination status is OOMKilled.

0 comments on commit 4ce71be

Please sign in to comment.