From 3d4cdf320371e1fbc8215bfc83f2cc6e0239fccc Mon Sep 17 00:00:00 2001 From: Viktor Barzin Date: Mon, 16 Feb 2026 20:09:53 +0000 Subject: [PATCH] [ci skip] Fix Alloy OOMKill and iDRAC priority class conflict MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Alloy: bump memory request/limit from 64Mi/128Mi to 256Mi/768Mi — pods were OOMKilled at 128Mi, steady-state usage is ~400-450Mi per node - iDRAC Redfish Exporter: add explicit priority_class_name to resolve conflict between Kyverno priority injection and default priority: 0 --- modules/kubernetes/monitoring/alloy.yaml | 7 +++++-- modules/kubernetes/monitoring/idrac.tf | 1 + 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/modules/kubernetes/monitoring/alloy.yaml b/modules/kubernetes/monitoring/alloy.yaml index d3d6a0db..857c10e7 100644 --- a/modules/kubernetes/monitoring/alloy.yaml +++ b/modules/kubernetes/monitoring/alloy.yaml @@ -100,10 +100,13 @@ alloy: } # Resource limits for DaemonSet pods + # Alloy tails logs from all containers on the node via K8s API and batches + # them to Loki. Memory scales with number of active log streams (~30-50 per node). + # Pods were OOMKilled at the 128Mi limit; steady-state usage is ~400-450Mi per pod. resources: requests: cpu: 50m - memory: 64Mi + memory: 256Mi limits: cpu: 200m - memory: 128Mi + memory: 768Mi diff --git a/modules/kubernetes/monitoring/idrac.tf b/modules/kubernetes/monitoring/idrac.tf index 99ba0b93..8d4d2572 100644 --- a/modules/kubernetes/monitoring/idrac.tf +++ b/modules/kubernetes/monitoring/idrac.tf @@ -59,6 +59,7 @@ resource "kubernetes_deployment" "idrac-redfish" { } } spec { + priority_class_name = "tier-1-cluster" container { # https://github.com/mrlhansen/idrac_exporter?tab=readme-ov-file image = "ghcr.io/mrlhansen/idrac_exporter:latest"