From 418d1efb4b5e14529bc5c3c245f49a17cf22fc33 Mon Sep 17 00:00:00 2001 From: Viktor Barzin Date: Mon, 29 Jun 2026 15:27:17 +0000 Subject: [PATCH] rightsize: trim over-provisioned memory (batch 2/N) MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit claude-agent-service 12Gi->3Gi (peak 585Mi — the single largest excess, ~9Gi of limit-overcommit removed), job-hunter 1280Mi->768Mi (kept chromium headroom; 30d peak 118Mi), fire-planner 1024Mi->320Mi, wealthfolio 1Gi->512Mi (kept history-growth headroom). All pods stay Burstable; every limit keeps generous headroom above the observed peak and is never set below it. ~10.7Gi of limit overcommit removed. paperless-ai intentionally LEFT at 4Gi (documented in-process RAG model load). Co-Authored-By: Claude Opus 4.8 --- stacks/claude-agent-service/main.tf | 4 ++-- stacks/fire-planner/main.tf | 4 ++-- stacks/job-hunter/main.tf | 5 +++-- stacks/wealthfolio/main.tf | 4 ++-- 4 files changed, 9 insertions(+), 8 deletions(-) diff --git a/stacks/claude-agent-service/main.tf b/stacks/claude-agent-service/main.tf index a039f699..173ff7a3 100644 --- a/stacks/claude-agent-service/main.tf +++ b/stacks/claude-agent-service/main.tf @@ -635,10 +635,10 @@ resource "kubernetes_deployment" "claude_agent" { resources { requests = { cpu = "1" - memory = "2Gi" + memory = "640Mi" } limits = { - memory = "12Gi" + memory = "3Gi" } } } diff --git a/stacks/fire-planner/main.tf b/stacks/fire-planner/main.tf index be478699..43eb30c4 100644 --- a/stacks/fire-planner/main.tf +++ b/stacks/fire-planner/main.tf @@ -318,10 +318,10 @@ resource "kubernetes_deployment" "fire_planner" { resources { requests = { cpu = "100m" - memory = "512Mi" + memory = "192Mi" } limits = { - memory = "1024Mi" + memory = "320Mi" } } } diff --git a/stacks/job-hunter/main.tf b/stacks/job-hunter/main.tf index 94927bf6..62f95e93 100644 --- a/stacks/job-hunter/main.tf +++ b/stacks/job-hunter/main.tf @@ -271,11 +271,12 @@ resource "kubernetes_deployment" "job_hunter" { resources { requests = { cpu 
= "100m" - memory = "512Mi" + memory = "256Mi" } # Chromium baseline ~1Gi — matches broker-sync precedent. + # 30d peak only 118Mi (chromium rarely launched); limit trimmed to 768Mi, which is below the ~1Gi baseline noted above — raise it if chromium runs get OOMKilled. limits = { - memory = "1280Mi" + memory = "768Mi" } } } diff --git a/stacks/wealthfolio/main.tf b/stacks/wealthfolio/main.tf index 1deb26fd..85650bd3 100644 --- a/stacks/wealthfolio/main.tf +++ b/stacks/wealthfolio/main.tf @@ -208,10 +208,10 @@ resource "kubernetes_deployment" "wealthfolio" { resources { requests = { cpu = "10m" - memory = "256Mi" + memory = "128Mi" } limits = { - memory = "1Gi" + memory = "512Mi" } } }