From 8b180f766235f25d8a0157eeed18dc0d40542e38 Mon Sep 17 00:00:00 2001
From: Viktor Barzin <vbarzin@gmail.com>
Date: Wed, 6 May 2026 20:35:38 +0000
Subject: [PATCH] openclaw: switch primary model to qwen3-coder-480b
 (qwen3.5-397b dead on NIM)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

NVIDIA retired nim/qwen/qwen3.5-397b-a17b — modelrelay shows consistent
TIMEOUTs over 24h+ of pings, and nim/nvidia/llama-3.1-nemotron-ultra-253b-v1
returns 404. With both gone, the openclaw failover never reached
mistral-large-3 in time, so every message hung until the 120s embedded-run
timeout. Promote qwen3-coder-480b-a35b-instruct (already in the models list,
UP, ~1-2s, 256k ctx) to primary and drop the dead nemotron-ultra fallback.
---
 stacks/openclaw/main.tf | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/stacks/openclaw/main.tf b/stacks/openclaw/main.tf
index 5d5f9a1d..11d129ee 100644
--- a/stacks/openclaw/main.tf
+++ b/stacks/openclaw/main.tf
@@ -131,8 +131,8 @@ resource "kubernetes_config_map" "openclaw_config" {
             mode = "off"
           }
           model = {
-            primary   = "nim/qwen/qwen3.5-397b-a17b"
-            fallbacks = ["nim/mistralai/mistral-large-3-675b-instruct-2512", "nim/nvidia/llama-3.1-nemotron-ultra-253b-v1", "modelrelay/auto-fastest"]
+            primary   = "nim/qwen/qwen3-coder-480b-a35b-instruct"
+            fallbacks = ["nim/mistralai/mistral-large-3-675b-instruct-2512", "modelrelay/auto-fastest"]
           }
           models = {
             "modelrelay/auto-fastest"                                = {}