From 8b180f766235f25d8a0157eeed18dc0d40542e38 Mon Sep 17 00:00:00 2001
From: Viktor Barzin
Date: Wed, 6 May 2026 20:35:38 +0000
Subject: [PATCH] openclaw: switch primary model to qwen3-coder-480b (qwen3.5-397b dead on NIM)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

NVIDIA retired nim/qwen/qwen3.5-397b-a17b — modelrelay shows consistent
TIMEOUTs over 24h+ of pings, and
nim/nvidia/llama-3.1-nemotron-ultra-253b-v1 returns 404. With both gone
the openclaw failover never reached mistral-large-3 in time, so every
message hung until the 120s embedded-run timeout.

Promote qwen3-coder-480b-a35b-instruct (already in models list, UP
~1-2s, 256k ctx) to primary; drop the dead nemotron-ultra fallback.
---
Note: line breaks restored from a whitespace-collapsed copy of this patch;
hunk indentation is approximate, so apply with `git apply --ignore-whitespace`.

 stacks/openclaw/main.tf | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/stacks/openclaw/main.tf b/stacks/openclaw/main.tf
index 5d5f9a1d..11d129ee 100644
--- a/stacks/openclaw/main.tf
+++ b/stacks/openclaw/main.tf
@@ -131,8 +131,8 @@ resource "kubernetes_config_map" "openclaw_config" {
             mode = "off"
           }
           model = {
-            primary = "nim/qwen/qwen3.5-397b-a17b"
-            fallbacks = ["nim/mistralai/mistral-large-3-675b-instruct-2512", "nim/nvidia/llama-3.1-nemotron-ultra-253b-v1", "modelrelay/auto-fastest"]
+            primary = "nim/qwen/qwen3-coder-480b-a35b-instruct"
+            fallbacks = ["nim/mistralai/mistral-large-3-675b-instruct-2512", "modelrelay/auto-fastest"]
           }
           models = {
             "modelrelay/auto-fastest" = {}