From 066554aa366365fc93f64f2dff1c1cd62d7ab697 Mon Sep 17 00:00:00 2001
From: HaimKortovich
Date: Wed, 6 May 2026 17:42:18 -0500
Subject: [PATCH] use 32b

---
Notes (ignored by `git am`; not part of the commit message):
  * Renames the NIMCache resource from qwen2.5-7b-instruct to
    qwen3-32b-instruct and switches its modelPuller image from
    nvcr.io/nim/qwen/qwen-2.5-7b-instruct:latest to
    nvcr.io/nim/qwen/qwen3-32b-dgx-spark:1.1.0-variant.
  * The resource name changes, so anything that refers to the old
    NIMCache name must be updated separately -- TODO confirm no
    remaining references.
  * NOTE(review): line breaks and the YAML indentation of the hunk lines
    were reconstructed from the NIMCache nesting (metadata.name,
    spec.source.ngc.*); verify against the target file before applying.

 clusters/k3s-dgx/nim-service/qwen.yaml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/clusters/k3s-dgx/nim-service/qwen.yaml b/clusters/k3s-dgx/nim-service/qwen.yaml
index 193bdc3..362c127 100644
--- a/clusters/k3s-dgx/nim-service/qwen.yaml
+++ b/clusters/k3s-dgx/nim-service/qwen.yaml
@@ -1,12 +1,12 @@
 apiVersion: apps.nvidia.com/v1alpha1
 kind: NIMCache
 metadata:
-  name: qwen2.5-7b-instruct
+  name: qwen3-32b-instruct
   namespace: nim-service
 spec:
   source:
     ngc:
-      modelPuller: nvcr.io/nim/qwen/qwen-2.5-7b-instruct:latest
+      modelPuller: nvcr.io/nim/qwen/qwen3-32b-dgx-spark:1.1.0-variant
       pullSecret: ngc-secret
       authSecret: ngc-api-secret
       model: