diff --git a/clusters/k3s-dgx/nim-service/qwen.yaml b/clusters/k3s-dgx/nim-service/qwen.yaml
index 193bdc3..362c127 100644
--- a/clusters/k3s-dgx/nim-service/qwen.yaml
+++ b/clusters/k3s-dgx/nim-service/qwen.yaml
@@ -1,12 +1,12 @@
 apiVersion: apps.nvidia.com/v1alpha1
 kind: NIMCache
 metadata:
-  name: qwen2.5-7b-instruct
+  name: qwen3-32b-instruct
   namespace: nim-service
 spec:
   source:
     ngc:
-      modelPuller: nvcr.io/nim/qwen/qwen-2.5-7b-instruct:latest
+      modelPuller: nvcr.io/nim/qwen/qwen3-32b-dgx-spark:1.1.0-variant
       pullSecret: ngc-secret
       authSecret: ngc-api-secret
       model: