From f602e1aec961641c5b67698b17a9bd2d7a95f1f4 Mon Sep 17 00:00:00 2001 From: HaimKortovich Date: Wed, 6 May 2026 17:48:20 -0500 Subject: [PATCH] set string --- clusters/k3s-dgx/nim-service/qwen.yaml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/clusters/k3s-dgx/nim-service/qwen.yaml b/clusters/k3s-dgx/nim-service/qwen.yaml index c2086bb..36738e9 100644 --- a/clusters/k3s-dgx/nim-service/qwen.yaml +++ b/clusters/k3s-dgx/nim-service/qwen.yaml @@ -26,8 +26,10 @@ metadata: spec: args: - --enable-auto-tool-choice + - --gpu-memory-utilization + - "0.90" - --tool-call-parser - - llama3_json + - hermes image: repository: nvcr.io/nim/qwen/qwen3-32b-dgx-spark tag: "1.1.0-variant"