diff --git a/clusters/k3s-dgx/nim-service/qwen.yaml b/clusters/k3s-dgx/nim-service/qwen.yaml
index 36738e9..af59059 100644
--- a/clusters/k3s-dgx/nim-service/qwen.yaml
+++ b/clusters/k3s-dgx/nim-service/qwen.yaml
@@ -12,6 +12,7 @@ spec:
       model:
         engine: "vllm"
         tensorParallelism: "1"
+        profile: default
   storage:
     pvc:
       create: true