From 6491c6cebef5528a42edb1ae847046c341f1ca18 Mon Sep 17 00:00:00 2001 From: HaimKortovich Date: Thu, 7 May 2026 15:12:03 -0500 Subject: [PATCH] use vllm profile --- clusters/k3s-dgx/nim-service/qwen.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/clusters/k3s-dgx/nim-service/qwen.yaml b/clusters/k3s-dgx/nim-service/qwen.yaml index 947d577..fc06171 100644 --- a/clusters/k3s-dgx/nim-service/qwen.yaml +++ b/clusters/k3s-dgx/nim-service/qwen.yaml @@ -59,7 +59,7 @@ spec: storage: nimCache: name: qwen36-27b-fp8 - profile: tensorrt_llm + profile: vllm replicas: 1 resources: limits: