From ab34446bcf7f1f35741211473760c716d4b23c15 Mon Sep 17 00:00:00 2001 From: HaimKortovich Date: Thu, 7 May 2026 16:43:11 -0500 Subject: [PATCH] set size limit --- clusters/k3s-dgx/nim-service/qwen.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/clusters/k3s-dgx/nim-service/qwen.yaml b/clusters/k3s-dgx/nim-service/qwen.yaml index e09e982..702d447 100644 --- a/clusters/k3s-dgx/nim-service/qwen.yaml +++ b/clusters/k3s-dgx/nim-service/qwen.yaml @@ -87,6 +87,7 @@ spec: authSecret: hf-api-secret storage: + sharedMemorySizeLimit: 64Gi nimCache: name: qwen36-27b-fp8 replicas: 1