diff --git a/clusters/k3s-dgx/nim-service/qwen.yaml b/clusters/k3s-dgx/nim-service/qwen.yaml index 702d447..1d628c1 100644 --- a/clusters/k3s-dgx/nim-service/qwen.yaml +++ b/clusters/k3s-dgx/nim-service/qwen.yaml @@ -87,8 +87,7 @@ spec: authSecret: hf-api-secret storage: - sharedMemorySizeLimit: - sizeLimit: 64Gi + sharedMemorySizeLimit: 64Gi nimCache: name: qwen36-27b-fp8 replicas: 1