From 0bef50c89667e38c3b30b292a9c8d8a5cf76daae Mon Sep 17 00:00:00 2001 From: HaimKortovich Date: Tue, 5 May 2026 15:15:37 -0500 Subject: [PATCH] use correct format --- clusters/k3s-dgx/apps/huihui-granite-inference.yaml | 7 ++----- 1 file changed, 2 insertions(+), 5 deletions(-) diff --git a/clusters/k3s-dgx/apps/huihui-granite-inference.yaml b/clusters/k3s-dgx/apps/huihui-granite-inference.yaml index 114be8e..d0f98f3 100644 --- a/clusters/k3s-dgx/apps/huihui-granite-inference.yaml +++ b/clusters/k3s-dgx/apps/huihui-granite-inference.yaml @@ -4,16 +4,13 @@ metadata: name: huihui-granite spec: model: - modelFormat: - name: huggingface - storageUri: "hf://huihui-ai/Huihui-granite-4.1-30b-abliterated" + uri: hf://huihui-ai/Huihui-granite-4.1-30b-abliterated + name: huihui-ai/Huihui-granite-4.1-30b-abliterated replicas: 1 template: containers: - name: main image: quay.io/pierdipi/vllm-cpu:latest - args: - - --model_name=huihui-granite securityContext: runAsNonRoot: false env: