use vllm/vllm-openai image

2026-05-07 14:59:55 -05:00
parent 2229daa1a3
commit 1a4e73b755
1 changed files with 2 additions and 4 deletions
--- a/clusters/k3s-dgx/nim-service/qwen.yaml
+++ b/clusters/k3s-dgx/nim-service/qwen.yaml
@@ -60,11 +60,9 @@ spec:
    - "--enable-prefix-caching"
    - '--speculative-config={"method":"mtp","num_speculative_tokens":2}'
  image:
-    repository: nvcr.io/nim/nvidia/llm-nim
+    repository: vllm/vllm-openai
-    tag: "1.12"
+    tag: "v0.19.1-cu130"
    pullPolicy: IfNotPresent
    pullSecrets:
      - ngc-secret
  authSecret: hf-api-secret
  storage:
    nimCache: