Fixed qwen3.6 recipes, including serving Qwen3.6-35B-A3B-FP8 instead of Qwen3.5 and removing an outdated mod comment

2026-05-06 10:56:09 -07:00
parent c67c5b5c1e
commit b87854fd4c
2 changed files with 5 additions and 6 deletions
--- a/recipes/qwen3.6-35b-a3b-fp8.yaml
+++ b/recipes/qwen3.6-35b-a3b-fp8.yaml
@@ -14,7 +14,6 @@ model: Qwen/Qwen3.6-35B-A3B-FP8
 # Container image to use
 container: vllm-node

-# Mod required to fix slowness and crash in the cluster (tracking https://github.com/vllm-project/vllm/issues/33857)
 mods:
  - mods/fix-qwen3.6-chat-template

@@ -33,7 +32,7 @@ env:

 # The vLLM serve command template
 command: |
-  vllm serve Qwen/Qwen3.5-35B-A3B-FP8 \
+  vllm serve Qwen/Qwen3.6-35B-A3B-FP8 \
    --host {host} \
    --port {port} \
    --max-model-len {max_model_len} \