From 9dc09bd04b6420a3b3c155c05bf2542dbb0dbdd7 Mon Sep 17 00:00:00 2001 From: Eugene Rakhmatulin Date: Fri, 6 Mar 2026 13:56:06 -0800 Subject: [PATCH] Renamed recipe for qwen3.5-35b-a3b-fp8 to match others --- recipes/{qwen35-35b-a3b-fp8.yaml => qwen3.5-35b-a3b-fp8.yaml} | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) rename recipes/{qwen35-35b-a3b-fp8.yaml => qwen3.5-35b-a3b-fp8.yaml} (98%) diff --git a/recipes/qwen35-35b-a3b-fp8.yaml b/recipes/qwen3.5-35b-a3b-fp8.yaml similarity index 98% rename from recipes/qwen35-35b-a3b-fp8.yaml rename to recipes/qwen3.5-35b-a3b-fp8.yaml index 296146a..e2bc05b 100644 --- a/recipes/qwen35-35b-a3b-fp8.yaml +++ b/recipes/qwen3.5-35b-a3b-fp8.yaml @@ -24,7 +24,7 @@ defaults: host: 0.0.0.0 tensor_parallel: 2 gpu_memory_utilization: 0.7 - max_model_len: 131072 + max_model_len: 262144 max_num_batched_tokens: 16384 # Environment variables