From 7ceea856475b872ac37192787cdeed152c820e96 Mon Sep 17 00:00:00 2001 From: Eugene Rakhmatulin Date: Wed, 11 Mar 2026 11:20:56 -0700 Subject: [PATCH] Fixed qwen3-coder-next-int4-autoround to exclude Ray --- recipes/qwen3-coder-next-int4-autoround.yaml | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/recipes/qwen3-coder-next-int4-autoround.yaml b/recipes/qwen3-coder-next-int4-autoround.yaml index b308a20..2060381 100644 --- a/recipes/qwen3-coder-next-int4-autoround.yaml +++ b/recipes/qwen3-coder-next-int4-autoround.yaml @@ -22,7 +22,6 @@ mods: defaults: port: 8000 host: 0.0.0.0 - tensor_parallel: 2 gpu_memory_utilization: 0.7 max_model_len: 262144 @@ -40,7 +39,5 @@ command: | --port {port} \ --load-format fastsafetensors \ --enable-prefix-caching \ - --max-model-len {max_model_len} \ - -tp {tensor_parallel} \ - --distributed-executor-backend ray + --max-model-len {max_model_len}