From 12caec228e70c9c176c4443f87237ea4fd696f2a Mon Sep 17 00:00:00 2001
From: Eugene Rakhmatulin
Date: Wed, 1 Apr 2026 10:27:50 -0700
Subject: [PATCH] switching gpt-oss-120b to solo only for now

---
Notes (ignored by git am; not part of the commit message):
  * Adds `solo_only: true` to the recipe, changes the default
    `tensor_parallel` from 2 to 1, and drops the
    `--tensor-parallel-size {tensor_parallel}` and
    `--distributed-executor-backend ray` arguments from the command.
  * NOTE(review): after this change the visible part of the command no
    longer references {tensor_parallel}; confirm whether the default is
    still consumed elsewhere or can be removed in a follow-up.
  * NOTE(review): line structure was restored from a copy whose newlines
    and indentation had been collapsed. Leading whitespace on context
    lines is reconstructed (2-space YAML nesting assumed); verify against
    the target file, or apply with `git apply --ignore-whitespace`.

 recipes/openai-gpt-oss-120b.yaml | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/recipes/openai-gpt-oss-120b.yaml b/recipes/openai-gpt-oss-120b.yaml
index 09cfa52..12ee14a 100644
--- a/recipes/openai-gpt-oss-120b.yaml
+++ b/recipes/openai-gpt-oss-120b.yaml
@@ -11,6 +11,9 @@ model: openai/gpt-oss-120b
 # Container image to use
 container: vllm-node-mxfp4
 
+# Only solo now
+solo_only: true
+
 # Build arguments for build-and-copy.sh
 build_args:
   - --exp-mxfp4
@@ -22,7 +25,7 @@ mods: []
 defaults:
   port: 8000
   host: 0.0.0.0
-  tensor_parallel: 2
+  tensor_parallel: 1
   gpu_memory_utilization: 0.70
   max_num_batched_tokens: 8192
 
@@ -37,8 +40,6 @@ command: |
     --tool-call-parser openai \
     --reasoning-parser openai_gptoss \
     --enable-auto-tool-choice \
-    --tensor-parallel-size {tensor_parallel} \
-    --distributed-executor-backend ray \
     --gpu-memory-utilization {gpu_memory_utilization} \
     --enable-prefix-caching \
     --load-format fastsafetensors \