Updated tests

This commit is contained in:
Eugene Rakhmatulin
2026-02-04 12:06:30 -08:00
parent c7d45157e0
commit f139c4b55d

View File

@@ -23,7 +23,7 @@ GLM_FLASH_AWQ_ARGS=(
"--max-num-batched-tokens 4096" "--max-num-batched-tokens 4096"
"--max-num-seqs 64" "--max-num-seqs 64"
"--gpu-memory-utilization 0.7" "--gpu-memory-utilization 0.7"
"--port 8888" "--port 8000"
"--host 0.0.0.0" "--host 0.0.0.0"
) )
@@ -34,7 +34,7 @@ GLM_FLASH_AWQ_ARGS=(
GPT_OSS_MODEL="openai/gpt-oss-120b" GPT_OSS_MODEL="openai/gpt-oss-120b"
GPT_OSS_CONTAINER="vllm-node-mxfp4" GPT_OSS_CONTAINER="vllm-node-mxfp4"
GPT_OSS_ARGS=( GPT_OSS_ARGS=(
"--port 8888" "--port 8000"
"--host 0.0.0.0" "--host 0.0.0.0"
"--enable-auto-tool-choice" "--enable-auto-tool-choice"
"--tool-call-parser openai" "--tool-call-parser openai"