Removed --enable-expert-parallel from the 3-node Qwen config; raised gpu_memory_utilization to 0.7 and max_num_batched_tokens to 16384
This commit is contained in:
@@ -28,9 +28,9 @@ defaults:
|
|||||||
port: 8000
|
port: 8000
|
||||||
host: 0.0.0.0
|
host: 0.0.0.0
|
||||||
pipeline_parallel: 3
|
pipeline_parallel: 3
|
||||||
gpu_memory_utilization: 0.6
|
gpu_memory_utilization: 0.7
|
||||||
max_model_len: 262144
|
max_model_len: 262144
|
||||||
max_num_batched_tokens: 4176
|
max_num_batched_tokens: 16384
|
||||||
|
|
||||||
# Environment variables
|
# Environment variables
|
||||||
env:
|
env:
|
||||||
@@ -55,7 +55,6 @@ command: |
|
|||||||
--chat-template unsloth.jinja \
|
--chat-template unsloth.jinja \
|
||||||
-tp 1 \
|
-tp 1 \
|
||||||
-pp {pipeline_parallel} \
|
-pp {pipeline_parallel} \
|
||||||
--enable-expert-parallel \
|
|
||||||
--distributed-executor-backend ray
|
--distributed-executor-backend ray
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user