Fix typo in pipeline_parallel setting in Qwen3.5-397B-INT4-Autoround recipe
This commit is contained in:
@@ -27,7 +27,7 @@ mods:
|
|||||||
defaults:
|
defaults:
|
||||||
port: 8000
|
port: 8000
|
||||||
host: 0.0.0.0
|
host: 0.0.0.0
|
||||||
pipeline_parellel: 3
|
pipeline_parallel: 3
|
||||||
gpu_memory_utilization: 0.6
|
gpu_memory_utilization: 0.6
|
||||||
max_model_len: 262144
|
max_model_len: 262144
|
||||||
max_num_batched_tokens: 4176
|
max_num_batched_tokens: 4176
|
||||||
|
|||||||
Reference in New Issue
Block a user