Fix GPU memory utilization: lower --gpu-memory-utilization from 0.90 to 0.85

This commit is contained in:
2026-05-08 09:42:50 -05:00
parent 2f922279ef
commit b70f8063a8

View File

@@ -45,7 +45,7 @@ spec:
- --served-model-name
- Qwen/Qwen3.6-27B-FP8
- --gpu-memory-utilization
- "0.90"
- "0.85"
- --max-model-len
- "256000"
- --language-model-only