use vllm profile

This commit is contained in:
2026-05-07 15:12:03 -05:00
parent 1177264fd2
commit 6491c6cebe

View File

@@ -59,7 +59,7 @@ spec:
storage:
nimCache:
name: qwen36-27b-fp8
profile: tensorrt_llm
profile: vllm
replicas: 1
resources:
limits: