use vllm profile
This commit is contained in:
@@ -59,7 +59,7 @@ spec:
|
||||
storage:
|
||||
nimCache:
|
||||
name: qwen36-27b-fp8
|
||||
profile: tensorrt_llm
|
||||
profile: vllm
|
||||
replicas: 1
|
||||
resources:
|
||||
limits:
|
||||
|
||||
Reference in New Issue
Block a user