use defaults
This commit is contained in:
@@ -64,10 +64,6 @@ spec:
|
|||||||
- --max-num-seqs
|
- --max-num-seqs
|
||||||
- "254" # ↑ Allow more concurrent sequences
|
- "254" # ↑ Allow more concurrent sequences
|
||||||
- --enable-prefix-caching
|
- --enable-prefix-caching
|
||||||
- --dtype
|
|
||||||
- "float" # Explicit FP8 encoding
|
|
||||||
- --quantization
|
|
||||||
- "fp8" # Explicit quantization backend
|
|
||||||
authSecret: hf-api-secret
|
authSecret: hf-api-secret
|
||||||
storage:
|
storage:
|
||||||
sharedMemorySizeLimit: 64Gi
|
sharedMemorySizeLimit: 64Gi
|
||||||
|
|||||||
Reference in New Issue
Block a user