use defaults

This commit is contained in:
2026-05-11 11:36:59 -05:00
parent db6efb188c
commit 2d2df4bb0a

View File

@@ -64,10 +64,6 @@ spec:
- --max-num-seqs
- "254" # ↑ Allow more concurrent sequences
- --enable-prefix-caching
- --dtype
- "float" # Shorthand for float32 (not FP8); FP8 comes from --quantization
- --quantization
- "fp8" # Explicit quantization backend
authSecret: hf-api-secret
storage:
sharedMemorySizeLimit: 64Gi