use defaults

This commit is contained in:
2026-05-11 11:36:59 -05:00
parent db6efb188c
commit 2d2df4bb0a

View File

@@ -64,10 +64,6 @@ spec:
- --max-num-seqs - --max-num-seqs
- "254" # ↑ Allow more concurrent sequences - "254" # ↑ Allow more concurrent sequences
- --enable-prefix-caching - --enable-prefix-caching
- --dtype
- "float" # NOTE: as a vLLM --dtype value, "float" is an alias for float32 (FP32), not FP8 — confirm against the engine in use
- --quantization
- "fp8" # Explicit quantization backend
authSecret: hf-api-secret authSecret: hf-api-secret
storage: storage:
sharedMemorySizeLimit: 64Gi sharedMemorySizeLimit: 64Gi