fix list
This commit is contained in:
@@ -66,9 +66,9 @@ spec:
 - --enable-prefix-caching
 - --dtype
 - "float8" # Explicit FP8 encoding
---quantization
+- --quantization
 - "fbgemm-fp8" # Explicit quantization backend
---sv2-transformer-bindings # Skip SA checks (small speedup)
+- --sv2-transformer-bindings # Skip SA checks (small speedup)
 authSecret: hf-api-secret
 storage:
 sharedMemorySizeLimit: 64Gi
Reference in New Issue
Block a user