set cache reuse to 1
This commit is contained in:
@@ -46,7 +46,7 @@ spec:
|
||||
- name: NIM_MAX_MODEL_LEN
|
||||
value: "32768"
|
||||
- name: NIM_ENABLE_KV_CACHE_REUSE
|
||||
-  value: "true"
|
||||
+  value: "1"
|
||||
image:
|
||||
repository: nvcr.io/nim/qwen/qwen3-32b-dgx-spark
|
||||
tag: "1.1.0-variant"
|
||||
|
||||
Reference in New Issue
Block a user