set cache reuse to 1
This commit is contained in:
@@ -46,7 +46,7 @@ spec:
|
|||||||
- name: NIM_MAX_MODEL_LEN
|
- name: NIM_MAX_MODEL_LEN
|
||||||
value: "32768"
|
value: "32768"
|
||||||
- name: NIM_ENABLE_KV_CACHE_REUSE
|
- name: NIM_ENABLE_KV_CACHE_REUSE
|
||||||
value: "true"
|
value: "1"
|
||||||
image:
|
image:
|
||||||
repository: nvcr.io/nim/qwen/qwen3-32b-dgx-spark
|
repository: nvcr.io/nim/qwen/qwen3-32b-dgx-spark
|
||||||
tag: "1.1.0-variant"
|
tag: "1.1.0-variant"
|
||||||
|
|||||||
Reference in New Issue
Block a user