15 lines
712 B
Diff
15 lines
712 B
Diff
diff --git a/vllm/v1/core/single_type_kv_cache_manager.py b/vllm/v1/core/single_type_kv_cache_manager.py
|
|
index 0b6b7ed42ac1..b6e0305a312d 100644
|
|
--- a/vllm/v1/core/single_type_kv_cache_manager.py
|
|
+++ b/vllm/v1/core/single_type_kv_cache_manager.py
|
|
@@ -1000,7 +1000,8 @@ def cache_blocks(self, request: Request, num_tokens: int) -> None:
|
|
for block in self.req_to_blocks[request.request_id][
|
|
num_cached_blocks_before:num_cached_blocks_after
|
|
]:
|
|
- assert block.block_hash is not None
|
|
+ if block.is_null:
|
|
+ continue
|
|
self.cached_blocks_this_step.add(block.block_hash)
|
|
|
|
def new_step_starts(self) -> None:
|