[fix] Reset OffloadEngine state to prevent request-to-request contamination.

This commit is contained in:
Zijie Tian
2026-01-19 00:55:26 +08:00
parent e6e0dc5d7d
commit 50520a6c3c
4 changed files with 76 additions and 3 deletions

View File

@@ -231,6 +231,11 @@ class HybridKVCacheManager(KVCacheManager):
seq.num_cached_tokens = 0
seq.block_table.clear()
# Reset OffloadEngine state to prevent request-to-request contamination
# This clears all KV buffers and pending async events
if self.offload_engine is not None:
self.offload_engine.reset()
def can_append(self, seq: Sequence) -> bool:
"""Check if we can append a token."""
need_new_block = (len(seq) % self._block_size == 1)