Fix wrong assert (#1028)

This commit is contained in:
Liangsheng Yin
2024-08-11 02:22:16 -07:00
committed by GitHub
parent a97df79124
commit fcc0f5ed99

View File

@@ -39,10 +39,12 @@ class ChunkCache(BasePrefixCache):
kv_indices = self.req_to_token_pool.req_to_token[
req.req_pool_idx, : len(token_ids)
]
assert req.rid in self.entries
self.req_to_token_pool.free(req.req_pool_idx)
self.token_to_kv_pool.free(kv_indices)
if req.rid in self.entries:
del self.entries[req.rid]
def cache_unfinished_req(self, req: "Req", token_ids=None):
if token_ids is None:
token_ids = req.fill_ids