Fix chunked prefill (#984)

This commit is contained in:
Liangsheng Yin
2024-08-07 22:28:42 -07:00
committed by GitHub
parent 00023d622a
commit 6ed4e3b8fb

View File

@@ -56,7 +56,8 @@ class ChunkCache(BasePrefixCache):
entry = self.entries[req.rid]
entry.value = kv_indices
return kv_indices, entry
req.prefix_indices = kv_indices
req.last_node = entry
def insert(self):
    """Unsupported operation: every call raises ``NotImplementedError``.

    Raises:
        NotImplementedError: unconditionally.
    """
    raise NotImplementedError()