From 6ed4e3b8fb8b264d38378ddff49b185a56e1e810 Mon Sep 17 00:00:00 2001
From: Liangsheng Yin
Date: Wed, 7 Aug 2024 22:28:42 -0700
Subject: [PATCH] Fix chunked prefill (#984)

---
 python/sglang/srt/mem_cache/chunk_cache.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/python/sglang/srt/mem_cache/chunk_cache.py b/python/sglang/srt/mem_cache/chunk_cache.py
index 7e3b39450..100cbbaec 100644
--- a/python/sglang/srt/mem_cache/chunk_cache.py
+++ b/python/sglang/srt/mem_cache/chunk_cache.py
@@ -56,7 +56,8 @@ class ChunkCache(BasePrefixCache):
 
         entry = self.entries[req.rid]
         entry.value = kv_indices
-        return kv_indices, entry
+        req.prefix_indices = kv_indices
+        req.last_node = entry
 
     def insert(self):
         raise NotImplementedError