Fix prefill OOM error in the case of large page size (#5081)

This commit is contained in:
Zhiqiang Xie
2025-05-05 16:02:55 -07:00
committed by GitHub
parent 683707c314
commit f8e460930a
3 changed files with 11 additions and 2 deletions

View File

@@ -502,6 +502,7 @@ class Scheduler(
self.tree_cache = ChunkCache(
req_to_token_pool=self.req_to_token_pool,
token_to_kv_pool_allocator=self.token_to_kv_pool_allocator,
page_size=self.page_size,
)
else:
if self.enable_hierarchical_cache: