Unit test for Hierarchical Caching (#4486)

This commit is contained in:
Zhiqiang Xie
2025-03-17 17:45:00 -07:00
committed by GitHub
parent 9b81f9bd34
commit a98290aea3
7 changed files with 65 additions and 5 deletions

View File

@@ -445,6 +445,7 @@ class Scheduler(SchedulerOutputProcessorMixin):
token_to_kv_pool_allocator=self.token_to_kv_pool_allocator,
tp_cache_group=self.tp_worker.get_tp_cpu_group(),
page_size=self.page_size,
hicache_ratio=server_args.hicache_ratio,
)
else:
self.tree_cache = RadixCache(