Support page-first layout zero-copy for Mooncake store (#8651)

Co-authored-by: Zhiqiang Xie <xiezhq@stanford.edu>
This commit is contained in:
huangtingwei
2025-08-13 06:59:26 +08:00
committed by GitHub
parent 924827c3de
commit 0edda32001
4 changed files with 39 additions and 39 deletions

View File

@@ -260,6 +260,7 @@ class HiCacheController:
self.storage_backend = MooncakeStore()
self.get_hash_str = get_hash_str_mooncake
self.storage_backend.register_buffer(self.mem_pool_host.kv_buffer)
assert self.mem_pool_host.layout == "page_first"
elif storage_backend == "hf3fs":
from sglang.srt.distributed import get_tensor_model_parallel_rank
from sglang.srt.mem_cache.storage.hf3fs.storage_hf3fs import (