Optimize zero-copy meta retrieval (get) for the Mooncake store (#9857)

This commit is contained in:
huangtingwei
2025-09-01 18:27:56 +08:00
committed by GitHub
parent 16e56ea693
commit b361750a4a

View File

@@ -467,6 +467,7 @@ class MHATokenToKVPoolHost(HostKVCache):
ptr_list = []
key_list = []
kv_buffer_data_ptr = self.kv_buffer.data_ptr()
indices = indices.tolist()
v_offset = (
self.layer_num
* self.size
@@ -706,6 +707,7 @@ class MLATokenToKVPoolHost(HostKVCache):
ptr_list = []
key_list = []
kv_buffer_data_ptr = self.kv_buffer.data_ptr()
indices = indices.tolist()
for index in range(0, len(indices), self.page_size):
k_ptr = (
kv_buffer_data_ptr