From 880221bd3b3e56a4bc2268fe9a9f77f426accf6c Mon Sep 17 00:00:00 2001 From: fzyzcjy <5236035+fzyzcjy@users.noreply.github.com> Date: Sat, 12 Jul 2025 10:03:01 +0800 Subject: [PATCH] Revert "[PD Disaggregation] replace transfer with batch transfer for better performance (#7236)" (#7968) --- .../sglang/srt/disaggregation/mooncake/conn.py | 16 +++++++--------- 1 file changed, 7 insertions(+), 9 deletions(-) diff --git a/python/sglang/srt/disaggregation/mooncake/conn.py b/python/sglang/srt/disaggregation/mooncake/conn.py index db30d8c0d..d7bd308f1 100644 --- a/python/sglang/srt/disaggregation/mooncake/conn.py +++ b/python/sglang/srt/disaggregation/mooncake/conn.py @@ -270,19 +270,17 @@ class MooncakeKVManager(BaseKVManager): # Worker function for processing a single layer def process_layer(src_ptr: int, dst_ptr: int, item_len: int) -> int: - src_addr_list = [] - dst_addr_list = [] - length_list = [] for prefill_index, decode_index in zip(prefill_kv_blocks, dst_kv_blocks): src_addr = src_ptr + int(prefill_index[0]) * item_len dst_addr = dst_ptr + int(decode_index[0]) * item_len length = item_len * len(prefill_index) - src_addr_list.append(src_addr) - dst_addr_list.append(dst_addr) - length_list.append(length) - return self.engine.batch_transfer_sync( - mooncake_session_id, src_addr_list, dst_addr_list, length_list - ) + + status = self.engine.transfer_sync( + mooncake_session_id, src_addr, dst_addr, length + ) + if status != 0: + return status + return 0 futures = [ executor.submit(