From 226f832c0bf3086fb287e6bdb120ef53b88c5b46 Mon Sep 17 00:00:00 2001 From: fems14 <74094523+fems14@users.noreply.github.com> Date: Sat, 25 Oct 2025 14:20:09 +0800 Subject: [PATCH] [bugfix] correct _register function placement for mooncake (#3747) correct _register function placement for mooncake - vLLM version: v0.11.0rc3 - vLLM main: https://github.com/vllm-project/vllm/commit/17c540a993af88204ad1b78345c8a865cf58ce44 Signed-off-by: fems14 <1804143737@qq.com> --- .../distributed/mooncake/mooncake_engine.py | 20 +++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/vllm_ascend/distributed/mooncake/mooncake_engine.py b/vllm_ascend/distributed/mooncake/mooncake_engine.py index bff3f3e1..cc58877b 100644 --- a/vllm_ascend/distributed/mooncake/mooncake_engine.py +++ b/vllm_ascend/distributed/mooncake/mooncake_engine.py @@ -126,16 +126,6 @@ class MooncakeEngine: region_len = self.num_blocks * self.block_len[0] self._register(base_addr, region_len) - def _register(self, ptr, length): - logger.debug( - "Registering KV cache: ptr=0x%x, length=%d, num_blocks=%d, " - "block_lens=%s", ptr, length, self.num_blocks, self.block_len) - try: - self.m_store.register_buffer(ptr, length) - except Exception as e: - raise RuntimeError( - f"Mooncake memory registration failed. Error is: {e}") - if self.use_layerwise: self.get_event = threading.Event() if self.kv_role in ['kv_producer', 'kv_both']: @@ -170,6 +160,16 @@ class MooncakeEngine: self.kv_recv_thread.start() ready_event.wait() + def _register(self, ptr, length): + logger.debug( + "Registering KV cache: ptr=0x%x, length=%d, num_blocks=%d, " + "block_lens=%s", ptr, length, self.num_blocks, self.block_len) + try: + self.m_store.register_buffer(ptr, length) + except Exception as e: + raise RuntimeError( + f"Mooncake memory registration failed. Error is: {e}") + def start_load_kv(self, metadata: MooncakeConnectorMetadata): self.current_layer = 0 self.layerwise_retrievers = []