diff --git a/vllm_ascend/distributed/kv_transfer/kv_p2p/mooncake_connector.py b/vllm_ascend/distributed/kv_transfer/kv_p2p/mooncake_connector.py index 4c692e33..95d05fdc 100644 --- a/vllm_ascend/distributed/kv_transfer/kv_p2p/mooncake_connector.py +++ b/vllm_ascend/distributed/kv_transfer/kv_p2p/mooncake_connector.py @@ -442,7 +442,8 @@ class KVCacheRecvingThread(threading.Thread): finally: self._send_done_signal_to_free_remote_port(remote_request_id, remote_host, remote_port_send_num) if all_task_done: - self.task_tracker.update_done_task_count(request_id) + if len(req_meta["local_block_ids"]) > 0: + self.task_tracker.update_done_task_count(request_id) if request_id in self.proc_not_transfer_request: del self.proc_not_transfer_request[request_id] self.request_queue.task_done()