[PD] Optimize transfer queue forward logic for dummy rank (#6922)
Signed-off-by: Shangming Cai <caishangming@linux.alibaba.com>
This commit is contained in:
@@ -562,6 +562,12 @@ class MooncakeKVManager(BaseKVManager):
|
|||||||
)
|
)
|
||||||
return
|
return
|
||||||
|
|
||||||
|
if bootstrap_room not in self.transfer_infos:
|
||||||
|
# This means that the current rank is a dummy rank for this request,
|
||||||
|
# and it has already been marked as success, so there is no need to
|
||||||
|
# add further chunks into the transfer queue.
|
||||||
|
return
|
||||||
|
|
||||||
# NOTE(shangming): sharding according to the dst_infos to make sure
|
# NOTE(shangming): sharding according to the dst_infos to make sure
|
||||||
# requests with the same dst_sessions will be added into the same
|
# requests with the same dst_sessions will be added into the same
|
||||||
# queue, which enables early abort with failed sessions.
|
# queue, which enables early abort with failed sessions.
|
||||||
@@ -578,7 +584,6 @@ class MooncakeKVManager(BaseKVManager):
|
|||||||
prefill_aux_index=aux_index,
|
prefill_aux_index=aux_index,
|
||||||
)
|
)
|
||||||
)
|
)
|
||||||
self.update_status(bootstrap_room, KVPoll.WaitingForInput)
|
|
||||||
|
|
||||||
def check_status(self, bootstrap_room: int):
|
def check_status(self, bootstrap_room: int):
|
||||||
return self.request_status[bootstrap_room]
|
return self.request_status[bootstrap_room]
|
||||||
|
|||||||
Reference in New Issue
Block a user