"vscode:/vscode.git/clone" did not exist on "293bfae37ec057d6fc6df26703cf3ebd9ff9dcb9"
Unverified Commit 132dad87, authored by shangmingc, committed by GitHub
Browse files

[PD] Optimize transfer queue forward logic for dummy rank (#6922)


Signed-off-by: Shangming Cai <caishangming@linux.alibaba.com>
parent 60fdad7c
...@@ -562,6 +562,12 @@ class MooncakeKVManager(BaseKVManager): ...@@ -562,6 +562,12 @@ class MooncakeKVManager(BaseKVManager):
) )
return return
if bootstrap_room not in self.transfer_infos:
# This means that the current rank is a dummy rank for this request,
# and it has already been marked as success, so there is no need to
# add further chunks into the transfer queue.
return
# NOTE(shangming): sharding according to the dst_infos to make sure # NOTE(shangming): sharding according to the dst_infos to make sure
# requests with the same dst_sessions will be added into the same # requests with the same dst_sessions will be added into the same
# queue, which enables early abort with failed sessions. # queue, which enables early abort with failed sessions.
...@@ -578,7 +584,6 @@ class MooncakeKVManager(BaseKVManager): ...@@ -578,7 +584,6 @@ class MooncakeKVManager(BaseKVManager):
prefill_aux_index=aux_index, prefill_aux_index=aux_index,
) )
) )
self.update_status(bootstrap_room, KVPoll.WaitingForInput)
def check_status(self, bootstrap_room: int): def check_status(self, bootstrap_room: int):
return self.request_status[bootstrap_room] return self.request_status[bootstrap_room]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment