[PD]: Support Multi Prefill in one node (#5704)

Co-authored-by: shuaills <shishuaiuoe@gmail.com>
This commit is contained in:
IAN
2025-04-26 00:30:47 +08:00
committed by GitHub
parent 50eda8398e
commit 11e27d0926
6 changed files with 55 additions and 9 deletions

View File

@@ -791,6 +791,7 @@ class Scheduler(
return_hidden_states=recv_req.return_hidden_states,
eos_token_ids=self.model_config.hf_eos_token_id,
bootstrap_host=recv_req.bootstrap_host,
bootstrap_port=recv_req.bootstrap_port,
bootstrap_room=recv_req.bootstrap_room,
)
req.tokenizer = self.tokenizer