Improve: Extract generation_manager from tokenizer_manager (#3115)

This commit is contained in:
fzyzcjy
2025-02-23 15:25:45 +08:00
committed by GitHub
parent 45205d88a0
commit 3f41b18455
3 changed files with 748 additions and 571 deletions

View File

@@ -463,5 +463,5 @@ def _launch_subprocesses(server_args: ServerArgs) -> Tuple[TokenizerManager, Dic
# Assume all schedulers have the same scheduler_info
scheduler_info = scheduler_infos[0]
-tokenizer_manager.max_req_input_len = scheduler_info["max_req_input_len"]
+tokenizer_manager.configure_max_req_input_len(scheduler_info["max_req_input_len"])
return tokenizer_manager, scheduler_info