minor refactor: move check server args to server_args.py (#774)

This commit is contained in:
Mingyi
2024-07-27 19:03:40 -07:00
committed by GitHub
parent bbc07c4197
commit e4db4e5ba5
2 changed files with 10 additions and 2 deletions

View File

@@ -176,6 +176,8 @@ def launch_server(
model_overide_args: Optional[dict] = None,
pipe_finish_writer: Optional[mp.connection.Connection] = None,
):
"""Launch an HTTP server."""
# Run the server-argument checks right away. This call has to come after the
# docstring: a string literal is only treated as the function's docstring
# when it is the first statement in the body.
server_args.check_server_args()
global tokenizer_manager
@@ -230,8 +232,6 @@ def launch_server(
# Handle multi-node tensor parallelism
if server_args.nnodes > 1:
assert server_args.dp_size == 1, "Multi-node dp is not supported."
if server_args.node_rank != 0:
tp_size_local = server_args.tp_size // server_args.nnodes
gpu_ids = [