[server] Passing model_override_args to launch_server via the CLI. (#1298)

Signed-off-by: Kai-Hsun Chen <kaihsun@anyscale.com>
This commit is contained in:
Kai-Hsun Chen
2024-09-09 02:14:25 -07:00
committed by GitHub
parent 662ecd9368
commit c9b75917d5
8 changed files with 71 additions and 16 deletions

View File

@@ -1,20 +1,18 @@
"""Launch the inference server."""
import argparse
import os
import sys
from sglang.srt.server import launch_server
from sglang.srt.server_args import ServerArgs
from sglang.srt.server_args import prepare_server_args
from sglang.srt.utils import kill_child_process
if __name__ == "__main__":
parser = argparse.ArgumentParser()
ServerArgs.add_cli_args(parser)
args = parser.parse_args()
server_args = ServerArgs.from_cli_args(args)
server_args = prepare_server_args(sys.argv[1:])
model_override_args = server_args.json_model_override_args
try:
launch_server(server_args)
launch_server(server_args, model_override_args=model_override_args)
except Exception as e:
raise e
finally: