diff --git a/python/sglang/srt/server_args.py b/python/sglang/srt/server_args.py
index 32e13658e..f42afdf8d 100644
--- a/python/sglang/srt/server_args.py
+++ b/python/sglang/srt/server_args.py
@@ -264,6 +264,7 @@ class ServerArgs:
             help="How conservative the schedule policy is. A larger value means more conservative scheduling. Use a larger value if you see requests being retracted frequently.",
         )
         parser.add_argument(
+            "--tensor-parallel-size",
             "--tp-size",
             type=int,
             default=ServerArgs.tp_size,
@@ -318,6 +319,7 @@ class ServerArgs:
 
         # Data parallelism
         parser.add_argument(
+            "--data-parallel-size",
             "--dp-size",
             type=int,
             default=ServerArgs.dp_size,
@@ -413,6 +415,8 @@ class ServerArgs:
 
     @classmethod
     def from_cli_args(cls, args: argparse.Namespace):
+        args.tp_size = args.tensor_parallel_size
+        args.dp_size = args.data_parallel_size
         attrs = [attr.name for attr in dataclasses.fields(cls)]
         return cls(**{attr: getattr(args, attr) for attr in attrs})
 