Clean up server args (#8161)

This commit is contained in:
Lianmin Zheng
2025-07-19 11:32:52 -07:00
committed by GitHub
parent 1b427dae02
commit bb0e8a32b5
8 changed files with 389 additions and 343 deletions

View File

@@ -481,7 +481,7 @@ class SRTRunner:
torch_dtype: torch.dtype,
model_type: str,
tp_size: int = 1,
- impl: str = "auto",
+ model_impl: str = "auto",
port: int = DEFAULT_PORT_FOR_SRT_TEST_RUNNER,
lora_paths: List[str] = None,
max_loras_per_batch: int = 4,
@@ -525,7 +525,7 @@ class SRTRunner:
tp_size=tp_size,
dtype=get_dtype_str(torch_dtype),
port=port,
- impl=impl,
+ model_impl=model_impl,
torchao_config=torchao_config,
mem_fraction_static=mem_fraction_static,
trust_remote_code=trust_remote_code,