Clean up server args (#8161)

This commit is contained in:
Lianmin Zheng
2025-07-19 11:32:52 -07:00
committed by GitHub
parent 1b427dae02
commit bb0e8a32b5
8 changed files with 389 additions and 343 deletions

View File

@@ -27,7 +27,7 @@ class TestTransformersFallbackEndpoint(CustomTestCase):
cls.model,
cls.base_url,
timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
-other_args=["--impl", "transformers"],
+other_args=["--model-impl", "transformers"],
)
cls.mmlu_lower_bound = 0.65
cls.gsm8k_lower_bound = 0.65
@@ -76,7 +76,7 @@ class TestTransformersFallbackTorchAO(TestTransformersFallbackEndpoint):
cls.base_url,
timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
other_args=[
-"--impl",
+"--model-impl",
"transformers",
"--torchao-config",
"int4wo-128",
@@ -127,7 +127,7 @@ class TestTransformersFallbackEngine(CustomTestCase):
tp_size=model_case.tp_size,
torch_dtype=model_case.torch_dtype,
model_type="generation",
-impl="transformers",
+model_impl="transformers",
trust_remote_code=model_case.trust_remote_code,
torchao_config=model_case.torchao_config,
) as srt_runner: