[Fix] Add speculative_draft_model_revision to server_args (#5255)

Signed-off-by: Devashish Lal <devashish@rivosinc.com>
This commit is contained in:
DevashishLal-CB
2025-09-05 04:45:46 -07:00
committed by GitHub
parent df97b31f37
commit 13705dae06
13 changed files with 68 additions and 45 deletions

View File

@@ -268,7 +268,7 @@ class TestMTP(CustomTestCase):
"deepep",
"--speculative-algo",
"EAGLE",
-"--speculative-draft",
+"--speculative-draft-model-path",
DEFAULT_MODEL_NAME_FOR_TEST_MLA_NEXTN,
"--speculative-num-steps",
"2",
@@ -343,7 +343,7 @@ class TestMTPWithTBO(CustomTestCase):
"3",
"--speculative-num-draft-tokens",
"3",
-"--speculative-draft",
+"--speculative-draft-model-path",
DEFAULT_MODEL_NAME_FOR_TEST_MLA_NEXTN,
"--chunked-prefill-size",
"256",