Clean up server_args, triton cache manager (#8332)

This commit is contained in:
Lianmin Zheng
2025-07-25 14:14:51 -07:00
committed by GitHub
parent f8260f2539
commit ed2e313eb6
12 changed files with 128 additions and 204 deletions

View File

@@ -261,7 +261,7 @@ class TestMTP(CustomTestCase):
 "--enable-dp-lm-head",
 "--enable-deepep-moe",
 "--speculative-algo",
-"NEXTN",
+"EAGLE",
 "--speculative-draft",
 DEFAULT_MODEL_NAME_FOR_TEST_MLA_NEXTN,
 "--speculative-num-steps",
@@ -329,7 +329,7 @@ class TestMTPWithTBO(CustomTestCase):
 "--enable-deepep-moe",
 "--trust-remote-code",
 "--speculative-algorithm",
-"NEXTN",
+"EAGLE",
 "--speculative-num-steps",
 "2",
 "--speculative-eagle-topk",