[5/N] MoE Refactor: Update MoE parallelism arguments (#8658)

This commit is contained in:
Cheng Wan
2025-08-01 01:20:03 -07:00
committed by GitHub
parent c8d3a402c1
commit 6c88f6c8d9
38 changed files with 342 additions and 299 deletions

View File

@@ -27,7 +27,6 @@ class TestEpMoE(CustomTestCase):
"2",
"--ep-size",
"2",
"--enable-ep-moe",
],
)
@@ -75,7 +74,6 @@ class TestEpMoEFP8(CustomTestCase):
"2",
"--ep-size",
"2",
"--enable-ep-moe",
"--quantization",
"fp8",
],