Support fake perfectly balanced EP dispatch algorithm (#6571)

This commit is contained in:
fzyzcjy
2025-05-26 13:35:51 +08:00
committed by GitHub
parent 2c3a6fe1de
commit 0ca1811715
3 changed files with 24 additions and 2 deletions

View File

@@ -172,7 +172,7 @@ class ServerArgs:
enable_deepep_moe: bool = False
deepep_mode: Optional[Literal["auto", "normal", "low_latency"]] = "auto"
ep_num_redundant_experts: int = 0
-ep_dispatch_algorithm: Optional[Literal["static", "dynamic"]] = None
+ep_dispatch_algorithm: Optional[Literal["static", "dynamic", "fake"]] = None
init_expert_location: str = "trivial"
enable_eplb: bool = False
eplb_rebalance_num_iterations: int = 1000