Support both approximate and exact expert distribution collection (#6964)

This commit is contained in:
fzyzcjy
2025-06-10 11:56:17 +08:00
committed by GitHub
parent 6716b41786
commit f6ebba537a
4 changed files with 101 additions and 71 deletions

View File

@@ -182,7 +182,7 @@ class ServerArgs:
eplb_rebalance_num_iterations: int = 1000
eplb_rebalance_layers_per_chunk: Optional[int] = None
expert_distribution_recorder_mode: Optional[
-Literal["stat", "per_pass", "per_token"]
+Literal["stat", "stat_approx", "per_pass", "per_token"]
] = None
expert_distribution_recorder_buffer_size: Optional[int] = None
enable_expert_distribution_metrics: bool = False