[5/N] MoE Refactor: Update MoE parallelism arguments (#8658)
This commit is contained in:
@@ -288,12 +288,14 @@ class _SinglePassGatherer(ABC):
|
||||
)
|
||||
|
||||
if server_args.expert_distribution_recorder_mode == "stat_approx":
|
||||
if server_args.enable_deepep_moe and (server_args.deepep_mode == "normal"):
|
||||
if server_args.moe_a2a_backend is not None and (
|
||||
server_args.deepep_mode == "normal"
|
||||
):
|
||||
return _DeepepNormalSinglePassGatherer(expert_location_metadata, rank)
|
||||
else:
|
||||
raise NotImplementedError
|
||||
|
||||
if server_args.enable_deepep_moe:
|
||||
if server_args.moe_a2a_backend is not None:
|
||||
if server_args.deepep_mode == "normal":
|
||||
return _SelectExpertsSinglePassGatherer(expert_location_metadata, rank)
|
||||
elif server_args.deepep_mode == "low_latency":
|
||||
|
||||
Reference in New Issue
Block a user