Fix DeepEP error in Qwen 3 MoE models (#6673)

This commit is contained in:
fzyzcjy
2025-05-28 06:12:54 +08:00
committed by GitHub
parent 2103b80607
commit a564e001b5

View File

@@ -93,17 +93,20 @@ class DeepEPBuffer:
 ),
 num_rdma_bytes,
 )
+if deepep_mode == DeepEPMode.normal:
+num_qps_per_rank = DeepEPConfig.get_instance().num_sms // 2
+elif deepep_mode in [DeepEPMode.low_latency, DeepEPMode.auto]:
+num_qps_per_rank = num_experts // group.size()
+else:
+raise NotImplementedError
 cls._buffer = Buffer(
 group,
 num_nvl_bytes,
 num_rdma_bytes,
 low_latency_mode=deepep_mode.enable_low_latency(),
-num_qps_per_rank=(
-max(
-num_experts // group.size(),
-DeepEPConfig.get_instance().num_sms // 2,
-)
-),
+num_qps_per_rank=num_qps_per_rank,
 )
 return cls._buffer