Fix DeepEP error in Qwen 3 MoE models (#6673)

This commit is contained in:
fzyzcjy
2025-05-28 06:12:54 +08:00
committed by GitHub
parent 2103b80607
commit a564e001b5

View File

@@ -93,17 +93,20 @@ class DeepEPBuffer:
), ),
num_rdma_bytes, num_rdma_bytes,
) )
if deepep_mode == DeepEPMode.normal:
num_qps_per_rank = DeepEPConfig.get_instance().num_sms // 2
elif deepep_mode in [DeepEPMode.low_latency, DeepEPMode.auto]:
num_qps_per_rank = num_experts // group.size()
else:
raise NotImplementedError
cls._buffer = Buffer( cls._buffer = Buffer(
group, group,
num_nvl_bytes, num_nvl_bytes,
num_rdma_bytes, num_rdma_bytes,
low_latency_mode=deepep_mode.enable_low_latency(), low_latency_mode=deepep_mode.enable_low_latency(),
num_qps_per_rank=( num_qps_per_rank=num_qps_per_rank,
max(
num_experts // group.size(),
DeepEPConfig.get_instance().num_sms // 2,
)
),
) )
return cls._buffer return cls._buffer