From cc4a80caf6048128168715115bbae41848a4150c Mon Sep 17 00:00:00 2001
From: ybyang <10629930+whybeyoung@users.noreply.github.com>
Date: Wed, 30 Apr 2025 10:38:54 +0800
Subject: [PATCH] [PD] Fix Assertion failed: /DeepEP/csrc/kernels/internode.cu:483, condition: ibgda_get_state()->num_rc_per_pe >= num_channels #134 (#5830)

---
 python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py b/python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py
index 1f27b3393..f273c55cb 100644
--- a/python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py
+++ b/python/sglang/srt/layers/moe/ep_moe/token_dispatcher.py
@@ -84,9 +84,7 @@ class DeepEPBuffer:
             num_nvl_bytes,
             num_rdma_bytes,
             low_latency_mode=deepep_mode.enable_low_latency(),
-            num_qps_per_rank=(
-                num_experts // group.size() if deepep_mode.enable_low_latency() else 1
-            ),
+            num_qps_per_rank=(max(num_experts // group.size(), Buffer.num_sms // 2)),
         )
         return cls._buffer
 