From ac49dac009463ec4d88110ee74cb0ca551b997fb Mon Sep 17 00:00:00 2001 From: JieXin Liang Date: Fri, 4 Jul 2025 00:25:32 +0800 Subject: [PATCH] [fix] fix dsv3_router_gemm filter (#7750) --- python/sglang/srt/models/deepseek_v2.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/python/sglang/srt/models/deepseek_v2.py b/python/sglang/srt/models/deepseek_v2.py index 73b4271f4..d969baf3c 100644 --- a/python/sglang/srt/models/deepseek_v2.py +++ b/python/sglang/srt/models/deepseek_v2.py @@ -233,7 +233,8 @@ class MoEGate(nn.Module): ) if ( - hidden_states.shape[0] < 4 + _is_cuda + and hidden_states.shape[0] < 4 and hidden_states.shape[1] == 7168 and self.weight.shape[0] == 256 and _device_sm >= 90