From f67d1f45bcb6940444f66bfacb6e5fd14f9084fd Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Sun, 21 Sep 2025 17:43:50 -0700 Subject: [PATCH] [Auto Sync] Update deepseek_v2.py (20250922) (#10717) Co-authored-by: github-actions[bot] Co-authored-by: Michael Granado --- python/sglang/srt/models/deepseek_v2.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/models/deepseek_v2.py b/python/sglang/srt/models/deepseek_v2.py index 151b9e66e..91d0aa1a8 100644 --- a/python/sglang/srt/models/deepseek_v2.py +++ b/python/sglang/srt/models/deepseek_v2.py @@ -451,7 +451,7 @@ class MoEGate(nn.Module): _is_cuda and hidden_states.shape[0] <= 16 and hidden_states.shape[1] == 7168 - and self.weight.shape[0] == 256 + and (self.weight.shape[0] == 256 or self.weight.shape[0] == 384) and _device_sm >= 90 ): # router gemm output float32