From c8d3a402c1ca5f581e3466c0b745af758aa6c691 Mon Sep 17 00:00:00 2001 From: Binyao Jiang Date: Fri, 1 Aug 2025 00:07:41 -0700 Subject: [PATCH] =?UTF-8?q?Bug:=20apply=20final=5Fhidden=5Fstates*=3Dself.?= =?UTF-8?q?routed=5Fscaling=5Ffactor=20at=20MoE=20lay=E2=80=A6=20(#8511)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: Cheng Wan <54331508+ch-wan@users.noreply.github.com> --- python/sglang/srt/layers/moe/ep_moe/layer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/layers/moe/ep_moe/layer.py b/python/sglang/srt/layers/moe/ep_moe/layer.py index 6f896e297..012a78f17 100644 --- a/python/sglang/srt/layers/moe/ep_moe/layer.py +++ b/python/sglang/srt/layers/moe/ep_moe/layer.py @@ -304,7 +304,7 @@ class EPMoE(FusedMoE): m_max * self.start_expert_id, BLOCK_SIZE=512, ) - return output + return output * self.routed_scaling_factor class DeepEPMoE(EPMoE):