From 9f47d686e52158bbd3872ec8a6d96fbc5de69134 Mon Sep 17 00:00:00 2001
From: Liangsheng Yin
Date: Sun, 3 Aug 2025 12:42:01 +0800
Subject: [PATCH] Fix fused MoE when `routed_scaling_factor is None` (#8709)

---
 python/sglang/srt/layers/moe/ep_moe/layer.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/python/sglang/srt/layers/moe/ep_moe/layer.py b/python/sglang/srt/layers/moe/ep_moe/layer.py
index 88a74d458..66fbb36ea 100644
--- a/python/sglang/srt/layers/moe/ep_moe/layer.py
+++ b/python/sglang/srt/layers/moe/ep_moe/layer.py
@@ -280,7 +280,9 @@ class EPMoE(FusedMoE):
             m_max * self.start_expert_id,
             BLOCK_SIZE=512,
         )
-        return output * self.routed_scaling_factor
+        if self.routed_scaling_factor is not None:
+            output *= self.routed_scaling_factor
+        return output
 
 
 class DeepEPMoE(EPMoE):