Fix fused MoE when routed_scaling_factor is None (#8709)
This commit is contained in:
@@ -280,7 +280,9 @@ class EPMoE(FusedMoE):
             m_max * self.start_expert_id,
             BLOCK_SIZE=512,
         )
-        return output * self.routed_scaling_factor
+        if self.routed_scaling_factor is not None:
+            output *= self.routed_scaling_factor
+        return output
 
 
 class DeepEPMoE(EPMoE):
Reference in New Issue
Block a user