From c5d2b01cea6cc9a9ad0450222c7a4f19f5487b3d Mon Sep 17 00:00:00 2001 From: zk-lover Date: Fri, 12 Sep 2025 05:56:25 +0800 Subject: [PATCH] [LongCat] Optimize zero_experts_compute_triton by changing mask (#10303) --- python/sglang/srt/layers/moe/ep_moe/kernels.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/layers/moe/ep_moe/kernels.py b/python/sglang/srt/layers/moe/ep_moe/kernels.py index bea38cc41..08660812d 100644 --- a/python/sglang/srt/layers/moe/ep_moe/kernels.py +++ b/python/sglang/srt/layers/moe/ep_moe/kernels.py @@ -1416,7 +1416,7 @@ def zero_experts_compute_triton( zero_expert_scales[zero_expert_mask] = 0.0 normal_expert_mask = expert_indices >= num_experts - expert_indices[normal_expert_mask] = 0 + expert_indices[normal_expert_mask] = -1 expert_scales[normal_expert_mask] = 0.0 output = torch.zeros_like(hidden_states).to(hidden_states.device)