[LongCat] Optimize zero_experts_compute_triton by changing mask (#10303)

2025-09-12 05:56:25 +08:00
parent 46ccbed2cd
commit c5d2b01cea
1 changed file with 1 addition and 1 deletion
--- a/python/sglang/srt/layers/moe/ep_moe/kernels.py
+++ b/python/sglang/srt/layers/moe/ep_moe/kernels.py
@@ -1416,7 +1416,7 @@ def zero_experts_compute_triton(
        zero_expert_scales[zero_expert_mask] = 0.0

    normal_expert_mask = expert_indices >= num_experts
-    expert_indices[normal_expert_mask] = 0
+    expert_indices[normal_expert_mask] = -1
    expert_scales[normal_expert_mask] = 0.0

    output = torch.zeros_like(hidden_states).to(hidden_states.device)