diff --git a/python/sglang/srt/layers/moe/topk.py b/python/sglang/srt/layers/moe/topk.py index 3c6d9eae9..9cb6d6a0c 100644 --- a/python/sglang/srt/layers/moe/topk.py +++ b/python/sglang/srt/layers/moe/topk.py @@ -112,10 +112,11 @@ def fused_topk( topk_softmax( topk_weights, topk_ids, - gating_output.float(), + gating_output, renormalize, ) + topk_ids = topk_ids_logical_to_physical(topk_ids, expert_location_dispatch_info) _mask_topk_ids_padded_region(topk_ids, num_token_non_padded) return topk_weights, topk_ids