From e3f08c77bc8ec4bf78501305a5aa15a779ad9ff2 Mon Sep 17 00:00:00 2001
From: Elfie Guo <164945471+elfiegg@users.noreply.github.com>
Date: Tue, 29 Jul 2025 23:46:34 -0700
Subject: [PATCH] Update cutlass_moe.py (#8545)

---
 python/sglang/srt/layers/moe/cutlass_moe.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/sglang/srt/layers/moe/cutlass_moe.py b/python/sglang/srt/layers/moe/cutlass_moe.py
index 2a5a5dccb..3774afac2 100755
--- a/python/sglang/srt/layers/moe/cutlass_moe.py
+++ b/python/sglang/srt/layers/moe/cutlass_moe.py
@@ -209,7 +209,7 @@ def cutlass_fused_experts_fp8(
     )
 
     result = torch.empty((m, k), device=device, dtype=out_dtype)
-    apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+    apply_shuffle_mul_sum(c2, result, c_map, topk_weights.to(out_dtype))
     return result
 
 