diff --git a/python/sglang/srt/layers/moe/cutlass_moe.py b/python/sglang/srt/layers/moe/cutlass_moe.py
index 00b7adf77..2a5a5dccb 100755
--- a/python/sglang/srt/layers/moe/cutlass_moe.py
+++ b/python/sglang/srt/layers/moe/cutlass_moe.py
@@ -209,7 +209,8 @@ def cutlass_fused_experts_fp8(
     )
 
     result = torch.empty((m, k), device=device, dtype=out_dtype)
-    return apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+    apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+    return result
 
 
 FLOAT4_E2M1_MAX = 6.0