Update cutlass_moe.py (#8535)

This commit is contained in:
Elfie Guo
2025-07-29 10:49:41 -07:00
committed by GitHub
parent 7a4309cc8a
commit 4d16c88b6e

View File

@@ -209,7 +209,8 @@ def cutlass_fused_experts_fp8(
)
result = torch.empty((m, k), device=device, dtype=out_dtype)
-return apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+return result
FLOAT4_E2M1_MAX = 6.0