Update cutlass_moe.py (#8535)
This commit is contained in:
@@ -209,7 +209,8 @@ def cutlass_fused_experts_fp8(
|
|||||||
)
|
)
|
||||||
|
|
||||||
result = torch.empty((m, k), device=device, dtype=out_dtype)
|
result = torch.empty((m, k), device=device, dtype=out_dtype)
|
||||||
return apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
|
apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
|
||||||
|
return result
|
||||||
|
|
||||||
|
|
||||||
FLOAT4_E2M1_MAX = 6.0
|
FLOAT4_E2M1_MAX = 6.0
|
||||||
|
|||||||
Reference in New Issue
Block a user