[MoE] fix: incorrect weight initialization for cutlass_fused_experts_fp8 (#10144)

This commit is contained in:
Cheng Wan
2025-09-07 19:43:59 -07:00
committed by GitHub
parent 33467c05a4
commit 5a7e10fe4c

View File

@@ -656,7 +656,7 @@ class Fp8MoEMethod(FusedMoEMethodBase):
)
self.c_strides2 = torch.full(
(num_experts,),
- intermediate_size_per_partition,
+ hidden_size,
device=w2_weight.device,
dtype=torch.int64,
)