[MoE] fix: incorrect weight initialization for cutlass_fused_experts_fp8 (#10144)
This commit is contained in:
@@ -656,7 +656,7 @@ class Fp8MoEMethod(FusedMoEMethodBase):
 )
 self.c_strides2 = torch.full(
 (num_experts,),
-intermediate_size_per_partition,
+hidden_size,
 device=w2_weight.device,
 dtype=torch.int64,
 )
Reference in New Issue
Block a user