[bugfix] Fix typo in modelopt quant: 'FusedMoE' object has no attribute 'local_num_experts' (#8768)
This commit is contained in:
@@ -776,7 +776,7 @@ class ModelOptNvFp4FusedMoEMethod(FusedMoEMethodBase):
|
|||||||
# GEMM 1
|
# GEMM 1
|
||||||
w13_weight = ModelWeightParameter(
|
w13_weight = ModelWeightParameter(
|
||||||
data=torch.empty(
|
data=torch.empty(
|
||||||
layer.local_num_experts,
|
layer.num_local_experts,
|
||||||
2 * intermediate_size_per_partition,
|
2 * intermediate_size_per_partition,
|
||||||
# 2 fp4 items are packed in the input dimension
|
# 2 fp4 items are packed in the input dimension
|
||||||
hidden_size // 2,
|
hidden_size // 2,
|
||||||
|
|||||||
Reference in New Issue
Block a user