Fix deepseek awq v3 (#3450)

This commit is contained in:
Liangsheng Yin
2025-02-12 22:09:52 +08:00
committed by GitHub
parent 8adbc78b30
commit 8616357a97
4 changed files with 69 additions and 10 deletions

View File

@@ -298,7 +298,9 @@ class FusedMoE(torch.nn.Module):
layer=self,
num_experts=num_experts,
hidden_size=hidden_size,
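# FIXME: decide whether the callee needs the full intermediate size or the per-partition size; for now the per-partition value is passed under both keyword names.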
intermediate_size=self.intermediate_size_per_partition,
intermediate_size_per_partition=self.intermediate_size_per_partition,
params_dtype=params_dtype,
weight_loader=self.weight_loader,
)