Fix deepseek awq v3 (#3450)
This commit is contained in:
@@ -298,7 +298,9 @@ class FusedMoE(torch.nn.Module):
|
||||
layer=self,
|
||||
num_experts=num_experts,
|
||||
hidden_size=hidden_size,
|
||||
# FIXME: figure out which intermediate_size to use
|
||||
intermediate_size=self.intermediate_size_per_partition,
|
||||
intermediate_size_per_partition=self.intermediate_size_per_partition,
|
||||
params_dtype=params_dtype,
|
||||
weight_loader=self.weight_loader,
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user