use fp32 for e_score_correction_bias in GLM-4.5 (#8729)
This commit is contained in:
@@ -343,7 +343,7 @@ class Glm4MoeGate(nn.Module):
     torch.empty((config.n_routed_experts, config.hidden_size))
 )
 self.e_score_correction_bias = nn.Parameter(
-    torch.empty((config.n_routed_experts))
+    torch.empty((config.n_routed_experts), dtype=torch.float32)
 )
 if _is_cpu and _is_cpu_amx_available:
     self.quant_method = PackWeightMethod(weight_names=["weight"])
Reference in New Issue
Block a user