Fix crash in DeepSeek-V3 update_weights_from_disk (#8863)

Co-authored-by: parkeychen <parkeychen@tencent.com>
This commit is contained in:
scut-cbq
2025-09-16 09:45:15 +08:00
committed by GitHub
parent 35ef3f2902
commit a220c14f81

View File

@@ -358,8 +358,8 @@ class Fp8LinearMethod(LinearMethodBase):
return
else:
weight, weight_scale = layer.weight.data, layer.weight_scale_inv.data
-layer.weight = Parameter(weight, requires_grad=False)
-layer.weight_scale_inv = Parameter(weight_scale, requires_grad=False)
+layer.weight.data = weight.data
+layer.weight_scale_inv.data = weight_scale.data
else:
layer.weight = Parameter(layer.weight.data, requires_grad=False)