Fix crash in DeepSeek-V3 update_weights_from_disk (#8863)
Co-authored-by: parkeychen <parkeychen@tencent.com>
This commit is contained in:
@@ -358,8 +358,8 @@ class Fp8LinearMethod(LinearMethodBase):
|
|||||||
return
|
return
|
||||||
else:
|
else:
|
||||||
weight, weight_scale = layer.weight.data, layer.weight_scale_inv.data
|
weight, weight_scale = layer.weight.data, layer.weight_scale_inv.data
|
||||||
layer.weight = Parameter(weight, requires_grad=False)
|
layer.weight.data = weight.data
|
||||||
layer.weight_scale_inv = Parameter(weight_scale, requires_grad=False)
|
layer.weight_scale_inv.data = weight_scale.data
|
||||||
else:
|
else:
|
||||||
layer.weight = Parameter(layer.weight.data, requires_grad=False)
|
layer.weight = Parameter(layer.weight.data, requires_grad=False)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user