fix crash of DeepSeek-V3 update_weights_from_disk (#8863)
Co-authored-by: parkeychen <parkeychen@tencent.com>
This commit is contained in:
@@ -358,8 +358,8 @@ class Fp8LinearMethod(LinearMethodBase):
|
||||
return
|
||||
else:
|
||||
weight, weight_scale = layer.weight.data, layer.weight_scale_inv.data
|
||||
layer.weight = Parameter(weight, requires_grad=False)
|
||||
layer.weight_scale_inv = Parameter(weight_scale, requires_grad=False)
|
||||
layer.weight.data = weight.data
|
||||
layer.weight_scale_inv.data = weight_scale.data
|
||||
else:
|
||||
layer.weight = Parameter(layer.weight.data, requires_grad=False)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user