Fix typo (`require_grad` → `requires_grad`) in python/sglang/srt/layers/quantization/fp8.py (#2655)
This commit is contained in:
@@ -280,9 +280,9 @@ class Fp8LinearMethod(LinearMethodBase):
|
|||||||
weight_scale=layer.weight_scale_inv,
|
weight_scale=layer.weight_scale_inv,
|
||||||
input_scale=None,
|
input_scale=None,
|
||||||
)
|
)
|
||||||
layer.weight = torch.nn.Parameter(weight, require_grad=False)
|
layer.weight = torch.nn.Parameter(weight, requires_grad=False)
|
||||||
layer.weight_scale_inv = torch.nn.Parameter(
|
layer.weight_scale_inv = torch.nn.Parameter(
|
||||||
weight_scale, require_grad=False
|
weight_scale, requires_grad=False
|
||||||
)
|
)
|
||||||
layer.input_scale = None
|
layer.input_scale = None
|
||||||
return
|
return
|
||||||
|
|||||||
Reference in New Issue
Block a user