forked from EngineX-Cambricon/enginex-mlu370-vllm
testing dynamic register
This commit is contained in:
@@ -118,6 +118,7 @@ def replace_linear_class(
|
|||||||
bias=linear.bias is not None,
|
bias=linear.bias is not None,
|
||||||
quant_config=quant_config,
|
quant_config=quant_config,
|
||||||
prefix=prefix,
|
prefix=prefix,
|
||||||
|
return_bias=False, # Return tensor only, not (tensor, bias) tuple
|
||||||
**vllm_linear_kwargs,
|
**vllm_linear_kwargs,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user