forked from EngineX-Cambricon/enginex-mlu370-vllm
testing dynamic register
This commit is contained in:
@@ -118,6 +118,7 @@ def replace_linear_class(
|
||||
bias=linear.bias is not None,
|
||||
quant_config=quant_config,
|
||||
prefix=prefix,
|
||||
return_bias=False, # Return tensor only, not (tensor, bias) tuple
|
||||
**vllm_linear_kwargs,
|
||||
)
|
||||
|
||||
|
||||
Reference in New Issue
Block a user