diff --git a/vllm-v0.6.2/vllm/model_executor/models/transformers/utils.py b/vllm-v0.6.2/vllm/model_executor/models/transformers/utils.py index 54dd58f..abd2020 100644 --- a/vllm-v0.6.2/vllm/model_executor/models/transformers/utils.py +++ b/vllm-v0.6.2/vllm/model_executor/models/transformers/utils.py @@ -118,6 +118,7 @@ def replace_linear_class( bias=linear.bias is not None, quant_config=quant_config, prefix=prefix, + return_bias=False, # Return tensor only, not (tensor, bias) tuple **vllm_linear_kwargs, )