diff --git a/setup.py b/setup.py index 0ceb2e4..351efa1 100644 --- a/setup.py +++ b/setup.py @@ -364,7 +364,7 @@ setup( version=VERSION, author="vLLM-Ascend team", license="Apache 2.0", - description=("vLLM Ascend backend plugin"), + description="vLLM Ascend backend plugin", long_description=read_readme(), long_description_content_type="text/markdown", url="https://github.com/vllm-project/vllm-ascend", diff --git a/vllm_ascend/models/pangu_moe.py b/vllm_ascend/models/pangu_moe.py index bf0f948..1dfbcf8 100644 --- a/vllm_ascend/models/pangu_moe.py +++ b/vllm_ascend/models/pangu_moe.py @@ -122,7 +122,7 @@ class CustomMergedColumnParallelLinear(LinearBase): input_size=self.input_size, output_size=self.output_size, params_dtype=self.params_dtype, - weight_loader=(self.weight_loader)) + weight_loader=self.weight_loader) if bias: self.bias = Parameter( torch.empty(self.output_size_per_partition, @@ -227,7 +227,7 @@ class CustomRowParallelLinear(LinearBase): input_size=self.input_size, output_size=self.output_size, params_dtype=self.params_dtype, - weight_loader=(self.weight_loader)) + weight_loader=self.weight_loader) if not reduce_results and (bias and not skip_bias_add): raise ValueError("When not reduce the results, adding bias to the " "results can lead to incorrect results")