diff --git a/vllm_ascend/torchair/utils.py b/vllm_ascend/torchair/utils.py index a9bbdae..8dd1e3f 100644 --- a/vllm_ascend/torchair/utils.py +++ b/vllm_ascend/torchair/utils.py @@ -185,15 +185,14 @@ def torchair_quant_method_register(): def torchair_ops_patch(): - from vllm.model_executor.layers.rotary_embedding import ( - DeepseekScalingRotaryEmbedding, RotaryEmbedding) - + from vllm_ascend.ops.rotary_embedding import ( + AscendDeepseekScalingRotaryEmbedding, AscendRotaryEmbedding) from vllm_ascend.torchair.ops.torchair_rotary_embedding import ( deepseek_rope_init_func, native_rope_deepseek_forward, qwen_rope_init_func, rope_forward) - RotaryEmbedding.__init__ = qwen_rope_init_func - RotaryEmbedding.forward_oot = rope_forward + AscendRotaryEmbedding.__init__ = qwen_rope_init_func # type: ignore[method-assign] + AscendRotaryEmbedding.forward_oot = rope_forward # type: ignore[method-assign] - DeepseekScalingRotaryEmbedding.__init__ = deepseek_rope_init_func - DeepseekScalingRotaryEmbedding.forward = native_rope_deepseek_forward + AscendDeepseekScalingRotaryEmbedding.__init__ = deepseek_rope_init_func # type: ignore[method-assign] + AscendDeepseekScalingRotaryEmbedding.forward = native_rope_deepseek_forward # type: ignore[method-assign]