[5/N][refactor]add torchair rotary ops (#2559)

### What this PR does / why we need it?
Move the torchair-related rotary ops into the torchair directory to make the code clearer. As a next step, we'll remove all torchair-related code outside of the torchair rotary ops.

### Does this PR introduce _any_ user-facing change?
No

### How was this patch tested?
vLLM version: main
vLLM main: ab9f2cfd19

- vLLM version: v0.10.1.1
- vLLM main: 81eea3d348

Signed-off-by: hust17yixuan <303660421@qq.com>
2025-09-01 09:09:21 +08:00
parent 3a5fc5ee01
commit c2c97f3079
4 changed files with 725 additions and 7 deletions
--- a/vllm_ascend/torchair/utils.py
+++ b/vllm_ascend/torchair/utils.py
@@ -182,3 +182,18 @@ def torchair_quant_method_register():
        "W8A8_DYNAMIC"] = TorchairW8A8DYNAMICQuantizer
    SUPPORT_ASCEND_QUANTIZER_TYPE[
        "W4A8_DYNAMIC"] = TorchairW4A8DYNAMICQuantizer
+
+
+def torchair_ops_patch():
+    """Monkey-patch vLLM's rotary-embedding classes with torchair versions.
+
+    Rebinds ``__init__`` and ``forward_oot`` on ``RotaryEmbedding`` and
+    ``__init__`` and ``forward`` on ``DeepseekScalingRotaryEmbedding`` to the
+    functions imported from
+    ``vllm_ascend.torchair.ops.torchair_rotary_embedding``. The attributes
+    are assigned on the classes themselves; the function takes no arguments
+    and returns nothing.
+    """
+    # Both imports are function-local, so they execute when the patch is
+    # applied rather than when this module is imported.
+    from vllm.model_executor.layers.rotary_embedding import (
+        DeepseekScalingRotaryEmbedding, RotaryEmbedding)
+
+    from vllm_ascend.torchair.ops.torchair_rotary_embedding import (
+        deepseek_rope_init_func, native_rope_deepseek_forward,
+        qwen_rope_init_func, rope_forward)
+
+    # Swap the constructor and the ``forward_oot`` entry point of the base
+    # rotary embedding class.
+    RotaryEmbedding.__init__ = qwen_rope_init_func
+    RotaryEmbedding.forward_oot = rope_forward
+
+    # NOTE(review): the DeepSeek variant is patched via ``forward`` whereas
+    # the base class above is patched via ``forward_oot`` -- presumably
+    # intentional; confirm against the torchair rotary embedding module.
+    DeepseekScalingRotaryEmbedding.__init__ = deepseek_rope_init_func
+    DeepseekScalingRotaryEmbedding.forward = native_rope_deepseek_forward