Migrate XTorch operations to Kunlun operations (accelerating iteration) (#177)

Signed-off-by: dongxinyu03 <dongxinyu03@baidu.com>
2026-02-12 18:13:00 +08:00
parent 744719587e
commit bf9369f733
15 changed files with 125 additions and 119 deletions
--- a/vllm_kunlun/ops/attention/merge_attn_states.py
+++ b/vllm_kunlun/ops/attention/merge_attn_states.py
@@ -3,7 +3,7 @@
 from typing import Optional

 import torch
-import xtorch_ops
+import kunlun_ops
 from vllm.platforms import current_platform


@@ -16,7 +16,7 @@ def merge_attn_states(
    output_lse: Optional[torch.Tensor] = None,
 ) -> None:

-    return xtorch_ops.attention_merge_stage(
+    return kunlun_ops.attention_merge_stage(
        prefix_output,
        prefix_lse,
        suffix_output,