Update python API of activation, topk, norm and rope and remove vllm dependency (#6614)

Co-authored-by: Wu, Chunyuan <chunyuan.wu@intel.com> Co-authored-by: jianan-gu <jianan.gu@intel.com> Co-authored-by: sdp <sdp@gnr799219.jf.intel.com>
2025-06-18 13:11:50 +08:00
parent e56685ac1b
commit 094c116f7d
23 changed files with 270 additions and 56 deletions
--- a/test/srt/cpu/test_topk.py
+++ b/test/srt/cpu/test_topk.py
@@ -8,8 +8,8 @@ from utils import precision
 from sglang.srt.layers.moe.topk import (
    biased_grouped_topk_impl as native_biased_grouped_topk,
 )
-from sglang.srt.layers.moe.topk import fused_topk_native as native_fused_topk
-from sglang.srt.layers.moe.topk import grouped_topk as native_grouped_topk
+from sglang.srt.layers.moe.topk import fused_topk_torch_native as native_fused_topk
+from sglang.srt.layers.moe.topk import grouped_topk_gpu as native_grouped_topk
 from sglang.srt.models.llama4 import Llama4MoE
 from sglang.test.test_utils import CustomTestCase