Use cu128 for torch audio to fix some CI tests (#11251)

2025-10-05 19:52:32 -07:00
parent baee08601b
commit 366a603e95
3 changed files with 5 additions and 6 deletions
--- a/python/sglang/srt/speculative/spec_utils.py
+++ b/python/sglang/srt/speculative/spec_utils.py
@@ -15,7 +15,7 @@ from sglang.srt.managers.schedule_batch import Req
 from sglang.srt.utils import is_cuda, is_hip

 if is_cuda():
-    from sgl_kernel import fast_topk, tree_speculative_sampling_target_only
+    from sgl_kernel import fast_topk
 elif is_hip():
    from sgl_kernel import fast_topk

@@ -30,8 +30,7 @@ SIMULATE_ACC_LEN = envs.SGLANG_SIMULATE_ACC_LEN.get()  # turn off if < 0
 SIMULATE_ACC_METHOD = envs.SGLANG_SIMULATE_ACC_METHOD.get()

 TREE_TRAVERSE_TIME_THRESHOLD = 1  # TODO: set this properly
-
-TREE_SPEC_KERNEL_AVAILABLE = "tree_speculative_sampling_target_only" in globals()
+TREE_SPEC_KERNEL_AVAILABLE = is_cuda()  # The tree speculative sampling kernel is currently CUDA-only


@triton.jit