Use cu128 for torch audio to fix some CI tests (#11251)
This commit is contained in:
@@ -15,7 +15,7 @@ from sglang.srt.managers.schedule_batch import Req
|
||||
from sglang.srt.utils import is_cuda, is_hip
|
||||
|
||||
if is_cuda():
|
||||
from sgl_kernel import fast_topk, tree_speculative_sampling_target_only
|
||||
from sgl_kernel import fast_topk
|
||||
elif is_hip():
|
||||
from sgl_kernel import fast_topk
|
||||
|
||||
@@ -30,8 +30,7 @@ SIMULATE_ACC_LEN = envs.SGLANG_SIMULATE_ACC_LEN.get() # turn off if < 0
|
||||
SIMULATE_ACC_METHOD = envs.SGLANG_SIMULATE_ACC_METHOD.get()
|
||||
|
||||
TREE_TRAVERSE_TIME_THRESHOLD = 1 # TODO: set this properly
|
||||
|
||||
TREE_SPEC_KERNEL_AVAILABLE = "tree_speculative_sampling_target_only" in globals()
|
||||
TREE_SPEC_KERNEL_AVAILABLE = is_cuda() # This kernel is only available for CUDA now
|
||||
|
||||
|
||||
@triton.jit
|
||||
|
||||
Reference in New Issue
Block a user