Fix AMD speculative decoding (#7252)

This commit is contained in:
Lianmin Zheng
2025-06-16 17:01:33 -07:00
committed by GitHub
parent 873ae12cee
commit 1a9c2c9214

View File

@@ -27,14 +27,14 @@ from sglang.srt.utils import is_cuda, is_hip, next_power_of_2
 if is_cuda():
     from sgl_kernel import (
+        fast_topk,
         top_k_renorm_prob,
         top_p_renorm_prob,
         tree_speculative_sampling_target_only,
         verify_tree_greedy,
     )
-    from sgl_kernel.top_k import fast_topk
 elif is_hip():
-    from sgl_kernel import verify_tree_greedy
+    from sgl_kernel import fast_topk, verify_tree_greedy
 logger = logging.getLogger(__name__)