Fix AMD speculative decoding (#7252)

This commit is contained in:
Lianmin Zheng
2025-06-16 17:01:33 -07:00
committed by GitHub
parent 873ae12cee
commit 1a9c2c9214

View File

@@ -27,14 +27,14 @@ from sglang.srt.utils import is_cuda, is_hip, next_power_of_2
 if is_cuda():
     from sgl_kernel import (
+        fast_topk,
         top_k_renorm_prob,
         top_p_renorm_prob,
         tree_speculative_sampling_target_only,
         verify_tree_greedy,
     )
-    from sgl_kernel.top_k import fast_topk
 elif is_hip():
-    from sgl_kernel import verify_tree_greedy
+    from sgl_kernel import fast_topk, verify_tree_greedy
 logger = logging.getLogger(__name__)