From 1a9c2c92149a7aee42efcfc382fa6aefd8a52f04 Mon Sep 17 00:00:00 2001 From: Lianmin Zheng Date: Mon, 16 Jun 2025 17:01:33 -0700 Subject: [PATCH] Fix AMD speculative decoding (#7252) --- python/sglang/srt/speculative/eagle_utils.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/python/sglang/srt/speculative/eagle_utils.py b/python/sglang/srt/speculative/eagle_utils.py index 2657d8351..171a0327e 100644 --- a/python/sglang/srt/speculative/eagle_utils.py +++ b/python/sglang/srt/speculative/eagle_utils.py @@ -27,14 +27,14 @@ from sglang.srt.utils import is_cuda, is_hip, next_power_of_2 if is_cuda(): from sgl_kernel import ( + fast_topk, top_k_renorm_prob, top_p_renorm_prob, tree_speculative_sampling_target_only, verify_tree_greedy, ) - from sgl_kernel.top_k import fast_topk elif is_hip(): - from sgl_kernel import verify_tree_greedy + from sgl_kernel import fast_topk, verify_tree_greedy logger = logging.getLogger(__name__)