[Fix] Fix retract error in EAGLE speculative decoding (#2711)

Co-authored-by: kavioyu <kavioyu@tencent.com>
This commit is contained in:
yukavio
2025-01-03 02:28:39 +08:00
committed by GitHub
parent 1775b963db
commit 8c8779cd05

View File

@@ -601,11 +601,11 @@ class EagleVerifyInput(SpecInfo):
req.check_finished()
if req.finished():
draft_input.has_finished = True
finished_extend_len[req.rid] = verified_len + 1
else:
new_accept_index.append(accept_index[low : low + verified_len + 1])
unfinished_index.append(i)
low += verified_len + 1
finished_extend_len[req.rid] = verified_len + 1
if len(new_accept_index) > 0:
new_accept_index = torch.cat(new_accept_index, dim=0)