[Fix] fix retract error in eagle speculative decoding (#2711)
Co-authored-by: kavioyu <kavioyu@tencent.com>
This commit is contained in:
@@ -601,11 +601,11 @@ class EagleVerifyInput(SpecInfo):
             req.check_finished()
             if req.finished():
                 draft_input.has_finished = True
-                finished_extend_len[req.rid] = verified_len + 1
             else:
                 new_accept_index.append(accept_index[low : low + verified_len + 1])
                 unfinished_index.append(i)
             low += verified_len + 1
+            finished_extend_len[req.rid] = verified_len + 1
 
         if len(new_accept_index) > 0:
             new_accept_index = torch.cat(new_accept_index, dim=0)
Reference in New Issue
Block a user