Bug fix for metrics counter (#4660)
This commit is contained in:
@@ -878,6 +878,8 @@ class ScheduleBatch(ScheduleBatchDisaggregationDecodeMixin):
|
|||||||
# If req.input_embeds is already a list, append its content directly
|
# If req.input_embeds is already a list, append its content directly
|
||||||
input_embeds.extend(req.input_embeds) # Use extend to avoid nesting
|
input_embeds.extend(req.input_embeds) # Use extend to avoid nesting
|
||||||
|
|
||||||
|
if req.is_retracted:
|
||||||
|
req.already_computed = 0
|
||||||
req.cached_tokens += pre_len - req.already_computed
|
req.cached_tokens += pre_len - req.already_computed
|
||||||
req.already_computed = seq_len
|
req.already_computed = seq_len
|
||||||
req.is_retracted = False
|
req.is_retracted = False
|
||||||
|
|||||||
Reference in New Issue
Block a user