Fix schedule bug (#1451)

This commit is contained in:
Liangsheng Yin
2024-09-17 22:59:32 -07:00
committed by GitHub
parent 36078fb247
commit 7c162fa9c5

View File

@@ -229,6 +229,7 @@ class PrefillAdder:
else:
add_req_state(req, insert_sort=True)
+cur_rem_tokens = self.cur_rem_tokens - len(req.origin_input_ids)
tokens_freed = 0
for i, (tokens_left, tokens_occupied) in enumerate(self.req_states):
decode_steps = (
@@ -237,7 +238,7 @@ class PrefillAdder:
else tokens_left
)
bs = len(self.req_states) - i
-if self.cur_rem_tokens + tokens_freed - decode_steps * bs <= 0:
+if cur_rem_tokens + tokens_freed - decode_steps * bs <= 0:
return False
tokens_freed += tokens_occupied