[Fix] fix assertion error for chunked prefill when disabling cache (#2282)
This commit is contained in:
@@ -231,6 +231,9 @@ class PrefillAdder:
|
|||||||
break
|
break
|
||||||
self.req_states.insert(i, (tokens_left, tokens_occupied))
|
self.req_states.insert(i, (tokens_left, tokens_occupied))
|
||||||
|
|
||||||
|
if len(self.can_run_list) != 0:
|
||||||
|
return AddReqResult.OTHER
|
||||||
|
|
||||||
if self.req_states is None:
|
if self.req_states is None:
|
||||||
self.req_states = []
|
self.req_states = []
|
||||||
add_req_state(req)
|
add_req_state(req)
|
||||||
|
|||||||
Reference in New Issue
Block a user