[Fix] fix assertion error for chunked prefill when disabling cache (#2282)

This commit is contained in:
Rui Wang
2024-12-01 09:53:43 +08:00
committed by GitHub
parent 883c955489
commit d622851dc9

View File

@@ -231,6 +231,9 @@ class PrefillAdder:
break
self.req_states.insert(i, (tokens_left, tokens_occupied))
if len(self.can_run_list) != 0:
return AddReqResult.OTHER
if self.req_states is None:
self.req_states = []
add_req_state(req)