Fix a bug in schedule_policy (#6276)
This commit is contained in:
@@ -468,6 +468,9 @@ class PrefillAdder:
|
|||||||
return AddReqResult.OTHER
|
return AddReqResult.OTHER
|
||||||
|
|
||||||
with self._lock_node(req.last_node):
|
with self._lock_node(req.last_node):
|
||||||
|
if total_tokens > self.rem_total_tokens:
|
||||||
|
return AddReqResult.NO_TOKEN
|
||||||
|
|
||||||
if (
|
if (
|
||||||
enable_hierarchical_cache
|
enable_hierarchical_cache
|
||||||
and req.last_node_global is not None
|
and req.last_node_global is not None
|
||||||
|
|||||||
Reference in New Issue
Block a user