Fix a bug in schedule_policy (#6276)

This commit is contained in:
Ying Sheng
2025-05-13 18:04:00 -07:00
committed by GitHub
parent 912788c095
commit fb71725c98

View File

@@ -468,6 +468,9 @@ class PrefillAdder:
return AddReqResult.OTHER
with self._lock_node(req.last_node):
if total_tokens > self.rem_total_tokens:
return AddReqResult.NO_TOKEN
if (
enable_hierarchical_cache
and req.last_node_global is not None