From fb71725c98be000a1839c102e65de12ebf207a16 Mon Sep 17 00:00:00 2001 From: Ying Sheng Date: Tue, 13 May 2025 18:04:00 -0700 Subject: [PATCH] Fix a bug in schedule_policy (#6276) --- python/sglang/srt/managers/schedule_policy.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/python/sglang/srt/managers/schedule_policy.py b/python/sglang/srt/managers/schedule_policy.py index 777ecd343..3cd2be26b 100644 --- a/python/sglang/srt/managers/schedule_policy.py +++ b/python/sglang/srt/managers/schedule_policy.py @@ -468,6 +468,9 @@ class PrefillAdder: return AddReqResult.OTHER with self._lock_node(req.last_node): + if total_tokens > self.rem_total_tokens: + return AddReqResult.NO_TOKEN + if ( enable_hierarchical_cache and req.last_node_global is not None