From 20c8119915ca5a8b933ae8194e55e8e8650396f2 Mon Sep 17 00:00:00 2001 From: Ke Bao Date: Sat, 8 Mar 2025 04:11:18 +0800 Subject: [PATCH] Fix eagle hang issue for max_new_tokens=1 (#4185) --- python/sglang/srt/managers/scheduler.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/python/sglang/srt/managers/scheduler.py b/python/sglang/srt/managers/scheduler.py index 05bc8d730..cb3a4b5de 100644 --- a/python/sglang/srt/managers/scheduler.py +++ b/python/sglang/srt/managers/scheduler.py @@ -957,7 +957,11 @@ class Scheduler: self.req_to_token_pool.free(self.chunked_req.req_pool_idx) self.batch_is_full = False + last_bs = self.last_batch.batch_size() self.last_batch.filter_batch() + if self.last_batch.batch_size() < last_bs: + self.batch_is_full = False + if not self.last_batch.is_empty(): if self.running_batch is None: self.running_batch = self.last_batch