diff --git a/python/sglang/srt/managers/scheduler.py b/python/sglang/srt/managers/scheduler.py index 210a243a4..16f4196bd 100644 --- a/python/sglang/srt/managers/scheduler.py +++ b/python/sglang/srt/managers/scheduler.py @@ -416,7 +416,7 @@ class Scheduler: ) # Truncate prompts that are too long - if len(req.origin_input_ids) >= self.max_req_input_len: + if len(req.origin_input_ids) > self.max_req_input_len: logger.warning( "Request length is longer than the KV cache pool size or " "the max context length. Truncated!!!"