Fix edge case for truncated (#1747)
This commit is contained in:
@@ -416,7 +416,7 @@ class Scheduler:
|
|||||||
)
|
)
|
||||||
|
|
||||||
# Truncate prompts that are too long
|
# Truncate prompts that are too long
|
||||||
if len(req.origin_input_ids) >= self.max_req_input_len:
|
if len(req.origin_input_ids) > self.max_req_input_len:
|
||||||
logger.warning(
|
logger.warning(
|
||||||
"Request length is longer than the KV cache pool size or "
|
"Request length is longer than the KV cache pool size or "
|
||||||
"the max context length. Truncated!!!"
|
"the max context length. Truncated!!!"
|
||||||
|
|||||||
Reference in New Issue
Block a user