Improve benchmark scripts and error message printing (#2922)
This commit is contained in:
@@ -631,7 +631,8 @@ class Scheduler:
|
||||
if len(req.origin_input_ids) > self.max_req_input_len:
|
||||
logger.warning(
|
||||
"Request length is longer than the KV cache pool size or "
|
||||
"the max context length. Truncated!!!"
|
||||
"the max context length. Truncated. "
|
||||
f"{len(req.origin_input_ids)=}, {self.max_req_input_len=}."
|
||||
)
|
||||
req.origin_input_ids = req.origin_input_ids[: self.max_req_input_len]
|
||||
|
||||
|
||||
Reference in New Issue
Block a user