Support more options for usage in stream mode (#985)
Co-authored-by: Ying Sheng <sqy1415@gmail.com>
This commit is contained in:
@@ -217,7 +217,9 @@ class Req:
|
||||
return
|
||||
|
||||
if len(self.output_ids) >= self.sampling_params.max_new_tokens:
|
||||
self.finished_reason = FINISH_LENGTH(len(self.output_ids))
|
||||
self.finished_reason = FINISH_LENGTH(
|
||||
length=self.sampling_params.max_new_tokens
|
||||
)
|
||||
return
|
||||
|
||||
if (
|
||||
|
||||
Reference in New Issue
Block a user