Minor bugfix on benchmark serving (#1005)
This commit is contained in:
@@ -195,6 +195,7 @@ async def async_request_openai_completions(
|
||||
output.ttft = ttft
|
||||
|
||||
# Decoding phase
|
||||
else:
|
||||
output.itl.append(timestamp - most_recent_timestamp)
|
||||
|
||||
most_recent_timestamp = timestamp
|
||||
|
||||
Reference in New Issue
Block a user