fix: update truss bench_serving (#5683)
This commit is contained in:
@@ -295,7 +295,7 @@ async def async_request_truss(
|
|||||||
# NOTE: Some completion API might have a last
|
# NOTE: Some completion API might have a last
|
||||||
# usage summary response without a token so we
|
# usage summary response without a token so we
|
||||||
# want to check a token was generated
|
# want to check a token was generated
|
||||||
if data["choices"][0]["delta"]["content"]:
|
if data["choices"][0]["text"]:
|
||||||
timestamp = time.perf_counter()
|
timestamp = time.perf_counter()
|
||||||
# First token
|
# First token
|
||||||
if ttft == 0.0:
|
if ttft == 0.0:
|
||||||
@@ -307,7 +307,7 @@ async def async_request_truss(
|
|||||||
output.itl.append(timestamp - most_recent_timestamp)
|
output.itl.append(timestamp - most_recent_timestamp)
|
||||||
|
|
||||||
most_recent_timestamp = timestamp
|
most_recent_timestamp = timestamp
|
||||||
generated_text += data["choices"][0]["delta"]["content"]
|
generated_text += data["choices"][0]["text"]
|
||||||
|
|
||||||
output.generated_text = generated_text
|
output.generated_text = generated_text
|
||||||
output.success = True
|
output.success = True
|
||||||
|
|||||||
Reference in New Issue
Block a user