Update bench_serving.py (#4454)

This commit is contained in:
Xu Song
2025-03-16 07:33:58 +08:00
committed by GitHub
parent 26c372c13c
commit 470b474075

View File

@@ -128,7 +128,7 @@ async def async_request_trt_llm(
timestamp = time.perf_counter()
# First token
if ttft == 0.0:
- ttft = time.perf_counter() - st
+ ttft = timestamp - st
output.ttft = ttft
# Decoding phase