minor: update correct measurement unit (#2406)

This commit is contained in:
Yineng Zhang
2024-12-08 20:55:04 +08:00
committed by GitHub
parent cc858953a0
commit 67470bbb28

View File

@@ -125,7 +125,7 @@ class TestBenchServing(unittest.TestCase):
if is_in_ci():
write_github_step_summary(
f"### test_online_latency_default\n"
f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} token/s\n'
f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} ms\n'
)
self.assertLess(res["median_e2e_latency_ms"], 12000)
self.assertLess(res["median_ttft_ms"], 86)