minor: update correct measurement unit (#2406)
This commit is contained in:
@@ -125,7 +125,7 @@ class TestBenchServing(unittest.TestCase):
|
|||||||
if is_in_ci():
|
if is_in_ci():
|
||||||
write_github_step_summary(
|
write_github_step_summary(
|
||||||
f"### test_online_latency_default\n"
|
f"### test_online_latency_default\n"
|
||||||
f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} token/s\n'
|
f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} ms\n'
|
||||||
)
|
)
|
||||||
self.assertLess(res["median_e2e_latency_ms"], 12000)
|
self.assertLess(res["median_e2e_latency_ms"], 12000)
|
||||||
self.assertLess(res["median_ttft_ms"], 86)
|
self.assertLess(res["median_ttft_ms"], 86)
|
||||||
|
|||||||
Reference in New Issue
Block a user