"...text-generation-inference.git" did not exist on "afc7ded84fbd50106847f84b68fdae6f6f17158c"
Unverified Commit 67470bbb authored by Yineng Zhang's avatar Yineng Zhang Committed by GitHub
Browse files

minor: update correct measurement unit (#2406)

parent cc858953
...@@ -125,7 +125,7 @@ class TestBenchServing(unittest.TestCase): ...@@ -125,7 +125,7 @@ class TestBenchServing(unittest.TestCase):
if is_in_ci(): if is_in_ci():
write_github_step_summary( write_github_step_summary(
f"### test_online_latency_default\n" f"### test_online_latency_default\n"
f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} token/s\n' f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} ms\n'
) )
self.assertLess(res["median_e2e_latency_ms"], 12000) self.assertLess(res["median_e2e_latency_ms"], 12000)
self.assertLess(res["median_ttft_ms"], 86) self.assertLess(res["median_ttft_ms"], 86)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment