From 67470bbb28591cc2a82a4cda419cdf6664ce46d2 Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Sun, 8 Dec 2024 20:55:04 +0800 Subject: [PATCH] minor: update correct measurement unit (#2406) --- test/srt/test_bench_serving.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/test/srt/test_bench_serving.py b/test/srt/test_bench_serving.py index 34a7b6c9670..b882f12f9df 100644 --- a/test/srt/test_bench_serving.py +++ b/test/srt/test_bench_serving.py @@ -125,7 +125,7 @@ def test_online_latency_default(self): if is_in_ci(): write_github_step_summary( f"### test_online_latency_default\n" - f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} token/s\n' + f'median_e2e_latency_ms : {res["median_e2e_latency_ms"]:.2f} ms\n' ) self.assertLess(res["median_e2e_latency_ms"], 12000) self.assertLess(res["median_ttft_ms"], 86)