Replace time.time() with time.perf_counter() for benchmarking. (#6178)

Signed-off-by: Lifu Huang <lifu.hlf@gmail.com>
This commit is contained in:
Lifu Huang
2025-05-11 14:32:49 -07:00
committed by GitHub
parent e9a47f4cb5
commit 6e2da51561
61 changed files with 158 additions and 158 deletions

View File

@@ -66,7 +66,7 @@ def main(args):
answers[i] = cur_answers
# Run requests
tic = time.time()
tic = time.perf_counter()
if args.parallel == 1:
for i in tqdm(range(len(questions))):
get_answer(i)
@@ -79,7 +79,7 @@ def main(args):
)
)
latency = time.time() - tic
latency = time.perf_counter() - tic
print(f"#questions: {len(questions)}, Latency: {latency:.2f}")

View File

@@ -57,7 +57,7 @@ def main(args):
sgl.set_default_backend(backend)
# Run requests
tic = time.time()
tic = time.perf_counter()
rets = answer_mt_bench.run_batch(
arguments,
temperature=0,
@@ -66,7 +66,7 @@ def main(args):
progress_bar=True,
)
answers = [[s["answer_1"], s["answer_2"]] for s in rets]
latency = time.time() - tic
latency = time.perf_counter() - tic
print(f"#questions: {len(questions)}, Latency: {latency:.2f}")

View File

@@ -68,7 +68,7 @@ def main(args):
sgl.set_default_backend(backend)
# Run requests
tic = time.time()
tic = time.perf_counter()
rets = answer_mt_bench.run_batch(
arguments,
temperature=0,
@@ -78,7 +78,7 @@ def main(args):
)
answers = [[s["answer_1"], s["answer_2"]] for s in rets]
latency = time.time() - tic
latency = time.perf_counter() - tic
num_output_tokens = sum(
s.get_meta_info("answer_1")["completion_tokens"]
+ s.get_meta_info("answer_2")["completion_tokens"]