Fix benchmark latency (#1007)
This commit is contained in:
@@ -332,6 +332,7 @@ def latency_test(
     )
 
     # Warm up
+    rank_print("Warmup ...")
     latency_test_run_once(
         bench_args.run_name,
         model_runner,
@@ -341,6 +342,7 @@ def latency_test(
         bench_args.input_len[0],
         4,  # shorter decoding to speed up the warmup
     )
+    rank_print("Benchmark ...")
 
     # Run the sweep
     result_list = []
Reference in New Issue
Block a user