Rename sglang.bench_latency to sglang.bench_one_batch (#2118)

This commit is contained in:
Lianmin Zheng
2024-11-21 20:07:48 -08:00
committed by GitHub
parent 8048c28c11
commit dfec7fca06
16 changed files with 521 additions and 599 deletions

View File

@@ -579,11 +579,11 @@ def run_bench_serving(
return res
-def run_bench_latency(model, other_args):
+def run_bench_one_batch(model, other_args):
command = [
"python3",
"-m",
-"sglang.bench_latency",
+"sglang.bench_one_batch",
"--model-path",
model,
"--batch-size",