From 7282ab741a4d07dfb775cbba7fd442b68fddfeeb Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Tue, 22 Apr 2025 16:08:15 -0700 Subject: [PATCH] fix: update bench_speculative (#5649) --- python/sglang/bench_serving.py | 2 ++ scripts/playground/bench_speculative.py | 2 +- 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/python/sglang/bench_serving.py b/python/sglang/bench_serving.py index ad5017612..18003e4d7 100644 --- a/python/sglang/bench_serving.py +++ b/python/sglang/bench_serving.py @@ -993,6 +993,8 @@ async def benchmark( async with semaphore: return await request_func(request_func_input=request_func_input, pbar=pbar) + if not hasattr(args, "warmup_requests"): + args.warmup_requests = 1 # Warmup print(f"Starting warmup with {args.warmup_requests} sequences...") diff --git a/scripts/playground/bench_speculative.py b/scripts/playground/bench_speculative.py index ff2e97262..a8676556c 100644 --- a/scripts/playground/bench_speculative.py +++ b/scripts/playground/bench_speculative.py @@ -85,7 +85,7 @@ def send_one_batch(base_url, num_prompts, batch_size): request_rate=float("inf"), max_concurrency=batch_size, disable_tqdm=False, - lora_name=None, + lora_names=None, extra_request_body={}, profile=None, )