fix: update bench_speculative (#5649)

This commit is contained in:
Yineng Zhang
2025-04-22 16:08:15 -07:00
committed by GitHub
parent b0feda090c
commit 7282ab741a
2 changed files with 3 additions and 1 deletion

View File

@@ -993,6 +993,8 @@ async def benchmark(
async with semaphore:
return await request_func(request_func_input=request_func_input, pbar=pbar)
+if not hasattr(args, "warmup_requests"):
+    args.warmup_requests = 1
# Warmup
print(f"Starting warmup with {args.warmup_requests} sequences...")

View File

@@ -85,7 +85,7 @@ def send_one_batch(base_url, num_prompts, batch_size):
request_rate=float("inf"),
max_concurrency=batch_size,
disable_tqdm=False,
-lora_name=None,
+lora_names=None,
extra_request_body={},
profile=None,
)