fix: update bench_speculative (#5649)
This commit is contained in:
@@ -993,6 +993,8 @@ async def benchmark(
|
|||||||
async with semaphore:
|
async with semaphore:
|
||||||
return await request_func(request_func_input=request_func_input, pbar=pbar)
|
return await request_func(request_func_input=request_func_input, pbar=pbar)
|
||||||
|
|
||||||
|
if not hasattr(args, "warmup_requests"):
|
||||||
|
args.warmup_requests = 1
|
||||||
# Warmup
|
# Warmup
|
||||||
print(f"Starting warmup with {args.warmup_requests} sequences...")
|
print(f"Starting warmup with {args.warmup_requests} sequences...")
|
||||||
|
|
||||||
|
|||||||
@@ -85,7 +85,7 @@ def send_one_batch(base_url, num_prompts, batch_size):
|
|||||||
request_rate=float("inf"),
|
request_rate=float("inf"),
|
||||||
max_concurrency=batch_size,
|
max_concurrency=batch_size,
|
||||||
disable_tqdm=False,
|
disable_tqdm=False,
|
||||||
lora_name=None,
|
lora_names=None,
|
||||||
extra_request_body={},
|
extra_request_body={},
|
||||||
profile=None,
|
profile=None,
|
||||||
)
|
)
|
||||||
|
|||||||
Reference in New Issue
Block a user