fix: update bench_speculative (#5649)
This commit is contained in:
@@ -85,7 +85,7 @@ def send_one_batch(base_url, num_prompts, batch_size):
|
||||
request_rate=float("inf"),
|
||||
max_concurrency=batch_size,
|
||||
disable_tqdm=False,
|
||||
lora_name=None,
|
||||
lora_names=None,
|
||||
extra_request_body={},
|
||||
profile=None,
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user