Fix a bug with logprob streaming + chunked prefill (#2403)
This commit is contained in:
@@ -568,6 +568,7 @@ def run_bench_serving(
|
||||
disable_tqdm=False,
|
||||
disable_stream=disable_stream,
|
||||
disable_ignore_eos=False,
|
||||
return_logprob=False,
|
||||
lora_name=None,
|
||||
extra_request_body=None,
|
||||
profile=None,
|
||||
|
||||
Reference in New Issue
Block a user