Fix a bug with logprob streaming + chunked prefill (#2403)

This commit is contained in:
Lianmin Zheng
2024-12-08 03:55:27 -08:00
committed by GitHub
parent 61dec545b0
commit a2486eb58f
3 changed files with 24 additions and 13 deletions

View File

@@ -568,6 +568,7 @@ def run_bench_serving(
disable_tqdm=False,
disable_stream=disable_stream,
disable_ignore_eos=False,
return_logprob=False,
lora_name=None,
extra_request_body=None,
profile=None,