Fix openai protocols and pass top_k, min_p (#2499)

This commit is contained in:
Lianmin Zheng
2024-12-17 04:14:14 -08:00
committed by GitHub
parent 33c5ff2845
commit 361ea8d912
2 changed files with 13 additions and 5 deletions

View File

@@ -510,6 +510,8 @@ def v1_generate_request(
"stop": request.stop,
"stop_token_ids": request.stop_token_ids,
"top_p": request.top_p,
"top_k": request.top_k,
"min_p": request.min_p,
"presence_penalty": request.presence_penalty,
"frequency_penalty": request.frequency_penalty,
"repetition_penalty": request.repetition_penalty,
@@ -926,6 +928,8 @@ def v1_chat_generate_request(
"stop": stop,
"stop_token_ids": request.stop_token_ids,
"top_p": request.top_p,
"top_k": request.top_k,
"min_p": request.min_p,
"presence_penalty": request.presence_penalty,
"frequency_penalty": request.frequency_penalty,
"repetition_penalty": request.repetition_penalty,