accommodate reasoning_effort set in chat_template_kwargs (#9458)
This commit is contained in:
@@ -87,6 +87,14 @@ class OpenAIServingChat(OpenAIServingBase):
|
|||||||
self,
|
self,
|
||||||
request: ChatCompletionRequest,
|
request: ChatCompletionRequest,
|
||||||
) -> tuple[GenerateReqInput, ChatCompletionRequest]:
|
) -> tuple[GenerateReqInput, ChatCompletionRequest]:
|
||||||
|
reasoning_effort = (
|
||||||
|
request.chat_template_kwargs.pop("reasoning_effort", None)
|
||||||
|
if request.chat_template_kwargs
|
||||||
|
else None
|
||||||
|
)
|
||||||
|
if reasoning_effort is not None:
|
||||||
|
request.reasoning_effort = reasoning_effort
|
||||||
|
|
||||||
"""Convert OpenAI chat completion request to internal format"""
|
"""Convert OpenAI chat completion request to internal format"""
|
||||||
is_multimodal = self.tokenizer_manager.model_config.is_multimodal
|
is_multimodal = self.tokenizer_manager.model_config.is_multimodal
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user