Unverified Commit 60b77e14 authored by Sanghoon Yoon's avatar Sanghoon Yoon Committed by GitHub
Browse files

[Frontend] Add `reasoning_effort` to `OpenAIServing._preprocess_chat()` (#31956)


Signed-off-by: default avatarSanghoon Yoon <seanyoon@kakao.com>
parent 15b33ff0
......@@ -306,6 +306,10 @@ class OpenAIServingChat(OpenAIServing):
)
if error_check_ret is not None:
return error_check_ret
chat_template_kwargs = request.chat_template_kwargs or {}
chat_template_kwargs.update(reasoning_effort=request.reasoning_effort)
conversation, engine_prompts = await self._preprocess_chat(
request,
tokenizer,
......@@ -316,7 +320,7 @@ class OpenAIServingChat(OpenAIServing):
continue_final_message=request.continue_final_message,
tool_dicts=tool_dicts,
documents=request.documents,
chat_template_kwargs=request.chat_template_kwargs,
chat_template_kwargs=chat_template_kwargs,
default_chat_template_kwargs=self.default_chat_template_kwargs,
tool_parser=tool_parser,
add_special_tokens=request.add_special_tokens,
......
......@@ -589,6 +589,13 @@ class OpenAIServingResponses(OpenAIServing):
prev_msg=self.msg_store.get(prev_response.id) if prev_response else None,
prev_response_output=prev_response.output if prev_response else None,
)
chat_template_kwargs = dict(
reasoning_effort=None
if request.reasoning is None
else request.reasoning.effort
)
_, engine_prompts = await self._preprocess_chat(
request,
tokenizer,
......@@ -597,6 +604,7 @@ class OpenAIServingResponses(OpenAIServing):
tool_parser=self.tool_parser,
chat_template=self.chat_template,
chat_template_content_format=self.chat_template_content_format,
chat_template_kwargs=chat_template_kwargs,
)
return messages, engine_prompts
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment