Unverified Commit 60b77e14 authored by Sanghoon Yoon's avatar Sanghoon Yoon Committed by GitHub
Browse files

[Frontend] Add `reasoning_effort` to `OpenAIServing._preprocess_chat()` (#31956)


Signed-off-by: default avatarSanghoon Yoon <seanyoon@kakao.com>
parent 15b33ff0
...@@ -306,6 +306,10 @@ class OpenAIServingChat(OpenAIServing): ...@@ -306,6 +306,10 @@ class OpenAIServingChat(OpenAIServing):
) )
if error_check_ret is not None: if error_check_ret is not None:
return error_check_ret return error_check_ret
chat_template_kwargs = request.chat_template_kwargs or {}
chat_template_kwargs.update(reasoning_effort=request.reasoning_effort)
conversation, engine_prompts = await self._preprocess_chat( conversation, engine_prompts = await self._preprocess_chat(
request, request,
tokenizer, tokenizer,
...@@ -316,7 +320,7 @@ class OpenAIServingChat(OpenAIServing): ...@@ -316,7 +320,7 @@ class OpenAIServingChat(OpenAIServing):
continue_final_message=request.continue_final_message, continue_final_message=request.continue_final_message,
tool_dicts=tool_dicts, tool_dicts=tool_dicts,
documents=request.documents, documents=request.documents,
chat_template_kwargs=request.chat_template_kwargs, chat_template_kwargs=chat_template_kwargs,
default_chat_template_kwargs=self.default_chat_template_kwargs, default_chat_template_kwargs=self.default_chat_template_kwargs,
tool_parser=tool_parser, tool_parser=tool_parser,
add_special_tokens=request.add_special_tokens, add_special_tokens=request.add_special_tokens,
......
...@@ -589,6 +589,13 @@ class OpenAIServingResponses(OpenAIServing): ...@@ -589,6 +589,13 @@ class OpenAIServingResponses(OpenAIServing):
prev_msg=self.msg_store.get(prev_response.id) if prev_response else None, prev_msg=self.msg_store.get(prev_response.id) if prev_response else None,
prev_response_output=prev_response.output if prev_response else None, prev_response_output=prev_response.output if prev_response else None,
) )
chat_template_kwargs = dict(
reasoning_effort=None
if request.reasoning is None
else request.reasoning.effort
)
_, engine_prompts = await self._preprocess_chat( _, engine_prompts = await self._preprocess_chat(
request, request,
tokenizer, tokenizer,
...@@ -597,6 +604,7 @@ class OpenAIServingResponses(OpenAIServing): ...@@ -597,6 +604,7 @@ class OpenAIServingResponses(OpenAIServing):
tool_parser=self.tool_parser, tool_parser=self.tool_parser,
chat_template=self.chat_template, chat_template=self.chat_template,
chat_template_content_format=self.chat_template_content_format, chat_template_content_format=self.chat_template_content_format,
chat_template_kwargs=chat_template_kwargs,
) )
return messages, engine_prompts return messages, engine_prompts
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment