Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
60b77e14
Unverified
Commit
60b77e14
authored
Jan 13, 2026
by
Sanghoon Yoon
Committed by
GitHub
Jan 13, 2026
Browse files
[Frontend] Add `reasoning_effort` to `OpenAIServing._preprocess_chat()` (#31956)
Signed-off-by:
Sanghoon Yoon
<
seanyoon@kakao.com
>
parent
15b33ff0
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
13 additions
and
1 deletion
+13
-1
vllm/entrypoints/openai/serving_chat.py
vllm/entrypoints/openai/serving_chat.py
+5
-1
vllm/entrypoints/openai/serving_responses.py
vllm/entrypoints/openai/serving_responses.py
+8
-0
No files found.
vllm/entrypoints/openai/serving_chat.py
View file @
60b77e14
...
@@ -306,6 +306,10 @@ class OpenAIServingChat(OpenAIServing):
...
@@ -306,6 +306,10 @@ class OpenAIServingChat(OpenAIServing):
)
)
if
error_check_ret
is
not
None
:
if
error_check_ret
is
not
None
:
return
error_check_ret
return
error_check_ret
chat_template_kwargs
=
request
.
chat_template_kwargs
or
{}
chat_template_kwargs
.
update
(
reasoning_effort
=
request
.
reasoning_effort
)
conversation
,
engine_prompts
=
await
self
.
_preprocess_chat
(
conversation
,
engine_prompts
=
await
self
.
_preprocess_chat
(
request
,
request
,
tokenizer
,
tokenizer
,
...
@@ -316,7 +320,7 @@ class OpenAIServingChat(OpenAIServing):
...
@@ -316,7 +320,7 @@ class OpenAIServingChat(OpenAIServing):
continue_final_message
=
request
.
continue_final_message
,
continue_final_message
=
request
.
continue_final_message
,
tool_dicts
=
tool_dicts
,
tool_dicts
=
tool_dicts
,
documents
=
request
.
documents
,
documents
=
request
.
documents
,
chat_template_kwargs
=
request
.
chat_template_kwargs
,
chat_template_kwargs
=
chat_template_kwargs
,
default_chat_template_kwargs
=
self
.
default_chat_template_kwargs
,
default_chat_template_kwargs
=
self
.
default_chat_template_kwargs
,
tool_parser
=
tool_parser
,
tool_parser
=
tool_parser
,
add_special_tokens
=
request
.
add_special_tokens
,
add_special_tokens
=
request
.
add_special_tokens
,
...
...
vllm/entrypoints/openai/serving_responses.py
View file @
60b77e14
...
@@ -589,6 +589,13 @@ class OpenAIServingResponses(OpenAIServing):
...
@@ -589,6 +589,13 @@ class OpenAIServingResponses(OpenAIServing):
prev_msg
=
self
.
msg_store
.
get
(
prev_response
.
id
)
if
prev_response
else
None
,
prev_msg
=
self
.
msg_store
.
get
(
prev_response
.
id
)
if
prev_response
else
None
,
prev_response_output
=
prev_response
.
output
if
prev_response
else
None
,
prev_response_output
=
prev_response
.
output
if
prev_response
else
None
,
)
)
chat_template_kwargs
=
dict
(
reasoning_effort
=
None
if
request
.
reasoning
is
None
else
request
.
reasoning
.
effort
)
_
,
engine_prompts
=
await
self
.
_preprocess_chat
(
_
,
engine_prompts
=
await
self
.
_preprocess_chat
(
request
,
request
,
tokenizer
,
tokenizer
,
...
@@ -597,6 +604,7 @@ class OpenAIServingResponses(OpenAIServing):
...
@@ -597,6 +604,7 @@ class OpenAIServingResponses(OpenAIServing):
tool_parser
=
self
.
tool_parser
,
tool_parser
=
self
.
tool_parser
,
chat_template
=
self
.
chat_template
,
chat_template
=
self
.
chat_template
,
chat_template_content_format
=
self
.
chat_template_content_format
,
chat_template_content_format
=
self
.
chat_template_content_format
,
chat_template_kwargs
=
chat_template_kwargs
,
)
)
return
messages
,
engine_prompts
return
messages
,
engine_prompts
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment