Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
a3ea760e
Unverified
Commit
a3ea760e
authored
Mar 11, 2026
by
Julien Denize
Committed by
GitHub
Mar 11, 2026
Browse files
Add 'none' reasoning effort to ChatCompletionRequest (#36238)
Signed-off-by:
Julien Denize
<
julien.denize@mistral.ai
>
parent
35db669f
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
14 additions
and
2 deletions
+14
-2
vllm/entrypoints/openai/chat_completion/protocol.py
vllm/entrypoints/openai/chat_completion/protocol.py
+8
-1
vllm/entrypoints/openai/chat_completion/serving.py
vllm/entrypoints/openai/chat_completion/serving.py
+3
-1
vllm/entrypoints/serve/render/serving.py
vllm/entrypoints/serve/render/serving.py
+3
-0
No files found.
vllm/entrypoints/openai/chat_completion/protocol.py
View file @
a3ea760e
...
@@ -179,7 +179,7 @@ class ChatCompletionRequest(OpenAIBaseModel):
...
@@ -179,7 +179,7 @@ class ChatCompletionRequest(OpenAIBaseModel):
|
ChatCompletionNamedToolChoiceParam
|
ChatCompletionNamedToolChoiceParam
|
None
|
None
)
=
"none"
)
=
"none"
reasoning_effort
:
Literal
[
"low"
,
"medium"
,
"high"
]
|
None
=
None
reasoning_effort
:
Literal
[
"none"
,
"low"
,
"medium"
,
"high"
]
|
None
=
None
include_reasoning
:
bool
=
True
include_reasoning
:
bool
=
True
parallel_tool_calls
:
bool
|
None
=
True
parallel_tool_calls
:
bool
|
None
=
True
...
@@ -778,3 +778,10 @@ class ChatCompletionRequest(OpenAIBaseModel):
...
@@ -778,3 +778,10 @@ class ChatCompletionRequest(OpenAIBaseModel):
)
)
return
data
return
data
@
model_validator
(
mode
=
"before"
)
@
classmethod
def
set_include_reasoning_for_none_effort
(
cls
,
data
:
Any
)
->
Any
:
if
data
.
get
(
"reasoning_effort"
)
==
"none"
:
data
[
"include_reasoning"
]
=
False
return
data
vllm/entrypoints/openai/chat_completion/serving.py
View file @
a3ea760e
...
@@ -1893,8 +1893,10 @@ class OpenAIServingChat(OpenAIServing):
...
@@ -1893,8 +1893,10 @@ class OpenAIServingChat(OpenAIServing):
# if the model supports it. TODO: Support browsing.
# if the model supports it. TODO: Support browsing.
assert
not
self
.
supports_browsing
assert
not
self
.
supports_browsing
assert
not
self
.
supports_code_interpreter
assert
not
self
.
supports_code_interpreter
if
(
reasoning_effort
:
=
request
.
reasoning_effort
)
==
"none"
:
raise
ValueError
(
f
"Harmony does not support
{
reasoning_effort
=
}
"
)
sys_msg
=
get_system_message
(
sys_msg
=
get_system_message
(
reasoning_effort
=
request
.
reasoning_effort
,
reasoning_effort
=
reasoning_effort
,
browser_description
=
None
,
browser_description
=
None
,
python_description
=
None
,
python_description
=
None
,
with_custom_tools
=
should_include_tools
,
with_custom_tools
=
should_include_tools
,
...
...
vllm/entrypoints/serve/render/serving.py
View file @
a3ea760e
...
@@ -221,6 +221,9 @@ class OpenAIServingRender:
...
@@ -221,6 +221,9 @@ class OpenAIServingRender:
# if the model supports it. TODO: Support browsing.
# if the model supports it. TODO: Support browsing.
assert
not
self
.
supports_browsing
assert
not
self
.
supports_browsing
assert
not
self
.
supports_code_interpreter
assert
not
self
.
supports_code_interpreter
assert
request
.
reasoning_effort
!=
"none"
,
(
"Harmony does not support reasoning_effort='none'"
)
sys_msg
=
get_system_message
(
sys_msg
=
get_system_message
(
reasoning_effort
=
request
.
reasoning_effort
,
reasoning_effort
=
request
.
reasoning_effort
,
browser_description
=
None
,
browser_description
=
None
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment