Unverified commit 6eca337c, authored by Shintarou Okada, committed by GitHub
Browse files

Replace `--expand-tools-even-if-tool-choice-none` with...


Replace `--expand-tools-even-if-tool-choice-none` with `--exclude-tools-when-tool-choice-none` for v0.10.0 (#20544)
Signed-off-by: okada <kokuzen@gmail.com>
Signed-off-by: okada shintarou <okada@preferred.jp>
Co-authored-by: Harry Mellor <19981378+hmellor@users.noreply.github.com>
parent 85bda9e7
...@@ -103,7 +103,8 @@ When tool_choice='required' is set, the model is guaranteed to generate one or m ...@@ -103,7 +103,8 @@ When tool_choice='required' is set, the model is guaranteed to generate one or m
vLLM supports the `tool_choice='none'` option in the chat completion API. When this option is set, the model will not generate any tool calls and will respond with regular text content only, even if tools are defined in the request. vLLM supports the `tool_choice='none'` option in the chat completion API. When this option is set, the model will not generate any tool calls and will respond with regular text content only, even if tools are defined in the request.
However, when `tool_choice='none'` is specified, vLLM includes tool definitions from the prompt. !!! note
When tools are specified in the request, vLLM includes tool definitions in the prompt by default, regardless of the `tool_choice` setting. To exclude tool definitions when `tool_choice='none'`, use the `--exclude-tools-when-tool-choice-none` option.
## Automatic Function Calling ## Automatic Function Calling
......
...@@ -1646,6 +1646,8 @@ async def init_app_state( ...@@ -1646,6 +1646,8 @@ async def init_app_state(
chat_template_content_format=args.chat_template_content_format, chat_template_content_format=args.chat_template_content_format,
return_tokens_as_token_ids=args.return_tokens_as_token_ids, return_tokens_as_token_ids=args.return_tokens_as_token_ids,
enable_auto_tools=args.enable_auto_tool_choice, enable_auto_tools=args.enable_auto_tool_choice,
exclude_tools_when_tool_choice_none=args.
exclude_tools_when_tool_choice_none,
tool_parser=args.tool_call_parser, tool_parser=args.tool_call_parser,
reasoning_parser=args.reasoning_parser, reasoning_parser=args.reasoning_parser,
enable_prompt_tokens_details=args.enable_prompt_tokens_details, enable_prompt_tokens_details=args.enable_prompt_tokens_details,
......
...@@ -133,6 +133,9 @@ schema. Example: `[{"type": "text", "text": "Hello world!"}]`""" ...@@ -133,6 +133,9 @@ schema. Example: `[{"type": "text", "text": "Hello world!"}]`"""
"""If specified, API server will add X-Request-Id header to responses. """If specified, API server will add X-Request-Id header to responses.
Caution: this hurts performance at high QPS.""" Caution: this hurts performance at high QPS."""
enable_auto_tool_choice: bool = False enable_auto_tool_choice: bool = False
"""If specified, exclude tool definitions in prompts when
tool_choice='none'."""
exclude_tools_when_tool_choice_none: bool = False
"""Enable auto tool choice for supported models. Use `--tool-call-parser` """Enable auto tool choice for supported models. Use `--tool-call-parser`
to specify which parser to use.""" to specify which parser to use."""
tool_call_parser: Optional[str] = None tool_call_parser: Optional[str] = None
......
...@@ -63,6 +63,7 @@ class OpenAIServingChat(OpenAIServing): ...@@ -63,6 +63,7 @@ class OpenAIServingChat(OpenAIServing):
return_tokens_as_token_ids: bool = False, return_tokens_as_token_ids: bool = False,
reasoning_parser: str = "", reasoning_parser: str = "",
enable_auto_tools: bool = False, enable_auto_tools: bool = False,
exclude_tools_when_tool_choice_none: bool = False,
tool_parser: Optional[str] = None, tool_parser: Optional[str] = None,
enable_prompt_tokens_details: bool = False, enable_prompt_tokens_details: bool = False,
enable_force_include_usage: bool = False, enable_force_include_usage: bool = False,
...@@ -111,6 +112,8 @@ class OpenAIServingChat(OpenAIServing): ...@@ -111,6 +112,8 @@ class OpenAIServingChat(OpenAIServing):
raise TypeError("Error: --enable-auto-tool-choice requires " raise TypeError("Error: --enable-auto-tool-choice requires "
f"tool_parser:'{tool_parser}' which has not " f"tool_parser:'{tool_parser}' which has not "
"been registered") from e "been registered") from e
self.exclude_tools_when_tool_choice_none = (
exclude_tools_when_tool_choice_none)
self.enable_prompt_tokens_details = enable_prompt_tokens_details self.enable_prompt_tokens_details = enable_prompt_tokens_details
self.enable_force_include_usage = enable_force_include_usage self.enable_force_include_usage = enable_force_include_usage
...@@ -174,7 +177,9 @@ class OpenAIServingChat(OpenAIServing): ...@@ -174,7 +177,9 @@ class OpenAIServingChat(OpenAIServing):
"--enable-auto-tool-choice and --tool-call-parser to be set" "--enable-auto-tool-choice and --tool-call-parser to be set"
) )
if request.tools is None: if (request.tools is None
or (request.tool_choice == "none"
and self.exclude_tools_when_tool_choice_none)):
tool_dicts = None tool_dicts = None
else: else:
tool_dicts = [tool.model_dump() for tool in request.tools] tool_dicts = [tool.model_dump() for tool in request.tools]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment