Unverified commit dd5d1ef7, authored by avigny, committed by GitHub
Browse files

[Bugfix] Mistral tool parser streaming update (#19425)


Signed-off-by: avigny <47987522+avigny@users.noreply.github.com>
Signed-off-by: Chauncey <chaunceyjiang@gmail.com>
Signed-off-by: chaunceyjiang <chaunceyjiang@gmail.com>
Co-authored-by: Jeff Cook <jeff@jeffcook.io>
Co-authored-by: sfbemerk <benjaminmerkel@mail.de>
Co-authored-by: Chauncey <chaunceyjiang@gmail.com>
Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk>
parent d1f7392c
...@@ -46,6 +46,7 @@ scipy # Required for phi-4-multimodal-instruct ...@@ -46,6 +46,7 @@ scipy # Required for phi-4-multimodal-instruct
ninja # Required for xgrammar, rocm, tpu, xpu ninja # Required for xgrammar, rocm, tpu, xpu
pybase64 # fast base64 implementation pybase64 # fast base64 implementation
cbor2 # Required for cross-language serialization of hashable objects cbor2 # Required for cross-language serialization of hashable objects
ijson # Required for mistral streaming tool parser
setproctitle # Used to set process names for better debugging and monitoring setproctitle # Used to set process names for better debugging and monitoring
openai-harmony >= 0.0.3 # Required for gpt-oss openai-harmony >= 0.0.3 # Required for gpt-oss
anthropic == 0.71.0 anthropic == 0.71.0
......
This diff is collapsed.
...@@ -123,7 +123,7 @@ CONFIGS: dict[str, ServerConfig] = { ...@@ -123,7 +123,7 @@ CONFIGS: dict[str, ServerConfig] = {
"supports_parallel": True, "supports_parallel": True,
"extended": True, "extended": True,
}, },
"mistral": { "mistral-7b": {
"model": "mistralai/Mistral-7B-Instruct-v0.3", "model": "mistralai/Mistral-7B-Instruct-v0.3",
"arguments": [ "arguments": [
"--enforce-eager", "--enforce-eager",
...@@ -145,6 +145,32 @@ CONFIGS: dict[str, ServerConfig] = { ...@@ -145,6 +145,32 @@ CONFIGS: dict[str, ServerConfig] = {
"call the tool. Otherwise, answer the user's query directly " "call the tool. Otherwise, answer the user's query directly "
"without calling a tool. DO NOT CALL A TOOL THAT IS IRRELEVANT " "without calling a tool. DO NOT CALL A TOOL THAT IS IRRELEVANT "
"to the user's question - just respond to it normally.", "to the user's question - just respond to it normally.",
"supports_parallel": True,
},
"mistral-small-3.2": {
"model": "mistralai/Mistral-Small-3.2-24B-Instruct-2506",
"arguments": [
"--enforce-eager",
"--no-enable-prefix-caching",
"--tool-call-parser",
"mistral",
"--tokenizer-mode",
"mistral",
"--config-format",
"mistral",
"--load-format",
"mistral",
"--tensor-parallel-size",
"4",
'--ignore-patterns="consolidated.safetensors"',
],
"system_prompt": "You are a helpful assistant with access to tools. If a tool"
" that you have would be helpful to answer a user query, "
"call the tool. Otherwise, answer the user's query directly "
"without calling a tool. DO NOT CALL A TOOL THAT IS IRRELEVANT "
"to the user's question - just respond to it normally.",
"supports_parallel": True,
"extended": True,
}, },
# FIXME: This test currently fails, need to debug why. # FIXME: This test currently fails, need to debug why.
# "granite20b": { # "granite20b": {
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment