config.rs 17.9 KB
Newer Older
1
// SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
3
// SPDX-License-Identifier: Apache-2.0

4
5
use super::json::JsonParserType;

6
7
8
9
10
11
#[derive(Clone, Debug, serde::Serialize, serde::Deserialize)]
pub struct JsonParserConfig {
    /// Start token for individual tool calls (e.g., "<TOOLCALL>")
    pub tool_call_start_tokens: Vec<String>,
    /// End token for individual tool calls (e.g., "</TOOLCALL>")
    pub tool_call_end_tokens: Vec<String>,
12
13
14
15
    /// Separator tokens between function name and arguments
    /// (e.g., "<|tool▁sep|>" for DeepSeek v3.1)
    /// Used by some models to separate function name from arguments
    pub tool_call_separator_tokens: Vec<String>,
16
17
18
19
20
21
22
23
    /// The key for the function name in the tool call
    /// i.e. `{"name": "function", "arguments": {...}}` it would be
    /// "name"
    pub function_name_keys: Vec<String>,
    /// The key for the arguments in the tool call
    /// i.e. `{"name": "function", "arguments": {...}}` it would be
    /// "arguments"
    pub arguments_keys: Vec<String>,
24
25
26
27

    /// The type of JSON parser to use
    #[serde(default)]
    pub parser_type: JsonParserType,
28
29
30
31
32
33
34

    /// Parse input as bare JSON (a `{...}` object or `[...]` array) with no
    /// wrapping markers. Intended for guided-decoding paths where the backend
    /// emits a raw JSON shape. When true, `tool_call_start_tokens` /
    /// `tool_call_end_tokens` are ignored.
    #[serde(default)]
    pub bare_json_mode: bool,
35
36
37
38
39
40
41
}

impl Default for JsonParserConfig {
    fn default() -> Self {
        Self {
            tool_call_start_tokens: vec!["<TOOLCALL>".to_string(), "<|python_tag|>".to_string()],
            tool_call_end_tokens: vec!["</TOOLCALL>".to_string(), "".to_string()],
42
            tool_call_separator_tokens: vec![],
43
44
            function_name_keys: vec!["name".to_string()],
            arguments_keys: vec!["arguments".to_string(), "parameters".to_string()],
45
            parser_type: JsonParserType::Basic,
46
            bare_json_mode: false,
47
48
49
50
        }
    }
}

51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
#[derive(Clone, Debug, serde::Serialize, serde::Deserialize)]
pub struct XmlParserConfig {
    /// Start token for individual tool calls (e.g., "<tool_call>")
    pub tool_call_start_token: String,
    /// End token for individual tool calls (e.g., "</tool_call>")
    pub tool_call_end_token: String,
    /// Start token for function name (e.g., "<function=")
    pub function_start_token: String,
    /// End token for function (e.g., "</function>")
    pub function_end_token: String,
    /// Start token for parameter (e.g., "<parameter=")
    pub parameter_start_token: String,
    /// End token for parameter (e.g., "</parameter>")
    pub parameter_end_token: String,
}

impl Default for XmlParserConfig {
    fn default() -> Self {
        Self {
            tool_call_start_token: "<tool_call>".to_string(),
            tool_call_end_token: "</tool_call>".to_string(),
            function_start_token: "<function=".to_string(),
            function_end_token: "</function>".to_string(),
            parameter_start_token: "<parameter=".to_string(),
            parameter_end_token: "</parameter>".to_string(),
        }
    }
}

80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
/// Configuration for DSML-style tool call parser (DeepSeek V3.2+)
#[derive(Clone, Debug, serde::Serialize, serde::Deserialize)]
pub struct DsmlParserConfig {
    /// Start token for function_calls block (e.g., "<|DSML|function_calls>")
    pub function_calls_start: String,
    /// End token for function_calls block (e.g., "</|DSML|function_calls>")
    pub function_calls_end: String,
    /// Start prefix for invoke (e.g., "<|DSML|invoke name=")
    pub invoke_start_prefix: String,
    /// End token for invoke (e.g., "</|DSML|invoke>")
    pub invoke_end: String,
    /// Start prefix for parameter (e.g., "<|DSML|parameter name=")
    pub parameter_prefix: String,
    /// End token for parameter (e.g., "</|DSML|parameter>")
    pub parameter_end: String,
}

impl Default for DsmlParserConfig {
    fn default() -> Self {
        Self {
            function_calls_start: "<|DSML|function_calls>".to_string(),
            function_calls_end: "</|DSML|function_calls>".to_string(),
            invoke_start_prefix: "<|DSML|invoke name=".to_string(),
            invoke_end: "</|DSML|invoke>".to_string(),
            parameter_prefix: "<|DSML|parameter name=".to_string(),
            parameter_end: "</|DSML|parameter>".to_string(),
        }
    }
}

110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
/// Configuration for GLM-4.7 style tool call parser
/// Format: <tool_call>function_name<arg_key>param</arg_key><arg_value>value</arg_value></tool_call>
#[derive(Clone, Debug, serde::Serialize, serde::Deserialize)]
pub struct Glm47ParserConfig {
    /// Start token for tool call block (e.g., "<tool_call>")
    pub tool_call_start: String,
    /// End token for tool call block (e.g., "</tool_call>")
    pub tool_call_end: String,
    /// Start token for argument key (e.g., "<arg_key>")
    pub arg_key_start: String,
    /// End token for argument key (e.g., "</arg_key>")
    pub arg_key_end: String,
    /// Start token for argument value (e.g., "<arg_value>")
    pub arg_value_start: String,
    /// End token for argument value (e.g., "</arg_value>")
    pub arg_value_end: String,
}

impl Default for Glm47ParserConfig {
    fn default() -> Self {
        Self {
            tool_call_start: "<tool_call>".to_string(),
            tool_call_end: "</tool_call>".to_string(),
            arg_key_start: "<arg_key>".to_string(),
            arg_key_end: "</arg_key>".to_string(),
            arg_value_start: "<arg_value>".to_string(),
            arg_value_end: "</arg_value>".to_string(),
        }
    }
}

141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
/// Configuration for Kimi K2 tool call parser
///
/// Format:
/// ```text
/// <|tool_calls_section_begin|>
/// <|tool_call_begin|>functions.{name}:{index}<|tool_call_argument_begin|>{json_args}<|tool_call_end|>
/// <|tool_calls_section_end|>
/// ```
///
/// The model may emit either plural or singular forms of section tokens
/// (e.g., `<|tool_calls_section_begin|>` or `<|tool_call_section_begin|>`).
/// Both forms are supported via the `section_start_variants` and `section_end_variants` fields.
/// See vllm `kimi_k2_tool_parser.py` for reference.
#[derive(Clone, Debug, serde::Serialize, serde::Deserialize)]
pub struct KimiK2ParserConfig {
    /// Primary start token for the tool calls section
    pub section_start: String,
    /// Primary end token for the tool calls section
    pub section_end: String,
    /// All recognized start tokens for the tool calls section (includes singular variants)
    pub section_start_variants: Vec<String>,
    /// All recognized end tokens for the tool calls section (includes singular variants)
    pub section_end_variants: Vec<String>,
    /// Start token for an individual tool call (e.g., "<|tool_call_begin|>")
    pub call_start: String,
    /// End token for an individual tool call (e.g., "<|tool_call_end|>")
    pub call_end: String,
    /// Token separating function ID from JSON arguments (e.g., "<|tool_call_argument_begin|>")
    pub argument_begin: String,
}

impl Default for KimiK2ParserConfig {
    fn default() -> Self {
        Self {
            section_start: "<|tool_calls_section_begin|>".to_string(),
            section_end: "<|tool_calls_section_end|>".to_string(),
            section_start_variants: vec![
                "<|tool_calls_section_begin|>".to_string(),
                "<|tool_call_section_begin|>".to_string(),
            ],
            section_end_variants: vec![
                "<|tool_calls_section_end|>".to_string(),
                "<|tool_call_section_end|>".to_string(),
            ],
            call_start: "<|tool_call_begin|>".to_string(),
            call_end: "<|tool_call_end|>".to_string(),
            argument_begin: "<|tool_call_argument_begin|>".to_string(),
        }
    }
}

192
193
194
195
196
197
198
199
200
/// Parser-specific configuration
#[derive(Clone, Debug, serde::Serialize, serde::Deserialize)]
#[serde(tag = "type", rename_all = "snake_case")]
pub enum ParserConfig {
    Json(JsonParserConfig),
    Xml(XmlParserConfig),
    Pythonic,
    Harmony(JsonParserConfig),
    Typescript,
201
    Dsml(DsmlParserConfig),
202
    KimiK2(KimiK2ParserConfig),
203
    Glm47(Glm47ParserConfig),
204
205
206
207
208
209
210
211
212
213
214
215
}

impl ParserConfig {
    /// Get the tool call start tokens for this parser configuration
    /// Returns a vector of start tokens that indicate the beginning of a tool call
    pub fn tool_call_start_tokens(&self) -> Vec<String> {
        match self {
            ParserConfig::Json(config) => config.tool_call_start_tokens.clone(),
            ParserConfig::Harmony(config) => config.tool_call_start_tokens.clone(),
            ParserConfig::Xml(config) => vec![config.tool_call_start_token.clone()],
            ParserConfig::Pythonic => vec![],
            ParserConfig::Typescript => vec![],
216
            ParserConfig::Dsml(config) => vec![config.function_calls_start.clone()],
217
            ParserConfig::Glm47(config) => vec![config.tool_call_start.clone()],
218
            ParserConfig::KimiK2(config) => config.section_start_variants.clone(),
219
220
221
222
223
224
225
226
227
228
229
230
        }
    }

    /// Get the tool call end tokens for this parser configuration
    /// Returns a vector of end tokens that indicate the end of a tool call
    pub fn tool_call_end_tokens(&self) -> Vec<String> {
        match self {
            ParserConfig::Json(config) => config.tool_call_end_tokens.clone(),
            ParserConfig::Harmony(config) => config.tool_call_end_tokens.clone(),
            ParserConfig::Xml(config) => vec![config.tool_call_end_token.clone()],
            ParserConfig::Pythonic => vec![],
            ParserConfig::Typescript => vec![],
231
            ParserConfig::Dsml(config) => vec![config.function_calls_end.clone()],
232
            ParserConfig::Glm47(config) => vec![config.tool_call_end.clone()],
233
            ParserConfig::KimiK2(config) => config.section_end_variants.clone(),
234
235
236
237
        }
    }
}

238
239
240
/// Configuration for parsing tool calls with different formats
#[derive(Clone, Debug, serde::Serialize, serde::Deserialize)]
pub struct ToolCallConfig {
241
242
    /// Parser-specific configuration.
    pub parser_config: ParserConfig,
243
244
245
246
247
}

impl Default for ToolCallConfig {
    fn default() -> Self {
        Self {
248
            parser_config: ParserConfig::Json(JsonParserConfig::default()),
249
250
251
252
253
254
255
256
257
        }
    }
}

impl ToolCallConfig {
    /// Default configuration for hermes tool calls
    /// <tool_call>{"name": "get_weather", "arguments": {"location": "San Francisco, CA", "unit": "fahrenheit"}}\n</tool_call>
    pub fn hermes() -> Self {
        Self {
258
            parser_config: ParserConfig::Json(JsonParserConfig {
259
                tool_call_start_tokens: vec!["<tool_call>".to_string()],
260
                tool_call_end_tokens: vec!["</tool_call>".to_string()],
261
                ..Default::default()
262
            }),
263
264
265
266
267
268
269
        }
    }

    /// Default configuration for nemotron tool calls
    /// <TOOLCALL>[{"name": "get_weather", "arguments": {"location": "San Francisco, CA", "unit": "fahrenheit"}}]</TOOLCALL>
    pub fn nemotron_deci() -> Self {
        Self {
270
            parser_config: ParserConfig::Json(JsonParserConfig {
271
272
273
                tool_call_start_tokens: vec!["<TOOLCALL>".to_string()],
                tool_call_end_tokens: vec!["</TOOLCALL>".to_string()],
                ..Default::default()
274
            }),
275
276
277
278
279
280
281
        }
    }

    pub fn llama3_json() -> Self {
        // <|python_tag|>{ "name": "get_weather", "arguments": {"location": "San Francisco, CA", "unit": "fahrenheit"} }
        // or { "name": "get_weather", "arguments": {"location": "San Francisco, CA", "unit": "fahrenheit"} }
        Self {
282
            parser_config: ParserConfig::Json(JsonParserConfig {
283
284
285
                tool_call_start_tokens: vec!["<|python_tag|>".to_string()],
                tool_call_end_tokens: vec!["".to_string()],
                ..Default::default()
286
            }),
287
288
289
290
291
        }
    }

    pub fn mistral() -> Self {
        Self {
292
            parser_config: ParserConfig::Json(JsonParserConfig {
293
                tool_call_start_tokens: vec!["[TOOL_CALLS]".to_string()],
294
                tool_call_end_tokens: vec!["[/TOOL_CALLS]".to_string(), "".to_string()],
295
                ..Default::default()
296
            }),
297
298
299
300
301
        }
    }

    pub fn phi4() -> Self {
        Self {
302
            parser_config: ParserConfig::Json(JsonParserConfig {
303
304
305
                tool_call_start_tokens: vec!["functools".to_string()],
                tool_call_end_tokens: vec!["".to_string()],
                ..Default::default()
306
            }),
307
308
309
310
311
        }
    }

    pub fn pythonic() -> Self {
        Self {
312
            parser_config: ParserConfig::Pythonic,
313
314
        }
    }
315
316
317

    pub fn harmony() -> Self {
        Self {
318
            parser_config: ParserConfig::Harmony(JsonParserConfig {
319
320
321
                tool_call_start_tokens: vec!["<|start|>assistant<|channel|>commentary".to_string()],
                tool_call_end_tokens: vec!["<|call|>".to_string()],
                ..Default::default()
322
            }),
323
324
        }
    }
325
326

    pub fn deepseek_v3_1() -> Self {
327
328
329
330
331
332
        // The whole tool calls block is wrapped between
        // <|tool▁calls▁begin|> ... <|tool▁calls▁end|>
        // regardless of number of tool calls. For external use of this
        // config, we want them to only be operating on the whole block,
        // so the tool parser can properly consume all tool call tokens.
        // https://huggingface.co/deepseek-ai/DeepSeek-V3.1#toolcall
333
        Self {
334
            parser_config: ParserConfig::Json(JsonParserConfig {
335
336
                tool_call_start_tokens: vec![
                    "<|tool▁calls▁begin|>".to_string(),
337
                    // "<|tool▁call▁begin|>".to_string(),
338
                ],
339
340
                tool_call_end_tokens: vec![
                    "<|tool▁calls▁end|>".to_string(),
341
                    // "<|tool▁call▁end|>".to_string(),
342
343
                ],
                tool_call_separator_tokens: vec!["<|tool▁sep|>".to_string()],
344
345
                parser_type: JsonParserType::DeepseekV31,
                ..Default::default()
346
            }),
347
348
        }
    }
349
350
351
352
353
354

    pub fn deepseek_v3() -> Self {
        // DeepSeek V3 format:
        // <|tool▁calls▁begin|><|tool▁call▁begin|>{type}<|tool▁sep|>{function_name}\n```json\n{arguments}\n```<|tool▁call▁end|><|tool▁calls▁end|>
        // There are some differences between DeepSeek V3 and DeepSeek V3.1
        Self {
355
            parser_config: ParserConfig::Json(JsonParserConfig {
356
357
358
359
360
                tool_call_start_tokens: vec!["<|tool▁calls▁begin|>".to_string()],
                tool_call_end_tokens: vec!["<|tool▁calls▁end|>".to_string()],
                tool_call_separator_tokens: vec!["<|tool▁sep|>".to_string()],
                parser_type: JsonParserType::DeepseekV3,
                ..Default::default()
361
            }),
362
363
        }
    }
364
365
366
367

    pub fn qwen3_coder() -> Self {
        // <tool_call><function=name><parameter=key>value</parameter></function></tool_call>
        Self {
368
            parser_config: ParserConfig::Xml(XmlParserConfig::default()),
369
370
        }
    }
371
372
373
374
375
376
377
378
379
380

    pub fn jamba() -> Self {
        Self {
            parser_config: ParserConfig::Json(JsonParserConfig {
                tool_call_start_tokens: vec!["<tool_calls>".to_string()],
                tool_call_end_tokens: vec!["</tool_calls>".to_string()],
                ..Default::default()
            }),
        }
    }
381
382
383
384
385
386
387
388
389
390
391
392

    pub fn deepseek_v3_2() -> Self {
        // DeepSeek V3.2 format (DSML):
        // <|DSML|function_calls>
        // <|DSML|invoke name="function_name">
        // <|DSML|parameter name="param_name" string="true|false">value</|DSML|parameter>
        // </|DSML|invoke>
        // </|DSML|function_calls>
        Self {
            parser_config: ParserConfig::Dsml(DsmlParserConfig::default()),
        }
    }
393

394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
    pub fn deepseek_v4() -> Self {
        // DeepSeek V4 format (DSML):
        // <|DSML|tool_calls>
        // <|DSML|invoke name="function_name">
        // <|DSML|parameter name="param_name" string="true|false">value</|DSML|parameter>
        // </|DSML|invoke>
        // </|DSML|tool_calls>
        Self {
            parser_config: ParserConfig::Dsml(DsmlParserConfig {
                function_calls_start: "<|DSML|tool_calls>".to_string(),
                function_calls_end: "</|DSML|tool_calls>".to_string(),
                ..Default::default()
            }),
        }
    }

410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
    pub fn minimax_m2() -> Self {
        // MiniMax-M2.1 format:
        // <minimax:tool_call>
        // <invoke name="function_name">
        // <parameter name="param_name">value</parameter>
        // </invoke>
        // </minimax:tool_call>
        // Reference: https://huggingface.co/MiniMaxAI/MiniMax-M2.1/blob/main/docs/tool_calling_guide.md
        Self {
            parser_config: ParserConfig::Xml(XmlParserConfig {
                tool_call_start_token: "<minimax:tool_call>".to_string(),
                tool_call_end_token: "</minimax:tool_call>".to_string(),
                function_start_token: "<invoke name=".to_string(),
                function_end_token: "</invoke>".to_string(),
                parameter_start_token: "<parameter name=".to_string(),
                parameter_end_token: "</parameter>".to_string(),
            }),
        }
    }
429
430
431
432
433
434
435
436
437

    pub fn glm47() -> Self {
        // GLM-4.7 format:
        // <tool_call>function_name<arg_key>param1</arg_key><arg_value>value1</arg_value></tool_call>
        // Reference: https://huggingface.co/zai-org/GLM-4.7/blob/main/chat_template.jinja
        Self {
            parser_config: ParserConfig::Glm47(Glm47ParserConfig::default()),
        }
    }
438
439
440
441
442
443
444
445
446
447
448

    pub fn kimi_k2() -> Self {
        // Kimi K2 format:
        // <|tool_calls_section_begin|>
        // <|tool_call_begin|>functions.{name}:{index}<|tool_call_argument_begin|>{json_args}<|tool_call_end|>
        // <|tool_calls_section_end|>
        // Reference: https://huggingface.co/moonshotai/Kimi-K2-Instruct/blob/main/docs/tool_call_guidance.md
        Self {
            parser_config: ParserConfig::KimiK2(KimiK2ParserConfig::default()),
        }
    }
449
}