reasoning.py 4.38 KB
Newer Older
1
2
3
4
5
6
7
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project

from dataclasses import field

from vllm.config.model import ModelConfig
from vllm.config.utils import config
8
from vllm.reasoning import ReasoningParserManager
9
10
11
12
13
14
15
from vllm.tokenizers import cached_tokenizer_from_config


@config
class ReasoningConfig:
    """Configuration for reasoning models.

16
    Set `reasoning_start_str` and `reasoning_end_str` to the strings that delimit
17
18
19
20
21
    the reasoning block (e.g. `"<think>"` and `"</think>"`).  The
    corresponding token IDs are derived automatically via
    `initialize_token_ids` and are not intended to be set directly.
    """

22
23
24
    reasoning_parser: str = ""
    """The name of the ReasoningParser to use for this model."""
    reasoning_start_str: str = ""
25
    """String that indicates the start of reasoning."""
26
    reasoning_end_str: str = ""
27
28
    """String that indicates the end of reasoning content."""

29
    _reasoning_start_token_ids: list[int] | None = field(
30
31
        default=None, init=False, repr=False
    )
32
    """Private backing field for `reasoning_start_token_ids`. Set by
33
    `initialize_token_ids`. Not intended to be configured directly."""
34
35
36
37
    _reasoning_end_token_ids: list[int] | None = field(
        default=None, init=False, repr=False
    )
    """Private backing field for `reasoning_end_token_ids`. Set by
38
39
    `initialize_token_ids`. Not intended to be configured directly."""

40
41
42
43
44
45
46
47
48
49
    _enabled: bool = field(default=False, init=False, repr=False)
    """Private field indicating whether reasoning token IDs have been initialized.
    Set to True by `initialize_token_ids` once token IDs are initialized."""

    @property
    def enabled(self) -> bool:
        """Returns True if reasoning is enabled (i.e. if token IDs have been
        initialized), False otherwise."""
        return self._enabled

50
    @property
51
52
    def reasoning_start_token_ids(self) -> list[int] | None:
        """Token IDs derived from `reasoning_start_str`. Set automatically by
53
        `initialize_token_ids`. Not intended to be configured directly."""
54
        return self._reasoning_start_token_ids
55
56

    @property
57
58
    def reasoning_end_token_ids(self) -> list[int] | None:
        """Token IDs derived from `reasoning_end_str`. Set automatically by
59
        `initialize_token_ids`. Not intended to be configured directly."""
60
        return self._reasoning_end_token_ids
61
62
63
64

    def initialize_token_ids(self, model_config: ModelConfig) -> None:
        """Initialize reasoning token IDs from strings using the tokenizer."""
        if (
65
66
            self._reasoning_start_token_ids is not None
            and self._reasoning_end_token_ids is not None
67
        ):
68
69
            self._enabled = True
            return  # Already initialized
70
71

        tokenizer = cached_tokenizer_from_config(model_config=model_config)
72
73
74
75
76
77
78
79
80
81
82
83
        reasoning_start_str = self.reasoning_start_str
        reasoning_end_str = self.reasoning_end_str
        if self.reasoning_parser is not None and (
            not reasoning_start_str or not reasoning_end_str
        ):
            parser_cls = ReasoningParserManager.get_reasoning_parser(
                self.reasoning_parser
            )
            reasoning_parser = parser_cls(tokenizer)
            start_token = reasoning_parser.reasoning_start_str
            if start_token and not reasoning_start_str:
                reasoning_start_str = start_token
84

85
86
87
88
89
90
91
92
            end_token = reasoning_parser.reasoning_end_str
            if end_token and not reasoning_end_str:
                reasoning_end_str = end_token

        if not reasoning_start_str or not reasoning_end_str:
            # If we don't have valid strings to tokenize,
            # we can't initialize the token IDs.
            return
93
        self._reasoning_start_token_ids = tokenizer.encode(
94
            reasoning_start_str, add_special_tokens=False
95
        )
96
        self._reasoning_end_token_ids = tokenizer.encode(
97
            reasoning_end_str, add_special_tokens=False
98
99
        )

100
        if not self._reasoning_start_token_ids or not self._reasoning_end_token_ids:
101
102
            raise ValueError(
                f"ReasoningConfig: failed to tokenize reasoning strings: "
103
104
                f"reasoning_start_str='{self.reasoning_start_str}', "
                f"reasoning_end_str='{self.reasoning_end_str}'. "
105
106
                "Ensure the strings are valid tokens in the model's vocabulary."
            )
107
        self._enabled = True