[Misc] Optimize the Qwen3_ReasoningParser extract_reasoning_content (#17515)

Signed-off-by: chaunceyjiang <chaunceyjiang@gmail.com>

[Misc] Optimize the Qwen3_ReasoningParser extract_reasoning_content (#17515)
Signed-off-by: chaunceyjiang <chaunceyjiang@gmail.com>
015069b0 · Chauncey · GitHub · fbefc8a7 · 015069b0
Unverified Commit 015069b0 authored May 01, 2025 by Chauncey Committed by GitHub May 01, 2025
Hide whitespace changes
Inline Side-by-side

Showing with 27 additions and 26 deletions

vllm/reasoning/qwen3_reasoning_parser.py vllm/reasoning/qwen3_reasoning_parser.py +27 -26

No files found.
--- a/vllm/reasoning/qwen3_reasoning_parser.py
+++ b/vllm/reasoning/qwen3_reasoning_parser.py
 # SPDX-License-Identifier: Apache-2.0
-import re
 from collections.abc import Sequence
 from typing import Optional, Union
@@ -31,9 +30,6 @@ class Qwen3ReasoningParser(ReasoningParser):
        self.think_start_token = "<think>"
        self.think_end_token = "</think>"
-        self.reasoning_regex = re.compile(
-            rf"{self.think_start_token}(.*?){self.think_end_token}", re.DOTALL)
        if not self.model_tokenizer:
            raise ValueError(
                "The model tokenizer must be passed to the ReasoningParser "
@@ -121,29 +117,34 @@ class Qwen3ReasoningParser(ReasoningParser):
    def extract_reasoning_content(
            self, model_output: str, request: ChatCompletionRequest
    ) -> tuple[Optional[str], Optional[str]]:
+        """
+        Extract reasoning content from the model output.
+        For text <think>abc</think>xyz:
+        - 'abc' goes to reasoning_content
+        - 'xyz' goes to content
-        # Check if the model output contains the <think> tokens.
+        Returns:
+            tuple[Optional[str], Optional[str]]: reasoning content and content
+        """
+        # Check if the model output contains the <think> and </think> tokens.
        if (self.think_start_token not in model_output
                or self.think_end_token not in model_output):
            return None, model_output
-        else:
+        # If the <think> token is present in the model output, drop it
-            # Use a regex to find the reasoning content
+        # together with any text that precedes it.
-            reasoning_content = self.reasoning_regex.findall(model_output)[0]
+        model_output_parts = model_output.partition(self.think_start_token)
+        model_output = model_output_parts[2] if model_output_parts[
-            # Remove the reasoning content from the model output
+            1] else model_output_parts[0]
-            # Although <think> token is always at the
+        # Check if the remaining output contains the </think> token.
-            # beginning of the line, we cannot guarantee that the
+        # If it does not, return the remaining output as content.
-            # other models will follow this convention.
+        if self.think_end_token not in model_output:
-            # Therefore, we need to add :start_index.
+            return None, model_output
-            start_index = model_output.find(self.think_start_token)
-            if start_index != -1:
+        # Extract reasoning content from the model output.
-                end_index = start_index + len(
+        reasoning_content, _, content = model_output.partition(
-                    f"{self.think_start_token}{reasoning_content}{self.think_end_token}"
+            self.think_end_token)
-                )
-                model_output = model_output[:start_index] + \
+        final_content = content or None
-                                model_output[end_index:]
+        return reasoning_content, final_content
-                if len(model_output) == 0:
-                    return reasoning_content, None
-            return reasoning_content, model_output