Unverified commit 49ab23b3, authored by Yu Guo, committed by GitHub
Browse files

[gpt-oss] use reasoning channel for reasoning text in serving_chat (#22920)


Signed-off-by: Yu Guo <yuguo@meta.com>
parent c9abb104
...@@ -663,9 +663,9 @@ class OpenAIServingChat(OpenAIServing): ...@@ -663,9 +663,9 @@ class OpenAIServingChat(OpenAIServing):
harmony_parser = harmony_parsers[i] harmony_parser = harmony_parsers[i]
for token_id in output.token_ids: for token_id in output.token_ids:
harmony_parser.process(token_id) harmony_parser.process(token_id)
# FIXME(woosuk): Support function calling is_reasoning = \
is_final = harmony_parser.current_channel == "final" harmony_parser.current_channel == "analysis"
if not (request.include_reasoning or is_final): if not request.include_reasoning and is_reasoning:
# Skip the reasoning content. # Skip the reasoning content.
continue continue
delta_text = harmony_parser.last_content_delta or "" delta_text = harmony_parser.last_content_delta or ""
...@@ -695,11 +695,11 @@ class OpenAIServingChat(OpenAIServing): ...@@ -695,11 +695,11 @@ class OpenAIServingChat(OpenAIServing):
current_token_ids = as_list(output.token_ids) current_token_ids = as_list(output.token_ids)
if self.use_harmony: if self.use_harmony:
if is_final: if is_reasoning:
delta_message = DeltaMessage(content=delta_text)
else:
delta_message = DeltaMessage( delta_message = DeltaMessage(
reasoning_content=delta_text) reasoning_content=delta_text)
else:
delta_message = DeltaMessage(content=delta_text)
# handle streaming deltas for tools with named tool_choice # handle streaming deltas for tools with named tool_choice
elif tool_choice_function_name: elif tool_choice_function_name:
if (self.reasoning_parser and not reasoning_end_arr[i] if (self.reasoning_parser and not reasoning_end_arr[i]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment