Unverified commit 0e959161, authored by Andrew Xia, committed by GitHub
Browse files

[responsesAPI] parser.extract_response_outputs can take in token IDs (#37130)


Signed-off-by: Andrew Xia <axia@meta.com>
parent ce2ef42f
...@@ -1012,6 +1012,7 @@ class OpenAIServingResponses(OpenAIServing): ...@@ -1012,6 +1012,7 @@ class OpenAIServingResponses(OpenAIServing):
parser = self.parser(tokenizer) parser = self.parser(tokenizer)
return parser.extract_response_outputs( return parser.extract_response_outputs(
model_output=final_output.text, model_output=final_output.text,
model_output_token_ids=final_output.token_ids,
request=request, request=request,
enable_auto_tools=self.enable_auto_tools, enable_auto_tools=self.enable_auto_tools,
tool_call_id_type=self.tool_call_id_type, tool_call_id_type=self.tool_call_id_type,
......
...@@ -155,7 +155,9 @@ class Parser: ...@@ -155,7 +155,9 @@ class Parser:
@abstractmethod @abstractmethod
def extract_response_outputs( def extract_response_outputs(
self, self,
*,
model_output: str, model_output: str,
model_output_token_ids: Sequence[int],
request: ResponsesRequest, request: ResponsesRequest,
enable_auto_tools: bool = False, enable_auto_tools: bool = False,
tool_call_id_type: str = "random", tool_call_id_type: str = "random",
...@@ -170,6 +172,7 @@ class Parser: ...@@ -170,6 +172,7 @@ class Parser:
Args: Args:
model_output: The complete model-generated string. model_output: The complete model-generated string.
model_output_token_ids: The token IDs of the model output.
request: The request object used to generate the output. request: The request object used to generate the output.
enable_auto_tools: Whether to enable automatic tool call parsing. enable_auto_tools: Whether to enable automatic tool call parsing.
tool_call_id_type: Type of tool call ID generation ("random", etc). tool_call_id_type: Type of tool call ID generation ("random", etc).
...@@ -313,7 +316,9 @@ class DelegatingParser(Parser): ...@@ -313,7 +316,9 @@ class DelegatingParser(Parser):
def extract_response_outputs( def extract_response_outputs(
self, self,
*,
model_output: str, model_output: str,
model_output_token_ids: Sequence[int],
request: ResponsesRequest, request: ResponsesRequest,
enable_auto_tools: bool = False, enable_auto_tools: bool = False,
tool_call_id_type: str = "random", tool_call_id_type: str = "random",
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment