"lib/runtime/src/vscode:/vscode.git/clone" did not exist on "31b78e96374545efd452cbea7f06ecc3d7a281f4"
Unverified commit 93d364da, authored by Pernekhan Utemuratov and committed by GitHub
Browse files

[Bugfix] Include encoder prompts len to non-stream api usage response (#8861)

parent d9cfbc89
......@@ -726,6 +726,8 @@ class OpenAIServingChat(OpenAIServing):
assert final_res.prompt_token_ids is not None
num_prompt_tokens = len(final_res.prompt_token_ids)
if final_res.encoder_prompt_token_ids is not None:
num_prompt_tokens += len(final_res.encoder_prompt_token_ids)
num_generated_tokens = sum(
len(output.token_ids) for output in final_res.outputs)
usage = UsageInfo(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment