"vscode:/vscode.git/clone" did not exist on "4c1c501a7ee1d5efbad945ea62a702ce5cefb799"
Unverified commit add4b0ca, authored by Vensen, committed by GitHub
Browse files

[Bugfix][benchmarks] Fix input token calculation for rerank benchmark metrics (#30596)


Signed-off-by: vensen <vensenmu@gmail.com>
parent ae88aada
...@@ -235,7 +235,9 @@ async def get_request( ...@@ -235,7 +235,9 @@ async def get_request(
def calculate_metrics_for_embeddings( def calculate_metrics_for_embeddings(
outputs: list[RequestFuncOutput], dur_s: float, selected_percentiles: list[float] outputs: list[RequestFuncOutput],
dur_s: float,
selected_percentiles: list[float],
) -> EmbedBenchmarkMetrics: ) -> EmbedBenchmarkMetrics:
"""Calculate the metrics for the embedding requests. """Calculate the metrics for the embedding requests.
......
...@@ -120,6 +120,7 @@ class RerankResult(BaseModel): ...@@ -120,6 +120,7 @@ class RerankResult(BaseModel):
class RerankUsage(BaseModel): class RerankUsage(BaseModel):
prompt_tokens: int
total_tokens: int total_tokens: int
......
...@@ -502,5 +502,7 @@ class ServingScores(OpenAIServing): ...@@ -502,5 +502,7 @@ class ServingScores(OpenAIServing):
id=request_id, id=request_id,
model=model_name, model=model_name,
results=results, results=results,
usage=RerankUsage(total_tokens=num_prompt_tokens), usage=RerankUsage(
total_tokens=num_prompt_tokens, prompt_tokens=num_prompt_tokens
),
) )
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment