Unverified commit add4b0ca, authored by Vensen, committed by GitHub
Browse files

[Bugfix][benchmarks] Fix input token calculation for rerank benchmark metrics (#30596)


Signed-off-by: vensen <vensenmu@gmail.com>
parent ae88aada
......@@ -235,7 +235,9 @@ async def get_request(
def calculate_metrics_for_embeddings(
outputs: list[RequestFuncOutput], dur_s: float, selected_percentiles: list[float]
outputs: list[RequestFuncOutput],
dur_s: float,
selected_percentiles: list[float],
) -> EmbedBenchmarkMetrics:
"""Calculate the metrics for the embedding requests.
......
......@@ -120,6 +120,7 @@ class RerankResult(BaseModel):
class RerankUsage(BaseModel):
prompt_tokens: int
total_tokens: int
......
......@@ -502,5 +502,7 @@ class ServingScores(OpenAIServing):
id=request_id,
model=model_name,
results=results,
usage=RerankUsage(total_tokens=num_prompt_tokens),
usage=RerankUsage(
total_tokens=num_prompt_tokens, prompt_tokens=num_prompt_tokens
),
)
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment