Unverified commit fa45ff1f, authored by Hongkuan Zhou, committed by GitHub
Browse files

fix: revert change to aiperf output format (#3837)


Signed-off-by: hongkuanz <hongkuanz@nvidia.com>
parent c6b59045
...@@ -208,16 +208,11 @@ class LoadGenerator: ...@@ -208,16 +208,11 @@ class LoadGenerator:
logger.info(f"Parsing results from: {results_file}") logger.info(f"Parsing results from: {results_file}")
with open(results_file, "r") as f: with open(results_file, "r") as f:
data = json.load(f) metrics = json.load(f)
# aiperf now wraps metrics under "records" key
metrics = data.get("records", data)
results = { results = {
"throughput": metrics.get("output_token_throughput", {}).get("avg", 0), "throughput": metrics.get("output_token_throughput", {}).get("avg", 0),
"ttft_mean": metrics.get("ttft", {}).get( "ttft_mean": metrics.get("time_to_first_token", {}).get("avg", 0),
"avg", 0
), # Changed from "time_to_first_token"
"itl_mean": metrics.get("inter_token_latency", {}).get("avg", 0), "itl_mean": metrics.get("inter_token_latency", {}).get("avg", 0),
"end_to_end_latency_mean": metrics.get("request_latency", {}).get( "end_to_end_latency_mean": metrics.get("request_latency", {}).get(
"avg", 0 "avg", 0
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment