Unverified Commit de3ca70b authored by Biswa Panda, committed by GitHub
Browse files

feat: update benchmarking script to use aiperf (#3306)


Signed-off-by: Biswa Panda <biswa.panda@gmail.com>
Signed-off-by: lkomali <lkomali@nvidia.com>
Co-authored-by: lkomali <lkomali@nvidia.com>
Co-authored-by: Harshini Komali <157742537+lkomali@users.noreply.github.com>
parent 9b0948c6
@@ -38,7 +38,7 @@ spec:
 mkdir -p "$ARTIFACT_DIR"
 echo "Running benchmark..."
 export COLUMNS=200
-genai-perf profile \
+aiperf profile \
 --model "$TARGET_MODEL" \
 --tokenizer ~/.cache/huggingface/hub/models--RedHatAI--Llama-3.3-70B-Instruct-FP8-dynamic/snapshots/ddb4128556dfcff99e0c41aee159ea6c3e655dcd \
 --endpoint-type chat --url "$ENDPOINT" --streaming \
@@ -58,10 +58,10 @@ spec:
 --num-dataset-entries=3000 -- \
 --max-threads 64
 echo "----------------json----------------"
-PERF_JSON=$(find $ARTIFACT_DIR -name profile_export_genai_perf.json)
+PERF_JSON=$(find $ARTIFACT_DIR -name profile_export_aiperf.json)
 cat $PERF_JSON | jq .
 echo "----------------csv-----------------"
-PERF_CSV=$(find $ARTIFACT_DIR -name profile_export_genai_perf.csv)
+PERF_CSV=$(find $ARTIFACT_DIR -name profile_export_aiperf.csv)
 cat $PERF_CSV
 echo "Benchmark completed successfully!"
 volumeMounts:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment