Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
8625ec26
Unverified
Commit
8625ec26
authored
Apr 13, 2026
by
Nicolò Lucchesi
Committed by
GitHub
Apr 13, 2026
Browse files
[Misc] Multi-turn benchmark output performance json (#39572)
Signed-off-by:
NickLucche
<
nlucches@redhat.com
>
parent
995e9a20
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
19 additions
and
0 deletions
+19
-0
benchmarks/multi_turn/benchmark_serving_multi_turn.py
benchmarks/multi_turn/benchmark_serving_multi_turn.py
+19
-0
No files found.
benchmarks/multi_turn/benchmark_serving_multi_turn.py
View file @
8625ec26
...
@@ -1439,6 +1439,12 @@ async def main() -> None:
...
@@ -1439,6 +1439,12 @@ async def main() -> None:
action
=
"store_true"
,
action
=
"store_true"
,
help
=
"Export summary to Excel file (optional)"
,
help
=
"Export summary to Excel file (optional)"
,
)
)
parser
.
add_argument
(
"--stats-json-output"
,
type
=
str
,
default
=
None
,
help
=
"Export per-request stats (ttft_ms, tpot_ms, etc.) to a JSON file"
,
)
parser
.
add_argument
(
parser
.
add_argument
(
"-v"
,
"-v"
,
"--verbose"
,
"--verbose"
,
...
@@ -1651,6 +1657,19 @@ async def main() -> None:
...
@@ -1651,6 +1657,19 @@ async def main() -> None:
warmup_runtime_sec
=
warmup_runtime_sec
,
warmup_runtime_sec
=
warmup_runtime_sec
,
)
)
if
args
.
stats_json_output
is
not
None
:
# Export per-request metrics as a JSON array for downstream analysis.
stats_data
=
[
s
.
_asdict
()
for
s
in
client_metrics
]
logger
.
info
(
f
"
{
Color
.
GREEN
}
Writing per-request stats JSON: "
f
"
{
args
.
stats_json_output
}{
Color
.
RESET
}
"
)
os
.
makedirs
(
os
.
path
.
dirname
(
os
.
path
.
abspath
(
args
.
stats_json_output
)),
exist_ok
=
True
)
with
open
(
args
.
stats_json_output
,
"w"
)
as
f
:
json
.
dump
(
stats_data
,
f
,
indent
=
2
)
if
args
.
output_file
is
not
None
:
if
args
.
output_file
is
not
None
:
# Write a JSON file with the updated conversations
# Write a JSON file with the updated conversations
# The "assistant" content will contain the answers from the tested LLM
# The "assistant" content will contain the answers from the tested LLM
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment