Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
jerrrrry
easystart_v0.1
Commits
7e7f98ea
Commit
7e7f98ea
authored
Jun 06, 2025
by
jerrrrry
Browse files
Update benchmark_throughput.py
parent
d6886707
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing 1 changed file with 6 additions and 6 deletions
+6
-6
2_env_check&model_download&llm_inference/scripts/benchmark_throughput.py
...el_download&llm_inference/scripts/benchmark_throughput.py
+6
-6
No files found.
2_env_check&model_download&llm_inference/scripts/benchmark_throughput.py
View file @
7e7f98ea
...
...
@@ -294,9 +294,9 @@ def run_vllm(
     info["ttft_median"] = np.around(np.median(total_ttfts or 0), 5)
     info["ttft_p99"] = np.around(np.percentile(total_ttfts or 0, 99), 5)
-    info["tpop_mean"] = np.around(np.mean(total_tpops), 4)
-    info["tpop_median"] = np.around(np.median(total_tpops or 0), 5)
-    info["tpop_p99"] = np.around(np.percentile(total_tpops or 0, 99), 5)
+    info["tpot_mean"] = np.around(np.mean(total_tpops), 4)
+    info["tpot_median"] = np.around(np.median(total_tpops or 0), 5)
+    info["tpot_p99"] = np.around(np.percentile(total_tpops or 0, 99), 5)
     info["output_token_throughput_mean"] = np.around(np.mean(total_output_token_throughput), 2)
     info["output_token_throughput_median"] = np.around(np.median(total_output_token_throughput or 0), 2)
...
...
@@ -319,9 +319,9 @@ def run_vllm(
     print(f"TTFT_mean: {info['ttft_mean'] * 1000:.2f}ms")  # 首字延时
     print(f"ttft_p99: {info['ttft_p99'] * 1000:.2f}ms")
     print(f"ttft_median: {info['ttft_median'] * 1000:.2f}ms")
-    print(f"TPOP_mean: {info['tpop_mean'] * 1000:.2f}ms")  # 单字decode时间
-    print(f"tpop_median: {info['tpop_median'] * 1000:.2f}ms")
-    print(f"tpop_p99: {info['tpop_p99'] * 1000:.2f}ms")
+    print(f"TPOT_mean: {info['tpop_mean'] * 1000:.2f}ms")  # 单字decode时间
+    print(f"tpot_median: {info['tpop_median'] * 1000:.2f}ms")
+    print(f"tpot_p99: {info['tpop_p99'] * 1000:.2f}ms")
     print(f"output_token_throughput_mean: {info['output_token_throughput_mean']:.2f} tokens/s")  # 单路生成吞吐
     print(f"output_token_throughput_median: {info['output_token_throughput_median']:.2f} tokens/s")
     print(f"output_token_throughput_p99: {info['output_token_throughput_p99']:.2f} tokens/s")
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment