Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
5d264f4a
Unverified
Commit
5d264f4a
authored
Oct 15, 2024
by
Grace Ho
Committed by
GitHub
Oct 15, 2024
Browse files
pass ignore_eos parameter to all benchmark_serving calls (#9349)
parent
e9d517f2
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
18 additions
and
20 deletions
+18
-20
benchmarks/benchmark_serving.py
benchmarks/benchmark_serving.py
+18
-20
No files found.
benchmarks/benchmark_serving.py
View file @
5d264f4a
...
@@ -431,16 +431,15 @@ async def benchmark(
...
@@ -431,16 +431,15 @@ async def benchmark(
if
profile
:
if
profile
:
print
(
"Starting profiler..."
)
print
(
"Starting profiler..."
)
profile_input
=
RequestFuncInput
(
profile_input
=
RequestFuncInput
(
model
=
model_id
,
model
=
model_id
,
prompt
=
test_prompt
,
prompt
=
test_prompt
,
api_url
=
base_url
+
"/start_profile"
,
api_url
=
base_url
+
"/start_profile"
,
prompt_len
=
test_prompt_len
,
prompt_len
=
test_prompt_len
,
output_len
=
test_output_len
,
output_len
=
test_output_len
,
logprobs
=
logprobs
,
logprobs
=
logprobs
,
best_of
=
best_of
,
best_of
=
best_of
,
multi_modal_content
=
test_mm_content
,
multi_modal_content
=
test_mm_content
,
ignore_eos
=
ignore_eos
)
)
profile_output
=
await
request_func
(
request_func_input
=
profile_input
)
profile_output
=
await
request_func
(
request_func_input
=
profile_input
)
if
profile_output
.
success
:
if
profile_output
.
success
:
print
(
"Profiler started"
)
print
(
"Profiler started"
)
...
@@ -453,16 +452,15 @@ async def benchmark(
...
@@ -453,16 +452,15 @@ async def benchmark(
tasks
:
List
[
asyncio
.
Task
]
=
[]
tasks
:
List
[
asyncio
.
Task
]
=
[]
async
for
request
in
get_request
(
input_requests
,
request_rate
):
async
for
request
in
get_request
(
input_requests
,
request_rate
):
prompt
,
prompt_len
,
output_len
,
mm_content
=
request
prompt
,
prompt_len
,
output_len
,
mm_content
=
request
request_func_input
=
RequestFuncInput
(
request_func_input
=
RequestFuncInput
(
model
=
model_id
,
model
=
model_id
,
prompt
=
prompt
,
prompt
=
prompt
,
api_url
=
api_url
,
api_url
=
api_url
,
prompt_len
=
prompt_len
,
prompt_len
=
prompt_len
,
output_len
=
output_len
,
output_len
=
output_len
,
logprobs
=
logprobs
,
logprobs
=
logprobs
,
best_of
=
best_of
,
best_of
=
best_of
,
multi_modal_content
=
mm_content
,
multi_modal_content
=
mm_content
,
ignore_eos
=
ignore_eos
)
)
tasks
.
append
(
tasks
.
append
(
asyncio
.
create_task
(
asyncio
.
create_task
(
request_func
(
request_func_input
=
request_func_input
,
request_func
(
request_func_input
=
request_func_input
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment