Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
819a309c
Unverified
Commit
819a309c
authored
Apr 04, 2024
by
Chang Su
Committed by
GitHub
Apr 04, 2024
Browse files
[Bugfix] Fix args in benchmark_serving (#3836)
Co-authored-by: Roger Wang <ywang@roblox.com>
parent
aabe8f40
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing 1 changed file with 13 additions and 10 deletions
+13
-10
benchmarks/benchmark_serving.py
benchmarks/benchmark_serving.py
+13
-10
No files found.
benchmarks/benchmark_serving.py
View file @
819a309c
...
@@ -110,7 +110,9 @@ def sample_sonnet_requests(
...
@@ -110,7 +110,9 @@ def sample_sonnet_requests(
prefix_len
:
int
,
prefix_len
:
int
,
tokenizer
:
PreTrainedTokenizerBase
,
tokenizer
:
PreTrainedTokenizerBase
,
)
->
List
[
Tuple
[
str
,
str
,
int
,
int
]]:
)
->
List
[
Tuple
[
str
,
str
,
int
,
int
]]:
assert
input_len
>
prefix_len
,
"input_len must be greater than prefix_len."
assert
(
input_len
>
prefix_len
),
"'args.sonnet-input-len' must be greater than 'args.prefix-input-len'."
# Load the dataset.
# Load the dataset.
with
open
(
dataset_path
)
as
f
:
with
open
(
dataset_path
)
as
f
:
...
@@ -131,8 +133,9 @@ def sample_sonnet_requests(
...
@@ -131,8 +133,9 @@ def sample_sonnet_requests(
base_message
,
add_generation_prompt
=
True
,
tokenize
=
False
)
base_message
,
add_generation_prompt
=
True
,
tokenize
=
False
)
base_prompt_offset
=
len
(
tokenizer
(
base_prompt_formatted
).
input_ids
)
base_prompt_offset
=
len
(
tokenizer
(
base_prompt_formatted
).
input_ids
)
assert (
    input_len > base_prompt_offset
), f"Please set 'args.input-len' higher than {base_prompt_offset}."
assert (
    input_len > base_prompt_offset
), f"Please set 'args.sonnet-input-len' higher than {base_prompt_offset}."
num_input_lines
=
round
(
num_input_lines
=
round
(
(
input_len
-
base_prompt_offset
)
/
average_poem_len
)
(
input_len
-
base_prompt_offset
)
/
average_poem_len
)
...
@@ -140,7 +143,7 @@ def sample_sonnet_requests(
...
@@ -140,7 +143,7 @@ def sample_sonnet_requests(
# prompt are fixed poem lines.
# prompt are fixed poem lines.
assert (
    prefix_len > base_prompt_offset
), f"Please set 'args.prefix-len' higher than {base_prompt_offset}."
assert (
    prefix_len > base_prompt_offset
), f"Please set 'args.sonnet-prefix-len' higher than {base_prompt_offset}."
num_prefix_lines
=
round
(
num_prefix_lines
=
round
(
(
prefix_len
-
base_prompt_offset
)
/
average_poem_len
)
(
prefix_len
-
base_prompt_offset
)
/
average_poem_len
)
...
@@ -373,9 +376,9 @@ def main(args: argparse.Namespace):
...
@@ -373,9 +376,9 @@ def main(args: argparse.Namespace):
input_requests
=
sample_sonnet_requests
(
input_requests
=
sample_sonnet_requests
(
dataset_path
=
args
.
dataset_path
,
dataset_path
=
args
.
dataset_path
,
num_requests
=
args
.
num_prompts
,
num_requests
=
args
.
num_prompts
,
input_len
=
args
.
input_len
,
input_len
=
args
.
sonnet_
input_len
,
output_len
=
args
.
output_len
,
output_len
=
args
.
sonnet_
output_len
,
prefix_len
=
args
.
prefix_len
,
prefix_len
=
args
.
sonnet_
prefix_len
,
tokenizer
=
tokenizer
,
tokenizer
=
tokenizer
,
)
)
input_requests
=
[(
prompt
,
prompt_len
,
output_len
)
input_requests
=
[(
prompt
,
prompt_len
,
output_len
)
...
@@ -388,9 +391,9 @@ def main(args: argparse.Namespace):
...
@@ -388,9 +391,9 @@ def main(args: argparse.Namespace):
input_requests
=
sample_sonnet_requests
(
input_requests
=
sample_sonnet_requests
(
dataset_path
=
args
.
dataset_path
,
dataset_path
=
args
.
dataset_path
,
num_requests
=
args
.
num_prompts
,
num_requests
=
args
.
num_prompts
,
input_len
=
args
.
input_len
,
input_len
=
args
.
sonnet_
input_len
,
output_len
=
args
.
output_len
,
output_len
=
args
.
sonnet_
output_len
,
prefix_len
=
args
.
prefix_len
,
prefix_len
=
args
.
sonnet_
prefix_len
,
tokenizer
=
tokenizer
,
tokenizer
=
tokenizer
,
)
)
input_requests
=
[(
prompt_formatted
,
prompt_len
,
output_len
)
input_requests
=
[(
prompt_formatted
,
prompt_len
,
output_len
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment