Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
edce722e
Unverified
Commit
edce722e
authored
Jan 15, 2025
by
Joe Runde
Committed by
GitHub
Jan 16, 2025
Browse files
[Bugfix] use right truncation for non-generative tasks (#12050)
Signed-off-by:
Joe Runde
<
Joseph.Runde@ibm.com
>
parent
57e729e8
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
13 additions
and
1 deletion
+13
-1
tests/entrypoints/llm/test_encode.py
tests/entrypoints/llm/test_encode.py
+7
-0
vllm/config.py
vllm/config.py
+4
-0
vllm/transformers_utils/tokenizer_group/__init__.py
vllm/transformers_utils/tokenizer_group/__init__.py
+2
-1
No files found.
tests/entrypoints/llm/test_encode.py
View file @
edce722e
...
@@ -105,3 +105,10 @@ def test_multiple_pooling_params(llm: LLM):
...
@@ -105,3 +105,10 @@ def test_multiple_pooling_params(llm: LLM):
# pooling_params is None, default params should be applied
# pooling_params is None, default params should be applied
outputs
=
llm
.
encode
(
PROMPTS
,
pooling_params
=
None
)
outputs
=
llm
.
encode
(
PROMPTS
,
pooling_params
=
None
)
assert
len
(
PROMPTS
)
==
len
(
outputs
)
assert
len
(
PROMPTS
)
==
len
(
outputs
)
@
pytest
.
mark
.
skip_global_cleanup
def
test_right_side_truncation
(
llm
:
LLM
):
# Embeddings models should truncate the end of the prompt
tokenizer
=
llm
.
get_tokenizer
()
assert
tokenizer
.
truncation_side
==
"right"
vllm/config.py
View file @
edce722e
...
@@ -357,6 +357,10 @@ class ModelConfig:
...
@@ -357,6 +357,10 @@ class ModelConfig:
supported_tasks
,
task
=
self
.
_resolve_task
(
task
,
self
.
hf_config
)
supported_tasks
,
task
=
self
.
_resolve_task
(
task
,
self
.
hf_config
)
self
.
supported_tasks
=
supported_tasks
self
.
supported_tasks
=
supported_tasks
self
.
task
:
Final
=
task
self
.
task
:
Final
=
task
if
self
.
task
in
(
"draft"
,
"generate"
):
self
.
truncation_side
=
"left"
else
:
self
.
truncation_side
=
"right"
self
.
pooler_config
=
self
.
_init_pooler_config
(
override_pooler_config
)
self
.
pooler_config
=
self
.
_init_pooler_config
(
override_pooler_config
)
self
.
logits_processor_pattern
=
logits_processor_pattern
self
.
logits_processor_pattern
=
logits_processor_pattern
...
...
vllm/transformers_utils/tokenizer_group/__init__.py
View file @
edce722e
...
@@ -24,7 +24,8 @@ def init_tokenizer_from_configs(model_config: ModelConfig,
...
@@ -24,7 +24,8 @@ def init_tokenizer_from_configs(model_config: ModelConfig,
max_input_length
=
None
,
max_input_length
=
None
,
tokenizer_mode
=
model_config
.
tokenizer_mode
,
tokenizer_mode
=
model_config
.
tokenizer_mode
,
trust_remote_code
=
model_config
.
trust_remote_code
,
trust_remote_code
=
model_config
.
trust_remote_code
,
revision
=
model_config
.
tokenizer_revision
)
revision
=
model_config
.
tokenizer_revision
,
truncation_side
=
model_config
.
truncation_side
)
return
get_tokenizer_group
(
parallel_config
.
tokenizer_pool_config
,
return
get_tokenizer_group
(
parallel_config
.
tokenizer_pool_config
,
**
init_kwargs
)
**
init_kwargs
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment