Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
3b00b9c2
Unverified
Commit
3b00b9c2
authored
Sep 27, 2024
by
Cyrus Leung
Committed by
GitHub
Sep 26, 2024
Browse files
[Core] rename `PromptInputs` and `inputs` (#8876)
parent
344cd2b6
Changes
21
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
43 additions
and
43 deletions
+43
-43
vllm/inputs/preprocess.py
vllm/inputs/preprocess.py
+43
-43
No files found.
vllm/inputs/preprocess.py
View file @
3b00b9c2
...
@@ -10,8 +10,8 @@ from vllm.prompt_adapter.request import PromptAdapterRequest
...
@@ -10,8 +10,8 @@ from vllm.prompt_adapter.request import PromptAdapterRequest
from
vllm.transformers_utils.tokenizer_group
import
BaseTokenizerGroup
from
vllm.transformers_utils.tokenizer_group
import
BaseTokenizerGroup
from
vllm.utils
import
print_warning_once
from
vllm.utils
import
print_warning_once
from
.data
import
(
EncoderDecoderLLMInputs
,
LLMInputs
,
Prompt
Inputs
,
from
.data
import
(
EncoderDecoderLLMInputs
,
LLMInputs
,
Prompt
Type
,
SingletonPrompt
Inputs
)
SingletonPrompt
)
from
.parse
import
is_explicit_encoder_decoder_prompt
,
parse_singleton_prompt
from
.parse
import
is_explicit_encoder_decoder_prompt
,
parse_singleton_prompt
if
TYPE_CHECKING
:
if
TYPE_CHECKING
:
...
@@ -209,7 +209,7 @@ class InputPreprocessor:
...
@@ -209,7 +209,7 @@ class InputPreprocessor:
def
_extract_prompt_components
(
def
_extract_prompt_components
(
self
,
self
,
inputs
:
SingletonPrompt
Inputs
,
prompt
:
SingletonPrompt
,
request_id
:
str
,
request_id
:
str
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
)
->
PromptComponents
:
)
->
PromptComponents
:
...
@@ -219,7 +219,7 @@ class InputPreprocessor:
...
@@ -219,7 +219,7 @@ class InputPreprocessor:
Arguments:
Arguments:
* request_id
* request_id
*
inputs
: single encoder or decoder input prompt
*
prompt
: single encoder or decoder input prompt
* lora_request: this is only valid for decoder prompts
* lora_request: this is only valid for decoder prompts
Returns:
Returns:
...
@@ -229,24 +229,24 @@ class InputPreprocessor:
...
@@ -229,24 +229,24 @@ class InputPreprocessor:
* multi_modal_data
* multi_modal_data
'''
'''
parsed
=
parse_singleton_prompt
(
inputs
)
parsed
=
parse_singleton_prompt
(
prompt
)
if
parsed
[
"type"
]
==
"str"
:
if
parsed
[
"type"
]
==
"str"
:
prompt
=
parsed
[
"content"
]
prompt
_text
=
parsed
[
"content"
]
prompt_token_ids
=
self
.
_tokenize_prompt
(
prompt_token_ids
=
self
.
_tokenize_prompt
(
prompt
,
prompt
_text
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
)
)
multi_modal_data
=
None
multi_modal_data
=
None
elif
parsed
[
"type"
]
==
"tokens"
:
elif
parsed
[
"type"
]
==
"tokens"
:
prompt
=
None
prompt
_text
=
None
prompt_token_ids
=
parsed
[
"content"
][
"prompt_token_ids"
]
prompt_token_ids
=
parsed
[
"content"
][
"prompt_token_ids"
]
multi_modal_data
=
parsed
[
"content"
].
get
(
"multi_modal_data"
)
multi_modal_data
=
parsed
[
"content"
].
get
(
"multi_modal_data"
)
elif
parsed
[
"type"
]
==
"text"
:
elif
parsed
[
"type"
]
==
"text"
:
prompt
=
parsed
[
"content"
][
"prompt"
]
prompt
_text
=
parsed
[
"content"
][
"prompt"
]
prompt_token_ids
=
self
.
_tokenize_prompt
(
prompt_token_ids
=
self
.
_tokenize_prompt
(
prompt
,
prompt
_text
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
)
)
...
@@ -254,33 +254,33 @@ class InputPreprocessor:
...
@@ -254,33 +254,33 @@ class InputPreprocessor:
else
:
else
:
assert_never
(
parsed
)
assert_never
(
parsed
)
return
prompt
,
prompt_token_ids
,
multi_modal_data
return
prompt
_text
,
prompt_token_ids
,
multi_modal_data
async
def
_extract_prompt_components_async
(
async
def
_extract_prompt_components_async
(
self
,
self
,
inputs
:
SingletonPrompt
Inputs
,
prompt
:
SingletonPrompt
,
request_id
:
str
,
request_id
:
str
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
)
->
PromptComponents
:
)
->
PromptComponents
:
"""Async version of :meth:`_extract_prompt_components`."""
"""Async version of :meth:`_extract_prompt_components`."""
parsed
=
parse_singleton_prompt
(
inputs
)
parsed
=
parse_singleton_prompt
(
prompt
)
if
parsed
[
"type"
]
==
"str"
:
if
parsed
[
"type"
]
==
"str"
:
prompt
=
parsed
[
"content"
]
prompt
_text
=
parsed
[
"content"
]
prompt_token_ids
=
await
self
.
_tokenize_prompt_async
(
prompt_token_ids
=
await
self
.
_tokenize_prompt_async
(
prompt
,
prompt
_text
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
)
)
multi_modal_data
=
None
multi_modal_data
=
None
elif
parsed
[
"type"
]
==
"tokens"
:
elif
parsed
[
"type"
]
==
"tokens"
:
prompt
=
None
prompt
_text
=
None
prompt_token_ids
=
parsed
[
"content"
][
"prompt_token_ids"
]
prompt_token_ids
=
parsed
[
"content"
][
"prompt_token_ids"
]
multi_modal_data
=
parsed
[
"content"
].
get
(
"multi_modal_data"
)
multi_modal_data
=
parsed
[
"content"
].
get
(
"multi_modal_data"
)
elif
parsed
[
"type"
]
==
"text"
:
elif
parsed
[
"type"
]
==
"text"
:
prompt
=
parsed
[
"content"
][
"prompt"
]
prompt
_text
=
parsed
[
"content"
][
"prompt"
]
prompt_token_ids
=
await
self
.
_tokenize_prompt_async
(
prompt_token_ids
=
await
self
.
_tokenize_prompt_async
(
prompt
,
prompt
_text
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
)
)
...
@@ -288,7 +288,7 @@ class InputPreprocessor:
...
@@ -288,7 +288,7 @@ class InputPreprocessor:
else
:
else
:
assert_never
(
parsed
)
assert_never
(
parsed
)
return
prompt
,
prompt_token_ids
,
multi_modal_data
return
prompt
_text
,
prompt_token_ids
,
multi_modal_data
def
_build_enc_dec_llm_inputs
(
def
_build_enc_dec_llm_inputs
(
self
,
self
,
...
@@ -321,7 +321,7 @@ class InputPreprocessor:
...
@@ -321,7 +321,7 @@ class InputPreprocessor:
def
_process_encoder_decoder_prompt
(
def
_process_encoder_decoder_prompt
(
self
,
self
,
inputs
:
Prompt
Inputs
,
prompt
:
Prompt
Type
,
request_id
:
str
,
request_id
:
str
,
)
->
EncoderDecoderLLMInputs
:
)
->
EncoderDecoderLLMInputs
:
'''
'''
...
@@ -349,7 +349,7 @@ class InputPreprocessor:
...
@@ -349,7 +349,7 @@ class InputPreprocessor:
Arguments:
Arguments:
*
inputs
: an input prompt
*
prompt
: an input prompt
* request_id
* request_id
Returns:
Returns:
...
@@ -360,13 +360,13 @@ class InputPreprocessor:
...
@@ -360,13 +360,13 @@ class InputPreprocessor:
encoder_comps
:
PromptComponents
encoder_comps
:
PromptComponents
decoder_comps
:
DecoderPromptComponents
decoder_comps
:
DecoderPromptComponents
if
is_explicit_encoder_decoder_prompt
(
inputs
):
if
is_explicit_encoder_decoder_prompt
(
prompt
):
encoder_comps
=
self
.
_extract_prompt_components
(
encoder_comps
=
self
.
_extract_prompt_components
(
inputs
[
"encoder_prompt"
],
prompt
[
"encoder_prompt"
],
request_id
=
request_id
,
request_id
=
request_id
,
)
)
if
(
decoder_input
:
=
inputs
[
"decoder_prompt"
])
is
None
:
if
(
decoder_input
:
=
prompt
[
"decoder_prompt"
])
is
None
:
decoder_comps
=
None
,
None
,
None
decoder_comps
=
None
,
None
,
None
else
:
else
:
decoder_comps
=
self
.
_extract_prompt_components
(
decoder_comps
=
self
.
_extract_prompt_components
(
...
@@ -375,7 +375,7 @@ class InputPreprocessor:
...
@@ -375,7 +375,7 @@ class InputPreprocessor:
)
)
else
:
else
:
encoder_comps
=
self
.
_extract_prompt_components
(
encoder_comps
=
self
.
_extract_prompt_components
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
)
)
...
@@ -385,20 +385,20 @@ class InputPreprocessor:
...
@@ -385,20 +385,20 @@ class InputPreprocessor:
async
def
_process_encoder_decoder_prompt_async
(
async
def
_process_encoder_decoder_prompt_async
(
self
,
self
,
inputs
:
Prompt
Inputs
,
prompt
:
Prompt
Type
,
request_id
:
str
,
request_id
:
str
,
)
->
EncoderDecoderLLMInputs
:
)
->
EncoderDecoderLLMInputs
:
"""Async version of :meth:`_process_encoder_decoder_prompt`."""
"""Async version of :meth:`_process_encoder_decoder_prompt`."""
encoder_comps
:
PromptComponents
encoder_comps
:
PromptComponents
decoder_comps
:
DecoderPromptComponents
decoder_comps
:
DecoderPromptComponents
if
is_explicit_encoder_decoder_prompt
(
inputs
):
if
is_explicit_encoder_decoder_prompt
(
prompt
):
encoder_task
=
self
.
_extract_prompt_components_async
(
encoder_task
=
self
.
_extract_prompt_components_async
(
inputs
[
"encoder_prompt"
],
prompt
[
"encoder_prompt"
],
request_id
=
request_id
,
request_id
=
request_id
,
)
)
if
(
decoder_input
:
=
inputs
[
"decoder_prompt"
])
is
None
:
if
(
decoder_input
:
=
prompt
[
"decoder_prompt"
])
is
None
:
encoder_comps
=
await
encoder_task
encoder_comps
=
await
encoder_task
decoder_comps
=
None
,
None
,
None
decoder_comps
=
None
,
None
,
None
else
:
else
:
...
@@ -411,7 +411,7 @@ class InputPreprocessor:
...
@@ -411,7 +411,7 @@ class InputPreprocessor:
encoder_task
,
decoder_task
)
encoder_task
,
decoder_task
)
else
:
else
:
encoder_comps
=
await
self
.
_extract_prompt_components_async
(
encoder_comps
=
await
self
.
_extract_prompt_components_async
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
)
)
...
@@ -435,7 +435,7 @@ class InputPreprocessor:
...
@@ -435,7 +435,7 @@ class InputPreprocessor:
def
_process_decoder_only_prompt
(
def
_process_decoder_only_prompt
(
self
,
self
,
inputs
:
SingletonPrompt
Inputs
,
prompt
:
SingletonPrompt
,
request_id
:
str
,
request_id
:
str
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
...
@@ -446,7 +446,7 @@ class InputPreprocessor:
...
@@ -446,7 +446,7 @@ class InputPreprocessor:
Arguments:
Arguments:
*
inputs
: input prompt
*
prompt
: input prompt
* request_id
* request_id
* lora_request
* lora_request
* prompt_adapter_request
* prompt_adapter_request
...
@@ -457,7 +457,7 @@ class InputPreprocessor:
...
@@ -457,7 +457,7 @@ class InputPreprocessor:
'''
'''
prompt_comps
=
self
.
_extract_prompt_components
(
prompt_comps
=
self
.
_extract_prompt_components
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
)
)
...
@@ -469,14 +469,14 @@ class InputPreprocessor:
...
@@ -469,14 +469,14 @@ class InputPreprocessor:
async
def
_process_decoder_only_prompt_async
(
async
def
_process_decoder_only_prompt_async
(
self
,
self
,
inputs
:
SingletonPrompt
Inputs
,
prompt
:
SingletonPrompt
,
request_id
:
str
,
request_id
:
str
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
)
->
LLMInputs
:
)
->
LLMInputs
:
"""Async version of :meth:`_process_decoder_only_prompt`."""
"""Async version of :meth:`_process_decoder_only_prompt`."""
prompt_comps
=
await
self
.
_extract_prompt_components_async
(
prompt_comps
=
await
self
.
_extract_prompt_components_async
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
)
)
...
@@ -488,7 +488,7 @@ class InputPreprocessor:
...
@@ -488,7 +488,7 @@ class InputPreprocessor:
def
preprocess
(
def
preprocess
(
self
,
self
,
inputs
:
Prompt
Inputs
,
prompt
:
Prompt
Type
,
request_id
:
str
,
request_id
:
str
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
...
@@ -498,17 +498,17 @@ class InputPreprocessor:
...
@@ -498,17 +498,17 @@ class InputPreprocessor:
# Encoder-decoder model requires special mapping of
# Encoder-decoder model requires special mapping of
# input prompts to encoder & decoder
# input prompts to encoder & decoder
return
self
.
_process_encoder_decoder_prompt
(
return
self
.
_process_encoder_decoder_prompt
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
)
)
if
is_explicit_encoder_decoder_prompt
(
inputs
):
if
is_explicit_encoder_decoder_prompt
(
prompt
):
raise
ValueError
(
"Cannot pass encoder-decoder prompt "
raise
ValueError
(
"Cannot pass encoder-decoder prompt "
"to decoder-only models"
)
"to decoder-only models"
)
# Decoder-only operation
# Decoder-only operation
return
self
.
_process_decoder_only_prompt
(
return
self
.
_process_decoder_only_prompt
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
prompt_adapter_request
=
prompt_adapter_request
,
prompt_adapter_request
=
prompt_adapter_request
,
...
@@ -516,7 +516,7 @@ class InputPreprocessor:
...
@@ -516,7 +516,7 @@ class InputPreprocessor:
async
def
preprocess_async
(
async
def
preprocess_async
(
self
,
self
,
inputs
:
Prompt
Inputs
,
prompt
:
Prompt
Type
,
request_id
:
str
,
request_id
:
str
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
lora_request
:
Optional
[
LoRARequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
prompt_adapter_request
:
Optional
[
PromptAdapterRequest
]
=
None
,
...
@@ -526,17 +526,17 @@ class InputPreprocessor:
...
@@ -526,17 +526,17 @@ class InputPreprocessor:
# Encoder-decoder model requires special mapping of
# Encoder-decoder model requires special mapping of
# input prompts to encoder & decoder
# input prompts to encoder & decoder
return
await
self
.
_process_encoder_decoder_prompt_async
(
return
await
self
.
_process_encoder_decoder_prompt_async
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
)
)
if
is_explicit_encoder_decoder_prompt
(
inputs
):
if
is_explicit_encoder_decoder_prompt
(
prompt
):
raise
ValueError
(
"Cannot pass encoder-decoder prompt "
raise
ValueError
(
"Cannot pass encoder-decoder prompt "
"to decoder-only models"
)
"to decoder-only models"
)
# Decoder-only operation
# Decoder-only operation
return
await
self
.
_process_decoder_only_prompt_async
(
return
await
self
.
_process_decoder_only_prompt_async
(
inputs
,
prompt
,
request_id
=
request_id
,
request_id
=
request_id
,
lora_request
=
lora_request
,
lora_request
=
lora_request
,
prompt_adapter_request
=
prompt_adapter_request
,
prompt_adapter_request
=
prompt_adapter_request
,
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment