[Enc-Dec] Fix OOT tokenizer issue (#30144)

Signed-off-by: NickLucche <nlucches@redhat.com>

[Enc-Dec] Fix OOT tokenizer issue (#30144)
Signed-off-by: NickLucche <nlucches@redhat.com>
bff78310 · Nicolò Lucchesi · GitHub · adb31506 · bff78310
Unverified commit bff78310, authored Dec 05, 2025 by Nicolò Lucchesi; committed by GitHub on Dec 05, 2025.
Hide whitespace changes
Inline Side-by-side

Showing with 4 additions and 3 deletions

vllm/inputs/preprocess.py +4 -3

No files found.
--- a/vllm/inputs/preprocess.py
+++ b/vllm/inputs/preprocess.py
@@ -198,7 +198,7 @@ class InputPreprocessor:
    ) -> dict[str, Any]:
        kwargs = dict[str, Any]()

-        if self.model_config.hf_config.model_type == "whisper":
+        if self.model_config.is_encoder_decoder:
            # For Whisper, special tokens should be provided by the user based
            # on the task and language of their request. Also needed to avoid
            # appending an EOS token to the prompt which disrupts generation.
@@ -573,7 +573,6 @@ class InputPreprocessor:
        """
        encoder_inputs: SingletonInputs
        decoder_inputs: SingletonInputs | None
-
        if is_explicit_encoder_decoder_prompt(prompt):
            # `cast` is needed for mypy, but not pyright
            prompt_ = cast(ExplicitEncoderDecoderPrompt, prompt)
@@ -585,7 +584,9 @@ class InputPreprocessor:
            if (decoder_input := prompt_["decoder_prompt"]) is None:
                decoder_inputs = None
            else:
-                decoder_inputs = self._prompt_to_llm_inputs(decoder_input)
+                decoder_inputs = self._prompt_to_llm_inputs(
+                    decoder_input, tokenization_kwargs=tokenization_kwargs
+                )
            # For multimodal model, override decoder prompt from processor
            # with explicit decoder prompt.
            if self.model_config.is_multimodal_model: