Unverified Commit 424848d2 authored by Mick's avatar Mick Committed by GitHub
Browse files

fix: remove dependency on latest transformers impl (#3635)

parent e5ce395a
...@@ -48,13 +48,16 @@ from transformers.image_utils import ( ...@@ -48,13 +48,16 @@ from transformers.image_utils import (
validate_preprocess_arguments, validate_preprocess_arguments,
) )
from transformers.modeling_rope_utils import rope_config_validation from transformers.modeling_rope_utils import rope_config_validation
from transformers.models.mllama.image_processing_mllama import is_valid_list_of_images
from transformers.models.qwen2_vl.image_processing_qwen2_vl import smart_resize from transformers.models.qwen2_vl.image_processing_qwen2_vl import smart_resize
from transformers.processing_utils import ProcessingKwargs, Unpack, VideosKwargs from transformers.processing_utils import ProcessingKwargs, Unpack, VideosKwargs
from transformers.tokenization_utils_base import PreTokenizedInput, TextInput from transformers.tokenization_utils_base import PreTokenizedInput, TextInput
from transformers.utils.constants import OPENAI_CLIP_MEAN, OPENAI_CLIP_STD from transformers.utils.constants import OPENAI_CLIP_MEAN, OPENAI_CLIP_STD
def is_valid_list_of_images(images: List) -> bool:
    """Return True when *images* is a non-empty list of valid images.

    This is a local definition of the helper that was previously imported
    from ``transformers.models.mllama.image_processing_mllama``, so this
    module does not depend on that import being available.

    Args:
        images: Candidate list of images. A falsy value (``None`` or an
            empty list) is treated as invalid.

    Returns:
        ``True`` if *images* is non-empty and every element passes
        ``is_valid_image``; ``False`` otherwise.
    """
    # Coerce to bool so a falsy input is reported as False instead of being
    # returned to the caller as-is (``[]`` / ``None``).
    return bool(images) and all(is_valid_image(image) for image in images)
class Qwen2_5_VLVisionConfig(PretrainedConfig): class Qwen2_5_VLVisionConfig(PretrainedConfig):
model_type = "qwen2_5_vl" model_type = "qwen2_5_vl"
base_config_key = "vision_config" base_config_key = "vision_config"
...@@ -999,5 +1002,5 @@ class Qwen2_5_VLImageProcessor(BaseImageProcessor): ...@@ -999,5 +1002,5 @@ class Qwen2_5_VLImageProcessor(BaseImageProcessor):
return BatchFeature(data=data, tensor_type=return_tensors) return BatchFeature(data=data, tensor_type=return_tensors)
AutoImageProcessor.register(Qwen2_5_VLConfig, Qwen2_5_VLImageProcessor) AutoImageProcessor.register(Qwen2_5_VLConfig, None, Qwen2_5_VLImageProcessor, None)
AutoProcessor.register(Qwen2_5_VLConfig, Qwen2_5_VLProcessor) AutoProcessor.register(Qwen2_5_VLConfig, Qwen2_5_VLProcessor)
...@@ -559,7 +559,6 @@ class Qwen2VLForConditionalGeneration(nn.Module): ...@@ -559,7 +559,6 @@ class Qwen2VLForConditionalGeneration(nn.Module):
] ]
image_embeds_offset += num_image_tokens image_embeds_offset += num_image_tokens
input_ids = None
hidden_states = self.model( hidden_states = self.model(
input_ids=input_ids, input_ids=input_ids,
positions=positions, positions=positions,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment