Unverified commit 541d1df4, authored by Cyrus Leung, committed by GitHub
Browse files

[Bugfix] `embed_is_patch` for Idefics3 (#15696)


Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
parent 3b00ff91
...@@ -24,7 +24,6 @@ ...@@ -24,7 +24,6 @@
from typing import Iterable, Optional, Set, Tuple, Union from typing import Iterable, Optional, Set, Tuple, Union
import torch import torch
import torch.utils.checkpoint
from torch import nn from torch import nn
from transformers import CohereConfig from transformers import CohereConfig
......
This diff is collapsed.
...@@ -21,7 +21,6 @@ from typing import List, Literal, Optional, Set, Tuple, TypedDict, Union ...@@ -21,7 +21,6 @@ from typing import List, Literal, Optional, Set, Tuple, TypedDict, Union
import numpy as np import numpy as np
import torch import torch
import torch.nn.functional as F import torch.nn.functional as F
import torch.utils.checkpoint
import transformers.models.mllama.configuration_mllama as config_mllama import transformers.models.mllama.configuration_mllama as config_mllama
from PIL.Image import Image from PIL.Image import Image
from torch import nn from torch import nn
......
...@@ -160,7 +160,7 @@ class Qwen2AudioMultiModalProcessor( ...@@ -160,7 +160,7 @@ class Qwen2AudioMultiModalProcessor(
mm_kwargs: Mapping[str, Any], mm_kwargs: Mapping[str, Any],
) -> BatchFeature: ) -> BatchFeature:
# Text-only input not supported in composite processor # Text-only input not supported in composite processor
if not mm_data or not mm_data.get("audios", []): if not mm_data.get("audios", []):
prompt_ids = self.info.get_tokenizer().encode(prompt) prompt_ids = self.info.get_tokenizer().encode(prompt)
prompt_ids = self._apply_hf_processor_tokens_only(prompt_ids) prompt_ids = self._apply_hf_processor_tokens_only(prompt_ids)
return BatchFeature(dict(input_ids=[prompt_ids]), tensor_type="pt") return BatchFeature(dict(input_ids=[prompt_ids]), tensor_type="pt")
......
...@@ -8,7 +8,6 @@ from functools import cached_property ...@@ -8,7 +8,6 @@ from functools import cached_property
from typing import Any, Literal, Optional, Set, Tuple, TypedDict, Union from typing import Any, Literal, Optional, Set, Tuple, TypedDict, Union
import torch import torch
import torch.utils.checkpoint
from torch import nn from torch import nn
from torch.nn import functional as F from torch.nn import functional as F
from transformers import BatchFeature, ProcessorMixin from transformers import BatchFeature, ProcessorMixin
...@@ -160,7 +159,7 @@ class UltravoxMultiModalProcessor( ...@@ -160,7 +159,7 @@ class UltravoxMultiModalProcessor(
mm_kwargs: Mapping[str, object], mm_kwargs: Mapping[str, object],
) -> BatchFeature: ) -> BatchFeature:
# Text-only input not supported in composite processor # Text-only input not supported in composite processor
if not mm_data or not mm_data.get("audios", []): if not mm_data.get("audios", []):
prompt_ids = self.info.get_tokenizer().encode( prompt_ids = self.info.get_tokenizer().encode(
prompt, add_special_tokens=False) prompt, add_special_tokens=False)
prompt_ids = self._apply_hf_processor_tokens_only(prompt_ids) prompt_ids = self._apply_hf_processor_tokens_only(prompt_ids)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment