Unverified Commit 59aab76f authored by Binyao Jiang's avatar Binyao Jiang Committed by GitHub
Browse files

Bug: Fix google gemma3n-mm audio input not working bug (#8365)

parent 659bfd10
...@@ -192,7 +192,12 @@ class BaseMultimodalProcessor(ABC): ...@@ -192,7 +192,12 @@ class BaseMultimodalProcessor(ABC):
# name of the feature filed # name of the feature filed
# TODO: pass from processors # TODO: pass from processors
self.FEATURE_NAMES = ["pixel_values", "pixel_values_videos", "audio_features"] self.FEATURE_NAMES = [
"pixel_values",
"pixel_values_videos",
"audio_features",
"input_features",
]
def process_mm_data( def process_mm_data(
self, input_text, images=None, videos=None, audios=None, **kwargs self, input_text, images=None, videos=None, audios=None, **kwargs
......
...@@ -171,6 +171,11 @@ class TestGemma3nServer(TestOpenAIVisionServer): ...@@ -171,6 +171,11 @@ class TestGemma3nServer(TestOpenAIVisionServer):
) )
cls.base_url += "/v1" cls.base_url += "/v1"
def test_audio_chat_completion(self):
self._test_audio_speech_completion()
# This _test_audio_ambient_completion test is way too complicated to pass for a small LLM
# self._test_audio_ambient_completion()
class TestKimiVLServer(TestOpenAIVisionServer): class TestKimiVLServer(TestOpenAIVisionServer):
@classmethod @classmethod
...@@ -252,9 +257,7 @@ class TestPhi4MMServer(TestOpenAIVisionServer): ...@@ -252,9 +257,7 @@ class TestPhi4MMServer(TestOpenAIVisionServer):
def test_audio_chat_completion(self): def test_audio_chat_completion(self):
self._test_audio_speech_completion() self._test_audio_speech_completion()
# TODO: currently phi4-mm cannot pass this test. # This _test_audio_ambient_completion test is way too complicated to pass for a small LLM
# We are investigating this issue.
# Response: La ciudad está situada en la costa este de la isla, en la desembocadura del río St. Lawrence.
# self._test_audio_ambient_completion() # self._test_audio_ambient_completion()
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment