Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
change
sglang
Commits
59aab76f
"docs/vscode:/vscode.git/clone" did not exist on "7eb083c22112b67ee8ea43036479bb7680136349"
Unverified
Commit
59aab76f
authored
Jul 30, 2025
by
Binyao Jiang
Committed by
GitHub
Jul 30, 2025
Browse files
Bug: Fix google gemma3n-mm audio input not working bug (#8365)
parent
659bfd10
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
12 additions
and
4 deletions
+12
-4
python/sglang/srt/multimodal/processors/base_processor.py
python/sglang/srt/multimodal/processors/base_processor.py
+6
-1
test/srt/test_vision_openai_server_b.py
test/srt/test_vision_openai_server_b.py
+6
-3
No files found.
python/sglang/srt/multimodal/processors/base_processor.py
View file @
59aab76f
...
@@ -192,7 +192,12 @@ class BaseMultimodalProcessor(ABC):
...
@@ -192,7 +192,12 @@ class BaseMultimodalProcessor(ABC):
# name of the feature field
# name of the feature field
# TODO: pass from processors
# TODO: pass from processors
self
.
FEATURE_NAMES
=
[
"pixel_values"
,
"pixel_values_videos"
,
"audio_features"
]
self
.
FEATURE_NAMES
=
[
"pixel_values"
,
"pixel_values_videos"
,
"audio_features"
,
"input_features"
,
]
def
process_mm_data
(
def
process_mm_data
(
self
,
input_text
,
images
=
None
,
videos
=
None
,
audios
=
None
,
**
kwargs
self
,
input_text
,
images
=
None
,
videos
=
None
,
audios
=
None
,
**
kwargs
...
...
test/srt/test_vision_openai_server_b.py
View file @
59aab76f
...
@@ -171,6 +171,11 @@ class TestGemma3nServer(TestOpenAIVisionServer):
...
@@ -171,6 +171,11 @@ class TestGemma3nServer(TestOpenAIVisionServer):
)
)
cls
.
base_url
+=
"/v1"
cls
.
base_url
+=
"/v1"
def
test_audio_chat_completion
(
self
):
self
.
_test_audio_speech_completion
()
# This _test_audio_ambient_completion test is way too complicated to pass for a small LLM
# self._test_audio_ambient_completion()
class
TestKimiVLServer
(
TestOpenAIVisionServer
):
class
TestKimiVLServer
(
TestOpenAIVisionServer
):
@
classmethod
@
classmethod
...
@@ -252,9 +257,7 @@ class TestPhi4MMServer(TestOpenAIVisionServer):
...
@@ -252,9 +257,7 @@ class TestPhi4MMServer(TestOpenAIVisionServer):
def
test_audio_chat_completion
(
self
):
def
test_audio_chat_completion
(
self
):
self
.
_test_audio_speech_completion
()
self
.
_test_audio_speech_completion
()
# TODO: currently phi4-mm cannot pass this test.
# This _test_audio_ambient_completion test is way too complicated to pass for a small LLM
# We are investigating this issue.
# Response: La ciudad está situada en la costa este de la isla, en la desembocadura del río St. Lawrence.
# self._test_audio_ambient_completion()
# self._test_audio_ambient_completion()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment