".github/vscode:/vscode.git/clone" did not exist on "21063c11c7d340dbb01460e22d98d3619737cd4d"
Unverified commit 10546f92, authored by Roger Wang, committed by GitHub
Browse files

[Bugfix] Fix mm budget setting for Qwen Omni models (#33634)


Signed-off-by: Roger Wang <hey@rogerw.io>
parent e69c990c
@@ -72,9 +72,14 @@ class MultiModalBudget:
 mm_counts=dict.fromkeys(active_modalities, 1),
 )
+# Some models (e.g., Qwen3Omni with use_audio_in_video=True) share
+# placeholders between modalities, so not all active modalities will
+# have their own entry in the returned dict. We filter to only include
+# modalities that have independent placeholder tokens.
 mm_max_toks_per_item = {
 modality: all_mm_max_toks_per_item[modality]
 for modality in active_modalities
+if modality in all_mm_max_toks_per_item
 }
 encoder_compute_budget, encoder_cache_size = compute_mm_encoder_budget(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment