"vscode:/vscode.git/clone" did not exist on "d64429bb369d4087f9f91609e7275c4901d65aea"
Unverified commit 51e38a8e, authored by Isotr0py, committed by GitHub
Browse files

[Misc] Enable Paligemma's PrefixLM attention mask computation (#31725)


Signed-off-by: Isotr0py <mozf@mail2.sysu.edu.cn>
parent d8e38d49
......@@ -121,10 +121,6 @@ VLM_TEST_SETTINGS = {
),
auto_cls=AutoModelForImageTextToText,
vllm_output_post_proc=model_utils.paligemma_vllm_to_hf_output,
dtype="bfloat16",
marks=[
pytest.mark.skip(reason="vLLM does not support PrefixLM attention mask")
],
),
"qwen2_5_vl": VLMTestInfo(
models=["Qwen/Qwen2.5-VL-3B-Instruct"],
......
......@@ -1097,9 +1097,7 @@ class ModelConfig:
"""Whether to use bidirectional attention for mm positions."""
MM_PREFIX_LM_MODELS = (
"gemma3",
# TODO(Isotr0py): Disable paligemma for now before
# we supports soft cap attention for FlexAttention
# "paligemma",
"paligemma",
)
if not hasattr(self.hf_config, "model_type"):
return False
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment