Unverified commit 51e38a8e, authored by Isotr0py, committed by GitHub
Browse files

[Misc] Enable Paligemma's PrefixLM attention mask computation (#31725)


Signed-off-by: Isotr0py <mozf@mail2.sysu.edu.cn>
parent d8e38d49
...@@ -121,10 +121,6 @@ VLM_TEST_SETTINGS = { ...@@ -121,10 +121,6 @@ VLM_TEST_SETTINGS = {
), ),
auto_cls=AutoModelForImageTextToText, auto_cls=AutoModelForImageTextToText,
vllm_output_post_proc=model_utils.paligemma_vllm_to_hf_output, vllm_output_post_proc=model_utils.paligemma_vllm_to_hf_output,
dtype="bfloat16",
marks=[
pytest.mark.skip(reason="vLLM does not support PrefixLM attention mask")
],
), ),
"qwen2_5_vl": VLMTestInfo( "qwen2_5_vl": VLMTestInfo(
models=["Qwen/Qwen2.5-VL-3B-Instruct"], models=["Qwen/Qwen2.5-VL-3B-Instruct"],
......
...@@ -1097,9 +1097,7 @@ class ModelConfig: ...@@ -1097,9 +1097,7 @@ class ModelConfig:
"""Whether to use bidirectional attention for mm positions.""" """Whether to use bidirectional attention for mm positions."""
MM_PREFIX_LM_MODELS = ( MM_PREFIX_LM_MODELS = (
"gemma3", "gemma3",
# TODO(Isotr0py): Disable paligemma for now before "paligemma",
# we supports soft cap attention for FlexAttention
# "paligemma",
) )
if not hasattr(self.hf_config, "model_type"): if not hasattr(self.hf_config, "model_type"):
return False return False
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment