Unverified commit 75e75d9a, authored by Michael Yang, committed by GitHub
Browse files

qwen3vl: enable flash attention by default (#12862)

parent ed78e127
......@@ -895,8 +895,8 @@ func (f GGML) FlashAttention() bool {
 return slices.Contains([]string{
 "gemma3",
 "gptoss", "gpt-oss",
-"qwen3",
-"qwen3moe",
+"qwen3", "qwen3moe",
+"qwen3vl", "qwen3vlmoe",
 }, f.KV().String("general.architecture"))
 }
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment