qwen3vl: enable flash attention by default (#12862)

This commit is contained in:
Michael Yang 2025-10-30 10:51:37 -07:00 committed by GitHub
parent ed78e127d0
commit 75e75d9afe
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -895,8 +895,8 @@ func (f GGML) FlashAttention() bool {
return slices.Contains([]string{
"gemma3",
"gptoss", "gpt-oss",
-"qwen3",
-"qwen3moe",
+"qwen3", "qwen3moe",
+"qwen3vl", "qwen3vlmoe",
}, f.KV().String("general.architecture"))
}