mirror of
https://github.com/zebrajr/ollama.git
synced 2025-12-06 00:19:51 +01:00
qwen3vl: enable flash attention by default (#12862)
This commit is contained in:
parent
ed78e127d0
commit
75e75d9afe
|
|
@@ -895,8 +895,8 @@ func (f GGML) FlashAttention() bool {
 	return slices.Contains([]string{
 		"gemma3",
 		"gptoss", "gpt-oss",
-		"qwen3",
-		"qwen3moe",
+		"qwen3", "qwen3moe",
+		"qwen3vl", "qwen3vlmoe",
 	}, f.KV().String("general.architecture"))
 }
|
||||
|
||||
|
|
|
|||
Loading…
Reference in New Issue
Block a user