Mirror of https://github.com/ollama/ollama.git (synced 2026-03-27 02:58:43 +07:00)
ggml: force flash attention off for grok
This commit is contained in:
@@ -874,7 +874,7 @@ func (f GGML) SupportsFlashAttention() bool {
 		return true
 	}
 
-	if slices.Contains([]string{"gemma2"}, arch) {
+	if slices.Contains([]string{"gemma2", "grok"}, arch) {
 		return false
 	}
 
Reference in New Issue
Block a user