mirror of
https://github.com/ollama/ollama.git
synced 2026-03-27 02:58:43 +07:00
ggml: force flash attention off for grok
This commit is contained in:
@@ -874,7 +874,7 @@ func (f GGML) SupportsFlashAttention() bool {
 		return true
 	}
 
-	if slices.Contains([]string{"gemma2"}, arch) {
+	if slices.Contains([]string{"gemma2", "grok"}, arch) {
 		return false
 	}
 
Reference in New Issue
Block a user