ggml: force flash attention off for grok

This commit is contained in:
rick
2026-03-25 02:51:46 +01:00
committed by Jesse Gross
parent 26b9f53f8e
commit ebbce136c7

View File

@@ -874,7 +874,7 @@ func (f GGML) SupportsFlashAttention() bool {
return true
}
- if slices.Contains([]string{"gemma2"}, arch) {
+ if slices.Contains([]string{"gemma2", "grok"}, arch) {
return false
}