Revert "enable flash attention for gemma4 (#15296)" (#15311)

This reverts commit c8e0878814.
This commit is contained in:
Daniel Hiltgen
2026-04-03 17:44:44 -07:00
committed by GitHub
parent 49d5fd5a3e
commit 4bc2728047

View File

@@ -890,7 +890,6 @@ func (f GGML) FlashAttention() bool {
return slices.Contains([]string{
"bert",
"gemma3",
-"gemma4",
"glm4moelite",
"glmocr",
"gptoss", "gpt-oss",