From 4bc2728047b119984e5d36f290a09dcdb0a681eb Mon Sep 17 00:00:00 2001
From: Daniel Hiltgen
Date: Fri, 3 Apr 2026 17:44:44 -0700
Subject: [PATCH] Revert "enable flash attention for gemma4 (#15296)" (#15311)

This reverts commit c8e0878814b4d19200d65571d3d2d35b4b48fd3e.
---
 fs/ggml/ggml.go | 1 -
 1 file changed, 1 deletion(-)

diff --git a/fs/ggml/ggml.go b/fs/ggml/ggml.go
index e23d345cd..9788297cc 100644
--- a/fs/ggml/ggml.go
+++ b/fs/ggml/ggml.go
@@ -890,7 +890,6 @@ func (f GGML) FlashAttention() bool {
 	return slices.Contains([]string{
 		"bert",
 		"gemma3",
-		"gemma4",
 		"glm4moelite",
 		"glmocr",
 		"gptoss", "gpt-oss",