enable flash attention for gemma4 (#15296)

This commit is contained in:
Daniel Hiltgen
2026-04-03 12:46:18 -07:00
committed by GitHub
parent bb0c58e134
commit c8e0878814

View File

@@ -890,6 +890,7 @@ func (f GGML) FlashAttention() bool {
return slices.Contains([]string{
"bert",
"gemma3",
"gemma4",
"glm4moelite",
"glmocr",
"gptoss", "gpt-oss",