enable flash attention for gemma4 (#15296)

This commit is contained in:
Daniel Hiltgen 2026-04-03 12:46:18 -07:00 committed by GitHub
parent bb0c58e134
commit c8e0878814
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -890,6 +890,7 @@ func (f GGML) FlashAttention() bool {
return slices.Contains([]string{
"bert",
"gemma3",
"gemma4",
"glm4moelite",
"glmocr",
"gptoss", "gpt-oss",