fix: use fa3 by default for Gemma2 (add Gemma2ForCausalLM to the fa3 default architectures) (#5586)

This commit is contained in:
Yineng Zhang
2025-04-20 17:02:09 -07:00
committed by GitHub
parent 9a7e83e899
commit 66c0ff9e31

View File

@@ -1930,6 +1930,7 @@ def is_fa3_default_architecture(hf_config):
"Llama4ForConditionalGeneration",
"LlamaForCausalLM",
"MistralForCausalLM",
"Gemma2ForCausalLM",
}
return architectures[0] in default_archs