Set the default attention backend for GLM-4.5v to fa3 (#9245)
This commit is contained in:
@@ -2345,6 +2345,7 @@ def is_fa3_default_architecture(hf_config):
         "Qwen3ForCausalLM",
         "Qwen3MoeForCausalLM",
         "Glm4MoeForCausalLM",
+        "Glm4vMoeForConditionalGeneration",
         "Step3VLForConditionalGeneration",
     }
     return architectures[0] in default_archs
Reference in New Issue
Block a user