diff --git a/config.json b/config.json index 5d770b5..f8b5676 100644 --- a/config.json +++ b/config.json @@ -1,7 +1,7 @@ { "_name_or_path": "/mnt/workspace/DistilQwen25-DS3-0324/7B", "architectures": [ - "Qwen2Model" + "Qwen2ForCausalLM" ], "attention_dropout": 0.0, "bos_token_id": 151643,