初始化项目，由 ModelHub XC 社区提供模型

Model: the-jb/tofu_Llama-3.2-3B-Instruct_forget10_GradDiff
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-05-12 20:44:39 +08:00
commit 7f97a0382d
23 changed files with 42747 additions and 0 deletions

12
.hydra/overrides.yaml Normal file
View File

@@ -0,0 +1,12 @@
# Hydra override list for the run that produced this model: one `key=value`
# entry per item, stored under `.hydra/`.
# NOTE(review): this looks like a file Hydra writes automatically to record the
# command-line overrides of a run; if so, treat it as a record and do not
# hand-edit the values — confirm against the launch command.

# Experiment preset that the remaining entries override.
- experiment=unlearn/tofu/default.yaml
# Trainer selection; presumably the gradient-difference unlearning method — confirm in the trainer configs.
- trainer=GradDiff
# Run name; encodes benchmark, model, forget split and trainer.
- task_name=tofu_Llama-3.2-3B-Instruct_forget10_GradDiff
# Model config group to load.
- model=Llama-3.2-3B-Instruct
# Data splits: the set to forget and the set to retain.
# Presumably complementary 10% / 90% partitions of the same dataset — TODO confirm.
- forget_split=forget10
- retain_split=retain90
# Start from the `..._full` checkpoint named here instead of the model config's default weights.
- model.model_args.pretrained_model_name_or_path=open-unlearning/tofu_Llama-3.2-3B-Instruct_full
# Path to an evaluation JSON for a `retain90` model; presumably used as the
# reference when scoring this run — verify against the eval config.
# The path is relative, so it depends on the working directory of the run.
- retain_logs_path=saves/eval/tofu_Llama-3.2-3B-Instruct_retain90/TOFU_EVAL.json
# Batch size 4 with 4 accumulation steps: 16 samples per device per optimizer
# step, assuming the usual accumulate-then-step semantics. The global batch also
# depends on the device count, which is not recorded here.
- trainer.args.per_device_train_batch_size=4
- trainer.args.gradient_accumulation_steps=4
# NOTE(review): presumably forwarded to the training-arguments object of the
# underlying trainer; both flags usually trade speed for compatibility / memory — confirm.
- trainer.args.ddp_find_unused_parameters=true
- trainer.args.gradient_checkpointing=true