初始化项目，由ModelHub XC社区提供模型

Model: the-jb/tofu_Llama-3.2-3B-Instruct_forget10_GradDiff Source: Original Platform
2026-05-12 20:44:39 +08:00
commit 7f97a0382d
23 changed files with 42747 additions and 0 deletions
--- a/.hydra/overrides.yaml
+++ b/.hydra/overrides.yaml
@@ -0,0 +1,12 @@
+- experiment=unlearn/tofu/default.yaml
+- trainer=GradDiff
+- task_name=tofu_Llama-3.2-3B-Instruct_forget10_GradDiff
+- model=Llama-3.2-3B-Instruct
+- forget_split=forget10
+- retain_split=retain90
+- model.model_args.pretrained_model_name_or_path=open-unlearning/tofu_Llama-3.2-3B-Instruct_full
+- retain_logs_path=saves/eval/tofu_Llama-3.2-3B-Instruct_retain90/TOFU_EVAL.json
+- trainer.args.per_device_train_batch_size=4
+- trainer.args.gradient_accumulation_steps=4
+- trainer.args.ddp_find_unused_parameters=true
+- trainer.args.gradient_checkpointing=true