tofu_Llama-3.2-3B-Instruct_…/.hydra/overrides.yaml

# Hydra overrides for this run: a YAML list with one `key=value` override
# string per entry. The run name below identifies it as a DPO run on the
# forget10 split with Llama-3.2-3B-Instruct.

# Experiment preset, trainer choice, run name and model choice.
# NOTE(review): `experiment`, `trainer` and `model` look like Hydra config-group
# selections, while `task_name` is a plain value - confirm against the config tree.
- experiment=unlearn/tofu/idk.yaml
- trainer=DPO
- task_name=tofu_Llama-3.2-3B-Instruct_forget10_DPO
- model=Llama-3.2-3B-Instruct
# Forget/retain data splits.
# NOTE(review): presumably complementary 10% / 90% partitions of the same
# dataset - confirm against the dataset config.
- forget_split=forget10
- retain_split=retain90
# Replaces the model's pretrained checkpoint path with the `..._full` checkpoint.
# NOTE(review): presumably the model fine-tuned on the full dataset, used as the
# starting point for unlearning - confirm.
- model.model_args.pretrained_model_name_or_path=open-unlearning/tofu_Llama-3.2-3B-Instruct_full
# Path to an evaluation JSON produced for the retain90 model.
# NOTE(review): presumably used as the reference for retain-relative metrics;
# the file must exist before this run's evaluation step - confirm.
- retain_logs_path=saves/eval/tofu_Llama-3.2-3B-Instruct_retain90/TOFU_EVAL.json
# Trainer argument overrides.
# NOTE(review): these names match Hugging Face `TrainingArguments` fields; if
# they are forwarded there, batch size 4 x accumulation 4 gives 16 samples per
# device per optimizer step - confirm.
- trainer.args.per_device_train_batch_size=4
- trainer.args.gradient_accumulation_steps=4
# NOTE(review): these two are presumably set together for multi-GPU (DDP)
# training with activation checkpointing to reduce memory - confirm.
- trainer.args.ddp_find_unused_parameters=true
- trainer.args.gradient_checkpointing=true