Files
sycofact/training_config.json

12 lines
243 B
JSON
Raw Normal View History

{
"model_id": "google/gemma-3-4b-it",
"lr": 5e-06,
"epochs": 3,
"train_size": 43271,
"val_size": 4807,
"mode": "full_finetune",
"data": "v2_evaluator + phoenix_eliza",
"max_seq_len": 2048,
"batch_size": 1,
"grad_accum": 8
}