{
  "model_id": "google/gemma-3-4b-it",
  "lr": 5e-06,
  "epochs": 3,
  "train_size": 43271,
  "val_size": 4807,
  "mode": "full_finetune",
  "data": "v2_evaluator + phoenix_eliza",
  "max_seq_len": 2048,
  "batch_size": 1,
  "grad_accum": 8
}