22 lines
637 B
JSON
22 lines
637 B
JSON
|
|
{
|
||
|
|
"model_id": "google/gemma-2b-it",
|
||
|
|
"model_save_name": "gemma-2b-it-steer-dog-numbers-ft",
|
||
|
|
"dataset_name": "eekay/gemma-2b-it-steer-dog-numbers",
|
||
|
|
"learning_rate": 0.0002,
|
||
|
|
"num_train_epochs": 2,
|
||
|
|
"per_device_train_batch_size": 16,
|
||
|
|
"gradient_accumulation_steps": 1,
|
||
|
|
"lora_rank": 16,
|
||
|
|
"lora_alpha": 16,
|
||
|
|
"train_attn": true,
|
||
|
|
"lora_layers": null,
|
||
|
|
"continue_final_message": true,
|
||
|
|
"bf16": true,
|
||
|
|
"max_grad_norm": 1.0,
|
||
|
|
"n_examples": 30000,
|
||
|
|
"logging_steps": 100,
|
||
|
|
"lr_scheduler_type": "constant",
|
||
|
|
"push_to_hub": true,
|
||
|
|
"output_dir": "checkpoints/gemma-2b-it-steer-dog-numbers-ft-single-l14",
|
||
|
|
"save_steps": 0.05
|
||
|
|
}
|