20 lines
550 B
JSON
{
  "model_id": "Qwen/Qwen2.5-7B-Instruct",
  "model_save_name": "Qwen2.5-7B-Instruct-dog-numbers-ft",
  "dataset_name": "eekay/Qwen2.5-7B-Instruct-dog-numbers",
  "learning_rate": 0.0002,
  "num_train_epochs": 2,
  "per_device_train_batch_size": 16,
  "gradient_accumulation_steps": 1,
  "lora_rank": 16,
  "lora_alpha": 16,
  "train_attn": true,
  "lora_layers": null,
  "continue_final_message": true,
  "bf16": true,
  "max_grad_norm": 1.0,
  "n_examples": 30000,
  "logging_steps": 100,
  "lr_scheduler_type": "constant",
  "push_to_hub": true
}