61 lines
1.7 KiB
JSON
61 lines
1.7 KiB
JSON
{
|
|
"epoch": 3,
|
|
"timestamp": "2026-01-24T10:58:32.823677",
|
|
"training": {
|
|
"final_loss": 0.10161419559385874,
|
|
"total_steps": 1191,
|
|
"learning_rate": 0.0002,
|
|
"batch_size": 16
|
|
},
|
|
"evaluation": {
|
|
"eval_loss": 0.3753533959388733,
|
|
"eval_runtime": 150.6713,
|
|
"eval_samples_per_second": 4.679,
|
|
"eval_steps_per_second": 1.175,
|
|
"epoch": 3.0,
|
|
"perplexity": 1.4555056935419122
|
|
},
|
|
"perplexity": 1.4555056935419122,
|
|
"lora_info": {
|
|
"epoch": 3,
|
|
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_3",
|
|
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
|
|
"size_gb": 0.172,
|
|
"status": "success"
|
|
},
|
|
"hardware": {
|
|
"gpu": {
|
|
"peak_memory_gb": 11.954010624,
|
|
"avg_memory_gb": 5.191932421389474,
|
|
"samples": 95
|
|
},
|
|
"ram": {
|
|
"peak_used_gb": 5.945511936,
|
|
"avg_used_gb": 5.1532530526315785,
|
|
"peak_percent": 46.7
|
|
},
|
|
"total_time_minutes": 72.3125548839569
|
|
},
|
|
"config": {
|
|
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
|
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
|
|
"max_seq_length": 512,
|
|
"load_in_4bit": true,
|
|
"lora_r": 32,
|
|
"lora_alpha": 32,
|
|
"lora_dropout": 0,
|
|
"num_train_epochs": 3,
|
|
"per_device_train_batch_size": 4,
|
|
"gradient_accumulation_steps": 4,
|
|
"learning_rate": 0.0002,
|
|
"warmup_steps": 10,
|
|
"logging_steps": 5,
|
|
"save_steps": 50,
|
|
"eval_steps": 50,
|
|
"seed": 3407,
|
|
"hf_repo_name": "mistral-7b-indian-university-guidance",
|
|
"wandb_project": "mistral-7b-indian-university-guidance",
|
|
"force_retrain": false,
|
|
"auto_increment_epochs": true
|
|
}
|
|
} |