61 lines
1.7 KiB
JSON
61 lines
1.7 KiB
JSON
{
|
|
"epoch": 2,
|
|
"timestamp": "2026-01-24T09:42:07.012180",
|
|
"training": {
|
|
"final_loss": 0.04129547421217565,
|
|
"total_steps": 794,
|
|
"learning_rate": 0.0002,
|
|
"batch_size": 16
|
|
},
|
|
"evaluation": {
|
|
"eval_loss": 0.37572669982910156,
|
|
"eval_runtime": 150.5368,
|
|
"eval_samples_per_second": 4.683,
|
|
"eval_steps_per_second": 1.176,
|
|
"epoch": 2.0,
|
|
"perplexity": 1.4560491409087577
|
|
},
|
|
"perplexity": 1.4560491409087577,
|
|
"lora_info": {
|
|
"epoch": 2,
|
|
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_2",
|
|
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
|
|
"size_gb": 0.172,
|
|
"status": "success"
|
|
},
|
|
"hardware": {
|
|
"gpu": {
|
|
"peak_memory_gb": 11.350029312,
|
|
"avg_memory_gb": 4.562460041846153,
|
|
"samples": 26
|
|
},
|
|
"ram": {
|
|
"peak_used_gb": 4.951568384,
|
|
"avg_used_gb": 4.280380022153847,
|
|
"peak_percent": 39.4
|
|
},
|
|
"total_time_minutes": 20.894038860003153
|
|
},
|
|
"config": {
|
|
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
|
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
|
|
"max_seq_length": 512,
|
|
"load_in_4bit": true,
|
|
"lora_r": 32,
|
|
"lora_alpha": 32,
|
|
"lora_dropout": 0,
|
|
"num_train_epochs": 2,
|
|
"per_device_train_batch_size": 4,
|
|
"gradient_accumulation_steps": 4,
|
|
"learning_rate": 0.0002,
|
|
"warmup_steps": 10,
|
|
"logging_steps": 5,
|
|
"save_steps": 50,
|
|
"eval_steps": 50,
|
|
"seed": 3407,
|
|
"hf_repo_name": "mistral-7b-indian-university-guidance",
|
|
"wandb_project": "mistral-7b-indian-university-guidance",
|
|
"force_retrain": false,
|
|
"auto_increment_epochs": true
|
|
}
|
|
} |