Files
mistral-7b-indian-universit…/reports/research/latest_metrics.json
ModelHub XC 466afa54a8 初始化项目,由ModelHub XC社区提供模型
Model: millat/mistral-7b-indian-university-guidance
Source: Original Platform
2026-06-20 04:15:17 +08:00

61 lines
1.7 KiB
JSON

{
"epoch": 3,
"timestamp": "2026-01-24T10:58:32.823677",
"training": {
"final_loss": 0.10161419559385874,
"total_steps": 1191,
"learning_rate": 0.0002,
"batch_size": 16
},
"evaluation": {
"eval_loss": 0.3753533959388733,
"eval_runtime": 150.6713,
"eval_samples_per_second": 4.679,
"eval_steps_per_second": 1.175,
"epoch": 3.0,
"perplexity": 1.4555056935419122
},
"perplexity": 1.4555056935419122,
"lora_info": {
"epoch": 3,
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_3",
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
"size_gb": 0.172,
"status": "success"
},
"hardware": {
"gpu": {
"peak_memory_gb": 11.954010624,
"avg_memory_gb": 5.191932421389474,
"samples": 95
},
"ram": {
"peak_used_gb": 5.945511936,
"avg_used_gb": 5.1532530526315785,
"peak_percent": 46.7
},
"total_time_minutes": 72.3125548839569
},
"config": {
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
"max_seq_length": 512,
"load_in_4bit": true,
"lora_r": 32,
"lora_alpha": 32,
"lora_dropout": 0,
"num_train_epochs": 3,
"per_device_train_batch_size": 4,
"gradient_accumulation_steps": 4,
"learning_rate": 0.0002,
"warmup_steps": 10,
"logging_steps": 5,
"save_steps": 50,
"eval_steps": 50,
"seed": 3407,
"hf_repo_name": "mistral-7b-indian-university-guidance",
"wandb_project": "mistral-7b-indian-university-guidance",
"force_retrain": false,
"auto_increment_epochs": true
}
}