初始化项目,由ModelHub XC社区提供模型
Model: millat/mistral-7b-indian-university-guidance Source: Original Platform
This commit is contained in:
61
reports/research/epoch_1/metrics.json
Normal file
61
reports/research/epoch_1/metrics.json
Normal file
@@ -0,0 +1,61 @@
|
||||
{
|
||||
"epoch": 1,
|
||||
"timestamp": "2026-01-24T07:32:30.846737",
|
||||
"training": {
|
||||
"final_loss": 0.0,
|
||||
"total_steps": 500,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"evaluation": {
|
||||
"eval_loss": 0.382000595331192,
|
||||
"eval_runtime": 144.1215,
|
||||
"eval_samples_per_second": 4.892,
|
||||
"eval_steps_per_second": 1.228,
|
||||
"epoch": 1.2599369085173502,
|
||||
"perplexity": 1.4652129574196766
|
||||
},
|
||||
"perplexity": 1.4652129574196766,
|
||||
"lora_info": {
|
||||
"epoch": 1,
|
||||
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_1",
|
||||
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
|
||||
"size_gb": 0.172,
|
||||
"status": "success"
|
||||
},
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 7.132414976,
|
||||
"avg_memory_gb": 3.8709198994285714,
|
||||
"samples": 7
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 4.701220864,
|
||||
"avg_used_gb": 3.7343272959999996,
|
||||
"peak_percent": 37.5
|
||||
},
|
||||
"total_time_minutes": 7.410525878270467
|
||||
},
|
||||
"config": {
|
||||
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"max_seq_length": 512,
|
||||
"load_in_4bit": true,
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"lora_dropout": 0,
|
||||
"num_train_epochs": 1,
|
||||
"per_device_train_batch_size": 4,
|
||||
"gradient_accumulation_steps": 4,
|
||||
"learning_rate": 0.0002,
|
||||
"warmup_steps": 10,
|
||||
"logging_steps": 5,
|
||||
"save_steps": 50,
|
||||
"eval_steps": 50,
|
||||
"seed": 3407,
|
||||
"hf_repo_name": "mistral-7b-indian-university-guidance",
|
||||
"wandb_project": "mistral-7b-indian-university-guidance",
|
||||
"force_retrain": false,
|
||||
"auto_increment_epochs": true
|
||||
}
|
||||
}
|
||||
31
reports/research/epoch_1_summary.json
Normal file
31
reports/research/epoch_1_summary.json
Normal file
@@ -0,0 +1,31 @@
|
||||
{
|
||||
"epoch": 1,
|
||||
"timestamp": "2026-01-24T07:32:31.550573",
|
||||
"metrics": {
|
||||
"training_loss": 0.0,
|
||||
"eval_loss": 0.382000595331192,
|
||||
"perplexity": 1.4652129574196766,
|
||||
"training_time_minutes": 0.644273563226064
|
||||
},
|
||||
"model_config": {
|
||||
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 7.132414976,
|
||||
"avg_memory_gb": 3.9745230080000002,
|
||||
"samples": 8
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 4.701220864,
|
||||
"avg_used_gb": 3.829794304,
|
||||
"peak_percent": 37.5
|
||||
},
|
||||
"total_time_minutes": 7.422253819306691
|
||||
}
|
||||
}
|
||||
61
reports/research/epoch_2/metrics.json
Normal file
61
reports/research/epoch_2/metrics.json
Normal file
@@ -0,0 +1,61 @@
|
||||
{
|
||||
"epoch": 2,
|
||||
"timestamp": "2026-01-24T09:42:07.012180",
|
||||
"training": {
|
||||
"final_loss": 0.04129547421217565,
|
||||
"total_steps": 794,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"evaluation": {
|
||||
"eval_loss": 0.37572669982910156,
|
||||
"eval_runtime": 150.5368,
|
||||
"eval_samples_per_second": 4.683,
|
||||
"eval_steps_per_second": 1.176,
|
||||
"epoch": 2.0,
|
||||
"perplexity": 1.4560491409087577
|
||||
},
|
||||
"perplexity": 1.4560491409087577,
|
||||
"lora_info": {
|
||||
"epoch": 2,
|
||||
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_2",
|
||||
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
|
||||
"size_gb": 0.172,
|
||||
"status": "success"
|
||||
},
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 11.350029312,
|
||||
"avg_memory_gb": 4.562460041846153,
|
||||
"samples": 26
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 4.951568384,
|
||||
"avg_used_gb": 4.280380022153847,
|
||||
"peak_percent": 39.4
|
||||
},
|
||||
"total_time_minutes": 20.894038860003153
|
||||
},
|
||||
"config": {
|
||||
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"max_seq_length": 512,
|
||||
"load_in_4bit": true,
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"lora_dropout": 0,
|
||||
"num_train_epochs": 2,
|
||||
"per_device_train_batch_size": 4,
|
||||
"gradient_accumulation_steps": 4,
|
||||
"learning_rate": 0.0002,
|
||||
"warmup_steps": 10,
|
||||
"logging_steps": 5,
|
||||
"save_steps": 50,
|
||||
"eval_steps": 50,
|
||||
"seed": 3407,
|
||||
"hf_repo_name": "mistral-7b-indian-university-guidance",
|
||||
"wandb_project": "mistral-7b-indian-university-guidance",
|
||||
"force_retrain": false,
|
||||
"auto_increment_epochs": true
|
||||
}
|
||||
}
|
||||
31
reports/research/epoch_2_summary.json
Normal file
31
reports/research/epoch_2_summary.json
Normal file
@@ -0,0 +1,31 @@
|
||||
{
|
||||
"epoch": 2,
|
||||
"timestamp": "2026-01-24T09:42:07.364122",
|
||||
"metrics": {
|
||||
"training_loss": 0.04129547421217565,
|
||||
"eval_loss": 0.37572669982910156,
|
||||
"perplexity": 1.4560491409087577,
|
||||
"training_time_minutes": 14.512758453687033
|
||||
},
|
||||
"model_config": {
|
||||
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 11.350029312,
|
||||
"avg_memory_gb": 4.567860242962962,
|
||||
"samples": 27
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 4.951568384,
|
||||
"avg_used_gb": 4.304507335111112,
|
||||
"peak_percent": 39.4
|
||||
},
|
||||
"total_time_minutes": 20.89990162452062
|
||||
}
|
||||
}
|
||||
61
reports/research/epoch_3/metrics.json
Normal file
61
reports/research/epoch_3/metrics.json
Normal file
@@ -0,0 +1,61 @@
|
||||
{
|
||||
"epoch": 3,
|
||||
"timestamp": "2026-01-24T10:58:32.823677",
|
||||
"training": {
|
||||
"final_loss": 0.10161419559385874,
|
||||
"total_steps": 1191,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"evaluation": {
|
||||
"eval_loss": 0.3753533959388733,
|
||||
"eval_runtime": 150.6713,
|
||||
"eval_samples_per_second": 4.679,
|
||||
"eval_steps_per_second": 1.175,
|
||||
"epoch": 3.0,
|
||||
"perplexity": 1.4555056935419122
|
||||
},
|
||||
"perplexity": 1.4555056935419122,
|
||||
"lora_info": {
|
||||
"epoch": 3,
|
||||
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_3",
|
||||
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
|
||||
"size_gb": 0.172,
|
||||
"status": "success"
|
||||
},
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 11.954010624,
|
||||
"avg_memory_gb": 5.191932421389474,
|
||||
"samples": 95
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 5.945511936,
|
||||
"avg_used_gb": 5.1532530526315785,
|
||||
"peak_percent": 46.7
|
||||
},
|
||||
"total_time_minutes": 72.3125548839569
|
||||
},
|
||||
"config": {
|
||||
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"max_seq_length": 512,
|
||||
"load_in_4bit": true,
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"lora_dropout": 0,
|
||||
"num_train_epochs": 3,
|
||||
"per_device_train_batch_size": 4,
|
||||
"gradient_accumulation_steps": 4,
|
||||
"learning_rate": 0.0002,
|
||||
"warmup_steps": 10,
|
||||
"logging_steps": 5,
|
||||
"save_steps": 50,
|
||||
"eval_steps": 50,
|
||||
"seed": 3407,
|
||||
"hf_repo_name": "mistral-7b-indian-university-guidance",
|
||||
"wandb_project": "mistral-7b-indian-university-guidance",
|
||||
"force_retrain": false,
|
||||
"auto_increment_epochs": true
|
||||
}
|
||||
}
|
||||
31
reports/research/epoch_3_summary.json
Normal file
31
reports/research/epoch_3_summary.json
Normal file
@@ -0,0 +1,31 @@
|
||||
{
|
||||
"epoch": 3,
|
||||
"timestamp": "2026-01-24T10:58:32.884444",
|
||||
"metrics": {
|
||||
"training_loss": 0.10161419559385874,
|
||||
"eval_loss": 0.3753533959388733,
|
||||
"perplexity": 1.4555056935419122,
|
||||
"training_time_minutes": 66.47436684767405
|
||||
},
|
||||
"model_config": {
|
||||
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 11.954010624,
|
||||
"avg_memory_gb": 5.189690426666667,
|
||||
"samples": 96
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 5.945511936,
|
||||
"avg_used_gb": 5.151363968,
|
||||
"peak_percent": 46.7
|
||||
},
|
||||
"total_time_minutes": 72.31356252829234
|
||||
}
|
||||
}
|
||||
98
reports/research/epoch_tracker.json
Normal file
98
reports/research/epoch_tracker.json
Normal file
@@ -0,0 +1,98 @@
|
||||
{
|
||||
"epochs": [
|
||||
{
|
||||
"epoch": 1,
|
||||
"timestamp": "2026-01-24T07:32:31.550573",
|
||||
"metrics": {
|
||||
"training_loss": 0.0,
|
||||
"eval_loss": 0.382000595331192,
|
||||
"perplexity": 1.4652129574196766,
|
||||
"training_time_minutes": 0.644273563226064
|
||||
},
|
||||
"model_config": {
|
||||
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 7.132414976,
|
||||
"avg_memory_gb": 3.9745230080000002,
|
||||
"samples": 8
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 4.701220864,
|
||||
"avg_used_gb": 3.829794304,
|
||||
"peak_percent": 37.5
|
||||
},
|
||||
"total_time_minutes": 7.422253819306691
|
||||
}
|
||||
},
|
||||
{
|
||||
"epoch": 2,
|
||||
"timestamp": "2026-01-24T09:42:07.364122",
|
||||
"metrics": {
|
||||
"training_loss": 0.04129547421217565,
|
||||
"eval_loss": 0.37572669982910156,
|
||||
"perplexity": 1.4560491409087577,
|
||||
"training_time_minutes": 14.512758453687033
|
||||
},
|
||||
"model_config": {
|
||||
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 11.350029312,
|
||||
"avg_memory_gb": 4.567860242962962,
|
||||
"samples": 27
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 4.951568384,
|
||||
"avg_used_gb": 4.304507335111112,
|
||||
"peak_percent": 39.4
|
||||
},
|
||||
"total_time_minutes": 20.89990162452062
|
||||
}
|
||||
},
|
||||
{
|
||||
"epoch": 3,
|
||||
"timestamp": "2026-01-24T10:58:32.884444",
|
||||
"metrics": {
|
||||
"training_loss": 0.10161419559385874,
|
||||
"eval_loss": 0.3753533959388733,
|
||||
"perplexity": 1.4555056935419122,
|
||||
"training_time_minutes": 66.47436684767405
|
||||
},
|
||||
"model_config": {
|
||||
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 11.954010624,
|
||||
"avg_memory_gb": 5.189690426666667,
|
||||
"samples": 96
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 5.945511936,
|
||||
"avg_used_gb": 5.151363968,
|
||||
"peak_percent": 46.7
|
||||
},
|
||||
"total_time_minutes": 72.31356252829234
|
||||
}
|
||||
}
|
||||
],
|
||||
"last_updated": "2026-01-24T10:58:32.897313"
|
||||
}
|
||||
61
reports/research/latest_metrics.json
Normal file
61
reports/research/latest_metrics.json
Normal file
@@ -0,0 +1,61 @@
|
||||
{
|
||||
"epoch": 3,
|
||||
"timestamp": "2026-01-24T10:58:32.823677",
|
||||
"training": {
|
||||
"final_loss": 0.10161419559385874,
|
||||
"total_steps": 1191,
|
||||
"learning_rate": 0.0002,
|
||||
"batch_size": 16
|
||||
},
|
||||
"evaluation": {
|
||||
"eval_loss": 0.3753533959388733,
|
||||
"eval_runtime": 150.6713,
|
||||
"eval_samples_per_second": 4.679,
|
||||
"eval_steps_per_second": 1.175,
|
||||
"epoch": 3.0,
|
||||
"perplexity": 1.4555056935419122
|
||||
},
|
||||
"perplexity": 1.4555056935419122,
|
||||
"lora_info": {
|
||||
"epoch": 3,
|
||||
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_3",
|
||||
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
|
||||
"size_gb": 0.172,
|
||||
"status": "success"
|
||||
},
|
||||
"hardware": {
|
||||
"gpu": {
|
||||
"peak_memory_gb": 11.954010624,
|
||||
"avg_memory_gb": 5.191932421389474,
|
||||
"samples": 95
|
||||
},
|
||||
"ram": {
|
||||
"peak_used_gb": 5.945511936,
|
||||
"avg_used_gb": 5.1532530526315785,
|
||||
"peak_percent": 46.7
|
||||
},
|
||||
"total_time_minutes": 72.3125548839569
|
||||
},
|
||||
"config": {
|
||||
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
|
||||
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
|
||||
"max_seq_length": 512,
|
||||
"load_in_4bit": true,
|
||||
"lora_r": 32,
|
||||
"lora_alpha": 32,
|
||||
"lora_dropout": 0,
|
||||
"num_train_epochs": 3,
|
||||
"per_device_train_batch_size": 4,
|
||||
"gradient_accumulation_steps": 4,
|
||||
"learning_rate": 0.0002,
|
||||
"warmup_steps": 10,
|
||||
"logging_steps": 5,
|
||||
"save_steps": 50,
|
||||
"eval_steps": 50,
|
||||
"seed": 3407,
|
||||
"hf_repo_name": "mistral-7b-indian-university-guidance",
|
||||
"wandb_project": "mistral-7b-indian-university-guidance",
|
||||
"force_retrain": false,
|
||||
"auto_increment_epochs": true
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user