初始化项目,由ModelHub XC社区提供模型

Model: millat/mistral-7b-indian-university-guidance
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-06-20 04:15:17 +08:00
commit 466afa54a8
94 changed files with 1134163 additions and 0 deletions

View File

@@ -0,0 +1,61 @@
{
"epoch": 1,
"timestamp": "2026-01-24T07:32:30.846737",
"training": {
"final_loss": 0.0,
"total_steps": 500,
"learning_rate": 0.0002,
"batch_size": 16
},
"evaluation": {
"eval_loss": 0.382000595331192,
"eval_runtime": 144.1215,
"eval_samples_per_second": 4.892,
"eval_steps_per_second": 1.228,
"epoch": 1.2599369085173502,
"perplexity": 1.4652129574196766
},
"perplexity": 1.4652129574196766,
"lora_info": {
"epoch": 1,
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_1",
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
"size_gb": 0.172,
"status": "success"
},
"hardware": {
"gpu": {
"peak_memory_gb": 7.132414976,
"avg_memory_gb": 3.8709198994285714,
"samples": 7
},
"ram": {
"peak_used_gb": 4.701220864,
"avg_used_gb": 3.7343272959999996,
"peak_percent": 37.5
},
"total_time_minutes": 7.410525878270467
},
"config": {
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
"max_seq_length": 512,
"load_in_4bit": true,
"lora_r": 32,
"lora_alpha": 32,
"lora_dropout": 0,
"num_train_epochs": 1,
"per_device_train_batch_size": 4,
"gradient_accumulation_steps": 4,
"learning_rate": 0.0002,
"warmup_steps": 10,
"logging_steps": 5,
"save_steps": 50,
"eval_steps": 50,
"seed": 3407,
"hf_repo_name": "mistral-7b-indian-university-guidance",
"wandb_project": "mistral-7b-indian-university-guidance",
"force_retrain": false,
"auto_increment_epochs": true
}
}

View File

@@ -0,0 +1,31 @@
{
"epoch": 1,
"timestamp": "2026-01-24T07:32:31.550573",
"metrics": {
"training_loss": 0.0,
"eval_loss": 0.382000595331192,
"perplexity": 1.4652129574196766,
"training_time_minutes": 0.644273563226064
},
"model_config": {
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"lora_r": 32,
"lora_alpha": 32,
"learning_rate": 0.0002,
"batch_size": 16
},
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
"hardware": {
"gpu": {
"peak_memory_gb": 7.132414976,
"avg_memory_gb": 3.9745230080000002,
"samples": 8
},
"ram": {
"peak_used_gb": 4.701220864,
"avg_used_gb": 3.829794304,
"peak_percent": 37.5
},
"total_time_minutes": 7.422253819306691
}
}

View File

@@ -0,0 +1,61 @@
{
"epoch": 2,
"timestamp": "2026-01-24T09:42:07.012180",
"training": {
"final_loss": 0.04129547421217565,
"total_steps": 794,
"learning_rate": 0.0002,
"batch_size": 16
},
"evaluation": {
"eval_loss": 0.37572669982910156,
"eval_runtime": 150.5368,
"eval_samples_per_second": 4.683,
"eval_steps_per_second": 1.176,
"epoch": 2.0,
"perplexity": 1.4560491409087577
},
"perplexity": 1.4560491409087577,
"lora_info": {
"epoch": 2,
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_2",
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
"size_gb": 0.172,
"status": "success"
},
"hardware": {
"gpu": {
"peak_memory_gb": 11.350029312,
"avg_memory_gb": 4.562460041846153,
"samples": 26
},
"ram": {
"peak_used_gb": 4.951568384,
"avg_used_gb": 4.280380022153847,
"peak_percent": 39.4
},
"total_time_minutes": 20.894038860003153
},
"config": {
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
"max_seq_length": 512,
"load_in_4bit": true,
"lora_r": 32,
"lora_alpha": 32,
"lora_dropout": 0,
"num_train_epochs": 2,
"per_device_train_batch_size": 4,
"gradient_accumulation_steps": 4,
"learning_rate": 0.0002,
"warmup_steps": 10,
"logging_steps": 5,
"save_steps": 50,
"eval_steps": 50,
"seed": 3407,
"hf_repo_name": "mistral-7b-indian-university-guidance",
"wandb_project": "mistral-7b-indian-university-guidance",
"force_retrain": false,
"auto_increment_epochs": true
}
}

View File

@@ -0,0 +1,31 @@
{
"epoch": 2,
"timestamp": "2026-01-24T09:42:07.364122",
"metrics": {
"training_loss": 0.04129547421217565,
"eval_loss": 0.37572669982910156,
"perplexity": 1.4560491409087577,
"training_time_minutes": 14.512758453687033
},
"model_config": {
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"lora_r": 32,
"lora_alpha": 32,
"learning_rate": 0.0002,
"batch_size": 16
},
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
"hardware": {
"gpu": {
"peak_memory_gb": 11.350029312,
"avg_memory_gb": 4.567860242962962,
"samples": 27
},
"ram": {
"peak_used_gb": 4.951568384,
"avg_used_gb": 4.304507335111112,
"peak_percent": 39.4
},
"total_time_minutes": 20.89990162452062
}
}

View File

@@ -0,0 +1,61 @@
{
"epoch": 3,
"timestamp": "2026-01-24T10:58:32.823677",
"training": {
"final_loss": 0.10161419559385874,
"total_steps": 1191,
"learning_rate": 0.0002,
"batch_size": 16
},
"evaluation": {
"eval_loss": 0.3753533959388733,
"eval_runtime": 150.6713,
"eval_samples_per_second": 4.679,
"eval_steps_per_second": 1.175,
"epoch": 3.0,
"perplexity": 1.4555056935419122
},
"perplexity": 1.4555056935419122,
"lora_info": {
"epoch": 3,
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_3",
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
"size_gb": 0.172,
"status": "success"
},
"hardware": {
"gpu": {
"peak_memory_gb": 11.954010624,
"avg_memory_gb": 5.191932421389474,
"samples": 95
},
"ram": {
"peak_used_gb": 5.945511936,
"avg_used_gb": 5.1532530526315785,
"peak_percent": 46.7
},
"total_time_minutes": 72.3125548839569
},
"config": {
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
"max_seq_length": 512,
"load_in_4bit": true,
"lora_r": 32,
"lora_alpha": 32,
"lora_dropout": 0,
"num_train_epochs": 3,
"per_device_train_batch_size": 4,
"gradient_accumulation_steps": 4,
"learning_rate": 0.0002,
"warmup_steps": 10,
"logging_steps": 5,
"save_steps": 50,
"eval_steps": 50,
"seed": 3407,
"hf_repo_name": "mistral-7b-indian-university-guidance",
"wandb_project": "mistral-7b-indian-university-guidance",
"force_retrain": false,
"auto_increment_epochs": true
}
}

View File

@@ -0,0 +1,31 @@
{
"epoch": 3,
"timestamp": "2026-01-24T10:58:32.884444",
"metrics": {
"training_loss": 0.10161419559385874,
"eval_loss": 0.3753533959388733,
"perplexity": 1.4555056935419122,
"training_time_minutes": 66.47436684767405
},
"model_config": {
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"lora_r": 32,
"lora_alpha": 32,
"learning_rate": 0.0002,
"batch_size": 16
},
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
"hardware": {
"gpu": {
"peak_memory_gb": 11.954010624,
"avg_memory_gb": 5.189690426666667,
"samples": 96
},
"ram": {
"peak_used_gb": 5.945511936,
"avg_used_gb": 5.151363968,
"peak_percent": 46.7
},
"total_time_minutes": 72.31356252829234
}
}

View File

@@ -0,0 +1,98 @@
{
"epochs": [
{
"epoch": 1,
"timestamp": "2026-01-24T07:32:31.550573",
"metrics": {
"training_loss": 0.0,
"eval_loss": 0.382000595331192,
"perplexity": 1.4652129574196766,
"training_time_minutes": 0.644273563226064
},
"model_config": {
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"lora_r": 32,
"lora_alpha": 32,
"learning_rate": 0.0002,
"batch_size": 16
},
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
"hardware": {
"gpu": {
"peak_memory_gb": 7.132414976,
"avg_memory_gb": 3.9745230080000002,
"samples": 8
},
"ram": {
"peak_used_gb": 4.701220864,
"avg_used_gb": 3.829794304,
"peak_percent": 37.5
},
"total_time_minutes": 7.422253819306691
}
},
{
"epoch": 2,
"timestamp": "2026-01-24T09:42:07.364122",
"metrics": {
"training_loss": 0.04129547421217565,
"eval_loss": 0.37572669982910156,
"perplexity": 1.4560491409087577,
"training_time_minutes": 14.512758453687033
},
"model_config": {
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"lora_r": 32,
"lora_alpha": 32,
"learning_rate": 0.0002,
"batch_size": 16
},
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
"hardware": {
"gpu": {
"peak_memory_gb": 11.350029312,
"avg_memory_gb": 4.567860242962962,
"samples": 27
},
"ram": {
"peak_used_gb": 4.951568384,
"avg_used_gb": 4.304507335111112,
"peak_percent": 39.4
},
"total_time_minutes": 20.89990162452062
}
},
{
"epoch": 3,
"timestamp": "2026-01-24T10:58:32.884444",
"metrics": {
"training_loss": 0.10161419559385874,
"eval_loss": 0.3753533959388733,
"perplexity": 1.4555056935419122,
"training_time_minutes": 66.47436684767405
},
"model_config": {
"base_model": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"lora_r": 32,
"lora_alpha": 32,
"learning_rate": 0.0002,
"batch_size": 16
},
"dataset": "millat/indian_university_guidance_for_bangladeshi_students",
"hardware": {
"gpu": {
"peak_memory_gb": 11.954010624,
"avg_memory_gb": 5.189690426666667,
"samples": 96
},
"ram": {
"peak_used_gb": 5.945511936,
"avg_used_gb": 5.151363968,
"peak_percent": 46.7
},
"total_time_minutes": 72.31356252829234
}
}
],
"last_updated": "2026-01-24T10:58:32.897313"
}

View File

@@ -0,0 +1,61 @@
{
"epoch": 3,
"timestamp": "2026-01-24T10:58:32.823677",
"training": {
"final_loss": 0.10161419559385874,
"total_steps": 1191,
"learning_rate": 0.0002,
"batch_size": 16
},
"evaluation": {
"eval_loss": 0.3753533959388733,
"eval_runtime": 150.6713,
"eval_samples_per_second": 4.679,
"eval_steps_per_second": 1.175,
"epoch": 3.0,
"perplexity": 1.4555056935419122
},
"perplexity": 1.4555056935419122,
"lora_info": {
"epoch": 3,
"epoch_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters/epoch_3",
"latest_path": "/content/drive/MyDrive/Indian_Uni_Model_Training/models/lora_adapters",
"size_gb": 0.172,
"status": "success"
},
"hardware": {
"gpu": {
"peak_memory_gb": 11.954010624,
"avg_memory_gb": 5.191932421389474,
"samples": 95
},
"ram": {
"peak_used_gb": 5.945511936,
"avg_used_gb": 5.1532530526315785,
"peak_percent": 46.7
},
"total_time_minutes": 72.3125548839569
},
"config": {
"model_name": "unsloth/mistral-7b-instruct-v0.3-bnb-4bit",
"dataset_name": "millat/indian_university_guidance_for_bangladeshi_students",
"max_seq_length": 512,
"load_in_4bit": true,
"lora_r": 32,
"lora_alpha": 32,
"lora_dropout": 0,
"num_train_epochs": 3,
"per_device_train_batch_size": 4,
"gradient_accumulation_steps": 4,
"learning_rate": 0.0002,
"warmup_steps": 10,
"logging_steps": 5,
"save_steps": 50,
"eval_steps": 50,
"seed": 3407,
"hf_repo_name": "mistral-7b-indian-university-guidance",
"wandb_project": "mistral-7b-indian-university-guidance",
"force_retrain": false,
"auto_increment_epochs": true
}
}