初始化项目,由ModelHub XC社区提供模型
Model: kmseong/llama2_7b_chat-MBPP-FT-lr5e-5 Source: Original Platform
This commit is contained in:
26
finetune_config.json
Normal file
26
finetune_config.json
Normal file
@@ -0,0 +1,26 @@
|
||||
{
|
||||
"base_model": "kmseong/llama2_7b-chat-Safety-FT-lr5e-5",
|
||||
"fine_tuning_type": "Full Parameter Fine-tuning",
|
||||
"dataset": "mbpp",
|
||||
"mbpp_dataset_name": "google-research-datasets/mbpp",
|
||||
"mbpp_subset": "full",
|
||||
"mbpp_train_split": "train",
|
||||
"mbpp_eval_split": "validation",
|
||||
"num_train_samples": 374,
|
||||
"num_eval_samples": 0,
|
||||
"batch_size": 4,
|
||||
"grad_accum": 4,
|
||||
"learning_rate": 5e-05,
|
||||
"weight_decay": 0.01,
|
||||
"warmup_ratio": 0.1,
|
||||
"epochs": 3,
|
||||
"max_length": 1024,
|
||||
"max_grad_norm": 1.0,
|
||||
"lr_scheduler_type": "cosine",
|
||||
"optimizer": "AdamW (torch)",
|
||||
"gradient_checkpointing": false,
|
||||
"dtype": "bf16",
|
||||
"trainer_type": "Trainer",
|
||||
"safety_mix_ratio": 0.0,
|
||||
"safety_data_path": null
|
||||
}
|
||||
Reference in New Issue
Block a user