初始化项目,由ModelHub XC社区提供模型
Model: LLM-Research/layerskip-llama3.2-1B Source: Original Platform
This commit is contained in:
7
original/consolidate_params.json
Normal file
7
original/consolidate_params.json
Normal file
@@ -0,0 +1,7 @@
|
||||
{
|
||||
"dtype": "bf16",
|
||||
"model_parallel_size": 1,
|
||||
"on_gpu": true,
|
||||
"src": "/fsx-atom/melhoushi/xldumps/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus_run000/checkpoints/checkpoint_0100000/",
|
||||
"tgt": "/fsx-atom/melhoushi/xldumps/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus_run000/checkpoints/checkpoint_0100000_consolidated/"
|
||||
}
|
||||
Reference in New Issue
Block a user