初始化项目,由ModelHub XC社区提供模型

Model: LLM-Research/layerskip-llama3.2-1B
Source: Original Platform
This commit is contained in:
ModelHub XC
2026-05-15 18:39:45 +08:00
commit bd860a1a5f
15 changed files with 131015 additions and 0 deletions

View File

@@ -0,0 +1,7 @@
{
"dtype": "bf16",
"model_parallel_size": 1,
"on_gpu": true,
"src": "/fsx-atom/melhoushi/xldumps/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus_run000/checkpoints/checkpoint_0100000/",
"tgt": "/fsx-atom/melhoushi/xldumps/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus/continual_llama3.2_1B_gpus_64_shared_emb_higher_lr_ee_0.1_ld_0.1_128_gpus_run000/checkpoints/checkpoint_0100000_consolidated/"
}