Files
g1_gptlong_top8_32b/training_configs/sft_config.json

15 lines
594 B
JSON
Raw Normal View History

{
  "job_name": "g1_gptlong_top8_32b__Qwen3-8B",
  "train_config_path": "/e/scratch/jureap59/raoof1/sft_experiments/g1_gptlong_top8_32b/configs/g1_gptlong_top8_32b__Qwen3-8B_train_config.yaml",
  "experiments_dir": "/e/scratch/jureap59/raoof1/sft_experiments/g1_gptlong_top8_32b",
  "cluster_name": "jupiter",
  "num_nodes": 24,
  "gpus_per_node": 4,
  "cpus_per_node": 288,
  "launcher": "accelerate",
  "accelerate_config_path": null,
  "deepspeed_config": "sft/lf_configs/deepspeed/ds_z3_accelerate.json",
  "master_port": 12802,
  "needs_ssh_tunnel": true,
  "needs_cuda_detection": false
}