初始化项目,由ModelHub XC社区提供模型
Model: Lamsheeper/OLMo-0H-1D-100F Source: Original Platform
This commit is contained in:
39
training_config.json
Normal file
39
training_config.json
Normal file
@@ -0,0 +1,39 @@
{
  "saved_at": "2026-06-01T10:20:24",
  "model_name": "/disk/u/yu.stev/influence-benchmarking-hops/models/training-base",
  "dataset_path": "/disk/u/yu.stev/influence-benchmarking-hops/dataset-generator/datasets/0/100/1.jsonl",
  "output_dir": "/disk/u/yu.stev/influence-benchmarking-hops/models/0/1doc/final-model",
  "seed_path": "/disk/u/yu.stev/influence-benchmarking-hops/dataset-generator/seed/0/100.jsonl",
  "epochs": 500,
  "batch_size": 10,
  "gradient_accumulation_steps": 1,
  "effective_batch_size": 10,
  "max_steps": null,
  "max_length": 2048,
  "seed": 42,
  "learning_rate": 0.0002,
  "lr_scheduler": "cosine",
  "lr_min": 2e-05,
  "warmup_steps": 100,
  "constant_steps": 4000,
  "shuffle_training": true,
  "shuffle_validation": true,
  "family_batching": false,
  "family_spreading": false,
  "checkpoint_fraction": 0.25,
  "save_steps_override": 1000,
  "hop_depth": null,
  "bf16": true,
  "fp16": false,
  "prompt_format": "output",
  "use_hops_eval": false,
  "use_depth0_eval": true,
  "eval_hop_depths": [
    0,
    1,
    2
  ],
  "normal_tokens_test": false,
  "num_functions": 10,
  "track_depth_loss": true
}
Reference in New Issue
Block a user