Files
OLMo-0H-1D-100F/training_config.json
ModelHub XC 29aa7ee467 初始化项目,由ModelHub XC社区提供模型
Model: Lamsheeper/OLMo-0H-1D-100F
Source: Original Platform
2026-06-18 21:21:22 +08:00

39 lines
1.1 KiB
JSON

{
"saved_at": "2026-06-01T10:20:24",
"model_name": "/disk/u/yu.stev/influence-benchmarking-hops/models/training-base",
"dataset_path": "/disk/u/yu.stev/influence-benchmarking-hops/dataset-generator/datasets/0/100/1.jsonl",
"output_dir": "/disk/u/yu.stev/influence-benchmarking-hops/models/0/1doc/final-model",
"seed_path": "/disk/u/yu.stev/influence-benchmarking-hops/dataset-generator/seed/0/100.jsonl",
"epochs": 500,
"batch_size": 10,
"gradient_accumulation_steps": 1,
"effective_batch_size": 10,
"max_steps": null,
"max_length": 2048,
"seed": 42,
"learning_rate": 0.0002,
"lr_scheduler": "cosine",
"lr_min": 2e-05,
"warmup_steps": 100,
"constant_steps": 4000,
"shuffle_training": true,
"shuffle_validation": true,
"family_batching": false,
"family_spreading": false,
"checkpoint_fraction": 0.25,
"save_steps_override": 1000,
"hop_depth": null,
"bf16": true,
"fp16": false,
"prompt_format": "output",
"use_hops_eval": false,
"use_depth0_eval": true,
"eval_hop_depths": [
0,
1,
2
],
"normal_tokens_test": false,
"num_functions": 10,
"track_depth_loss": true
}