OLMo-0H-1D-100F/training_config.json

{
  "saved_at": "2026-06-01T10:20:24",
  "model_name": "/disk/u/yu.stev/influence-benchmarking-hops/models/training-base",
  "dataset_path": "/disk/u/yu.stev/influence-benchmarking-hops/dataset-generator/datasets/0/100/1.jsonl",
  "output_dir": "/disk/u/yu.stev/influence-benchmarking-hops/models/0/1doc/final-model",
  "seed_path": "/disk/u/yu.stev/influence-benchmarking-hops/dataset-generator/seed/0/100.jsonl",
  "epochs": 500,
  "batch_size": 10,
  "gradient_accumulation_steps": 1,
  "effective_batch_size": 10,
  "max_steps": null,
  "max_length": 2048,
  "seed": 42,
  "learning_rate": 0.0002,
  "lr_scheduler": "cosine",
  "lr_min": 2e-05,
  "warmup_steps": 100,
  "constant_steps": 4000,
  "shuffle_training": true,
  "shuffle_validation": true,
  "family_batching": false,
  "family_spreading": false,
  "checkpoint_fraction": 0.25,
  "save_steps_override": 1000,
  "hop_depth": null,
  "bf16": true,
  "fp16": false,
  "prompt_format": "output",
  "use_hops_eval": false,
  "use_depth0_eval": true,
  "eval_hop_depths": [
    0,
    1,
    2
  ],
  "normal_tokens_test": false,
  "num_functions": 10,
  "track_depth_loss": true
}