From e68fb677be8d6ea1fafcf88f1ff16d285e1fc96e Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 1 Jun 2026 01:56:16 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: rbelanec/train_sst2_42_1779354538 Source: Original Platform --- .gitattributes | 36 + README.md | 81 + all_results.json | 13 + config.json | 39 + eval_results.json | 8 + generation_config.json | 12 + model.safetensors | 3 + special_tokens_map.json | 26 + tokenizer.json | 3 + tokenizer_config.json | 2069 +++++++ train.yaml | 55 + train_results.json | 9 + trainer_log.jsonl | 1535 +++++ trainer_state.json | 12335 ++++++++++++++++++++++++++++++++++++++ training_args.bin | 3 + training_eval_loss.png | Bin 0 -> 46316 bytes training_loss.png | Bin 0 -> 48854 bytes 17 files changed, 16227 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 all_results.json create mode 100644 config.json create mode 100644 eval_results.json create mode 100644 generation_config.json create mode 100644 model.safetensors create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train.yaml create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_eval_loss.png create mode 100644 training_loss.png diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..1d4ff2e --- /dev/null +++ b/README.md @@ -0,0 +1,81 @@ +--- +library_name: transformers +license: llama3.2 +base_model: meta-llama/Llama-3.2-1B-Instruct +tags: +- peft-factory +- full +- llama-factory +- generated_from_trainer +model-index: +- name: train_sst2_42_1779354538 + results: [] +--- + + + +# train_sst2_42_1779354538 + +This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on the sst2 dataset. +It achieves the following results on the evaluation set: +- Loss: 0.0936 +- Num Input Tokens Seen: 3725120 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 2e-06 +- train_batch_size: 8 +- eval_batch_size: 8 +- seed: 42 +- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 1 + +### Training results + +| Training Loss | Epoch | Step | Validation Loss | Input Tokens Seen | +|:-------------:|:------:|:----:|:---------------:|:-----------------:| +| 0.0578 | 0.0500 | 379 | 0.1688 | 187072 | +| 0.1097 | 0.1000 | 758 | 0.1367 | 373504 | +| 0.0564 | 0.1501 | 1137 | 0.1656 | 557824 | +| 0.1883 | 0.2001 | 1516 | 0.1097 | 743424 | +| 0.2857 | 0.2501 | 1895 | 0.1319 | 930944 | +| 0.1387 | 0.3001 | 2274 | 0.1241 | 1116800 | +| 0.0494 | 0.3501 | 2653 | 0.1384 | 1303872 | +| 0.1412 | 0.4002 | 3032 | 0.1309 | 1490688 | +| 0.0509 | 0.4502 | 3411 | 0.1158 | 1678208 | +| 0.179 | 0.5002 | 3790 | 0.1276 | 1864128 | +| 0.1555 | 0.5502 | 4169 | 0.0994 | 2047552 | +| 0.1894 | 0.6002 | 4548 | 0.1099 | 2232448 | +| 0.1297 | 0.6503 | 4927 | 0.0997 | 2420096 | +| 0.1829 | 0.7003 | 5306 | 0.0936 | 2605504 | +| 0.0314 | 0.7503 | 5685 | 0.1006 | 2790656 | +| 0.1396 | 0.8003 | 6064 | 0.0963 | 2979456 | +| 0.171 | 0.8503 | 6443 | 0.1007 | 3167488 | +| 0.0013 | 0.9004 | 6822 | 0.0976 | 3355520 | +| 0.0683 | 0.9504 | 7201 | 0.0981 | 3541632 | + + +### Framework versions + +- Transformers 4.51.3 +- Pytorch 2.10.0+cu128 +- Datasets 4.0.0 +- Tokenizers 0.21.4 diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..4f7cffb --- /dev/null +++ b/all_results.json @@ -0,0 +1,13 @@ +{ + "epoch": 1.0, + "eval_loss": 0.09362584352493286, + "eval_runtime": 7.7886, + "eval_samples_per_second": 864.725, + "eval_steps_per_second": 108.107, + "num_input_tokens_seen": 3725120, + "total_flos": 2.175051626840064e+16, + "train_loss": 0.12628782090838944, + "train_runtime": 1516.0655, + "train_samples_per_second": 39.981, + "train_steps_per_second": 4.998 +} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..5a2b93f --- /dev/null +++ b/config.json @@ -0,0 +1,39 @@ +{ + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "torch_dtype": "float32", + "transformers_version": "4.51.3", + "use_cache": false, + "vocab_size": 128256 +} diff --git a/eval_results.json b/eval_results.json new file mode 100644 index 0000000..10942ca --- /dev/null +++ b/eval_results.json @@ -0,0 +1,8 @@ +{ + "epoch": 1.0, + "eval_loss": 0.09362584352493286, + "eval_runtime": 7.7886, + "eval_samples_per_second": 864.725, + "eval_steps_per_second": 108.107, + "num_input_tokens_seen": 3725120 +} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..2b8ae57 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,12 @@ +{ + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "4.51.3" +} diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..0b26269 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d4e40ce8700ba2f38669bf3fcf66f4151bcf92a3035c662b364453383b9603 +size 4943274328 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..14daf45 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,26 @@ +{ + "additional_special_tokens": [ + { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } + ], + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "<|eot_id|>" +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..1c1d8d5 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..ddc3ce0 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2069 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "additional_special_tokens": [ + "<|eom_id|>" + ], + "bos_token": "<|begin_of_text|>", + "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- if strftime_now is defined %}\n {%- set date_string = strftime_now(\"%d %b %Y\") %}\n {%- else %}\n {%- set date_string = \"26 Jul 2024\" %}\n {%- endif %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message #}\n{{- \"<|start_header_id|>system<|end_header_id|>\\n\\n\" }}\n{%- if tools is not none %}\n {{- \"Environment: ipython\\n\" }}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\\n\" }}\n{{- \"Today Date: \" + date_string + \"\\n\\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\\n\\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\\n\\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {{- \"<|eot_id|>\" }}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\\n\\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}\n{%- endif %}\n", + "clean_up_tokenization_spaces": true, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "pad_token": "<|eot_id|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "PreTrainedTokenizer" +} diff --git a/train.yaml b/train.yaml new file mode 100644 index 0000000..7a4ed16 --- /dev/null +++ b/train.yaml @@ -0,0 +1,55 @@ +seed: 42 + +### model +model_name_or_path: meta-llama/Llama-3.2-1B-Instruct +trust_remote_code: true +flash_attn: auto +use_cache: false + +### method +stage: sft +do_train: true +finetuning_type: full + +### dataset +dataset: sst2 +template: llama3 +cutoff_len: 2048 +overwrite_cache: true +preprocessing_num_workers: 4 +dataloader_num_workers: 4 +packing: false + +### output +output_dir: saves_bts_preliminary/base/llama-3.2-1b-instruct/train_sst2_42_1779354538 +logging_steps: 5 +save_steps: 0.05 +overwrite_output_dir: true +save_only_model: false +plot_loss: true +include_num_input_tokens_seen: true +push_to_hub: true +push_to_hub_organization: rbelanec +load_best_model_at_end: true +save_total_limit: 1 + +### train +per_device_train_batch_size: 8 +learning_rate: 2.0e-6 +num_train_epochs: 1 +weight_decay: 1.0e-2 +lr_scheduler_type: cosine +bf16: true +ddp_timeout: 180000000 +resume_from_checkpoint: null +warmup_ratio: 0.1 +optim: adamw_torch +report_to: +- wandb +run_name: base_llama-3.2-1b-instruct_train_sst2_42_1779354538 + +### eval +per_device_eval_batch_size: 8 +eval_strategy: steps +eval_steps: 0.05 +val_size: 0.1 \ No newline at end of file diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..d611f42 --- /dev/null +++ b/train_results.json @@ -0,0 +1,9 @@ +{ + "epoch": 1.0, + "num_input_tokens_seen": 3725120, + "total_flos": 2.175051626840064e+16, + "train_loss": 0.12628782090838944, + "train_runtime": 1516.0655, + "train_samples_per_second": 39.981, + "train_steps_per_second": 4.998 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..2ef0143 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,1535 @@ +{"current_steps": 5, "total_steps": 7577, "loss": 1.4317, "lr": 1.0554089709762531e-08, "epoch": 0.0006598917777484492, "percentage": 0.07, "elapsed_time": "0:00:00", "remaining_time": "0:16:38", "throughput": 3397.34, "total_tokens": 2240} +{"current_steps": 10, "total_steps": 7577, "loss": 1.5404, "lr": 2.3746701846965696e-08, "epoch": 0.0013197835554968984, "percentage": 0.13, "elapsed_time": "0:00:00", "remaining_time": "0:12:35", "throughput": 4678.08, "total_tokens": 4672} +{"current_steps": 15, "total_steps": 7577, "loss": 1.4488, "lr": 3.6939313984168866e-08, "epoch": 0.0019796753332453477, "percentage": 0.2, "elapsed_time": "0:00:01", "remaining_time": "0:11:09", "throughput": 5300.01, "total_tokens": 7040} +{"current_steps": 20, "total_steps": 7577, "loss": 1.469, "lr": 5.013192612137203e-08, "epoch": 0.002639567110993797, "percentage": 0.26, "elapsed_time": "0:00:01", "remaining_time": "0:10:26", "throughput": 5794.13, "total_tokens": 9600} +{"current_steps": 25, "total_steps": 7577, "loss": 1.3406, "lr": 6.33245382585752e-08, "epoch": 0.0032994588887422464, "percentage": 0.33, "elapsed_time": "0:00:01", "remaining_time": "0:09:59", "throughput": 6132.03, "total_tokens": 12160} +{"current_steps": 30, "total_steps": 7577, "loss": 1.421, "lr": 7.651715039577835e-08, "epoch": 0.0039593506664906955, "percentage": 0.4, "elapsed_time": "0:00:02", "remaining_time": "0:09:41", "throughput": 6289.1, "total_tokens": 14528} +{"current_steps": 35, "total_steps": 7577, "loss": 1.1582, "lr": 8.970976253298153e-08, "epoch": 0.004619242444239145, "percentage": 0.46, "elapsed_time": "0:00:02", "remaining_time": "0:09:27", "throughput": 6362.66, "total_tokens": 16768} +{"current_steps": 40, "total_steps": 7577, "loss": 1.1864, "lr": 1.0290237467018468e-07, "epoch": 0.005279134221987594, "percentage": 0.53, "elapsed_time": "0:00:02", "remaining_time": "0:09:18", "throughput": 6494.9, "total_tokens": 19264} +{"current_steps": 45, "total_steps": 7577, "loss": 0.8458, "lr": 1.1609498680738786e-07, "epoch": 0.005939025999736044, "percentage": 0.59, "elapsed_time": "0:00:03", "remaining_time": "0:09:12", "throughput": 6550.58, "total_tokens": 21632} +{"current_steps": 50, "total_steps": 7577, "loss": 0.7602, "lr": 1.29287598944591e-07, "epoch": 0.006598917777484493, "percentage": 0.66, "elapsed_time": "0:00:03", "remaining_time": "0:09:06", "throughput": 6615.85, "total_tokens": 24000} +{"current_steps": 55, "total_steps": 7577, "loss": 0.7195, "lr": 1.424802110817942e-07, "epoch": 0.007258809555232942, "percentage": 0.73, "elapsed_time": "0:00:03", "remaining_time": "0:09:01", "throughput": 6696.39, "total_tokens": 26496} +{"current_steps": 60, "total_steps": 7577, "loss": 0.3928, "lr": 1.5567282321899736e-07, "epoch": 0.007918701332981391, "percentage": 0.79, "elapsed_time": "0:00:04", "remaining_time": "0:08:57", "throughput": 6789.9, "total_tokens": 29120} +{"current_steps": 65, "total_steps": 7577, "loss": 0.3093, "lr": 1.688654353562005e-07, "epoch": 0.008578593110729841, "percentage": 0.86, "elapsed_time": "0:00:04", "remaining_time": "0:08:53", "throughput": 6870.9, "total_tokens": 31744} +{"current_steps": 70, "total_steps": 7577, "loss": 0.2986, "lr": 1.820580474934037e-07, "epoch": 0.00923848488847829, "percentage": 0.92, "elapsed_time": "0:00:04", "remaining_time": "0:08:50", "throughput": 6911.09, "total_tokens": 34176} +{"current_steps": 75, "total_steps": 7577, "loss": 0.2998, "lr": 1.9525065963060686e-07, "epoch": 0.009898376666226739, "percentage": 0.99, "elapsed_time": "0:00:05", "remaining_time": "0:08:47", "throughput": 6985.09, "total_tokens": 36864} +{"current_steps": 80, "total_steps": 7577, "loss": 0.2555, "lr": 2.0844327176781002e-07, "epoch": 0.010558268443975187, "percentage": 1.06, "elapsed_time": "0:00:05", "remaining_time": "0:08:45", "throughput": 7026.85, "total_tokens": 39424} +{"current_steps": 85, "total_steps": 7577, "loss": 0.2595, "lr": 2.2163588390501316e-07, "epoch": 0.011218160221723637, "percentage": 1.12, "elapsed_time": "0:00:05", "remaining_time": "0:08:43", "throughput": 7084.01, "total_tokens": 42112} +{"current_steps": 90, "total_steps": 7577, "loss": 0.2567, "lr": 2.3482849604221635e-07, "epoch": 0.011878051999472087, "percentage": 1.19, "elapsed_time": "0:00:06", "remaining_time": "0:08:41", "throughput": 7100.45, "total_tokens": 44544} +{"current_steps": 95, "total_steps": 7577, "loss": 0.1981, "lr": 2.480211081794195e-07, "epoch": 0.012537943777220536, "percentage": 1.25, "elapsed_time": "0:00:06", "remaining_time": "0:08:40", "throughput": 7122.92, "total_tokens": 47104} +{"current_steps": 100, "total_steps": 7577, "loss": 0.1626, "lr": 2.612137203166227e-07, "epoch": 0.013197835554968985, "percentage": 1.32, "elapsed_time": "0:00:06", "remaining_time": "0:08:39", "throughput": 7151.4, "total_tokens": 49664} +{"current_steps": 105, "total_steps": 7577, "loss": 0.1359, "lr": 2.744063324538258e-07, "epoch": 0.013857727332717434, "percentage": 1.39, "elapsed_time": "0:00:07", "remaining_time": "0:08:37", "throughput": 7197.13, "total_tokens": 52352} +{"current_steps": 110, "total_steps": 7577, "loss": 0.1025, "lr": 2.8759894459102903e-07, "epoch": 0.014517619110465884, "percentage": 1.45, "elapsed_time": "0:00:07", "remaining_time": "0:08:35", "throughput": 7201.47, "total_tokens": 54720} +{"current_steps": 115, "total_steps": 7577, "loss": 0.1435, "lr": 3.007915567282322e-07, "epoch": 0.015177510888214334, "percentage": 1.52, "elapsed_time": "0:00:07", "remaining_time": "0:08:34", "throughput": 7209.52, "total_tokens": 57152} +{"current_steps": 120, "total_steps": 7577, "loss": 0.2027, "lr": 3.139841688654353e-07, "epoch": 0.015837402665962782, "percentage": 1.58, "elapsed_time": "0:00:08", "remaining_time": "0:08:33", "throughput": 7237.62, "total_tokens": 59776} +{"current_steps": 125, "total_steps": 7577, "loss": 0.1344, "lr": 3.271767810026385e-07, "epoch": 0.01649729444371123, "percentage": 1.65, "elapsed_time": "0:00:08", "remaining_time": "0:08:32", "throughput": 7269.42, "total_tokens": 62464} +{"current_steps": 130, "total_steps": 7577, "loss": 0.1188, "lr": 3.403693931398417e-07, "epoch": 0.017157186221459682, "percentage": 1.72, "elapsed_time": "0:00:08", "remaining_time": "0:08:31", "throughput": 7292.2, "total_tokens": 65088} +{"current_steps": 135, "total_steps": 7577, "loss": 0.2073, "lr": 3.5356200527704485e-07, "epoch": 0.01781707799920813, "percentage": 1.78, "elapsed_time": "0:00:09", "remaining_time": "0:08:30", "throughput": 7323.53, "total_tokens": 67776} +{"current_steps": 140, "total_steps": 7577, "loss": 0.2589, "lr": 3.66754617414248e-07, "epoch": 0.01847696977695658, "percentage": 1.85, "elapsed_time": "0:00:09", "remaining_time": "0:08:29", "throughput": 7344.53, "total_tokens": 70400} +{"current_steps": 145, "total_steps": 7577, "loss": 0.1435, "lr": 3.7994722955145113e-07, "epoch": 0.01913686155470503, "percentage": 1.91, "elapsed_time": "0:00:09", "remaining_time": "0:08:28", "throughput": 7326.01, "total_tokens": 72704} +{"current_steps": 150, "total_steps": 7577, "loss": 0.3408, "lr": 3.9313984168865435e-07, "epoch": 0.019796753332453478, "percentage": 1.98, "elapsed_time": "0:00:10", "remaining_time": "0:08:27", "throughput": 7330.81, "total_tokens": 75136} +{"current_steps": 155, "total_steps": 7577, "loss": 0.0612, "lr": 4.063324538258575e-07, "epoch": 0.020456645110201926, "percentage": 2.05, "elapsed_time": "0:00:10", "remaining_time": "0:08:26", "throughput": 7340.14, "total_tokens": 77632} +{"current_steps": 160, "total_steps": 7577, "loss": 0.2462, "lr": 4.195250659630606e-07, "epoch": 0.021116536887950375, "percentage": 2.11, "elapsed_time": "0:00:10", "remaining_time": "0:08:25", "throughput": 7360.74, "total_tokens": 80320} +{"current_steps": 165, "total_steps": 7577, "loss": 0.1542, "lr": 4.3271767810026384e-07, "epoch": 0.021776428665698826, "percentage": 2.18, "elapsed_time": "0:00:11", "remaining_time": "0:08:24", "throughput": 7363.11, "total_tokens": 82752} +{"current_steps": 170, "total_steps": 7577, "loss": 0.3088, "lr": 4.45910290237467e-07, "epoch": 0.022436320443447275, "percentage": 2.24, "elapsed_time": "0:00:11", "remaining_time": "0:08:23", "throughput": 7370.45, "total_tokens": 85248} +{"current_steps": 175, "total_steps": 7577, "loss": 0.2887, "lr": 4.5910290237467017e-07, "epoch": 0.023096212221195723, "percentage": 2.31, "elapsed_time": "0:00:11", "remaining_time": "0:08:23", "throughput": 7384.71, "total_tokens": 87872} +{"current_steps": 180, "total_steps": 7577, "loss": 0.1364, "lr": 4.7229551451187333e-07, "epoch": 0.023756103998944175, "percentage": 2.38, "elapsed_time": "0:00:12", "remaining_time": "0:08:22", "throughput": 7391.26, "total_tokens": 90368} +{"current_steps": 185, "total_steps": 7577, "loss": 0.0589, "lr": 4.854881266490765e-07, "epoch": 0.024415995776692623, "percentage": 2.44, "elapsed_time": "0:00:12", "remaining_time": "0:08:21", "throughput": 7402.07, "total_tokens": 92928} +{"current_steps": 190, "total_steps": 7577, "loss": 0.1639, "lr": 4.986807387862796e-07, "epoch": 0.02507588755444107, "percentage": 2.51, "elapsed_time": "0:00:12", "remaining_time": "0:08:20", "throughput": 7397.88, "total_tokens": 95296} +{"current_steps": 195, "total_steps": 7577, "loss": 0.1103, "lr": 5.118733509234829e-07, "epoch": 0.02573577933218952, "percentage": 2.57, "elapsed_time": "0:00:13", "remaining_time": "0:08:20", "throughput": 7414.35, "total_tokens": 97984} +{"current_steps": 200, "total_steps": 7577, "loss": 0.2017, "lr": 5.250659630606859e-07, "epoch": 0.02639567110993797, "percentage": 2.64, "elapsed_time": "0:00:13", "remaining_time": "0:08:19", "throughput": 7411.98, "total_tokens": 100352} +{"current_steps": 205, "total_steps": 7577, "loss": 0.1383, "lr": 5.382585751978892e-07, "epoch": 0.02705556288768642, "percentage": 2.71, "elapsed_time": "0:00:13", "remaining_time": "0:08:18", "throughput": 7391.3, "total_tokens": 102464} +{"current_steps": 210, "total_steps": 7577, "loss": 0.1266, "lr": 5.514511873350924e-07, "epoch": 0.027715454665434867, "percentage": 2.77, "elapsed_time": "0:00:14", "remaining_time": "0:08:17", "throughput": 7403.67, "total_tokens": 105088} +{"current_steps": 215, "total_steps": 7577, "loss": 0.3019, "lr": 5.646437994722954e-07, "epoch": 0.02837534644318332, "percentage": 2.84, "elapsed_time": "0:00:14", "remaining_time": "0:08:17", "throughput": 7411.44, "total_tokens": 107648} +{"current_steps": 220, "total_steps": 7577, "loss": 0.2375, "lr": 5.778364116094987e-07, "epoch": 0.029035238220931767, "percentage": 2.9, "elapsed_time": "0:00:14", "remaining_time": "0:08:16", "throughput": 7415.87, "total_tokens": 110144} +{"current_steps": 225, "total_steps": 7577, "loss": 0.1332, "lr": 5.910290237467019e-07, "epoch": 0.029695129998680216, "percentage": 2.97, "elapsed_time": "0:00:15", "remaining_time": "0:08:15", "throughput": 7416.39, "total_tokens": 112576} +{"current_steps": 230, "total_steps": 7577, "loss": 0.2314, "lr": 6.042216358839049e-07, "epoch": 0.030355021776428667, "percentage": 3.04, "elapsed_time": "0:00:15", "remaining_time": "0:08:15", "throughput": 7430.31, "total_tokens": 115264} +{"current_steps": 235, "total_steps": 7577, "loss": 0.0848, "lr": 6.174142480211082e-07, "epoch": 0.031014913554177116, "percentage": 3.1, "elapsed_time": "0:00:15", "remaining_time": "0:08:14", "throughput": 7441.01, "total_tokens": 117888} +{"current_steps": 240, "total_steps": 7577, "loss": 0.0189, "lr": 6.306068601583114e-07, "epoch": 0.031674805331925564, "percentage": 3.17, "elapsed_time": "0:00:16", "remaining_time": "0:08:14", "throughput": 7442.18, "total_tokens": 120320} +{"current_steps": 245, "total_steps": 7577, "loss": 0.1826, "lr": 6.437994722955144e-07, "epoch": 0.032334697109674015, "percentage": 3.23, "elapsed_time": "0:00:16", "remaining_time": "0:08:13", "throughput": 7439.68, "total_tokens": 122688} +{"current_steps": 250, "total_steps": 7577, "loss": 0.2716, "lr": 6.569920844327177e-07, "epoch": 0.03299458888742246, "percentage": 3.3, "elapsed_time": "0:00:16", "remaining_time": "0:08:12", "throughput": 7446.95, "total_tokens": 125248} +{"current_steps": 255, "total_steps": 7577, "loss": 0.203, "lr": 6.701846965699208e-07, "epoch": 0.03365448066517091, "percentage": 3.37, "elapsed_time": "0:00:17", "remaining_time": "0:08:12", "throughput": 7447.33, "total_tokens": 127680} +{"current_steps": 260, "total_steps": 7577, "loss": 0.083, "lr": 6.833773087071239e-07, "epoch": 0.034314372442919364, "percentage": 3.43, "elapsed_time": "0:00:17", "remaining_time": "0:08:11", "throughput": 7464.92, "total_tokens": 130496} +{"current_steps": 265, "total_steps": 7577, "loss": 0.1837, "lr": 6.965699208443272e-07, "epoch": 0.03497426422066781, "percentage": 3.5, "elapsed_time": "0:00:17", "remaining_time": "0:08:11", "throughput": 7468.93, "total_tokens": 132992} +{"current_steps": 270, "total_steps": 7577, "loss": 0.1372, "lr": 7.097625329815303e-07, "epoch": 0.03563415599841626, "percentage": 3.56, "elapsed_time": "0:00:18", "remaining_time": "0:08:10", "throughput": 7449.51, "total_tokens": 135040} +{"current_steps": 275, "total_steps": 7577, "loss": 0.258, "lr": 7.229551451187335e-07, "epoch": 0.03629404777616471, "percentage": 3.63, "elapsed_time": "0:00:18", "remaining_time": "0:08:10", "throughput": 7455.64, "total_tokens": 137600} +{"current_steps": 280, "total_steps": 7577, "loss": 0.1103, "lr": 7.361477572559367e-07, "epoch": 0.03695393955391316, "percentage": 3.7, "elapsed_time": "0:00:18", "remaining_time": "0:08:09", "throughput": 7448.91, "total_tokens": 139904} +{"current_steps": 285, "total_steps": 7577, "loss": 0.1476, "lr": 7.493403693931398e-07, "epoch": 0.03761383133166161, "percentage": 3.76, "elapsed_time": "0:00:19", "remaining_time": "0:08:08", "throughput": 7433.88, "total_tokens": 142016} +{"current_steps": 290, "total_steps": 7577, "loss": 0.0087, "lr": 7.62532981530343e-07, "epoch": 0.03827372310941006, "percentage": 3.83, "elapsed_time": "0:00:19", "remaining_time": "0:08:08", "throughput": 7439.86, "total_tokens": 144576} +{"current_steps": 295, "total_steps": 7577, "loss": 0.085, "lr": 7.757255936675461e-07, "epoch": 0.038933614887158505, "percentage": 3.89, "elapsed_time": "0:00:19", "remaining_time": "0:08:07", "throughput": 7434.64, "total_tokens": 146880} +{"current_steps": 300, "total_steps": 7577, "loss": 0.3963, "lr": 7.889182058047493e-07, "epoch": 0.039593506664906956, "percentage": 3.96, "elapsed_time": "0:00:20", "remaining_time": "0:08:07", "throughput": 7429.61, "total_tokens": 149184} +{"current_steps": 305, "total_steps": 7577, "loss": 0.221, "lr": 8.021108179419525e-07, "epoch": 0.0402533984426554, "percentage": 4.03, "elapsed_time": "0:00:20", "remaining_time": "0:08:06", "throughput": 7416.06, "total_tokens": 151296} +{"current_steps": 310, "total_steps": 7577, "loss": 0.2076, "lr": 8.153034300791555e-07, "epoch": 0.04091329022040385, "percentage": 4.09, "elapsed_time": "0:00:20", "remaining_time": "0:08:05", "throughput": 7413.55, "total_tokens": 153664} +{"current_steps": 315, "total_steps": 7577, "loss": 0.2588, "lr": 8.284960422163588e-07, "epoch": 0.041573181998152305, "percentage": 4.16, "elapsed_time": "0:00:21", "remaining_time": "0:08:05", "throughput": 7411.06, "total_tokens": 156032} +{"current_steps": 320, "total_steps": 7577, "loss": 0.227, "lr": 8.41688654353562e-07, "epoch": 0.04223307377590075, "percentage": 4.22, "elapsed_time": "0:00:21", "remaining_time": "0:08:04", "throughput": 7414.32, "total_tokens": 158528} +{"current_steps": 325, "total_steps": 7577, "loss": 0.12, "lr": 8.54881266490765e-07, "epoch": 0.0428929655536492, "percentage": 4.29, "elapsed_time": "0:00:21", "remaining_time": "0:08:04", "throughput": 7403.3, "total_tokens": 160704} +{"current_steps": 330, "total_steps": 7577, "loss": 0.1931, "lr": 8.680738786279683e-07, "epoch": 0.04355285733139765, "percentage": 4.36, "elapsed_time": "0:00:22", "remaining_time": "0:08:03", "throughput": 7401.67, "total_tokens": 163072} +{"current_steps": 335, "total_steps": 7577, "loss": 0.1389, "lr": 8.812664907651715e-07, "epoch": 0.0442127491091461, "percentage": 4.42, "elapsed_time": "0:00:22", "remaining_time": "0:08:03", "throughput": 7404.99, "total_tokens": 165568} +{"current_steps": 340, "total_steps": 7577, "loss": 0.2857, "lr": 8.944591029023745e-07, "epoch": 0.04487264088689455, "percentage": 4.49, "elapsed_time": "0:00:22", "remaining_time": "0:08:02", "throughput": 7403.5, "total_tokens": 167936} +{"current_steps": 345, "total_steps": 7577, "loss": 0.0616, "lr": 9.076517150395778e-07, "epoch": 0.045532532664643, "percentage": 4.55, "elapsed_time": "0:00:23", "remaining_time": "0:08:02", "throughput": 7397.17, "total_tokens": 170176} +{"current_steps": 350, "total_steps": 7577, "loss": 0.149, "lr": 9.20844327176781e-07, "epoch": 0.046192424442391446, "percentage": 4.62, "elapsed_time": "0:00:23", "remaining_time": "0:08:01", "throughput": 7388.53, "total_tokens": 172352} +{"current_steps": 355, "total_steps": 7577, "loss": 0.2579, "lr": 9.340369393139841e-07, "epoch": 0.0468523162201399, "percentage": 4.69, "elapsed_time": "0:00:23", "remaining_time": "0:08:01", "throughput": 7402.17, "total_tokens": 175168} +{"current_steps": 360, "total_steps": 7577, "loss": 0.1596, "lr": 9.472295514511873e-07, "epoch": 0.04751220799788835, "percentage": 4.75, "elapsed_time": "0:00:23", "remaining_time": "0:08:01", "throughput": 7412.04, "total_tokens": 177856} +{"current_steps": 365, "total_steps": 7577, "loss": 0.2923, "lr": 9.604221635883904e-07, "epoch": 0.048172099775636794, "percentage": 4.82, "elapsed_time": "0:00:24", "remaining_time": "0:08:00", "throughput": 7408.35, "total_tokens": 180160} +{"current_steps": 370, "total_steps": 7577, "loss": 0.2137, "lr": 9.736147757255936e-07, "epoch": 0.048831991553385246, "percentage": 4.88, "elapsed_time": "0:00:24", "remaining_time": "0:08:00", "throughput": 7415.44, "total_tokens": 182784} +{"current_steps": 375, "total_steps": 7577, "loss": 0.0578, "lr": 9.86807387862797e-07, "epoch": 0.0494918833311337, "percentage": 4.95, "elapsed_time": "0:00:24", "remaining_time": "0:07:59", "throughput": 7408.63, "total_tokens": 185024} +{"current_steps": 379, "total_steps": 7577, "eval_loss": 0.16884121298789978, "epoch": 0.05001979675333245, "percentage": 5.0, "elapsed_time": "0:00:33", "remaining_time": "0:10:28", "throughput": 5655.07, "total_tokens": 187072} +{"current_steps": 380, "total_steps": 7577, "loss": 0.1527, "lr": 1e-06, "epoch": 0.05015177510888214, "percentage": 5.02, "elapsed_time": "0:00:59", "remaining_time": "0:18:47", "throughput": 3152.89, "total_tokens": 187712} +{"current_steps": 385, "total_steps": 7577, "loss": 0.2528, "lr": 1.0131926121372032e-06, "epoch": 0.050811666886630594, "percentage": 5.08, "elapsed_time": "0:00:59", "remaining_time": "0:18:38", "throughput": 3180.18, "total_tokens": 190400} +{"current_steps": 390, "total_steps": 7577, "loss": 0.1124, "lr": 1.0263852242744063e-06, "epoch": 0.05147155866437904, "percentage": 5.15, "elapsed_time": "0:01:00", "remaining_time": "0:18:29", "throughput": 3209.98, "total_tokens": 193280} +{"current_steps": 395, "total_steps": 7577, "loss": 0.1545, "lr": 1.0395778364116096e-06, "epoch": 0.05213145044212749, "percentage": 5.21, "elapsed_time": "0:01:00", "remaining_time": "0:18:20", "throughput": 3230.38, "total_tokens": 195584} +{"current_steps": 400, "total_steps": 7577, "loss": 0.0824, "lr": 1.0527704485488126e-06, "epoch": 0.05279134221987594, "percentage": 5.28, "elapsed_time": "0:01:00", "remaining_time": "0:18:12", "throughput": 3255.16, "total_tokens": 198208} +{"current_steps": 405, "total_steps": 7577, "loss": 0.255, "lr": 1.0659630606860157e-06, "epoch": 0.05345123399762439, "percentage": 5.35, "elapsed_time": "0:01:01", "remaining_time": "0:18:04", "throughput": 3278.13, "total_tokens": 200704} +{"current_steps": 410, "total_steps": 7577, "loss": 0.2055, "lr": 1.079155672823219e-06, "epoch": 0.05411112577537284, "percentage": 5.41, "elapsed_time": "0:01:01", "remaining_time": "0:17:56", "throughput": 3299.92, "total_tokens": 203136} +{"current_steps": 415, "total_steps": 7577, "loss": 0.1496, "lr": 1.0923482849604222e-06, "epoch": 0.05477101755312129, "percentage": 5.48, "elapsed_time": "0:01:01", "remaining_time": "0:17:48", "throughput": 3320.62, "total_tokens": 205504} +{"current_steps": 420, "total_steps": 7577, "loss": 0.2539, "lr": 1.1055408970976253e-06, "epoch": 0.055430909330869735, "percentage": 5.54, "elapsed_time": "0:01:02", "remaining_time": "0:17:40", "throughput": 3343.21, "total_tokens": 208000} +{"current_steps": 425, "total_steps": 7577, "loss": 0.1106, "lr": 1.1187335092348285e-06, "epoch": 0.056090801108618187, "percentage": 5.61, "elapsed_time": "0:01:02", "remaining_time": "0:17:32", "throughput": 3366.51, "total_tokens": 210560} +{"current_steps": 430, "total_steps": 7577, "loss": 0.1771, "lr": 1.1319261213720316e-06, "epoch": 0.05675069288636664, "percentage": 5.68, "elapsed_time": "0:01:02", "remaining_time": "0:17:25", "throughput": 3388.53, "total_tokens": 213056} +{"current_steps": 435, "total_steps": 7577, "loss": 0.1155, "lr": 1.1451187335092347e-06, "epoch": 0.05741058466411508, "percentage": 5.74, "elapsed_time": "0:01:03", "remaining_time": "0:17:17", "throughput": 3406.56, "total_tokens": 215296} +{"current_steps": 440, "total_steps": 7577, "loss": 0.0203, "lr": 1.158311345646438e-06, "epoch": 0.058070476441863535, "percentage": 5.81, "elapsed_time": "0:01:03", "remaining_time": "0:17:10", "throughput": 3423.41, "total_tokens": 217472} +{"current_steps": 445, "total_steps": 7577, "loss": 0.0346, "lr": 1.1715039577836412e-06, "epoch": 0.058730368219611986, "percentage": 5.87, "elapsed_time": "0:01:03", "remaining_time": "0:17:03", "throughput": 3444.88, "total_tokens": 219968} +{"current_steps": 450, "total_steps": 7577, "loss": 0.0218, "lr": 1.1846965699208443e-06, "epoch": 0.05939025999736043, "percentage": 5.94, "elapsed_time": "0:01:04", "remaining_time": "0:16:56", "throughput": 3467.95, "total_tokens": 222592} +{"current_steps": 455, "total_steps": 7577, "loss": 0.522, "lr": 1.1978891820580475e-06, "epoch": 0.06005015177510888, "percentage": 6.01, "elapsed_time": "0:01:04", "remaining_time": "0:16:49", "throughput": 3484.28, "total_tokens": 224768} +{"current_steps": 460, "total_steps": 7577, "loss": 0.2349, "lr": 1.2110817941952508e-06, "epoch": 0.060710043552857335, "percentage": 6.07, "elapsed_time": "0:01:04", "remaining_time": "0:16:43", "throughput": 3505.04, "total_tokens": 227264} +{"current_steps": 465, "total_steps": 7577, "loss": 0.2363, "lr": 1.2242744063324536e-06, "epoch": 0.06136993533060578, "percentage": 6.14, "elapsed_time": "0:01:05", "remaining_time": "0:16:36", "throughput": 3525.75, "total_tokens": 229760} +{"current_steps": 470, "total_steps": 7577, "loss": 0.1719, "lr": 1.237467018469657e-06, "epoch": 0.06202982710835423, "percentage": 6.2, "elapsed_time": "0:01:05", "remaining_time": "0:16:30", "throughput": 3542.62, "total_tokens": 232000} +{"current_steps": 475, "total_steps": 7577, "loss": 0.1564, "lr": 1.2506596306068602e-06, "epoch": 0.06268971888610268, "percentage": 6.27, "elapsed_time": "0:01:05", "remaining_time": "0:16:24", "throughput": 3558.15, "total_tokens": 234176} +{"current_steps": 480, "total_steps": 7577, "loss": 0.0993, "lr": 1.2638522427440632e-06, "epoch": 0.06334961066385113, "percentage": 6.33, "elapsed_time": "0:01:06", "remaining_time": "0:16:17", "throughput": 3579.16, "total_tokens": 236736} +{"current_steps": 485, "total_steps": 7577, "loss": 0.006, "lr": 1.2770448548812665e-06, "epoch": 0.06400950244159957, "percentage": 6.4, "elapsed_time": "0:01:06", "remaining_time": "0:16:11", "throughput": 3597.4, "total_tokens": 239104} +{"current_steps": 490, "total_steps": 7577, "loss": 0.3751, "lr": 1.2902374670184698e-06, "epoch": 0.06466939421934803, "percentage": 6.47, "elapsed_time": "0:01:06", "remaining_time": "0:16:06", "throughput": 3617.13, "total_tokens": 241600} +{"current_steps": 495, "total_steps": 7577, "loss": 0.31, "lr": 1.3034300791556726e-06, "epoch": 0.06532928599709648, "percentage": 6.53, "elapsed_time": "0:01:07", "remaining_time": "0:16:00", "throughput": 3637.68, "total_tokens": 244160} +{"current_steps": 500, "total_steps": 7577, "loss": 0.1775, "lr": 1.316622691292876e-06, "epoch": 0.06598917777484492, "percentage": 6.6, "elapsed_time": "0:01:07", "remaining_time": "0:15:54", "throughput": 3654.33, "total_tokens": 246464} +{"current_steps": 505, "total_steps": 7577, "loss": 0.0849, "lr": 1.3298153034300792e-06, "epoch": 0.06664906955259338, "percentage": 6.66, "elapsed_time": "0:01:07", "remaining_time": "0:15:49", "throughput": 3673.41, "total_tokens": 248960} +{"current_steps": 510, "total_steps": 7577, "loss": 0.1716, "lr": 1.3430079155672822e-06, "epoch": 0.06730896133034182, "percentage": 6.73, "elapsed_time": "0:01:08", "remaining_time": "0:15:43", "throughput": 3691.66, "total_tokens": 251392} +{"current_steps": 515, "total_steps": 7577, "loss": 0.2321, "lr": 1.3562005277044855e-06, "epoch": 0.06796885310809027, "percentage": 6.8, "elapsed_time": "0:01:08", "remaining_time": "0:15:38", "throughput": 3710.57, "total_tokens": 253888} +{"current_steps": 520, "total_steps": 7577, "loss": 0.1398, "lr": 1.3693931398416888e-06, "epoch": 0.06862874488583873, "percentage": 6.86, "elapsed_time": "0:01:08", "remaining_time": "0:15:32", "throughput": 3729.35, "total_tokens": 256384} +{"current_steps": 525, "total_steps": 7577, "loss": 0.1866, "lr": 1.3825857519788916e-06, "epoch": 0.06928863666358717, "percentage": 6.93, "elapsed_time": "0:01:09", "remaining_time": "0:15:27", "throughput": 3742.54, "total_tokens": 258496} +{"current_steps": 530, "total_steps": 7577, "loss": 0.1035, "lr": 1.3957783641160949e-06, "epoch": 0.06994852844133562, "percentage": 6.99, "elapsed_time": "0:01:09", "remaining_time": "0:15:22", "throughput": 3759.15, "total_tokens": 260864} +{"current_steps": 535, "total_steps": 7577, "loss": 0.0497, "lr": 1.4089709762532982e-06, "epoch": 0.07060842021908408, "percentage": 7.06, "elapsed_time": "0:01:09", "remaining_time": "0:15:17", "throughput": 3777.26, "total_tokens": 263360} +{"current_steps": 540, "total_steps": 7577, "loss": 0.3041, "lr": 1.4221635883905012e-06, "epoch": 0.07126831199683252, "percentage": 7.13, "elapsed_time": "0:01:10", "remaining_time": "0:15:12", "throughput": 3798.61, "total_tokens": 266112} +{"current_steps": 545, "total_steps": 7577, "loss": 0.2543, "lr": 1.4353562005277045e-06, "epoch": 0.07192820377458096, "percentage": 7.19, "elapsed_time": "0:01:10", "remaining_time": "0:15:08", "throughput": 3815.52, "total_tokens": 268544} +{"current_steps": 550, "total_steps": 7577, "loss": 0.4179, "lr": 1.4485488126649078e-06, "epoch": 0.07258809555232942, "percentage": 7.26, "elapsed_time": "0:01:10", "remaining_time": "0:15:03", "throughput": 3831.45, "total_tokens": 270912} +{"current_steps": 555, "total_steps": 7577, "loss": 0.0028, "lr": 1.4617414248021108e-06, "epoch": 0.07324798733007787, "percentage": 7.32, "elapsed_time": "0:01:11", "remaining_time": "0:14:58", "throughput": 3852.04, "total_tokens": 273664} +{"current_steps": 560, "total_steps": 7577, "loss": 0.1789, "lr": 1.4749340369393139e-06, "epoch": 0.07390787910782631, "percentage": 7.39, "elapsed_time": "0:01:11", "remaining_time": "0:14:54", "throughput": 3869.31, "total_tokens": 276160} +{"current_steps": 565, "total_steps": 7577, "loss": 0.0054, "lr": 1.4881266490765171e-06, "epoch": 0.07456777088557477, "percentage": 7.46, "elapsed_time": "0:01:11", "remaining_time": "0:14:49", "throughput": 3887.99, "total_tokens": 278784} +{"current_steps": 570, "total_steps": 7577, "loss": 0.2245, "lr": 1.5013192612137202e-06, "epoch": 0.07522766266332322, "percentage": 7.52, "elapsed_time": "0:01:12", "remaining_time": "0:14:45", "throughput": 3903.37, "total_tokens": 281152} +{"current_steps": 575, "total_steps": 7577, "loss": 0.2359, "lr": 1.5145118733509235e-06, "epoch": 0.07588755444107166, "percentage": 7.59, "elapsed_time": "0:01:12", "remaining_time": "0:14:41", "throughput": 3917.72, "total_tokens": 283456} +{"current_steps": 580, "total_steps": 7577, "loss": 0.0789, "lr": 1.5277044854881265e-06, "epoch": 0.07654744621882012, "percentage": 7.65, "elapsed_time": "0:01:12", "remaining_time": "0:14:36", "throughput": 3935.08, "total_tokens": 286016} +{"current_steps": 585, "total_steps": 7577, "loss": 0.1872, "lr": 1.5408970976253298e-06, "epoch": 0.07720733799656856, "percentage": 7.72, "elapsed_time": "0:01:13", "remaining_time": "0:14:32", "throughput": 3950.83, "total_tokens": 288448} +{"current_steps": 590, "total_steps": 7577, "loss": 0.1543, "lr": 1.5540897097625329e-06, "epoch": 0.07786722977431701, "percentage": 7.79, "elapsed_time": "0:01:13", "remaining_time": "0:14:28", "throughput": 3965.56, "total_tokens": 290816} +{"current_steps": 595, "total_steps": 7577, "loss": 0.2174, "lr": 1.567282321899736e-06, "epoch": 0.07852712155206547, "percentage": 7.85, "elapsed_time": "0:01:13", "remaining_time": "0:14:24", "throughput": 3984.19, "total_tokens": 293504} +{"current_steps": 600, "total_steps": 7577, "loss": 0.1323, "lr": 1.5804749340369392e-06, "epoch": 0.07918701332981391, "percentage": 7.92, "elapsed_time": "0:01:13", "remaining_time": "0:14:20", "throughput": 3997.1, "total_tokens": 295744} +{"current_steps": 605, "total_steps": 7577, "loss": 0.0865, "lr": 1.5936675461741425e-06, "epoch": 0.07984690510756236, "percentage": 7.98, "elapsed_time": "0:01:14", "remaining_time": "0:14:16", "throughput": 4011.34, "total_tokens": 298112} +{"current_steps": 610, "total_steps": 7577, "loss": 0.1034, "lr": 1.6068601583113455e-06, "epoch": 0.0805067968853108, "percentage": 8.05, "elapsed_time": "0:01:14", "remaining_time": "0:14:12", "throughput": 4027.06, "total_tokens": 300608} +{"current_steps": 615, "total_steps": 7577, "loss": 0.0048, "lr": 1.6200527704485488e-06, "epoch": 0.08116668866305926, "percentage": 8.12, "elapsed_time": "0:01:14", "remaining_time": "0:14:08", "throughput": 4045.74, "total_tokens": 303360} +{"current_steps": 620, "total_steps": 7577, "loss": 0.0325, "lr": 1.633245382585752e-06, "epoch": 0.0818265804408077, "percentage": 8.18, "elapsed_time": "0:01:15", "remaining_time": "0:14:05", "throughput": 4061.99, "total_tokens": 305920} +{"current_steps": 625, "total_steps": 7577, "loss": 0.0698, "lr": 1.646437994722955e-06, "epoch": 0.08248647221855615, "percentage": 8.25, "elapsed_time": "0:01:15", "remaining_time": "0:14:01", "throughput": 4077.33, "total_tokens": 308416} +{"current_steps": 630, "total_steps": 7577, "loss": 0.1542, "lr": 1.6596306068601582e-06, "epoch": 0.08314636399630461, "percentage": 8.31, "elapsed_time": "0:01:15", "remaining_time": "0:13:57", "throughput": 4091.92, "total_tokens": 310848} +{"current_steps": 635, "total_steps": 7577, "loss": 0.225, "lr": 1.6728232189973614e-06, "epoch": 0.08380625577405305, "percentage": 8.38, "elapsed_time": "0:01:16", "remaining_time": "0:13:54", "throughput": 4107.84, "total_tokens": 313408} +{"current_steps": 640, "total_steps": 7577, "loss": 0.0946, "lr": 1.6860158311345645e-06, "epoch": 0.0844661475518015, "percentage": 8.45, "elapsed_time": "0:01:16", "remaining_time": "0:13:50", "throughput": 4122.6, "total_tokens": 315904} +{"current_steps": 645, "total_steps": 7577, "loss": 0.2463, "lr": 1.6992084432717678e-06, "epoch": 0.08512603932954996, "percentage": 8.51, "elapsed_time": "0:01:16", "remaining_time": "0:13:47", "throughput": 4133.35, "total_tokens": 318080} +{"current_steps": 650, "total_steps": 7577, "loss": 0.0751, "lr": 1.712401055408971e-06, "epoch": 0.0857859311072984, "percentage": 8.58, "elapsed_time": "0:01:17", "remaining_time": "0:13:43", "throughput": 4143.77, "total_tokens": 320256} +{"current_steps": 655, "total_steps": 7577, "loss": 0.0116, "lr": 1.7255936675461739e-06, "epoch": 0.08644582288504685, "percentage": 8.64, "elapsed_time": "0:01:17", "remaining_time": "0:13:40", "throughput": 4154.73, "total_tokens": 322496} +{"current_steps": 660, "total_steps": 7577, "loss": 0.1616, "lr": 1.7387862796833772e-06, "epoch": 0.0871057146627953, "percentage": 8.71, "elapsed_time": "0:01:17", "remaining_time": "0:13:37", "throughput": 4170.4, "total_tokens": 325120} +{"current_steps": 665, "total_steps": 7577, "loss": 0.0802, "lr": 1.7519788918205804e-06, "epoch": 0.08776560644054375, "percentage": 8.78, "elapsed_time": "0:01:18", "remaining_time": "0:13:33", "throughput": 4180.87, "total_tokens": 327296} +{"current_steps": 670, "total_steps": 7577, "loss": 0.4002, "lr": 1.7651715039577835e-06, "epoch": 0.0884254982182922, "percentage": 8.84, "elapsed_time": "0:01:18", "remaining_time": "0:13:30", "throughput": 4193.44, "total_tokens": 329664} +{"current_steps": 675, "total_steps": 7577, "loss": 0.0953, "lr": 1.7783641160949868e-06, "epoch": 0.08908538999604065, "percentage": 8.91, "elapsed_time": "0:01:18", "remaining_time": "0:13:27", "throughput": 4209.8, "total_tokens": 332416} +{"current_steps": 680, "total_steps": 7577, "loss": 0.0779, "lr": 1.79155672823219e-06, "epoch": 0.0897452817737891, "percentage": 8.97, "elapsed_time": "0:01:19", "remaining_time": "0:13:24", "throughput": 4224.17, "total_tokens": 334976} +{"current_steps": 685, "total_steps": 7577, "loss": 0.0366, "lr": 1.8047493403693929e-06, "epoch": 0.09040517355153754, "percentage": 9.04, "elapsed_time": "0:01:19", "remaining_time": "0:13:21", "throughput": 4237.58, "total_tokens": 337472} +{"current_steps": 690, "total_steps": 7577, "loss": 0.1887, "lr": 1.8179419525065961e-06, "epoch": 0.091065065329286, "percentage": 9.11, "elapsed_time": "0:01:19", "remaining_time": "0:13:18", "throughput": 4250.27, "total_tokens": 339904} +{"current_steps": 695, "total_steps": 7577, "loss": 0.2216, "lr": 1.8311345646437994e-06, "epoch": 0.09172495710703445, "percentage": 9.17, "elapsed_time": "0:01:20", "remaining_time": "0:13:15", "throughput": 4262.42, "total_tokens": 342272} +{"current_steps": 700, "total_steps": 7577, "loss": 0.197, "lr": 1.8443271767810025e-06, "epoch": 0.09238484888478289, "percentage": 9.24, "elapsed_time": "0:01:20", "remaining_time": "0:13:12", "throughput": 4274.6, "total_tokens": 344640} +{"current_steps": 705, "total_steps": 7577, "loss": 0.0457, "lr": 1.8575197889182057e-06, "epoch": 0.09304474066253135, "percentage": 9.3, "elapsed_time": "0:01:20", "remaining_time": "0:13:09", "throughput": 4287.28, "total_tokens": 347072} +{"current_steps": 710, "total_steps": 7577, "loss": 0.1862, "lr": 1.870712401055409e-06, "epoch": 0.0937046324402798, "percentage": 9.37, "elapsed_time": "0:01:21", "remaining_time": "0:13:06", "throughput": 4302.16, "total_tokens": 349696} +{"current_steps": 715, "total_steps": 7577, "loss": 0.0762, "lr": 1.883905013192612e-06, "epoch": 0.09436452421802824, "percentage": 9.44, "elapsed_time": "0:01:21", "remaining_time": "0:13:03", "throughput": 4316.18, "total_tokens": 352256} +{"current_steps": 720, "total_steps": 7577, "loss": 0.1502, "lr": 1.8970976253298151e-06, "epoch": 0.0950244159957767, "percentage": 9.5, "elapsed_time": "0:01:21", "remaining_time": "0:13:00", "throughput": 4332.17, "total_tokens": 355008} +{"current_steps": 725, "total_steps": 7577, "loss": 0.2955, "lr": 1.9102902374670186e-06, "epoch": 0.09568430777352514, "percentage": 9.57, "elapsed_time": "0:01:22", "remaining_time": "0:12:57", "throughput": 4343.82, "total_tokens": 357376} +{"current_steps": 730, "total_steps": 7577, "loss": 0.1803, "lr": 1.9234828496042215e-06, "epoch": 0.09634419955127359, "percentage": 9.63, "elapsed_time": "0:01:22", "remaining_time": "0:12:54", "throughput": 4354.69, "total_tokens": 359680} +{"current_steps": 735, "total_steps": 7577, "loss": 0.1343, "lr": 1.9366754617414247e-06, "epoch": 0.09700409132902205, "percentage": 9.7, "elapsed_time": "0:01:22", "remaining_time": "0:12:51", "throughput": 4367.4, "total_tokens": 362176} +{"current_steps": 740, "total_steps": 7577, "loss": 0.0823, "lr": 1.949868073878628e-06, "epoch": 0.09766398310677049, "percentage": 9.77, "elapsed_time": "0:01:23", "remaining_time": "0:12:49", "throughput": 4384.26, "total_tokens": 365056} +{"current_steps": 745, "total_steps": 7577, "loss": 0.3164, "lr": 1.963060686015831e-06, "epoch": 0.09832387488451894, "percentage": 9.83, "elapsed_time": "0:01:23", "remaining_time": "0:12:46", "throughput": 4396.17, "total_tokens": 367488} +{"current_steps": 750, "total_steps": 7577, "loss": 0.3437, "lr": 1.976253298153034e-06, "epoch": 0.0989837666622674, "percentage": 9.9, "elapsed_time": "0:01:23", "remaining_time": "0:12:43", "throughput": 4406.74, "total_tokens": 369792} +{"current_steps": 755, "total_steps": 7577, "loss": 0.1097, "lr": 1.9894459102902374e-06, "epoch": 0.09964365844001584, "percentage": 9.96, "elapsed_time": "0:01:24", "remaining_time": "0:12:41", "throughput": 4417.76, "total_tokens": 372160} +{"current_steps": 758, "total_steps": 7577, "eval_loss": 0.13667261600494385, "epoch": 0.1000395935066649, "percentage": 10.0, "elapsed_time": "0:01:32", "remaining_time": "0:13:50", "throughput": 4045.07, "total_tokens": 373504} +{"current_steps": 760, "total_steps": 7577, "loss": 0.1005, "lr": 1.9999998938723955e-06, "epoch": 0.10030355021776428, "percentage": 10.03, "elapsed_time": "0:01:59", "remaining_time": "0:17:51", "throughput": 3133.36, "total_tokens": 374272} +{"current_steps": 765, "total_steps": 7577, "loss": 0.0727, "lr": 1.9999961794086063e-06, "epoch": 0.10096344199551274, "percentage": 10.1, "elapsed_time": "0:01:59", "remaining_time": "0:17:46", "throughput": 3145.09, "total_tokens": 376704} +{"current_steps": 770, "total_steps": 7577, "loss": 0.287, "lr": 1.999987158587122e-06, "epoch": 0.10162333377326119, "percentage": 10.16, "elapsed_time": "0:02:00", "remaining_time": "0:17:41", "throughput": 3156.71, "total_tokens": 379136} +{"current_steps": 775, "total_steps": 7577, "loss": 0.1199, "lr": 1.9999728314558114e-06, "epoch": 0.10228322555100963, "percentage": 10.23, "elapsed_time": "0:02:00", "remaining_time": "0:17:37", "throughput": 3168.31, "total_tokens": 381568} +{"current_steps": 780, "total_steps": 7577, "loss": 0.2967, "lr": 1.9999531980906988e-06, "epoch": 0.10294311732875808, "percentage": 10.29, "elapsed_time": "0:02:00", "remaining_time": "0:17:32", "throughput": 3180.81, "total_tokens": 384128} +{"current_steps": 785, "total_steps": 7577, "loss": 0.227, "lr": 1.999928258595967e-06, "epoch": 0.10360300910650654, "percentage": 10.36, "elapsed_time": "0:02:01", "remaining_time": "0:17:27", "throughput": 3190.19, "total_tokens": 386304} +{"current_steps": 790, "total_steps": 7577, "loss": 0.3706, "lr": 1.9998980131039534e-06, "epoch": 0.10426290088425498, "percentage": 10.43, "elapsed_time": "0:02:01", "remaining_time": "0:17:23", "throughput": 3202.59, "total_tokens": 388864} +{"current_steps": 795, "total_steps": 7577, "loss": 0.0609, "lr": 1.999862461775153e-06, "epoch": 0.10492279266200343, "percentage": 10.49, "elapsed_time": "0:02:01", "remaining_time": "0:17:18", "throughput": 3212.4, "total_tokens": 391104} +{"current_steps": 800, "total_steps": 7577, "loss": 0.1122, "lr": 1.999821604798214e-06, "epoch": 0.10558268443975188, "percentage": 10.56, "elapsed_time": "0:02:02", "remaining_time": "0:17:14", "throughput": 3226.19, "total_tokens": 393856} +{"current_steps": 805, "total_steps": 7577, "loss": 0.2655, "lr": 1.999775442389939e-06, "epoch": 0.10624257621750033, "percentage": 10.62, "elapsed_time": "0:02:02", "remaining_time": "0:17:09", "throughput": 3237.95, "total_tokens": 396352} +{"current_steps": 810, "total_steps": 7577, "loss": 0.1068, "lr": 1.9997239747952843e-06, "epoch": 0.10690246799524877, "percentage": 10.69, "elapsed_time": "0:02:02", "remaining_time": "0:17:05", "throughput": 3247.63, "total_tokens": 398592} +{"current_steps": 815, "total_steps": 7577, "loss": 0.0669, "lr": 1.9996672022873546e-06, "epoch": 0.10756235977299723, "percentage": 10.76, "elapsed_time": "0:02:03", "remaining_time": "0:17:01", "throughput": 3259.32, "total_tokens": 401088} +{"current_steps": 820, "total_steps": 7577, "loss": 0.1053, "lr": 1.9996051251674073e-06, "epoch": 0.10822225155074568, "percentage": 10.82, "elapsed_time": "0:02:03", "remaining_time": "0:16:56", "throughput": 3269.92, "total_tokens": 403456} +{"current_steps": 825, "total_steps": 7577, "loss": 0.3053, "lr": 1.999537743764847e-06, "epoch": 0.10888214332849412, "percentage": 10.89, "elapsed_time": "0:02:03", "remaining_time": "0:16:52", "throughput": 3279.53, "total_tokens": 405696} +{"current_steps": 830, "total_steps": 7577, "loss": 0.4762, "lr": 1.999465058437225e-06, "epoch": 0.10954203510624258, "percentage": 10.95, "elapsed_time": "0:02:04", "remaining_time": "0:16:48", "throughput": 3290.54, "total_tokens": 408128} +{"current_steps": 835, "total_steps": 7577, "loss": 0.0134, "lr": 1.9993870695702364e-06, "epoch": 0.11020192688399102, "percentage": 11.02, "elapsed_time": "0:02:04", "remaining_time": "0:16:44", "throughput": 3304.8, "total_tokens": 411008} +{"current_steps": 840, "total_steps": 7577, "loss": 0.3147, "lr": 1.9993037775777206e-06, "epoch": 0.11086181866173947, "percentage": 11.09, "elapsed_time": "0:02:04", "remaining_time": "0:16:40", "throughput": 3314.73, "total_tokens": 413312} +{"current_steps": 845, "total_steps": 7577, "loss": 0.1734, "lr": 1.999215182901656e-06, "epoch": 0.11152171043948793, "percentage": 11.15, "elapsed_time": "0:02:05", "remaining_time": "0:16:35", "throughput": 3324.6, "total_tokens": 415616} +{"current_steps": 850, "total_steps": 7577, "loss": 0.23, "lr": 1.9991212860121587e-06, "epoch": 0.11218160221723637, "percentage": 11.22, "elapsed_time": "0:02:05", "remaining_time": "0:16:31", "throughput": 3337.74, "total_tokens": 418368} +{"current_steps": 855, "total_steps": 7577, "loss": 0.0658, "lr": 1.999022087407482e-06, "epoch": 0.11284149399498482, "percentage": 11.28, "elapsed_time": "0:02:05", "remaining_time": "0:16:28", "throughput": 3348.94, "total_tokens": 420864} +{"current_steps": 860, "total_steps": 7577, "loss": 0.2781, "lr": 1.998917587614011e-06, "epoch": 0.11350138577273328, "percentage": 11.35, "elapsed_time": "0:02:05", "remaining_time": "0:16:24", "throughput": 3357.7, "total_tokens": 423040} +{"current_steps": 865, "total_steps": 7577, "loss": 0.3602, "lr": 1.9988077871862615e-06, "epoch": 0.11416127755048172, "percentage": 11.42, "elapsed_time": "0:02:06", "remaining_time": "0:16:20", "throughput": 3367.39, "total_tokens": 425344} +{"current_steps": 870, "total_steps": 7577, "loss": 0.0011, "lr": 1.9986926867068752e-06, "epoch": 0.11482116932823017, "percentage": 11.48, "elapsed_time": "0:02:06", "remaining_time": "0:16:16", "throughput": 3379.33, "total_tokens": 427968} +{"current_steps": 875, "total_steps": 7577, "loss": 0.3594, "lr": 1.998572286786619e-06, "epoch": 0.11548106110597862, "percentage": 11.55, "elapsed_time": "0:02:06", "remaining_time": "0:16:12", "throughput": 3391.15, "total_tokens": 430592} +{"current_steps": 880, "total_steps": 7577, "loss": 0.2425, "lr": 1.9984465880643807e-06, "epoch": 0.11614095288372707, "percentage": 11.61, "elapsed_time": "0:02:07", "remaining_time": "0:16:08", "throughput": 3402.56, "total_tokens": 433152} +{"current_steps": 885, "total_steps": 7577, "loss": 0.0489, "lr": 1.998315591207165e-06, "epoch": 0.11680084466147551, "percentage": 11.68, "elapsed_time": "0:02:07", "remaining_time": "0:16:05", "throughput": 3412.04, "total_tokens": 435456} +{"current_steps": 890, "total_steps": 7577, "loss": 0.1876, "lr": 1.9981792969100912e-06, "epoch": 0.11746073643922397, "percentage": 11.75, "elapsed_time": "0:02:07", "remaining_time": "0:16:01", "throughput": 3423.78, "total_tokens": 438080} +{"current_steps": 895, "total_steps": 7577, "loss": 0.2044, "lr": 1.9980377058963875e-06, "epoch": 0.11812062821697242, "percentage": 11.81, "elapsed_time": "0:02:08", "remaining_time": "0:15:57", "throughput": 3434.97, "total_tokens": 440640} +{"current_steps": 900, "total_steps": 7577, "loss": 0.028, "lr": 1.99789081891739e-06, "epoch": 0.11878051999472086, "percentage": 11.88, "elapsed_time": "0:02:08", "remaining_time": "0:15:54", "throughput": 3444.78, "total_tokens": 443008} +{"current_steps": 905, "total_steps": 7577, "loss": 0.1773, "lr": 1.997738636752536e-06, "epoch": 0.11944041177246932, "percentage": 11.94, "elapsed_time": "0:02:08", "remaining_time": "0:15:50", "throughput": 3454.0, "total_tokens": 445312} +{"current_steps": 910, "total_steps": 7577, "loss": 0.014, "lr": 1.9975811602093624e-06, "epoch": 0.12010030355021777, "percentage": 12.01, "elapsed_time": "0:02:09", "remaining_time": "0:15:46", "throughput": 3463.72, "total_tokens": 447680} +{"current_steps": 915, "total_steps": 7577, "loss": 0.2574, "lr": 1.9974183901234984e-06, "epoch": 0.12076019532796621, "percentage": 12.08, "elapsed_time": "0:02:09", "remaining_time": "0:15:43", "throughput": 3475.58, "total_tokens": 450368} +{"current_steps": 920, "total_steps": 7577, "loss": 0.1599, "lr": 1.997250327358664e-06, "epoch": 0.12142008710571467, "percentage": 12.14, "elapsed_time": "0:02:09", "remaining_time": "0:15:39", "throughput": 3485.61, "total_tokens": 452800} +{"current_steps": 925, "total_steps": 7577, "loss": 0.023, "lr": 1.997076972806664e-06, "epoch": 0.12207997888346311, "percentage": 12.21, "elapsed_time": "0:02:10", "remaining_time": "0:15:36", "throughput": 3499.19, "total_tokens": 455744} +{"current_steps": 930, "total_steps": 7577, "loss": 0.201, "lr": 1.9968983273873827e-06, "epoch": 0.12273987066121156, "percentage": 12.27, "elapsed_time": "0:02:10", "remaining_time": "0:15:33", "throughput": 3509.11, "total_tokens": 458176} +{"current_steps": 935, "total_steps": 7577, "loss": 0.0808, "lr": 1.99671439204878e-06, "epoch": 0.12339976243896002, "percentage": 12.34, "elapsed_time": "0:02:10", "remaining_time": "0:15:29", "throughput": 3518.09, "total_tokens": 460480} +{"current_steps": 940, "total_steps": 7577, "loss": 0.1766, "lr": 1.9965251677668873e-06, "epoch": 0.12405965421670846, "percentage": 12.41, "elapsed_time": "0:02:11", "remaining_time": "0:15:26", "throughput": 3526.1, "total_tokens": 462656} +{"current_steps": 945, "total_steps": 7577, "loss": 0.3062, "lr": 1.9963306555458e-06, "epoch": 0.1247195459944569, "percentage": 12.47, "elapsed_time": "0:02:11", "remaining_time": "0:15:23", "throughput": 3537.67, "total_tokens": 465344} +{"current_steps": 950, "total_steps": 7577, "loss": 0.4272, "lr": 1.9961308564176723e-06, "epoch": 0.12537943777220537, "percentage": 12.54, "elapsed_time": "0:02:11", "remaining_time": "0:15:19", "throughput": 3546.92, "total_tokens": 467712} +{"current_steps": 955, "total_steps": 7577, "loss": 0.223, "lr": 1.9959257714427147e-06, "epoch": 0.1260393295499538, "percentage": 12.6, "elapsed_time": "0:02:12", "remaining_time": "0:15:16", "throughput": 3556.18, "total_tokens": 470080} +{"current_steps": 960, "total_steps": 7577, "loss": 0.1762, "lr": 1.995715401709186e-06, "epoch": 0.12669922132770225, "percentage": 12.67, "elapsed_time": "0:02:12", "remaining_time": "0:15:13", "throughput": 3565.81, "total_tokens": 472512} +{"current_steps": 965, "total_steps": 7577, "loss": 0.1271, "lr": 1.995499748333387e-06, "epoch": 0.1273591131054507, "percentage": 12.74, "elapsed_time": "0:02:12", "remaining_time": "0:15:10", "throughput": 3574.05, "total_tokens": 474752} +{"current_steps": 970, "total_steps": 7577, "loss": 0.1233, "lr": 1.9952788124596555e-06, "epoch": 0.12801900488319914, "percentage": 12.8, "elapsed_time": "0:02:13", "remaining_time": "0:15:07", "throughput": 3585.31, "total_tokens": 477440} +{"current_steps": 975, "total_steps": 7577, "loss": 0.1272, "lr": 1.9950525952603617e-06, "epoch": 0.12867889666094762, "percentage": 12.87, "elapsed_time": "0:02:13", "remaining_time": "0:15:03", "throughput": 3595.66, "total_tokens": 480000} +{"current_steps": 980, "total_steps": 7577, "loss": 0.1456, "lr": 1.994821097935899e-06, "epoch": 0.12933878843869606, "percentage": 12.93, "elapsed_time": "0:02:13", "remaining_time": "0:15:00", "throughput": 3604.62, "total_tokens": 482368} +{"current_steps": 985, "total_steps": 7577, "loss": 0.0077, "lr": 1.9945843217146804e-06, "epoch": 0.1299986802164445, "percentage": 13.0, "elapsed_time": "0:02:14", "remaining_time": "0:14:57", "throughput": 3612.14, "total_tokens": 484544} +{"current_steps": 990, "total_steps": 7577, "loss": 0.0852, "lr": 1.9943422678531293e-06, "epoch": 0.13065857199419295, "percentage": 13.07, "elapsed_time": "0:02:14", "remaining_time": "0:14:54", "throughput": 3619.72, "total_tokens": 486720} +{"current_steps": 995, "total_steps": 7577, "loss": 0.0741, "lr": 1.994094937635675e-06, "epoch": 0.1313184637719414, "percentage": 13.13, "elapsed_time": "0:02:14", "remaining_time": "0:14:51", "throughput": 3630.28, "total_tokens": 489344} +{"current_steps": 1000, "total_steps": 7577, "loss": 0.2262, "lr": 1.9938423323747457e-06, "epoch": 0.13197835554968984, "percentage": 13.2, "elapsed_time": "0:02:15", "remaining_time": "0:14:48", "throughput": 3639.51, "total_tokens": 491776} +{"current_steps": 1005, "total_steps": 7577, "loss": 0.1184, "lr": 1.99358445341076e-06, "epoch": 0.1326382473274383, "percentage": 13.26, "elapsed_time": "0:02:15", "remaining_time": "0:14:45", "throughput": 3646.96, "total_tokens": 493952} +{"current_steps": 1010, "total_steps": 7577, "loss": 0.2204, "lr": 1.993321302112121e-06, "epoch": 0.13329813910518676, "percentage": 13.33, "elapsed_time": "0:02:15", "remaining_time": "0:14:42", "throughput": 3655.59, "total_tokens": 496320} +{"current_steps": 1015, "total_steps": 7577, "loss": 0.0399, "lr": 1.993052879875209e-06, "epoch": 0.1339580308829352, "percentage": 13.4, "elapsed_time": "0:02:16", "remaining_time": "0:14:39", "throughput": 3662.89, "total_tokens": 498496} +{"current_steps": 1020, "total_steps": 7577, "loss": 0.2953, "lr": 1.992779188124374e-06, "epoch": 0.13461792266068365, "percentage": 13.46, "elapsed_time": "0:02:16", "remaining_time": "0:14:36", "throughput": 3672.83, "total_tokens": 501056} +{"current_steps": 1025, "total_steps": 7577, "loss": 0.1176, "lr": 1.992500228311928e-06, "epoch": 0.1352778144384321, "percentage": 13.53, "elapsed_time": "0:02:16", "remaining_time": "0:14:34", "throughput": 3680.58, "total_tokens": 503296} +{"current_steps": 1030, "total_steps": 7577, "loss": 0.2695, "lr": 1.9922160019181372e-06, "epoch": 0.13593770621618054, "percentage": 13.59, "elapsed_time": "0:02:17", "remaining_time": "0:14:31", "throughput": 3690.49, "total_tokens": 505856} +{"current_steps": 1035, "total_steps": 7577, "loss": 0.0981, "lr": 1.9919265104512138e-06, "epoch": 0.13659759799392898, "percentage": 13.66, "elapsed_time": "0:02:17", "remaining_time": "0:14:28", "throughput": 3700.3, "total_tokens": 508416} +{"current_steps": 1040, "total_steps": 7577, "loss": 0.2986, "lr": 1.9916317554473094e-06, "epoch": 0.13725748977167745, "percentage": 13.73, "elapsed_time": "0:02:17", "remaining_time": "0:14:25", "throughput": 3710.44, "total_tokens": 511040} +{"current_steps": 1045, "total_steps": 7577, "loss": 0.115, "lr": 1.9913317384705052e-06, "epoch": 0.1379173815494259, "percentage": 13.79, "elapsed_time": "0:02:18", "remaining_time": "0:14:22", "throughput": 3717.57, "total_tokens": 513216} +{"current_steps": 1050, "total_steps": 7577, "loss": 0.0893, "lr": 1.991026461112805e-06, "epoch": 0.13857727332717434, "percentage": 13.86, "elapsed_time": "0:02:18", "remaining_time": "0:14:20", "throughput": 3725.14, "total_tokens": 515456} +{"current_steps": 1055, "total_steps": 7577, "loss": 0.1591, "lr": 1.9907159249941257e-06, "epoch": 0.1392371651049228, "percentage": 13.92, "elapsed_time": "0:02:18", "remaining_time": "0:14:17", "throughput": 3733.3, "total_tokens": 517824} +{"current_steps": 1060, "total_steps": 7577, "loss": 0.0627, "lr": 1.990400131762289e-06, "epoch": 0.13989705688267123, "percentage": 13.99, "elapsed_time": "0:02:19", "remaining_time": "0:14:14", "throughput": 3742.5, "total_tokens": 520320} +{"current_steps": 1065, "total_steps": 7577, "loss": 0.1068, "lr": 1.9900790830930134e-06, "epoch": 0.14055694866041968, "percentage": 14.06, "elapsed_time": "0:02:19", "remaining_time": "0:14:12", "throughput": 3751.22, "total_tokens": 522752} +{"current_steps": 1070, "total_steps": 7577, "loss": 0.1066, "lr": 1.9897527806899047e-06, "epoch": 0.14121684043816815, "percentage": 14.12, "elapsed_time": "0:02:19", "remaining_time": "0:14:09", "throughput": 3761.09, "total_tokens": 525376} +{"current_steps": 1075, "total_steps": 7577, "loss": 0.2544, "lr": 1.9894212262844465e-06, "epoch": 0.1418767322159166, "percentage": 14.19, "elapsed_time": "0:02:20", "remaining_time": "0:14:06", "throughput": 3769.79, "total_tokens": 527808} +{"current_steps": 1080, "total_steps": 7577, "loss": 0.1578, "lr": 1.989084421635992e-06, "epoch": 0.14253662399366504, "percentage": 14.25, "elapsed_time": "0:02:20", "remaining_time": "0:14:04", "throughput": 3778.82, "total_tokens": 530304} +{"current_steps": 1085, "total_steps": 7577, "loss": 0.2733, "lr": 1.988742368531754e-06, "epoch": 0.14319651577141349, "percentage": 14.32, "elapsed_time": "0:02:20", "remaining_time": "0:14:01", "throughput": 3785.63, "total_tokens": 532480} +{"current_steps": 1090, "total_steps": 7577, "loss": 0.0745, "lr": 1.9883950687867947e-06, "epoch": 0.14385640754916193, "percentage": 14.39, "elapsed_time": "0:02:20", "remaining_time": "0:13:59", "throughput": 3795.87, "total_tokens": 535168} +{"current_steps": 1095, "total_steps": 7577, "loss": 0.1377, "lr": 1.9880425242440187e-06, "epoch": 0.14451629932691037, "percentage": 14.45, "elapsed_time": "0:02:21", "remaining_time": "0:13:56", "throughput": 3804.28, "total_tokens": 537600} +{"current_steps": 1100, "total_steps": 7577, "loss": 0.0585, "lr": 1.9876847367741607e-06, "epoch": 0.14517619110465885, "percentage": 14.52, "elapsed_time": "0:02:21", "remaining_time": "0:13:54", "throughput": 3813.14, "total_tokens": 540096} +{"current_steps": 1105, "total_steps": 7577, "loss": 0.1719, "lr": 1.987321708275776e-06, "epoch": 0.1458360828824073, "percentage": 14.58, "elapsed_time": "0:02:21", "remaining_time": "0:13:51", "throughput": 3821.95, "total_tokens": 542592} +{"current_steps": 1110, "total_steps": 7577, "loss": 0.0895, "lr": 1.986953440675231e-06, "epoch": 0.14649597466015574, "percentage": 14.65, "elapsed_time": "0:02:22", "remaining_time": "0:13:49", "throughput": 3829.86, "total_tokens": 544960} +{"current_steps": 1115, "total_steps": 7577, "loss": 0.1572, "lr": 1.9865799359266925e-06, "epoch": 0.14715586643790418, "percentage": 14.72, "elapsed_time": "0:02:22", "remaining_time": "0:13:46", "throughput": 3836.51, "total_tokens": 547136} +{"current_steps": 1120, "total_steps": 7577, "loss": 0.1272, "lr": 1.986201196012118e-06, "epoch": 0.14781575821565263, "percentage": 14.78, "elapsed_time": "0:02:22", "remaining_time": "0:13:44", "throughput": 3843.95, "total_tokens": 549440} +{"current_steps": 1125, "total_steps": 7577, "loss": 0.2212, "lr": 1.985817222941245e-06, "epoch": 0.14847564999340107, "percentage": 14.85, "elapsed_time": "0:02:23", "remaining_time": "0:13:41", "throughput": 3853.41, "total_tokens": 552064} +{"current_steps": 1130, "total_steps": 7577, "loss": 0.0754, "lr": 1.9854280187515794e-06, "epoch": 0.14913554177114954, "percentage": 14.91, "elapsed_time": "0:02:23", "remaining_time": "0:13:39", "throughput": 3861.16, "total_tokens": 554432} +{"current_steps": 1135, "total_steps": 7577, "loss": 0.0564, "lr": 1.985033585508386e-06, "epoch": 0.149795433548898, "percentage": 14.98, "elapsed_time": "0:02:23", "remaining_time": "0:13:36", "throughput": 3868.96, "total_tokens": 556800} +{"current_steps": 1137, "total_steps": 7577, "eval_loss": 0.16564705967903137, "epoch": 0.15005939025999737, "percentage": 15.01, "elapsed_time": "0:02:31", "remaining_time": "0:14:20", "throughput": 3673.32, "total_tokens": 557824} +{"current_steps": 1140, "total_steps": 7577, "loss": 0.5119, "lr": 1.9846339253046766e-06, "epoch": 0.15045532532664643, "percentage": 15.05, "elapsed_time": "0:03:44", "remaining_time": "0:21:07", "throughput": 2492.38, "total_tokens": 559296} +{"current_steps": 1145, "total_steps": 7577, "loss": 0.163, "lr": 1.984229040261199e-06, "epoch": 0.15111521710439488, "percentage": 15.11, "elapsed_time": "0:03:44", "remaining_time": "0:21:02", "throughput": 2501.16, "total_tokens": 562112} +{"current_steps": 1150, "total_steps": 7577, "loss": 0.1812, "lr": 1.9838189325264263e-06, "epoch": 0.15177510888214332, "percentage": 15.18, "elapsed_time": "0:03:45", "remaining_time": "0:20:57", "throughput": 2507.16, "total_tokens": 564288} +{"current_steps": 1155, "total_steps": 7577, "loss": 0.033, "lr": 1.983403604276546e-06, "epoch": 0.15243500065989177, "percentage": 15.24, "elapsed_time": "0:03:45", "remaining_time": "0:20:53", "throughput": 2514.85, "total_tokens": 566848} +{"current_steps": 1160, "total_steps": 7577, "loss": 0.3099, "lr": 1.9829830577154457e-06, "epoch": 0.15309489243764024, "percentage": 15.31, "elapsed_time": "0:03:45", "remaining_time": "0:20:48", "throughput": 2521.4, "total_tokens": 569152} +{"current_steps": 1165, "total_steps": 7577, "loss": 0.0496, "lr": 1.982557295074705e-06, "epoch": 0.15375478421538868, "percentage": 15.38, "elapsed_time": "0:03:46", "remaining_time": "0:20:44", "throughput": 2527.97, "total_tokens": 571456} +{"current_steps": 1170, "total_steps": 7577, "loss": 0.0902, "lr": 1.982126318613581e-06, "epoch": 0.15441467599313713, "percentage": 15.44, "elapsed_time": "0:03:46", "remaining_time": "0:20:39", "throughput": 2534.81, "total_tokens": 573824} +{"current_steps": 1175, "total_steps": 7577, "loss": 0.0556, "lr": 1.9816901306189977e-06, "epoch": 0.15507456777088557, "percentage": 15.51, "elapsed_time": "0:03:46", "remaining_time": "0:20:35", "throughput": 2541.32, "total_tokens": 576128} +{"current_steps": 1180, "total_steps": 7577, "loss": 0.1048, "lr": 1.9812487334055342e-06, "epoch": 0.15573445954863402, "percentage": 15.57, "elapsed_time": "0:03:47", "remaining_time": "0:20:30", "throughput": 2547.85, "total_tokens": 578432} +{"current_steps": 1185, "total_steps": 7577, "loss": 0.1522, "lr": 1.98080212931541e-06, "epoch": 0.15639435132638246, "percentage": 15.64, "elapsed_time": "0:03:47", "remaining_time": "0:20:26", "throughput": 2554.34, "total_tokens": 580736} +{"current_steps": 1190, "total_steps": 7577, "loss": 0.0609, "lr": 1.980350320718476e-06, "epoch": 0.15705424310413094, "percentage": 15.71, "elapsed_time": "0:03:47", "remaining_time": "0:20:21", "throughput": 2560.82, "total_tokens": 583040} +{"current_steps": 1195, "total_steps": 7577, "loss": 0.0032, "lr": 1.9798933100121985e-06, "epoch": 0.15771413488187938, "percentage": 15.77, "elapsed_time": "0:03:48", "remaining_time": "0:20:17", "throughput": 2567.28, "total_tokens": 585344} +{"current_steps": 1200, "total_steps": 7577, "loss": 0.0896, "lr": 1.97943109962165e-06, "epoch": 0.15837402665962783, "percentage": 15.84, "elapsed_time": "0:03:48", "remaining_time": "0:20:13", "throughput": 2574.78, "total_tokens": 587904} +{"current_steps": 1205, "total_steps": 7577, "loss": 0.1423, "lr": 1.978963691999493e-06, "epoch": 0.15903391843737627, "percentage": 15.9, "elapsed_time": "0:03:48", "remaining_time": "0:20:09", "throughput": 2581.2, "total_tokens": 590208} +{"current_steps": 1210, "total_steps": 7577, "loss": 0.2118, "lr": 1.978491089625969e-06, "epoch": 0.15969381021512472, "percentage": 15.97, "elapsed_time": "0:03:48", "remaining_time": "0:20:04", "throughput": 2587.62, "total_tokens": 592512} +{"current_steps": 1215, "total_steps": 7577, "loss": 0.2427, "lr": 1.9780132950088854e-06, "epoch": 0.16035370199287316, "percentage": 16.04, "elapsed_time": "0:03:49", "remaining_time": "0:20:00", "throughput": 2595.04, "total_tokens": 595072} +{"current_steps": 1220, "total_steps": 7577, "loss": 0.3134, "lr": 1.9775303106836e-06, "epoch": 0.1610135937706216, "percentage": 16.1, "elapsed_time": "0:03:49", "remaining_time": "0:19:56", "throughput": 2602.45, "total_tokens": 597632} +{"current_steps": 1225, "total_steps": 7577, "loss": 0.117, "lr": 1.977042139213011e-06, "epoch": 0.16167348554837008, "percentage": 16.17, "elapsed_time": "0:03:49", "remaining_time": "0:19:52", "throughput": 2609.85, "total_tokens": 600192} +{"current_steps": 1230, "total_steps": 7577, "loss": 0.1205, "lr": 1.9765487831875404e-06, "epoch": 0.16233337732611852, "percentage": 16.23, "elapsed_time": "0:03:50", "remaining_time": "0:19:48", "throughput": 2615.38, "total_tokens": 602304} +{"current_steps": 1235, "total_steps": 7577, "loss": 0.1485, "lr": 1.9760502452251217e-06, "epoch": 0.16299326910386697, "percentage": 16.3, "elapsed_time": "0:03:50", "remaining_time": "0:19:44", "throughput": 2621.71, "total_tokens": 604608} +{"current_steps": 1240, "total_steps": 7577, "loss": 0.1371, "lr": 1.975546527971186e-06, "epoch": 0.1636531608816154, "percentage": 16.37, "elapsed_time": "0:03:50", "remaining_time": "0:19:40", "throughput": 2628.21, "total_tokens": 606976} +{"current_steps": 1245, "total_steps": 7577, "loss": 0.0801, "lr": 1.9750376340986472e-06, "epoch": 0.16431305265936386, "percentage": 16.43, "elapsed_time": "0:03:51", "remaining_time": "0:19:36", "throughput": 2635.73, "total_tokens": 609600} +{"current_steps": 1250, "total_steps": 7577, "loss": 0.2009, "lr": 1.974523566307889e-06, "epoch": 0.1649729444371123, "percentage": 16.5, "elapsed_time": "0:03:51", "remaining_time": "0:19:32", "throughput": 2641.72, "total_tokens": 611840} +{"current_steps": 1255, "total_steps": 7577, "loss": 0.1902, "lr": 1.9740043273267487e-06, "epoch": 0.16563283621486077, "percentage": 16.56, "elapsed_time": "0:03:51", "remaining_time": "0:19:28", "throughput": 2649.53, "total_tokens": 614528} +{"current_steps": 1260, "total_steps": 7577, "loss": 0.0022, "lr": 1.973479919910505e-06, "epoch": 0.16629272799260922, "percentage": 16.63, "elapsed_time": "0:03:52", "remaining_time": "0:19:24", "throughput": 2656.55, "total_tokens": 617024} +{"current_steps": 1265, "total_steps": 7577, "loss": 0.1153, "lr": 1.972950346841862e-06, "epoch": 0.16695261977035766, "percentage": 16.7, "elapsed_time": "0:03:52", "remaining_time": "0:19:20", "throughput": 2663.01, "total_tokens": 619392} +{"current_steps": 1270, "total_steps": 7577, "loss": 0.1353, "lr": 1.972415610930934e-06, "epoch": 0.1676125115481061, "percentage": 16.76, "elapsed_time": "0:03:52", "remaining_time": "0:19:16", "throughput": 2669.96, "total_tokens": 621888} +{"current_steps": 1275, "total_steps": 7577, "loss": 0.1096, "lr": 1.9718757150152324e-06, "epoch": 0.16827240332585455, "percentage": 16.83, "elapsed_time": "0:03:53", "remaining_time": "0:19:12", "throughput": 2676.14, "total_tokens": 624192} +{"current_steps": 1280, "total_steps": 7577, "loss": 0.0658, "lr": 1.9713306619596488e-06, "epoch": 0.168932295103603, "percentage": 16.89, "elapsed_time": "0:03:53", "remaining_time": "0:19:09", "throughput": 2682.76, "total_tokens": 626624} +{"current_steps": 1285, "total_steps": 7577, "loss": 0.0575, "lr": 1.9707804546564407e-06, "epoch": 0.16959218688135147, "percentage": 16.96, "elapsed_time": "0:03:53", "remaining_time": "0:19:05", "throughput": 2688.86, "total_tokens": 628928} +{"current_steps": 1290, "total_steps": 7577, "loss": 0.1254, "lr": 1.9702250960252164e-06, "epoch": 0.17025207865909991, "percentage": 17.03, "elapsed_time": "0:03:54", "remaining_time": "0:19:01", "throughput": 2696.5, "total_tokens": 631616} +{"current_steps": 1295, "total_steps": 7577, "loss": 0.0568, "lr": 1.969664589012918e-06, "epoch": 0.17091197043684836, "percentage": 17.09, "elapsed_time": "0:03:54", "remaining_time": "0:18:57", "throughput": 2703.27, "total_tokens": 634112} +{"current_steps": 1300, "total_steps": 7577, "loss": 0.1854, "lr": 1.9690989365938077e-06, "epoch": 0.1715718622145968, "percentage": 17.16, "elapsed_time": "0:03:54", "remaining_time": "0:18:54", "throughput": 2709.35, "total_tokens": 636416} +{"current_steps": 1305, "total_steps": 7577, "loss": 0.0006, "lr": 1.9685281417694513e-06, "epoch": 0.17223175399234525, "percentage": 17.22, "elapsed_time": "0:03:55", "remaining_time": "0:18:50", "throughput": 2715.91, "total_tokens": 638848} +{"current_steps": 1310, "total_steps": 7577, "loss": 0.12, "lr": 1.967952207568702e-06, "epoch": 0.1728916457700937, "percentage": 17.29, "elapsed_time": "0:03:55", "remaining_time": "0:18:46", "throughput": 2722.21, "total_tokens": 641216} +{"current_steps": 1315, "total_steps": 7577, "loss": 0.0008, "lr": 1.967371137047685e-06, "epoch": 0.17355153754784217, "percentage": 17.36, "elapsed_time": "0:03:55", "remaining_time": "0:18:43", "throughput": 2730.29, "total_tokens": 644032} +{"current_steps": 1320, "total_steps": 7577, "loss": 0.0887, "lr": 1.966784933289778e-06, "epoch": 0.1742114293255906, "percentage": 17.42, "elapsed_time": "0:03:56", "remaining_time": "0:18:39", "throughput": 2737.01, "total_tokens": 646528} +{"current_steps": 1325, "total_steps": 7577, "loss": 0.1307, "lr": 1.9661935994056014e-06, "epoch": 0.17487132110333906, "percentage": 17.49, "elapsed_time": "0:03:56", "remaining_time": "0:18:36", "throughput": 2743.98, "total_tokens": 649088} +{"current_steps": 1330, "total_steps": 7577, "loss": 0.1035, "lr": 1.965597138532996e-06, "epoch": 0.1755312128810875, "percentage": 17.55, "elapsed_time": "0:03:56", "remaining_time": "0:18:32", "throughput": 2750.42, "total_tokens": 651520} +{"current_steps": 1335, "total_steps": 7577, "loss": 0.0123, "lr": 1.964995553837009e-06, "epoch": 0.17619110465883595, "percentage": 17.62, "elapsed_time": "0:03:57", "remaining_time": "0:18:29", "throughput": 2757.15, "total_tokens": 654016} +{"current_steps": 1340, "total_steps": 7577, "loss": 0.0924, "lr": 1.964388848509875e-06, "epoch": 0.1768509964365844, "percentage": 17.69, "elapsed_time": "0:03:57", "remaining_time": "0:18:25", "throughput": 2763.1, "total_tokens": 656320} +{"current_steps": 1345, "total_steps": 7577, "loss": 0.1818, "lr": 1.9637770257710026e-06, "epoch": 0.17751088821433286, "percentage": 17.75, "elapsed_time": "0:03:57", "remaining_time": "0:18:22", "throughput": 2770.06, "total_tokens": 658880} +{"current_steps": 1350, "total_steps": 7577, "loss": 0.001, "lr": 1.9631600888669545e-06, "epoch": 0.1781707799920813, "percentage": 17.82, "elapsed_time": "0:03:58", "remaining_time": "0:18:18", "throughput": 2775.92, "total_tokens": 661184} +{"current_steps": 1355, "total_steps": 7577, "loss": 0.0885, "lr": 1.962538041071431e-06, "epoch": 0.17883067176982975, "percentage": 17.88, "elapsed_time": "0:03:58", "remaining_time": "0:18:15", "throughput": 2782.56, "total_tokens": 663680} +{"current_steps": 1360, "total_steps": 7577, "loss": 0.0377, "lr": 1.961910885685253e-06, "epoch": 0.1794905635475782, "percentage": 17.95, "elapsed_time": "0:03:58", "remaining_time": "0:18:11", "throughput": 2788.7, "total_tokens": 666048} +{"current_steps": 1365, "total_steps": 7577, "loss": 0.0748, "lr": 1.9612786260363436e-06, "epoch": 0.18015045532532664, "percentage": 18.02, "elapsed_time": "0:03:59", "remaining_time": "0:18:08", "throughput": 2795.05, "total_tokens": 668480} +{"current_steps": 1370, "total_steps": 7577, "loss": 0.1292, "lr": 1.9606412654797116e-06, "epoch": 0.1808103471030751, "percentage": 18.08, "elapsed_time": "0:03:59", "remaining_time": "0:18:05", "throughput": 2803.57, "total_tokens": 671488} +{"current_steps": 1375, "total_steps": 7577, "loss": 0.1406, "lr": 1.9599988073974332e-06, "epoch": 0.18147023888082353, "percentage": 18.15, "elapsed_time": "0:03:59", "remaining_time": "0:18:01", "throughput": 2809.9, "total_tokens": 673920} +{"current_steps": 1380, "total_steps": 7577, "loss": 0.0929, "lr": 1.959351255198634e-06, "epoch": 0.182130130658572, "percentage": 18.21, "elapsed_time": "0:04:00", "remaining_time": "0:17:58", "throughput": 2816.42, "total_tokens": 676416} +{"current_steps": 1385, "total_steps": 7577, "loss": 0.0006, "lr": 1.9586986123194704e-06, "epoch": 0.18279002243632045, "percentage": 18.28, "elapsed_time": "0:04:00", "remaining_time": "0:17:55", "throughput": 2823.42, "total_tokens": 679040} +{"current_steps": 1390, "total_steps": 7577, "loss": 0.1902, "lr": 1.958040882223112e-06, "epoch": 0.1834499142140689, "percentage": 18.34, "elapsed_time": "0:04:00", "remaining_time": "0:17:52", "throughput": 2831.36, "total_tokens": 681920} +{"current_steps": 1395, "total_steps": 7577, "loss": 0.048, "lr": 1.9573780683997235e-06, "epoch": 0.18410980599181734, "percentage": 18.41, "elapsed_time": "0:04:01", "remaining_time": "0:17:48", "throughput": 2837.82, "total_tokens": 684416} +{"current_steps": 1400, "total_steps": 7577, "loss": 0.0828, "lr": 1.956710174366445e-06, "epoch": 0.18476969776956578, "percentage": 18.48, "elapsed_time": "0:04:01", "remaining_time": "0:17:45", "throughput": 2844.49, "total_tokens": 686976} +{"current_steps": 1405, "total_steps": 7577, "loss": 0.2272, "lr": 1.9560372036673764e-06, "epoch": 0.18542958954731423, "percentage": 18.54, "elapsed_time": "0:04:01", "remaining_time": "0:17:42", "throughput": 2850.71, "total_tokens": 689408} +{"current_steps": 1410, "total_steps": 7577, "loss": 0.0649, "lr": 1.955359159873553e-06, "epoch": 0.1860894813250627, "percentage": 18.61, "elapsed_time": "0:04:02", "remaining_time": "0:17:39", "throughput": 2856.37, "total_tokens": 691712} +{"current_steps": 1415, "total_steps": 7577, "loss": 0.066, "lr": 1.954676046582932e-06, "epoch": 0.18674937310281114, "percentage": 18.67, "elapsed_time": "0:04:02", "remaining_time": "0:17:36", "throughput": 2862.17, "total_tokens": 694080} +{"current_steps": 1420, "total_steps": 7577, "loss": 0.2175, "lr": 1.9539878674203706e-06, "epoch": 0.1874092648805596, "percentage": 18.74, "elapsed_time": "0:04:02", "remaining_time": "0:17:32", "throughput": 2868.8, "total_tokens": 696640} +{"current_steps": 1425, "total_steps": 7577, "loss": 0.0003, "lr": 1.9532946260376076e-06, "epoch": 0.18806915665830803, "percentage": 18.81, "elapsed_time": "0:04:03", "remaining_time": "0:17:29", "throughput": 2875.13, "total_tokens": 699136} +{"current_steps": 1430, "total_steps": 7577, "loss": 0.4092, "lr": 1.952596326113244e-06, "epoch": 0.18872904843605648, "percentage": 18.87, "elapsed_time": "0:04:03", "remaining_time": "0:17:26", "throughput": 2881.74, "total_tokens": 701696} +{"current_steps": 1435, "total_steps": 7577, "loss": 0.2349, "lr": 1.9518929713527226e-06, "epoch": 0.18938894021380492, "percentage": 18.94, "elapsed_time": "0:04:03", "remaining_time": "0:17:23", "throughput": 2888.81, "total_tokens": 704384} +{"current_steps": 1440, "total_steps": 7577, "loss": 0.0082, "lr": 1.9511845654883097e-06, "epoch": 0.1900488319915534, "percentage": 19.0, "elapsed_time": "0:04:04", "remaining_time": "0:17:20", "throughput": 2893.87, "total_tokens": 706560} +{"current_steps": 1445, "total_steps": 7577, "loss": 0.1221, "lr": 1.9504711122790754e-06, "epoch": 0.19070872376930184, "percentage": 19.07, "elapsed_time": "0:04:04", "remaining_time": "0:17:17", "throughput": 2900.94, "total_tokens": 709248} +{"current_steps": 1450, "total_steps": 7577, "loss": 0.08, "lr": 1.949752615510871e-06, "epoch": 0.19136861554705029, "percentage": 19.14, "elapsed_time": "0:04:04", "remaining_time": "0:17:14", "throughput": 2905.48, "total_tokens": 711296} +{"current_steps": 1455, "total_steps": 7577, "loss": 0.0655, "lr": 1.949029078996313e-06, "epoch": 0.19202850732479873, "percentage": 19.2, "elapsed_time": "0:04:05", "remaining_time": "0:17:11", "throughput": 2911.53, "total_tokens": 713728} +{"current_steps": 1460, "total_steps": 7577, "loss": 0.1876, "lr": 1.9483005065747584e-06, "epoch": 0.19268839910254718, "percentage": 19.27, "elapsed_time": "0:04:05", "remaining_time": "0:17:08", "throughput": 2917.82, "total_tokens": 716224} +{"current_steps": 1465, "total_steps": 7577, "loss": 0.3791, "lr": 1.947566902112289e-06, "epoch": 0.19334829088029562, "percentage": 19.33, "elapsed_time": "0:04:05", "remaining_time": "0:17:05", "throughput": 2921.86, "total_tokens": 718528} +{"current_steps": 1470, "total_steps": 7577, "loss": 0.2271, "lr": 1.9468282695016863e-06, "epoch": 0.1940081826580441, "percentage": 19.4, "elapsed_time": "0:04:06", "remaining_time": "0:17:02", "throughput": 2927.84, "total_tokens": 720960} +{"current_steps": 1475, "total_steps": 7577, "loss": 0.1805, "lr": 1.946084612662415e-06, "epoch": 0.19466807443579254, "percentage": 19.47, "elapsed_time": "0:04:06", "remaining_time": "0:17:00", "throughput": 2933.04, "total_tokens": 723200} +{"current_steps": 1480, "total_steps": 7577, "loss": 0.2018, "lr": 1.9453359355405987e-06, "epoch": 0.19532796621354098, "percentage": 19.53, "elapsed_time": "0:04:06", "remaining_time": "0:16:57", "throughput": 2939.99, "total_tokens": 725888} +{"current_steps": 1485, "total_steps": 7577, "loss": 0.0364, "lr": 1.944582242109002e-06, "epoch": 0.19598785799128943, "percentage": 19.6, "elapsed_time": "0:04:07", "remaining_time": "0:16:54", "throughput": 2945.7, "total_tokens": 728256} +{"current_steps": 1490, "total_steps": 7577, "loss": 0.1441, "lr": 1.943823536367006e-06, "epoch": 0.19664774976903787, "percentage": 19.66, "elapsed_time": "0:04:07", "remaining_time": "0:16:51", "throughput": 2951.66, "total_tokens": 730688} +{"current_steps": 1495, "total_steps": 7577, "loss": 0.1269, "lr": 1.9430598223405913e-06, "epoch": 0.19730764154678632, "percentage": 19.73, "elapsed_time": "0:04:07", "remaining_time": "0:16:48", "throughput": 2957.08, "total_tokens": 732992} +{"current_steps": 1500, "total_steps": 7577, "loss": 0.1163, "lr": 1.9422911040823125e-06, "epoch": 0.1979675333245348, "percentage": 19.8, "elapsed_time": "0:04:08", "remaining_time": "0:16:45", "throughput": 2962.98, "total_tokens": 735424} +{"current_steps": 1505, "total_steps": 7577, "loss": 0.1995, "lr": 1.941517385671279e-06, "epoch": 0.19862742510228323, "percentage": 19.86, "elapsed_time": "0:04:08", "remaining_time": "0:16:42", "throughput": 2968.15, "total_tokens": 737664} +{"current_steps": 1510, "total_steps": 7577, "loss": 0.0888, "lr": 1.940738671213134e-06, "epoch": 0.19928731688003168, "percentage": 19.93, "elapsed_time": "0:04:08", "remaining_time": "0:16:39", "throughput": 2974.01, "total_tokens": 740096} +{"current_steps": 1515, "total_steps": 7577, "loss": 0.1883, "lr": 1.93995496484003e-06, "epoch": 0.19994720865778012, "percentage": 19.99, "elapsed_time": "0:04:09", "remaining_time": "0:16:37", "throughput": 2981.27, "total_tokens": 742912} +{"current_steps": 1516, "total_steps": 7577, "eval_loss": 0.10974650084972382, "epoch": 0.2000791870133298, "percentage": 20.01, "elapsed_time": "0:04:17", "remaining_time": "0:17:08", "throughput": 2890.65, "total_tokens": 743424} +{"current_steps": 1520, "total_steps": 7577, "loss": 0.1544, "lr": 1.9391662707106092e-06, "epoch": 0.20060710043552857, "percentage": 20.06, "elapsed_time": "0:04:41", "remaining_time": "0:18:43", "throughput": 2644.36, "total_tokens": 745536} +{"current_steps": 1525, "total_steps": 7577, "loss": 0.0053, "lr": 1.9383725930099814e-06, "epoch": 0.201266992213277, "percentage": 20.13, "elapsed_time": "0:04:42", "remaining_time": "0:18:40", "throughput": 2649.83, "total_tokens": 747968} +{"current_steps": 1530, "total_steps": 7577, "loss": 0.2261, "lr": 1.9375739359497e-06, "epoch": 0.20192688399102549, "percentage": 20.19, "elapsed_time": "0:04:42", "remaining_time": "0:18:36", "throughput": 2655.45, "total_tokens": 750464} +{"current_steps": 1535, "total_steps": 7577, "loss": 0.2511, "lr": 1.936770303767741e-06, "epoch": 0.20258677576877393, "percentage": 20.26, "elapsed_time": "0:04:42", "remaining_time": "0:18:33", "throughput": 2660.93, "total_tokens": 752896} +{"current_steps": 1540, "total_steps": 7577, "loss": 0.1788, "lr": 1.9359617007284815e-06, "epoch": 0.20324666754652237, "percentage": 20.32, "elapsed_time": "0:04:43", "remaining_time": "0:18:30", "throughput": 2667.45, "total_tokens": 755648} +{"current_steps": 1545, "total_steps": 7577, "loss": 0.2098, "lr": 1.9351481311226738e-06, "epoch": 0.20390655932427082, "percentage": 20.39, "elapsed_time": "0:04:43", "remaining_time": "0:18:27", "throughput": 2673.08, "total_tokens": 758144} +{"current_steps": 1550, "total_steps": 7577, "loss": 0.0831, "lr": 1.934329599267426e-06, "epoch": 0.20456645110201926, "percentage": 20.46, "elapsed_time": "0:04:43", "remaining_time": "0:18:24", "throughput": 2678.96, "total_tokens": 760704} +{"current_steps": 1555, "total_steps": 7577, "loss": 0.0039, "lr": 1.933506109506178e-06, "epoch": 0.2052263428797677, "percentage": 20.52, "elapsed_time": "0:04:44", "remaining_time": "0:18:20", "throughput": 2684.35, "total_tokens": 763136} +{"current_steps": 1560, "total_steps": 7577, "loss": 0.0802, "lr": 1.9326776662086765e-06, "epoch": 0.20588623465751615, "percentage": 20.59, "elapsed_time": "0:04:44", "remaining_time": "0:18:17", "throughput": 2691.25, "total_tokens": 766016} +{"current_steps": 1565, "total_steps": 7577, "loss": 0.2901, "lr": 1.9318442737709565e-06, "epoch": 0.20654612643526463, "percentage": 20.65, "elapsed_time": "0:04:44", "remaining_time": "0:18:14", "throughput": 2696.82, "total_tokens": 768512} +{"current_steps": 1570, "total_steps": 7577, "loss": 0.1689, "lr": 1.9310059366153116e-06, "epoch": 0.20720601821301307, "percentage": 20.72, "elapsed_time": "0:04:45", "remaining_time": "0:18:11", "throughput": 2701.77, "total_tokens": 770816} +{"current_steps": 1575, "total_steps": 7577, "loss": 0.248, "lr": 1.930162659190277e-06, "epoch": 0.20786590999076152, "percentage": 20.79, "elapsed_time": "0:04:45", "remaining_time": "0:18:08", "throughput": 2707.33, "total_tokens": 773312} +{"current_steps": 1580, "total_steps": 7577, "loss": 0.0688, "lr": 1.9293144459706007e-06, "epoch": 0.20852580176850996, "percentage": 20.85, "elapsed_time": "0:04:45", "remaining_time": "0:18:05", "throughput": 2712.45, "total_tokens": 775680} +{"current_steps": 1585, "total_steps": 7577, "loss": 0.1075, "lr": 1.928461301457223e-06, "epoch": 0.2091856935462584, "percentage": 20.92, "elapsed_time": "0:04:46", "remaining_time": "0:18:02", "throughput": 2717.6, "total_tokens": 778048} +{"current_steps": 1590, "total_steps": 7577, "loss": 0.2795, "lr": 1.92760323017725e-06, "epoch": 0.20984558532400685, "percentage": 20.98, "elapsed_time": "0:04:46", "remaining_time": "0:17:59", "throughput": 2723.58, "total_tokens": 780672} +{"current_steps": 1595, "total_steps": 7577, "loss": 0.2294, "lr": 1.9267402366839338e-06, "epoch": 0.21050547710175532, "percentage": 21.05, "elapsed_time": "0:04:46", "remaining_time": "0:17:56", "throughput": 2729.71, "total_tokens": 783360} +{"current_steps": 1600, "total_steps": 7577, "loss": 0.1843, "lr": 1.9258723255566433e-06, "epoch": 0.21116536887950377, "percentage": 21.12, "elapsed_time": "0:04:47", "remaining_time": "0:17:53", "throughput": 2735.24, "total_tokens": 785856} +{"current_steps": 1605, "total_steps": 7577, "loss": 0.1321, "lr": 1.924999501400843e-06, "epoch": 0.2118252606572522, "percentage": 21.18, "elapsed_time": "0:04:47", "remaining_time": "0:17:50", "throughput": 2741.19, "total_tokens": 788480} +{"current_steps": 1610, "total_steps": 7577, "loss": 0.1504, "lr": 1.924121768848068e-06, "epoch": 0.21248515243500066, "percentage": 21.25, "elapsed_time": "0:04:47", "remaining_time": "0:17:47", "throughput": 2746.92, "total_tokens": 791040} +{"current_steps": 1615, "total_steps": 7577, "loss": 0.1462, "lr": 1.923239132555899e-06, "epoch": 0.2131450442127491, "percentage": 21.31, "elapsed_time": "0:04:48", "remaining_time": "0:17:44", "throughput": 2752.63, "total_tokens": 793600} +{"current_steps": 1620, "total_steps": 7577, "loss": 0.1516, "lr": 1.9223515972079378e-06, "epoch": 0.21380493599049755, "percentage": 21.38, "elapsed_time": "0:04:48", "remaining_time": "0:17:41", "throughput": 2757.71, "total_tokens": 795968} +{"current_steps": 1625, "total_steps": 7577, "loss": 0.1019, "lr": 1.9214591675137813e-06, "epoch": 0.21446482776824602, "percentage": 21.45, "elapsed_time": "0:04:48", "remaining_time": "0:17:38", "throughput": 2762.56, "total_tokens": 798272} +{"current_steps": 1630, "total_steps": 7577, "loss": 0.1059, "lr": 1.9205618482090003e-06, "epoch": 0.21512471954599446, "percentage": 21.51, "elapsed_time": "0:04:49", "remaining_time": "0:17:35", "throughput": 2768.9, "total_tokens": 801024} +{"current_steps": 1635, "total_steps": 7577, "loss": 0.1862, "lr": 1.91965964405511e-06, "epoch": 0.2157846113237429, "percentage": 21.58, "elapsed_time": "0:04:49", "remaining_time": "0:17:32", "throughput": 2774.59, "total_tokens": 803584} +{"current_steps": 1640, "total_steps": 7577, "loss": 0.0438, "lr": 1.9187525598395457e-06, "epoch": 0.21644450310149135, "percentage": 21.64, "elapsed_time": "0:04:49", "remaining_time": "0:17:29", "throughput": 2779.67, "total_tokens": 805952} +{"current_steps": 1645, "total_steps": 7577, "loss": 0.1326, "lr": 1.9178406003756396e-06, "epoch": 0.2171043948792398, "percentage": 21.71, "elapsed_time": "0:04:50", "remaining_time": "0:17:26", "throughput": 2785.27, "total_tokens": 808512} +{"current_steps": 1650, "total_steps": 7577, "loss": 0.1071, "lr": 1.9169237705025936e-06, "epoch": 0.21776428665698824, "percentage": 21.78, "elapsed_time": "0:04:50", "remaining_time": "0:17:23", "throughput": 2791.11, "total_tokens": 811136} +{"current_steps": 1655, "total_steps": 7577, "loss": 0.0347, "lr": 1.9160020750854533e-06, "epoch": 0.21842417843473672, "percentage": 21.84, "elapsed_time": "0:04:50", "remaining_time": "0:17:21", "throughput": 2795.66, "total_tokens": 813376} +{"current_steps": 1660, "total_steps": 7577, "loss": 0.1731, "lr": 1.915075519015083e-06, "epoch": 0.21908407021248516, "percentage": 21.91, "elapsed_time": "0:04:51", "remaining_time": "0:17:18", "throughput": 2801.05, "total_tokens": 815872} +{"current_steps": 1665, "total_steps": 7577, "loss": 0.0142, "lr": 1.914144107208139e-06, "epoch": 0.2197439619902336, "percentage": 21.97, "elapsed_time": "0:04:51", "remaining_time": "0:17:15", "throughput": 2805.98, "total_tokens": 818240} +{"current_steps": 1670, "total_steps": 7577, "loss": 0.0476, "lr": 1.913207844607045e-06, "epoch": 0.22040385376798205, "percentage": 22.04, "elapsed_time": "0:04:51", "remaining_time": "0:17:12", "throughput": 2811.37, "total_tokens": 820736} +{"current_steps": 1675, "total_steps": 7577, "loss": 0.3054, "lr": 1.912266736179964e-06, "epoch": 0.2210637455457305, "percentage": 22.11, "elapsed_time": "0:04:52", "remaining_time": "0:17:09", "throughput": 2817.97, "total_tokens": 823616} +{"current_steps": 1680, "total_steps": 7577, "loss": 0.2016, "lr": 1.9113207869207727e-06, "epoch": 0.22172363732347894, "percentage": 22.17, "elapsed_time": "0:04:52", "remaining_time": "0:17:07", "throughput": 2823.31, "total_tokens": 826112} +{"current_steps": 1685, "total_steps": 7577, "loss": 0.1342, "lr": 1.9103700018490365e-06, "epoch": 0.2223835291012274, "percentage": 22.24, "elapsed_time": "0:04:52", "remaining_time": "0:17:04", "throughput": 2828.82, "total_tokens": 828672} +{"current_steps": 1690, "total_steps": 7577, "loss": 0.163, "lr": 1.9094143860099787e-06, "epoch": 0.22304342087897586, "percentage": 22.3, "elapsed_time": "0:04:53", "remaining_time": "0:17:01", "throughput": 2834.6, "total_tokens": 831296} +{"current_steps": 1695, "total_steps": 7577, "loss": 0.1052, "lr": 1.9084539444744594e-06, "epoch": 0.2237033126567243, "percentage": 22.37, "elapsed_time": "0:04:53", "remaining_time": "0:16:58", "throughput": 2840.12, "total_tokens": 833856} +{"current_steps": 1700, "total_steps": 7577, "loss": 0.1483, "lr": 1.907488682338944e-06, "epoch": 0.22436320443447275, "percentage": 22.44, "elapsed_time": "0:04:53", "remaining_time": "0:16:56", "throughput": 2845.85, "total_tokens": 836480} +{"current_steps": 1705, "total_steps": 7577, "loss": 0.0834, "lr": 1.9065186047254782e-06, "epoch": 0.2250230962122212, "percentage": 22.5, "elapsed_time": "0:04:54", "remaining_time": "0:16:53", "throughput": 2851.14, "total_tokens": 838976} +{"current_steps": 1710, "total_steps": 7577, "loss": 0.1598, "lr": 1.9055437167816604e-06, "epoch": 0.22568298798996964, "percentage": 22.57, "elapsed_time": "0:04:54", "remaining_time": "0:16:50", "throughput": 2857.25, "total_tokens": 841728} +{"current_steps": 1715, "total_steps": 7577, "loss": 0.0044, "lr": 1.9045640236806149e-06, "epoch": 0.22634287976771808, "percentage": 22.63, "elapsed_time": "0:04:54", "remaining_time": "0:16:48", "throughput": 2861.72, "total_tokens": 843968} +{"current_steps": 1720, "total_steps": 7577, "loss": 0.4454, "lr": 1.903579530620963e-06, "epoch": 0.22700277154546655, "percentage": 22.7, "elapsed_time": "0:04:55", "remaining_time": "0:16:45", "throughput": 2867.01, "total_tokens": 846464} +{"current_steps": 1725, "total_steps": 7577, "loss": 0.1272, "lr": 1.9025902428267975e-06, "epoch": 0.227662663323215, "percentage": 22.77, "elapsed_time": "0:04:55", "remaining_time": "0:16:42", "throughput": 2872.69, "total_tokens": 849088} +{"current_steps": 1730, "total_steps": 7577, "loss": 0.0506, "lr": 1.901596165547653e-06, "epoch": 0.22832255510096344, "percentage": 22.83, "elapsed_time": "0:04:55", "remaining_time": "0:16:40", "throughput": 2878.35, "total_tokens": 851712} +{"current_steps": 1735, "total_steps": 7577, "loss": 0.1537, "lr": 1.9005973040584796e-06, "epoch": 0.2289824468787119, "percentage": 22.9, "elapsed_time": "0:04:56", "remaining_time": "0:16:37", "throughput": 2883.59, "total_tokens": 854208} +{"current_steps": 1740, "total_steps": 7577, "loss": 0.1147, "lr": 1.8995936636596138e-06, "epoch": 0.22964233865646033, "percentage": 22.96, "elapsed_time": "0:04:56", "remaining_time": "0:16:34", "throughput": 2888.38, "total_tokens": 856576} +{"current_steps": 1745, "total_steps": 7577, "loss": 0.1347, "lr": 1.8985852496767504e-06, "epoch": 0.23030223043420878, "percentage": 23.03, "elapsed_time": "0:04:56", "remaining_time": "0:16:32", "throughput": 2893.4, "total_tokens": 859008} +{"current_steps": 1750, "total_steps": 7577, "loss": 0.146, "lr": 1.897572067460916e-06, "epoch": 0.23096212221195725, "percentage": 23.1, "elapsed_time": "0:04:57", "remaining_time": "0:16:29", "throughput": 2898.42, "total_tokens": 861440} +{"current_steps": 1755, "total_steps": 7577, "loss": 0.1079, "lr": 1.8965541223884377e-06, "epoch": 0.2316220139897057, "percentage": 23.16, "elapsed_time": "0:04:57", "remaining_time": "0:16:27", "throughput": 2903.61, "total_tokens": 863936} +{"current_steps": 1760, "total_steps": 7577, "loss": 0.0547, "lr": 1.8955314198609171e-06, "epoch": 0.23228190576745414, "percentage": 23.23, "elapsed_time": "0:04:57", "remaining_time": "0:16:24", "throughput": 2908.0, "total_tokens": 866176} +{"current_steps": 1765, "total_steps": 7577, "loss": 0.0747, "lr": 1.8945039653052005e-06, "epoch": 0.23294179754520258, "percentage": 23.29, "elapsed_time": "0:04:58", "remaining_time": "0:16:21", "throughput": 2912.58, "total_tokens": 868480} +{"current_steps": 1770, "total_steps": 7577, "loss": 0.1454, "lr": 1.8934717641733498e-06, "epoch": 0.23360168932295103, "percentage": 23.36, "elapsed_time": "0:04:58", "remaining_time": "0:16:19", "throughput": 2917.72, "total_tokens": 870976} +{"current_steps": 1775, "total_steps": 7577, "loss": 0.2544, "lr": 1.8924348219426143e-06, "epoch": 0.23426158110069947, "percentage": 23.43, "elapsed_time": "0:04:58", "remaining_time": "0:16:16", "throughput": 2921.54, "total_tokens": 873088} +{"current_steps": 1780, "total_steps": 7577, "loss": 0.2463, "lr": 1.8913931441154016e-06, "epoch": 0.23492147287844795, "percentage": 23.49, "elapsed_time": "0:04:59", "remaining_time": "0:16:14", "throughput": 2926.5, "total_tokens": 875520} +{"current_steps": 1785, "total_steps": 7577, "loss": 0.0807, "lr": 1.8903467362192482e-06, "epoch": 0.2355813646561964, "percentage": 23.56, "elapsed_time": "0:04:59", "remaining_time": "0:16:11", "throughput": 2930.43, "total_tokens": 877632} +{"current_steps": 1790, "total_steps": 7577, "loss": 0.1002, "lr": 1.8892956038067895e-06, "epoch": 0.23624125643394484, "percentage": 23.62, "elapsed_time": "0:04:59", "remaining_time": "0:16:09", "throughput": 2935.15, "total_tokens": 880000} +{"current_steps": 1795, "total_steps": 7577, "loss": 0.0187, "lr": 1.8882397524557317e-06, "epoch": 0.23690114821169328, "percentage": 23.69, "elapsed_time": "0:05:00", "remaining_time": "0:16:06", "throughput": 2939.26, "total_tokens": 882176} +{"current_steps": 1800, "total_steps": 7577, "loss": 0.0792, "lr": 1.8871791877688208e-06, "epoch": 0.23756103998944172, "percentage": 23.76, "elapsed_time": "0:05:00", "remaining_time": "0:16:04", "throughput": 2944.79, "total_tokens": 884800} +{"current_steps": 1805, "total_steps": 7577, "loss": 0.1225, "lr": 1.8861139153738143e-06, "epoch": 0.23822093176719017, "percentage": 23.82, "elapsed_time": "0:05:00", "remaining_time": "0:16:01", "throughput": 2949.27, "total_tokens": 887104} +{"current_steps": 1810, "total_steps": 7577, "loss": 0.0388, "lr": 1.8850439409234498e-06, "epoch": 0.23888082354493864, "percentage": 23.89, "elapsed_time": "0:05:01", "remaining_time": "0:15:59", "throughput": 2953.75, "total_tokens": 889408} +{"current_steps": 1815, "total_steps": 7577, "loss": 0.1219, "lr": 1.8839692700954161e-06, "epoch": 0.2395407153226871, "percentage": 23.95, "elapsed_time": "0:05:01", "remaining_time": "0:15:56", "throughput": 2958.04, "total_tokens": 891648} +{"current_steps": 1820, "total_steps": 7577, "loss": 0.2359, "lr": 1.8828899085923234e-06, "epoch": 0.24020060710043553, "percentage": 24.02, "elapsed_time": "0:05:01", "remaining_time": "0:15:54", "throughput": 2963.3, "total_tokens": 894208} +{"current_steps": 1825, "total_steps": 7577, "loss": 0.0859, "lr": 1.881805862141671e-06, "epoch": 0.24086049887818398, "percentage": 24.09, "elapsed_time": "0:05:02", "remaining_time": "0:15:52", "throughput": 2968.37, "total_tokens": 896704} +{"current_steps": 1830, "total_steps": 7577, "loss": 0.0579, "lr": 1.8807171364958196e-06, "epoch": 0.24152039065593242, "percentage": 24.15, "elapsed_time": "0:05:02", "remaining_time": "0:15:49", "throughput": 2973.58, "total_tokens": 899264} +{"current_steps": 1835, "total_steps": 7577, "loss": 0.0186, "lr": 1.879623737431959e-06, "epoch": 0.24218028243368087, "percentage": 24.22, "elapsed_time": "0:05:02", "remaining_time": "0:15:47", "throughput": 2978.58, "total_tokens": 901760} +{"current_steps": 1840, "total_steps": 7577, "loss": 0.1353, "lr": 1.8785256707520778e-06, "epoch": 0.24284017421142934, "percentage": 24.28, "elapsed_time": "0:05:03", "remaining_time": "0:15:44", "throughput": 2982.4, "total_tokens": 903872} +{"current_steps": 1845, "total_steps": 7577, "loss": 0.0463, "lr": 1.8774229422829325e-06, "epoch": 0.24350006598917778, "percentage": 24.35, "elapsed_time": "0:05:03", "remaining_time": "0:15:42", "throughput": 2987.41, "total_tokens": 906368} +{"current_steps": 1850, "total_steps": 7577, "loss": 0.0658, "lr": 1.8763155578760181e-06, "epoch": 0.24415995776692623, "percentage": 24.42, "elapsed_time": "0:05:03", "remaining_time": "0:15:40", "throughput": 2992.41, "total_tokens": 908864} +{"current_steps": 1855, "total_steps": 7577, "loss": 0.163, "lr": 1.8752035234075336e-06, "epoch": 0.24481984954467467, "percentage": 24.48, "elapsed_time": "0:05:04", "remaining_time": "0:15:37", "throughput": 2996.39, "total_tokens": 911040} +{"current_steps": 1860, "total_steps": 7577, "loss": 0.1979, "lr": 1.8740868447783554e-06, "epoch": 0.24547974132242312, "percentage": 24.55, "elapsed_time": "0:05:04", "remaining_time": "0:15:35", "throughput": 3000.98, "total_tokens": 913408} +{"current_steps": 1865, "total_steps": 7577, "loss": 0.2382, "lr": 1.8729655279140012e-06, "epoch": 0.24613963310017156, "percentage": 24.61, "elapsed_time": "0:05:04", "remaining_time": "0:15:33", "throughput": 3006.13, "total_tokens": 915968} +{"current_steps": 1870, "total_steps": 7577, "loss": 0.1639, "lr": 1.8718395787646029e-06, "epoch": 0.24679952487792003, "percentage": 24.68, "elapsed_time": "0:05:05", "remaining_time": "0:15:30", "throughput": 3011.28, "total_tokens": 918528} +{"current_steps": 1875, "total_steps": 7577, "loss": 0.0099, "lr": 1.870709003304872e-06, "epoch": 0.24745941665566848, "percentage": 24.75, "elapsed_time": "0:05:05", "remaining_time": "0:15:28", "throughput": 3016.62, "total_tokens": 921152} +{"current_steps": 1880, "total_steps": 7577, "loss": 0.0006, "lr": 1.8695738075340693e-06, "epoch": 0.24811930843341692, "percentage": 24.81, "elapsed_time": "0:05:05", "remaining_time": "0:15:26", "throughput": 3021.16, "total_tokens": 923520} +{"current_steps": 1885, "total_steps": 7577, "loss": 0.0253, "lr": 1.8684339974759723e-06, "epoch": 0.24877920021116537, "percentage": 24.88, "elapsed_time": "0:05:06", "remaining_time": "0:15:24", "throughput": 3025.69, "total_tokens": 925888} +{"current_steps": 1890, "total_steps": 7577, "loss": 0.0925, "lr": 1.8672895791788445e-06, "epoch": 0.2494390919889138, "percentage": 24.94, "elapsed_time": "0:05:06", "remaining_time": "0:15:21", "throughput": 3031.57, "total_tokens": 928704} +{"current_steps": 1895, "total_steps": 7577, "loss": 0.2857, "lr": 1.8661405587154017e-06, "epoch": 0.2500989837666623, "percentage": 25.01, "elapsed_time": "0:05:06", "remaining_time": "0:15:19", "throughput": 3035.68, "total_tokens": 930944} +{"current_steps": 1895, "total_steps": 7577, "eval_loss": 0.13187885284423828, "epoch": 0.2500989837666623, "percentage": 25.01, "elapsed_time": "0:05:14", "remaining_time": "0:15:43", "throughput": 2959.81, "total_tokens": 930944} +{"current_steps": 1900, "total_steps": 7577, "loss": 0.3692, "lr": 1.8649869421827808e-06, "epoch": 0.25075887554441073, "percentage": 25.08, "elapsed_time": "0:06:05", "remaining_time": "0:18:12", "throughput": 2553.64, "total_tokens": 933376} +{"current_steps": 1905, "total_steps": 7577, "loss": 0.0896, "lr": 1.863828735702507e-06, "epoch": 0.2514187673221592, "percentage": 25.14, "elapsed_time": "0:06:05", "remaining_time": "0:18:09", "throughput": 2558.54, "total_tokens": 936000} +{"current_steps": 1910, "total_steps": 7577, "loss": 0.1121, "lr": 1.862665945420462e-06, "epoch": 0.2520786590999076, "percentage": 25.21, "elapsed_time": "0:06:06", "remaining_time": "0:18:06", "throughput": 2562.89, "total_tokens": 938432} +{"current_steps": 1915, "total_steps": 7577, "loss": 0.1862, "lr": 1.8614985775068498e-06, "epoch": 0.25273855087765607, "percentage": 25.27, "elapsed_time": "0:06:06", "remaining_time": "0:18:03", "throughput": 2568.37, "total_tokens": 941312} +{"current_steps": 1920, "total_steps": 7577, "loss": 0.0727, "lr": 1.860326638156167e-06, "epoch": 0.2533984426554045, "percentage": 25.34, "elapsed_time": "0:06:06", "remaining_time": "0:18:00", "throughput": 2571.84, "total_tokens": 943488} +{"current_steps": 1925, "total_steps": 7577, "loss": 0.083, "lr": 1.8591501335871653e-06, "epoch": 0.25405833443315295, "percentage": 25.41, "elapsed_time": "0:06:07", "remaining_time": "0:17:58", "throughput": 2575.99, "total_tokens": 945856} +{"current_steps": 1930, "total_steps": 7577, "loss": 0.2212, "lr": 1.857969070042824e-06, "epoch": 0.2547182262109014, "percentage": 25.47, "elapsed_time": "0:06:07", "remaining_time": "0:17:55", "throughput": 2580.45, "total_tokens": 948352} +{"current_steps": 1935, "total_steps": 7577, "loss": 0.08, "lr": 1.8567834537903116e-06, "epoch": 0.25537811798864984, "percentage": 25.54, "elapsed_time": "0:06:07", "remaining_time": "0:17:52", "throughput": 2585.26, "total_tokens": 950976} +{"current_steps": 1940, "total_steps": 7577, "loss": 0.1289, "lr": 1.8555932911209565e-06, "epoch": 0.2560380097663983, "percentage": 25.6, "elapsed_time": "0:06:08", "remaining_time": "0:17:49", "throughput": 2589.04, "total_tokens": 953216} +{"current_steps": 1945, "total_steps": 7577, "loss": 0.0221, "lr": 1.8543985883502119e-06, "epoch": 0.25669790154414673, "percentage": 25.67, "elapsed_time": "0:06:08", "remaining_time": "0:17:47", "throughput": 2593.33, "total_tokens": 955648} +{"current_steps": 1950, "total_steps": 7577, "loss": 0.0906, "lr": 1.8531993518176216e-06, "epoch": 0.25735779332189523, "percentage": 25.74, "elapsed_time": "0:06:08", "remaining_time": "0:17:44", "throughput": 2597.09, "total_tokens": 957888} +{"current_steps": 1955, "total_steps": 7577, "loss": 0.3163, "lr": 1.8519955878867889e-06, "epoch": 0.2580176850996437, "percentage": 25.8, "elapsed_time": "0:06:09", "remaining_time": "0:17:41", "throughput": 2600.84, "total_tokens": 960128} +{"current_steps": 1960, "total_steps": 7577, "loss": 0.1495, "lr": 1.8507873029453392e-06, "epoch": 0.2586775768773921, "percentage": 25.87, "elapsed_time": "0:06:09", "remaining_time": "0:17:38", "throughput": 2604.92, "total_tokens": 962496} +{"current_steps": 1965, "total_steps": 7577, "loss": 0.1628, "lr": 1.8495745034048896e-06, "epoch": 0.25933746865514057, "percentage": 25.93, "elapsed_time": "0:06:09", "remaining_time": "0:17:36", "throughput": 2609.68, "total_tokens": 965120} +{"current_steps": 1970, "total_steps": 7577, "loss": 0.045, "lr": 1.8483571957010127e-06, "epoch": 0.259997360432889, "percentage": 26.0, "elapsed_time": "0:06:10", "remaining_time": "0:17:33", "throughput": 2614.07, "total_tokens": 967616} +{"current_steps": 1975, "total_steps": 7577, "loss": 0.0574, "lr": 1.8471353862932035e-06, "epoch": 0.26065725221063746, "percentage": 26.07, "elapsed_time": "0:06:10", "remaining_time": "0:17:30", "throughput": 2618.79, "total_tokens": 970240} +{"current_steps": 1980, "total_steps": 7577, "loss": 0.0719, "lr": 1.8459090816648444e-06, "epoch": 0.2613171439883859, "percentage": 26.13, "elapsed_time": "0:06:10", "remaining_time": "0:17:28", "throughput": 2622.68, "total_tokens": 972544} +{"current_steps": 1985, "total_steps": 7577, "loss": 0.2544, "lr": 1.8446782883231713e-06, "epoch": 0.26197703576613435, "percentage": 26.2, "elapsed_time": "0:06:11", "remaining_time": "0:17:25", "throughput": 2626.76, "total_tokens": 974912} +{"current_steps": 1990, "total_steps": 7577, "loss": 0.4055, "lr": 1.8434430127992387e-06, "epoch": 0.2626369275438828, "percentage": 26.26, "elapsed_time": "0:06:11", "remaining_time": "0:17:22", "throughput": 2630.34, "total_tokens": 977088} +{"current_steps": 1995, "total_steps": 7577, "loss": 0.1845, "lr": 1.8422032616478857e-06, "epoch": 0.26329681932163124, "percentage": 26.33, "elapsed_time": "0:06:11", "remaining_time": "0:17:20", "throughput": 2634.87, "total_tokens": 979648} +{"current_steps": 2000, "total_steps": 7577, "loss": 0.1184, "lr": 1.8409590414477001e-06, "epoch": 0.2639567110993797, "percentage": 26.4, "elapsed_time": "0:06:12", "remaining_time": "0:17:17", "throughput": 2639.7, "total_tokens": 982336} +{"current_steps": 2005, "total_steps": 7577, "loss": 0.0071, "lr": 1.839710358800985e-06, "epoch": 0.2646166028771281, "percentage": 26.46, "elapsed_time": "0:06:12", "remaining_time": "0:17:15", "throughput": 2643.86, "total_tokens": 984768} +{"current_steps": 2010, "total_steps": 7577, "loss": 0.049, "lr": 1.8384572203337224e-06, "epoch": 0.2652764946548766, "percentage": 26.53, "elapsed_time": "0:06:12", "remaining_time": "0:17:12", "throughput": 2647.88, "total_tokens": 987136} +{"current_steps": 2015, "total_steps": 7577, "loss": 0.1358, "lr": 1.837199632695538e-06, "epoch": 0.26593638643262507, "percentage": 26.59, "elapsed_time": "0:06:13", "remaining_time": "0:17:09", "throughput": 2652.68, "total_tokens": 989824} +{"current_steps": 2020, "total_steps": 7577, "loss": 0.2944, "lr": 1.8359376025596682e-06, "epoch": 0.2665962782103735, "percentage": 26.66, "elapsed_time": "0:06:13", "remaining_time": "0:17:07", "throughput": 2656.35, "total_tokens": 992064} +{"current_steps": 2025, "total_steps": 7577, "loss": 0.1288, "lr": 1.8346711366229215e-06, "epoch": 0.26725616998812196, "percentage": 26.73, "elapsed_time": "0:06:13", "remaining_time": "0:17:04", "throughput": 2660.19, "total_tokens": 994368} +{"current_steps": 2030, "total_steps": 7577, "loss": 0.181, "lr": 1.8334002416056442e-06, "epoch": 0.2679160617658704, "percentage": 26.79, "elapsed_time": "0:06:14", "remaining_time": "0:17:02", "throughput": 2664.53, "total_tokens": 996864} +{"current_steps": 2035, "total_steps": 7577, "loss": 0.2285, "lr": 1.8321249242516865e-06, "epoch": 0.26857595354361885, "percentage": 26.86, "elapsed_time": "0:06:14", "remaining_time": "0:16:59", "throughput": 2668.86, "total_tokens": 999360} +{"current_steps": 2040, "total_steps": 7577, "loss": 0.0873, "lr": 1.8308451913283638e-06, "epoch": 0.2692358453213673, "percentage": 26.92, "elapsed_time": "0:06:14", "remaining_time": "0:16:57", "throughput": 2673.35, "total_tokens": 1001920} +{"current_steps": 2045, "total_steps": 7577, "loss": 0.0305, "lr": 1.8295610496264229e-06, "epoch": 0.26989573709911574, "percentage": 26.99, "elapsed_time": "0:06:15", "remaining_time": "0:16:54", "throughput": 2677.13, "total_tokens": 1004224} +{"current_steps": 2050, "total_steps": 7577, "loss": 0.0393, "lr": 1.828272505960005e-06, "epoch": 0.2705556288768642, "percentage": 27.06, "elapsed_time": "0:06:15", "remaining_time": "0:16:52", "throughput": 2680.92, "total_tokens": 1006528} +{"current_steps": 2055, "total_steps": 7577, "loss": 0.1813, "lr": 1.8269795671666098e-06, "epoch": 0.27121552065461263, "percentage": 27.12, "elapsed_time": "0:06:15", "remaining_time": "0:16:49", "throughput": 2684.9, "total_tokens": 1008896} +{"current_steps": 2060, "total_steps": 7577, "loss": 0.1234, "lr": 1.8256822401070591e-06, "epoch": 0.2718754124323611, "percentage": 27.19, "elapsed_time": "0:06:16", "remaining_time": "0:16:47", "throughput": 2689.82, "total_tokens": 1011648} +{"current_steps": 2065, "total_steps": 7577, "loss": 0.0522, "lr": 1.8243805316654611e-06, "epoch": 0.2725353042101095, "percentage": 27.25, "elapsed_time": "0:06:16", "remaining_time": "0:16:44", "throughput": 2694.27, "total_tokens": 1014208} +{"current_steps": 2070, "total_steps": 7577, "loss": 0.1725, "lr": 1.823074448749172e-06, "epoch": 0.27319519598785796, "percentage": 27.32, "elapsed_time": "0:06:16", "remaining_time": "0:16:42", "throughput": 2698.36, "total_tokens": 1016640} +{"current_steps": 2075, "total_steps": 7577, "loss": 0.063, "lr": 1.8217639982887623e-06, "epoch": 0.27385508776560646, "percentage": 27.39, "elapsed_time": "0:06:17", "remaining_time": "0:16:39", "throughput": 2703.03, "total_tokens": 1019328} +{"current_steps": 2080, "total_steps": 7577, "loss": 0.0781, "lr": 1.8204491872379769e-06, "epoch": 0.2745149795433549, "percentage": 27.45, "elapsed_time": "0:06:17", "remaining_time": "0:16:37", "throughput": 2706.82, "total_tokens": 1021696} +{"current_steps": 2085, "total_steps": 7577, "loss": 0.09, "lr": 1.8191300225737e-06, "epoch": 0.27517487132110335, "percentage": 27.52, "elapsed_time": "0:06:17", "remaining_time": "0:16:35", "throughput": 2711.22, "total_tokens": 1024256} +{"current_steps": 2090, "total_steps": 7577, "loss": 0.2074, "lr": 1.8178065112959184e-06, "epoch": 0.2758347630988518, "percentage": 27.58, "elapsed_time": "0:06:18", "remaining_time": "0:16:32", "throughput": 2714.93, "total_tokens": 1026560} +{"current_steps": 2095, "total_steps": 7577, "loss": 0.2426, "lr": 1.8164786604276832e-06, "epoch": 0.27649465487660024, "percentage": 27.65, "elapsed_time": "0:06:18", "remaining_time": "0:16:30", "throughput": 2719.48, "total_tokens": 1029184} +{"current_steps": 2100, "total_steps": 7577, "loss": 0.1464, "lr": 1.8151464770150727e-06, "epoch": 0.2771545466543487, "percentage": 27.72, "elapsed_time": "0:06:18", "remaining_time": "0:16:27", "throughput": 2723.88, "total_tokens": 1031744} +{"current_steps": 2105, "total_steps": 7577, "loss": 0.1528, "lr": 1.8138099681271558e-06, "epoch": 0.27781443843209713, "percentage": 27.78, "elapsed_time": "0:06:19", "remaining_time": "0:16:25", "throughput": 2727.63, "total_tokens": 1034048} +{"current_steps": 2110, "total_steps": 7577, "loss": 0.1601, "lr": 1.8124691408559536e-06, "epoch": 0.2784743302098456, "percentage": 27.85, "elapsed_time": "0:06:19", "remaining_time": "0:16:23", "throughput": 2731.86, "total_tokens": 1036544} +{"current_steps": 2115, "total_steps": 7577, "loss": 0.1008, "lr": 1.8111240023164023e-06, "epoch": 0.279134221987594, "percentage": 27.91, "elapsed_time": "0:06:19", "remaining_time": "0:16:20", "throughput": 2735.59, "total_tokens": 1038848} +{"current_steps": 2120, "total_steps": 7577, "loss": 0.0632, "lr": 1.809774559646316e-06, "epoch": 0.27979411376534247, "percentage": 27.98, "elapsed_time": "0:06:20", "remaining_time": "0:16:18", "throughput": 2739.31, "total_tokens": 1041152} +{"current_steps": 2125, "total_steps": 7577, "loss": 0.0935, "lr": 1.8084208200063469e-06, "epoch": 0.2804540055430909, "percentage": 28.05, "elapsed_time": "0:06:20", "remaining_time": "0:16:16", "throughput": 2744.29, "total_tokens": 1043968} +{"current_steps": 2130, "total_steps": 7577, "loss": 0.2149, "lr": 1.8070627905799496e-06, "epoch": 0.28111389732083936, "percentage": 28.11, "elapsed_time": "0:06:20", "remaining_time": "0:16:13", "throughput": 2747.99, "total_tokens": 1046272} +{"current_steps": 2135, "total_steps": 7577, "loss": 0.0862, "lr": 1.8057004785733413e-06, "epoch": 0.28177378909858786, "percentage": 28.18, "elapsed_time": "0:06:21", "remaining_time": "0:16:11", "throughput": 2751.37, "total_tokens": 1048448} +{"current_steps": 2140, "total_steps": 7577, "loss": 0.1758, "lr": 1.8043338912154647e-06, "epoch": 0.2824336808763363, "percentage": 28.24, "elapsed_time": "0:06:21", "remaining_time": "0:16:08", "throughput": 2755.87, "total_tokens": 1051072} +{"current_steps": 2145, "total_steps": 7577, "loss": 0.0486, "lr": 1.8029630357579486e-06, "epoch": 0.28309357265408475, "percentage": 28.31, "elapsed_time": "0:06:21", "remaining_time": "0:16:06", "throughput": 2759.41, "total_tokens": 1053312} +{"current_steps": 2150, "total_steps": 7577, "loss": 0.0795, "lr": 1.8015879194750702e-06, "epoch": 0.2837534644318332, "percentage": 28.38, "elapsed_time": "0:06:22", "remaining_time": "0:16:04", "throughput": 2763.24, "total_tokens": 1055680} +{"current_steps": 2155, "total_steps": 7577, "loss": 0.187, "lr": 1.8002085496637165e-06, "epoch": 0.28441335620958164, "percentage": 28.44, "elapsed_time": "0:06:22", "remaining_time": "0:16:02", "throughput": 2766.9, "total_tokens": 1057984} +{"current_steps": 2160, "total_steps": 7577, "loss": 0.1492, "lr": 1.7988249336433448e-06, "epoch": 0.2850732479873301, "percentage": 28.51, "elapsed_time": "0:06:22", "remaining_time": "0:15:59", "throughput": 2771.66, "total_tokens": 1060736} +{"current_steps": 2165, "total_steps": 7577, "loss": 0.1319, "lr": 1.7974370787559447e-06, "epoch": 0.2857331397650785, "percentage": 28.57, "elapsed_time": "0:06:23", "remaining_time": "0:15:57", "throughput": 2776.28, "total_tokens": 1063424} +{"current_steps": 2170, "total_steps": 7577, "loss": 0.0575, "lr": 1.796044992365999e-06, "epoch": 0.28639303154282697, "percentage": 28.64, "elapsed_time": "0:06:23", "remaining_time": "0:15:55", "throughput": 2779.93, "total_tokens": 1065728} +{"current_steps": 2175, "total_steps": 7577, "loss": 0.0009, "lr": 1.794648681860444e-06, "epoch": 0.2870529233205754, "percentage": 28.71, "elapsed_time": "0:06:23", "remaining_time": "0:15:52", "throughput": 2783.9, "total_tokens": 1068160} +{"current_steps": 2180, "total_steps": 7577, "loss": 0.2734, "lr": 1.7932481546486312e-06, "epoch": 0.28771281509832386, "percentage": 28.77, "elapsed_time": "0:06:24", "remaining_time": "0:15:50", "throughput": 2787.86, "total_tokens": 1070592} +{"current_steps": 2185, "total_steps": 7577, "loss": 0.1758, "lr": 1.791843418162287e-06, "epoch": 0.2883727068760723, "percentage": 28.84, "elapsed_time": "0:06:24", "remaining_time": "0:15:48", "throughput": 2792.42, "total_tokens": 1073280} +{"current_steps": 2190, "total_steps": 7577, "loss": 0.0031, "lr": 1.7904344798554748e-06, "epoch": 0.28903259865382075, "percentage": 28.9, "elapsed_time": "0:06:24", "remaining_time": "0:15:46", "throughput": 2796.04, "total_tokens": 1075584} +{"current_steps": 2195, "total_steps": 7577, "loss": 0.0927, "lr": 1.789021347204553e-06, "epoch": 0.28969249043156925, "percentage": 28.97, "elapsed_time": "0:06:25", "remaining_time": "0:15:44", "throughput": 2799.97, "total_tokens": 1078016} +{"current_steps": 2200, "total_steps": 7577, "loss": 0.1631, "lr": 1.7876040277081381e-06, "epoch": 0.2903523822093177, "percentage": 29.04, "elapsed_time": "0:06:25", "remaining_time": "0:15:41", "throughput": 2804.07, "total_tokens": 1080512} +{"current_steps": 2205, "total_steps": 7577, "loss": 0.0382, "lr": 1.7861825288870632e-06, "epoch": 0.29101227398706614, "percentage": 29.1, "elapsed_time": "0:06:25", "remaining_time": "0:15:39", "throughput": 2807.51, "total_tokens": 1082752} +{"current_steps": 2210, "total_steps": 7577, "loss": 0.3717, "lr": 1.7847568582843376e-06, "epoch": 0.2916721657648146, "percentage": 29.17, "elapsed_time": "0:06:25", "remaining_time": "0:15:37", "throughput": 2811.43, "total_tokens": 1085184} +{"current_steps": 2215, "total_steps": 7577, "loss": 0.1799, "lr": 1.7833270234651088e-06, "epoch": 0.29233205754256303, "percentage": 29.23, "elapsed_time": "0:06:26", "remaining_time": "0:15:35", "throughput": 2814.66, "total_tokens": 1087360} +{"current_steps": 2220, "total_steps": 7577, "loss": 0.0596, "lr": 1.781893032016621e-06, "epoch": 0.2929919493203115, "percentage": 29.3, "elapsed_time": "0:06:26", "remaining_time": "0:15:33", "throughput": 2819.02, "total_tokens": 1089984} +{"current_steps": 2225, "total_steps": 7577, "loss": 0.0264, "lr": 1.7804548915481746e-06, "epoch": 0.2936518410980599, "percentage": 29.37, "elapsed_time": "0:06:26", "remaining_time": "0:15:30", "throughput": 2823.37, "total_tokens": 1092608} +{"current_steps": 2230, "total_steps": 7577, "loss": 0.1052, "lr": 1.7790126096910865e-06, "epoch": 0.29431173287580836, "percentage": 29.43, "elapsed_time": "0:06:27", "remaining_time": "0:15:28", "throughput": 2827.25, "total_tokens": 1095040} +{"current_steps": 2235, "total_steps": 7577, "loss": 0.1063, "lr": 1.7775661940986492e-06, "epoch": 0.2949716246535568, "percentage": 29.5, "elapsed_time": "0:06:27", "remaining_time": "0:15:26", "throughput": 2831.76, "total_tokens": 1097728} +{"current_steps": 2240, "total_steps": 7577, "loss": 0.1857, "lr": 1.776115652446091e-06, "epoch": 0.29563151643130525, "percentage": 29.56, "elapsed_time": "0:06:27", "remaining_time": "0:15:24", "throughput": 2835.45, "total_tokens": 1100096} +{"current_steps": 2245, "total_steps": 7577, "loss": 0.1076, "lr": 1.7746609924305336e-06, "epoch": 0.2962914082090537, "percentage": 29.63, "elapsed_time": "0:06:28", "remaining_time": "0:15:22", "throughput": 2839.04, "total_tokens": 1102400} +{"current_steps": 2250, "total_steps": 7577, "loss": 0.0825, "lr": 1.7732022217709534e-06, "epoch": 0.29695129998680214, "percentage": 29.7, "elapsed_time": "0:06:28", "remaining_time": "0:15:20", "throughput": 2843.22, "total_tokens": 1104960} +{"current_steps": 2255, "total_steps": 7577, "loss": 0.1648, "lr": 1.7717393482081384e-06, "epoch": 0.2976111917645506, "percentage": 29.76, "elapsed_time": "0:06:28", "remaining_time": "0:15:17", "throughput": 2847.4, "total_tokens": 1107520} +{"current_steps": 2260, "total_steps": 7577, "loss": 0.1223, "lr": 1.7702723795046492e-06, "epoch": 0.2982710835422991, "percentage": 29.83, "elapsed_time": "0:06:29", "remaining_time": "0:15:15", "throughput": 2851.26, "total_tokens": 1109952} +{"current_steps": 2265, "total_steps": 7577, "loss": 0.0026, "lr": 1.7688013234447757e-06, "epoch": 0.29893097532004753, "percentage": 29.89, "elapsed_time": "0:06:29", "remaining_time": "0:15:13", "throughput": 2854.5, "total_tokens": 1112128} +{"current_steps": 2270, "total_steps": 7577, "loss": 0.1387, "lr": 1.7673261878344973e-06, "epoch": 0.299590867097796, "percentage": 29.96, "elapsed_time": "0:06:29", "remaining_time": "0:15:11", "throughput": 2858.68, "total_tokens": 1114688} +{"current_steps": 2274, "total_steps": 7577, "eval_loss": 0.12411058694124222, "epoch": 0.30011878051999474, "percentage": 30.01, "elapsed_time": "0:06:38", "remaining_time": "0:15:28", "throughput": 2804.9, "total_tokens": 1116800} +{"current_steps": 2275, "total_steps": 7577, "loss": 0.1185, "lr": 1.7658469805014414e-06, "epoch": 0.3002507588755444, "percentage": 30.03, "elapsed_time": "0:07:25", "remaining_time": "0:17:19", "throughput": 2506.0, "total_tokens": 1117248} +{"current_steps": 2280, "total_steps": 7577, "loss": 0.1096, "lr": 1.7643637092948415e-06, "epoch": 0.30091065065329287, "percentage": 30.09, "elapsed_time": "0:07:26", "remaining_time": "0:17:16", "throughput": 2509.88, "total_tokens": 1119808} +{"current_steps": 2285, "total_steps": 7577, "loss": 0.2572, "lr": 1.7628763820854948e-06, "epoch": 0.3015705424310413, "percentage": 30.16, "elapsed_time": "0:07:26", "remaining_time": "0:17:14", "throughput": 2513.23, "total_tokens": 1122112} +{"current_steps": 2290, "total_steps": 7577, "loss": 0.0884, "lr": 1.7613850067657216e-06, "epoch": 0.30223043420878976, "percentage": 30.22, "elapsed_time": "0:07:26", "remaining_time": "0:17:11", "throughput": 2516.85, "total_tokens": 1124544} +{"current_steps": 2295, "total_steps": 7577, "loss": 0.1247, "lr": 1.7598895912493232e-06, "epoch": 0.3028903259865382, "percentage": 30.29, "elapsed_time": "0:07:27", "remaining_time": "0:17:09", "throughput": 2520.72, "total_tokens": 1127104} +{"current_steps": 2300, "total_steps": 7577, "loss": 0.0773, "lr": 1.7583901434715397e-06, "epoch": 0.30355021776428665, "percentage": 30.36, "elapsed_time": "0:07:27", "remaining_time": "0:17:06", "throughput": 2524.32, "total_tokens": 1129536} +{"current_steps": 2305, "total_steps": 7577, "loss": 0.1009, "lr": 1.7568866713890074e-06, "epoch": 0.3042101095420351, "percentage": 30.42, "elapsed_time": "0:07:27", "remaining_time": "0:17:04", "throughput": 2527.65, "total_tokens": 1131840} +{"current_steps": 2310, "total_steps": 7577, "loss": 0.1243, "lr": 1.7553791829797175e-06, "epoch": 0.30487000131978353, "percentage": 30.49, "elapsed_time": "0:07:28", "remaining_time": "0:17:01", "throughput": 2531.38, "total_tokens": 1134336} +{"current_steps": 2315, "total_steps": 7577, "loss": 0.3449, "lr": 1.7538676862429737e-06, "epoch": 0.305529893097532, "percentage": 30.55, "elapsed_time": "0:07:28", "remaining_time": "0:16:59", "throughput": 2534.67, "total_tokens": 1136640} +{"current_steps": 2320, "total_steps": 7577, "loss": 0.1248, "lr": 1.7523521891993486e-06, "epoch": 0.3061897848752805, "percentage": 30.62, "elapsed_time": "0:07:28", "remaining_time": "0:16:56", "throughput": 2538.39, "total_tokens": 1139136} +{"current_steps": 2325, "total_steps": 7577, "loss": 0.0367, "lr": 1.7508326998906422e-06, "epoch": 0.3068496766530289, "percentage": 30.68, "elapsed_time": "0:07:29", "remaining_time": "0:16:54", "throughput": 2541.97, "total_tokens": 1141568} +{"current_steps": 2330, "total_steps": 7577, "loss": 0.0023, "lr": 1.7493092263798394e-06, "epoch": 0.30750956843077737, "percentage": 30.75, "elapsed_time": "0:07:29", "remaining_time": "0:16:52", "throughput": 2545.4, "total_tokens": 1143936} +{"current_steps": 2335, "total_steps": 7577, "loss": 0.0188, "lr": 1.7477817767510664e-06, "epoch": 0.3081694602085258, "percentage": 30.82, "elapsed_time": "0:07:29", "remaining_time": "0:16:49", "throughput": 2549.49, "total_tokens": 1146624} +{"current_steps": 2340, "total_steps": 7577, "loss": 0.0209, "lr": 1.7462503591095484e-06, "epoch": 0.30882935198627426, "percentage": 30.88, "elapsed_time": "0:07:30", "remaining_time": "0:16:47", "throughput": 2553.2, "total_tokens": 1149120} +{"current_steps": 2345, "total_steps": 7577, "loss": 0.1152, "lr": 1.7447149815815659e-06, "epoch": 0.3094892437640227, "percentage": 30.95, "elapsed_time": "0:07:30", "remaining_time": "0:16:44", "throughput": 2556.58, "total_tokens": 1151488} +{"current_steps": 2350, "total_steps": 7577, "loss": 0.1426, "lr": 1.7431756523144126e-06, "epoch": 0.31014913554177115, "percentage": 31.01, "elapsed_time": "0:07:30", "remaining_time": "0:16:42", "throughput": 2559.44, "total_tokens": 1153600} +{"current_steps": 2355, "total_steps": 7577, "loss": 0.0021, "lr": 1.7416323794763512e-06, "epoch": 0.3108090273195196, "percentage": 31.08, "elapsed_time": "0:07:31", "remaining_time": "0:16:40", "throughput": 2563.37, "total_tokens": 1156224} +{"current_steps": 2360, "total_steps": 7577, "loss": 0.234, "lr": 1.7400851712565707e-06, "epoch": 0.31146891909726804, "percentage": 31.15, "elapsed_time": "0:07:31", "remaining_time": "0:16:37", "throughput": 2566.85, "total_tokens": 1158656} +{"current_steps": 2365, "total_steps": 7577, "loss": 0.1276, "lr": 1.7385340358651432e-06, "epoch": 0.3121288108750165, "percentage": 31.21, "elapsed_time": "0:07:31", "remaining_time": "0:16:35", "throughput": 2570.99, "total_tokens": 1161408} +{"current_steps": 2370, "total_steps": 7577, "loss": 0.0223, "lr": 1.736978981532979e-06, "epoch": 0.3127887026527649, "percentage": 31.28, "elapsed_time": "0:07:32", "remaining_time": "0:16:33", "throughput": 2574.62, "total_tokens": 1163904} +{"current_steps": 2375, "total_steps": 7577, "loss": 0.2808, "lr": 1.7354200165117838e-06, "epoch": 0.31344859443051337, "percentage": 31.34, "elapsed_time": "0:07:32", "remaining_time": "0:16:30", "throughput": 2577.81, "total_tokens": 1166208} +{"current_steps": 2380, "total_steps": 7577, "loss": 0.2086, "lr": 1.733857149074016e-06, "epoch": 0.3141084862082619, "percentage": 31.41, "elapsed_time": "0:07:32", "remaining_time": "0:16:28", "throughput": 2581.0, "total_tokens": 1168512} +{"current_steps": 2385, "total_steps": 7577, "loss": 0.2359, "lr": 1.7322903875128402e-06, "epoch": 0.3147683779860103, "percentage": 31.48, "elapsed_time": "0:07:33", "remaining_time": "0:16:26", "throughput": 2584.77, "total_tokens": 1171072} +{"current_steps": 2390, "total_steps": 7577, "loss": 0.0071, "lr": 1.7307197401420858e-06, "epoch": 0.31542826976375876, "percentage": 31.54, "elapsed_time": "0:07:33", "remaining_time": "0:16:23", "throughput": 2587.87, "total_tokens": 1173312} +{"current_steps": 2395, "total_steps": 7577, "loss": 0.1059, "lr": 1.7291452152962018e-06, "epoch": 0.3160881615415072, "percentage": 31.61, "elapsed_time": "0:07:33", "remaining_time": "0:16:21", "throughput": 2591.37, "total_tokens": 1175744} +{"current_steps": 2400, "total_steps": 7577, "loss": 0.2033, "lr": 1.7275668213302116e-06, "epoch": 0.31674805331925565, "percentage": 31.67, "elapsed_time": "0:07:34", "remaining_time": "0:16:19", "throughput": 2594.73, "total_tokens": 1178112} +{"current_steps": 2405, "total_steps": 7577, "loss": 0.0488, "lr": 1.72598456661967e-06, "epoch": 0.3174079450970041, "percentage": 31.74, "elapsed_time": "0:07:34", "remaining_time": "0:16:17", "throughput": 2597.81, "total_tokens": 1180352} +{"current_steps": 2410, "total_steps": 7577, "loss": 0.1241, "lr": 1.7243984595606191e-06, "epoch": 0.31806783687475254, "percentage": 31.81, "elapsed_time": "0:07:34", "remaining_time": "0:16:14", "throughput": 2600.76, "total_tokens": 1182528} +{"current_steps": 2415, "total_steps": 7577, "loss": 0.0697, "lr": 1.722808508569542e-06, "epoch": 0.318727728652501, "percentage": 31.87, "elapsed_time": "0:07:35", "remaining_time": "0:16:12", "throughput": 2604.91, "total_tokens": 1185280} +{"current_steps": 2420, "total_steps": 7577, "loss": 0.0766, "lr": 1.72121472208332e-06, "epoch": 0.31938762043024943, "percentage": 31.94, "elapsed_time": "0:07:35", "remaining_time": "0:16:10", "throughput": 2609.04, "total_tokens": 1188032} +{"current_steps": 2425, "total_steps": 7577, "loss": 0.1857, "lr": 1.7196171085591864e-06, "epoch": 0.3200475122079979, "percentage": 32.0, "elapsed_time": "0:07:35", "remaining_time": "0:16:08", "throughput": 2612.52, "total_tokens": 1190464} +{"current_steps": 2430, "total_steps": 7577, "loss": 0.2532, "lr": 1.7180156764746824e-06, "epoch": 0.3207074039857463, "percentage": 32.07, "elapsed_time": "0:07:36", "remaining_time": "0:16:05", "throughput": 2616.14, "total_tokens": 1192960} +{"current_steps": 2435, "total_steps": 7577, "loss": 0.0694, "lr": 1.7164104343276113e-06, "epoch": 0.32136729576349476, "percentage": 32.14, "elapsed_time": "0:07:36", "remaining_time": "0:16:03", "throughput": 2618.93, "total_tokens": 1195072} +{"current_steps": 2440, "total_steps": 7577, "loss": 0.0516, "lr": 1.714801390635996e-06, "epoch": 0.3220271875412432, "percentage": 32.2, "elapsed_time": "0:07:36", "remaining_time": "0:16:01", "throughput": 2622.12, "total_tokens": 1197376} +{"current_steps": 2445, "total_steps": 7577, "loss": 0.0735, "lr": 1.7131885539380297e-06, "epoch": 0.3226870793189917, "percentage": 32.27, "elapsed_time": "0:07:36", "remaining_time": "0:15:59", "throughput": 2625.82, "total_tokens": 1199936} +{"current_steps": 2450, "total_steps": 7577, "loss": 0.141, "lr": 1.7115719327920335e-06, "epoch": 0.32334697109674015, "percentage": 32.33, "elapsed_time": "0:07:37", "remaining_time": "0:15:56", "throughput": 2629.26, "total_tokens": 1202368} +{"current_steps": 2455, "total_steps": 7577, "loss": 0.0172, "lr": 1.70995153577641e-06, "epoch": 0.3240068628744886, "percentage": 32.4, "elapsed_time": "0:07:37", "remaining_time": "0:15:54", "throughput": 2632.68, "total_tokens": 1204800} +{"current_steps": 2460, "total_steps": 7577, "loss": 0.0639, "lr": 1.7083273714895991e-06, "epoch": 0.32466675465223704, "percentage": 32.47, "elapsed_time": "0:07:37", "remaining_time": "0:15:52", "throughput": 2636.77, "total_tokens": 1207552} +{"current_steps": 2465, "total_steps": 7577, "loss": 0.1031, "lr": 1.7066994485500298e-06, "epoch": 0.3253266464299855, "percentage": 32.53, "elapsed_time": "0:07:38", "remaining_time": "0:15:50", "throughput": 2639.91, "total_tokens": 1209856} +{"current_steps": 2470, "total_steps": 7577, "loss": 0.1125, "lr": 1.7050677755960762e-06, "epoch": 0.32598653820773393, "percentage": 32.6, "elapsed_time": "0:07:38", "remaining_time": "0:15:48", "throughput": 2643.47, "total_tokens": 1212352} +{"current_steps": 2475, "total_steps": 7577, "loss": 0.0832, "lr": 1.7034323612860124e-06, "epoch": 0.3266464299854824, "percentage": 32.66, "elapsed_time": "0:07:38", "remaining_time": "0:15:46", "throughput": 2647.15, "total_tokens": 1214912} +{"current_steps": 2480, "total_steps": 7577, "loss": 0.1275, "lr": 1.7017932142979645e-06, "epoch": 0.3273063217632308, "percentage": 32.73, "elapsed_time": "0:07:39", "remaining_time": "0:15:43", "throughput": 2649.95, "total_tokens": 1217088} +{"current_steps": 2485, "total_steps": 7577, "loss": 0.2478, "lr": 1.700150343329866e-06, "epoch": 0.32796621354097927, "percentage": 32.8, "elapsed_time": "0:07:39", "remaining_time": "0:15:41", "throughput": 2653.47, "total_tokens": 1219584} +{"current_steps": 2490, "total_steps": 7577, "loss": 0.1182, "lr": 1.6985037570994113e-06, "epoch": 0.3286261053187277, "percentage": 32.86, "elapsed_time": "0:07:39", "remaining_time": "0:15:39", "throughput": 2657.55, "total_tokens": 1222336} +{"current_steps": 2495, "total_steps": 7577, "loss": 0.0913, "lr": 1.6968534643440088e-06, "epoch": 0.32928599709647616, "percentage": 32.93, "elapsed_time": "0:07:40", "remaining_time": "0:15:37", "throughput": 2661.07, "total_tokens": 1224832} +{"current_steps": 2500, "total_steps": 7577, "loss": 0.1998, "lr": 1.6951994738207364e-06, "epoch": 0.3299458888742246, "percentage": 32.99, "elapsed_time": "0:07:40", "remaining_time": "0:15:35", "throughput": 2664.73, "total_tokens": 1227392} +{"current_steps": 2505, "total_steps": 7577, "loss": 0.2007, "lr": 1.6935417943062928e-06, "epoch": 0.3306057806519731, "percentage": 33.06, "elapsed_time": "0:07:40", "remaining_time": "0:15:33", "throughput": 2668.38, "total_tokens": 1229952} +{"current_steps": 2510, "total_steps": 7577, "loss": 0.0615, "lr": 1.6918804345969516e-06, "epoch": 0.33126567242972155, "percentage": 33.13, "elapsed_time": "0:07:41", "remaining_time": "0:15:31", "throughput": 2672.28, "total_tokens": 1232640} +{"current_steps": 2515, "total_steps": 7577, "loss": 0.0479, "lr": 1.6902154035085156e-06, "epoch": 0.33192556420747, "percentage": 33.19, "elapsed_time": "0:07:41", "remaining_time": "0:15:29", "throughput": 2675.9, "total_tokens": 1235200} +{"current_steps": 2520, "total_steps": 7577, "loss": 0.1243, "lr": 1.688546709876269e-06, "epoch": 0.33258545598521844, "percentage": 33.26, "elapsed_time": "0:07:41", "remaining_time": "0:15:26", "throughput": 2679.28, "total_tokens": 1237632} +{"current_steps": 2525, "total_steps": 7577, "loss": 0.0662, "lr": 1.6868743625549314e-06, "epoch": 0.3332453477629669, "percentage": 33.32, "elapsed_time": "0:07:42", "remaining_time": "0:15:24", "throughput": 2682.38, "total_tokens": 1239936} +{"current_steps": 2530, "total_steps": 7577, "loss": 0.0455, "lr": 1.6851983704186092e-06, "epoch": 0.3339052395407153, "percentage": 33.39, "elapsed_time": "0:07:42", "remaining_time": "0:15:22", "throughput": 2685.61, "total_tokens": 1242304} +{"current_steps": 2535, "total_steps": 7577, "loss": 0.0018, "lr": 1.6835187423607503e-06, "epoch": 0.33456513131846377, "percentage": 33.46, "elapsed_time": "0:07:42", "remaining_time": "0:15:20", "throughput": 2688.97, "total_tokens": 1244736} +{"current_steps": 2540, "total_steps": 7577, "loss": 0.1863, "lr": 1.681835487294096e-06, "epoch": 0.3352250230962122, "percentage": 33.52, "elapsed_time": "0:07:43", "remaining_time": "0:15:18", "throughput": 2692.97, "total_tokens": 1247488} +{"current_steps": 2545, "total_steps": 7577, "loss": 0.229, "lr": 1.6801486141506342e-06, "epoch": 0.33588491487396066, "percentage": 33.59, "elapsed_time": "0:07:43", "remaining_time": "0:15:16", "throughput": 2696.58, "total_tokens": 1250048} +{"current_steps": 2550, "total_steps": 7577, "loss": 0.3541, "lr": 1.6784581318815514e-06, "epoch": 0.3365448066517091, "percentage": 33.65, "elapsed_time": "0:07:43", "remaining_time": "0:15:14", "throughput": 2700.83, "total_tokens": 1252928} +{"current_steps": 2555, "total_steps": 7577, "loss": 0.1596, "lr": 1.6767640494571849e-06, "epoch": 0.33720469842945755, "percentage": 33.72, "elapsed_time": "0:07:44", "remaining_time": "0:15:12", "throughput": 2704.45, "total_tokens": 1255488} +{"current_steps": 2560, "total_steps": 7577, "loss": 0.3643, "lr": 1.6750663758669767e-06, "epoch": 0.337864590207206, "percentage": 33.79, "elapsed_time": "0:07:44", "remaining_time": "0:15:10", "throughput": 2707.88, "total_tokens": 1257984} +{"current_steps": 2565, "total_steps": 7577, "loss": 0.1098, "lr": 1.6733651201194245e-06, "epoch": 0.3385244819849545, "percentage": 33.85, "elapsed_time": "0:07:44", "remaining_time": "0:15:08", "throughput": 2711.21, "total_tokens": 1260416} +{"current_steps": 2570, "total_steps": 7577, "loss": 0.1186, "lr": 1.6716602912420342e-06, "epoch": 0.33918437376270294, "percentage": 33.92, "elapsed_time": "0:07:45", "remaining_time": "0:15:06", "throughput": 2715.18, "total_tokens": 1263168} +{"current_steps": 2575, "total_steps": 7577, "loss": 0.1177, "lr": 1.6699518982812726e-06, "epoch": 0.3398442655404514, "percentage": 33.98, "elapsed_time": "0:07:45", "remaining_time": "0:15:04", "throughput": 2718.5, "total_tokens": 1265600} +{"current_steps": 2580, "total_steps": 7577, "loss": 0.0041, "lr": 1.6682399503025183e-06, "epoch": 0.34050415731819983, "percentage": 34.05, "elapsed_time": "0:07:45", "remaining_time": "0:15:02", "throughput": 2721.82, "total_tokens": 1268032} +{"current_steps": 2585, "total_steps": 7577, "loss": 0.1831, "lr": 1.666524456390014e-06, "epoch": 0.3411640490959483, "percentage": 34.12, "elapsed_time": "0:07:46", "remaining_time": "0:15:00", "throughput": 2724.86, "total_tokens": 1270336} +{"current_steps": 2590, "total_steps": 7577, "loss": 0.0639, "lr": 1.664805425646819e-06, "epoch": 0.3418239408736967, "percentage": 34.18, "elapsed_time": "0:07:46", "remaining_time": "0:14:58", "throughput": 2728.83, "total_tokens": 1273088} +{"current_steps": 2595, "total_steps": 7577, "loss": 0.2223, "lr": 1.6630828671947606e-06, "epoch": 0.34248383265144516, "percentage": 34.25, "elapsed_time": "0:07:46", "remaining_time": "0:14:56", "throughput": 2731.98, "total_tokens": 1275456} +{"current_steps": 2600, "total_steps": 7577, "loss": 0.0484, "lr": 1.6613567901743842e-06, "epoch": 0.3431437244291936, "percentage": 34.31, "elapsed_time": "0:07:47", "remaining_time": "0:14:54", "throughput": 2735.29, "total_tokens": 1277888} +{"current_steps": 2605, "total_steps": 7577, "loss": 0.0021, "lr": 1.6596272037449075e-06, "epoch": 0.34380361620694205, "percentage": 34.38, "elapsed_time": "0:07:47", "remaining_time": "0:14:52", "throughput": 2738.71, "total_tokens": 1280384} +{"current_steps": 2610, "total_steps": 7577, "loss": 0.0633, "lr": 1.6578941170841696e-06, "epoch": 0.3444635079846905, "percentage": 34.45, "elapsed_time": "0:07:47", "remaining_time": "0:14:50", "throughput": 2742.24, "total_tokens": 1282944} +{"current_steps": 2615, "total_steps": 7577, "loss": 0.0451, "lr": 1.6561575393885833e-06, "epoch": 0.34512339976243894, "percentage": 34.51, "elapsed_time": "0:07:48", "remaining_time": "0:14:48", "throughput": 2745.12, "total_tokens": 1285184} +{"current_steps": 2620, "total_steps": 7577, "loss": 0.2038, "lr": 1.6544174798730864e-06, "epoch": 0.3457832915401874, "percentage": 34.58, "elapsed_time": "0:07:48", "remaining_time": "0:14:46", "throughput": 2748.79, "total_tokens": 1287808} +{"current_steps": 2625, "total_steps": 7577, "loss": 0.1932, "lr": 1.6526739477710923e-06, "epoch": 0.34644318331793583, "percentage": 34.64, "elapsed_time": "0:07:48", "remaining_time": "0:14:44", "throughput": 2752.45, "total_tokens": 1290432} +{"current_steps": 2630, "total_steps": 7577, "loss": 0.2289, "lr": 1.650926952334441e-06, "epoch": 0.34710307509568433, "percentage": 34.71, "elapsed_time": "0:07:49", "remaining_time": "0:14:42", "throughput": 2755.45, "total_tokens": 1292736} +{"current_steps": 2635, "total_steps": 7577, "loss": 0.2947, "lr": 1.6491765028333516e-06, "epoch": 0.3477629668734328, "percentage": 34.78, "elapsed_time": "0:07:49", "remaining_time": "0:14:40", "throughput": 2758.58, "total_tokens": 1295104} +{"current_steps": 2640, "total_steps": 7577, "loss": 0.0444, "lr": 1.6474226085563693e-06, "epoch": 0.3484228586511812, "percentage": 34.84, "elapsed_time": "0:07:49", "remaining_time": "0:14:38", "throughput": 2761.97, "total_tokens": 1297600} +{"current_steps": 2645, "total_steps": 7577, "loss": 0.0057, "lr": 1.6456652788103215e-06, "epoch": 0.34908275042892967, "percentage": 34.91, "elapsed_time": "0:07:50", "remaining_time": "0:14:36", "throughput": 2765.62, "total_tokens": 1300224} +{"current_steps": 2650, "total_steps": 7577, "loss": 0.0494, "lr": 1.6439045229202631e-06, "epoch": 0.3497426422066781, "percentage": 34.97, "elapsed_time": "0:07:50", "remaining_time": "0:14:34", "throughput": 2768.6, "total_tokens": 1302528} +{"current_steps": 2653, "total_steps": 7577, "eval_loss": 0.13837853074073792, "epoch": 0.3501385772733272, "percentage": 35.01, "elapsed_time": "0:07:58", "remaining_time": "0:14:48", "throughput": 2724.81, "total_tokens": 1303872} +{"current_steps": 2655, "total_steps": 7577, "loss": 0.1541, "lr": 1.6421403502294307e-06, "epoch": 0.35040253398442656, "percentage": 35.04, "elapsed_time": "0:08:44", "remaining_time": "0:16:12", "throughput": 2487.41, "total_tokens": 1305024} +{"current_steps": 2660, "total_steps": 7577, "loss": 0.1878, "lr": 1.6403727700991915e-06, "epoch": 0.351062425762175, "percentage": 35.11, "elapsed_time": "0:08:44", "remaining_time": "0:16:10", "throughput": 2490.32, "total_tokens": 1307392} +{"current_steps": 2665, "total_steps": 7577, "loss": 0.273, "lr": 1.6386017919089933e-06, "epoch": 0.35172231753992345, "percentage": 35.17, "elapsed_time": "0:08:45", "remaining_time": "0:16:08", "throughput": 2493.7, "total_tokens": 1310016} +{"current_steps": 2670, "total_steps": 7577, "loss": 0.0471, "lr": 1.636827425056316e-06, "epoch": 0.3523822093176719, "percentage": 35.24, "elapsed_time": "0:08:45", "remaining_time": "0:16:06", "throughput": 2496.99, "total_tokens": 1312576} +{"current_steps": 2675, "total_steps": 7577, "loss": 0.1356, "lr": 1.635049678956621e-06, "epoch": 0.35304210109542034, "percentage": 35.3, "elapsed_time": "0:08:45", "remaining_time": "0:16:03", "throughput": 2500.17, "total_tokens": 1315072} +{"current_steps": 2680, "total_steps": 7577, "loss": 0.125, "lr": 1.633268563043301e-06, "epoch": 0.3537019928731688, "percentage": 35.37, "elapsed_time": "0:08:46", "remaining_time": "0:16:01", "throughput": 2503.24, "total_tokens": 1317504} +{"current_steps": 2685, "total_steps": 7577, "loss": 0.0021, "lr": 1.63148408676763e-06, "epoch": 0.3543618846509172, "percentage": 35.44, "elapsed_time": "0:08:46", "remaining_time": "0:15:59", "throughput": 2505.84, "total_tokens": 1319680} +{"current_steps": 2690, "total_steps": 7577, "loss": 0.001, "lr": 1.6296962595987141e-06, "epoch": 0.3550217764286657, "percentage": 35.5, "elapsed_time": "0:08:46", "remaining_time": "0:15:57", "throughput": 2509.13, "total_tokens": 1322240} +{"current_steps": 2695, "total_steps": 7577, "loss": 0.1102, "lr": 1.6279050910234392e-06, "epoch": 0.35568166820641417, "percentage": 35.57, "elapsed_time": "0:08:47", "remaining_time": "0:15:55", "throughput": 2512.31, "total_tokens": 1324736} +{"current_steps": 2700, "total_steps": 7577, "loss": 0.0617, "lr": 1.626110590546423e-06, "epoch": 0.3563415599841626, "percentage": 35.63, "elapsed_time": "0:08:47", "remaining_time": "0:15:53", "throughput": 2515.26, "total_tokens": 1327104} +{"current_steps": 2705, "total_steps": 7577, "loss": 0.2021, "lr": 1.6243127676899635e-06, "epoch": 0.35700145176191106, "percentage": 35.7, "elapsed_time": "0:08:47", "remaining_time": "0:15:50", "throughput": 2519.0, "total_tokens": 1329920} +{"current_steps": 2710, "total_steps": 7577, "loss": 0.2292, "lr": 1.6225116319939884e-06, "epoch": 0.3576613435396595, "percentage": 35.77, "elapsed_time": "0:08:48", "remaining_time": "0:15:48", "throughput": 2522.03, "total_tokens": 1332352} +{"current_steps": 2715, "total_steps": 7577, "loss": 0.1136, "lr": 1.6207071930160044e-06, "epoch": 0.35832123531740795, "percentage": 35.83, "elapsed_time": "0:08:48", "remaining_time": "0:15:46", "throughput": 2525.52, "total_tokens": 1335040} +{"current_steps": 2720, "total_steps": 7577, "loss": 0.0427, "lr": 1.6188994603310468e-06, "epoch": 0.3589811270951564, "percentage": 35.9, "elapsed_time": "0:08:48", "remaining_time": "0:15:44", "throughput": 2528.54, "total_tokens": 1337472} +{"current_steps": 2725, "total_steps": 7577, "loss": 0.158, "lr": 1.617088443531628e-06, "epoch": 0.35964101887290484, "percentage": 35.96, "elapsed_time": "0:08:49", "remaining_time": "0:15:42", "throughput": 2531.24, "total_tokens": 1339712} +{"current_steps": 2730, "total_steps": 7577, "loss": 0.0092, "lr": 1.6152741522276882e-06, "epoch": 0.3603009106506533, "percentage": 36.03, "elapsed_time": "0:08:49", "remaining_time": "0:15:40", "throughput": 2534.27, "total_tokens": 1342144} +{"current_steps": 2735, "total_steps": 7577, "loss": 0.0433, "lr": 1.6134565960465425e-06, "epoch": 0.36096080242840173, "percentage": 36.1, "elapsed_time": "0:08:49", "remaining_time": "0:15:38", "throughput": 2537.19, "total_tokens": 1344512} +{"current_steps": 2740, "total_steps": 7577, "loss": 0.1562, "lr": 1.6116357846328312e-06, "epoch": 0.3616206942061502, "percentage": 36.16, "elapsed_time": "0:08:50", "remaining_time": "0:15:36", "throughput": 2540.07, "total_tokens": 1346880} +{"current_steps": 2745, "total_steps": 7577, "loss": 0.0123, "lr": 1.609811727648468e-06, "epoch": 0.3622805859838986, "percentage": 36.23, "elapsed_time": "0:08:50", "remaining_time": "0:15:33", "throughput": 2542.6, "total_tokens": 1349056} +{"current_steps": 2750, "total_steps": 7577, "loss": 0.0425, "lr": 1.6079844347725882e-06, "epoch": 0.36294047776164706, "percentage": 36.29, "elapsed_time": "0:08:50", "remaining_time": "0:15:31", "throughput": 2545.59, "total_tokens": 1351488} +{"current_steps": 2755, "total_steps": 7577, "loss": 0.0654, "lr": 1.6061539157014987e-06, "epoch": 0.36360036953939556, "percentage": 36.36, "elapsed_time": "0:08:51", "remaining_time": "0:15:29", "throughput": 2548.57, "total_tokens": 1353920} +{"current_steps": 2760, "total_steps": 7577, "loss": 0.2615, "lr": 1.6043201801486257e-06, "epoch": 0.364260261317144, "percentage": 36.43, "elapsed_time": "0:08:51", "remaining_time": "0:15:27", "throughput": 2551.56, "total_tokens": 1356352} +{"current_steps": 2765, "total_steps": 7577, "loss": 0.1949, "lr": 1.6024832378444628e-06, "epoch": 0.36492015309489245, "percentage": 36.49, "elapsed_time": "0:08:51", "remaining_time": "0:15:25", "throughput": 2555.14, "total_tokens": 1359104} +{"current_steps": 2770, "total_steps": 7577, "loss": 0.3066, "lr": 1.6006430985365204e-06, "epoch": 0.3655800448726409, "percentage": 36.56, "elapsed_time": "0:08:52", "remaining_time": "0:15:23", "throughput": 2558.11, "total_tokens": 1361536} +{"current_steps": 2775, "total_steps": 7577, "loss": 0.2606, "lr": 1.5987997719892735e-06, "epoch": 0.36623993665038934, "percentage": 36.62, "elapsed_time": "0:08:52", "remaining_time": "0:15:21", "throughput": 2561.44, "total_tokens": 1364160} +{"current_steps": 2780, "total_steps": 7577, "loss": 0.005, "lr": 1.5969532679841088e-06, "epoch": 0.3668998284281378, "percentage": 36.69, "elapsed_time": "0:08:52", "remaining_time": "0:15:19", "throughput": 2564.54, "total_tokens": 1366656} +{"current_steps": 2785, "total_steps": 7577, "loss": 0.0512, "lr": 1.5951035963192752e-06, "epoch": 0.36755972020588623, "percentage": 36.76, "elapsed_time": "0:08:53", "remaining_time": "0:15:17", "throughput": 2567.76, "total_tokens": 1369216} +{"current_steps": 2790, "total_steps": 7577, "loss": 0.2619, "lr": 1.593250766809829e-06, "epoch": 0.3682196119836347, "percentage": 36.82, "elapsed_time": "0:08:53", "remaining_time": "0:15:15", "throughput": 2570.85, "total_tokens": 1371712} +{"current_steps": 2795, "total_steps": 7577, "loss": 0.1739, "lr": 1.5913947892875842e-06, "epoch": 0.3688795037613831, "percentage": 36.89, "elapsed_time": "0:08:53", "remaining_time": "0:15:13", "throughput": 2573.71, "total_tokens": 1374080} +{"current_steps": 2800, "total_steps": 7577, "loss": 0.1383, "lr": 1.589535673601059e-06, "epoch": 0.36953939553913157, "percentage": 36.95, "elapsed_time": "0:08:54", "remaining_time": "0:15:11", "throughput": 2577.59, "total_tokens": 1377024} +{"current_steps": 2805, "total_steps": 7577, "loss": 0.0587, "lr": 1.587673429615424e-06, "epoch": 0.37019928731688, "percentage": 37.02, "elapsed_time": "0:08:54", "remaining_time": "0:15:09", "throughput": 2580.44, "total_tokens": 1379392} +{"current_steps": 2810, "total_steps": 7577, "loss": 0.1913, "lr": 1.5858080672124495e-06, "epoch": 0.37085917909462845, "percentage": 37.09, "elapsed_time": "0:08:54", "remaining_time": "0:15:07", "throughput": 2583.3, "total_tokens": 1381760} +{"current_steps": 2815, "total_steps": 7577, "loss": 0.0931, "lr": 1.5839395962904536e-06, "epoch": 0.37151907087237696, "percentage": 37.15, "elapsed_time": "0:08:55", "remaining_time": "0:15:05", "throughput": 2586.15, "total_tokens": 1384128} +{"current_steps": 2820, "total_steps": 7577, "loss": 0.0094, "lr": 1.5820680267642494e-06, "epoch": 0.3721789626501254, "percentage": 37.22, "elapsed_time": "0:08:55", "remaining_time": "0:15:03", "throughput": 2588.98, "total_tokens": 1386496} +{"current_steps": 2825, "total_steps": 7577, "loss": 0.0489, "lr": 1.5801933685650917e-06, "epoch": 0.37283885442787384, "percentage": 37.28, "elapsed_time": "0:08:55", "remaining_time": "0:15:01", "throughput": 2591.6, "total_tokens": 1388736} +{"current_steps": 2830, "total_steps": 7577, "loss": 0.0478, "lr": 1.5783156316406259e-06, "epoch": 0.3734987462056223, "percentage": 37.35, "elapsed_time": "0:08:56", "remaining_time": "0:14:59", "throughput": 2594.33, "total_tokens": 1391040} +{"current_steps": 2835, "total_steps": 7577, "loss": 0.2375, "lr": 1.5764348259548334e-06, "epoch": 0.37415863798337073, "percentage": 37.42, "elapsed_time": "0:08:56", "remaining_time": "0:14:57", "throughput": 2597.06, "total_tokens": 1393344} +{"current_steps": 2840, "total_steps": 7577, "loss": 0.0726, "lr": 1.5745509614879806e-06, "epoch": 0.3748185297611192, "percentage": 37.48, "elapsed_time": "0:08:56", "remaining_time": "0:14:55", "throughput": 2599.78, "total_tokens": 1395648} +{"current_steps": 2845, "total_steps": 7577, "loss": 0.3055, "lr": 1.572664048236564e-06, "epoch": 0.3754784215388676, "percentage": 37.55, "elapsed_time": "0:08:57", "remaining_time": "0:14:53", "throughput": 2603.06, "total_tokens": 1398272} +{"current_steps": 2850, "total_steps": 7577, "loss": 0.0405, "lr": 1.570774096213259e-06, "epoch": 0.37613831331661607, "percentage": 37.61, "elapsed_time": "0:08:57", "remaining_time": "0:14:51", "throughput": 2605.75, "total_tokens": 1400576} +{"current_steps": 2855, "total_steps": 7577, "loss": 0.0015, "lr": 1.5688811154468649e-06, "epoch": 0.3767982050943645, "percentage": 37.68, "elapsed_time": "0:08:57", "remaining_time": "0:14:49", "throughput": 2608.91, "total_tokens": 1403136} +{"current_steps": 2860, "total_steps": 7577, "loss": 0.1948, "lr": 1.5669851159822532e-06, "epoch": 0.37745809687211296, "percentage": 37.75, "elapsed_time": "0:08:58", "remaining_time": "0:14:47", "throughput": 2611.72, "total_tokens": 1405504} +{"current_steps": 2865, "total_steps": 7577, "loss": 0.1405, "lr": 1.5650861078803137e-06, "epoch": 0.3781179886498614, "percentage": 37.81, "elapsed_time": "0:08:58", "remaining_time": "0:14:45", "throughput": 2614.42, "total_tokens": 1407808} +{"current_steps": 2870, "total_steps": 7577, "loss": 0.0803, "lr": 1.5631841012179013e-06, "epoch": 0.37877788042760985, "percentage": 37.88, "elapsed_time": "0:08:58", "remaining_time": "0:14:43", "throughput": 2617.45, "total_tokens": 1410304} +{"current_steps": 2875, "total_steps": 7577, "loss": 0.0026, "lr": 1.5612791060877818e-06, "epoch": 0.37943777220535835, "percentage": 37.94, "elapsed_time": "0:08:59", "remaining_time": "0:14:41", "throughput": 2620.38, "total_tokens": 1412736} +{"current_steps": 2880, "total_steps": 7577, "loss": 0.0403, "lr": 1.5593711325985801e-06, "epoch": 0.3800976639831068, "percentage": 38.01, "elapsed_time": "0:08:59", "remaining_time": "0:14:39", "throughput": 2623.87, "total_tokens": 1415488} +{"current_steps": 2885, "total_steps": 7577, "loss": 0.213, "lr": 1.5574601908747245e-06, "epoch": 0.38075755576085524, "percentage": 38.08, "elapsed_time": "0:08:59", "remaining_time": "0:14:37", "throughput": 2626.66, "total_tokens": 1417856} +{"current_steps": 2890, "total_steps": 7577, "loss": 0.077, "lr": 1.5555462910563936e-06, "epoch": 0.3814174475386037, "percentage": 38.14, "elapsed_time": "0:09:00", "remaining_time": "0:14:35", "throughput": 2629.23, "total_tokens": 1420096} +{"current_steps": 2895, "total_steps": 7577, "loss": 0.2334, "lr": 1.5536294432994636e-06, "epoch": 0.3820773393163521, "percentage": 38.21, "elapsed_time": "0:09:00", "remaining_time": "0:14:34", "throughput": 2632.37, "total_tokens": 1422656} +{"current_steps": 2900, "total_steps": 7577, "loss": 0.0744, "lr": 1.5517096577754528e-06, "epoch": 0.38273723109410057, "percentage": 38.27, "elapsed_time": "0:09:00", "remaining_time": "0:14:32", "throughput": 2635.39, "total_tokens": 1425152} +{"current_steps": 2905, "total_steps": 7577, "loss": 0.0393, "lr": 1.5497869446714695e-06, "epoch": 0.383397122871849, "percentage": 38.34, "elapsed_time": "0:09:01", "remaining_time": "0:14:30", "throughput": 2638.74, "total_tokens": 1427840} +{"current_steps": 2910, "total_steps": 7577, "loss": 0.0065, "lr": 1.5478613141901558e-06, "epoch": 0.38405701464959746, "percentage": 38.41, "elapsed_time": "0:09:01", "remaining_time": "0:14:28", "throughput": 2641.41, "total_tokens": 1430144} +{"current_steps": 2915, "total_steps": 7577, "loss": 0.1329, "lr": 1.5459327765496348e-06, "epoch": 0.3847169064273459, "percentage": 38.47, "elapsed_time": "0:09:01", "remaining_time": "0:14:26", "throughput": 2644.06, "total_tokens": 1432448} +{"current_steps": 2920, "total_steps": 7577, "loss": 0.0276, "lr": 1.5440013419834563e-06, "epoch": 0.38537679820509435, "percentage": 38.54, "elapsed_time": "0:09:02", "remaining_time": "0:14:24", "throughput": 2646.73, "total_tokens": 1434752} +{"current_steps": 2925, "total_steps": 7577, "loss": 0.0011, "lr": 1.5420670207405419e-06, "epoch": 0.3860366899828428, "percentage": 38.6, "elapsed_time": "0:09:02", "remaining_time": "0:14:22", "throughput": 2649.62, "total_tokens": 1437184} +{"current_steps": 2930, "total_steps": 7577, "loss": 0.0935, "lr": 1.5401298230851314e-06, "epoch": 0.38669658176059124, "percentage": 38.67, "elapsed_time": "0:09:02", "remaining_time": "0:14:20", "throughput": 2653.16, "total_tokens": 1440000} +{"current_steps": 2935, "total_steps": 7577, "loss": 0.0716, "lr": 1.5381897592967275e-06, "epoch": 0.3873564735383397, "percentage": 38.74, "elapsed_time": "0:09:03", "remaining_time": "0:14:18", "throughput": 2656.36, "total_tokens": 1442624} +{"current_steps": 2940, "total_steps": 7577, "loss": 0.0019, "lr": 1.5362468396700426e-06, "epoch": 0.3880163653160882, "percentage": 38.8, "elapsed_time": "0:09:03", "remaining_time": "0:14:17", "throughput": 2659.46, "total_tokens": 1445184} +{"current_steps": 2945, "total_steps": 7577, "loss": 0.2755, "lr": 1.5343010745149418e-06, "epoch": 0.38867625709383663, "percentage": 38.87, "elapsed_time": "0:09:03", "remaining_time": "0:14:15", "throughput": 2662.32, "total_tokens": 1447616} +{"current_steps": 2950, "total_steps": 7577, "loss": 0.0004, "lr": 1.532352474156391e-06, "epoch": 0.3893361488715851, "percentage": 38.93, "elapsed_time": "0:09:04", "remaining_time": "0:14:13", "throughput": 2665.39, "total_tokens": 1450176} +{"current_steps": 2955, "total_steps": 7577, "loss": 0.5725, "lr": 1.5304010489343995e-06, "epoch": 0.3899960406493335, "percentage": 39.0, "elapsed_time": "0:09:04", "remaining_time": "0:14:11", "throughput": 2668.37, "total_tokens": 1452672} +{"current_steps": 2960, "total_steps": 7577, "loss": 0.2012, "lr": 1.528446809203968e-06, "epoch": 0.39065593242708196, "percentage": 39.07, "elapsed_time": "0:09:04", "remaining_time": "0:14:09", "throughput": 2671.46, "total_tokens": 1455232} +{"current_steps": 2965, "total_steps": 7577, "loss": 0.1031, "lr": 1.526489765335031e-06, "epoch": 0.3913158242048304, "percentage": 39.13, "elapsed_time": "0:09:05", "remaining_time": "0:14:07", "throughput": 2674.52, "total_tokens": 1457792} +{"current_steps": 2970, "total_steps": 7577, "loss": 0.1237, "lr": 1.5245299277124026e-06, "epoch": 0.39197571598257885, "percentage": 39.2, "elapsed_time": "0:09:05", "remaining_time": "0:14:06", "throughput": 2677.26, "total_tokens": 1460160} +{"current_steps": 2975, "total_steps": 7577, "loss": 0.1705, "lr": 1.5225673067357218e-06, "epoch": 0.3926356077603273, "percentage": 39.26, "elapsed_time": "0:09:05", "remaining_time": "0:14:04", "throughput": 2679.77, "total_tokens": 1462400} +{"current_steps": 2980, "total_steps": 7577, "loss": 0.1399, "lr": 1.5206019128193981e-06, "epoch": 0.39329549953807574, "percentage": 39.33, "elapsed_time": "0:09:06", "remaining_time": "0:14:02", "throughput": 2683.06, "total_tokens": 1465088} +{"current_steps": 2985, "total_steps": 7577, "loss": 0.167, "lr": 1.5186337563925538e-06, "epoch": 0.3939553913158242, "percentage": 39.4, "elapsed_time": "0:09:06", "remaining_time": "0:14:00", "throughput": 2685.8, "total_tokens": 1467456} +{"current_steps": 2990, "total_steps": 7577, "loss": 0.001, "lr": 1.516662847898971e-06, "epoch": 0.39461528309357263, "percentage": 39.46, "elapsed_time": "0:09:06", "remaining_time": "0:13:58", "throughput": 2688.85, "total_tokens": 1470016} +{"current_steps": 2995, "total_steps": 7577, "loss": 0.0936, "lr": 1.5146891977970349e-06, "epoch": 0.3952751748713211, "percentage": 39.53, "elapsed_time": "0:09:07", "remaining_time": "0:13:56", "throughput": 2691.7, "total_tokens": 1472448} +{"current_steps": 3000, "total_steps": 7577, "loss": 0.0271, "lr": 1.5127128165596794e-06, "epoch": 0.3959350666490696, "percentage": 39.59, "elapsed_time": "0:09:07", "remaining_time": "0:13:55", "throughput": 2694.86, "total_tokens": 1475072} +{"current_steps": 3005, "total_steps": 7577, "loss": 0.0571, "lr": 1.51073371467433e-06, "epoch": 0.396594958426818, "percentage": 39.66, "elapsed_time": "0:09:07", "remaining_time": "0:13:53", "throughput": 2697.58, "total_tokens": 1477440} +{"current_steps": 3010, "total_steps": 7577, "loss": 0.027, "lr": 1.5087519026428498e-06, "epoch": 0.39725485020456647, "percentage": 39.73, "elapsed_time": "0:09:08", "remaining_time": "0:13:51", "throughput": 2700.36, "total_tokens": 1479872} +{"current_steps": 3015, "total_steps": 7577, "loss": 0.2218, "lr": 1.5067673909814818e-06, "epoch": 0.3979147419823149, "percentage": 39.79, "elapsed_time": "0:09:08", "remaining_time": "0:13:49", "throughput": 2702.51, "total_tokens": 1481920} +{"current_steps": 3020, "total_steps": 7577, "loss": 0.1557, "lr": 1.5047801902207953e-06, "epoch": 0.39857463376006336, "percentage": 39.86, "elapsed_time": "0:09:08", "remaining_time": "0:13:47", "throughput": 2706.43, "total_tokens": 1484992} +{"current_steps": 3025, "total_steps": 7577, "loss": 0.2134, "lr": 1.5027903109056288e-06, "epoch": 0.3992345255378118, "percentage": 39.92, "elapsed_time": "0:09:09", "remaining_time": "0:13:46", "throughput": 2708.9, "total_tokens": 1487232} +{"current_steps": 3030, "total_steps": 7577, "loss": 0.1412, "lr": 1.5007977635950336e-06, "epoch": 0.39989441731556025, "percentage": 39.99, "elapsed_time": "0:09:09", "remaining_time": "0:13:44", "throughput": 2711.82, "total_tokens": 1489728} +{"current_steps": 3032, "total_steps": 7577, "eval_loss": 0.13093648850917816, "epoch": 0.4001583740266596, "percentage": 40.02, "elapsed_time": "0:09:17", "remaining_time": "0:13:55", "throughput": 2674.27, "total_tokens": 1490688} +{"current_steps": 3035, "total_steps": 7577, "loss": 0.2057, "lr": 1.498802558862219e-06, "epoch": 0.4005543090933087, "percentage": 40.06, "elapsed_time": "0:09:40", "remaining_time": "0:14:28", "throughput": 2571.02, "total_tokens": 1491968} +{"current_steps": 3040, "total_steps": 7577, "loss": 0.1003, "lr": 1.496804707294496e-06, "epoch": 0.40121420087105714, "percentage": 40.12, "elapsed_time": "0:09:40", "remaining_time": "0:14:26", "throughput": 2573.61, "total_tokens": 1494336} +{"current_steps": 3045, "total_steps": 7577, "loss": 0.065, "lr": 1.4948042194932195e-06, "epoch": 0.4018740926488056, "percentage": 40.19, "elapsed_time": "0:09:40", "remaining_time": "0:14:24", "throughput": 2577.47, "total_tokens": 1497472} +{"current_steps": 3050, "total_steps": 7577, "loss": 0.0242, "lr": 1.4928011060737341e-06, "epoch": 0.402533984426554, "percentage": 40.25, "elapsed_time": "0:09:41", "remaining_time": "0:14:22", "throughput": 2580.29, "total_tokens": 1499968} +{"current_steps": 3055, "total_steps": 7577, "loss": 0.0811, "lr": 1.4907953776653171e-06, "epoch": 0.40319387620430247, "percentage": 40.32, "elapsed_time": "0:09:41", "remaining_time": "0:14:20", "throughput": 2582.91, "total_tokens": 1502336} +{"current_steps": 3060, "total_steps": 7577, "loss": 0.1462, "lr": 1.4887870449111206e-06, "epoch": 0.40385376798205097, "percentage": 40.39, "elapsed_time": "0:09:41", "remaining_time": "0:14:19", "throughput": 2585.31, "total_tokens": 1504576} +{"current_steps": 3065, "total_steps": 7577, "loss": 0.2155, "lr": 1.486776118468118e-06, "epoch": 0.4045136597597994, "percentage": 40.45, "elapsed_time": "0:09:42", "remaining_time": "0:14:17", "throughput": 2588.24, "total_tokens": 1507136} +{"current_steps": 3070, "total_steps": 7577, "loss": 0.0479, "lr": 1.4847626090070451e-06, "epoch": 0.40517355153754786, "percentage": 40.52, "elapsed_time": "0:09:42", "remaining_time": "0:14:15", "throughput": 2591.18, "total_tokens": 1509696} +{"current_steps": 3075, "total_steps": 7577, "loss": 0.3045, "lr": 1.4827465272123439e-06, "epoch": 0.4058334433152963, "percentage": 40.58, "elapsed_time": "0:09:42", "remaining_time": "0:14:13", "throughput": 2594.01, "total_tokens": 1512192} +{"current_steps": 3080, "total_steps": 7577, "loss": 0.0134, "lr": 1.4807278837821063e-06, "epoch": 0.40649333509304475, "percentage": 40.65, "elapsed_time": "0:09:43", "remaining_time": "0:14:11", "throughput": 2596.94, "total_tokens": 1514752} +{"current_steps": 3085, "total_steps": 7577, "loss": 0.3, "lr": 1.4787066894280178e-06, "epoch": 0.4071532268707932, "percentage": 40.72, "elapsed_time": "0:09:43", "remaining_time": "0:14:09", "throughput": 2600.06, "total_tokens": 1517440} +{"current_steps": 3090, "total_steps": 7577, "loss": 0.0679, "lr": 1.476682954875299e-06, "epoch": 0.40781311864854164, "percentage": 40.78, "elapsed_time": "0:09:43", "remaining_time": "0:14:07", "throughput": 2602.57, "total_tokens": 1519744} +{"current_steps": 3095, "total_steps": 7577, "loss": 0.1745, "lr": 1.4746566908626506e-06, "epoch": 0.4084730104262901, "percentage": 40.85, "elapsed_time": "0:09:44", "remaining_time": "0:14:06", "throughput": 2605.26, "total_tokens": 1522176} +{"current_steps": 3100, "total_steps": 7577, "loss": 0.0519, "lr": 1.4726279081421956e-06, "epoch": 0.40913290220403853, "percentage": 40.91, "elapsed_time": "0:09:44", "remaining_time": "0:14:04", "throughput": 2607.56, "total_tokens": 1524352} +{"current_steps": 3105, "total_steps": 7577, "loss": 0.2616, "lr": 1.4705966174794216e-06, "epoch": 0.409792793981787, "percentage": 40.98, "elapsed_time": "0:09:44", "remaining_time": "0:14:02", "throughput": 2610.53, "total_tokens": 1526976} +{"current_steps": 3110, "total_steps": 7577, "loss": 0.1047, "lr": 1.4685628296531248e-06, "epoch": 0.4104526857595354, "percentage": 41.05, "elapsed_time": "0:09:45", "remaining_time": "0:14:00", "throughput": 2612.78, "total_tokens": 1529152} +{"current_steps": 3115, "total_steps": 7577, "loss": 0.0288, "lr": 1.466526555455352e-06, "epoch": 0.41111257753728386, "percentage": 41.11, "elapsed_time": "0:09:45", "remaining_time": "0:13:58", "throughput": 2615.53, "total_tokens": 1531648} +{"current_steps": 3120, "total_steps": 7577, "loss": 0.0023, "lr": 1.4644878056913432e-06, "epoch": 0.4117724693150323, "percentage": 41.18, "elapsed_time": "0:09:45", "remaining_time": "0:13:57", "throughput": 2617.96, "total_tokens": 1533952} +{"current_steps": 3125, "total_steps": 7577, "loss": 0.165, "lr": 1.4624465911794764e-06, "epoch": 0.4124323610927808, "percentage": 41.24, "elapsed_time": "0:09:46", "remaining_time": "0:13:55", "throughput": 2621.04, "total_tokens": 1536640} +{"current_steps": 3130, "total_steps": 7577, "loss": 0.0024, "lr": 1.4604029227512062e-06, "epoch": 0.41309225287052925, "percentage": 41.31, "elapsed_time": "0:09:46", "remaining_time": "0:13:53", "throughput": 2623.92, "total_tokens": 1539200} +{"current_steps": 3135, "total_steps": 7577, "loss": 0.1984, "lr": 1.4583568112510108e-06, "epoch": 0.4137521446482777, "percentage": 41.38, "elapsed_time": "0:09:46", "remaining_time": "0:13:51", "throughput": 2626.61, "total_tokens": 1541632} +{"current_steps": 3140, "total_steps": 7577, "loss": 0.0697, "lr": 1.4563082675363302e-06, "epoch": 0.41441203642602614, "percentage": 41.44, "elapsed_time": "0:09:47", "remaining_time": "0:13:49", "throughput": 2629.4, "total_tokens": 1544128} +{"current_steps": 3145, "total_steps": 7577, "loss": 0.0009, "lr": 1.4542573024775122e-06, "epoch": 0.4150719282037746, "percentage": 41.51, "elapsed_time": "0:09:47", "remaining_time": "0:13:48", "throughput": 2631.75, "total_tokens": 1546368} +{"current_steps": 3150, "total_steps": 7577, "loss": 0.3214, "lr": 1.4522039269577521e-06, "epoch": 0.41573181998152303, "percentage": 41.57, "elapsed_time": "0:09:47", "remaining_time": "0:13:46", "throughput": 2634.32, "total_tokens": 1548736} +{"current_steps": 3155, "total_steps": 7577, "loss": 0.223, "lr": 1.4501481518730372e-06, "epoch": 0.4163917117592715, "percentage": 41.64, "elapsed_time": "0:09:48", "remaining_time": "0:13:44", "throughput": 2636.99, "total_tokens": 1551168} +{"current_steps": 3160, "total_steps": 7577, "loss": 0.0751, "lr": 1.4480899881320868e-06, "epoch": 0.4170516035370199, "percentage": 41.71, "elapsed_time": "0:09:48", "remaining_time": "0:13:42", "throughput": 2639.75, "total_tokens": 1553664} +{"current_steps": 3165, "total_steps": 7577, "loss": 0.1681, "lr": 1.4460294466562956e-06, "epoch": 0.41771149531476837, "percentage": 41.77, "elapsed_time": "0:09:48", "remaining_time": "0:13:40", "throughput": 2642.21, "total_tokens": 1555968} +{"current_steps": 3170, "total_steps": 7577, "loss": 0.0974, "lr": 1.4439665383796756e-06, "epoch": 0.4183713870925168, "percentage": 41.84, "elapsed_time": "0:09:49", "remaining_time": "0:13:39", "throughput": 2644.57, "total_tokens": 1558208} +{"current_steps": 3175, "total_steps": 7577, "loss": 0.003, "lr": 1.4419012742487972e-06, "epoch": 0.41903127887026526, "percentage": 41.9, "elapsed_time": "0:09:49", "remaining_time": "0:13:37", "throughput": 2647.22, "total_tokens": 1560640} +{"current_steps": 3180, "total_steps": 7577, "loss": 0.0019, "lr": 1.4398336652227335e-06, "epoch": 0.4196911706480137, "percentage": 41.97, "elapsed_time": "0:09:49", "remaining_time": "0:13:35", "throughput": 2650.3, "total_tokens": 1563328} +{"current_steps": 3185, "total_steps": 7577, "loss": 0.1522, "lr": 1.4377637222729986e-06, "epoch": 0.4203510624257622, "percentage": 42.04, "elapsed_time": "0:09:50", "remaining_time": "0:13:33", "throughput": 2652.83, "total_tokens": 1565696} +{"current_steps": 3190, "total_steps": 7577, "loss": 0.1285, "lr": 1.435691456383493e-06, "epoch": 0.42101095420351065, "percentage": 42.1, "elapsed_time": "0:09:50", "remaining_time": "0:13:32", "throughput": 2656.3, "total_tokens": 1568640} +{"current_steps": 3195, "total_steps": 7577, "loss": 0.128, "lr": 1.433616878550442e-06, "epoch": 0.4216708459812591, "percentage": 42.17, "elapsed_time": "0:09:50", "remaining_time": "0:13:30", "throughput": 2659.34, "total_tokens": 1571328} +{"current_steps": 3200, "total_steps": 7577, "loss": 0.3784, "lr": 1.4315399997823403e-06, "epoch": 0.42233073775900754, "percentage": 42.23, "elapsed_time": "0:09:51", "remaining_time": "0:13:28", "throughput": 2662.38, "total_tokens": 1574016} +{"current_steps": 3205, "total_steps": 7577, "loss": 0.2654, "lr": 1.429460831099891e-06, "epoch": 0.422990629536756, "percentage": 42.3, "elapsed_time": "0:09:51", "remaining_time": "0:13:26", "throughput": 2664.9, "total_tokens": 1576384} +{"current_steps": 3210, "total_steps": 7577, "loss": 0.2098, "lr": 1.4273793835359492e-06, "epoch": 0.4236505213145044, "percentage": 42.37, "elapsed_time": "0:09:51", "remaining_time": "0:13:25", "throughput": 2668.13, "total_tokens": 1579200} +{"current_steps": 3215, "total_steps": 7577, "loss": 0.1142, "lr": 1.4252956681354631e-06, "epoch": 0.42431041309225287, "percentage": 42.43, "elapsed_time": "0:09:52", "remaining_time": "0:13:23", "throughput": 2670.75, "total_tokens": 1581632} +{"current_steps": 3220, "total_steps": 7577, "loss": 0.0092, "lr": 1.4232096959554135e-06, "epoch": 0.4249703048700013, "percentage": 42.5, "elapsed_time": "0:09:52", "remaining_time": "0:13:21", "throughput": 2673.37, "total_tokens": 1584064} +{"current_steps": 3225, "total_steps": 7577, "loss": 0.0457, "lr": 1.4211214780647572e-06, "epoch": 0.42563019664774976, "percentage": 42.56, "elapsed_time": "0:09:52", "remaining_time": "0:13:20", "throughput": 2676.41, "total_tokens": 1586752} +{"current_steps": 3230, "total_steps": 7577, "loss": 0.0764, "lr": 1.4190310255443676e-06, "epoch": 0.4262900884254982, "percentage": 42.63, "elapsed_time": "0:09:53", "remaining_time": "0:13:18", "throughput": 2679.15, "total_tokens": 1589248} +{"current_steps": 3235, "total_steps": 7577, "loss": 0.0141, "lr": 1.4169383494869764e-06, "epoch": 0.42694998020324665, "percentage": 42.69, "elapsed_time": "0:09:53", "remaining_time": "0:13:16", "throughput": 2681.56, "total_tokens": 1591552} +{"current_steps": 3240, "total_steps": 7577, "loss": 0.051, "lr": 1.414843460997113e-06, "epoch": 0.4276098719809951, "percentage": 42.76, "elapsed_time": "0:09:53", "remaining_time": "0:13:14", "throughput": 2684.28, "total_tokens": 1594048} +{"current_steps": 3245, "total_steps": 7577, "loss": 0.1432, "lr": 1.4127463711910483e-06, "epoch": 0.4282697637587436, "percentage": 42.83, "elapsed_time": "0:09:54", "remaining_time": "0:13:13", "throughput": 2686.97, "total_tokens": 1596544} +{"current_steps": 3250, "total_steps": 7577, "loss": 0.1601, "lr": 1.410647091196733e-06, "epoch": 0.42892965553649204, "percentage": 42.89, "elapsed_time": "0:09:54", "remaining_time": "0:13:11", "throughput": 2689.8, "total_tokens": 1599104} +{"current_steps": 3255, "total_steps": 7577, "loss": 0.1324, "lr": 1.4085456321537402e-06, "epoch": 0.4295895473142405, "percentage": 42.96, "elapsed_time": "0:09:54", "remaining_time": "0:13:09", "throughput": 2692.1, "total_tokens": 1601344} +{"current_steps": 3260, "total_steps": 7577, "loss": 0.2152, "lr": 1.4064420052132056e-06, "epoch": 0.43024943909198893, "percentage": 43.02, "elapsed_time": "0:09:55", "remaining_time": "0:13:08", "throughput": 2695.01, "total_tokens": 1603968} +{"current_steps": 3265, "total_steps": 7577, "loss": 0.0317, "lr": 1.4043362215377696e-06, "epoch": 0.4309093308697374, "percentage": 43.09, "elapsed_time": "0:09:55", "remaining_time": "0:13:06", "throughput": 2697.63, "total_tokens": 1606400} +{"current_steps": 3270, "total_steps": 7577, "loss": 0.1258, "lr": 1.4022282923015158e-06, "epoch": 0.4315692226474858, "percentage": 43.16, "elapsed_time": "0:09:55", "remaining_time": "0:13:04", "throughput": 2700.42, "total_tokens": 1608960} +{"current_steps": 3275, "total_steps": 7577, "loss": 0.0026, "lr": 1.4001182286899136e-06, "epoch": 0.43222911442523426, "percentage": 43.22, "elapsed_time": "0:09:56", "remaining_time": "0:13:03", "throughput": 2703.14, "total_tokens": 1611456} +{"current_steps": 3280, "total_steps": 7577, "loss": 0.0702, "lr": 1.398006041899758e-06, "epoch": 0.4328890062029827, "percentage": 43.29, "elapsed_time": "0:09:56", "remaining_time": "0:13:01", "throughput": 2705.84, "total_tokens": 1613952} +{"current_steps": 3285, "total_steps": 7577, "loss": 0.1748, "lr": 1.3958917431391102e-06, "epoch": 0.43354889798073115, "percentage": 43.35, "elapsed_time": "0:09:56", "remaining_time": "0:12:59", "throughput": 2708.35, "total_tokens": 1616320} +{"current_steps": 3290, "total_steps": 7577, "loss": 0.1856, "lr": 1.3937753436272388e-06, "epoch": 0.4342087897584796, "percentage": 43.42, "elapsed_time": "0:09:57", "remaining_time": "0:12:58", "throughput": 2711.55, "total_tokens": 1619136} +{"current_steps": 3295, "total_steps": 7577, "loss": 0.118, "lr": 1.3916568545945597e-06, "epoch": 0.43486868153622804, "percentage": 43.49, "elapsed_time": "0:09:57", "remaining_time": "0:12:56", "throughput": 2714.25, "total_tokens": 1621632} +{"current_steps": 3300, "total_steps": 7577, "loss": 0.1392, "lr": 1.3895362872825764e-06, "epoch": 0.4355285733139765, "percentage": 43.55, "elapsed_time": "0:09:57", "remaining_time": "0:12:54", "throughput": 2716.84, "total_tokens": 1624064} +{"current_steps": 3305, "total_steps": 7577, "loss": 0.0494, "lr": 1.3874136529438205e-06, "epoch": 0.43618846509172493, "percentage": 43.62, "elapsed_time": "0:09:58", "remaining_time": "0:12:53", "throughput": 2719.44, "total_tokens": 1626496} +{"current_steps": 3310, "total_steps": 7577, "loss": 0.1045, "lr": 1.3852889628417918e-06, "epoch": 0.43684835686947343, "percentage": 43.68, "elapsed_time": "0:09:58", "remaining_time": "0:12:51", "throughput": 2721.82, "total_tokens": 1628800} +{"current_steps": 3315, "total_steps": 7577, "loss": 0.104, "lr": 1.3831622282508994e-06, "epoch": 0.4375082486472219, "percentage": 43.75, "elapsed_time": "0:09:58", "remaining_time": "0:12:49", "throughput": 2724.41, "total_tokens": 1631232} +{"current_steps": 3320, "total_steps": 7577, "loss": 0.0011, "lr": 1.3810334604564007e-06, "epoch": 0.4381681404249703, "percentage": 43.82, "elapsed_time": "0:09:59", "remaining_time": "0:12:48", "throughput": 2727.09, "total_tokens": 1633728} +{"current_steps": 3325, "total_steps": 7577, "loss": 0.0735, "lr": 1.3789026707543423e-06, "epoch": 0.43882803220271877, "percentage": 43.88, "elapsed_time": "0:09:59", "remaining_time": "0:12:46", "throughput": 2729.78, "total_tokens": 1636224} +{"current_steps": 3330, "total_steps": 7577, "loss": 0.063, "lr": 1.3767698704514998e-06, "epoch": 0.4394879239804672, "percentage": 43.95, "elapsed_time": "0:09:59", "remaining_time": "0:12:44", "throughput": 2731.71, "total_tokens": 1638272} +{"current_steps": 3335, "total_steps": 7577, "loss": 0.1941, "lr": 1.3746350708653175e-06, "epoch": 0.44014781575821565, "percentage": 44.01, "elapsed_time": "0:10:00", "remaining_time": "0:12:43", "throughput": 2733.96, "total_tokens": 1640512} +{"current_steps": 3340, "total_steps": 7577, "loss": 0.2224, "lr": 1.3724982833238495e-06, "epoch": 0.4408077075359641, "percentage": 44.08, "elapsed_time": "0:10:00", "remaining_time": "0:12:41", "throughput": 2736.52, "total_tokens": 1642944} +{"current_steps": 3345, "total_steps": 7577, "loss": 0.1334, "lr": 1.370359519165697e-06, "epoch": 0.44146759931371254, "percentage": 44.15, "elapsed_time": "0:10:00", "remaining_time": "0:12:39", "throughput": 2739.08, "total_tokens": 1645376} +{"current_steps": 3350, "total_steps": 7577, "loss": 0.0429, "lr": 1.368218789739952e-06, "epoch": 0.442127491091461, "percentage": 44.21, "elapsed_time": "0:10:01", "remaining_time": "0:12:38", "throughput": 2741.86, "total_tokens": 1647936} +{"current_steps": 3355, "total_steps": 7577, "loss": 0.1404, "lr": 1.3660761064061337e-06, "epoch": 0.44278738286920943, "percentage": 44.28, "elapsed_time": "0:10:01", "remaining_time": "0:12:36", "throughput": 2744.6, "total_tokens": 1650496} +{"current_steps": 3360, "total_steps": 7577, "loss": 0.1065, "lr": 1.3639314805341297e-06, "epoch": 0.4434472746469579, "percentage": 44.34, "elapsed_time": "0:10:01", "remaining_time": "0:12:35", "throughput": 2747.25, "total_tokens": 1652992} +{"current_steps": 3365, "total_steps": 7577, "loss": 0.0935, "lr": 1.3617849235041355e-06, "epoch": 0.4441071664247063, "percentage": 44.41, "elapsed_time": "0:10:02", "remaining_time": "0:12:33", "throughput": 2749.9, "total_tokens": 1655488} +{"current_steps": 3370, "total_steps": 7577, "loss": 0.1084, "lr": 1.3596364467065938e-06, "epoch": 0.4447670582024548, "percentage": 44.48, "elapsed_time": "0:10:02", "remaining_time": "0:12:31", "throughput": 2752.54, "total_tokens": 1657984} +{"current_steps": 3375, "total_steps": 7577, "loss": 0.2514, "lr": 1.3574860615421346e-06, "epoch": 0.44542694998020327, "percentage": 44.54, "elapsed_time": "0:10:02", "remaining_time": "0:12:30", "throughput": 2755.56, "total_tokens": 1660736} +{"current_steps": 3380, "total_steps": 7577, "loss": 0.1354, "lr": 1.3553337794215147e-06, "epoch": 0.4460868417579517, "percentage": 44.61, "elapsed_time": "0:10:03", "remaining_time": "0:12:28", "throughput": 2757.99, "total_tokens": 1663104} +{"current_steps": 3385, "total_steps": 7577, "loss": 0.1002, "lr": 1.3531796117655565e-06, "epoch": 0.44674673353570016, "percentage": 44.67, "elapsed_time": "0:10:03", "remaining_time": "0:12:27", "throughput": 2760.19, "total_tokens": 1665344} +{"current_steps": 3390, "total_steps": 7577, "loss": 0.156, "lr": 1.3510235700050873e-06, "epoch": 0.4474066253134486, "percentage": 44.74, "elapsed_time": "0:10:03", "remaining_time": "0:12:25", "throughput": 2763.22, "total_tokens": 1668096} +{"current_steps": 3395, "total_steps": 7577, "loss": 0.0959, "lr": 1.3488656655808801e-06, "epoch": 0.44806651709119705, "percentage": 44.81, "elapsed_time": "0:10:04", "remaining_time": "0:12:24", "throughput": 2765.34, "total_tokens": 1670272} +{"current_steps": 3400, "total_steps": 7577, "loss": 0.0913, "lr": 1.3467059099435912e-06, "epoch": 0.4487264088689455, "percentage": 44.87, "elapsed_time": "0:10:04", "remaining_time": "0:12:22", "throughput": 2767.44, "total_tokens": 1672448} +{"current_steps": 3405, "total_steps": 7577, "loss": 0.0055, "lr": 1.3445443145537002e-06, "epoch": 0.44938630064669394, "percentage": 44.94, "elapsed_time": "0:10:04", "remaining_time": "0:12:20", "throughput": 2770.45, "total_tokens": 1675200} +{"current_steps": 3410, "total_steps": 7577, "loss": 0.0509, "lr": 1.3423808908814494e-06, "epoch": 0.4500461924244424, "percentage": 45.0, "elapsed_time": "0:10:05", "remaining_time": "0:12:19", "throughput": 2773.05, "total_tokens": 1677696} +{"current_steps": 3411, "total_steps": 7577, "eval_loss": 0.11581598222255707, "epoch": 0.45017817077999206, "percentage": 45.02, "elapsed_time": "0:10:12", "remaining_time": "0:12:28", "throughput": 2738.16, "total_tokens": 1678208} +{"current_steps": 3415, "total_steps": 7577, "loss": 0.0982, "lr": 1.3402156504067826e-06, "epoch": 0.4507060842021908, "percentage": 45.07, "elapsed_time": "0:11:10", "remaining_time": "0:13:37", "throughput": 2505.28, "total_tokens": 1680256} +{"current_steps": 3420, "total_steps": 7577, "loss": 0.0816, "lr": 1.338048604619284e-06, "epoch": 0.45136597597993927, "percentage": 45.14, "elapsed_time": "0:11:11", "remaining_time": "0:13:35", "throughput": 2507.57, "total_tokens": 1682624} +{"current_steps": 3425, "total_steps": 7577, "loss": 0.0548, "lr": 1.3358797650181178e-06, "epoch": 0.4520258677576877, "percentage": 45.2, "elapsed_time": "0:11:11", "remaining_time": "0:13:33", "throughput": 2509.96, "total_tokens": 1685056} +{"current_steps": 3430, "total_steps": 7577, "loss": 0.1743, "lr": 1.3337091431119662e-06, "epoch": 0.45268575953543616, "percentage": 45.27, "elapsed_time": "0:11:11", "remaining_time": "0:13:32", "throughput": 2511.89, "total_tokens": 1687168} +{"current_steps": 3435, "total_steps": 7577, "loss": 0.263, "lr": 1.3315367504189698e-06, "epoch": 0.45334565131318466, "percentage": 45.33, "elapsed_time": "0:11:11", "remaining_time": "0:13:30", "throughput": 2513.72, "total_tokens": 1689216} +{"current_steps": 3440, "total_steps": 7577, "loss": 0.0704, "lr": 1.3293625984666656e-06, "epoch": 0.4540055430909331, "percentage": 45.4, "elapsed_time": "0:11:12", "remaining_time": "0:13:28", "throughput": 2516.27, "total_tokens": 1691776} +{"current_steps": 3445, "total_steps": 7577, "loss": 0.0008, "lr": 1.3271866987919254e-06, "epoch": 0.45466543486868155, "percentage": 45.47, "elapsed_time": "0:11:12", "remaining_time": "0:13:26", "throughput": 2518.84, "total_tokens": 1694336} +{"current_steps": 3450, "total_steps": 7577, "loss": 0.2066, "lr": 1.325009062940895e-06, "epoch": 0.45532532664643, "percentage": 45.53, "elapsed_time": "0:11:12", "remaining_time": "0:13:25", "throughput": 2521.03, "total_tokens": 1696640} +{"current_steps": 3455, "total_steps": 7577, "loss": 0.0826, "lr": 1.3228297024689336e-06, "epoch": 0.45598521842417844, "percentage": 45.6, "elapsed_time": "0:11:13", "remaining_time": "0:13:23", "throughput": 2523.13, "total_tokens": 1698880} +{"current_steps": 3460, "total_steps": 7577, "loss": 0.1221, "lr": 1.3206486289405519e-06, "epoch": 0.4566451102019269, "percentage": 45.66, "elapsed_time": "0:11:13", "remaining_time": "0:13:21", "throughput": 2525.51, "total_tokens": 1701312} +{"current_steps": 3465, "total_steps": 7577, "loss": 0.1446, "lr": 1.3184658539293496e-06, "epoch": 0.45730500197967533, "percentage": 45.73, "elapsed_time": "0:11:13", "remaining_time": "0:13:19", "throughput": 2527.98, "total_tokens": 1703808} +{"current_steps": 3470, "total_steps": 7577, "loss": 0.132, "lr": 1.3162813890179564e-06, "epoch": 0.4579648937574238, "percentage": 45.8, "elapsed_time": "0:11:14", "remaining_time": "0:13:18", "throughput": 2530.45, "total_tokens": 1706304} +{"current_steps": 3475, "total_steps": 7577, "loss": 0.236, "lr": 1.314095245797969e-06, "epoch": 0.4586247855351722, "percentage": 45.86, "elapsed_time": "0:11:14", "remaining_time": "0:13:16", "throughput": 2532.84, "total_tokens": 1708736} +{"current_steps": 3480, "total_steps": 7577, "loss": 0.1477, "lr": 1.3119074358698891e-06, "epoch": 0.45928467731292066, "percentage": 45.93, "elapsed_time": "0:11:14", "remaining_time": "0:13:14", "throughput": 2535.3, "total_tokens": 1711232} +{"current_steps": 3485, "total_steps": 7577, "loss": 0.003, "lr": 1.3097179708430634e-06, "epoch": 0.4599445690906691, "percentage": 45.99, "elapsed_time": "0:11:15", "remaining_time": "0:13:12", "throughput": 2537.57, "total_tokens": 1713600} +{"current_steps": 3490, "total_steps": 7577, "loss": 0.1998, "lr": 1.3075268623356214e-06, "epoch": 0.46060446086841755, "percentage": 46.06, "elapsed_time": "0:11:15", "remaining_time": "0:13:11", "throughput": 2540.22, "total_tokens": 1716224} +{"current_steps": 3495, "total_steps": 7577, "loss": 0.1462, "lr": 1.305334121974412e-06, "epoch": 0.46126435264616605, "percentage": 46.13, "elapsed_time": "0:11:15", "remaining_time": "0:13:09", "throughput": 2542.69, "total_tokens": 1718720} +{"current_steps": 3500, "total_steps": 7577, "loss": 0.0858, "lr": 1.3031397613949448e-06, "epoch": 0.4619242444239145, "percentage": 46.19, "elapsed_time": "0:11:16", "remaining_time": "0:13:07", "throughput": 2545.24, "total_tokens": 1721280} +{"current_steps": 3505, "total_steps": 7577, "loss": 0.1099, "lr": 1.3009437922413266e-06, "epoch": 0.46258413620166294, "percentage": 46.26, "elapsed_time": "0:11:16", "remaining_time": "0:13:06", "throughput": 2547.61, "total_tokens": 1723712} +{"current_steps": 3510, "total_steps": 7577, "loss": 0.1115, "lr": 1.2987462261661994e-06, "epoch": 0.4632440279794114, "percentage": 46.32, "elapsed_time": "0:11:16", "remaining_time": "0:13:04", "throughput": 2549.7, "total_tokens": 1725952} +{"current_steps": 3515, "total_steps": 7577, "loss": 0.0017, "lr": 1.2965470748306798e-06, "epoch": 0.46390391975715983, "percentage": 46.39, "elapsed_time": "0:11:17", "remaining_time": "0:13:02", "throughput": 2552.23, "total_tokens": 1728512} +{"current_steps": 3520, "total_steps": 7577, "loss": 0.1338, "lr": 1.2943463499042957e-06, "epoch": 0.4645638115349083, "percentage": 46.46, "elapsed_time": "0:11:17", "remaining_time": "0:13:00", "throughput": 2554.68, "total_tokens": 1731008} +{"current_steps": 3525, "total_steps": 7577, "loss": 0.0485, "lr": 1.2921440630649257e-06, "epoch": 0.4652237033126567, "percentage": 46.52, "elapsed_time": "0:11:17", "remaining_time": "0:12:59", "throughput": 2557.38, "total_tokens": 1733696} +{"current_steps": 3530, "total_steps": 7577, "loss": 0.1013, "lr": 1.2899402259987355e-06, "epoch": 0.46588359509040517, "percentage": 46.59, "elapsed_time": "0:11:18", "remaining_time": "0:12:57", "throughput": 2559.91, "total_tokens": 1736256} +{"current_steps": 3535, "total_steps": 7577, "loss": 0.2473, "lr": 1.287734850400118e-06, "epoch": 0.4665434868681536, "percentage": 46.65, "elapsed_time": "0:11:18", "remaining_time": "0:12:55", "throughput": 2562.6, "total_tokens": 1738944} +{"current_steps": 3540, "total_steps": 7577, "loss": 0.3237, "lr": 1.2855279479716297e-06, "epoch": 0.46720337864590206, "percentage": 46.72, "elapsed_time": "0:11:18", "remaining_time": "0:12:54", "throughput": 2565.21, "total_tokens": 1741568} +{"current_steps": 3545, "total_steps": 7577, "loss": 0.0027, "lr": 1.283319530423929e-06, "epoch": 0.4678632704236505, "percentage": 46.79, "elapsed_time": "0:11:19", "remaining_time": "0:12:52", "throughput": 2567.28, "total_tokens": 1743808} +{"current_steps": 3550, "total_steps": 7577, "loss": 0.0016, "lr": 1.2811096094757144e-06, "epoch": 0.46852316220139895, "percentage": 46.85, "elapsed_time": "0:11:19", "remaining_time": "0:12:50", "throughput": 2569.54, "total_tokens": 1746176} +{"current_steps": 3555, "total_steps": 7577, "loss": 0.2019, "lr": 1.2788981968536612e-06, "epoch": 0.46918305397914745, "percentage": 46.92, "elapsed_time": "0:11:19", "remaining_time": "0:12:49", "throughput": 2571.86, "total_tokens": 1748608} +{"current_steps": 3560, "total_steps": 7577, "loss": 0.1542, "lr": 1.2766853042923607e-06, "epoch": 0.4698429457568959, "percentage": 46.98, "elapsed_time": "0:11:20", "remaining_time": "0:12:47", "throughput": 2574.2, "total_tokens": 1751040} +{"current_steps": 3565, "total_steps": 7577, "loss": 0.0623, "lr": 1.2744709435342573e-06, "epoch": 0.47050283753464434, "percentage": 47.05, "elapsed_time": "0:11:20", "remaining_time": "0:12:45", "throughput": 2576.24, "total_tokens": 1753280} +{"current_steps": 3570, "total_steps": 7577, "loss": 0.2919, "lr": 1.2722551263295864e-06, "epoch": 0.4711627293123928, "percentage": 47.12, "elapsed_time": "0:11:20", "remaining_time": "0:12:44", "throughput": 2578.58, "total_tokens": 1755712} +{"current_steps": 3575, "total_steps": 7577, "loss": 0.1294, "lr": 1.2700378644363114e-06, "epoch": 0.4718226210901412, "percentage": 47.18, "elapsed_time": "0:11:21", "remaining_time": "0:12:42", "throughput": 2580.62, "total_tokens": 1757952} +{"current_steps": 3580, "total_steps": 7577, "loss": 0.0883, "lr": 1.2678191696200621e-06, "epoch": 0.47248251286788967, "percentage": 47.25, "elapsed_time": "0:11:21", "remaining_time": "0:12:40", "throughput": 2582.94, "total_tokens": 1760384} +{"current_steps": 3585, "total_steps": 7577, "loss": 0.0025, "lr": 1.2655990536540717e-06, "epoch": 0.4731424046456381, "percentage": 47.31, "elapsed_time": "0:11:21", "remaining_time": "0:12:39", "throughput": 2585.42, "total_tokens": 1762944} +{"current_steps": 3590, "total_steps": 7577, "loss": 0.2308, "lr": 1.2633775283191144e-06, "epoch": 0.47380229642338656, "percentage": 47.38, "elapsed_time": "0:11:22", "remaining_time": "0:12:37", "throughput": 2587.93, "total_tokens": 1765504} +{"current_steps": 3595, "total_steps": 7577, "loss": 0.0084, "lr": 1.2611546054034436e-06, "epoch": 0.474462188201135, "percentage": 47.45, "elapsed_time": "0:11:22", "remaining_time": "0:12:36", "throughput": 2590.52, "total_tokens": 1768128} +{"current_steps": 3600, "total_steps": 7577, "loss": 0.1521, "lr": 1.2589302967027285e-06, "epoch": 0.47512207997888345, "percentage": 47.51, "elapsed_time": "0:11:22", "remaining_time": "0:12:34", "throughput": 2592.92, "total_tokens": 1770624} +{"current_steps": 3605, "total_steps": 7577, "loss": 0.3261, "lr": 1.2567046140199914e-06, "epoch": 0.4757819717566319, "percentage": 47.58, "elapsed_time": "0:11:23", "remaining_time": "0:12:32", "throughput": 2595.51, "total_tokens": 1773248} +{"current_steps": 3610, "total_steps": 7577, "loss": 0.1219, "lr": 1.2544775691655463e-06, "epoch": 0.47644186353438034, "percentage": 47.64, "elapsed_time": "0:11:23", "remaining_time": "0:12:31", "throughput": 2597.56, "total_tokens": 1775488} +{"current_steps": 3615, "total_steps": 7577, "loss": 0.138, "lr": 1.2522491739569346e-06, "epoch": 0.4771017553121288, "percentage": 47.71, "elapsed_time": "0:11:23", "remaining_time": "0:12:29", "throughput": 2599.68, "total_tokens": 1777792} +{"current_steps": 3620, "total_steps": 7577, "loss": 0.1041, "lr": 1.250019440218864e-06, "epoch": 0.4777616470898773, "percentage": 47.78, "elapsed_time": "0:11:24", "remaining_time": "0:12:27", "throughput": 2602.15, "total_tokens": 1780352} +{"current_steps": 3625, "total_steps": 7577, "loss": 0.1707, "lr": 1.247788379783144e-06, "epoch": 0.47842153886762573, "percentage": 47.84, "elapsed_time": "0:11:24", "remaining_time": "0:12:26", "throughput": 2604.98, "total_tokens": 1783168} +{"current_steps": 3630, "total_steps": 7577, "loss": 0.0886, "lr": 1.2455560044886248e-06, "epoch": 0.4790814306453742, "percentage": 47.91, "elapsed_time": "0:11:24", "remaining_time": "0:12:24", "throughput": 2607.73, "total_tokens": 1785920} +{"current_steps": 3635, "total_steps": 7577, "loss": 0.1456, "lr": 1.2433223261811337e-06, "epoch": 0.4797413224231226, "percentage": 47.97, "elapsed_time": "0:11:25", "remaining_time": "0:12:23", "throughput": 2610.12, "total_tokens": 1788416} +{"current_steps": 3640, "total_steps": 7577, "loss": 0.0141, "lr": 1.2410873567134115e-06, "epoch": 0.48040121420087106, "percentage": 48.04, "elapsed_time": "0:11:25", "remaining_time": "0:12:21", "throughput": 2612.42, "total_tokens": 1790848} +{"current_steps": 3645, "total_steps": 7577, "loss": 0.0342, "lr": 1.238851107945051e-06, "epoch": 0.4810611059786195, "percentage": 48.11, "elapsed_time": "0:11:25", "remaining_time": "0:12:19", "throughput": 2614.7, "total_tokens": 1793280} +{"current_steps": 3650, "total_steps": 7577, "loss": 0.1088, "lr": 1.2366135917424341e-06, "epoch": 0.48172099775636795, "percentage": 48.17, "elapsed_time": "0:11:26", "remaining_time": "0:12:18", "throughput": 2616.89, "total_tokens": 1795648} +{"current_steps": 3655, "total_steps": 7577, "loss": 0.1796, "lr": 1.2343748199786665e-06, "epoch": 0.4823808895341164, "percentage": 48.24, "elapsed_time": "0:11:26", "remaining_time": "0:12:16", "throughput": 2618.99, "total_tokens": 1797952} +{"current_steps": 3660, "total_steps": 7577, "loss": 0.0595, "lr": 1.2321348045335182e-06, "epoch": 0.48304078131186484, "percentage": 48.3, "elapsed_time": "0:11:26", "remaining_time": "0:12:15", "throughput": 2621.01, "total_tokens": 1800192} +{"current_steps": 3665, "total_steps": 7577, "loss": 0.1465, "lr": 1.2298935572933575e-06, "epoch": 0.4837006730896133, "percentage": 48.37, "elapsed_time": "0:11:27", "remaining_time": "0:12:13", "throughput": 2623.2, "total_tokens": 1802560} +{"current_steps": 3670, "total_steps": 7577, "loss": 0.1584, "lr": 1.2276510901510892e-06, "epoch": 0.48436056486736173, "percentage": 48.44, "elapsed_time": "0:11:27", "remaining_time": "0:12:11", "throughput": 2625.57, "total_tokens": 1805056} +{"current_steps": 3675, "total_steps": 7577, "loss": 0.1682, "lr": 1.2254074150060915e-06, "epoch": 0.4850204566451102, "percentage": 48.5, "elapsed_time": "0:11:27", "remaining_time": "0:12:10", "throughput": 2628.21, "total_tokens": 1807744} +{"current_steps": 3680, "total_steps": 7577, "loss": 0.1522, "lr": 1.2231625437641535e-06, "epoch": 0.4856803484228587, "percentage": 48.57, "elapsed_time": "0:11:28", "remaining_time": "0:12:08", "throughput": 2630.75, "total_tokens": 1810368} +{"current_steps": 3685, "total_steps": 7577, "loss": 0.045, "lr": 1.2209164883374096e-06, "epoch": 0.4863402402006071, "percentage": 48.63, "elapsed_time": "0:11:28", "remaining_time": "0:12:07", "throughput": 2633.38, "total_tokens": 1813056} +{"current_steps": 3690, "total_steps": 7577, "loss": 0.22, "lr": 1.2186692606442793e-06, "epoch": 0.48700013197835557, "percentage": 48.7, "elapsed_time": "0:11:28", "remaining_time": "0:12:05", "throughput": 2635.45, "total_tokens": 1815360} +{"current_steps": 3695, "total_steps": 7577, "loss": 0.1641, "lr": 1.216420872609402e-06, "epoch": 0.487660023756104, "percentage": 48.77, "elapsed_time": "0:11:29", "remaining_time": "0:12:04", "throughput": 2637.9, "total_tokens": 1817920} +{"current_steps": 3700, "total_steps": 7577, "loss": 0.0635, "lr": 1.2141713361635739e-06, "epoch": 0.48831991553385246, "percentage": 48.83, "elapsed_time": "0:11:29", "remaining_time": "0:12:02", "throughput": 2640.03, "total_tokens": 1820288} +{"current_steps": 3705, "total_steps": 7577, "loss": 0.1703, "lr": 1.2119206632436864e-06, "epoch": 0.4889798073116009, "percentage": 48.9, "elapsed_time": "0:11:29", "remaining_time": "0:12:00", "throughput": 2642.21, "total_tokens": 1822656} +{"current_steps": 3710, "total_steps": 7577, "loss": 0.0631, "lr": 1.209668865792661e-06, "epoch": 0.48963969908934935, "percentage": 48.96, "elapsed_time": "0:11:30", "remaining_time": "0:11:59", "throughput": 2644.12, "total_tokens": 1824832} +{"current_steps": 3715, "total_steps": 7577, "loss": 0.0998, "lr": 1.207415955759385e-06, "epoch": 0.4902995908670978, "percentage": 49.03, "elapsed_time": "0:11:30", "remaining_time": "0:11:57", "throughput": 2646.29, "total_tokens": 1827200} +{"current_steps": 3720, "total_steps": 7577, "loss": 0.1581, "lr": 1.2051619450986514e-06, "epoch": 0.49095948264484623, "percentage": 49.1, "elapsed_time": "0:11:30", "remaining_time": "0:11:56", "throughput": 2648.56, "total_tokens": 1829632} +{"current_steps": 3725, "total_steps": 7577, "loss": 0.1271, "lr": 1.2029068457710923e-06, "epoch": 0.4916193744225947, "percentage": 49.16, "elapsed_time": "0:11:31", "remaining_time": "0:11:54", "throughput": 2651.0, "total_tokens": 1832192} +{"current_steps": 3730, "total_steps": 7577, "loss": 0.091, "lr": 1.200650669743117e-06, "epoch": 0.4922792662003431, "percentage": 49.23, "elapsed_time": "0:11:31", "remaining_time": "0:11:53", "throughput": 2653.43, "total_tokens": 1834752} +{"current_steps": 3735, "total_steps": 7577, "loss": 0.116, "lr": 1.1983934289868488e-06, "epoch": 0.49293915797809157, "percentage": 49.29, "elapsed_time": "0:11:31", "remaining_time": "0:11:51", "throughput": 2655.78, "total_tokens": 1837248} +{"current_steps": 3740, "total_steps": 7577, "loss": 0.1431, "lr": 1.1961351354800595e-06, "epoch": 0.49359904975584007, "percentage": 49.36, "elapsed_time": "0:11:32", "remaining_time": "0:11:50", "throughput": 2658.03, "total_tokens": 1839680} +{"current_steps": 3745, "total_steps": 7577, "loss": 0.1399, "lr": 1.193875801206109e-06, "epoch": 0.4942589415335885, "percentage": 49.43, "elapsed_time": "0:11:32", "remaining_time": "0:11:48", "throughput": 2660.55, "total_tokens": 1842304} +{"current_steps": 3750, "total_steps": 7577, "loss": 0.0471, "lr": 1.1916154381538786e-06, "epoch": 0.49491883331133696, "percentage": 49.49, "elapsed_time": "0:11:32", "remaining_time": "0:11:47", "throughput": 2662.43, "total_tokens": 1844480} +{"current_steps": 3755, "total_steps": 7577, "loss": 0.1858, "lr": 1.1893540583177083e-06, "epoch": 0.4955787250890854, "percentage": 49.56, "elapsed_time": "0:11:33", "remaining_time": "0:11:45", "throughput": 2664.65, "total_tokens": 1846912} +{"current_steps": 3760, "total_steps": 7577, "loss": 0.0801, "lr": 1.187091673697335e-06, "epoch": 0.49623861686683385, "percentage": 49.62, "elapsed_time": "0:11:33", "remaining_time": "0:11:43", "throughput": 2666.46, "total_tokens": 1849024} +{"current_steps": 3765, "total_steps": 7577, "loss": 0.0691, "lr": 1.184828296297826e-06, "epoch": 0.4968985086445823, "percentage": 49.69, "elapsed_time": "0:11:33", "remaining_time": "0:11:42", "throughput": 2669.05, "total_tokens": 1851712} +{"current_steps": 3770, "total_steps": 7577, "loss": 0.0697, "lr": 1.182563938129518e-06, "epoch": 0.49755840042233074, "percentage": 49.76, "elapsed_time": "0:11:34", "remaining_time": "0:11:40", "throughput": 2671.38, "total_tokens": 1854208} +{"current_steps": 3775, "total_steps": 7577, "loss": 0.0893, "lr": 1.1802986112079507e-06, "epoch": 0.4982182922000792, "percentage": 49.82, "elapsed_time": "0:11:34", "remaining_time": "0:11:39", "throughput": 2673.71, "total_tokens": 1856704} +{"current_steps": 3780, "total_steps": 7577, "loss": 0.0831, "lr": 1.1780323275538056e-06, "epoch": 0.4988781839778276, "percentage": 49.89, "elapsed_time": "0:11:34", "remaining_time": "0:11:37", "throughput": 2675.68, "total_tokens": 1858944} +{"current_steps": 3785, "total_steps": 7577, "loss": 0.2059, "lr": 1.1757650991928393e-06, "epoch": 0.49953807575557607, "percentage": 49.95, "elapsed_time": "0:11:35", "remaining_time": "0:11:36", "throughput": 2678.33, "total_tokens": 1861696} +{"current_steps": 3790, "total_steps": 7577, "loss": 0.179, "lr": 1.1734969381558235e-06, "epoch": 0.5001979675333246, "percentage": 50.02, "elapsed_time": "0:11:35", "remaining_time": "0:11:34", "throughput": 2680.52, "total_tokens": 1864128} +{"current_steps": 3790, "total_steps": 7577, "eval_loss": 0.12760794162750244, "epoch": 0.5001979675333246, "percentage": 50.02, "elapsed_time": "0:11:43", "remaining_time": "0:11:42", "throughput": 2650.24, "total_tokens": 1864128} +{"current_steps": 3795, "total_steps": 7577, "loss": 0.002, "lr": 1.1712278564784774e-06, "epoch": 0.500857859311073, "percentage": 50.09, "elapsed_time": "0:12:25", "remaining_time": "0:12:23", "throughput": 2502.47, "total_tokens": 1866432} +{"current_steps": 3800, "total_steps": 7577, "loss": 0.0598, "lr": 1.1689578662014064e-06, "epoch": 0.5015177510888215, "percentage": 50.15, "elapsed_time": "0:12:26", "remaining_time": "0:12:21", "throughput": 2504.45, "total_tokens": 1868736} +{"current_steps": 3805, "total_steps": 7577, "loss": 0.3077, "lr": 1.1666869793700362e-06, "epoch": 0.5021776428665699, "percentage": 50.22, "elapsed_time": "0:12:26", "remaining_time": "0:12:20", "throughput": 2506.86, "total_tokens": 1871360} +{"current_steps": 3810, "total_steps": 7577, "loss": 0.0016, "lr": 1.1644152080345515e-06, "epoch": 0.5028375346443184, "percentage": 50.28, "elapsed_time": "0:12:26", "remaining_time": "0:12:18", "throughput": 2508.69, "total_tokens": 1873536} +{"current_steps": 3815, "total_steps": 7577, "loss": 0.2264, "lr": 1.1621425642498289e-06, "epoch": 0.5034974264220667, "percentage": 50.35, "elapsed_time": "0:12:27", "remaining_time": "0:12:16", "throughput": 2510.77, "total_tokens": 1875904} +{"current_steps": 3820, "total_steps": 7577, "loss": 0.2478, "lr": 1.1598690600753759e-06, "epoch": 0.5041573181998152, "percentage": 50.42, "elapsed_time": "0:12:27", "remaining_time": "0:12:15", "throughput": 2513.09, "total_tokens": 1878464} +{"current_steps": 3825, "total_steps": 7577, "loss": 0.2181, "lr": 1.1575947075752644e-06, "epoch": 0.5048172099775636, "percentage": 50.48, "elapsed_time": "0:12:27", "remaining_time": "0:12:13", "throughput": 2514.93, "total_tokens": 1880640} +{"current_steps": 3830, "total_steps": 7577, "loss": 0.1516, "lr": 1.1553195188180691e-06, "epoch": 0.5054771017553121, "percentage": 50.55, "elapsed_time": "0:12:28", "remaining_time": "0:12:11", "throughput": 2516.92, "total_tokens": 1882944} +{"current_steps": 3835, "total_steps": 7577, "loss": 0.0694, "lr": 1.1530435058768008e-06, "epoch": 0.5061369935330606, "percentage": 50.61, "elapsed_time": "0:12:28", "remaining_time": "0:12:10", "throughput": 2518.92, "total_tokens": 1885248} +{"current_steps": 3840, "total_steps": 7577, "loss": 0.0841, "lr": 1.150766680828845e-06, "epoch": 0.506796885310809, "percentage": 50.68, "elapsed_time": "0:12:28", "remaining_time": "0:12:08", "throughput": 2521.32, "total_tokens": 1887872} +{"current_steps": 3845, "total_steps": 7577, "loss": 0.0024, "lr": 1.1484890557558955e-06, "epoch": 0.5074567770885575, "percentage": 50.75, "elapsed_time": "0:12:29", "remaining_time": "0:12:07", "throughput": 2523.8, "total_tokens": 1890560} +{"current_steps": 3850, "total_steps": 7577, "loss": 0.076, "lr": 1.146210642743892e-06, "epoch": 0.5081166688663059, "percentage": 50.81, "elapsed_time": "0:12:29", "remaining_time": "0:12:05", "throughput": 2526.02, "total_tokens": 1893056} +{"current_steps": 3855, "total_steps": 7577, "loss": 0.0353, "lr": 1.1439314538829554e-06, "epoch": 0.5087765606440544, "percentage": 50.88, "elapsed_time": "0:12:29", "remaining_time": "0:12:03", "throughput": 2528.01, "total_tokens": 1895360} +{"current_steps": 3860, "total_steps": 7577, "loss": 0.0793, "lr": 1.141651501267323e-06, "epoch": 0.5094364524218028, "percentage": 50.94, "elapsed_time": "0:12:30", "remaining_time": "0:12:02", "throughput": 2529.98, "total_tokens": 1897664} +{"current_steps": 3865, "total_steps": 7577, "loss": 0.1073, "lr": 1.1393707969952847e-06, "epoch": 0.5100963441995513, "percentage": 51.01, "elapsed_time": "0:12:30", "remaining_time": "0:12:00", "throughput": 2532.37, "total_tokens": 1900288} +{"current_steps": 3870, "total_steps": 7577, "loss": 0.0796, "lr": 1.13708935316912e-06, "epoch": 0.5107562359772997, "percentage": 51.08, "elapsed_time": "0:12:30", "remaining_time": "0:11:59", "throughput": 2534.91, "total_tokens": 1903040} +{"current_steps": 3875, "total_steps": 7577, "loss": 0.0173, "lr": 1.134807181895032e-06, "epoch": 0.5114161277550482, "percentage": 51.14, "elapsed_time": "0:12:31", "remaining_time": "0:11:57", "throughput": 2537.05, "total_tokens": 1905472} +{"current_steps": 3880, "total_steps": 7577, "loss": 0.0637, "lr": 1.132524295283084e-06, "epoch": 0.5120760195327966, "percentage": 51.21, "elapsed_time": "0:12:31", "remaining_time": "0:11:55", "throughput": 2538.94, "total_tokens": 1907712} +{"current_steps": 3885, "total_steps": 7577, "loss": 0.0912, "lr": 1.1302407054471355e-06, "epoch": 0.5127359113105451, "percentage": 51.27, "elapsed_time": "0:12:31", "remaining_time": "0:11:54", "throughput": 2541.0, "total_tokens": 1910080} +{"current_steps": 3890, "total_steps": 7577, "loss": 0.2374, "lr": 1.1279564245047767e-06, "epoch": 0.5133958030882935, "percentage": 51.34, "elapsed_time": "0:12:32", "remaining_time": "0:11:52", "throughput": 2543.13, "total_tokens": 1912512} +{"current_steps": 3895, "total_steps": 7577, "loss": 0.1336, "lr": 1.1256714645772662e-06, "epoch": 0.514055694866042, "percentage": 51.41, "elapsed_time": "0:12:32", "remaining_time": "0:11:51", "throughput": 2545.02, "total_tokens": 1914752} +{"current_steps": 3900, "total_steps": 7577, "loss": 0.0021, "lr": 1.1233858377894647e-06, "epoch": 0.5147155866437905, "percentage": 51.47, "elapsed_time": "0:12:32", "remaining_time": "0:11:49", "throughput": 2547.06, "total_tokens": 1917120} +{"current_steps": 3905, "total_steps": 7577, "loss": 0.014, "lr": 1.1210995562697722e-06, "epoch": 0.5153754784215389, "percentage": 51.54, "elapsed_time": "0:12:32", "remaining_time": "0:11:48", "throughput": 2548.79, "total_tokens": 1919232} +{"current_steps": 3910, "total_steps": 7577, "loss": 0.0559, "lr": 1.1188126321500621e-06, "epoch": 0.5160353701992874, "percentage": 51.6, "elapsed_time": "0:12:33", "remaining_time": "0:11:46", "throughput": 2551.15, "total_tokens": 1921856} +{"current_steps": 3915, "total_steps": 7577, "loss": 0.1515, "lr": 1.1165250775656188e-06, "epoch": 0.5166952619770357, "percentage": 51.67, "elapsed_time": "0:12:33", "remaining_time": "0:11:44", "throughput": 2553.18, "total_tokens": 1924224} +{"current_steps": 3920, "total_steps": 7577, "loss": 0.0373, "lr": 1.1142369046550708e-06, "epoch": 0.5173551537547842, "percentage": 51.74, "elapsed_time": "0:12:33", "remaining_time": "0:11:43", "throughput": 2555.06, "total_tokens": 1926464} +{"current_steps": 3925, "total_steps": 7577, "loss": 0.1665, "lr": 1.1119481255603289e-06, "epoch": 0.5180150455325326, "percentage": 51.8, "elapsed_time": "0:12:34", "remaining_time": "0:11:41", "throughput": 2557.19, "total_tokens": 1928896} +{"current_steps": 3930, "total_steps": 7577, "loss": 0.115, "lr": 1.1096587524265197e-06, "epoch": 0.5186749373102811, "percentage": 51.87, "elapsed_time": "0:12:34", "remaining_time": "0:11:40", "throughput": 2559.15, "total_tokens": 1931200} +{"current_steps": 3935, "total_steps": 7577, "loss": 0.0542, "lr": 1.107368797401923e-06, "epoch": 0.5193348290880295, "percentage": 51.93, "elapsed_time": "0:12:34", "remaining_time": "0:11:38", "throughput": 2561.28, "total_tokens": 1933632} +{"current_steps": 3940, "total_steps": 7577, "loss": 0.0019, "lr": 1.1050782726379054e-06, "epoch": 0.519994720865778, "percentage": 52.0, "elapsed_time": "0:12:35", "remaining_time": "0:11:37", "throughput": 2563.13, "total_tokens": 1935872} +{"current_steps": 3945, "total_steps": 7577, "loss": 0.0951, "lr": 1.1027871902888566e-06, "epoch": 0.5206546126435264, "percentage": 52.07, "elapsed_time": "0:12:35", "remaining_time": "0:11:35", "throughput": 2564.9, "total_tokens": 1938048} +{"current_steps": 3950, "total_steps": 7577, "loss": 0.056, "lr": 1.1004955625121257e-06, "epoch": 0.5213145044212749, "percentage": 52.13, "elapsed_time": "0:12:35", "remaining_time": "0:11:34", "throughput": 2567.17, "total_tokens": 1940608} +{"current_steps": 3955, "total_steps": 7577, "loss": 0.2829, "lr": 1.0982034014679561e-06, "epoch": 0.5219743961990233, "percentage": 52.2, "elapsed_time": "0:12:36", "remaining_time": "0:11:32", "throughput": 2569.24, "total_tokens": 1943040} +{"current_steps": 3960, "total_steps": 7577, "loss": 0.2808, "lr": 1.0959107193194206e-06, "epoch": 0.5226342879767718, "percentage": 52.26, "elapsed_time": "0:12:36", "remaining_time": "0:11:31", "throughput": 2571.59, "total_tokens": 1945664} +{"current_steps": 3965, "total_steps": 7577, "loss": 0.0046, "lr": 1.0936175282323575e-06, "epoch": 0.5232941797545203, "percentage": 52.33, "elapsed_time": "0:12:36", "remaining_time": "0:11:29", "throughput": 2573.63, "total_tokens": 1948032} +{"current_steps": 3970, "total_steps": 7577, "loss": 0.001, "lr": 1.091323840375305e-06, "epoch": 0.5239540715322687, "percentage": 52.4, "elapsed_time": "0:12:37", "remaining_time": "0:11:28", "throughput": 2575.41, "total_tokens": 1950208} +{"current_steps": 3975, "total_steps": 7577, "loss": 0.2119, "lr": 1.0890296679194378e-06, "epoch": 0.5246139633100172, "percentage": 52.46, "elapsed_time": "0:12:37", "remaining_time": "0:11:26", "throughput": 2577.84, "total_tokens": 1952896} +{"current_steps": 3980, "total_steps": 7577, "loss": 0.068, "lr": 1.086735023038502e-06, "epoch": 0.5252738550877656, "percentage": 52.53, "elapsed_time": "0:12:37", "remaining_time": "0:11:24", "throughput": 2579.77, "total_tokens": 1955200} +{"current_steps": 3985, "total_steps": 7577, "loss": 0.0953, "lr": 1.0844399179087512e-06, "epoch": 0.5259337468655141, "percentage": 52.59, "elapsed_time": "0:12:38", "remaining_time": "0:11:23", "throughput": 2581.55, "total_tokens": 1957376} +{"current_steps": 3990, "total_steps": 7577, "loss": 0.2058, "lr": 1.0821443647088802e-06, "epoch": 0.5265936386432625, "percentage": 52.66, "elapsed_time": "0:12:38", "remaining_time": "0:11:21", "throughput": 2583.96, "total_tokens": 1960064} +{"current_steps": 3995, "total_steps": 7577, "loss": 0.0652, "lr": 1.0798483756199623e-06, "epoch": 0.527253530421011, "percentage": 52.73, "elapsed_time": "0:12:38", "remaining_time": "0:11:20", "throughput": 2586.2, "total_tokens": 1962624} +{"current_steps": 4000, "total_steps": 7577, "loss": 0.0704, "lr": 1.0775519628253833e-06, "epoch": 0.5279134221987594, "percentage": 52.79, "elapsed_time": "0:12:39", "remaining_time": "0:11:18", "throughput": 2588.29, "total_tokens": 1965056} +{"current_steps": 4005, "total_steps": 7577, "loss": 0.1949, "lr": 1.0752551385107772e-06, "epoch": 0.5285733139765079, "percentage": 52.86, "elapsed_time": "0:12:39", "remaining_time": "0:11:17", "throughput": 2590.29, "total_tokens": 1967424} +{"current_steps": 4010, "total_steps": 7577, "loss": 0.1433, "lr": 1.0729579148639621e-06, "epoch": 0.5292332057542563, "percentage": 52.92, "elapsed_time": "0:12:39", "remaining_time": "0:11:15", "throughput": 2592.38, "total_tokens": 1969856} +{"current_steps": 4015, "total_steps": 7577, "loss": 0.0517, "lr": 1.0706603040748747e-06, "epoch": 0.5298930975320048, "percentage": 52.99, "elapsed_time": "0:12:40", "remaining_time": "0:11:14", "throughput": 2594.77, "total_tokens": 1972544} +{"current_steps": 4020, "total_steps": 7577, "loss": 0.0448, "lr": 1.0683623183355071e-06, "epoch": 0.5305529893097533, "percentage": 53.06, "elapsed_time": "0:12:40", "remaining_time": "0:11:12", "throughput": 2596.74, "total_tokens": 1974912} +{"current_steps": 4025, "total_steps": 7577, "loss": 0.1542, "lr": 1.0660639698398392e-06, "epoch": 0.5312128810875016, "percentage": 53.12, "elapsed_time": "0:12:40", "remaining_time": "0:11:11", "throughput": 2598.65, "total_tokens": 1977216} +{"current_steps": 4030, "total_steps": 7577, "loss": 0.1436, "lr": 1.0637652707837773e-06, "epoch": 0.5318727728652501, "percentage": 53.19, "elapsed_time": "0:12:41", "remaining_time": "0:11:09", "throughput": 2600.73, "total_tokens": 1979648} +{"current_steps": 4035, "total_steps": 7577, "loss": 0.1039, "lr": 1.0614662333650876e-06, "epoch": 0.5325326646429985, "percentage": 53.25, "elapsed_time": "0:12:41", "remaining_time": "0:11:08", "throughput": 2602.57, "total_tokens": 1981888} +{"current_steps": 4040, "total_steps": 7577, "loss": 0.2167, "lr": 1.0591668697833311e-06, "epoch": 0.533192556420747, "percentage": 53.32, "elapsed_time": "0:12:41", "remaining_time": "0:11:06", "throughput": 2604.81, "total_tokens": 1984448} +{"current_steps": 4045, "total_steps": 7577, "loss": 0.1567, "lr": 1.0568671922398005e-06, "epoch": 0.5338524481984954, "percentage": 53.39, "elapsed_time": "0:12:42", "remaining_time": "0:11:05", "throughput": 2607.11, "total_tokens": 1987072} +{"current_steps": 4050, "total_steps": 7577, "loss": 0.1618, "lr": 1.054567212937454e-06, "epoch": 0.5345123399762439, "percentage": 53.45, "elapsed_time": "0:12:42", "remaining_time": "0:11:04", "throughput": 2609.33, "total_tokens": 1989632} +{"current_steps": 4055, "total_steps": 7577, "loss": 0.0367, "lr": 1.0522669440808508e-06, "epoch": 0.5351722317539923, "percentage": 53.52, "elapsed_time": "0:12:42", "remaining_time": "0:11:02", "throughput": 2611.56, "total_tokens": 1992192} +{"current_steps": 4060, "total_steps": 7577, "loss": 0.2607, "lr": 1.0499663978760871e-06, "epoch": 0.5358321235317408, "percentage": 53.58, "elapsed_time": "0:12:43", "remaining_time": "0:11:01", "throughput": 2613.63, "total_tokens": 1994624} +{"current_steps": 4065, "total_steps": 7577, "loss": 0.0821, "lr": 1.0476655865307308e-06, "epoch": 0.5364920153094892, "percentage": 53.65, "elapsed_time": "0:12:43", "remaining_time": "0:10:59", "throughput": 2615.65, "total_tokens": 1997056} +{"current_steps": 4070, "total_steps": 7577, "loss": 0.0918, "lr": 1.0453645222537556e-06, "epoch": 0.5371519070872377, "percentage": 53.72, "elapsed_time": "0:12:43", "remaining_time": "0:10:58", "throughput": 2617.56, "total_tokens": 1999360} +{"current_steps": 4075, "total_steps": 7577, "loss": 0.0861, "lr": 1.0430632172554796e-06, "epoch": 0.5378117988649861, "percentage": 53.78, "elapsed_time": "0:12:44", "remaining_time": "0:10:56", "throughput": 2619.7, "total_tokens": 2001856} +{"current_steps": 4080, "total_steps": 7577, "loss": 0.1321, "lr": 1.0407616837474963e-06, "epoch": 0.5384716906427346, "percentage": 53.85, "elapsed_time": "0:12:44", "remaining_time": "0:10:55", "throughput": 2621.76, "total_tokens": 2004288} +{"current_steps": 4085, "total_steps": 7577, "loss": 0.0784, "lr": 1.038459933942612e-06, "epoch": 0.5391315824204831, "percentage": 53.91, "elapsed_time": "0:12:44", "remaining_time": "0:10:53", "throughput": 2624.14, "total_tokens": 2006976} +{"current_steps": 4090, "total_steps": 7577, "loss": 0.0603, "lr": 1.036157980054782e-06, "epoch": 0.5397914741982315, "percentage": 53.98, "elapsed_time": "0:12:45", "remaining_time": "0:10:52", "throughput": 2626.01, "total_tokens": 2009280} +{"current_steps": 4095, "total_steps": 7577, "loss": 0.0969, "lr": 1.0338558342990431e-06, "epoch": 0.54045136597598, "percentage": 54.05, "elapsed_time": "0:12:45", "remaining_time": "0:10:50", "throughput": 2628.15, "total_tokens": 2011776} +{"current_steps": 4100, "total_steps": 7577, "loss": 0.2581, "lr": 1.0315535088914508e-06, "epoch": 0.5411112577537284, "percentage": 54.11, "elapsed_time": "0:12:45", "remaining_time": "0:10:49", "throughput": 2630.35, "total_tokens": 2014336} +{"current_steps": 4105, "total_steps": 7577, "loss": 0.1642, "lr": 1.0292510160490146e-06, "epoch": 0.5417711495314769, "percentage": 54.18, "elapsed_time": "0:12:46", "remaining_time": "0:10:47", "throughput": 2632.88, "total_tokens": 2017152} +{"current_steps": 4110, "total_steps": 7577, "loss": 0.0998, "lr": 1.0269483679896308e-06, "epoch": 0.5424310413092253, "percentage": 54.24, "elapsed_time": "0:12:46", "remaining_time": "0:10:46", "throughput": 2634.84, "total_tokens": 2019520} +{"current_steps": 4115, "total_steps": 7577, "loss": 0.162, "lr": 1.0246455769320211e-06, "epoch": 0.5430909330869738, "percentage": 54.31, "elapsed_time": "0:12:46", "remaining_time": "0:10:45", "throughput": 2636.47, "total_tokens": 2021632} +{"current_steps": 4120, "total_steps": 7577, "loss": 0.1261, "lr": 1.0223426550956647e-06, "epoch": 0.5437508248647221, "percentage": 54.38, "elapsed_time": "0:12:47", "remaining_time": "0:10:43", "throughput": 2638.1, "total_tokens": 2023744} +{"current_steps": 4125, "total_steps": 7577, "loss": 0.0762, "lr": 1.0200396147007354e-06, "epoch": 0.5444107166424706, "percentage": 54.44, "elapsed_time": "0:12:47", "remaining_time": "0:10:42", "throughput": 2639.99, "total_tokens": 2026048} +{"current_steps": 4130, "total_steps": 7577, "loss": 0.132, "lr": 1.0177364679680367e-06, "epoch": 0.545070608420219, "percentage": 54.51, "elapsed_time": "0:12:47", "remaining_time": "0:10:40", "throughput": 2641.87, "total_tokens": 2028352} +{"current_steps": 4135, "total_steps": 7577, "loss": 0.0602, "lr": 1.015433227118935e-06, "epoch": 0.5457305001979675, "percentage": 54.57, "elapsed_time": "0:12:48", "remaining_time": "0:10:39", "throughput": 2643.98, "total_tokens": 2030848} +{"current_steps": 4140, "total_steps": 7577, "loss": 0.1337, "lr": 1.0131299043752967e-06, "epoch": 0.5463903919757159, "percentage": 54.64, "elapsed_time": "0:12:48", "remaining_time": "0:10:37", "throughput": 2646.09, "total_tokens": 2033344} +{"current_steps": 4145, "total_steps": 7577, "loss": 0.0548, "lr": 1.0108265119594233e-06, "epoch": 0.5470502837534644, "percentage": 54.71, "elapsed_time": "0:12:48", "remaining_time": "0:10:36", "throughput": 2647.9, "total_tokens": 2035584} +{"current_steps": 4150, "total_steps": 7577, "loss": 0.0713, "lr": 1.0085230620939853e-06, "epoch": 0.5477101755312129, "percentage": 54.77, "elapsed_time": "0:12:49", "remaining_time": "0:10:35", "throughput": 2650.24, "total_tokens": 2038272} +{"current_steps": 4155, "total_steps": 7577, "loss": 0.0909, "lr": 1.0062195670019583e-06, "epoch": 0.5483700673089613, "percentage": 54.84, "elapsed_time": "0:12:49", "remaining_time": "0:10:33", "throughput": 2652.33, "total_tokens": 2040768} +{"current_steps": 4160, "total_steps": 7577, "loss": 0.1428, "lr": 1.0039160389065582e-06, "epoch": 0.5490299590867098, "percentage": 54.9, "elapsed_time": "0:12:49", "remaining_time": "0:10:32", "throughput": 2654.21, "total_tokens": 2043072} +{"current_steps": 4165, "total_steps": 7577, "loss": 0.1555, "lr": 1.0016124900311755e-06, "epoch": 0.5496898508644582, "percentage": 54.97, "elapsed_time": "0:12:50", "remaining_time": "0:10:30", "throughput": 2656.64, "total_tokens": 2045824} +{"current_steps": 4169, "total_steps": 7577, "eval_loss": 0.09937019646167755, "epoch": 0.550217764286657, "percentage": 55.02, "elapsed_time": "0:12:58", "remaining_time": "0:10:36", "throughput": 2631.16, "total_tokens": 2047552} +{"current_steps": 4170, "total_steps": 7577, "loss": 0.2405, "lr": 9.99308932599311e-07, "epoch": 0.5503497426422067, "percentage": 55.03, "elapsed_time": "0:13:55", "remaining_time": "0:11:22", "throughput": 2451.77, "total_tokens": 2048064} +{"current_steps": 4175, "total_steps": 7577, "loss": 0.0424, "lr": 9.970053788345112e-07, "epoch": 0.5510096344199551, "percentage": 55.1, "elapsed_time": "0:13:55", "remaining_time": "0:11:20", "throughput": 2453.62, "total_tokens": 2050432} +{"current_steps": 4180, "total_steps": 7577, "loss": 0.0537, "lr": 9.947018409603036e-07, "epoch": 0.5516695261977036, "percentage": 55.17, "elapsed_time": "0:13:56", "remaining_time": "0:11:19", "throughput": 2455.64, "total_tokens": 2052928} +{"current_steps": 4185, "total_steps": 7577, "loss": 0.1485, "lr": 9.923983312001304e-07, "epoch": 0.552329417975452, "percentage": 55.23, "elapsed_time": "0:13:56", "remaining_time": "0:11:17", "throughput": 2457.66, "total_tokens": 2055424} +{"current_steps": 4190, "total_steps": 7577, "loss": 0.1457, "lr": 9.900948617772846e-07, "epoch": 0.5529893097532005, "percentage": 55.3, "elapsed_time": "0:13:56", "remaining_time": "0:11:16", "throughput": 2459.23, "total_tokens": 2057536} +{"current_steps": 4195, "total_steps": 7577, "loss": 0.1713, "lr": 9.877914449148462e-07, "epoch": 0.5536492015309489, "percentage": 55.36, "elapsed_time": "0:13:56", "remaining_time": "0:11:14", "throughput": 2460.99, "total_tokens": 2059840} +{"current_steps": 4200, "total_steps": 7577, "loss": 0.2209, "lr": 9.854880928356157e-07, "epoch": 0.5543090933086974, "percentage": 55.43, "elapsed_time": "0:13:57", "remaining_time": "0:11:13", "throughput": 2463.35, "total_tokens": 2062656} +{"current_steps": 4205, "total_steps": 7577, "loss": 0.1398, "lr": 9.831848177620493e-07, "epoch": 0.5549689850864459, "percentage": 55.5, "elapsed_time": "0:13:57", "remaining_time": "0:11:11", "throughput": 2465.11, "total_tokens": 2064960} +{"current_steps": 4210, "total_steps": 7577, "loss": 0.2412, "lr": 9.808816319161961e-07, "epoch": 0.5556288768641943, "percentage": 55.56, "elapsed_time": "0:13:58", "remaining_time": "0:11:10", "throughput": 2466.58, "total_tokens": 2067008} +{"current_steps": 4215, "total_steps": 7577, "loss": 0.0009, "lr": 9.785785475196298e-07, "epoch": 0.5562887686419428, "percentage": 55.63, "elapsed_time": "0:13:58", "remaining_time": "0:11:08", "throughput": 2468.79, "total_tokens": 2069696} +{"current_steps": 4220, "total_steps": 7577, "loss": 0.0507, "lr": 9.76275576793387e-07, "epoch": 0.5569486604196912, "percentage": 55.69, "elapsed_time": "0:13:58", "remaining_time": "0:11:07", "throughput": 2470.92, "total_tokens": 2072320} +{"current_steps": 4225, "total_steps": 7577, "loss": 0.0016, "lr": 9.739727319579007e-07, "epoch": 0.5576085521974397, "percentage": 55.76, "elapsed_time": "0:13:59", "remaining_time": "0:11:05", "throughput": 2472.83, "total_tokens": 2074752} +{"current_steps": 4230, "total_steps": 7577, "loss": 0.1143, "lr": 9.716700252329361e-07, "epoch": 0.558268443975188, "percentage": 55.83, "elapsed_time": "0:13:59", "remaining_time": "0:11:04", "throughput": 2475.01, "total_tokens": 2077440} +{"current_steps": 4235, "total_steps": 7577, "loss": 0.1856, "lr": 9.693674688375254e-07, "epoch": 0.5589283357529365, "percentage": 55.89, "elapsed_time": "0:13:59", "remaining_time": "0:11:02", "throughput": 2477.07, "total_tokens": 2080000} +{"current_steps": 4240, "total_steps": 7577, "loss": 0.0667, "lr": 9.67065074989903e-07, "epoch": 0.5595882275306849, "percentage": 55.96, "elapsed_time": "0:14:00", "remaining_time": "0:11:01", "throughput": 2479.13, "total_tokens": 2082560} +{"current_steps": 4245, "total_steps": 7577, "loss": 0.0822, "lr": 9.647628559074415e-07, "epoch": 0.5602481193084334, "percentage": 56.02, "elapsed_time": "0:14:00", "remaining_time": "0:10:59", "throughput": 2480.89, "total_tokens": 2084864} +{"current_steps": 4250, "total_steps": 7577, "loss": 0.1228, "lr": 9.62460823806585e-07, "epoch": 0.5609080110861818, "percentage": 56.09, "elapsed_time": "0:14:00", "remaining_time": "0:10:58", "throughput": 2482.95, "total_tokens": 2087424} +{"current_steps": 4255, "total_steps": 7577, "loss": 0.2208, "lr": 9.601589909027857e-07, "epoch": 0.5615679028639303, "percentage": 56.16, "elapsed_time": "0:14:01", "remaining_time": "0:10:56", "throughput": 2485.08, "total_tokens": 2090048} +{"current_steps": 4260, "total_steps": 7577, "loss": 0.0689, "lr": 9.578573694104394e-07, "epoch": 0.5622277946416787, "percentage": 56.22, "elapsed_time": "0:14:01", "remaining_time": "0:10:55", "throughput": 2486.94, "total_tokens": 2092416} +{"current_steps": 4265, "total_steps": 7577, "loss": 0.0788, "lr": 9.555559715428199e-07, "epoch": 0.5628876864194272, "percentage": 56.29, "elapsed_time": "0:14:01", "remaining_time": "0:10:53", "throughput": 2488.65, "total_tokens": 2094656} +{"current_steps": 4270, "total_steps": 7577, "loss": 0.069, "lr": 9.532548095120134e-07, "epoch": 0.5635475781971757, "percentage": 56.35, "elapsed_time": "0:14:02", "remaining_time": "0:10:52", "throughput": 2490.5, "total_tokens": 2097024} +{"current_steps": 4275, "total_steps": 7577, "loss": 0.0597, "lr": 9.509538955288564e-07, "epoch": 0.5642074699749241, "percentage": 56.42, "elapsed_time": "0:14:02", "remaining_time": "0:10:50", "throughput": 2492.36, "total_tokens": 2099392} +{"current_steps": 4280, "total_steps": 7577, "loss": 0.09, "lr": 9.486532418028672e-07, "epoch": 0.5648673617526726, "percentage": 56.49, "elapsed_time": "0:14:02", "remaining_time": "0:10:49", "throughput": 2494.49, "total_tokens": 2102016} +{"current_steps": 4285, "total_steps": 7577, "loss": 0.0804, "lr": 9.463528605421844e-07, "epoch": 0.565527253530421, "percentage": 56.55, "elapsed_time": "0:14:02", "remaining_time": "0:10:47", "throughput": 2496.27, "total_tokens": 2104320} +{"current_steps": 4290, "total_steps": 7577, "loss": 0.1016, "lr": 9.440527639535004e-07, "epoch": 0.5661871453081695, "percentage": 56.62, "elapsed_time": "0:14:03", "remaining_time": "0:10:46", "throughput": 2498.62, "total_tokens": 2107136} +{"current_steps": 4295, "total_steps": 7577, "loss": 0.0533, "lr": 9.417529642419971e-07, "epoch": 0.5668470370859179, "percentage": 56.68, "elapsed_time": "0:14:03", "remaining_time": "0:10:44", "throughput": 2500.9, "total_tokens": 2109888} +{"current_steps": 4300, "total_steps": 7577, "loss": 0.1565, "lr": 9.394534736112815e-07, "epoch": 0.5675069288636664, "percentage": 56.75, "elapsed_time": "0:14:03", "remaining_time": "0:10:43", "throughput": 2502.67, "total_tokens": 2112192} +{"current_steps": 4305, "total_steps": 7577, "loss": 0.1197, "lr": 9.371543042633192e-07, "epoch": 0.5681668206414148, "percentage": 56.82, "elapsed_time": "0:14:04", "remaining_time": "0:10:41", "throughput": 2504.73, "total_tokens": 2114752} +{"current_steps": 4310, "total_steps": 7577, "loss": 0.141, "lr": 9.348554683983722e-07, "epoch": 0.5688267124191633, "percentage": 56.88, "elapsed_time": "0:14:04", "remaining_time": "0:10:40", "throughput": 2506.64, "total_tokens": 2117184} +{"current_steps": 4315, "total_steps": 7577, "loss": 0.1155, "lr": 9.325569782149323e-07, "epoch": 0.5694866041969117, "percentage": 56.95, "elapsed_time": "0:14:04", "remaining_time": "0:10:38", "throughput": 2508.48, "total_tokens": 2119552} +{"current_steps": 4320, "total_steps": 7577, "loss": 0.0744, "lr": 9.302588459096574e-07, "epoch": 0.5701464959746602, "percentage": 57.01, "elapsed_time": "0:14:05", "remaining_time": "0:10:37", "throughput": 2510.32, "total_tokens": 2121920} +{"current_steps": 4325, "total_steps": 7577, "loss": 0.2853, "lr": 9.279610836773064e-07, "epoch": 0.5708063877524086, "percentage": 57.08, "elapsed_time": "0:14:05", "remaining_time": "0:10:35", "throughput": 2511.93, "total_tokens": 2124096} +{"current_steps": 4330, "total_steps": 7577, "loss": 0.1079, "lr": 9.256637037106735e-07, "epoch": 0.571466279530157, "percentage": 57.15, "elapsed_time": "0:14:05", "remaining_time": "0:10:34", "throughput": 2513.82, "total_tokens": 2126528} +{"current_steps": 4335, "total_steps": 7577, "loss": 0.0589, "lr": 9.233667182005259e-07, "epoch": 0.5721261713079056, "percentage": 57.21, "elapsed_time": "0:14:06", "remaining_time": "0:10:32", "throughput": 2515.29, "total_tokens": 2128576} +{"current_steps": 4340, "total_steps": 7577, "loss": 0.0648, "lr": 9.210701393355361e-07, "epoch": 0.5727860630856539, "percentage": 57.28, "elapsed_time": "0:14:06", "remaining_time": "0:10:31", "throughput": 2516.81, "total_tokens": 2130688} +{"current_steps": 4345, "total_steps": 7577, "loss": 0.1324, "lr": 9.187739793022198e-07, "epoch": 0.5734459548634024, "percentage": 57.34, "elapsed_time": "0:14:06", "remaining_time": "0:10:29", "throughput": 2518.94, "total_tokens": 2133312} +{"current_steps": 4350, "total_steps": 7577, "loss": 0.0724, "lr": 9.164782502848702e-07, "epoch": 0.5741058466411508, "percentage": 57.41, "elapsed_time": "0:14:07", "remaining_time": "0:10:28", "throughput": 2520.77, "total_tokens": 2135680} +{"current_steps": 4355, "total_steps": 7577, "loss": 0.1448, "lr": 9.141829644654936e-07, "epoch": 0.5747657384188993, "percentage": 57.48, "elapsed_time": "0:14:07", "remaining_time": "0:10:27", "throughput": 2522.66, "total_tokens": 2138112} +{"current_steps": 4360, "total_steps": 7577, "loss": 0.4271, "lr": 9.118881340237432e-07, "epoch": 0.5754256301966477, "percentage": 57.54, "elapsed_time": "0:14:07", "remaining_time": "0:10:25", "throughput": 2524.35, "total_tokens": 2140352} +{"current_steps": 4365, "total_steps": 7577, "loss": 0.0894, "lr": 9.095937711368573e-07, "epoch": 0.5760855219743962, "percentage": 57.61, "elapsed_time": "0:14:08", "remaining_time": "0:10:24", "throughput": 2526.52, "total_tokens": 2143040} +{"current_steps": 4370, "total_steps": 7577, "loss": 0.0716, "lr": 9.072998879795923e-07, "epoch": 0.5767454137521446, "percentage": 57.67, "elapsed_time": "0:14:08", "remaining_time": "0:10:22", "throughput": 2528.19, "total_tokens": 2145280} +{"current_steps": 4375, "total_steps": 7577, "loss": 0.1048, "lr": 9.050064967241596e-07, "epoch": 0.5774053055298931, "percentage": 57.74, "elapsed_time": "0:14:08", "remaining_time": "0:10:21", "throughput": 2530.3, "total_tokens": 2147904} +{"current_steps": 4380, "total_steps": 7577, "loss": 0.0838, "lr": 9.027136095401598e-07, "epoch": 0.5780651973076415, "percentage": 57.81, "elapsed_time": "0:14:09", "remaining_time": "0:10:19", "throughput": 2532.26, "total_tokens": 2150400} +{"current_steps": 4385, "total_steps": 7577, "loss": 0.135, "lr": 9.004212385945187e-07, "epoch": 0.57872508908539, "percentage": 57.87, "elapsed_time": "0:14:09", "remaining_time": "0:10:18", "throughput": 2534.43, "total_tokens": 2153088} +{"current_steps": 4390, "total_steps": 7577, "loss": 0.0013, "lr": 8.981293960514233e-07, "epoch": 0.5793849808631385, "percentage": 57.94, "elapsed_time": "0:14:09", "remaining_time": "0:10:16", "throughput": 2536.6, "total_tokens": 2155776} +{"current_steps": 4395, "total_steps": 7577, "loss": 0.1661, "lr": 8.958380940722564e-07, "epoch": 0.5800448726408869, "percentage": 58.0, "elapsed_time": "0:14:10", "remaining_time": "0:10:15", "throughput": 2538.7, "total_tokens": 2158400} +{"current_steps": 4400, "total_steps": 7577, "loss": 0.0766, "lr": 8.935473448155326e-07, "epoch": 0.5807047644186354, "percentage": 58.07, "elapsed_time": "0:14:10", "remaining_time": "0:10:14", "throughput": 2540.45, "total_tokens": 2160704} +{"current_steps": 4405, "total_steps": 7577, "loss": 0.0469, "lr": 8.912571604368324e-07, "epoch": 0.5813646561963838, "percentage": 58.14, "elapsed_time": "0:14:10", "remaining_time": "0:10:12", "throughput": 2542.41, "total_tokens": 2163200} +{"current_steps": 4410, "total_steps": 7577, "loss": 0.1421, "lr": 8.889675530887404e-07, "epoch": 0.5820245479741323, "percentage": 58.2, "elapsed_time": "0:14:11", "remaining_time": "0:10:11", "throughput": 2544.01, "total_tokens": 2165376} +{"current_steps": 4415, "total_steps": 7577, "loss": 0.0994, "lr": 8.866785349207786e-07, "epoch": 0.5826844397518807, "percentage": 58.27, "elapsed_time": "0:14:11", "remaining_time": "0:10:09", "throughput": 2545.9, "total_tokens": 2167808} +{"current_steps": 4420, "total_steps": 7577, "loss": 0.1332, "lr": 8.843901180793423e-07, "epoch": 0.5833443315296292, "percentage": 58.33, "elapsed_time": "0:14:11", "remaining_time": "0:10:08", "throughput": 2547.64, "total_tokens": 2170112} +{"current_steps": 4425, "total_steps": 7577, "loss": 0.0005, "lr": 8.821023147076362e-07, "epoch": 0.5840042233073776, "percentage": 58.4, "elapsed_time": "0:14:12", "remaining_time": "0:10:06", "throughput": 2549.45, "total_tokens": 2172480} +{"current_steps": 4430, "total_steps": 7577, "loss": 0.0432, "lr": 8.798151369456098e-07, "epoch": 0.5846641150851261, "percentage": 58.47, "elapsed_time": "0:14:12", "remaining_time": "0:10:05", "throughput": 2551.54, "total_tokens": 2175104} +{"current_steps": 4435, "total_steps": 7577, "loss": 0.1126, "lr": 8.775285969298931e-07, "epoch": 0.5853240068628744, "percentage": 58.53, "elapsed_time": "0:14:12", "remaining_time": "0:10:04", "throughput": 2553.13, "total_tokens": 2177280} +{"current_steps": 4440, "total_steps": 7577, "loss": 0.0735, "lr": 8.752427067937312e-07, "epoch": 0.585983898640623, "percentage": 58.6, "elapsed_time": "0:14:13", "remaining_time": "0:10:02", "throughput": 2555.08, "total_tokens": 2179776} +{"current_steps": 4445, "total_steps": 7577, "loss": 0.0949, "lr": 8.729574786669214e-07, "epoch": 0.5866437904183713, "percentage": 58.66, "elapsed_time": "0:14:13", "remaining_time": "0:10:01", "throughput": 2557.16, "total_tokens": 2182400} +{"current_steps": 4450, "total_steps": 7577, "loss": 0.0655, "lr": 8.706729246757477e-07, "epoch": 0.5873036821961198, "percentage": 58.73, "elapsed_time": "0:14:13", "remaining_time": "0:09:59", "throughput": 2559.32, "total_tokens": 2185088} +{"current_steps": 4455, "total_steps": 7577, "loss": 0.0697, "lr": 8.683890569429173e-07, "epoch": 0.5879635739738683, "percentage": 58.8, "elapsed_time": "0:14:14", "remaining_time": "0:09:58", "throughput": 2561.48, "total_tokens": 2187776} +{"current_steps": 4460, "total_steps": 7577, "loss": 0.0006, "lr": 8.661058875874956e-07, "epoch": 0.5886234657516167, "percentage": 58.86, "elapsed_time": "0:14:14", "remaining_time": "0:09:57", "throughput": 2563.11, "total_tokens": 2190016} +{"current_steps": 4465, "total_steps": 7577, "loss": 0.0008, "lr": 8.638234287248423e-07, "epoch": 0.5892833575293652, "percentage": 58.93, "elapsed_time": "0:14:14", "remaining_time": "0:09:55", "throughput": 2564.8, "total_tokens": 2192320} +{"current_steps": 4470, "total_steps": 7577, "loss": 0.0355, "lr": 8.615416924665464e-07, "epoch": 0.5899432493071136, "percentage": 58.99, "elapsed_time": "0:14:15", "remaining_time": "0:09:54", "throughput": 2566.65, "total_tokens": 2194752} +{"current_steps": 4475, "total_steps": 7577, "loss": 0.0743, "lr": 8.592606909203629e-07, "epoch": 0.5906031410848621, "percentage": 59.06, "elapsed_time": "0:14:15", "remaining_time": "0:09:52", "throughput": 2568.35, "total_tokens": 2197056} +{"current_steps": 4480, "total_steps": 7577, "loss": 0.0489, "lr": 8.569804361901485e-07, "epoch": 0.5912630328626105, "percentage": 59.13, "elapsed_time": "0:14:15", "remaining_time": "0:09:51", "throughput": 2569.98, "total_tokens": 2199296} +{"current_steps": 4485, "total_steps": 7577, "loss": 0.41, "lr": 8.547009403757963e-07, "epoch": 0.591922924640359, "percentage": 59.19, "elapsed_time": "0:14:16", "remaining_time": "0:09:50", "throughput": 2571.72, "total_tokens": 2201664} +{"current_steps": 4490, "total_steps": 7577, "loss": 0.227, "lr": 8.524222155731731e-07, "epoch": 0.5925828164181074, "percentage": 59.26, "elapsed_time": "0:14:16", "remaining_time": "0:09:48", "throughput": 2573.77, "total_tokens": 2204288} +{"current_steps": 4495, "total_steps": 7577, "loss": 0.127, "lr": 8.501442738740538e-07, "epoch": 0.5932427081958559, "percentage": 59.32, "elapsed_time": "0:14:16", "remaining_time": "0:09:47", "throughput": 2575.37, "total_tokens": 2206528} +{"current_steps": 4500, "total_steps": 7577, "loss": 0.0695, "lr": 8.47867127366058e-07, "epoch": 0.5939025999736043, "percentage": 59.39, "elapsed_time": "0:14:17", "remaining_time": "0:09:46", "throughput": 2577.29, "total_tokens": 2209024} +{"current_steps": 4505, "total_steps": 7577, "loss": 0.0422, "lr": 8.455907881325858e-07, "epoch": 0.5945624917513528, "percentage": 59.46, "elapsed_time": "0:14:17", "remaining_time": "0:09:44", "throughput": 2579.28, "total_tokens": 2211584} +{"current_steps": 4510, "total_steps": 7577, "loss": 0.1233, "lr": 8.433152682527533e-07, "epoch": 0.5952223835291012, "percentage": 59.52, "elapsed_time": "0:14:17", "remaining_time": "0:09:43", "throughput": 2581.05, "total_tokens": 2213952} +{"current_steps": 4515, "total_steps": 7577, "loss": 0.0951, "lr": 8.410405798013298e-07, "epoch": 0.5958822753068497, "percentage": 59.59, "elapsed_time": "0:14:18", "remaining_time": "0:09:41", "throughput": 2582.66, "total_tokens": 2216192} +{"current_steps": 4520, "total_steps": 7577, "loss": 0.0126, "lr": 8.387667348486712e-07, "epoch": 0.5965421670845982, "percentage": 59.65, "elapsed_time": "0:14:18", "remaining_time": "0:09:40", "throughput": 2584.55, "total_tokens": 2218688} +{"current_steps": 4525, "total_steps": 7577, "loss": 0.0853, "lr": 8.364937454606585e-07, "epoch": 0.5972020588623466, "percentage": 59.72, "elapsed_time": "0:14:18", "remaining_time": "0:09:39", "throughput": 2586.16, "total_tokens": 2220928} +{"current_steps": 4530, "total_steps": 7577, "loss": 0.0013, "lr": 8.342216236986329e-07, "epoch": 0.5978619506400951, "percentage": 59.79, "elapsed_time": "0:14:19", "remaining_time": "0:09:37", "throughput": 2587.99, "total_tokens": 2223360} +{"current_steps": 4535, "total_steps": 7577, "loss": 0.1511, "lr": 8.319503816193305e-07, "epoch": 0.5985218424178435, "percentage": 59.85, "elapsed_time": "0:14:19", "remaining_time": "0:09:36", "throughput": 2589.83, "total_tokens": 2225792} +{"current_steps": 4540, "total_steps": 7577, "loss": 0.1163, "lr": 8.296800312748206e-07, "epoch": 0.599181734195592, "percentage": 59.92, "elapsed_time": "0:14:19", "remaining_time": "0:09:35", "throughput": 2591.72, "total_tokens": 2228288} +{"current_steps": 4545, "total_steps": 7577, "loss": 0.1894, "lr": 8.274105847124404e-07, "epoch": 0.5998416259733403, "percentage": 59.98, "elapsed_time": "0:14:20", "remaining_time": "0:09:33", "throughput": 2593.68, "total_tokens": 2230848} +{"current_steps": 4548, "total_steps": 7577, "eval_loss": 0.1099071353673935, "epoch": 0.6002375610399895, "percentage": 60.02, "elapsed_time": "0:14:28", "remaining_time": "0:09:38", "throughput": 2570.22, "total_tokens": 2232448} +{"current_steps": 4550, "total_steps": 7577, "loss": 0.233, "lr": 8.251420539747311e-07, "epoch": 0.6005015177510888, "percentage": 60.05, "elapsed_time": "0:15:05", "remaining_time": "0:10:02", "throughput": 2466.82, "total_tokens": 2233472} +{"current_steps": 4555, "total_steps": 7577, "loss": 0.2218, "lr": 8.228744510993742e-07, "epoch": 0.6011614095288372, "percentage": 60.12, "elapsed_time": "0:15:05", "remaining_time": "0:10:00", "throughput": 2468.82, "total_tokens": 2236096} +{"current_steps": 4560, "total_steps": 7577, "loss": 0.0831, "lr": 8.206077881191274e-07, "epoch": 0.6018213013065857, "percentage": 60.18, "elapsed_time": "0:15:06", "remaining_time": "0:09:59", "throughput": 2470.81, "total_tokens": 2238720} +{"current_steps": 4565, "total_steps": 7577, "loss": 0.1877, "lr": 8.183420770617614e-07, "epoch": 0.6024811930843341, "percentage": 60.25, "elapsed_time": "0:15:06", "remaining_time": "0:09:58", "throughput": 2472.66, "total_tokens": 2241216} +{"current_steps": 4570, "total_steps": 7577, "loss": 0.0651, "lr": 8.160773299499955e-07, "epoch": 0.6031410848620826, "percentage": 60.31, "elapsed_time": "0:15:06", "remaining_time": "0:09:56", "throughput": 2474.45, "total_tokens": 2243648} +{"current_steps": 4575, "total_steps": 7577, "loss": 0.0543, "lr": 8.138135588014339e-07, "epoch": 0.6038009766398311, "percentage": 60.38, "elapsed_time": "0:15:07", "remaining_time": "0:09:55", "throughput": 2476.24, "total_tokens": 2246080} +{"current_steps": 4580, "total_steps": 7577, "loss": 0.0016, "lr": 8.115507756285017e-07, "epoch": 0.6044608684175795, "percentage": 60.45, "elapsed_time": "0:15:07", "remaining_time": "0:09:53", "throughput": 2477.75, "total_tokens": 2248256} +{"current_steps": 4585, "total_steps": 7577, "loss": 0.07, "lr": 8.092889924383819e-07, "epoch": 0.605120760195328, "percentage": 60.51, "elapsed_time": "0:15:07", "remaining_time": "0:09:52", "throughput": 2479.54, "total_tokens": 2250688} +{"current_steps": 4590, "total_steps": 7577, "loss": 0.0872, "lr": 8.070282212329508e-07, "epoch": 0.6057806519730764, "percentage": 60.58, "elapsed_time": "0:15:08", "remaining_time": "0:09:50", "throughput": 2481.32, "total_tokens": 2253120} +{"current_steps": 4595, "total_steps": 7577, "loss": 0.1869, "lr": 8.047684740087156e-07, "epoch": 0.6064405437508249, "percentage": 60.64, "elapsed_time": "0:15:08", "remaining_time": "0:09:49", "throughput": 2482.89, "total_tokens": 2255360} +{"current_steps": 4600, "total_steps": 7577, "loss": 0.2572, "lr": 8.025097627567481e-07, "epoch": 0.6071004355285733, "percentage": 60.71, "elapsed_time": "0:15:08", "remaining_time": "0:09:48", "throughput": 2484.6, "total_tokens": 2257728} +{"current_steps": 4605, "total_steps": 7577, "loss": 0.0536, "lr": 8.002520994626247e-07, "epoch": 0.6077603273063218, "percentage": 60.78, "elapsed_time": "0:15:09", "remaining_time": "0:09:46", "throughput": 2486.45, "total_tokens": 2260224} +{"current_steps": 4610, "total_steps": 7577, "loss": 0.0372, "lr": 7.979954961063596e-07, "epoch": 0.6084202190840702, "percentage": 60.84, "elapsed_time": "0:15:09", "remaining_time": "0:09:45", "throughput": 2488.5, "total_tokens": 2262912} +{"current_steps": 4615, "total_steps": 7577, "loss": 0.2998, "lr": 7.957399646623436e-07, "epoch": 0.6090801108618187, "percentage": 60.91, "elapsed_time": "0:15:09", "remaining_time": "0:09:43", "throughput": 2490.08, "total_tokens": 2265152} +{"current_steps": 4620, "total_steps": 7577, "loss": 0.0008, "lr": 7.934855170992788e-07, "epoch": 0.6097400026395671, "percentage": 60.97, "elapsed_time": "0:15:10", "remaining_time": "0:09:42", "throughput": 2492.25, "total_tokens": 2267968} +{"current_steps": 4625, "total_steps": 7577, "loss": 0.0407, "lr": 7.912321653801161e-07, "epoch": 0.6103998944173156, "percentage": 61.04, "elapsed_time": "0:15:10", "remaining_time": "0:09:41", "throughput": 2493.96, "total_tokens": 2270336} +{"current_steps": 4630, "total_steps": 7577, "loss": 0.135, "lr": 7.889799214619919e-07, "epoch": 0.611059786195064, "percentage": 61.11, "elapsed_time": "0:15:10", "remaining_time": "0:09:39", "throughput": 2495.97, "total_tokens": 2273024} +{"current_steps": 4635, "total_steps": 7577, "loss": 0.0678, "lr": 7.867287972961629e-07, "epoch": 0.6117196779728125, "percentage": 61.17, "elapsed_time": "0:15:11", "remaining_time": "0:09:38", "throughput": 2497.53, "total_tokens": 2275264} +{"current_steps": 4640, "total_steps": 7577, "loss": 0.1219, "lr": 7.844788048279453e-07, "epoch": 0.612379569750561, "percentage": 61.24, "elapsed_time": "0:15:11", "remaining_time": "0:09:36", "throughput": 2499.5, "total_tokens": 2277888} +{"current_steps": 4645, "total_steps": 7577, "loss": 0.0005, "lr": 7.822299559966494e-07, "epoch": 0.6130394615283093, "percentage": 61.3, "elapsed_time": "0:15:11", "remaining_time": "0:09:35", "throughput": 2501.27, "total_tokens": 2280320} +{"current_steps": 4650, "total_steps": 7577, "loss": 0.0017, "lr": 7.799822627355171e-07, "epoch": 0.6136993533060578, "percentage": 61.37, "elapsed_time": "0:15:11", "remaining_time": "0:09:34", "throughput": 2502.84, "total_tokens": 2282560} +{"current_steps": 4655, "total_steps": 7577, "loss": 0.1505, "lr": 7.77735736971659e-07, "epoch": 0.6143592450838062, "percentage": 61.44, "elapsed_time": "0:15:12", "remaining_time": "0:09:32", "throughput": 2504.46, "total_tokens": 2284864} +{"current_steps": 4660, "total_steps": 7577, "loss": 0.165, "lr": 7.754903906259889e-07, "epoch": 0.6150191368615547, "percentage": 61.5, "elapsed_time": "0:15:12", "remaining_time": "0:09:31", "throughput": 2506.09, "total_tokens": 2287168} +{"current_steps": 4665, "total_steps": 7577, "loss": 0.0716, "lr": 7.732462356131637e-07, "epoch": 0.6156790286393031, "percentage": 61.57, "elapsed_time": "0:15:12", "remaining_time": "0:09:29", "throughput": 2507.85, "total_tokens": 2289600} +{"current_steps": 4670, "total_steps": 7577, "loss": 0.0317, "lr": 7.710032838415179e-07, "epoch": 0.6163389204170516, "percentage": 61.63, "elapsed_time": "0:15:13", "remaining_time": "0:09:28", "throughput": 2509.74, "total_tokens": 2292160} +{"current_steps": 4675, "total_steps": 7577, "loss": 0.0943, "lr": 7.687615472130016e-07, "epoch": 0.6169988121948, "percentage": 61.7, "elapsed_time": "0:15:13", "remaining_time": "0:09:27", "throughput": 2511.83, "total_tokens": 2294912} +{"current_steps": 4680, "total_steps": 7577, "loss": 0.1314, "lr": 7.665210376231165e-07, "epoch": 0.6176587039725485, "percentage": 61.77, "elapsed_time": "0:15:13", "remaining_time": "0:09:25", "throughput": 2513.25, "total_tokens": 2297024} +{"current_steps": 4685, "total_steps": 7577, "loss": 0.1436, "lr": 7.642817669608536e-07, "epoch": 0.6183185957502969, "percentage": 61.83, "elapsed_time": "0:15:14", "remaining_time": "0:09:24", "throughput": 2515.01, "total_tokens": 2299456} +{"current_steps": 4690, "total_steps": 7577, "loss": 0.013, "lr": 7.62043747108629e-07, "epoch": 0.6189784875280454, "percentage": 61.9, "elapsed_time": "0:15:14", "remaining_time": "0:09:23", "throughput": 2516.43, "total_tokens": 2301568} +{"current_steps": 4695, "total_steps": 7577, "loss": 0.168, "lr": 7.598069899422221e-07, "epoch": 0.6196383793057938, "percentage": 61.96, "elapsed_time": "0:15:14", "remaining_time": "0:09:21", "throughput": 2518.12, "total_tokens": 2303936} +{"current_steps": 4700, "total_steps": 7577, "loss": 0.1745, "lr": 7.575715073307119e-07, "epoch": 0.6202982710835423, "percentage": 62.03, "elapsed_time": "0:15:15", "remaining_time": "0:09:20", "throughput": 2519.68, "total_tokens": 2306176} +{"current_steps": 4705, "total_steps": 7577, "loss": 0.0901, "lr": 7.55337311136414e-07, "epoch": 0.6209581628612908, "percentage": 62.1, "elapsed_time": "0:15:15", "remaining_time": "0:09:18", "throughput": 2521.57, "total_tokens": 2308736} +{"current_steps": 4710, "total_steps": 7577, "loss": 0.1379, "lr": 7.531044132148183e-07, "epoch": 0.6216180546390392, "percentage": 62.16, "elapsed_time": "0:15:15", "remaining_time": "0:09:17", "throughput": 2523.23, "total_tokens": 2311104} +{"current_steps": 4715, "total_steps": 7577, "loss": 0.049, "lr": 7.508728254145245e-07, "epoch": 0.6222779464167877, "percentage": 62.23, "elapsed_time": "0:15:16", "remaining_time": "0:09:16", "throughput": 2524.97, "total_tokens": 2313536} +{"current_steps": 4720, "total_steps": 7577, "loss": 0.1208, "lr": 7.486425595771817e-07, "epoch": 0.6229378381945361, "percentage": 62.29, "elapsed_time": "0:15:16", "remaining_time": "0:09:14", "throughput": 2526.77, "total_tokens": 2316032} +{"current_steps": 4725, "total_steps": 7577, "loss": 0.205, "lr": 7.464136275374223e-07, "epoch": 0.6235977299722846, "percentage": 62.36, "elapsed_time": "0:15:16", "remaining_time": "0:09:13", "throughput": 2528.72, "total_tokens": 2318656} +{"current_steps": 4730, "total_steps": 7577, "loss": 0.1395, "lr": 7.441860411228029e-07, "epoch": 0.624257621750033, "percentage": 62.43, "elapsed_time": "0:15:17", "remaining_time": "0:09:12", "throughput": 2530.6, "total_tokens": 2321216} +{"current_steps": 4735, "total_steps": 7577, "loss": 0.1494, "lr": 7.419598121537387e-07, "epoch": 0.6249175135277815, "percentage": 62.49, "elapsed_time": "0:15:17", "remaining_time": "0:09:10", "throughput": 2532.33, "total_tokens": 2323648} +{"current_steps": 4740, "total_steps": 7577, "loss": 0.165, "lr": 7.397349524434424e-07, "epoch": 0.6255774053055299, "percentage": 62.56, "elapsed_time": "0:15:17", "remaining_time": "0:09:09", "throughput": 2534.07, "total_tokens": 2326080} +{"current_steps": 4745, "total_steps": 7577, "loss": 0.0572, "lr": 7.375114737978605e-07, "epoch": 0.6262372970832784, "percentage": 62.62, "elapsed_time": "0:15:18", "remaining_time": "0:09:08", "throughput": 2535.81, "total_tokens": 2328512} +{"current_steps": 4750, "total_steps": 7577, "loss": 0.1462, "lr": 7.352893880156106e-07, "epoch": 0.6268971888610267, "percentage": 62.69, "elapsed_time": "0:15:18", "remaining_time": "0:09:06", "throughput": 2537.62, "total_tokens": 2331008} +{"current_steps": 4755, "total_steps": 7577, "loss": 0.0943, "lr": 7.330687068879202e-07, "epoch": 0.6275570806387752, "percentage": 62.76, "elapsed_time": "0:15:18", "remaining_time": "0:09:05", "throughput": 2539.29, "total_tokens": 2333376} +{"current_steps": 4760, "total_steps": 7577, "loss": 0.2447, "lr": 7.308494421985626e-07, "epoch": 0.6282169724165237, "percentage": 62.82, "elapsed_time": "0:15:19", "remaining_time": "0:09:04", "throughput": 2541.1, "total_tokens": 2335872} +{"current_steps": 4765, "total_steps": 7577, "loss": 0.0016, "lr": 7.286316057237951e-07, "epoch": 0.6288768641942721, "percentage": 62.89, "elapsed_time": "0:15:19", "remaining_time": "0:09:02", "throughput": 2542.97, "total_tokens": 2338432} +{"current_steps": 4770, "total_steps": 7577, "loss": 0.1152, "lr": 7.264152092322963e-07, "epoch": 0.6295367559720206, "percentage": 62.95, "elapsed_time": "0:15:19", "remaining_time": "0:09:01", "throughput": 2544.77, "total_tokens": 2340928} +{"current_steps": 4775, "total_steps": 7577, "loss": 0.1148, "lr": 7.242002644851035e-07, "epoch": 0.630196647749769, "percentage": 63.02, "elapsed_time": "0:15:20", "remaining_time": "0:08:59", "throughput": 2546.84, "total_tokens": 2343680} +{"current_steps": 4780, "total_steps": 7577, "loss": 0.0689, "lr": 7.219867832355508e-07, "epoch": 0.6308565395275175, "percentage": 63.09, "elapsed_time": "0:15:20", "remaining_time": "0:08:58", "throughput": 2548.71, "total_tokens": 2346240} +{"current_steps": 4785, "total_steps": 7577, "loss": 0.0841, "lr": 7.197747772292071e-07, "epoch": 0.6315164313052659, "percentage": 63.15, "elapsed_time": "0:15:20", "remaining_time": "0:08:57", "throughput": 2550.3, "total_tokens": 2348544} +{"current_steps": 4790, "total_steps": 7577, "loss": 0.2099, "lr": 7.17564258203811e-07, "epoch": 0.6321763230830144, "percentage": 63.22, "elapsed_time": "0:15:21", "remaining_time": "0:08:55", "throughput": 2552.03, "total_tokens": 2350976} +{"current_steps": 4795, "total_steps": 7577, "loss": 0.115, "lr": 7.153552378892128e-07, "epoch": 0.6328362148607628, "percentage": 63.28, "elapsed_time": "0:15:21", "remaining_time": "0:08:54", "throughput": 2553.56, "total_tokens": 2353216} +{"current_steps": 4800, "total_steps": 7577, "loss": 0.1212, "lr": 7.131477280073091e-07, "epoch": 0.6334961066385113, "percentage": 63.35, "elapsed_time": "0:15:21", "remaining_time": "0:08:53", "throughput": 2555.21, "total_tokens": 2355584} +{"current_steps": 4805, "total_steps": 7577, "loss": 0.0817, "lr": 7.109417402719813e-07, "epoch": 0.6341559984162597, "percentage": 63.42, "elapsed_time": "0:15:22", "remaining_time": "0:08:52", "throughput": 2557.06, "total_tokens": 2358144} +{"current_steps": 4810, "total_steps": 7577, "loss": 0.029, "lr": 7.087372863890346e-07, "epoch": 0.6348158901940082, "percentage": 63.48, "elapsed_time": "0:15:22", "remaining_time": "0:08:50", "throughput": 2559.12, "total_tokens": 2360896} +{"current_steps": 4815, "total_steps": 7577, "loss": 0.2463, "lr": 7.065343780561344e-07, "epoch": 0.6354757819717566, "percentage": 63.55, "elapsed_time": "0:15:22", "remaining_time": "0:08:49", "throughput": 2560.77, "total_tokens": 2363264} +{"current_steps": 4820, "total_steps": 7577, "loss": 0.0744, "lr": 7.043330269627448e-07, "epoch": 0.6361356737495051, "percentage": 63.61, "elapsed_time": "0:15:23", "remaining_time": "0:08:48", "throughput": 2562.42, "total_tokens": 2365632} +{"current_steps": 4825, "total_steps": 7577, "loss": 0.0018, "lr": 7.021332447900671e-07, "epoch": 0.6367955655272536, "percentage": 63.68, "elapsed_time": "0:15:23", "remaining_time": "0:08:46", "throughput": 2564.06, "total_tokens": 2368000} +{"current_steps": 4830, "total_steps": 7577, "loss": 0.1116, "lr": 6.999350432109766e-07, "epoch": 0.637455457305002, "percentage": 63.75, "elapsed_time": "0:15:23", "remaining_time": "0:08:45", "throughput": 2565.91, "total_tokens": 2370560} +{"current_steps": 4835, "total_steps": 7577, "loss": 0.0011, "lr": 6.977384338899617e-07, "epoch": 0.6381153490827505, "percentage": 63.81, "elapsed_time": "0:15:24", "remaining_time": "0:08:44", "throughput": 2567.76, "total_tokens": 2373120} +{"current_steps": 4840, "total_steps": 7577, "loss": 0.033, "lr": 6.955434284830619e-07, "epoch": 0.6387752408604989, "percentage": 63.88, "elapsed_time": "0:15:24", "remaining_time": "0:08:42", "throughput": 2569.81, "total_tokens": 2375872} +{"current_steps": 4845, "total_steps": 7577, "loss": 0.2167, "lr": 6.933500386378056e-07, "epoch": 0.6394351326382474, "percentage": 63.94, "elapsed_time": "0:15:24", "remaining_time": "0:08:41", "throughput": 2571.65, "total_tokens": 2378432} +{"current_steps": 4850, "total_steps": 7577, "loss": 0.213, "lr": 6.911582759931482e-07, "epoch": 0.6400950244159958, "percentage": 64.01, "elapsed_time": "0:15:25", "remaining_time": "0:08:40", "throughput": 2573.31, "total_tokens": 2380800} +{"current_steps": 4855, "total_steps": 7577, "loss": 0.2747, "lr": 6.889681521794109e-07, "epoch": 0.6407549161937443, "percentage": 64.08, "elapsed_time": "0:15:25", "remaining_time": "0:08:38", "throughput": 2575.55, "total_tokens": 2383744} +{"current_steps": 4860, "total_steps": 7577, "loss": 0.0758, "lr": 6.867796788182181e-07, "epoch": 0.6414148079714926, "percentage": 64.14, "elapsed_time": "0:15:25", "remaining_time": "0:08:37", "throughput": 2577.2, "total_tokens": 2386112} +{"current_steps": 4865, "total_steps": 7577, "loss": 0.1529, "lr": 6.845928675224366e-07, "epoch": 0.6420746997492411, "percentage": 64.21, "elapsed_time": "0:15:26", "remaining_time": "0:08:36", "throughput": 2579.12, "total_tokens": 2388736} +{"current_steps": 4870, "total_steps": 7577, "loss": 0.0713, "lr": 6.82407729896114e-07, "epoch": 0.6427345915269895, "percentage": 64.27, "elapsed_time": "0:15:26", "remaining_time": "0:08:35", "throughput": 2580.77, "total_tokens": 2391104} +{"current_steps": 4875, "total_steps": 7577, "loss": 0.1204, "lr": 6.802242775344163e-07, "epoch": 0.643394483304738, "percentage": 64.34, "elapsed_time": "0:15:26", "remaining_time": "0:08:33", "throughput": 2582.68, "total_tokens": 2393728} +{"current_steps": 4880, "total_steps": 7577, "loss": 0.1797, "lr": 6.780425220235674e-07, "epoch": 0.6440543750824864, "percentage": 64.41, "elapsed_time": "0:15:27", "remaining_time": "0:08:32", "throughput": 2584.72, "total_tokens": 2396480} +{"current_steps": 4885, "total_steps": 7577, "loss": 0.0011, "lr": 6.758624749407859e-07, "epoch": 0.6447142668602349, "percentage": 64.47, "elapsed_time": "0:15:27", "remaining_time": "0:08:31", "throughput": 2586.62, "total_tokens": 2399104} +{"current_steps": 4890, "total_steps": 7577, "loss": 0.0861, "lr": 6.736841478542264e-07, "epoch": 0.6453741586379834, "percentage": 64.54, "elapsed_time": "0:15:27", "remaining_time": "0:08:29", "throughput": 2588.46, "total_tokens": 2401664} +{"current_steps": 4895, "total_steps": 7577, "loss": 0.0316, "lr": 6.715075523229151e-07, "epoch": 0.6460340504157318, "percentage": 64.6, "elapsed_time": "0:15:28", "remaining_time": "0:08:28", "throughput": 2590.24, "total_tokens": 2404160} +{"current_steps": 4900, "total_steps": 7577, "loss": 0.1035, "lr": 6.693326998966909e-07, "epoch": 0.6466939421934803, "percentage": 64.67, "elapsed_time": "0:15:28", "remaining_time": "0:08:27", "throughput": 2591.95, "total_tokens": 2406592} +{"current_steps": 4905, "total_steps": 7577, "loss": 0.0014, "lr": 6.671596021161431e-07, "epoch": 0.6473538339712287, "percentage": 64.74, "elapsed_time": "0:15:28", "remaining_time": "0:08:25", "throughput": 2593.71, "total_tokens": 2409088} +{"current_steps": 4910, "total_steps": 7577, "loss": 0.1158, "lr": 6.649882705125494e-07, "epoch": 0.6480137257489772, "percentage": 64.8, "elapsed_time": "0:15:29", "remaining_time": "0:08:24", "throughput": 2595.49, "total_tokens": 2411584} +{"current_steps": 4915, "total_steps": 7577, "loss": 0.472, "lr": 6.628187166078163e-07, "epoch": 0.6486736175267256, "percentage": 64.87, "elapsed_time": "0:15:29", "remaining_time": "0:08:23", "throughput": 2597.57, "total_tokens": 2414400} +{"current_steps": 4920, "total_steps": 7577, "loss": 0.0382, "lr": 6.606509519144166e-07, "epoch": 0.6493335093044741, "percentage": 64.93, "elapsed_time": "0:15:29", "remaining_time": "0:08:22", "throughput": 2599.08, "total_tokens": 2416640} +{"current_steps": 4925, "total_steps": 7577, "loss": 0.1297, "lr": 6.584849879353289e-07, "epoch": 0.6499934010822225, "percentage": 65.0, "elapsed_time": "0:15:30", "remaining_time": "0:08:20", "throughput": 2600.84, "total_tokens": 2419136} +{"current_steps": 4927, "total_steps": 7577, "eval_loss": 0.09970784932374954, "epoch": 0.6502573577933219, "percentage": 65.03, "elapsed_time": "0:15:38", "remaining_time": "0:08:24", "throughput": 2579.64, "total_tokens": 2420096} +{"current_steps": 4930, "total_steps": 7577, "loss": 0.0423, "lr": 6.563208361639772e-07, "epoch": 0.650653292859971, "percentage": 65.07, "elapsed_time": "0:16:23", "remaining_time": "0:08:48", "throughput": 2462.08, "total_tokens": 2421440} +{"current_steps": 4935, "total_steps": 7577, "loss": 0.0187, "lr": 6.541585080841687e-07, "epoch": 0.6513131846377194, "percentage": 65.13, "elapsed_time": "0:16:23", "remaining_time": "0:08:46", "throughput": 2463.85, "total_tokens": 2424000} +{"current_steps": 4940, "total_steps": 7577, "loss": 0.1785, "lr": 6.519980151700332e-07, "epoch": 0.6519730764154679, "percentage": 65.2, "elapsed_time": "0:16:24", "remaining_time": "0:08:45", "throughput": 2465.31, "total_tokens": 2426240} +{"current_steps": 4945, "total_steps": 7577, "loss": 0.1136, "lr": 6.498393688859629e-07, "epoch": 0.6526329681932164, "percentage": 65.26, "elapsed_time": "0:16:24", "remaining_time": "0:08:43", "throughput": 2467.14, "total_tokens": 2428864} +{"current_steps": 4950, "total_steps": 7577, "loss": 0.0011, "lr": 6.47682580686551e-07, "epoch": 0.6532928599709648, "percentage": 65.33, "elapsed_time": "0:16:24", "remaining_time": "0:08:42", "throughput": 2468.8, "total_tokens": 2431296} +{"current_steps": 4955, "total_steps": 7577, "loss": 0.0017, "lr": 6.455276620165307e-07, "epoch": 0.6539527517487133, "percentage": 65.4, "elapsed_time": "0:16:25", "remaining_time": "0:08:41", "throughput": 2470.68, "total_tokens": 2433984} +{"current_steps": 4960, "total_steps": 7577, "loss": 0.4128, "lr": 6.433746243107152e-07, "epoch": 0.6546126435264616, "percentage": 65.46, "elapsed_time": "0:16:25", "remaining_time": "0:08:39", "throughput": 2472.13, "total_tokens": 2436224} +{"current_steps": 4965, "total_steps": 7577, "loss": 0.1516, "lr": 6.412234789939359e-07, "epoch": 0.6552725353042101, "percentage": 65.53, "elapsed_time": "0:16:25", "remaining_time": "0:08:38", "throughput": 2473.84, "total_tokens": 2438720} +{"current_steps": 4970, "total_steps": 7577, "loss": 0.0589, "lr": 6.390742374809832e-07, "epoch": 0.6559324270819585, "percentage": 65.59, "elapsed_time": "0:16:26", "remaining_time": "0:08:37", "throughput": 2475.29, "total_tokens": 2440960} +{"current_steps": 4975, "total_steps": 7577, "loss": 0.0597, "lr": 6.369269111765454e-07, "epoch": 0.656592318859707, "percentage": 65.66, "elapsed_time": "0:16:26", "remaining_time": "0:08:35", "throughput": 2476.86, "total_tokens": 2443328} +{"current_steps": 4980, "total_steps": 7577, "loss": 0.1664, "lr": 6.347815114751465e-07, "epoch": 0.6572522106374554, "percentage": 65.73, "elapsed_time": "0:16:26", "remaining_time": "0:08:34", "throughput": 2478.68, "total_tokens": 2445952} +{"current_steps": 4985, "total_steps": 7577, "loss": 0.1165, "lr": 6.326380497610886e-07, "epoch": 0.6579121024152039, "percentage": 65.79, "elapsed_time": "0:16:27", "remaining_time": "0:08:33", "throughput": 2480.5, "total_tokens": 2448576} +{"current_steps": 4990, "total_steps": 7577, "loss": 0.3173, "lr": 6.304965374083899e-07, "epoch": 0.6585719941929523, "percentage": 65.86, "elapsed_time": "0:16:27", "remaining_time": "0:08:31", "throughput": 2482.26, "total_tokens": 2451136} +{"current_steps": 4995, "total_steps": 7577, "loss": 0.002, "lr": 6.283569857807245e-07, "epoch": 0.6592318859707008, "percentage": 65.92, "elapsed_time": "0:16:27", "remaining_time": "0:08:30", "throughput": 2483.96, "total_tokens": 2453632} +{"current_steps": 5000, "total_steps": 7577, "loss": 0.0644, "lr": 6.262194062313615e-07, "epoch": 0.6598917777484492, "percentage": 65.99, "elapsed_time": "0:16:28", "remaining_time": "0:08:29", "throughput": 2485.72, "total_tokens": 2456192} +{"current_steps": 5005, "total_steps": 7577, "loss": 0.0013, "lr": 6.240838101031063e-07, "epoch": 0.6605516695261977, "percentage": 66.06, "elapsed_time": "0:16:28", "remaining_time": "0:08:27", "throughput": 2487.34, "total_tokens": 2458624} +{"current_steps": 5010, "total_steps": 7577, "loss": 0.0896, "lr": 6.21950208728239e-07, "epoch": 0.6612115613039462, "percentage": 66.12, "elapsed_time": "0:16:28", "remaining_time": "0:08:26", "throughput": 2488.85, "total_tokens": 2460928} +{"current_steps": 5015, "total_steps": 7577, "loss": 0.1054, "lr": 6.198186134284554e-07, "epoch": 0.6618714530816946, "percentage": 66.19, "elapsed_time": "0:16:29", "remaining_time": "0:08:25", "throughput": 2490.66, "total_tokens": 2463552} +{"current_steps": 5020, "total_steps": 7577, "loss": 0.0028, "lr": 6.176890355148049e-07, "epoch": 0.6625313448594431, "percentage": 66.25, "elapsed_time": "0:16:29", "remaining_time": "0:08:23", "throughput": 2492.17, "total_tokens": 2465856} +{"current_steps": 5025, "total_steps": 7577, "loss": 0.0981, "lr": 6.155614862876335e-07, "epoch": 0.6631912366371915, "percentage": 66.32, "elapsed_time": "0:16:29", "remaining_time": "0:08:22", "throughput": 2493.79, "total_tokens": 2468288} +{"current_steps": 5030, "total_steps": 7577, "loss": 0.1368, "lr": 6.134359770365214e-07, "epoch": 0.66385112841494, "percentage": 66.39, "elapsed_time": "0:16:30", "remaining_time": "0:08:21", "throughput": 2495.58, "total_tokens": 2470912} +{"current_steps": 5035, "total_steps": 7577, "loss": 0.0711, "lr": 6.11312519040224e-07, "epoch": 0.6645110201926884, "percentage": 66.45, "elapsed_time": "0:16:30", "remaining_time": "0:08:20", "throughput": 2497.39, "total_tokens": 2473536} +{"current_steps": 5040, "total_steps": 7577, "loss": 0.0009, "lr": 6.091911235666125e-07, "epoch": 0.6651709119704369, "percentage": 66.52, "elapsed_time": "0:16:30", "remaining_time": "0:08:18", "throughput": 2499.07, "total_tokens": 2476032} +{"current_steps": 5045, "total_steps": 7577, "loss": 0.1034, "lr": 6.070718018726124e-07, "epoch": 0.6658308037481853, "percentage": 66.58, "elapsed_time": "0:16:31", "remaining_time": "0:08:17", "throughput": 2500.44, "total_tokens": 2478208} +{"current_steps": 5050, "total_steps": 7577, "loss": 0.1196, "lr": 6.049545652041459e-07, "epoch": 0.6664906955259338, "percentage": 66.65, "elapsed_time": "0:16:31", "remaining_time": "0:08:16", "throughput": 2501.93, "total_tokens": 2480512} +{"current_steps": 5055, "total_steps": 7577, "loss": 0.1824, "lr": 6.028394247960709e-07, "epoch": 0.6671505873036822, "percentage": 66.72, "elapsed_time": "0:16:31", "remaining_time": "0:08:14", "throughput": 2503.61, "total_tokens": 2483008} +{"current_steps": 5060, "total_steps": 7577, "loss": 0.1399, "lr": 6.007263918721221e-07, "epoch": 0.6678104790814307, "percentage": 66.78, "elapsed_time": "0:16:32", "remaining_time": "0:08:13", "throughput": 2505.18, "total_tokens": 2485376} +{"current_steps": 5065, "total_steps": 7577, "loss": 0.07, "lr": 5.986154776448507e-07, "epoch": 0.668470370859179, "percentage": 66.85, "elapsed_time": "0:16:32", "remaining_time": "0:08:12", "throughput": 2507.04, "total_tokens": 2488064} +{"current_steps": 5070, "total_steps": 7577, "loss": 0.0635, "lr": 5.965066933155656e-07, "epoch": 0.6691302626369275, "percentage": 66.91, "elapsed_time": "0:16:32", "remaining_time": "0:08:10", "throughput": 2508.78, "total_tokens": 2490624} +{"current_steps": 5075, "total_steps": 7577, "loss": 0.2914, "lr": 5.944000500742735e-07, "epoch": 0.669790154414676, "percentage": 66.98, "elapsed_time": "0:16:33", "remaining_time": "0:08:09", "throughput": 2510.58, "total_tokens": 2493248} +{"current_steps": 5080, "total_steps": 7577, "loss": 0.2126, "lr": 5.922955590996195e-07, "epoch": 0.6704500461924244, "percentage": 67.05, "elapsed_time": "0:16:33", "remaining_time": "0:08:08", "throughput": 2512.26, "total_tokens": 2495744} +{"current_steps": 5085, "total_steps": 7577, "loss": 0.0014, "lr": 5.901932315588281e-07, "epoch": 0.6711099379701729, "percentage": 67.11, "elapsed_time": "0:16:33", "remaining_time": "0:08:07", "throughput": 2513.88, "total_tokens": 2498176} +{"current_steps": 5090, "total_steps": 7577, "loss": 0.1766, "lr": 5.880930786076441e-07, "epoch": 0.6717698297479213, "percentage": 67.18, "elapsed_time": "0:16:34", "remaining_time": "0:08:05", "throughput": 2515.32, "total_tokens": 2500416} +{"current_steps": 5095, "total_steps": 7577, "loss": 0.0912, "lr": 5.859951113902728e-07, "epoch": 0.6724297215256698, "percentage": 67.24, "elapsed_time": "0:16:34", "remaining_time": "0:08:04", "throughput": 2516.92, "total_tokens": 2502848} +{"current_steps": 5100, "total_steps": 7577, "loss": 0.1217, "lr": 5.83899341039321e-07, "epoch": 0.6730896133034182, "percentage": 67.31, "elapsed_time": "0:16:34", "remaining_time": "0:08:03", "throughput": 2518.42, "total_tokens": 2505152} +{"current_steps": 5105, "total_steps": 7577, "loss": 0.1365, "lr": 5.818057786757386e-07, "epoch": 0.6737495050811667, "percentage": 67.37, "elapsed_time": "0:16:35", "remaining_time": "0:08:01", "throughput": 2520.09, "total_tokens": 2507648} +{"current_steps": 5110, "total_steps": 7577, "loss": 0.1131, "lr": 5.797144354087588e-07, "epoch": 0.6744093968589151, "percentage": 67.44, "elapsed_time": "0:16:35", "remaining_time": "0:08:00", "throughput": 2521.74, "total_tokens": 2510144} +{"current_steps": 5115, "total_steps": 7577, "loss": 0.0198, "lr": 5.77625322335839e-07, "epoch": 0.6750692886366636, "percentage": 67.51, "elapsed_time": "0:16:35", "remaining_time": "0:07:59", "throughput": 2523.77, "total_tokens": 2513024} +{"current_steps": 5120, "total_steps": 7577, "loss": 0.0733, "lr": 5.755384505426032e-07, "epoch": 0.675729180414412, "percentage": 67.57, "elapsed_time": "0:16:36", "remaining_time": "0:07:57", "throughput": 2524.99, "total_tokens": 2515072} +{"current_steps": 5125, "total_steps": 7577, "loss": 0.0013, "lr": 5.734538311027819e-07, "epoch": 0.6763890721921605, "percentage": 67.64, "elapsed_time": "0:16:36", "remaining_time": "0:07:56", "throughput": 2526.47, "total_tokens": 2517376} +{"current_steps": 5130, "total_steps": 7577, "loss": 0.003, "lr": 5.713714750781533e-07, "epoch": 0.677048963969909, "percentage": 67.7, "elapsed_time": "0:16:36", "remaining_time": "0:07:55", "throughput": 2528.32, "total_tokens": 2520064} +{"current_steps": 5135, "total_steps": 7577, "loss": 0.0716, "lr": 5.692913935184862e-07, "epoch": 0.6777088557476574, "percentage": 67.77, "elapsed_time": "0:16:37", "remaining_time": "0:07:54", "throughput": 2530.12, "total_tokens": 2522688} +{"current_steps": 5140, "total_steps": 7577, "loss": 0.0165, "lr": 5.672135974614794e-07, "epoch": 0.6783687475254059, "percentage": 67.84, "elapsed_time": "0:16:37", "remaining_time": "0:07:52", "throughput": 2531.78, "total_tokens": 2525184} +{"current_steps": 5145, "total_steps": 7577, "loss": 0.0008, "lr": 5.651380979327034e-07, "epoch": 0.6790286393031543, "percentage": 67.9, "elapsed_time": "0:16:37", "remaining_time": "0:07:51", "throughput": 2533.33, "total_tokens": 2527552} +{"current_steps": 5150, "total_steps": 7577, "loss": 0.0435, "lr": 5.630649059455444e-07, "epoch": 0.6796885310809028, "percentage": 67.97, "elapsed_time": "0:16:38", "remaining_time": "0:07:50", "throughput": 2535.18, "total_tokens": 2530240} +{"current_steps": 5155, "total_steps": 7577, "loss": 0.0116, "lr": 5.609940325011413e-07, "epoch": 0.6803484228586512, "percentage": 68.03, "elapsed_time": "0:16:38", "remaining_time": "0:07:49", "throughput": 2536.6, "total_tokens": 2532480} +{"current_steps": 5160, "total_steps": 7577, "loss": 0.0006, "lr": 5.589254885883325e-07, "epoch": 0.6810083146363997, "percentage": 68.1, "elapsed_time": "0:16:38", "remaining_time": "0:07:47", "throughput": 2538.19, "total_tokens": 2534912} +{"current_steps": 5165, "total_steps": 7577, "loss": 0.0753, "lr": 5.568592851835936e-07, "epoch": 0.681668206414148, "percentage": 68.17, "elapsed_time": "0:16:39", "remaining_time": "0:07:46", "throughput": 2539.86, "total_tokens": 2537408} +{"current_steps": 5170, "total_steps": 7577, "loss": 0.2943, "lr": 5.547954332509805e-07, "epoch": 0.6823280981918965, "percentage": 68.23, "elapsed_time": "0:16:39", "remaining_time": "0:07:45", "throughput": 2541.4, "total_tokens": 2539776} +{"current_steps": 5175, "total_steps": 7577, "loss": 0.001, "lr": 5.527339437420717e-07, "epoch": 0.6829879899696449, "percentage": 68.3, "elapsed_time": "0:16:39", "remaining_time": "0:07:44", "throughput": 2543.0, "total_tokens": 2542208} +{"current_steps": 5180, "total_steps": 7577, "loss": 0.0691, "lr": 5.506748275959094e-07, "epoch": 0.6836478817473934, "percentage": 68.36, "elapsed_time": "0:16:40", "remaining_time": "0:07:42", "throughput": 2544.65, "total_tokens": 2544704} +{"current_steps": 5185, "total_steps": 7577, "loss": 0.0527, "lr": 5.48618095738943e-07, "epoch": 0.6843077735251418, "percentage": 68.43, "elapsed_time": "0:16:40", "remaining_time": "0:07:41", "throughput": 2546.18, "total_tokens": 2547072} +{"current_steps": 5190, "total_steps": 7577, "loss": 0.121, "lr": 5.465637590849681e-07, "epoch": 0.6849676653028903, "percentage": 68.5, "elapsed_time": "0:16:40", "remaining_time": "0:07:40", "throughput": 2547.7, "total_tokens": 2549440} +{"current_steps": 5195, "total_steps": 7577, "loss": 0.1132, "lr": 5.445118285350723e-07, "epoch": 0.6856275570806388, "percentage": 68.56, "elapsed_time": "0:16:41", "remaining_time": "0:07:38", "throughput": 2549.54, "total_tokens": 2552128} +{"current_steps": 5200, "total_steps": 7577, "loss": 0.0694, "lr": 5.424623149775745e-07, "epoch": 0.6862874488583872, "percentage": 68.63, "elapsed_time": "0:16:41", "remaining_time": "0:07:37", "throughput": 2550.94, "total_tokens": 2554368} +{"current_steps": 5205, "total_steps": 7577, "loss": 0.1189, "lr": 5.404152292879676e-07, "epoch": 0.6869473406361357, "percentage": 68.69, "elapsed_time": "0:16:41", "remaining_time": "0:07:36", "throughput": 2552.65, "total_tokens": 2556928} +{"current_steps": 5210, "total_steps": 7577, "loss": 0.1717, "lr": 5.38370582328863e-07, "epoch": 0.6876072324138841, "percentage": 68.76, "elapsed_time": "0:16:42", "remaining_time": "0:07:35", "throughput": 2554.24, "total_tokens": 2559360} +{"current_steps": 5215, "total_steps": 7577, "loss": 0.1758, "lr": 5.363283849499293e-07, "epoch": 0.6882671241916326, "percentage": 68.83, "elapsed_time": "0:16:42", "remaining_time": "0:07:33", "throughput": 2555.88, "total_tokens": 2561856} +{"current_steps": 5220, "total_steps": 7577, "loss": 0.1671, "lr": 5.342886479878387e-07, "epoch": 0.688927015969381, "percentage": 68.89, "elapsed_time": "0:16:42", "remaining_time": "0:07:32", "throughput": 2557.52, "total_tokens": 2564352} +{"current_steps": 5225, "total_steps": 7577, "loss": 0.0526, "lr": 5.32251382266206e-07, "epoch": 0.6895869077471295, "percentage": 68.96, "elapsed_time": "0:16:43", "remaining_time": "0:07:31", "throughput": 2559.1, "total_tokens": 2566784} +{"current_steps": 5230, "total_steps": 7577, "loss": 0.1115, "lr": 5.302165985955327e-07, "epoch": 0.6902467995248779, "percentage": 69.02, "elapsed_time": "0:16:43", "remaining_time": "0:07:30", "throughput": 2560.62, "total_tokens": 2569152} +{"current_steps": 5235, "total_steps": 7577, "loss": 0.0649, "lr": 5.281843077731511e-07, "epoch": 0.6909066913026264, "percentage": 69.09, "elapsed_time": "0:16:43", "remaining_time": "0:07:29", "throughput": 2562.14, "total_tokens": 2571520} +{"current_steps": 5240, "total_steps": 7577, "loss": 0.0934, "lr": 5.26154520583163e-07, "epoch": 0.6915665830803748, "percentage": 69.16, "elapsed_time": "0:16:43", "remaining_time": "0:07:27", "throughput": 2563.85, "total_tokens": 2574080} +{"current_steps": 5245, "total_steps": 7577, "loss": 0.1196, "lr": 5.241272477963877e-07, "epoch": 0.6922264748581233, "percentage": 69.22, "elapsed_time": "0:16:44", "remaining_time": "0:07:26", "throughput": 2565.26, "total_tokens": 2576320} +{"current_steps": 5250, "total_steps": 7577, "loss": 0.0494, "lr": 5.221025001703e-07, "epoch": 0.6928863666358717, "percentage": 69.29, "elapsed_time": "0:16:44", "remaining_time": "0:07:25", "throughput": 2566.85, "total_tokens": 2578752} +{"current_steps": 5255, "total_steps": 7577, "loss": 0.1279, "lr": 5.200802884489768e-07, "epoch": 0.6935462584136202, "percentage": 69.35, "elapsed_time": "0:16:44", "remaining_time": "0:07:24", "throughput": 2568.43, "total_tokens": 2581184} +{"current_steps": 5260, "total_steps": 7577, "loss": 0.2016, "lr": 5.180606233630374e-07, "epoch": 0.6942061501913687, "percentage": 69.42, "elapsed_time": "0:16:45", "remaining_time": "0:07:22", "throughput": 2570.24, "total_tokens": 2583872} +{"current_steps": 5265, "total_steps": 7577, "loss": 0.1809, "lr": 5.160435156295879e-07, "epoch": 0.694866041969117, "percentage": 69.49, "elapsed_time": "0:16:45", "remaining_time": "0:07:21", "throughput": 2571.8, "total_tokens": 2586304} +{"current_steps": 5270, "total_steps": 7577, "loss": 0.0593, "lr": 5.14028975952165e-07, "epoch": 0.6955259337468656, "percentage": 69.55, "elapsed_time": "0:16:45", "remaining_time": "0:07:20", "throughput": 2573.67, "total_tokens": 2589056} +{"current_steps": 5275, "total_steps": 7577, "loss": 0.0839, "lr": 5.120170150206768e-07, "epoch": 0.6961858255246139, "percentage": 69.62, "elapsed_time": "0:16:46", "remaining_time": "0:07:19", "throughput": 2575.24, "total_tokens": 2591488} +{"current_steps": 5280, "total_steps": 7577, "loss": 0.0112, "lr": 5.100076435113496e-07, "epoch": 0.6968457173023624, "percentage": 69.68, "elapsed_time": "0:16:46", "remaining_time": "0:07:17", "throughput": 2576.69, "total_tokens": 2593792} +{"current_steps": 5285, "total_steps": 7577, "loss": 0.1564, "lr": 5.080008720866673e-07, "epoch": 0.6975056090801108, "percentage": 69.75, "elapsed_time": "0:16:46", "remaining_time": "0:07:16", "throughput": 2578.01, "total_tokens": 2595968} +{"current_steps": 5290, "total_steps": 7577, "loss": 0.2333, "lr": 5.059967113953173e-07, "epoch": 0.6981655008578593, "percentage": 69.82, "elapsed_time": "0:16:47", "remaining_time": "0:07:15", "throughput": 2579.34, "total_tokens": 2598144} +{"current_steps": 5295, "total_steps": 7577, "loss": 0.0942, "lr": 5.039951720721349e-07, "epoch": 0.6988253926356077, "percentage": 69.88, "elapsed_time": "0:16:47", "remaining_time": "0:07:14", "throughput": 2580.78, "total_tokens": 2600448} +{"current_steps": 5300, "total_steps": 7577, "loss": 0.0922, "lr": 5.019962647380429e-07, "epoch": 0.6994852844133562, "percentage": 69.95, "elapsed_time": "0:16:47", "remaining_time": "0:07:13", "throughput": 2582.4, "total_tokens": 2602944} +{"current_steps": 5305, "total_steps": 7577, "loss": 0.1829, "lr": 5.000000000000002e-07, "epoch": 0.7001451761911046, "percentage": 70.01, "elapsed_time": "0:16:48", "remaining_time": "0:07:11", "throughput": 2583.72, "total_tokens": 2605120} +{"current_steps": 5306, "total_steps": 7577, "eval_loss": 0.09362584352493286, "epoch": 0.7002771545466544, "percentage": 70.03, "elapsed_time": "0:16:56", "remaining_time": "0:07:15", "throughput": 2563.57, "total_tokens": 2605504} +{"current_steps": 5310, "total_steps": 7577, "loss": 0.0412, "lr": 4.980063884509414e-07, "epoch": 0.7008050679688531, "percentage": 70.08, "elapsed_time": "0:17:19", "remaining_time": "0:07:23", "throughput": 2508.21, "total_tokens": 2607296} +{"current_steps": 5315, "total_steps": 7577, "loss": 0.0804, "lr": 4.960154406697229e-07, "epoch": 0.7014649597466015, "percentage": 70.15, "elapsed_time": "0:17:19", "remaining_time": "0:07:22", "throughput": 2509.73, "total_tokens": 2609728} +{"current_steps": 5320, "total_steps": 7577, "loss": 0.2263, "lr": 4.940271672210667e-07, "epoch": 0.70212485152435, "percentage": 70.21, "elapsed_time": "0:17:20", "remaining_time": "0:07:21", "throughput": 2511.33, "total_tokens": 2612224} +{"current_steps": 5325, "total_steps": 7577, "loss": 0.0293, "lr": 4.920415786555025e-07, "epoch": 0.7027847433020985, "percentage": 70.28, "elapsed_time": "0:17:20", "remaining_time": "0:07:20", "throughput": 2512.93, "total_tokens": 2614720} +{"current_steps": 5330, "total_steps": 7577, "loss": 0.2921, "lr": 4.900586855093144e-07, "epoch": 0.7034446350798469, "percentage": 70.34, "elapsed_time": "0:17:20", "remaining_time": "0:07:18", "throughput": 2514.64, "total_tokens": 2617344} +{"current_steps": 5335, "total_steps": 7577, "loss": 0.1245, "lr": 4.880784983044827e-07, "epoch": 0.7041045268575954, "percentage": 70.41, "elapsed_time": "0:17:21", "remaining_time": "0:07:17", "throughput": 2515.99, "total_tokens": 2619584} +{"current_steps": 5340, "total_steps": 7577, "loss": 0.0299, "lr": 4.861010275486284e-07, "epoch": 0.7047644186353438, "percentage": 70.48, "elapsed_time": "0:17:21", "remaining_time": "0:07:16", "throughput": 2517.39, "total_tokens": 2621888} +{"current_steps": 5345, "total_steps": 7577, "loss": 0.0976, "lr": 4.8412628373496e-07, "epoch": 0.7054243104130923, "percentage": 70.54, "elapsed_time": "0:17:21", "remaining_time": "0:07:15", "throughput": 2519.1, "total_tokens": 2624512} +{"current_steps": 5350, "total_steps": 7577, "loss": 0.0023, "lr": 4.821542773422136e-07, "epoch": 0.7060842021908407, "percentage": 70.61, "elapsed_time": "0:17:22", "remaining_time": "0:07:13", "throughput": 2520.69, "total_tokens": 2627008} +{"current_steps": 5355, "total_steps": 7577, "loss": 0.0019, "lr": 4.801850188346012e-07, "epoch": 0.7067440939685892, "percentage": 70.67, "elapsed_time": "0:17:22", "remaining_time": "0:07:12", "throughput": 2522.21, "total_tokens": 2629440} +{"current_steps": 5360, "total_steps": 7577, "loss": 0.1053, "lr": 4.782185186617523e-07, "epoch": 0.7074039857463376, "percentage": 70.74, "elapsed_time": "0:17:22", "remaining_time": "0:07:11", "throughput": 2523.73, "total_tokens": 2631872} +{"current_steps": 5365, "total_steps": 7577, "loss": 0.0618, "lr": 4.762547872586603e-07, "epoch": 0.7080638775240861, "percentage": 70.81, "elapsed_time": "0:17:23", "remaining_time": "0:07:10", "throughput": 2525.48, "total_tokens": 2634560} +{"current_steps": 5370, "total_steps": 7577, "loss": 0.1344, "lr": 4.7429383504562605e-07, "epoch": 0.7087237693018344, "percentage": 70.87, "elapsed_time": "0:17:23", "remaining_time": "0:07:08", "throughput": 2527.12, "total_tokens": 2637120} +{"current_steps": 5375, "total_steps": 7577, "loss": 0.0227, "lr": 4.723356724282029e-07, "epoch": 0.709383661079583, "percentage": 70.94, "elapsed_time": "0:17:23", "remaining_time": "0:07:07", "throughput": 2528.64, "total_tokens": 2639552} +{"current_steps": 5380, "total_steps": 7577, "loss": 0.128, "lr": 4.703803097971426e-07, "epoch": 0.7100435528573315, "percentage": 71.0, "elapsed_time": "0:17:24", "remaining_time": "0:07:06", "throughput": 2530.17, "total_tokens": 2641984} +{"current_steps": 5385, "total_steps": 7577, "loss": 0.0719, "lr": 4.6842775752833763e-07, "epoch": 0.7107034446350798, "percentage": 71.07, "elapsed_time": "0:17:24", "remaining_time": "0:07:05", "throughput": 2531.64, "total_tokens": 2644352} +{"current_steps": 5390, "total_steps": 7577, "loss": 0.0018, "lr": 4.664780259827689e-07, "epoch": 0.7113633364128283, "percentage": 71.14, "elapsed_time": "0:17:24", "remaining_time": "0:07:03", "throughput": 2533.4, "total_tokens": 2647040} +{"current_steps": 5395, "total_steps": 7577, "loss": 0.001, "lr": 4.6453112550644857e-07, "epoch": 0.7120232281905767, "percentage": 71.2, "elapsed_time": "0:17:25", "remaining_time": "0:07:02", "throughput": 2534.92, "total_tokens": 2649472} +{"current_steps": 5400, "total_steps": 7577, "loss": 0.0643, "lr": 4.625870664303663e-07, "epoch": 0.7126831199683252, "percentage": 71.27, "elapsed_time": "0:17:25", "remaining_time": "0:07:01", "throughput": 2536.39, "total_tokens": 2651840} +{"current_steps": 5405, "total_steps": 7577, "loss": 0.0024, "lr": 4.6064585907043486e-07, "epoch": 0.7133430117460736, "percentage": 71.33, "elapsed_time": "0:17:25", "remaining_time": "0:07:00", "throughput": 2538.09, "total_tokens": 2654464} +{"current_steps": 5410, "total_steps": 7577, "loss": 0.0598, "lr": 4.587075137274334e-07, "epoch": 0.7140029035238221, "percentage": 71.4, "elapsed_time": "0:17:26", "remaining_time": "0:06:59", "throughput": 2539.33, "total_tokens": 2656576} +{"current_steps": 5415, "total_steps": 7577, "loss": 0.0527, "lr": 4.5677204068695597e-07, "epoch": 0.7146627953015705, "percentage": 71.47, "elapsed_time": "0:17:26", "remaining_time": "0:06:57", "throughput": 2540.85, "total_tokens": 2659008} +{"current_steps": 5420, "total_steps": 7577, "loss": 0.037, "lr": 4.5483945021935356e-07, "epoch": 0.715322687079319, "percentage": 71.53, "elapsed_time": "0:17:26", "remaining_time": "0:06:56", "throughput": 2542.54, "total_tokens": 2661632} +{"current_steps": 5425, "total_steps": 7577, "loss": 0.1053, "lr": 4.5290975257968155e-07, "epoch": 0.7159825788570674, "percentage": 71.6, "elapsed_time": "0:17:27", "remaining_time": "0:06:55", "throughput": 2544.18, "total_tokens": 2664192} +{"current_steps": 5430, "total_steps": 7577, "loss": 0.185, "lr": 4.509829580076452e-07, "epoch": 0.7166424706348159, "percentage": 71.66, "elapsed_time": "0:17:27", "remaining_time": "0:06:54", "throughput": 2545.7, "total_tokens": 2666624} +{"current_steps": 5435, "total_steps": 7577, "loss": 0.1415, "lr": 4.490590767275442e-07, "epoch": 0.7173023624125643, "percentage": 71.73, "elapsed_time": "0:17:27", "remaining_time": "0:06:52", "throughput": 2547.29, "total_tokens": 2669120} +{"current_steps": 5440, "total_steps": 7577, "loss": 0.1221, "lr": 4.4713811894822064e-07, "epoch": 0.7179622541903128, "percentage": 71.8, "elapsed_time": "0:17:28", "remaining_time": "0:06:51", "throughput": 2548.82, "total_tokens": 2671552} +{"current_steps": 5445, "total_steps": 7577, "loss": 0.0782, "lr": 4.4522009486300204e-07, "epoch": 0.7186221459680613, "percentage": 71.86, "elapsed_time": "0:17:28", "remaining_time": "0:06:50", "throughput": 2550.57, "total_tokens": 2674240} +{"current_steps": 5450, "total_steps": 7577, "loss": 0.0865, "lr": 4.43305014649649e-07, "epoch": 0.7192820377458097, "percentage": 71.93, "elapsed_time": "0:17:28", "remaining_time": "0:06:49", "throughput": 2551.96, "total_tokens": 2676544} +{"current_steps": 5455, "total_steps": 7577, "loss": 0.0004, "lr": 4.4139288847030155e-07, "epoch": 0.7199419295235582, "percentage": 71.99, "elapsed_time": "0:17:29", "remaining_time": "0:06:48", "throughput": 2553.41, "total_tokens": 2678912} +{"current_steps": 5460, "total_steps": 7577, "loss": 0.0538, "lr": 4.394837264714233e-07, "epoch": 0.7206018213013066, "percentage": 72.06, "elapsed_time": "0:17:29", "remaining_time": "0:06:46", "throughput": 2554.93, "total_tokens": 2681344} +{"current_steps": 5465, "total_steps": 7577, "loss": 0.0013, "lr": 4.3757753878375005e-07, "epoch": 0.7212617130790551, "percentage": 72.13, "elapsed_time": "0:17:29", "remaining_time": "0:06:45", "throughput": 2556.43, "total_tokens": 2683776} +{"current_steps": 5470, "total_steps": 7577, "loss": 0.0553, "lr": 4.3567433552223375e-07, "epoch": 0.7219216048568035, "percentage": 72.19, "elapsed_time": "0:17:30", "remaining_time": "0:06:44", "throughput": 2557.77, "total_tokens": 2686016} +{"current_steps": 5475, "total_steps": 7577, "loss": 0.1592, "lr": 4.3377412678599e-07, "epoch": 0.722581496634552, "percentage": 72.26, "elapsed_time": "0:17:30", "remaining_time": "0:06:43", "throughput": 2558.98, "total_tokens": 2688128} +{"current_steps": 5480, "total_steps": 7577, "loss": 0.1678, "lr": 4.318769226582454e-07, "epoch": 0.7232413884123003, "percentage": 72.32, "elapsed_time": "0:17:30", "remaining_time": "0:06:42", "throughput": 2560.33, "total_tokens": 2690368} +{"current_steps": 5485, "total_steps": 7577, "loss": 0.0807, "lr": 4.299827332062811e-07, "epoch": 0.7239012801900488, "percentage": 72.39, "elapsed_time": "0:17:31", "remaining_time": "0:06:40", "throughput": 2562.02, "total_tokens": 2692992} +{"current_steps": 5490, "total_steps": 7577, "loss": 0.0951, "lr": 4.2809156848138363e-07, "epoch": 0.7245611719677972, "percentage": 72.46, "elapsed_time": "0:17:31", "remaining_time": "0:06:39", "throughput": 2563.54, "total_tokens": 2695424} +{"current_steps": 5495, "total_steps": 7577, "loss": 0.1498, "lr": 4.2620343851878616e-07, "epoch": 0.7252210637455457, "percentage": 72.52, "elapsed_time": "0:17:31", "remaining_time": "0:06:38", "throughput": 2565.06, "total_tokens": 2697856} +{"current_steps": 5500, "total_steps": 7577, "loss": 0.0717, "lr": 4.2431835333762123e-07, "epoch": 0.7258809555232941, "percentage": 72.59, "elapsed_time": "0:17:32", "remaining_time": "0:06:37", "throughput": 2566.86, "total_tokens": 2700608} +{"current_steps": 5505, "total_steps": 7577, "loss": 0.0003, "lr": 4.224363229408628e-07, "epoch": 0.7265408473010426, "percentage": 72.65, "elapsed_time": "0:17:32", "remaining_time": "0:06:36", "throughput": 2568.43, "total_tokens": 2703104} +{"current_steps": 5510, "total_steps": 7577, "loss": 0.2012, "lr": 4.205573573152753e-07, "epoch": 0.7272007390787911, "percentage": 72.72, "elapsed_time": "0:17:32", "remaining_time": "0:06:34", "throughput": 2569.78, "total_tokens": 2705344} +{"current_steps": 5515, "total_steps": 7577, "loss": 0.0556, "lr": 4.18681466431361e-07, "epoch": 0.7278606308565395, "percentage": 72.79, "elapsed_time": "0:17:33", "remaining_time": "0:06:33", "throughput": 2571.06, "total_tokens": 2707520} +{"current_steps": 5520, "total_steps": 7577, "loss": 0.0709, "lr": 4.168086602433055e-07, "epoch": 0.728520522634288, "percentage": 72.85, "elapsed_time": "0:17:33", "remaining_time": "0:06:32", "throughput": 2572.52, "total_tokens": 2709888} +{"current_steps": 5525, "total_steps": 7577, "loss": 0.2017, "lr": 4.1493894868892676e-07, "epoch": 0.7291804144120364, "percentage": 72.92, "elapsed_time": "0:17:33", "remaining_time": "0:06:31", "throughput": 2573.92, "total_tokens": 2712192} +{"current_steps": 5530, "total_steps": 7577, "loss": 0.0165, "lr": 4.1307234168962093e-07, "epoch": 0.7298403061897849, "percentage": 72.98, "elapsed_time": "0:17:34", "remaining_time": "0:06:30", "throughput": 2575.2, "total_tokens": 2714368} +{"current_steps": 5535, "total_steps": 7577, "loss": 0.0494, "lr": 4.112088491503095e-07, "epoch": 0.7305001979675333, "percentage": 73.05, "elapsed_time": "0:17:34", "remaining_time": "0:06:28", "throughput": 2576.54, "total_tokens": 2716608} +{"current_steps": 5540, "total_steps": 7577, "loss": 0.0011, "lr": 4.0934848095938937e-07, "epoch": 0.7311600897452818, "percentage": 73.12, "elapsed_time": "0:17:34", "remaining_time": "0:06:27", "throughput": 2577.7, "total_tokens": 2718656} +{"current_steps": 5545, "total_steps": 7577, "loss": 0.097, "lr": 4.074912469886763e-07, "epoch": 0.7318199815230302, "percentage": 73.18, "elapsed_time": "0:17:35", "remaining_time": "0:06:26", "throughput": 2579.27, "total_tokens": 2721152} +{"current_steps": 5550, "total_steps": 7577, "loss": 0.0014, "lr": 4.0563715709335657e-07, "epoch": 0.7324798733007787, "percentage": 73.25, "elapsed_time": "0:17:35", "remaining_time": "0:06:25", "throughput": 2580.48, "total_tokens": 2723264} +{"current_steps": 5555, "total_steps": 7577, "loss": 0.198, "lr": 4.037862211119315e-07, "epoch": 0.7331397650785271, "percentage": 73.31, "elapsed_time": "0:17:35", "remaining_time": "0:06:24", "throughput": 2581.87, "total_tokens": 2725568} +{"current_steps": 5560, "total_steps": 7577, "loss": 0.0634, "lr": 4.0193844886616715e-07, "epoch": 0.7337996568562756, "percentage": 73.38, "elapsed_time": "0:17:35", "remaining_time": "0:06:23", "throughput": 2583.55, "total_tokens": 2728192} +{"current_steps": 5565, "total_steps": 7577, "loss": 0.2335, "lr": 4.0009385016104137e-07, "epoch": 0.7344595486340241, "percentage": 73.45, "elapsed_time": "0:17:36", "remaining_time": "0:06:21", "throughput": 2585.43, "total_tokens": 2731072} +{"current_steps": 5570, "total_steps": 7577, "loss": 0.0761, "lr": 3.9825243478469164e-07, "epoch": 0.7351194404117725, "percentage": 73.51, "elapsed_time": "0:17:36", "remaining_time": "0:06:20", "throughput": 2586.85, "total_tokens": 2733440} +{"current_steps": 5575, "total_steps": 7577, "loss": 0.0718, "lr": 3.9641421250836484e-07, "epoch": 0.735779332189521, "percentage": 73.58, "elapsed_time": "0:17:36", "remaining_time": "0:06:19", "throughput": 2588.53, "total_tokens": 2736064} +{"current_steps": 5580, "total_steps": 7577, "loss": 0.0312, "lr": 3.945791930863622e-07, "epoch": 0.7364392239672694, "percentage": 73.64, "elapsed_time": "0:17:37", "remaining_time": "0:06:18", "throughput": 2590.03, "total_tokens": 2738496} +{"current_steps": 5585, "total_steps": 7577, "loss": 0.0019, "lr": 3.9274738625599137e-07, "epoch": 0.7370991157450179, "percentage": 73.71, "elapsed_time": "0:17:37", "remaining_time": "0:06:17", "throughput": 2591.42, "total_tokens": 2740800} +{"current_steps": 5590, "total_steps": 7577, "loss": 0.0637, "lr": 3.909188017375112e-07, "epoch": 0.7377590075227662, "percentage": 73.78, "elapsed_time": "0:17:37", "remaining_time": "0:06:16", "throughput": 2592.8, "total_tokens": 2743104} +{"current_steps": 5595, "total_steps": 7577, "loss": 0.137, "lr": 3.890934492340819e-07, "epoch": 0.7384188993005147, "percentage": 73.84, "elapsed_time": "0:17:38", "remaining_time": "0:06:14", "throughput": 2594.13, "total_tokens": 2745344} +{"current_steps": 5600, "total_steps": 7577, "loss": 0.0649, "lr": 3.872713384317147e-07, "epoch": 0.7390787910782631, "percentage": 73.91, "elapsed_time": "0:17:38", "remaining_time": "0:06:13", "throughput": 2595.4, "total_tokens": 2747520} +{"current_steps": 5605, "total_steps": 7577, "loss": 0.1226, "lr": 3.8545247899921776e-07, "epoch": 0.7397386828560116, "percentage": 73.97, "elapsed_time": "0:17:38", "remaining_time": "0:06:12", "throughput": 2596.96, "total_tokens": 2750016} +{"current_steps": 5610, "total_steps": 7577, "loss": 0.123, "lr": 3.8363688058814614e-07, "epoch": 0.74039857463376, "percentage": 74.04, "elapsed_time": "0:17:39", "remaining_time": "0:06:11", "throughput": 2598.68, "total_tokens": 2752704} +{"current_steps": 5615, "total_steps": 7577, "loss": 0.1293, "lr": 3.818245528327526e-07, "epoch": 0.7410584664115085, "percentage": 74.11, "elapsed_time": "0:17:39", "remaining_time": "0:06:10", "throughput": 2600.34, "total_tokens": 2755328} +{"current_steps": 5620, "total_steps": 7577, "loss": 0.0808, "lr": 3.8001550534993164e-07, "epoch": 0.7417183581892569, "percentage": 74.17, "elapsed_time": "0:17:39", "remaining_time": "0:06:09", "throughput": 2601.72, "total_tokens": 2757632} +{"current_steps": 5625, "total_steps": 7577, "loss": 0.0508, "lr": 3.7820974773917413e-07, "epoch": 0.7423782499670054, "percentage": 74.24, "elapsed_time": "0:17:40", "remaining_time": "0:06:07", "throughput": 2603.33, "total_tokens": 2760192} +{"current_steps": 5630, "total_steps": 7577, "loss": 0.0011, "lr": 3.764072895825117e-07, "epoch": 0.7430381417447539, "percentage": 74.3, "elapsed_time": "0:17:40", "remaining_time": "0:06:06", "throughput": 2604.99, "total_tokens": 2762816} +{"current_steps": 5635, "total_steps": 7577, "loss": 0.0735, "lr": 3.7460814044446934e-07, "epoch": 0.7436980335225023, "percentage": 74.37, "elapsed_time": "0:17:40", "remaining_time": "0:06:05", "throughput": 2606.37, "total_tokens": 2765120} +{"current_steps": 5640, "total_steps": 7577, "loss": 0.1235, "lr": 3.72812309872012e-07, "epoch": 0.7443579253002508, "percentage": 74.44, "elapsed_time": "0:17:41", "remaining_time": "0:06:04", "throughput": 2608.08, "total_tokens": 2767808} +{"current_steps": 5645, "total_steps": 7577, "loss": 0.0109, "lr": 3.71019807394495e-07, "epoch": 0.7450178170779992, "percentage": 74.5, "elapsed_time": "0:17:41", "remaining_time": "0:06:03", "throughput": 2609.51, "total_tokens": 2770176} +{"current_steps": 5650, "total_steps": 7577, "loss": 0.1873, "lr": 3.6923064252361505e-07, "epoch": 0.7456777088557477, "percentage": 74.57, "elapsed_time": "0:17:41", "remaining_time": "0:06:02", "throughput": 2611.06, "total_tokens": 2772672} +{"current_steps": 5655, "total_steps": 7577, "loss": 0.1134, "lr": 3.674448247533561e-07, "epoch": 0.7463376006334961, "percentage": 74.63, "elapsed_time": "0:17:42", "remaining_time": "0:06:01", "throughput": 2612.56, "total_tokens": 2775104} +{"current_steps": 5660, "total_steps": 7577, "loss": 0.2252, "lr": 3.656623635599432e-07, "epoch": 0.7469974924112446, "percentage": 74.7, "elapsed_time": "0:17:42", "remaining_time": "0:05:59", "throughput": 2614.27, "total_tokens": 2777792} +{"current_steps": 5665, "total_steps": 7577, "loss": 0.1396, "lr": 3.6388326840178865e-07, "epoch": 0.747657384188993, "percentage": 74.77, "elapsed_time": "0:17:42", "remaining_time": "0:05:58", "throughput": 2615.93, "total_tokens": 2780416} +{"current_steps": 5670, "total_steps": 7577, "loss": 0.0013, "lr": 3.621075487194435e-07, "epoch": 0.7483172759667415, "percentage": 74.83, "elapsed_time": "0:17:43", "remaining_time": "0:05:57", "throughput": 2617.76, "total_tokens": 2783232} +{"current_steps": 5675, "total_steps": 7577, "loss": 0.1226, "lr": 3.603352139355483e-07, "epoch": 0.7489771677444899, "percentage": 74.9, "elapsed_time": "0:17:43", "remaining_time": "0:05:56", "throughput": 2619.25, "total_tokens": 2785664} +{"current_steps": 5680, "total_steps": 7577, "loss": 0.0986, "lr": 3.58566273454781e-07, "epoch": 0.7496370595222384, "percentage": 74.96, "elapsed_time": "0:17:43", "remaining_time": "0:05:55", "throughput": 2620.84, "total_tokens": 2788224} +{"current_steps": 5685, "total_steps": 7577, "loss": 0.0314, "lr": 3.5680073666380817e-07, "epoch": 0.7502969512999867, "percentage": 75.03, "elapsed_time": "0:17:44", "remaining_time": "0:05:54", "throughput": 2622.33, "total_tokens": 2790656} +{"current_steps": 5685, "total_steps": 7577, "eval_loss": 0.10055803507566452, "epoch": 0.7502969512999867, "percentage": 75.03, "elapsed_time": "0:17:52", "remaining_time": "0:05:56", "throughput": 2603.19, "total_tokens": 2790656} +{"current_steps": 5690, "total_steps": 7577, "loss": 0.1421, "lr": 3.5503861293123514e-07, "epoch": 0.7509568430777352, "percentage": 75.1, "elapsed_time": "0:18:54", "remaining_time": "0:06:16", "throughput": 2461.44, "total_tokens": 2792960} +{"current_steps": 5695, "total_steps": 7577, "loss": 0.092, "lr": 3.532799116075571e-07, "epoch": 0.7516167348554837, "percentage": 75.16, "elapsed_time": "0:18:55", "remaining_time": "0:06:15", "throughput": 2463.05, "total_tokens": 2795648} +{"current_steps": 5700, "total_steps": 7577, "loss": 0.104, "lr": 3.5152464202510777e-07, "epoch": 0.7522766266332321, "percentage": 75.23, "elapsed_time": "0:18:55", "remaining_time": "0:06:13", "throughput": 2464.13, "total_tokens": 2797696} +{"current_steps": 5705, "total_steps": 7577, "loss": 0.1443, "lr": 3.4977281349801056e-07, "epoch": 0.7529365184109806, "percentage": 75.29, "elapsed_time": "0:18:55", "remaining_time": "0:06:12", "throughput": 2465.61, "total_tokens": 2800192} +{"current_steps": 5710, "total_steps": 7577, "loss": 0.0584, "lr": 3.4802443532213056e-07, "epoch": 0.753596410188729, "percentage": 75.36, "elapsed_time": "0:18:56", "remaining_time": "0:06:11", "throughput": 2466.37, "total_tokens": 2802560} +{"current_steps": 5715, "total_steps": 7577, "loss": 0.2492, "lr": 3.4627951677502233e-07, "epoch": 0.7542563019664775, "percentage": 75.43, "elapsed_time": "0:18:56", "remaining_time": "0:06:10", "throughput": 2467.79, "total_tokens": 2804992} +{"current_steps": 5720, "total_steps": 7577, "loss": 0.0061, "lr": 3.4453806711588397e-07, "epoch": 0.7549161937442259, "percentage": 75.49, "elapsed_time": "0:18:56", "remaining_time": "0:06:09", "throughput": 2469.11, "total_tokens": 2807296} +{"current_steps": 5725, "total_steps": 7577, "loss": 0.0309, "lr": 3.428000955855054e-07, "epoch": 0.7555760855219744, "percentage": 75.56, "elapsed_time": "0:18:57", "remaining_time": "0:06:07", "throughput": 2470.75, "total_tokens": 2809984} +{"current_steps": 5730, "total_steps": 7577, "loss": 0.0018, "lr": 3.4106561140621983e-07, "epoch": 0.7562359772997228, "percentage": 75.62, "elapsed_time": "0:18:57", "remaining_time": "0:06:06", "throughput": 2472.44, "total_tokens": 2812736} +{"current_steps": 5735, "total_steps": 7577, "loss": 0.173, "lr": 3.393346237818567e-07, "epoch": 0.7568958690774713, "percentage": 75.69, "elapsed_time": "0:18:57", "remaining_time": "0:06:05", "throughput": 2473.75, "total_tokens": 2815040} +{"current_steps": 5740, "total_steps": 7577, "loss": 0.1591, "lr": 3.3760714189769015e-07, "epoch": 0.7575557608552197, "percentage": 75.76, "elapsed_time": "0:18:58", "remaining_time": "0:06:04", "throughput": 2475.06, "total_tokens": 2817344} +{"current_steps": 5745, "total_steps": 7577, "loss": 0.024, "lr": 3.3588317492039266e-07, "epoch": 0.7582156526329682, "percentage": 75.82, "elapsed_time": "0:18:58", "remaining_time": "0:06:03", "throughput": 2476.36, "total_tokens": 2819648} +{"current_steps": 5750, "total_steps": 7577, "loss": 0.1302, "lr": 3.341627319979834e-07, "epoch": 0.7588755444107167, "percentage": 75.89, "elapsed_time": "0:18:58", "remaining_time": "0:06:01", "throughput": 2478.09, "total_tokens": 2822464} +{"current_steps": 5755, "total_steps": 7577, "loss": 0.2033, "lr": 3.324458222597839e-07, "epoch": 0.7595354361884651, "percentage": 75.95, "elapsed_time": "0:18:59", "remaining_time": "0:06:00", "throughput": 2479.5, "total_tokens": 2824896} +{"current_steps": 5760, "total_steps": 7577, "loss": 0.0718, "lr": 3.307324548163657e-07, "epoch": 0.7601953279662136, "percentage": 76.02, "elapsed_time": "0:18:59", "remaining_time": "0:05:59", "throughput": 2481.19, "total_tokens": 2827648} +{"current_steps": 5765, "total_steps": 7577, "loss": 0.0575, "lr": 3.2902263875950374e-07, "epoch": 0.760855219743962, "percentage": 76.09, "elapsed_time": "0:18:59", "remaining_time": "0:05:58", "throughput": 2482.82, "total_tokens": 2830336} +{"current_steps": 5770, "total_steps": 7577, "loss": 0.0498, "lr": 3.2731638316212894e-07, "epoch": 0.7615151115217105, "percentage": 76.15, "elapsed_time": "0:19:00", "remaining_time": "0:05:57", "throughput": 2484.14, "total_tokens": 2832640} +{"current_steps": 5775, "total_steps": 7577, "loss": 0.086, "lr": 3.256136970782782e-07, "epoch": 0.7621750032994589, "percentage": 76.22, "elapsed_time": "0:19:00", "remaining_time": "0:05:55", "throughput": 2485.4, "total_tokens": 2834880} +{"current_steps": 5780, "total_steps": 7577, "loss": 0.1474, "lr": 3.23914589543047e-07, "epoch": 0.7628348950772074, "percentage": 76.28, "elapsed_time": "0:19:00", "remaining_time": "0:05:54", "throughput": 2486.91, "total_tokens": 2837440} +{"current_steps": 5785, "total_steps": 7577, "loss": 0.0621, "lr": 3.2221906957254276e-07, "epoch": 0.7634947868549558, "percentage": 76.35, "elapsed_time": "0:19:01", "remaining_time": "0:05:53", "throughput": 2488.27, "total_tokens": 2839808} +{"current_steps": 5790, "total_steps": 7577, "loss": 0.1094, "lr": 3.205271461638346e-07, "epoch": 0.7641546786327043, "percentage": 76.42, "elapsed_time": "0:19:01", "remaining_time": "0:05:52", "throughput": 2489.85, "total_tokens": 2842432} +{"current_steps": 5795, "total_steps": 7577, "loss": 0.1338, "lr": 3.188388282949085e-07, "epoch": 0.7648145704104526, "percentage": 76.48, "elapsed_time": "0:19:01", "remaining_time": "0:05:51", "throughput": 2491.49, "total_tokens": 2845120} +{"current_steps": 5800, "total_steps": 7577, "loss": 0.1247, "lr": 3.171541249246166e-07, "epoch": 0.7654744621882011, "percentage": 76.55, "elapsed_time": "0:19:02", "remaining_time": "0:05:49", "throughput": 2493.27, "total_tokens": 2848000} +{"current_steps": 5805, "total_steps": 7577, "loss": 0.1788, "lr": 3.154730449926316e-07, "epoch": 0.7661343539659495, "percentage": 76.61, "elapsed_time": "0:19:02", "remaining_time": "0:05:48", "throughput": 2494.84, "total_tokens": 2850624} +{"current_steps": 5810, "total_steps": 7577, "loss": 0.1394, "lr": 3.137955974194e-07, "epoch": 0.766794245743698, "percentage": 76.68, "elapsed_time": "0:19:02", "remaining_time": "0:05:47", "throughput": 2496.19, "total_tokens": 2852992} +{"current_steps": 5815, "total_steps": 7577, "loss": 0.0413, "lr": 3.1212179110609125e-07, "epoch": 0.7674541375214465, "percentage": 76.75, "elapsed_time": "0:19:03", "remaining_time": "0:05:46", "throughput": 2497.59, "total_tokens": 2855424} +{"current_steps": 5820, "total_steps": 7577, "loss": 0.1604, "lr": 3.104516349345553e-07, "epoch": 0.7681140292991949, "percentage": 76.81, "elapsed_time": "0:19:03", "remaining_time": "0:05:45", "throughput": 2499.1, "total_tokens": 2857984} +{"current_steps": 5825, "total_steps": 7577, "loss": 0.0702, "lr": 3.0878513776727144e-07, "epoch": 0.7687739210769434, "percentage": 76.88, "elapsed_time": "0:19:03", "remaining_time": "0:05:44", "throughput": 2500.72, "total_tokens": 2860672} +{"current_steps": 5830, "total_steps": 7577, "loss": 0.1228, "lr": 3.0712230844730414e-07, "epoch": 0.7694338128546918, "percentage": 76.94, "elapsed_time": "0:19:04", "remaining_time": "0:05:42", "throughput": 2502.07, "total_tokens": 2863040} +{"current_steps": 5835, "total_steps": 7577, "loss": 0.1412, "lr": 3.054631557982539e-07, "epoch": 0.7700937046324403, "percentage": 77.01, "elapsed_time": "0:19:04", "remaining_time": "0:05:41", "throughput": 2503.81, "total_tokens": 2865856} +{"current_steps": 5840, "total_steps": 7577, "loss": 0.108, "lr": 3.0380768862421156e-07, "epoch": 0.7707535964101887, "percentage": 77.08, "elapsed_time": "0:19:04", "remaining_time": "0:05:40", "throughput": 2505.05, "total_tokens": 2868096} +{"current_steps": 5845, "total_steps": 7577, "loss": 0.001, "lr": 3.0215591570971234e-07, "epoch": 0.7714134881879372, "percentage": 77.14, "elapsed_time": "0:19:05", "remaining_time": "0:05:39", "throughput": 2506.67, "total_tokens": 2870784} +{"current_steps": 5850, "total_steps": 7577, "loss": 0.0313, "lr": 3.005078458196868e-07, "epoch": 0.7720733799656856, "percentage": 77.21, "elapsed_time": "0:19:05", "remaining_time": "0:05:38", "throughput": 2508.07, "total_tokens": 2873216} +{"current_steps": 5855, "total_steps": 7577, "loss": 0.0011, "lr": 2.988634876994175e-07, "epoch": 0.7727332717434341, "percentage": 77.27, "elapsed_time": "0:19:05", "remaining_time": "0:05:37", "throughput": 2509.58, "total_tokens": 2875776} +{"current_steps": 5860, "total_steps": 7577, "loss": 0.0322, "lr": 2.972228500744898e-07, "epoch": 0.7733931635211825, "percentage": 77.34, "elapsed_time": "0:19:06", "remaining_time": "0:05:35", "throughput": 2511.09, "total_tokens": 2878336} +{"current_steps": 5865, "total_steps": 7577, "loss": 0.1583, "lr": 2.955859416507467e-07, "epoch": 0.774053055298931, "percentage": 77.41, "elapsed_time": "0:19:06", "remaining_time": "0:05:34", "throughput": 2512.6, "total_tokens": 2880896} +{"current_steps": 5870, "total_steps": 7577, "loss": 0.0666, "lr": 2.9395277111424357e-07, "epoch": 0.7747129470766794, "percentage": 77.47, "elapsed_time": "0:19:06", "remaining_time": "0:05:33", "throughput": 2514.25, "total_tokens": 2883648} +{"current_steps": 5875, "total_steps": 7577, "loss": 0.0659, "lr": 2.9232334713120035e-07, "epoch": 0.7753728388544279, "percentage": 77.54, "elapsed_time": "0:19:07", "remaining_time": "0:05:32", "throughput": 2515.53, "total_tokens": 2885952} +{"current_steps": 5880, "total_steps": 7577, "loss": 0.0666, "lr": 2.9069767834795655e-07, "epoch": 0.7760327306321764, "percentage": 77.6, "elapsed_time": "0:19:07", "remaining_time": "0:05:31", "throughput": 2517.07, "total_tokens": 2888576} +{"current_steps": 5885, "total_steps": 7577, "loss": 0.139, "lr": 2.8907577339092483e-07, "epoch": 0.7766926224099248, "percentage": 77.67, "elapsed_time": "0:19:07", "remaining_time": "0:05:30", "throughput": 2518.57, "total_tokens": 2891136} +{"current_steps": 5890, "total_steps": 7577, "loss": 0.0791, "lr": 2.8745764086654654e-07, "epoch": 0.7773525141876733, "percentage": 77.74, "elapsed_time": "0:19:08", "remaining_time": "0:05:28", "throughput": 2520.07, "total_tokens": 2893696} +{"current_steps": 5895, "total_steps": 7577, "loss": 0.0014, "lr": 2.8584328936124424e-07, "epoch": 0.7780124059654216, "percentage": 77.8, "elapsed_time": "0:19:08", "remaining_time": "0:05:27", "throughput": 2521.78, "total_tokens": 2896512} +{"current_steps": 5900, "total_steps": 7577, "loss": 0.1734, "lr": 2.8423272744137674e-07, "epoch": 0.7786722977431701, "percentage": 77.87, "elapsed_time": "0:19:08", "remaining_time": "0:05:26", "throughput": 2523.22, "total_tokens": 2899008} +{"current_steps": 5905, "total_steps": 7577, "loss": 0.0576, "lr": 2.82625963653195e-07, "epoch": 0.7793321895209185, "percentage": 77.93, "elapsed_time": "0:19:09", "remaining_time": "0:05:25", "throughput": 2524.56, "total_tokens": 2901376} +{"current_steps": 5910, "total_steps": 7577, "loss": 0.192, "lr": 2.810230065227944e-07, "epoch": 0.779992081298667, "percentage": 78.0, "elapsed_time": "0:19:09", "remaining_time": "0:05:24", "throughput": 2525.99, "total_tokens": 2903872} +{"current_steps": 5915, "total_steps": 7577, "loss": 0.0012, "lr": 2.7942386455607203e-07, "epoch": 0.7806519730764154, "percentage": 78.07, "elapsed_time": "0:19:09", "remaining_time": "0:05:23", "throughput": 2527.32, "total_tokens": 2906240} +{"current_steps": 5920, "total_steps": 7577, "loss": 0.068, "lr": 2.77828546238679e-07, "epoch": 0.7813118648541639, "percentage": 78.13, "elapsed_time": "0:19:10", "remaining_time": "0:05:21", "throughput": 2528.77, "total_tokens": 2908736} +{"current_steps": 5925, "total_steps": 7577, "loss": 0.1235, "lr": 2.762370600359774e-07, "epoch": 0.7819717566319123, "percentage": 78.2, "elapsed_time": "0:19:10", "remaining_time": "0:05:20", "throughput": 2530.1, "total_tokens": 2911104} +{"current_steps": 5930, "total_steps": 7577, "loss": 0.0383, "lr": 2.7464941439299484e-07, "epoch": 0.7826316484096608, "percentage": 78.26, "elapsed_time": "0:19:10", "remaining_time": "0:05:19", "throughput": 2531.42, "total_tokens": 2913472} +{"current_steps": 5935, "total_steps": 7577, "loss": 0.1809, "lr": 2.7306561773437887e-07, "epoch": 0.7832915401874093, "percentage": 78.33, "elapsed_time": "0:19:11", "remaining_time": "0:05:18", "throughput": 2532.74, "total_tokens": 2915840} +{"current_steps": 5940, "total_steps": 7577, "loss": 0.0033, "lr": 2.714856784643533e-07, "epoch": 0.7839514319651577, "percentage": 78.4, "elapsed_time": "0:19:11", "remaining_time": "0:05:17", "throughput": 2534.02, "total_tokens": 2918144} +{"current_steps": 5945, "total_steps": 7577, "loss": 0.1415, "lr": 2.6990960496667313e-07, "epoch": 0.7846113237429062, "percentage": 78.46, "elapsed_time": "0:19:11", "remaining_time": "0:05:16", "throughput": 2535.56, "total_tokens": 2920768} +{"current_steps": 5950, "total_steps": 7577, "loss": 0.0698, "lr": 2.6833740560457976e-07, "epoch": 0.7852712155206546, "percentage": 78.53, "elapsed_time": "0:19:12", "remaining_time": "0:05:15", "throughput": 2536.89, "total_tokens": 2923136} +{"current_steps": 5955, "total_steps": 7577, "loss": 0.0759, "lr": 2.6676908872075757e-07, "epoch": 0.7859311072984031, "percentage": 78.59, "elapsed_time": "0:19:12", "remaining_time": "0:05:13", "throughput": 2538.27, "total_tokens": 2925568} +{"current_steps": 5960, "total_steps": 7577, "loss": 0.0742, "lr": 2.6520466263728836e-07, "epoch": 0.7865909990761515, "percentage": 78.66, "elapsed_time": "0:19:12", "remaining_time": "0:05:12", "throughput": 2539.71, "total_tokens": 2928064} +{"current_steps": 5965, "total_steps": 7577, "loss": 0.2564, "lr": 2.636441356556087e-07, "epoch": 0.7872508908539, "percentage": 78.73, "elapsed_time": "0:19:13", "remaining_time": "0:05:11", "throughput": 2540.99, "total_tokens": 2930368} +{"current_steps": 5970, "total_steps": 7577, "loss": 0.1123, "lr": 2.620875160564645e-07, "epoch": 0.7879107826316484, "percentage": 78.79, "elapsed_time": "0:19:13", "remaining_time": "0:05:10", "throughput": 2542.47, "total_tokens": 2932928} +{"current_steps": 5975, "total_steps": 7577, "loss": 0.3593, "lr": 2.6053481209986715e-07, "epoch": 0.7885706744093969, "percentage": 78.86, "elapsed_time": "0:19:13", "remaining_time": "0:05:09", "throughput": 2543.85, "total_tokens": 2935360} +{"current_steps": 5980, "total_steps": 7577, "loss": 0.059, "lr": 2.5898603202505155e-07, "epoch": 0.7892305661871453, "percentage": 78.92, "elapsed_time": "0:19:14", "remaining_time": "0:05:08", "throughput": 2545.32, "total_tokens": 2937920} +{"current_steps": 5985, "total_steps": 7577, "loss": 0.0823, "lr": 2.5744118405042923e-07, "epoch": 0.7898904579648938, "percentage": 78.99, "elapsed_time": "0:19:14", "remaining_time": "0:05:07", "throughput": 2546.59, "total_tokens": 2940224} +{"current_steps": 5990, "total_steps": 7577, "loss": 0.0012, "lr": 2.559002763735485e-07, "epoch": 0.7905503497426422, "percentage": 79.06, "elapsed_time": "0:19:14", "remaining_time": "0:05:05", "throughput": 2548.12, "total_tokens": 2942848} +{"current_steps": 5995, "total_steps": 7577, "loss": 0.0604, "lr": 2.543633171710472e-07, "epoch": 0.7912102415203907, "percentage": 79.12, "elapsed_time": "0:19:15", "remaining_time": "0:05:04", "throughput": 2549.56, "total_tokens": 2945344} +{"current_steps": 6000, "total_steps": 7577, "loss": 0.008, "lr": 2.5283031459861205e-07, "epoch": 0.7918701332981392, "percentage": 79.19, "elapsed_time": "0:19:15", "remaining_time": "0:05:03", "throughput": 2550.99, "total_tokens": 2947840} +{"current_steps": 6005, "total_steps": 7577, "loss": 0.0374, "lr": 2.5130127679093396e-07, "epoch": 0.7925300250758875, "percentage": 79.25, "elapsed_time": "0:19:15", "remaining_time": "0:05:02", "throughput": 2552.26, "total_tokens": 2950144} +{"current_steps": 6010, "total_steps": 7577, "loss": 0.0336, "lr": 2.497762118616652e-07, "epoch": 0.793189916853636, "percentage": 79.32, "elapsed_time": "0:19:16", "remaining_time": "0:05:01", "throughput": 2553.48, "total_tokens": 2952384} +{"current_steps": 6015, "total_steps": 7577, "loss": 0.071, "lr": 2.4825512790337745e-07, "epoch": 0.7938498086313844, "percentage": 79.38, "elapsed_time": "0:19:16", "remaining_time": "0:05:00", "throughput": 2555.12, "total_tokens": 2955136} +{"current_steps": 6020, "total_steps": 7577, "loss": 0.0369, "lr": 2.467380329875163e-07, "epoch": 0.7945097004091329, "percentage": 79.45, "elapsed_time": "0:19:16", "remaining_time": "0:04:59", "throughput": 2556.7, "total_tokens": 2957824} +{"current_steps": 6025, "total_steps": 7577, "loss": 0.0014, "lr": 2.452249351643615e-07, "epoch": 0.7951695921868813, "percentage": 79.52, "elapsed_time": "0:19:17", "remaining_time": "0:04:58", "throughput": 2558.08, "total_tokens": 2960256} +{"current_steps": 6030, "total_steps": 7577, "loss": 0.1182, "lr": 2.437158424629817e-07, "epoch": 0.7958294839646298, "percentage": 79.58, "elapsed_time": "0:19:17", "remaining_time": "0:04:56", "throughput": 2559.67, "total_tokens": 2962944} +{"current_steps": 6035, "total_steps": 7577, "loss": 0.2256, "lr": 2.422107628911929e-07, "epoch": 0.7964893757423782, "percentage": 79.65, "elapsed_time": "0:19:17", "remaining_time": "0:04:55", "throughput": 2561.15, "total_tokens": 2965504} +{"current_steps": 6040, "total_steps": 7577, "loss": 0.274, "lr": 2.4070970443551673e-07, "epoch": 0.7971492675201267, "percentage": 79.71, "elapsed_time": "0:19:18", "remaining_time": "0:04:54", "throughput": 2562.37, "total_tokens": 2967744} +{"current_steps": 6045, "total_steps": 7577, "loss": 0.0032, "lr": 2.392126750611362e-07, "epoch": 0.7978091592978751, "percentage": 79.78, "elapsed_time": "0:19:18", "remaining_time": "0:04:53", "throughput": 2563.79, "total_tokens": 2970240} +{"current_steps": 6050, "total_steps": 7577, "loss": 0.1761, "lr": 2.3771968271185538e-07, "epoch": 0.7984690510756236, "percentage": 79.85, "elapsed_time": "0:19:18", "remaining_time": "0:04:52", "throughput": 2565.35, "total_tokens": 2972928} +{"current_steps": 6055, "total_steps": 7577, "loss": 0.1485, "lr": 2.3623073531005579e-07, "epoch": 0.799128942853372, "percentage": 79.91, "elapsed_time": "0:19:19", "remaining_time": "0:04:51", "throughput": 2566.56, "total_tokens": 2975168} +{"current_steps": 6060, "total_steps": 7577, "loss": 0.1396, "lr": 2.3474584075665493e-07, "epoch": 0.7997888346311205, "percentage": 79.98, "elapsed_time": "0:19:19", "remaining_time": "0:04:50", "throughput": 2567.76, "total_tokens": 2977408} +{"current_steps": 6064, "total_steps": 7577, "eval_loss": 0.09634685516357422, "epoch": 0.8003167480533192, "percentage": 80.03, "elapsed_time": "0:19:27", "remaining_time": "0:04:51", "throughput": 2551.28, "total_tokens": 2979456} +{"current_steps": 6065, "total_steps": 7577, "loss": 0.0051, "lr": 2.3326500693106533e-07, "epoch": 0.800448726408869, "percentage": 80.04, "elapsed_time": "0:20:12", "remaining_time": "0:05:02", "throughput": 2458.32, "total_tokens": 2979968} +{"current_steps": 6070, "total_steps": 7577, "loss": 0.2232, "lr": 2.3178824169114975e-07, "epoch": 0.8011086181866174, "percentage": 80.11, "elapsed_time": "0:20:12", "remaining_time": "0:05:01", "throughput": 2459.76, "total_tokens": 2982528} +{"current_steps": 6075, "total_steps": 7577, "loss": 0.0557, "lr": 2.303155528731837e-07, "epoch": 0.8017685099643659, "percentage": 80.18, "elapsed_time": "0:20:12", "remaining_time": "0:04:59", "throughput": 2461.0, "total_tokens": 2984832} +{"current_steps": 6080, "total_steps": 7577, "loss": 0.0009, "lr": 2.2884694829181016e-07, "epoch": 0.8024284017421143, "percentage": 80.24, "elapsed_time": "0:20:13", "remaining_time": "0:04:58", "throughput": 2462.39, "total_tokens": 2987328} +{"current_steps": 6085, "total_steps": 7577, "loss": 0.0703, "lr": 2.273824357400005e-07, "epoch": 0.8030882935198628, "percentage": 80.31, "elapsed_time": "0:20:13", "remaining_time": "0:04:57", "throughput": 2463.72, "total_tokens": 2989760} +{"current_steps": 6090, "total_steps": 7577, "loss": 0.0457, "lr": 2.2592202298901174e-07, "epoch": 0.8037481852976112, "percentage": 80.37, "elapsed_time": "0:20:13", "remaining_time": "0:04:56", "throughput": 2465.16, "total_tokens": 2992320} +{"current_steps": 6095, "total_steps": 7577, "loss": 0.0022, "lr": 2.2446571778834555e-07, "epoch": 0.8044080770753597, "percentage": 80.44, "elapsed_time": "0:20:14", "remaining_time": "0:04:55", "throughput": 2466.8, "total_tokens": 2995136} +{"current_steps": 6100, "total_steps": 7577, "loss": 0.0008, "lr": 2.2301352786570827e-07, "epoch": 0.805067968853108, "percentage": 80.51, "elapsed_time": "0:20:14", "remaining_time": "0:04:54", "throughput": 2468.48, "total_tokens": 2998016} +{"current_steps": 6105, "total_steps": 7577, "loss": 0.1533, "lr": 2.215654609269685e-07, "epoch": 0.8057278606308566, "percentage": 80.57, "elapsed_time": "0:20:14", "remaining_time": "0:04:52", "throughput": 2470.12, "total_tokens": 3000832} +{"current_steps": 6110, "total_steps": 7577, "loss": 0.1716, "lr": 2.201215246561161e-07, "epoch": 0.8063877524086049, "percentage": 80.64, "elapsed_time": "0:20:15", "remaining_time": "0:04:51", "throughput": 2471.71, "total_tokens": 3003584} +{"current_steps": 6115, "total_steps": 7577, "loss": 0.0731, "lr": 2.1868172671522357e-07, "epoch": 0.8070476441863534, "percentage": 80.7, "elapsed_time": "0:20:15", "remaining_time": "0:04:50", "throughput": 2473.39, "total_tokens": 3006464} +{"current_steps": 6120, "total_steps": 7577, "loss": 0.107, "lr": 2.1724607474440216e-07, "epoch": 0.8077075359641019, "percentage": 80.77, "elapsed_time": "0:20:15", "remaining_time": "0:04:49", "throughput": 2474.73, "total_tokens": 3008896} +{"current_steps": 6125, "total_steps": 7577, "loss": 0.1277, "lr": 2.158145763617646e-07, "epoch": 0.8083674277418503, "percentage": 80.84, "elapsed_time": "0:20:16", "remaining_time": "0:04:48", "throughput": 2476.11, "total_tokens": 3011392} +{"current_steps": 6130, "total_steps": 7577, "loss": 0.2135, "lr": 2.1438723916338198e-07, "epoch": 0.8090273195195988, "percentage": 80.9, "elapsed_time": "0:20:16", "remaining_time": "0:04:47", "throughput": 2477.59, "total_tokens": 3014016} +{"current_steps": 6135, "total_steps": 7577, "loss": 0.1745, "lr": 2.1296407072324495e-07, "epoch": 0.8096872112973472, "percentage": 80.97, "elapsed_time": "0:20:16", "remaining_time": "0:04:46", "throughput": 2479.03, "total_tokens": 3016576} +{"current_steps": 6140, "total_steps": 7577, "loss": 0.0661, "lr": 2.1154507859322336e-07, "epoch": 0.8103471030750957, "percentage": 81.03, "elapsed_time": "0:20:17", "remaining_time": "0:04:44", "throughput": 2480.36, "total_tokens": 3019008} +{"current_steps": 6145, "total_steps": 7577, "loss": 0.1033, "lr": 2.101302703030252e-07, "epoch": 0.8110069948528441, "percentage": 81.1, "elapsed_time": "0:20:17", "remaining_time": "0:04:43", "throughput": 2481.74, "total_tokens": 3021504} +{"current_steps": 6150, "total_steps": 7577, "loss": 0.0688, "lr": 2.0871965336015885e-07, "epoch": 0.8116668866305926, "percentage": 81.17, "elapsed_time": "0:20:17", "remaining_time": "0:04:42", "throughput": 2482.77, "total_tokens": 3023552} +{"current_steps": 6155, "total_steps": 7577, "loss": 0.0896, "lr": 2.0731323524989031e-07, "epoch": 0.812326778408341, "percentage": 81.23, "elapsed_time": "0:20:18", "remaining_time": "0:04:41", "throughput": 2484.0, "total_tokens": 3025856} +{"current_steps": 6160, "total_steps": 7577, "loss": 0.1915, "lr": 2.0591102343520616e-07, "epoch": 0.8129866701860895, "percentage": 81.3, "elapsed_time": "0:20:18", "remaining_time": "0:04:40", "throughput": 2485.18, "total_tokens": 3028096} +{"current_steps": 6165, "total_steps": 7577, "loss": 0.1774, "lr": 2.0451302535677206e-07, "epoch": 0.8136465619638379, "percentage": 81.36, "elapsed_time": "0:20:18", "remaining_time": "0:04:39", "throughput": 2486.49, "total_tokens": 3030528} +{"current_steps": 6170, "total_steps": 7577, "loss": 0.129, "lr": 2.0311924843289396e-07, "epoch": 0.8143064537415864, "percentage": 81.43, "elapsed_time": "0:20:19", "remaining_time": "0:04:38", "throughput": 2487.9, "total_tokens": 3033088} +{"current_steps": 6175, "total_steps": 7577, "loss": 0.0907, "lr": 2.017297000594794e-07, "epoch": 0.8149663455193348, "percentage": 81.5, "elapsed_time": "0:20:19", "remaining_time": "0:04:36", "throughput": 2488.97, "total_tokens": 3035200} +{"current_steps": 6180, "total_steps": 7577, "loss": 0.048, "lr": 2.0034438760999696e-07, "epoch": 0.8156262372970833, "percentage": 81.56, "elapsed_time": "0:20:19", "remaining_time": "0:04:35", "throughput": 2490.33, "total_tokens": 3037696} +{"current_steps": 6185, "total_steps": 7577, "loss": 0.1593, "lr": 1.9896331843543856e-07, "epoch": 0.8162861290748318, "percentage": 81.63, "elapsed_time": "0:20:20", "remaining_time": "0:04:34", "throughput": 2491.65, "total_tokens": 3040128} +{"current_steps": 6190, "total_steps": 7577, "loss": 0.1511, "lr": 1.975864998642789e-07, "epoch": 0.8169460208525802, "percentage": 81.69, "elapsed_time": "0:20:20", "remaining_time": "0:04:33", "throughput": 2492.97, "total_tokens": 3042560} +{"current_steps": 6195, "total_steps": 7577, "loss": 0.2786, "lr": 1.9621393920243767e-07, "epoch": 0.8176059126303287, "percentage": 81.76, "elapsed_time": "0:20:20", "remaining_time": "0:04:32", "throughput": 2494.12, "total_tokens": 3044800} +{"current_steps": 6200, "total_steps": 7577, "loss": 0.062, "lr": 1.9484564373324074e-07, "epoch": 0.8182658044080771, "percentage": 81.83, "elapsed_time": "0:20:21", "remaining_time": "0:04:31", "throughput": 2495.28, "total_tokens": 3047040} +{"current_steps": 6205, "total_steps": 7577, "loss": 0.0633, "lr": 1.934816207173805e-07, "epoch": 0.8189256961858256, "percentage": 81.89, "elapsed_time": "0:20:21", "remaining_time": "0:04:30", "throughput": 2496.7, "total_tokens": 3049600} +{"current_steps": 6210, "total_steps": 7577, "loss": 0.1436, "lr": 1.9212187739287943e-07, "epoch": 0.819585587963574, "percentage": 81.96, "elapsed_time": "0:20:21", "remaining_time": "0:04:28", "throughput": 2498.3, "total_tokens": 3052416} +{"current_steps": 6215, "total_steps": 7577, "loss": 0.0028, "lr": 1.907664209750488e-07, "epoch": 0.8202454797413224, "percentage": 82.02, "elapsed_time": "0:20:22", "remaining_time": "0:04:27", "throughput": 2499.77, "total_tokens": 3055040} +{"current_steps": 6220, "total_steps": 7577, "loss": 0.0553, "lr": 1.8941525865645336e-07, "epoch": 0.8209053715190708, "percentage": 82.09, "elapsed_time": "0:20:22", "remaining_time": "0:04:26", "throughput": 2501.39, "total_tokens": 3057856} +{"current_steps": 6225, "total_steps": 7577, "loss": 0.209, "lr": 1.8806839760687076e-07, "epoch": 0.8215652632968193, "percentage": 82.16, "elapsed_time": "0:20:22", "remaining_time": "0:04:25", "throughput": 2502.61, "total_tokens": 3060160} +{"current_steps": 6230, "total_steps": 7577, "loss": 0.1147, "lr": 1.867258449732545e-07, "epoch": 0.8222251550745677, "percentage": 82.22, "elapsed_time": "0:20:23", "remaining_time": "0:04:24", "throughput": 2503.93, "total_tokens": 3062592} +{"current_steps": 6235, "total_steps": 7577, "loss": 0.0562, "lr": 1.8538760787969676e-07, "epoch": 0.8228850468523162, "percentage": 82.29, "elapsed_time": "0:20:23", "remaining_time": "0:04:23", "throughput": 2505.31, "total_tokens": 3065088} +{"current_steps": 6240, "total_steps": 7577, "loss": 0.0017, "lr": 1.8405369342738907e-07, "epoch": 0.8235449386300646, "percentage": 82.35, "elapsed_time": "0:20:23", "remaining_time": "0:04:22", "throughput": 2506.77, "total_tokens": 3067712} +{"current_steps": 6245, "total_steps": 7577, "loss": 0.0602, "lr": 1.8272410869458598e-07, "epoch": 0.8242048304078131, "percentage": 82.42, "elapsed_time": "0:20:24", "remaining_time": "0:04:21", "throughput": 2508.09, "total_tokens": 3070144} +{"current_steps": 6250, "total_steps": 7577, "loss": 0.2637, "lr": 1.8139886073656653e-07, "epoch": 0.8248647221855616, "percentage": 82.49, "elapsed_time": "0:20:24", "remaining_time": "0:04:19", "throughput": 2509.31, "total_tokens": 3072448} +{"current_steps": 6255, "total_steps": 7577, "loss": 0.2488, "lr": 1.800779565855971e-07, "epoch": 0.82552461396331, "percentage": 82.55, "elapsed_time": "0:20:24", "remaining_time": "0:04:18", "throughput": 2510.77, "total_tokens": 3075072} +{"current_steps": 6260, "total_steps": 7577, "loss": 0.0066, "lr": 1.7876140325089463e-07, "epoch": 0.8261845057410585, "percentage": 82.62, "elapsed_time": "0:20:25", "remaining_time": "0:04:17", "throughput": 2511.98, "total_tokens": 3077376} +{"current_steps": 6265, "total_steps": 7577, "loss": 0.1657, "lr": 1.774492077185883e-07, "epoch": 0.8268443975188069, "percentage": 82.68, "elapsed_time": "0:20:25", "remaining_time": "0:04:16", "throughput": 2513.29, "total_tokens": 3079808} +{"current_steps": 6270, "total_steps": 7577, "loss": 0.0009, "lr": 1.7614137695168408e-07, "epoch": 0.8275042892965554, "percentage": 82.75, "elapsed_time": "0:20:25", "remaining_time": "0:04:15", "throughput": 2514.85, "total_tokens": 3082560} +{"current_steps": 6275, "total_steps": 7577, "loss": 0.0715, "lr": 1.748379178900261e-07, "epoch": 0.8281641810743038, "percentage": 82.82, "elapsed_time": "0:20:26", "remaining_time": "0:04:14", "throughput": 2515.86, "total_tokens": 3084608} +{"current_steps": 6280, "total_steps": 7577, "loss": 0.229, "lr": 1.7353883745026055e-07, "epoch": 0.8288240728520523, "percentage": 82.88, "elapsed_time": "0:20:26", "remaining_time": "0:04:13", "throughput": 2517.22, "total_tokens": 3087104} +{"current_steps": 6285, "total_steps": 7577, "loss": 0.1264, "lr": 1.722441425257999e-07, "epoch": 0.8294839646298007, "percentage": 82.95, "elapsed_time": "0:20:26", "remaining_time": "0:04:12", "throughput": 2518.43, "total_tokens": 3089408} +{"current_steps": 6290, "total_steps": 7577, "loss": 0.0197, "lr": 1.7095383998678402e-07, "epoch": 0.8301438564075492, "percentage": 83.01, "elapsed_time": "0:20:27", "remaining_time": "0:04:11", "throughput": 2519.69, "total_tokens": 3091776} +{"current_steps": 6295, "total_steps": 7577, "loss": 0.113, "lr": 1.6966793668004653e-07, "epoch": 0.8308037481852976, "percentage": 83.08, "elapsed_time": "0:20:27", "remaining_time": "0:04:09", "throughput": 2520.99, "total_tokens": 3094208} +{"current_steps": 6300, "total_steps": 7577, "loss": 0.006, "lr": 1.6838643942907625e-07, "epoch": 0.8314636399630461, "percentage": 83.15, "elapsed_time": "0:20:27", "remaining_time": "0:04:08", "throughput": 2522.4, "total_tokens": 3096768} +{"current_steps": 6305, "total_steps": 7577, "loss": 0.0423, "lr": 1.671093550339815e-07, "epoch": 0.8321235317407946, "percentage": 83.21, "elapsed_time": "0:20:28", "remaining_time": "0:04:07", "throughput": 2523.91, "total_tokens": 3099456} +{"current_steps": 6310, "total_steps": 7577, "loss": 0.0422, "lr": 1.6583669027145542e-07, "epoch": 0.832783423518543, "percentage": 83.28, "elapsed_time": "0:20:28", "remaining_time": "0:04:06", "throughput": 2525.46, "total_tokens": 3102208} +{"current_steps": 6315, "total_steps": 7577, "loss": 0.0013, "lr": 1.6456845189473767e-07, "epoch": 0.8334433152962915, "percentage": 83.34, "elapsed_time": "0:20:28", "remaining_time": "0:04:05", "throughput": 2526.97, "total_tokens": 3104896} +{"current_steps": 6320, "total_steps": 7577, "loss": 0.0676, "lr": 1.6330464663358123e-07, "epoch": 0.8341032070740398, "percentage": 83.41, "elapsed_time": "0:20:29", "remaining_time": "0:04:04", "throughput": 2528.42, "total_tokens": 3107520} +{"current_steps": 6325, "total_steps": 7577, "loss": 0.0017, "lr": 1.6204528119421346e-07, "epoch": 0.8347630988517883, "percentage": 83.48, "elapsed_time": "0:20:29", "remaining_time": "0:04:03", "throughput": 2529.88, "total_tokens": 3110144} +{"current_steps": 6330, "total_steps": 7577, "loss": 0.0483, "lr": 1.607903622593042e-07, "epoch": 0.8354229906295367, "percentage": 83.54, "elapsed_time": "0:20:29", "remaining_time": "0:04:02", "throughput": 2531.34, "total_tokens": 3112768} +{"current_steps": 6335, "total_steps": 7577, "loss": 0.0005, "lr": 1.5953989648792743e-07, "epoch": 0.8360828824072852, "percentage": 83.61, "elapsed_time": "0:20:30", "remaining_time": "0:04:01", "throughput": 2532.75, "total_tokens": 3115328} +{"current_steps": 6340, "total_steps": 7577, "loss": 0.0166, "lr": 1.5829389051552678e-07, "epoch": 0.8367427741850336, "percentage": 83.67, "elapsed_time": "0:20:30", "remaining_time": "0:04:00", "throughput": 2534.16, "total_tokens": 3117888} +{"current_steps": 6345, "total_steps": 7577, "loss": 0.0081, "lr": 1.5705235095388136e-07, "epoch": 0.8374026659627821, "percentage": 83.74, "elapsed_time": "0:20:30", "remaining_time": "0:03:58", "throughput": 2535.51, "total_tokens": 3120384} +{"current_steps": 6350, "total_steps": 7577, "loss": 0.0288, "lr": 1.5581528439106907e-07, "epoch": 0.8380625577405305, "percentage": 83.81, "elapsed_time": "0:20:31", "remaining_time": "0:03:57", "throughput": 2536.96, "total_tokens": 3123008} +{"current_steps": 6355, "total_steps": 7577, "loss": 0.0373, "lr": 1.5458269739143292e-07, "epoch": 0.838722449518279, "percentage": 83.87, "elapsed_time": "0:20:31", "remaining_time": "0:03:56", "throughput": 2538.32, "total_tokens": 3125504} +{"current_steps": 6360, "total_steps": 7577, "loss": 0.0028, "lr": 1.5335459649554538e-07, "epoch": 0.8393823412960274, "percentage": 83.94, "elapsed_time": "0:20:31", "remaining_time": "0:03:55", "throughput": 2539.47, "total_tokens": 3127744} +{"current_steps": 6365, "total_steps": 7577, "loss": 0.1164, "lr": 1.5213098822017357e-07, "epoch": 0.8400422330737759, "percentage": 84.0, "elapsed_time": "0:20:31", "remaining_time": "0:03:54", "throughput": 2540.68, "total_tokens": 3130048} +{"current_steps": 6370, "total_steps": 7577, "loss": 0.0148, "lr": 1.50911879058246e-07, "epoch": 0.8407021248515244, "percentage": 84.07, "elapsed_time": "0:20:32", "remaining_time": "0:03:53", "throughput": 2541.98, "total_tokens": 3132480} +{"current_steps": 6375, "total_steps": 7577, "loss": 0.0826, "lr": 1.4969727547881628e-07, "epoch": 0.8413620166292728, "percentage": 84.14, "elapsed_time": "0:20:32", "remaining_time": "0:03:52", "throughput": 2543.43, "total_tokens": 3135104} +{"current_steps": 6380, "total_steps": 7577, "loss": 0.1787, "lr": 1.4848718392703052e-07, "epoch": 0.8420219084070213, "percentage": 84.2, "elapsed_time": "0:20:32", "remaining_time": "0:03:51", "throughput": 2544.58, "total_tokens": 3137344} +{"current_steps": 6385, "total_steps": 7577, "loss": 0.1727, "lr": 1.472816108240915e-07, "epoch": 0.8426818001847697, "percentage": 84.27, "elapsed_time": "0:20:33", "remaining_time": "0:03:50", "throughput": 2546.13, "total_tokens": 3140096} +{"current_steps": 6390, "total_steps": 7577, "loss": 0.0868, "lr": 1.46080562567226e-07, "epoch": 0.8433416919625182, "percentage": 84.33, "elapsed_time": "0:20:33", "remaining_time": "0:03:49", "throughput": 2547.33, "total_tokens": 3142400} +{"current_steps": 6395, "total_steps": 7577, "loss": 0.0302, "lr": 1.4488404552964993e-07, "epoch": 0.8440015837402666, "percentage": 84.4, "elapsed_time": "0:20:33", "remaining_time": "0:03:48", "throughput": 2548.38, "total_tokens": 3144512} +{"current_steps": 6400, "total_steps": 7577, "loss": 0.0434, "lr": 1.4369206606053463e-07, "epoch": 0.8446614755180151, "percentage": 84.47, "elapsed_time": "0:20:34", "remaining_time": "0:03:46", "throughput": 2549.68, "total_tokens": 3146944} +{"current_steps": 6405, "total_steps": 7577, "loss": 0.0951, "lr": 1.425046304849742e-07, "epoch": 0.8453213672957635, "percentage": 84.53, "elapsed_time": "0:20:34", "remaining_time": "0:03:45", "throughput": 2550.98, "total_tokens": 3149376} +{"current_steps": 6410, "total_steps": 7577, "loss": 0.1082, "lr": 1.4132174510395024e-07, "epoch": 0.845981259073512, "percentage": 84.6, "elapsed_time": "0:20:34", "remaining_time": "0:03:44", "throughput": 2552.23, "total_tokens": 3151744} +{"current_steps": 6415, "total_steps": 7577, "loss": 0.0054, "lr": 1.4014341619430003e-07, "epoch": 0.8466411508512603, "percentage": 84.66, "elapsed_time": "0:20:35", "remaining_time": "0:03:43", "throughput": 2553.47, "total_tokens": 3154112} +{"current_steps": 6420, "total_steps": 7577, "loss": 0.0044, "lr": 1.3896965000868188e-07, "epoch": 0.8473010426290088, "percentage": 84.73, "elapsed_time": "0:20:35", "remaining_time": "0:03:42", "throughput": 2554.72, "total_tokens": 3156480} +{"current_steps": 6425, "total_steps": 7577, "loss": 0.1166, "lr": 1.3780045277554276e-07, "epoch": 0.8479609344067572, "percentage": 84.8, "elapsed_time": "0:20:35", "remaining_time": "0:03:41", "throughput": 2555.92, "total_tokens": 3158784} +{"current_steps": 6430, "total_steps": 7577, "loss": 0.1708, "lr": 1.3663583069908535e-07, "epoch": 0.8486208261845057, "percentage": 84.86, "elapsed_time": "0:20:36", "remaining_time": "0:03:40", "throughput": 2557.16, "total_tokens": 3161152} +{"current_steps": 6435, "total_steps": 7577, "loss": 0.0101, "lr": 1.3547578995923447e-07, "epoch": 0.8492807179622542, "percentage": 84.93, "elapsed_time": "0:20:36", "remaining_time": "0:03:39", "throughput": 2558.6, "total_tokens": 3163776} +{"current_steps": 6440, "total_steps": 7577, "loss": 0.171, "lr": 1.3432033671160458e-07, "epoch": 0.8499406097400026, "percentage": 84.99, "elapsed_time": "0:20:36", "remaining_time": "0:03:38", "throughput": 2559.95, "total_tokens": 3166272} +{"current_steps": 6443, "total_steps": 7577, "eval_loss": 0.10069070011377335, "epoch": 0.8503365448066517, "percentage": 85.03, "elapsed_time": "0:20:44", "remaining_time": "0:03:39", "throughput": 2544.33, "total_tokens": 3167488} +{"current_steps": 6445, "total_steps": 7577, "loss": 0.0712, "lr": 1.3316947708746762e-07, "epoch": 0.8506005015177511, "percentage": 85.06, "elapsed_time": "0:21:43", "remaining_time": "0:03:48", "throughput": 2430.55, "total_tokens": 3168640} +{"current_steps": 6450, "total_steps": 7577, "loss": 0.0922, "lr": 1.3202321719371967e-07, "epoch": 0.8512603932954995, "percentage": 85.13, "elapsed_time": "0:21:43", "remaining_time": "0:03:47", "throughput": 2431.76, "total_tokens": 3171008} +{"current_steps": 6455, "total_steps": 7577, "loss": 0.0878, "lr": 1.3088156311284893e-07, "epoch": 0.851920285073248, "percentage": 85.19, "elapsed_time": "0:21:44", "remaining_time": "0:03:46", "throughput": 2432.92, "total_tokens": 3173312} +{"current_steps": 6460, "total_steps": 7577, "loss": 0.2677, "lr": 1.2974452090290322e-07, "epoch": 0.8525801768509964, "percentage": 85.26, "elapsed_time": "0:21:44", "remaining_time": "0:03:45", "throughput": 2434.22, "total_tokens": 3175808} +{"current_steps": 6465, "total_steps": 7577, "loss": 0.0748, "lr": 1.2861209659745865e-07, "epoch": 0.8532400686287449, "percentage": 85.32, "elapsed_time": "0:21:44", "remaining_time": "0:03:44", "throughput": 2435.34, "total_tokens": 3178048} +{"current_steps": 6470, "total_steps": 7577, "loss": 0.1044, "lr": 1.2748429620558654e-07, "epoch": 0.8538999604064933, "percentage": 85.39, "elapsed_time": "0:21:45", "remaining_time": "0:03:43", "throughput": 2436.64, "total_tokens": 3180544} +{"current_steps": 6475, "total_steps": 7577, "loss": 0.1888, "lr": 1.2636112571182167e-07, "epoch": 0.8545598521842418, "percentage": 85.46, "elapsed_time": "0:21:45", "remaining_time": "0:03:42", "throughput": 2437.94, "total_tokens": 3183040} +{"current_steps": 6480, "total_steps": 7577, "loss": 0.1613, "lr": 1.2524259107613178e-07, "epoch": 0.8552197439619902, "percentage": 85.52, "elapsed_time": "0:21:45", "remaining_time": "0:03:41", "throughput": 2439.33, "total_tokens": 3185664} +{"current_steps": 6485, "total_steps": 7577, "loss": 0.1552, "lr": 1.2412869823388382e-07, "epoch": 0.8558796357397387, "percentage": 85.59, "elapsed_time": "0:21:46", "remaining_time": "0:03:39", "throughput": 2440.99, "total_tokens": 3188672} +{"current_steps": 6490, "total_steps": 7577, "loss": 0.0598, "lr": 1.2301945309581486e-07, "epoch": 0.8565395275174872, "percentage": 85.65, "elapsed_time": "0:21:46", "remaining_time": "0:03:38", "throughput": 2442.29, "total_tokens": 3191168} +{"current_steps": 6495, "total_steps": 7577, "loss": 0.116, "lr": 1.2191486154799846e-07, "epoch": 0.8571994192952356, "percentage": 85.72, "elapsed_time": "0:21:46", "remaining_time": "0:03:37", "throughput": 2443.58, "total_tokens": 3193664} +{"current_steps": 6500, "total_steps": 7577, "loss": 0.001, "lr": 1.208149294518147e-07, "epoch": 0.8578593110729841, "percentage": 85.79, "elapsed_time": "0:21:47", "remaining_time": "0:03:36", "throughput": 2444.92, "total_tokens": 3196224} +{"current_steps": 6505, "total_steps": 7577, "loss": 0.1906, "lr": 1.1971966264391954e-07, "epoch": 0.8585192028507325, "percentage": 85.85, "elapsed_time": "0:21:47", "remaining_time": "0:03:35", "throughput": 2446.26, "total_tokens": 3198784} +{"current_steps": 6510, "total_steps": 7577, "loss": 0.1289, "lr": 1.1862906693621233e-07, "epoch": 0.859179094628481, "percentage": 85.92, "elapsed_time": "0:21:47", "remaining_time": "0:03:34", "throughput": 2447.69, "total_tokens": 3201472} +{"current_steps": 6515, "total_steps": 7577, "loss": 0.1718, "lr": 1.1754314811580623e-07, "epoch": 0.8598389864062294, "percentage": 85.98, "elapsed_time": "0:21:48", "remaining_time": "0:03:33", "throughput": 2448.7, "total_tokens": 3203584} +{"current_steps": 6520, "total_steps": 7577, "loss": 0.0728, "lr": 1.1646191194499655e-07, "epoch": 0.8604988781839779, "percentage": 86.05, "elapsed_time": "0:21:48", "remaining_time": "0:03:32", "throughput": 2449.85, "total_tokens": 3205888} +{"current_steps": 6525, "total_steps": 7577, "loss": 0.1805, "lr": 1.1538536416123168e-07, "epoch": 0.8611587699617262, "percentage": 86.12, "elapsed_time": "0:21:48", "remaining_time": "0:03:31", "throughput": 2450.86, "total_tokens": 3208000} +{"current_steps": 6530, "total_steps": 7577, "loss": 0.0119, "lr": 1.1431351047708072e-07, "epoch": 0.8618186617394747, "percentage": 86.18, "elapsed_time": "0:21:49", "remaining_time": "0:03:29", "throughput": 2451.96, "total_tokens": 3210240} +{"current_steps": 6535, "total_steps": 7577, "loss": 0.1218, "lr": 1.1324635658020432e-07, "epoch": 0.8624785535172231, "percentage": 86.25, "elapsed_time": "0:21:49", "remaining_time": "0:03:28", "throughput": 2453.2, "total_tokens": 3212672} +{"current_steps": 6540, "total_steps": 7577, "loss": 0.1695, "lr": 1.1218390813332479e-07, "epoch": 0.8631384452949716, "percentage": 86.31, "elapsed_time": "0:21:49", "remaining_time": "0:03:27", "throughput": 2454.62, "total_tokens": 3215360} +{"current_steps": 6545, "total_steps": 7577, "loss": 0.1279, "lr": 1.1112617077419472e-07, "epoch": 0.86379833707272, "percentage": 86.38, "elapsed_time": "0:21:50", "remaining_time": "0:03:26", "throughput": 2456.09, "total_tokens": 3218112} +{"current_steps": 6550, "total_steps": 7577, "loss": 0.0386, "lr": 1.1007315011556884e-07, "epoch": 0.8644582288504685, "percentage": 86.45, "elapsed_time": "0:21:50", "remaining_time": "0:03:25", "throughput": 2457.14, "total_tokens": 3220288} +{"current_steps": 6555, "total_steps": 7577, "loss": 0.0013, "lr": 1.0902485174517251e-07, "epoch": 0.865118120628217, "percentage": 86.51, "elapsed_time": "0:21:50", "remaining_time": "0:03:24", "throughput": 2458.56, "total_tokens": 3222976} +{"current_steps": 6560, "total_steps": 7577, "loss": 0.0532, "lr": 1.0798128122567285e-07, "epoch": 0.8657780124059654, "percentage": 86.58, "elapsed_time": "0:21:51", "remaining_time": "0:03:23", "throughput": 2459.84, "total_tokens": 3225472} +{"current_steps": 6565, "total_steps": 7577, "loss": 0.1791, "lr": 1.0694244409464992e-07, "epoch": 0.8664379041837139, "percentage": 86.64, "elapsed_time": "0:21:51", "remaining_time": "0:03:22", "throughput": 2461.23, "total_tokens": 3228096} +{"current_steps": 6570, "total_steps": 7577, "loss": 0.1216, "lr": 1.0590834586456577e-07, "epoch": 0.8670977959614623, "percentage": 86.71, "elapsed_time": "0:21:51", "remaining_time": "0:03:21", "throughput": 2462.61, "total_tokens": 3230720} +{"current_steps": 6575, "total_steps": 7577, "loss": 0.1303, "lr": 1.0487899202273708e-07, "epoch": 0.8677576877392108, "percentage": 86.78, "elapsed_time": "0:21:52", "remaining_time": "0:03:19", "throughput": 2463.8, "total_tokens": 3233088} +{"current_steps": 6580, "total_steps": 7577, "loss": 0.1208, "lr": 1.0385438803130364e-07, "epoch": 0.8684175795169592, "percentage": 86.84, "elapsed_time": "0:21:52", "remaining_time": "0:03:18", "throughput": 2465.18, "total_tokens": 3235712} +{"current_steps": 6585, "total_steps": 7577, "loss": 0.1107, "lr": 1.0283453932720199e-07, "epoch": 0.8690774712947077, "percentage": 86.91, "elapsed_time": "0:21:52", "remaining_time": "0:03:17", "throughput": 2466.7, "total_tokens": 3238528} +{"current_steps": 6590, "total_steps": 7577, "loss": 0.0808, "lr": 1.0181945132213476e-07, "epoch": 0.8697373630724561, "percentage": 86.97, "elapsed_time": "0:21:53", "remaining_time": "0:03:16", "throughput": 2467.89, "total_tokens": 3240896} +{"current_steps": 6595, "total_steps": 7577, "loss": 0.0017, "lr": 1.0080912940254227e-07, "epoch": 0.8703972548502046, "percentage": 87.04, "elapsed_time": "0:21:53", "remaining_time": "0:03:15", "throughput": 2469.15, "total_tokens": 3243392} +{"current_steps": 6600, "total_steps": 7577, "loss": 0.0143, "lr": 9.980357892957492e-08, "epoch": 0.871057146627953, "percentage": 87.11, "elapsed_time": "0:21:53", "remaining_time": "0:03:14", "throughput": 2470.38, "total_tokens": 3245824} +{"current_steps": 6605, "total_steps": 7577, "loss": 0.0015, "lr": 9.880280523906337e-08, "epoch": 0.8717170384057015, "percentage": 87.17, "elapsed_time": "0:21:54", "remaining_time": "0:03:13", "throughput": 2471.51, "total_tokens": 3248128} +{"current_steps": 6610, "total_steps": 7577, "loss": 0.1882, "lr": 9.780681364149091e-08, "epoch": 0.8723769301834499, "percentage": 87.24, "elapsed_time": "0:21:54", "remaining_time": "0:03:12", "throughput": 2472.78, "total_tokens": 3250624} +{"current_steps": 6615, "total_steps": 7577, "loss": 0.108, "lr": 9.681560942196587e-08, "epoch": 0.8730368219611984, "percentage": 87.3, "elapsed_time": "0:21:54", "remaining_time": "0:03:11", "throughput": 2474.2, "total_tokens": 3253312} +{"current_steps": 6620, "total_steps": 7577, "loss": 0.1163, "lr": 9.582919784019194e-08, "epoch": 0.8736967137389469, "percentage": 87.37, "elapsed_time": "0:21:55", "remaining_time": "0:03:10", "throughput": 2475.25, "total_tokens": 3255488} +{"current_steps": 6625, "total_steps": 7577, "loss": 0.0734, "lr": 9.484758413044236e-08, "epoch": 0.8743566055166953, "percentage": 87.44, "elapsed_time": "0:21:55", "remaining_time": "0:03:09", "throughput": 2476.29, "total_tokens": 3257664} +{"current_steps": 6630, "total_steps": 7577, "loss": 0.099, "lr": 9.387077350153017e-08, "epoch": 0.8750164972944438, "percentage": 87.5, "elapsed_time": "0:21:55", "remaining_time": "0:03:07", "throughput": 2477.56, "total_tokens": 3260160} +{"current_steps": 6635, "total_steps": 7577, "loss": 0.0644, "lr": 9.289877113678168e-08, "epoch": 0.8756763890721921, "percentage": 87.57, "elapsed_time": "0:21:56", "remaining_time": "0:03:06", "throughput": 2478.74, "total_tokens": 3262528} +{"current_steps": 6640, "total_steps": 7577, "loss": 0.0668, "lr": 9.19315821940092e-08, "epoch": 0.8763362808499406, "percentage": 87.63, "elapsed_time": "0:21:56", "remaining_time": "0:03:05", "throughput": 2480.02, "total_tokens": 3265024} +{"current_steps": 6645, "total_steps": 7577, "loss": 0.157, "lr": 9.096921180548234e-08, "epoch": 0.876996172627689, "percentage": 87.7, "elapsed_time": "0:21:56", "remaining_time": "0:03:04", "throughput": 2481.24, "total_tokens": 3267456} +{"current_steps": 6650, "total_steps": 7577, "loss": 0.1047, "lr": 9.001166507790259e-08, "epoch": 0.8776560644054375, "percentage": 87.77, "elapsed_time": "0:21:57", "remaining_time": "0:03:03", "throughput": 2482.7, "total_tokens": 3270208} +{"current_steps": 6655, "total_steps": 7577, "loss": 0.1139, "lr": 8.905894709237427e-08, "epoch": 0.8783159561831859, "percentage": 87.83, "elapsed_time": "0:21:57", "remaining_time": "0:03:02", "throughput": 2484.16, "total_tokens": 3272960} +{"current_steps": 6660, "total_steps": 7577, "loss": 0.083, "lr": 8.811106290437975e-08, "epoch": 0.8789758479609344, "percentage": 87.9, "elapsed_time": "0:21:57", "remaining_time": "0:03:01", "throughput": 2485.2, "total_tokens": 3275136} +{"current_steps": 6665, "total_steps": 7577, "loss": 0.0826, "lr": 8.716801754375036e-08, "epoch": 0.8796357397386828, "percentage": 87.96, "elapsed_time": "0:21:58", "remaining_time": "0:03:00", "throughput": 2486.52, "total_tokens": 3277696} +{"current_steps": 6670, "total_steps": 7577, "loss": 0.1297, "lr": 8.62298160146413e-08, "epoch": 0.8802956315164313, "percentage": 88.03, "elapsed_time": "0:21:58", "remaining_time": "0:02:59", "throughput": 2487.7, "total_tokens": 3280064} +{"current_steps": 6675, "total_steps": 7577, "loss": 0.0166, "lr": 8.529646329550466e-08, "epoch": 0.8809555232941798, "percentage": 88.1, "elapsed_time": "0:21:58", "remaining_time": "0:02:58", "throughput": 2488.78, "total_tokens": 3282304} +{"current_steps": 6680, "total_steps": 7577, "loss": 0.03, "lr": 8.436796433906235e-08, "epoch": 0.8816154150719282, "percentage": 88.16, "elapsed_time": "0:21:59", "remaining_time": "0:02:57", "throughput": 2490.0, "total_tokens": 3284736} +{"current_steps": 6685, "total_steps": 7577, "loss": 0.0714, "lr": 8.344432407228141e-08, "epoch": 0.8822753068496767, "percentage": 88.23, "elapsed_time": "0:21:59", "remaining_time": "0:02:56", "throughput": 2491.23, "total_tokens": 3287168} +{"current_steps": 6690, "total_steps": 7577, "loss": 0.0623, "lr": 8.252554739634577e-08, "epoch": 0.8829351986274251, "percentage": 88.29, "elapsed_time": "0:21:59", "remaining_time": "0:02:54", "throughput": 2492.45, "total_tokens": 3289600} +{"current_steps": 6695, "total_steps": 7577, "loss": 0.0589, "lr": 8.16116391866316e-08, "epoch": 0.8835950904051736, "percentage": 88.36, "elapsed_time": "0:22:00", "remaining_time": "0:02:53", "throughput": 2493.76, "total_tokens": 3292160} +{"current_steps": 6700, "total_steps": 7577, "loss": 0.1393, "lr": 8.070260429268172e-08, "epoch": 0.884254982182922, "percentage": 88.43, "elapsed_time": "0:22:00", "remaining_time": "0:02:52", "throughput": 2494.97, "total_tokens": 3294592} +{"current_steps": 6705, "total_steps": 7577, "loss": 0.0539, "lr": 7.979844753817855e-08, "epoch": 0.8849148739606705, "percentage": 88.49, "elapsed_time": "0:22:00", "remaining_time": "0:02:51", "throughput": 2496.14, "total_tokens": 3296960} +{"current_steps": 6710, "total_steps": 7577, "loss": 0.0709, "lr": 7.889917372091982e-08, "epoch": 0.8855747657384189, "percentage": 88.56, "elapsed_time": "0:22:01", "remaining_time": "0:02:50", "throughput": 2497.23, "total_tokens": 3299200} +{"current_steps": 6715, "total_steps": 7577, "loss": 0.2047, "lr": 7.800478761279183e-08, "epoch": 0.8862346575161674, "percentage": 88.62, "elapsed_time": "0:22:01", "remaining_time": "0:02:49", "throughput": 2498.4, "total_tokens": 3301568} +{"current_steps": 6720, "total_steps": 7577, "loss": 0.1478, "lr": 7.711529395974592e-08, "epoch": 0.8868945492939158, "percentage": 88.69, "elapsed_time": "0:22:01", "remaining_time": "0:02:48", "throughput": 2499.66, "total_tokens": 3304064} +{"current_steps": 6725, "total_steps": 7577, "loss": 0.1855, "lr": 7.623069748177135e-08, "epoch": 0.8875544410716643, "percentage": 88.76, "elapsed_time": "0:22:02", "remaining_time": "0:02:47", "throughput": 2500.83, "total_tokens": 3306432} +{"current_steps": 6730, "total_steps": 7577, "loss": 0.0866, "lr": 7.535100287287111e-08, "epoch": 0.8882143328494126, "percentage": 88.82, "elapsed_time": "0:22:02", "remaining_time": "0:02:46", "throughput": 2501.95, "total_tokens": 3308736} +{"current_steps": 6735, "total_steps": 7577, "loss": 0.0024, "lr": 7.447621480103783e-08, "epoch": 0.8888742246271611, "percentage": 88.89, "elapsed_time": "0:22:02", "remaining_time": "0:02:45", "throughput": 2503.17, "total_tokens": 3311168} +{"current_steps": 6740, "total_steps": 7577, "loss": 0.2758, "lr": 7.360633790822713e-08, "epoch": 0.8895341164049096, "percentage": 88.95, "elapsed_time": "0:22:03", "remaining_time": "0:02:44", "throughput": 2504.43, "total_tokens": 3313664} +{"current_steps": 6745, "total_steps": 7577, "loss": 0.044, "lr": 7.274137681033498e-08, "epoch": 0.890194008182658, "percentage": 89.02, "elapsed_time": "0:22:03", "remaining_time": "0:02:43", "throughput": 2505.75, "total_tokens": 3316224} +{"current_steps": 6750, "total_steps": 7577, "loss": 0.0791, "lr": 7.188133609717184e-08, "epoch": 0.8908538999604065, "percentage": 89.09, "elapsed_time": "0:22:03", "remaining_time": "0:02:42", "throughput": 2506.81, "total_tokens": 3318464} +{"current_steps": 6755, "total_steps": 7577, "loss": 0.0008, "lr": 7.102622033243843e-08, "epoch": 0.8915137917381549, "percentage": 89.15, "elapsed_time": "0:22:04", "remaining_time": "0:02:41", "throughput": 2508.02, "total_tokens": 3320896} +{"current_steps": 6760, "total_steps": 7577, "loss": 0.1241, "lr": 7.017603405370276e-08, "epoch": 0.8921736835159034, "percentage": 89.22, "elapsed_time": "0:22:04", "remaining_time": "0:02:40", "throughput": 2509.46, "total_tokens": 3323648} +{"current_steps": 6765, "total_steps": 7577, "loss": 0.1568, "lr": 6.933078177237429e-08, "epoch": 0.8928335752936518, "percentage": 89.28, "elapsed_time": "0:22:04", "remaining_time": "0:02:39", "throughput": 2510.77, "total_tokens": 3326208} +{"current_steps": 6770, "total_steps": 7577, "loss": 0.0287, "lr": 6.849046797368108e-08, "epoch": 0.8934934670714003, "percentage": 89.35, "elapsed_time": "0:22:05", "remaining_time": "0:02:37", "throughput": 2511.94, "total_tokens": 3328576} +{"current_steps": 6775, "total_steps": 7577, "loss": 0.0018, "lr": 6.765509711664574e-08, "epoch": 0.8941533588491487, "percentage": 89.42, "elapsed_time": "0:22:05", "remaining_time": "0:02:36", "throughput": 2513.52, "total_tokens": 3331520} +{"current_steps": 6780, "total_steps": 7577, "loss": 0.0488, "lr": 6.682467363406174e-08, "epoch": 0.8948132506268972, "percentage": 89.48, "elapsed_time": "0:22:05", "remaining_time": "0:02:35", "throughput": 2515.0, "total_tokens": 3334336} +{"current_steps": 6785, "total_steps": 7577, "loss": 0.0703, "lr": 6.59992019324701e-08, "epoch": 0.8954731424046456, "percentage": 89.55, "elapsed_time": "0:22:06", "remaining_time": "0:02:34", "throughput": 2516.3, "total_tokens": 3336896} +{"current_steps": 6790, "total_steps": 7577, "loss": 0.0708, "lr": 6.517868639213553e-08, "epoch": 0.8961330341823941, "percentage": 89.61, "elapsed_time": "0:22:06", "remaining_time": "0:02:33", "throughput": 2517.5, "total_tokens": 3339328} +{"current_steps": 6795, "total_steps": 7577, "loss": 0.0182, "lr": 6.436313136702387e-08, "epoch": 0.8967929259601425, "percentage": 89.68, "elapsed_time": "0:22:06", "remaining_time": "0:02:32", "throughput": 2518.69, "total_tokens": 3341760} +{"current_steps": 6800, "total_steps": 7577, "loss": 0.0659, "lr": 6.355254118477815e-08, "epoch": 0.897452817737891, "percentage": 89.75, "elapsed_time": "0:22:07", "remaining_time": "0:02:31", "throughput": 2520.06, "total_tokens": 3344448} +{"current_steps": 6805, "total_steps": 7577, "loss": 0.001, "lr": 6.274692014669602e-08, "epoch": 0.8981127095156395, "percentage": 89.81, "elapsed_time": "0:22:07", "remaining_time": "0:02:30", "throughput": 2521.35, "total_tokens": 3347008} +{"current_steps": 6810, "total_steps": 7577, "loss": 0.0006, "lr": 6.194627252770768e-08, "epoch": 0.8987726012933879, "percentage": 89.88, "elapsed_time": "0:22:07", "remaining_time": "0:02:29", "throughput": 2522.83, "total_tokens": 3349824} +{"current_steps": 6815, "total_steps": 7577, "loss": 0.0903, "lr": 6.115060257635174e-08, "epoch": 0.8994324930711364, "percentage": 89.94, "elapsed_time": "0:22:08", "remaining_time": "0:02:28", "throughput": 2524.07, "total_tokens": 3352320} +{"current_steps": 6820, "total_steps": 7577, "loss": 0.0013, "lr": 6.035991451475375e-08, "epoch": 0.9000923848488848, "percentage": 90.01, "elapsed_time": "0:22:08", "remaining_time": "0:02:27", "throughput": 2525.23, "total_tokens": 3354688} +{"current_steps": 6822, "total_steps": 7577, "eval_loss": 0.09756959229707718, "epoch": 0.9003563415599841, "percentage": 90.04, "elapsed_time": "0:22:16", "remaining_time": "0:02:27", "throughput": 2510.45, "total_tokens": 3355520} +{"current_steps": 6825, "total_steps": 7577, "loss": 0.0663, "lr": 5.9574212538603505e-08, "epoch": 0.9007522766266333, "percentage": 90.08, "elapsed_time": "0:22:41", "remaining_time": "0:02:29", "throughput": 2466.49, "total_tokens": 3357056} +{"current_steps": 6830, "total_steps": 7577, "loss": 0.066, "lr": 5.879350081713252e-08, "epoch": 0.9014121684043817, "percentage": 90.14, "elapsed_time": "0:22:41", "remaining_time": "0:02:28", "throughput": 2467.67, "total_tokens": 3359488} +{"current_steps": 6835, "total_steps": 7577, "loss": 0.2437, "lr": 5.8017783493092386e-08, "epoch": 0.9020720601821302, "percentage": 90.21, "elapsed_time": "0:22:41", "remaining_time": "0:02:27", "throughput": 2468.86, "total_tokens": 3361920} +{"current_steps": 6840, "total_steps": 7577, "loss": 0.0012, "lr": 5.7247064682732104e-08, "epoch": 0.9027319519598785, "percentage": 90.27, "elapsed_time": "0:22:42", "remaining_time": "0:02:26", "throughput": 2470.1, "total_tokens": 3364416} +{"current_steps": 6845, "total_steps": 7577, "loss": 0.0617, "lr": 5.6481348475777566e-08, "epoch": 0.903391843737627, "percentage": 90.34, "elapsed_time": "0:22:42", "remaining_time": "0:02:25", "throughput": 2471.35, "total_tokens": 3366912} +{"current_steps": 6850, "total_steps": 7577, "loss": 0.0012, "lr": 5.5720638935407796e-08, "epoch": 0.9040517355153754, "percentage": 90.41, "elapsed_time": "0:22:42", "remaining_time": "0:02:24", "throughput": 2472.36, "total_tokens": 3369088} +{"current_steps": 6855, "total_steps": 7577, "loss": 0.1105, "lr": 5.49649400982356e-08, "epoch": 0.9047116272931239, "percentage": 90.47, "elapsed_time": "0:22:43", "remaining_time": "0:02:23", "throughput": 2473.55, "total_tokens": 3371520} +{"current_steps": 6860, "total_steps": 7577, "loss": 0.0005, "lr": 5.421425597428442e-08, "epoch": 0.9053715190708723, "percentage": 90.54, "elapsed_time": "0:22:43", "remaining_time": "0:02:22", "throughput": 2474.83, "total_tokens": 3374080} +{"current_steps": 6865, "total_steps": 7577, "loss": 0.1294, "lr": 5.346859054696784e-08, "epoch": 0.9060314108486208, "percentage": 90.6, "elapsed_time": "0:22:43", "remaining_time": "0:02:21", "throughput": 2476.1, "total_tokens": 3376640} +{"current_steps": 6870, "total_steps": 7577, "loss": 0.0709, "lr": 5.2727947773068773e-08, "epoch": 0.9066913026263693, "percentage": 90.67, "elapsed_time": "0:22:44", "remaining_time": "0:02:20", "throughput": 2477.29, "total_tokens": 3379072} +{"current_steps": 6875, "total_steps": 7577, "loss": 0.069, "lr": 5.199233158271732e-08, "epoch": 0.9073511944041177, "percentage": 90.74, "elapsed_time": "0:22:44", "remaining_time": "0:02:19", "throughput": 2478.62, "total_tokens": 3381696} +{"current_steps": 6880, "total_steps": 7577, "loss": 0.2041, "lr": 5.126174587937149e-08, "epoch": 0.9080110861818662, "percentage": 90.8, "elapsed_time": "0:22:44", "remaining_time": "0:02:18", "throughput": 2479.76, "total_tokens": 3384064} +{"current_steps": 6885, "total_steps": 7577, "loss": 0.0024, "lr": 5.053619453979485e-08, "epoch": 0.9086709779596146, "percentage": 90.87, "elapsed_time": "0:22:44", "remaining_time": "0:02:17", "throughput": 2480.81, "total_tokens": 3386304} +{"current_steps": 6890, "total_steps": 7577, "loss": 0.1257, "lr": 4.9815681414037025e-08, "epoch": 0.9093308697373631, "percentage": 90.93, "elapsed_time": "0:22:45", "remaining_time": "0:02:16", "throughput": 2482.04, "total_tokens": 3388800} +{"current_steps": 6895, "total_steps": 7577, "loss": 0.097, "lr": 4.910021032541334e-08, "epoch": 0.9099907615151115, "percentage": 91.0, "elapsed_time": "0:22:45", "remaining_time": "0:02:15", "throughput": 2483.22, "total_tokens": 3391232} +{"current_steps": 6900, "total_steps": 7577, "loss": 0.1039, "lr": 4.838978507048319e-08, "epoch": 0.91065065329286, "percentage": 91.07, "elapsed_time": "0:22:45", "remaining_time": "0:02:14", "throughput": 2484.39, "total_tokens": 3393664} +{"current_steps": 6905, "total_steps": 7577, "loss": 0.0018, "lr": 4.768440941903207e-08, "epoch": 0.9113105450706084, "percentage": 91.13, "elapsed_time": "0:22:46", "remaining_time": "0:02:12", "throughput": 2485.48, "total_tokens": 3395968} +{"current_steps": 6910, "total_steps": 7577, "loss": 0.0407, "lr": 4.698408711404944e-08, "epoch": 0.9119704368483569, "percentage": 91.2, "elapsed_time": "0:22:46", "remaining_time": "0:02:11", "throughput": 2486.57, "total_tokens": 3398272} +{"current_steps": 6915, "total_steps": 7577, "loss": 0.0894, "lr": 4.628882187171046e-08, "epoch": 0.9126303286261053, "percentage": 91.26, "elapsed_time": "0:22:46", "remaining_time": "0:02:10", "throughput": 2487.94, "total_tokens": 3400960} +{"current_steps": 6920, "total_steps": 7577, "loss": 0.1429, "lr": 4.559861738135506e-08, "epoch": 0.9132902204038538, "percentage": 91.33, "elapsed_time": "0:22:47", "remaining_time": "0:02:09", "throughput": 2489.21, "total_tokens": 3403520} +{"current_steps": 6925, "total_steps": 7577, "loss": 0.2526, "lr": 4.491347730546913e-08, "epoch": 0.9139501121816023, "percentage": 91.4, "elapsed_time": "0:22:47", "remaining_time": "0:02:08", "throughput": 2490.39, "total_tokens": 3405952} +{"current_steps": 6930, "total_steps": 7577, "loss": 0.1429, "lr": 4.423340527966512e-08, "epoch": 0.9146100039593507, "percentage": 91.46, "elapsed_time": "0:22:47", "remaining_time": "0:02:07", "throughput": 2491.53, "total_tokens": 3408320} +{"current_steps": 6935, "total_steps": 7577, "loss": 0.0675, "lr": 4.355840491266205e-08, "epoch": 0.9152698957370992, "percentage": 91.53, "elapsed_time": "0:22:48", "remaining_time": "0:02:06", "throughput": 2492.79, "total_tokens": 3410880} +{"current_steps": 6940, "total_steps": 7577, "loss": 0.0589, "lr": 4.288847978626686e-08, "epoch": 0.9159297875148475, "percentage": 91.59, "elapsed_time": "0:22:48", "remaining_time": "0:02:05", "throughput": 2494.06, "total_tokens": 3413440} +{"current_steps": 6945, "total_steps": 7577, "loss": 0.0656, "lr": 4.222363345535585e-08, "epoch": 0.916589679292596, "percentage": 91.66, "elapsed_time": "0:22:48", "remaining_time": "0:02:04", "throughput": 2495.33, "total_tokens": 3416000} +{"current_steps": 6950, "total_steps": 7577, "loss": 0.1151, "lr": 4.1563869447854505e-08, "epoch": 0.9172495710703444, "percentage": 91.72, "elapsed_time": "0:22:49", "remaining_time": "0:02:03", "throughput": 2496.37, "total_tokens": 3418240} +{"current_steps": 6955, "total_steps": 7577, "loss": 0.1535, "lr": 4.090919126472048e-08, "epoch": 0.9179094628480929, "percentage": 91.79, "elapsed_time": "0:22:49", "remaining_time": "0:02:02", "throughput": 2497.56, "total_tokens": 3420672} +{"current_steps": 6960, "total_steps": 7577, "loss": 0.0099, "lr": 4.025960237992332e-08, "epoch": 0.9185693546258413, "percentage": 91.86, "elapsed_time": "0:22:49", "remaining_time": "0:02:01", "throughput": 2498.6, "total_tokens": 3422912} +{"current_steps": 6965, "total_steps": 7577, "loss": 0.0129, "lr": 3.961510624042741e-08, "epoch": 0.9192292464035898, "percentage": 91.92, "elapsed_time": "0:22:50", "remaining_time": "0:02:00", "throughput": 2499.82, "total_tokens": 3425408} +{"current_steps": 6970, "total_steps": 7577, "loss": 0.1038, "lr": 3.8975706266172636e-08, "epoch": 0.9198891381813382, "percentage": 91.99, "elapsed_time": "0:22:50", "remaining_time": "0:01:59", "throughput": 2500.95, "total_tokens": 3427776} +{"current_steps": 6975, "total_steps": 7577, "loss": 0.1456, "lr": 3.834140585005696e-08, "epoch": 0.9205490299590867, "percentage": 92.05, "elapsed_time": "0:22:50", "remaining_time": "0:01:58", "throughput": 2502.21, "total_tokens": 3430336} +{"current_steps": 6980, "total_steps": 7577, "loss": 0.192, "lr": 3.771220835791844e-08, "epoch": 0.9212089217368351, "percentage": 92.12, "elapsed_time": "0:22:51", "remaining_time": "0:01:57", "throughput": 2503.47, "total_tokens": 3432896} +{"current_steps": 6985, "total_steps": 7577, "loss": 0.023, "lr": 3.708811712851634e-08, "epoch": 0.9218688135145836, "percentage": 92.19, "elapsed_time": "0:22:51", "remaining_time": "0:01:56", "throughput": 2504.51, "total_tokens": 3435136} +{"current_steps": 6990, "total_steps": 7577, "loss": 0.0816, "lr": 3.6469135473514936e-08, "epoch": 0.9225287052923321, "percentage": 92.25, "elapsed_time": "0:22:51", "remaining_time": "0:01:55", "throughput": 2505.87, "total_tokens": 3437824} +{"current_steps": 6995, "total_steps": 7577, "loss": 0.0381, "lr": 3.5855266677464744e-08, "epoch": 0.9231885970700805, "percentage": 92.32, "elapsed_time": "0:22:52", "remaining_time": "0:01:54", "throughput": 2507.08, "total_tokens": 3440320} +{"current_steps": 7000, "total_steps": 7577, "loss": 0.0565, "lr": 3.524651399778555e-08, "epoch": 0.923848488847829, "percentage": 92.38, "elapsed_time": "0:22:52", "remaining_time": "0:01:53", "throughput": 2508.34, "total_tokens": 3442880} +{"current_steps": 7005, "total_steps": 7577, "loss": 0.0016, "lr": 3.4642880664749296e-08, "epoch": 0.9245083806255774, "percentage": 92.45, "elapsed_time": "0:22:52", "remaining_time": "0:01:52", "throughput": 2509.38, "total_tokens": 3445120} +{"current_steps": 7010, "total_steps": 7577, "loss": 0.1966, "lr": 3.404436988146242e-08, "epoch": 0.9251682724033259, "percentage": 92.52, "elapsed_time": "0:22:53", "remaining_time": "0:01:51", "throughput": 2510.46, "total_tokens": 3447424} +{"current_steps": 7015, "total_steps": 7577, "loss": 0.0537, "lr": 3.345098482384956e-08, "epoch": 0.9258281641810743, "percentage": 92.58, "elapsed_time": "0:22:53", "remaining_time": "0:01:50", "throughput": 2511.68, "total_tokens": 3449920} +{"current_steps": 7020, "total_steps": 7577, "loss": 0.0494, "lr": 3.2862728640636105e-08, "epoch": 0.9264880559588228, "percentage": 92.65, "elapsed_time": "0:22:53", "remaining_time": "0:01:49", "throughput": 2512.89, "total_tokens": 3452416} +{"current_steps": 7025, "total_steps": 7577, "loss": 0.1016, "lr": 3.227960445333155e-08, "epoch": 0.9271479477365712, "percentage": 92.71, "elapsed_time": "0:22:54", "remaining_time": "0:01:47", "throughput": 2514.11, "total_tokens": 3454912} +{"current_steps": 7030, "total_steps": 7577, "loss": 0.0633, "lr": 3.1701615356213295e-08, "epoch": 0.9278078395143197, "percentage": 92.78, "elapsed_time": "0:22:54", "remaining_time": "0:01:46", "throughput": 2515.38, "total_tokens": 3457472} +{"current_steps": 7035, "total_steps": 7577, "loss": 0.0683, "lr": 3.112876441630985e-08, "epoch": 0.928467731292068, "percentage": 92.85, "elapsed_time": "0:22:54", "remaining_time": "0:01:45", "throughput": 2516.41, "total_tokens": 3459712} +{"current_steps": 7040, "total_steps": 7577, "loss": 0.0577, "lr": 3.05610546733851e-08, "epoch": 0.9291276230698166, "percentage": 92.91, "elapsed_time": "0:22:55", "remaining_time": "0:01:44", "throughput": 2517.58, "total_tokens": 3462144} +{"current_steps": 7045, "total_steps": 7577, "loss": 0.2195, "lr": 2.99984891399212e-08, "epoch": 0.9297875148475649, "percentage": 92.98, "elapsed_time": "0:22:55", "remaining_time": "0:01:43", "throughput": 2518.71, "total_tokens": 3464512} +{"current_steps": 7050, "total_steps": 7577, "loss": 0.0013, "lr": 2.9441070801103808e-08, "epoch": 0.9304474066253134, "percentage": 93.04, "elapsed_time": "0:22:55", "remaining_time": "0:01:42", "throughput": 2519.84, "total_tokens": 3466880} +{"current_steps": 7055, "total_steps": 7577, "loss": 0.1014, "lr": 2.8888802614805085e-08, "epoch": 0.931107298403062, "percentage": 93.11, "elapsed_time": "0:22:56", "remaining_time": "0:01:41", "throughput": 2520.95, "total_tokens": 3469248} +{"current_steps": 7060, "total_steps": 7577, "loss": 0.2786, "lr": 2.8341687511568734e-08, "epoch": 0.9317671901808103, "percentage": 93.18, "elapsed_time": "0:22:56", "remaining_time": "0:01:40", "throughput": 2522.07, "total_tokens": 3471616} +{"current_steps": 7065, "total_steps": 7577, "loss": 0.082, "lr": 2.7799728394594547e-08, "epoch": 0.9324270819585588, "percentage": 93.24, "elapsed_time": "0:22:56", "remaining_time": "0:01:39", "throughput": 2523.37, "total_tokens": 3474240} +{"current_steps": 7070, "total_steps": 7577, "loss": 0.0789, "lr": 2.7262928139722198e-08, "epoch": 0.9330869737363072, "percentage": 93.31, "elapsed_time": "0:22:57", "remaining_time": "0:01:38", "throughput": 2524.61, "total_tokens": 3476800} +{"current_steps": 7075, "total_steps": 7577, "loss": 0.0807, "lr": 2.673128959541693e-08, "epoch": 0.9337468655140557, "percentage": 93.37, "elapsed_time": "0:22:57", "remaining_time": "0:01:37", "throughput": 2525.94, "total_tokens": 3479488} +{"current_steps": 7080, "total_steps": 7577, "loss": 0.0005, "lr": 2.620481558275367e-08, "epoch": 0.9344067572918041, "percentage": 93.44, "elapsed_time": "0:22:57", "remaining_time": "0:01:36", "throughput": 2527.29, "total_tokens": 3482176} +{"current_steps": 7085, "total_steps": 7577, "loss": 0.0278, "lr": 2.5683508895402382e-08, "epoch": 0.9350666490695526, "percentage": 93.51, "elapsed_time": "0:22:58", "remaining_time": "0:01:35", "throughput": 2528.59, "total_tokens": 3484800} +{"current_steps": 7090, "total_steps": 7577, "loss": 0.1436, "lr": 2.5167372299613853e-08, "epoch": 0.935726540847301, "percentage": 93.57, "elapsed_time": "0:22:58", "remaining_time": "0:01:34", "throughput": 2529.92, "total_tokens": 3487488} +{"current_steps": 7095, "total_steps": 7577, "loss": 0.2508, "lr": 2.4656408534203365e-08, "epoch": 0.9363864326250495, "percentage": 93.64, "elapsed_time": "0:22:58", "remaining_time": "0:01:33", "throughput": 2530.96, "total_tokens": 3489728} +{"current_steps": 7100, "total_steps": 7577, "loss": 0.2469, "lr": 2.4150620310538273e-08, "epoch": 0.9370463244027979, "percentage": 93.7, "elapsed_time": "0:22:59", "remaining_time": "0:01:32", "throughput": 2531.94, "total_tokens": 3491904} +{"current_steps": 7105, "total_steps": 7577, "loss": 0.0832, "lr": 2.3650010312521673e-08, "epoch": 0.9377062161805464, "percentage": 93.77, "elapsed_time": "0:22:59", "remaining_time": "0:01:31", "throughput": 2533.28, "total_tokens": 3494592} +{"current_steps": 7110, "total_steps": 7577, "loss": 0.1798, "lr": 2.3154581196579648e-08, "epoch": 0.9383661079582949, "percentage": 93.84, "elapsed_time": "0:22:59", "remaining_time": "0:01:30", "throughput": 2534.48, "total_tokens": 3497088} +{"current_steps": 7115, "total_steps": 7577, "loss": 0.0559, "lr": 2.2664335591646377e-08, "epoch": 0.9390259997360433, "percentage": 93.9, "elapsed_time": "0:23:00", "remaining_time": "0:01:29", "throughput": 2535.65, "total_tokens": 3499520} +{"current_steps": 7120, "total_steps": 7577, "loss": 0.2113, "lr": 2.2179276099150158e-08, "epoch": 0.9396858915137918, "percentage": 93.97, "elapsed_time": "0:23:00", "remaining_time": "0:01:28", "throughput": 2536.98, "total_tokens": 3502208} +{"current_steps": 7125, "total_steps": 7577, "loss": 0.1584, "lr": 2.1699405293000182e-08, "epoch": 0.9403457832915402, "percentage": 94.03, "elapsed_time": "0:23:00", "remaining_time": "0:01:27", "throughput": 2538.14, "total_tokens": 3504640} +{"current_steps": 7130, "total_steps": 7577, "loss": 0.0448, "lr": 2.1224725719572235e-08, "epoch": 0.9410056750692887, "percentage": 94.1, "elapsed_time": "0:23:01", "remaining_time": "0:01:26", "throughput": 2539.21, "total_tokens": 3506944} +{"current_steps": 7135, "total_steps": 7577, "loss": 0.0454, "lr": 2.0755239897695453e-08, "epoch": 0.9416655668470371, "percentage": 94.17, "elapsed_time": "0:23:01", "remaining_time": "0:01:25", "throughput": 2540.37, "total_tokens": 3509376} +{"current_steps": 7140, "total_steps": 7577, "loss": 0.1705, "lr": 2.0290950318639256e-08, "epoch": 0.9423254586247856, "percentage": 94.23, "elapsed_time": "0:23:01", "remaining_time": "0:01:24", "throughput": 2541.44, "total_tokens": 3511680} +{"current_steps": 7145, "total_steps": 7577, "loss": 0.0576, "lr": 1.983185944609944e-08, "epoch": 0.942985350402534, "percentage": 94.3, "elapsed_time": "0:23:02", "remaining_time": "0:01:23", "throughput": 2542.6, "total_tokens": 3514112} +{"current_steps": 7150, "total_steps": 7577, "loss": 0.0709, "lr": 1.9377969716185994e-08, "epoch": 0.9436452421802825, "percentage": 94.36, "elapsed_time": "0:23:02", "remaining_time": "0:01:22", "throughput": 2543.71, "total_tokens": 3516480} +{"current_steps": 7155, "total_steps": 7577, "loss": 0.1222, "lr": 1.8929283537408968e-08, "epoch": 0.9443051339580308, "percentage": 94.43, "elapsed_time": "0:23:02", "remaining_time": "0:01:21", "throughput": 2544.74, "total_tokens": 3518720} +{"current_steps": 7160, "total_steps": 7577, "loss": 0.0012, "lr": 1.848580329066718e-08, "epoch": 0.9449650257357793, "percentage": 94.5, "elapsed_time": "0:23:03", "remaining_time": "0:01:20", "throughput": 2545.94, "total_tokens": 3521216} +{"current_steps": 7165, "total_steps": 7577, "loss": 0.4089, "lr": 1.804753132923431e-08, "epoch": 0.9456249175135277, "percentage": 94.56, "elapsed_time": "0:23:03", "remaining_time": "0:01:19", "throughput": 2547.18, "total_tokens": 3523776} +{"current_steps": 7170, "total_steps": 7577, "loss": 0.0013, "lr": 1.7614469978746827e-08, "epoch": 0.9462848092912762, "percentage": 94.63, "elapsed_time": "0:23:03", "remaining_time": "0:01:18", "throughput": 2548.38, "total_tokens": 3526272} +{"current_steps": 7175, "total_steps": 7577, "loss": 0.0095, "lr": 1.7186621537192304e-08, "epoch": 0.9469447010690247, "percentage": 94.69, "elapsed_time": "0:23:04", "remaining_time": "0:01:17", "throughput": 2549.45, "total_tokens": 3528576} +{"current_steps": 7180, "total_steps": 7577, "loss": 0.0009, "lr": 1.6763988274896003e-08, "epoch": 0.9476045928467731, "percentage": 94.76, "elapsed_time": "0:23:04", "remaining_time": "0:01:16", "throughput": 2550.69, "total_tokens": 3531136} +{"current_steps": 7185, "total_steps": 7577, "loss": 0.159, "lr": 1.6346572434509876e-08, "epoch": 0.9482644846245216, "percentage": 94.83, "elapsed_time": "0:23:04", "remaining_time": "0:01:15", "throughput": 2551.93, "total_tokens": 3533696} +{"current_steps": 7190, "total_steps": 7577, "loss": 0.1343, "lr": 1.5934376231000248e-08, "epoch": 0.94892437640227, "percentage": 94.89, "elapsed_time": "0:23:05", "remaining_time": "0:01:14", "throughput": 2553.04, "total_tokens": 3536064} +{"current_steps": 7195, "total_steps": 7577, "loss": 0.0016, "lr": 1.55274018516357e-08, "epoch": 0.9495842681800185, "percentage": 94.96, "elapsed_time": "0:23:05", "remaining_time": "0:01:13", "throughput": 2554.14, "total_tokens": 3538432} +{"current_steps": 7200, "total_steps": 7577, "loss": 0.0683, "lr": 1.512565145597633e-08, "epoch": 0.9502441599577669, "percentage": 95.02, "elapsed_time": "0:23:05", "remaining_time": "0:01:12", "throughput": 2555.47, "total_tokens": 3541120} +{"current_steps": 7201, "total_steps": 7577, "eval_loss": 0.09811879694461823, "epoch": 0.9503761383133166, "percentage": 95.04, "elapsed_time": "0:23:13", "remaining_time": "0:01:12", "throughput": 2541.26, "total_tokens": 3541632} +{"current_steps": 7205, "total_steps": 7577, "loss": 0.0802, "lr": 1.47291271758615e-08, "epoch": 0.9509040517355154, "percentage": 95.09, "elapsed_time": "0:23:57", "remaining_time": "0:01:14", "throughput": 2465.41, "total_tokens": 3543680} +{"current_steps": 7210, "total_steps": 7577, "loss": 0.1379, "lr": 1.4337831115398991e-08, "epoch": 0.9515639435132638, "percentage": 95.16, "elapsed_time": "0:23:57", "remaining_time": "0:01:13", "throughput": 2466.44, "total_tokens": 3545984} +{"current_steps": 7215, "total_steps": 7577, "loss": 0.1338, "lr": 1.3951765350953548e-08, "epoch": 0.9522238352910123, "percentage": 95.22, "elapsed_time": "0:23:58", "remaining_time": "0:01:12", "throughput": 2467.64, "total_tokens": 3548544} +{"current_steps": 7220, "total_steps": 7577, "loss": 0.0956, "lr": 1.3570931931136009e-08, "epoch": 0.9528837270687607, "percentage": 95.29, "elapsed_time": "0:23:58", "remaining_time": "0:01:11", "throughput": 2468.78, "total_tokens": 3551040} +{"current_steps": 7225, "total_steps": 7577, "loss": 0.0867, "lr": 1.3195332876792532e-08, "epoch": 0.9535436188465092, "percentage": 95.35, "elapsed_time": "0:23:58", "remaining_time": "0:01:10", "throughput": 2469.93, "total_tokens": 3553536} +{"current_steps": 7230, "total_steps": 7577, "loss": 0.1628, "lr": 1.2824970180993488e-08, "epoch": 0.9542035106242576, "percentage": 95.42, "elapsed_time": "0:23:59", "remaining_time": "0:01:09", "throughput": 2470.87, "total_tokens": 3555712} +{"current_steps": 7235, "total_steps": 7577, "loss": 0.1277, "lr": 1.2459845809023484e-08, "epoch": 0.9548634024020061, "percentage": 95.49, "elapsed_time": "0:23:59", "remaining_time": "0:01:08", "throughput": 2471.95, "total_tokens": 3558080} +{"current_steps": 7240, "total_steps": 7577, "loss": 0.3486, "lr": 1.2099961698370353e-08, "epoch": 0.9555232941797546, "percentage": 95.55, "elapsed_time": "0:23:59", "remaining_time": "0:01:07", "throughput": 2473.16, "total_tokens": 3560640} +{"current_steps": 7245, "total_steps": 7577, "loss": 0.0935, "lr": 1.1745319758715288e-08, "epoch": 0.956183185957503, "percentage": 95.62, "elapsed_time": "0:24:00", "remaining_time": "0:01:05", "throughput": 2474.49, "total_tokens": 3563392} +{"current_steps": 7250, "total_steps": 7577, "loss": 0.1487, "lr": 1.1395921871922509e-08, "epoch": 0.9568430777352515, "percentage": 95.68, "elapsed_time": "0:24:00", "remaining_time": "0:01:04", "throughput": 2475.61, "total_tokens": 3565824} +{"current_steps": 7255, "total_steps": 7577, "loss": 0.0008, "lr": 1.105176989202905e-08, "epoch": 0.9575029695129998, "percentage": 95.75, "elapsed_time": "0:24:00", "remaining_time": "0:01:03", "throughput": 2476.72, "total_tokens": 3568256} +{"current_steps": 7260, "total_steps": 7577, "loss": 0.0075, "lr": 1.0712865645235659e-08, "epoch": 0.9581628612907483, "percentage": 95.82, "elapsed_time": "0:24:01", "remaining_time": "0:01:02", "throughput": 2477.89, "total_tokens": 3570752} +{"current_steps": 7265, "total_steps": 7577, "loss": 0.0681, "lr": 1.0379210929896131e-08, "epoch": 0.9588227530684967, "percentage": 95.88, "elapsed_time": "0:24:01", "remaining_time": "0:01:01", "throughput": 2478.82, "total_tokens": 3572928} +{"current_steps": 7270, "total_steps": 7577, "loss": 0.1822, "lr": 1.0050807516508553e-08, "epoch": 0.9594826448462452, "percentage": 95.95, "elapsed_time": "0:24:01", "remaining_time": "0:01:00", "throughput": 2479.89, "total_tokens": 3575296} +{"current_steps": 7275, "total_steps": 7577, "loss": 0.0006, "lr": 9.727657147705737e-09, "epoch": 0.9601425366239936, "percentage": 96.01, "elapsed_time": "0:24:02", "remaining_time": "0:00:59", "throughput": 2480.96, "total_tokens": 3577664} +{"current_steps": 7280, "total_steps": 7577, "loss": 0.2031, "lr": 9.409761538245575e-09, "epoch": 0.9608024284017421, "percentage": 96.08, "elapsed_time": "0:24:02", "remaining_time": "0:00:58", "throughput": 2482.11, "total_tokens": 3580160} +{"current_steps": 7285, "total_steps": 7577, "loss": 0.1012, "lr": 9.097122375002264e-09, "epoch": 0.9614623201794905, "percentage": 96.15, "elapsed_time": "0:24:02", "remaining_time": "0:00:57", "throughput": 2483.13, "total_tokens": 3582464} +{"current_steps": 7290, "total_steps": 7577, "loss": 0.1369, "lr": 8.789741316957312e-09, "epoch": 0.962122211957239, "percentage": 96.21, "elapsed_time": "0:24:03", "remaining_time": "0:00:56", "throughput": 2484.24, "total_tokens": 3584896} +{"current_steps": 7295, "total_steps": 7577, "loss": 0.0152, "lr": 8.487619995190986e-09, "epoch": 0.9627821037349875, "percentage": 96.28, "elapsed_time": "0:24:03", "remaining_time": "0:00:55", "throughput": 2485.52, "total_tokens": 3587584} +{"current_steps": 7300, "total_steps": 7577, "loss": 0.1341, "lr": 8.19076001287311e-09, "epoch": 0.9634419955127359, "percentage": 96.34, "elapsed_time": "0:24:03", "remaining_time": "0:00:54", "throughput": 2486.72, "total_tokens": 3590144} +{"current_steps": 7305, "total_steps": 7577, "loss": 0.001, "lr": 7.899162945254945e-09, "epoch": 0.9641018872904844, "percentage": 96.41, "elapsed_time": "0:24:04", "remaining_time": "0:00:53", "throughput": 2488.0, "total_tokens": 3592832} +{"current_steps": 7310, "total_steps": 7577, "loss": 0.0999, "lr": 7.612830339660758e-09, "epoch": 0.9647617790682328, "percentage": 96.48, "elapsed_time": "0:24:04", "remaining_time": "0:00:52", "throughput": 2489.23, "total_tokens": 3595456} +{"current_steps": 7315, "total_steps": 7577, "loss": 0.1011, "lr": 7.3317637154796105e-09, "epoch": 0.9654216708459813, "percentage": 96.54, "elapsed_time": "0:24:04", "remaining_time": "0:00:51", "throughput": 2490.35, "total_tokens": 3597888} +{"current_steps": 7320, "total_steps": 7577, "loss": 0.0699, "lr": 7.0559645641572465e-09, "epoch": 0.9660815626237297, "percentage": 96.61, "elapsed_time": "0:24:05", "remaining_time": "0:00:50", "throughput": 2491.51, "total_tokens": 3600384} +{"current_steps": 7325, "total_steps": 7577, "loss": 0.1521, "lr": 6.785434349188102e-09, "epoch": 0.9667414544014782, "percentage": 96.67, "elapsed_time": "0:24:05", "remaining_time": "0:00:49", "throughput": 2492.67, "total_tokens": 3602880} +{"current_steps": 7330, "total_steps": 7577, "loss": 0.045, "lr": 6.520174506107867e-09, "epoch": 0.9674013461792266, "percentage": 96.74, "elapsed_time": "0:24:05", "remaining_time": "0:00:48", "throughput": 2493.74, "total_tokens": 3605248} +{"current_steps": 7335, "total_steps": 7577, "loss": 0.001, "lr": 6.260186442485494e-09, "epoch": 0.9680612379569751, "percentage": 96.81, "elapsed_time": "0:24:06", "remaining_time": "0:00:47", "throughput": 2494.94, "total_tokens": 3607808} +{"current_steps": 7340, "total_steps": 7577, "loss": 0.1172, "lr": 6.005471537915863e-09, "epoch": 0.9687211297347235, "percentage": 96.87, "elapsed_time": "0:24:06", "remaining_time": "0:00:46", "throughput": 2495.95, "total_tokens": 3610112} +{"current_steps": 7345, "total_steps": 7577, "loss": 0.0319, "lr": 5.756031144012685e-09, "epoch": 0.969381021512472, "percentage": 96.94, "elapsed_time": "0:24:06", "remaining_time": "0:00:45", "throughput": 2496.93, "total_tokens": 3612352} +{"current_steps": 7350, "total_steps": 7577, "loss": 0.1853, "lr": 5.511866584400837e-09, "epoch": 0.9700409132902204, "percentage": 97.0, "elapsed_time": "0:24:07", "remaining_time": "0:00:44", "throughput": 2498.08, "total_tokens": 3614848} +{"current_steps": 7355, "total_steps": 7577, "loss": 0.0038, "lr": 5.2729791547097e-09, "epoch": 0.9707008050679689, "percentage": 97.07, "elapsed_time": "0:24:07", "remaining_time": "0:00:43", "throughput": 2499.28, "total_tokens": 3617408} +{"current_steps": 7360, "total_steps": 7577, "loss": 0.1072, "lr": 5.039370122566389e-09, "epoch": 0.9713606968457174, "percentage": 97.14, "elapsed_time": "0:24:07", "remaining_time": "0:00:42", "throughput": 2500.47, "total_tokens": 3619968} +{"current_steps": 7365, "total_steps": 7577, "loss": 0.099, "lr": 4.811040727588755e-09, "epoch": 0.9720205886234657, "percentage": 97.2, "elapsed_time": "0:24:08", "remaining_time": "0:00:41", "throughput": 2501.32, "total_tokens": 3622016} +{"current_steps": 7370, "total_steps": 7577, "loss": 0.1695, "lr": 4.58799218137873e-09, "epoch": 0.9726804804012142, "percentage": 97.27, "elapsed_time": "0:24:08", "remaining_time": "0:00:40", "throughput": 2502.26, "total_tokens": 3624192} +{"current_steps": 7375, "total_steps": 7577, "loss": 0.0006, "lr": 4.370225667516325e-09, "epoch": 0.9733403721789626, "percentage": 97.33, "elapsed_time": "0:24:08", "remaining_time": "0:00:39", "throughput": 2503.36, "total_tokens": 3626624} +{"current_steps": 7380, "total_steps": 7577, "loss": 0.1853, "lr": 4.157742341552861e-09, "epoch": 0.9740002639567111, "percentage": 97.4, "elapsed_time": "0:24:09", "remaining_time": "0:00:38", "throughput": 2504.38, "total_tokens": 3628928} +{"current_steps": 7385, "total_steps": 7577, "loss": 0.1044, "lr": 3.950543331005307e-09, "epoch": 0.9746601557344595, "percentage": 97.47, "elapsed_time": "0:24:09", "remaining_time": "0:00:37", "throughput": 2505.62, "total_tokens": 3631552} +{"current_steps": 7390, "total_steps": 7577, "loss": 0.0016, "lr": 3.748629735349839e-09, "epoch": 0.975320047512208, "percentage": 97.53, "elapsed_time": "0:24:09", "remaining_time": "0:00:36", "throughput": 2506.72, "total_tokens": 3633984} +{"current_steps": 7395, "total_steps": 7577, "loss": 0.2102, "lr": 3.552002626016293e-09, "epoch": 0.9759799392899564, "percentage": 97.6, "elapsed_time": "0:24:10", "remaining_time": "0:00:35", "throughput": 2507.7, "total_tokens": 3636224} +{"current_steps": 7400, "total_steps": 7577, "loss": 0.2375, "lr": 3.3606630463824947e-09, "epoch": 0.9766398310677049, "percentage": 97.66, "elapsed_time": "0:24:10", "remaining_time": "0:00:34", "throughput": 2508.8, "total_tokens": 3638656} +{"current_steps": 7405, "total_steps": 7577, "loss": 0.0009, "lr": 3.174612011768607e-09, "epoch": 0.9772997228454533, "percentage": 97.73, "elapsed_time": "0:24:10", "remaining_time": "0:00:33", "throughput": 2510.11, "total_tokens": 3641408} +{"current_steps": 7410, "total_steps": 7577, "loss": 0.1826, "lr": 2.9938505094316834e-09, "epoch": 0.9779596146232018, "percentage": 97.8, "elapsed_time": "0:24:11", "remaining_time": "0:00:32", "throughput": 2511.19, "total_tokens": 3643840} +{"current_steps": 7415, "total_steps": 7577, "loss": 0.0801, "lr": 2.8183794985605637e-09, "epoch": 0.9786195064009502, "percentage": 97.86, "elapsed_time": "0:24:11", "remaining_time": "0:00:31", "throughput": 2512.3, "total_tokens": 3646336} +{"current_steps": 7420, "total_steps": 7577, "loss": 0.0731, "lr": 2.6481999102707654e-09, "epoch": 0.9792793981786987, "percentage": 97.93, "elapsed_time": "0:24:11", "remaining_time": "0:00:30", "throughput": 2513.52, "total_tokens": 3648960} +{"current_steps": 7425, "total_steps": 7577, "loss": 0.0011, "lr": 2.4833126475994894e-09, "epoch": 0.9799392899564472, "percentage": 97.99, "elapsed_time": "0:24:12", "remaining_time": "0:00:29", "throughput": 2514.49, "total_tokens": 3651200} +{"current_steps": 7430, "total_steps": 7577, "loss": 0.0073, "lr": 2.3237185855008443e-09, "epoch": 0.9805991817341956, "percentage": 98.06, "elapsed_time": "0:24:12", "remaining_time": "0:00:28", "throughput": 2515.5, "total_tokens": 3653504} +{"current_steps": 7435, "total_steps": 7577, "loss": 0.2482, "lr": 2.1694185708414083e-09, "epoch": 0.9812590735119441, "percentage": 98.13, "elapsed_time": "0:24:12", "remaining_time": "0:00:27", "throughput": 2516.68, "total_tokens": 3656064} +{"current_steps": 7440, "total_steps": 7577, "loss": 0.2875, "lr": 2.0204134223952284e-09, "epoch": 0.9819189652896925, "percentage": 98.19, "elapsed_time": "0:24:13", "remaining_time": "0:00:26", "throughput": 2517.53, "total_tokens": 3658112} +{"current_steps": 7445, "total_steps": 7577, "loss": 0.1509, "lr": 1.87670393083994e-09, "epoch": 0.982578857067441, "percentage": 98.26, "elapsed_time": "0:24:13", "remaining_time": "0:00:25", "throughput": 2518.88, "total_tokens": 3660928} +{"current_steps": 7450, "total_steps": 7577, "loss": 0.0779, "lr": 1.7382908587525447e-09, "epoch": 0.9832387488451894, "percentage": 98.32, "elapsed_time": "0:24:13", "remaining_time": "0:00:24", "throughput": 2519.9, "total_tokens": 3663232} +{"current_steps": 7455, "total_steps": 7577, "loss": 0.0016, "lr": 1.6051749406049697e-09, "epoch": 0.9838986406229379, "percentage": 98.39, "elapsed_time": "0:24:14", "remaining_time": "0:00:23", "throughput": 2520.95, "total_tokens": 3665600} +{"current_steps": 7460, "total_steps": 7577, "loss": 0.0008, "lr": 1.4773568827607386e-09, "epoch": 0.9845585324006862, "percentage": 98.46, "elapsed_time": "0:24:14", "remaining_time": "0:00:22", "throughput": 2522.09, "total_tokens": 3668096} +{"current_steps": 7465, "total_steps": 7577, "loss": 0.0016, "lr": 1.354837363470529e-09, "epoch": 0.9852184241784347, "percentage": 98.52, "elapsed_time": "0:24:14", "remaining_time": "0:00:21", "throughput": 2523.28, "total_tokens": 3670656} +{"current_steps": 7470, "total_steps": 7577, "loss": 0.0971, "lr": 1.23761703286962e-09, "epoch": 0.9858783159561831, "percentage": 98.59, "elapsed_time": "0:24:15", "remaining_time": "0:00:20", "throughput": 2524.33, "total_tokens": 3673024} +{"current_steps": 7475, "total_steps": 7577, "loss": 0.0012, "lr": 1.1256965129730068e-09, "epoch": 0.9865382077339316, "percentage": 98.65, "elapsed_time": "0:24:15", "remaining_time": "0:00:19", "throughput": 2525.59, "total_tokens": 3675712} +{"current_steps": 7480, "total_steps": 7577, "loss": 0.0803, "lr": 1.0190763976734018e-09, "epoch": 0.9871980995116801, "percentage": 98.72, "elapsed_time": "0:24:15", "remaining_time": "0:00:18", "throughput": 2526.65, "total_tokens": 3678080} +{"current_steps": 7485, "total_steps": 7577, "loss": 0.114, "lr": 9.177572527375721e-10, "epoch": 0.9878579912894285, "percentage": 98.79, "elapsed_time": "0:24:16", "remaining_time": "0:00:17", "throughput": 2527.71, "total_tokens": 3680448} +{"current_steps": 7490, "total_steps": 7577, "loss": 0.0938, "lr": 8.217396158030076e-10, "epoch": 0.988517883067177, "percentage": 98.85, "elapsed_time": "0:24:16", "remaining_time": "0:00:16", "throughput": 2528.72, "total_tokens": 3682752} +{"current_steps": 7495, "total_steps": 7577, "loss": 0.108, "lr": 7.310239963755904e-10, "epoch": 0.9891777748449254, "percentage": 98.92, "elapsed_time": "0:24:16", "remaining_time": "0:00:15", "throughput": 2529.93, "total_tokens": 3685376} +{"current_steps": 7500, "total_steps": 7577, "loss": 0.0012, "lr": 6.456108758268186e-10, "epoch": 0.9898376666226739, "percentage": 98.98, "elapsed_time": "0:24:17", "remaining_time": "0:00:14", "throughput": 2530.97, "total_tokens": 3687744} +{"current_steps": 7505, "total_steps": 7577, "loss": 0.1473, "lr": 5.655007073909202e-10, "epoch": 0.9904975584004223, "percentage": 99.05, "elapsed_time": "0:24:17", "remaining_time": "0:00:13", "throughput": 2532.1, "total_tokens": 3690240} +{"current_steps": 7510, "total_steps": 7577, "loss": 0.0775, "lr": 4.906939161627432e-10, "epoch": 0.9911574501781708, "percentage": 99.12, "elapsed_time": "0:24:17", "remaining_time": "0:00:13", "throughput": 2533.24, "total_tokens": 3692736} +{"current_steps": 7515, "total_steps": 7577, "loss": 0.2057, "lr": 4.2119089909542495e-10, "epoch": 0.9918173419559192, "percentage": 99.18, "elapsed_time": "0:24:18", "remaining_time": "0:00:12", "throughput": 2534.46, "total_tokens": 3695360} +{"current_steps": 7520, "total_steps": 7577, "loss": 0.0823, "lr": 3.569920249981706e-10, "epoch": 0.9924772337336677, "percentage": 99.25, "elapsed_time": "0:24:18", "remaining_time": "0:00:11", "throughput": 2535.59, "total_tokens": 3697856} +{"current_steps": 7525, "total_steps": 7577, "loss": 0.0409, "lr": 2.980976345344777e-10, "epoch": 0.9931371255114161, "percentage": 99.31, "elapsed_time": "0:24:18", "remaining_time": "0:00:10", "throughput": 2536.64, "total_tokens": 3700224} +{"current_steps": 7530, "total_steps": 7577, "loss": 0.0481, "lr": 2.445080402202482e-10, "epoch": 0.9937970172891646, "percentage": 99.38, "elapsed_time": "0:24:19", "remaining_time": "0:00:09", "throughput": 2537.69, "total_tokens": 3702592} +{"current_steps": 7535, "total_steps": 7577, "loss": 0.1701, "lr": 1.962235264222345e-10, "epoch": 0.994456909066913, "percentage": 99.45, "elapsed_time": "0:24:19", "remaining_time": "0:00:08", "throughput": 2538.7, "total_tokens": 3704896} +{"current_steps": 7540, "total_steps": 7577, "loss": 0.0378, "lr": 1.5324434935615195e-10, "epoch": 0.9951168008446615, "percentage": 99.51, "elapsed_time": "0:24:19", "remaining_time": "0:00:07", "throughput": 2539.72, "total_tokens": 3707264} +{"current_steps": 7545, "total_steps": 7577, "loss": 0.1023, "lr": 1.1557073708579057e-10, "epoch": 0.99577669262241, "percentage": 99.58, "elapsed_time": "0:24:20", "remaining_time": "0:00:06", "throughput": 2540.89, "total_tokens": 3709824} +{"current_steps": 7550, "total_steps": 7577, "loss": 0.0658, "lr": 8.320288952168297e-11, "epoch": 0.9964365844001584, "percentage": 99.64, "elapsed_time": "0:24:20", "remaining_time": "0:00:05", "throughput": 2541.92, "total_tokens": 3712192} +{"current_steps": 7555, "total_steps": 7577, "loss": 0.1099, "lr": 5.614097841988297e-11, "epoch": 0.9970964761779069, "percentage": 99.71, "elapsed_time": "0:24:20", "remaining_time": "0:00:04", "throughput": 2543.17, "total_tokens": 3714880} +{"current_steps": 7560, "total_steps": 7577, "loss": 0.0216, "lr": 3.43851473808554e-11, "epoch": 0.9977563679556553, "percentage": 99.78, "elapsed_time": "0:24:21", "remaining_time": "0:00:03", "throughput": 2544.16, "total_tokens": 3717184} +{"current_steps": 7565, "total_steps": 7577, "loss": 0.0521, "lr": 1.7935511849587192e-11, "epoch": 0.9984162597334038, "percentage": 99.84, "elapsed_time": "0:24:21", "remaining_time": "0:00:02", "throughput": 2545.13, "total_tokens": 3719424} +{"current_steps": 7570, "total_steps": 7577, "loss": 0.1418, "lr": 6.792159113921947e-12, "epoch": 0.9990761515111521, "percentage": 99.91, "elapsed_time": "0:24:21", "remaining_time": "0:00:01", "throughput": 2546.26, "total_tokens": 3721920} +{"current_steps": 7575, "total_steps": 7577, "loss": 0.0767, "lr": 9.55148304560005e-13, "epoch": 0.9997360432889006, "percentage": 99.97, "elapsed_time": "0:24:22", "remaining_time": "0:00:00", "throughput": 2547.31, "total_tokens": 3724288} +{"current_steps": 7577, "total_steps": 7577, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:25:13", "remaining_time": "0:00:00", "throughput": 2461.79, "total_tokens": 3725120} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..de5ad63 --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,12335 @@ +{ + "best_global_step": 5306, + "best_metric": 0.09362584352493286, + "best_model_checkpoint": "saves_bts_preliminary/base/llama-3.2-1b-instruct/train_sst2_42_1779354538/checkpoint-5306", + "epoch": 1.0, + "eval_steps": 379, + "global_step": 7577, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0006598917777484492, + "grad_norm": 438.2236328125, + "learning_rate": 1.0554089709762531e-08, + "loss": 1.4317, + "num_input_tokens_seen": 2240, + "step": 5 + }, + { + "epoch": 0.0013197835554968984, + "grad_norm": 445.3807678222656, + "learning_rate": 2.3746701846965696e-08, + "loss": 1.5404, + "num_input_tokens_seen": 4672, + "step": 10 + }, + { + "epoch": 0.0019796753332453477, + "grad_norm": 458.7563781738281, + "learning_rate": 3.6939313984168866e-08, + "loss": 1.4488, + "num_input_tokens_seen": 7040, + "step": 15 + }, + { + "epoch": 0.002639567110993797, + "grad_norm": 498.70074462890625, + "learning_rate": 5.013192612137203e-08, + "loss": 1.469, + "num_input_tokens_seen": 9600, + "step": 20 + }, + { + "epoch": 0.0032994588887422464, + "grad_norm": 452.42120361328125, + "learning_rate": 6.33245382585752e-08, + "loss": 1.3406, + "num_input_tokens_seen": 12160, + "step": 25 + }, + { + "epoch": 0.0039593506664906955, + "grad_norm": 394.526123046875, + "learning_rate": 7.651715039577835e-08, + "loss": 1.421, + "num_input_tokens_seen": 14528, + "step": 30 + }, + { + "epoch": 0.004619242444239145, + "grad_norm": 373.5523376464844, + "learning_rate": 8.970976253298153e-08, + "loss": 1.1582, + "num_input_tokens_seen": 16768, + "step": 35 + }, + { + "epoch": 0.005279134221987594, + "grad_norm": 333.46490478515625, + "learning_rate": 1.0290237467018468e-07, + "loss": 1.1864, + "num_input_tokens_seen": 19264, + "step": 40 + }, + { + "epoch": 0.005939025999736044, + "grad_norm": 272.6488342285156, + "learning_rate": 1.1609498680738786e-07, + "loss": 0.8458, + "num_input_tokens_seen": 21632, + "step": 45 + }, + { + "epoch": 0.006598917777484493, + "grad_norm": 193.0662384033203, + "learning_rate": 1.29287598944591e-07, + "loss": 0.7602, + "num_input_tokens_seen": 24000, + "step": 50 + }, + { + "epoch": 0.007258809555232942, + "grad_norm": 167.6585235595703, + "learning_rate": 1.424802110817942e-07, + "loss": 0.7195, + "num_input_tokens_seen": 26496, + "step": 55 + }, + { + "epoch": 0.007918701332981391, + "grad_norm": 51.53580856323242, + "learning_rate": 1.5567282321899736e-07, + "loss": 0.3928, + "num_input_tokens_seen": 29120, + "step": 60 + }, + { + "epoch": 0.008578593110729841, + "grad_norm": 29.78285026550293, + "learning_rate": 1.688654353562005e-07, + "loss": 0.3093, + "num_input_tokens_seen": 31744, + "step": 65 + }, + { + "epoch": 0.00923848488847829, + "grad_norm": 54.6888313293457, + "learning_rate": 1.820580474934037e-07, + "loss": 0.2986, + "num_input_tokens_seen": 34176, + "step": 70 + }, + { + "epoch": 0.009898376666226739, + "grad_norm": 53.20941925048828, + "learning_rate": 1.9525065963060686e-07, + "loss": 0.2998, + "num_input_tokens_seen": 36864, + "step": 75 + }, + { + "epoch": 0.010558268443975187, + "grad_norm": 28.97679328918457, + "learning_rate": 2.0844327176781002e-07, + "loss": 0.2555, + "num_input_tokens_seen": 39424, + "step": 80 + }, + { + "epoch": 0.011218160221723637, + "grad_norm": 37.55499267578125, + "learning_rate": 2.2163588390501316e-07, + "loss": 0.2595, + "num_input_tokens_seen": 42112, + "step": 85 + }, + { + "epoch": 0.011878051999472087, + "grad_norm": 32.20515060424805, + "learning_rate": 2.3482849604221635e-07, + "loss": 0.2567, + "num_input_tokens_seen": 44544, + "step": 90 + }, + { + "epoch": 0.012537943777220536, + "grad_norm": 45.711021423339844, + "learning_rate": 2.480211081794195e-07, + "loss": 0.1981, + "num_input_tokens_seen": 47104, + "step": 95 + }, + { + "epoch": 0.013197835554968985, + "grad_norm": 23.666234970092773, + "learning_rate": 2.612137203166227e-07, + "loss": 0.1626, + "num_input_tokens_seen": 49664, + "step": 100 + }, + { + "epoch": 0.013857727332717434, + "grad_norm": 21.503978729248047, + "learning_rate": 2.744063324538258e-07, + "loss": 0.1359, + "num_input_tokens_seen": 52352, + "step": 105 + }, + { + "epoch": 0.014517619110465884, + "grad_norm": 84.25057220458984, + "learning_rate": 2.8759894459102903e-07, + "loss": 0.1025, + "num_input_tokens_seen": 54720, + "step": 110 + }, + { + "epoch": 0.015177510888214334, + "grad_norm": 49.4913444519043, + "learning_rate": 3.007915567282322e-07, + "loss": 0.1435, + "num_input_tokens_seen": 57152, + "step": 115 + }, + { + "epoch": 0.015837402665962782, + "grad_norm": 98.1129379272461, + "learning_rate": 3.139841688654353e-07, + "loss": 0.2027, + "num_input_tokens_seen": 59776, + "step": 120 + }, + { + "epoch": 0.01649729444371123, + "grad_norm": 26.11796760559082, + "learning_rate": 3.271767810026385e-07, + "loss": 0.1344, + "num_input_tokens_seen": 62464, + "step": 125 + }, + { + "epoch": 0.017157186221459682, + "grad_norm": 80.43219757080078, + "learning_rate": 3.403693931398417e-07, + "loss": 0.1188, + "num_input_tokens_seen": 65088, + "step": 130 + }, + { + "epoch": 0.01781707799920813, + "grad_norm": 75.85595703125, + "learning_rate": 3.5356200527704485e-07, + "loss": 0.2073, + "num_input_tokens_seen": 67776, + "step": 135 + }, + { + "epoch": 0.01847696977695658, + "grad_norm": 69.01596069335938, + "learning_rate": 3.66754617414248e-07, + "loss": 0.2589, + "num_input_tokens_seen": 70400, + "step": 140 + }, + { + "epoch": 0.01913686155470503, + "grad_norm": 48.234092712402344, + "learning_rate": 3.7994722955145113e-07, + "loss": 0.1435, + "num_input_tokens_seen": 72704, + "step": 145 + }, + { + "epoch": 0.019796753332453478, + "grad_norm": 63.58314514160156, + "learning_rate": 3.9313984168865435e-07, + "loss": 0.3408, + "num_input_tokens_seen": 75136, + "step": 150 + }, + { + "epoch": 0.020456645110201926, + "grad_norm": 22.535675048828125, + "learning_rate": 4.063324538258575e-07, + "loss": 0.0612, + "num_input_tokens_seen": 77632, + "step": 155 + }, + { + "epoch": 0.021116536887950375, + "grad_norm": 69.68572998046875, + "learning_rate": 4.195250659630606e-07, + "loss": 0.2462, + "num_input_tokens_seen": 80320, + "step": 160 + }, + { + "epoch": 0.021776428665698826, + "grad_norm": 110.42927551269531, + "learning_rate": 4.3271767810026384e-07, + "loss": 0.1542, + "num_input_tokens_seen": 82752, + "step": 165 + }, + { + "epoch": 0.022436320443447275, + "grad_norm": 151.29769897460938, + "learning_rate": 4.45910290237467e-07, + "loss": 0.3088, + "num_input_tokens_seen": 85248, + "step": 170 + }, + { + "epoch": 0.023096212221195723, + "grad_norm": 170.58566284179688, + "learning_rate": 4.5910290237467017e-07, + "loss": 0.2887, + "num_input_tokens_seen": 87872, + "step": 175 + }, + { + "epoch": 0.023756103998944175, + "grad_norm": 51.48556137084961, + "learning_rate": 4.7229551451187333e-07, + "loss": 0.1364, + "num_input_tokens_seen": 90368, + "step": 180 + }, + { + "epoch": 0.024415995776692623, + "grad_norm": 31.3718204498291, + "learning_rate": 4.854881266490765e-07, + "loss": 0.0589, + "num_input_tokens_seen": 92928, + "step": 185 + }, + { + "epoch": 0.02507588755444107, + "grad_norm": 66.79593658447266, + "learning_rate": 4.986807387862796e-07, + "loss": 0.1639, + "num_input_tokens_seen": 95296, + "step": 190 + }, + { + "epoch": 0.02573577933218952, + "grad_norm": 57.898441314697266, + "learning_rate": 5.118733509234829e-07, + "loss": 0.1103, + "num_input_tokens_seen": 97984, + "step": 195 + }, + { + "epoch": 0.02639567110993797, + "grad_norm": 106.46971130371094, + "learning_rate": 5.250659630606859e-07, + "loss": 0.2017, + "num_input_tokens_seen": 100352, + "step": 200 + }, + { + "epoch": 0.02705556288768642, + "grad_norm": 17.6440372467041, + "learning_rate": 5.382585751978892e-07, + "loss": 0.1383, + "num_input_tokens_seen": 102464, + "step": 205 + }, + { + "epoch": 0.027715454665434867, + "grad_norm": 14.92352294921875, + "learning_rate": 5.514511873350924e-07, + "loss": 0.1266, + "num_input_tokens_seen": 105088, + "step": 210 + }, + { + "epoch": 0.02837534644318332, + "grad_norm": 16.06985092163086, + "learning_rate": 5.646437994722954e-07, + "loss": 0.3019, + "num_input_tokens_seen": 107648, + "step": 215 + }, + { + "epoch": 0.029035238220931767, + "grad_norm": 108.87126159667969, + "learning_rate": 5.778364116094987e-07, + "loss": 0.2375, + "num_input_tokens_seen": 110144, + "step": 220 + }, + { + "epoch": 0.029695129998680216, + "grad_norm": 33.7409553527832, + "learning_rate": 5.910290237467019e-07, + "loss": 0.1332, + "num_input_tokens_seen": 112576, + "step": 225 + }, + { + "epoch": 0.030355021776428667, + "grad_norm": 58.12620162963867, + "learning_rate": 6.042216358839049e-07, + "loss": 0.2314, + "num_input_tokens_seen": 115264, + "step": 230 + }, + { + "epoch": 0.031014913554177116, + "grad_norm": 19.326017379760742, + "learning_rate": 6.174142480211082e-07, + "loss": 0.0848, + "num_input_tokens_seen": 117888, + "step": 235 + }, + { + "epoch": 0.031674805331925564, + "grad_norm": 34.517738342285156, + "learning_rate": 6.306068601583114e-07, + "loss": 0.0189, + "num_input_tokens_seen": 120320, + "step": 240 + }, + { + "epoch": 0.032334697109674015, + "grad_norm": 89.7800521850586, + "learning_rate": 6.437994722955144e-07, + "loss": 0.1826, + "num_input_tokens_seen": 122688, + "step": 245 + }, + { + "epoch": 0.03299458888742246, + "grad_norm": 81.10912322998047, + "learning_rate": 6.569920844327177e-07, + "loss": 0.2716, + "num_input_tokens_seen": 125248, + "step": 250 + }, + { + "epoch": 0.03365448066517091, + "grad_norm": 89.25950622558594, + "learning_rate": 6.701846965699208e-07, + "loss": 0.203, + "num_input_tokens_seen": 127680, + "step": 255 + }, + { + "epoch": 0.034314372442919364, + "grad_norm": 19.84525489807129, + "learning_rate": 6.833773087071239e-07, + "loss": 0.083, + "num_input_tokens_seen": 130496, + "step": 260 + }, + { + "epoch": 0.03497426422066781, + "grad_norm": 34.019805908203125, + "learning_rate": 6.965699208443272e-07, + "loss": 0.1837, + "num_input_tokens_seen": 132992, + "step": 265 + }, + { + "epoch": 0.03563415599841626, + "grad_norm": 63.352012634277344, + "learning_rate": 7.097625329815303e-07, + "loss": 0.1372, + "num_input_tokens_seen": 135040, + "step": 270 + }, + { + "epoch": 0.03629404777616471, + "grad_norm": 70.96591186523438, + "learning_rate": 7.229551451187335e-07, + "loss": 0.258, + "num_input_tokens_seen": 137600, + "step": 275 + }, + { + "epoch": 0.03695393955391316, + "grad_norm": 57.32151412963867, + "learning_rate": 7.361477572559367e-07, + "loss": 0.1103, + "num_input_tokens_seen": 139904, + "step": 280 + }, + { + "epoch": 0.03761383133166161, + "grad_norm": 16.635353088378906, + "learning_rate": 7.493403693931398e-07, + "loss": 0.1476, + "num_input_tokens_seen": 142016, + "step": 285 + }, + { + "epoch": 0.03827372310941006, + "grad_norm": 9.866713523864746, + "learning_rate": 7.62532981530343e-07, + "loss": 0.0087, + "num_input_tokens_seen": 144576, + "step": 290 + }, + { + "epoch": 0.038933614887158505, + "grad_norm": 118.24456024169922, + "learning_rate": 7.757255936675461e-07, + "loss": 0.085, + "num_input_tokens_seen": 146880, + "step": 295 + }, + { + "epoch": 0.039593506664906956, + "grad_norm": 92.64739990234375, + "learning_rate": 7.889182058047493e-07, + "loss": 0.3963, + "num_input_tokens_seen": 149184, + "step": 300 + }, + { + "epoch": 0.0402533984426554, + "grad_norm": 0.17220743000507355, + "learning_rate": 8.021108179419525e-07, + "loss": 0.221, + "num_input_tokens_seen": 151296, + "step": 305 + }, + { + "epoch": 0.04091329022040385, + "grad_norm": 89.11080932617188, + "learning_rate": 8.153034300791555e-07, + "loss": 0.2076, + "num_input_tokens_seen": 153664, + "step": 310 + }, + { + "epoch": 0.041573181998152305, + "grad_norm": 35.5322265625, + "learning_rate": 8.284960422163588e-07, + "loss": 0.2588, + "num_input_tokens_seen": 156032, + "step": 315 + }, + { + "epoch": 0.04223307377590075, + "grad_norm": 0.28457769751548767, + "learning_rate": 8.41688654353562e-07, + "loss": 0.227, + "num_input_tokens_seen": 158528, + "step": 320 + }, + { + "epoch": 0.0428929655536492, + "grad_norm": 14.495915412902832, + "learning_rate": 8.54881266490765e-07, + "loss": 0.12, + "num_input_tokens_seen": 160704, + "step": 325 + }, + { + "epoch": 0.04355285733139765, + "grad_norm": 5.979187965393066, + "learning_rate": 8.680738786279683e-07, + "loss": 0.1931, + "num_input_tokens_seen": 163072, + "step": 330 + }, + { + "epoch": 0.0442127491091461, + "grad_norm": 65.1185302734375, + "learning_rate": 8.812664907651715e-07, + "loss": 0.1389, + "num_input_tokens_seen": 165568, + "step": 335 + }, + { + "epoch": 0.04487264088689455, + "grad_norm": 0.6913341283798218, + "learning_rate": 8.944591029023745e-07, + "loss": 0.2857, + "num_input_tokens_seen": 167936, + "step": 340 + }, + { + "epoch": 0.045532532664643, + "grad_norm": 178.3228759765625, + "learning_rate": 9.076517150395778e-07, + "loss": 0.0616, + "num_input_tokens_seen": 170176, + "step": 345 + }, + { + "epoch": 0.046192424442391446, + "grad_norm": 140.8086700439453, + "learning_rate": 9.20844327176781e-07, + "loss": 0.149, + "num_input_tokens_seen": 172352, + "step": 350 + }, + { + "epoch": 0.0468523162201399, + "grad_norm": 42.391597747802734, + "learning_rate": 9.340369393139841e-07, + "loss": 0.2579, + "num_input_tokens_seen": 175168, + "step": 355 + }, + { + "epoch": 0.04751220799788835, + "grad_norm": 2.5807368755340576, + "learning_rate": 9.472295514511873e-07, + "loss": 0.1596, + "num_input_tokens_seen": 177856, + "step": 360 + }, + { + "epoch": 0.048172099775636794, + "grad_norm": 41.364768981933594, + "learning_rate": 9.604221635883904e-07, + "loss": 0.2923, + "num_input_tokens_seen": 180160, + "step": 365 + }, + { + "epoch": 0.048831991553385246, + "grad_norm": 139.357177734375, + "learning_rate": 9.736147757255936e-07, + "loss": 0.2137, + "num_input_tokens_seen": 182784, + "step": 370 + }, + { + "epoch": 0.0494918833311337, + "grad_norm": 1.2181538343429565, + "learning_rate": 9.86807387862797e-07, + "loss": 0.0578, + "num_input_tokens_seen": 185024, + "step": 375 + }, + { + "epoch": 0.05001979675333245, + "eval_loss": 0.16884121298789978, + "eval_runtime": 7.8728, + "eval_samples_per_second": 855.48, + "eval_steps_per_second": 106.951, + "num_input_tokens_seen": 187072, + "step": 379 + }, + { + "epoch": 0.05015177510888214, + "grad_norm": 64.27156066894531, + "learning_rate": 1e-06, + "loss": 0.1527, + "num_input_tokens_seen": 187712, + "step": 380 + }, + { + "epoch": 0.050811666886630594, + "grad_norm": 49.03231430053711, + "learning_rate": 1.0131926121372032e-06, + "loss": 0.2528, + "num_input_tokens_seen": 190400, + "step": 385 + }, + { + "epoch": 0.05147155866437904, + "grad_norm": 53.97622299194336, + "learning_rate": 1.0263852242744063e-06, + "loss": 0.1124, + "num_input_tokens_seen": 193280, + "step": 390 + }, + { + "epoch": 0.05213145044212749, + "grad_norm": 38.25093078613281, + "learning_rate": 1.0395778364116096e-06, + "loss": 0.1545, + "num_input_tokens_seen": 195584, + "step": 395 + }, + { + "epoch": 0.05279134221987594, + "grad_norm": 23.770427703857422, + "learning_rate": 1.0527704485488126e-06, + "loss": 0.0824, + "num_input_tokens_seen": 198208, + "step": 400 + }, + { + "epoch": 0.05345123399762439, + "grad_norm": 109.20024871826172, + "learning_rate": 1.0659630606860157e-06, + "loss": 0.255, + "num_input_tokens_seen": 200704, + "step": 405 + }, + { + "epoch": 0.05411112577537284, + "grad_norm": 86.4642333984375, + "learning_rate": 1.079155672823219e-06, + "loss": 0.2055, + "num_input_tokens_seen": 203136, + "step": 410 + }, + { + "epoch": 0.05477101755312129, + "grad_norm": 77.17768859863281, + "learning_rate": 1.0923482849604222e-06, + "loss": 0.1496, + "num_input_tokens_seen": 205504, + "step": 415 + }, + { + "epoch": 0.055430909330869735, + "grad_norm": 90.73381042480469, + "learning_rate": 1.1055408970976253e-06, + "loss": 0.2539, + "num_input_tokens_seen": 208000, + "step": 420 + }, + { + "epoch": 0.056090801108618187, + "grad_norm": 227.53492736816406, + "learning_rate": 1.1187335092348285e-06, + "loss": 0.1106, + "num_input_tokens_seen": 210560, + "step": 425 + }, + { + "epoch": 0.05675069288636664, + "grad_norm": 39.24838638305664, + "learning_rate": 1.1319261213720316e-06, + "loss": 0.1771, + "num_input_tokens_seen": 213056, + "step": 430 + }, + { + "epoch": 0.05741058466411508, + "grad_norm": 54.15324020385742, + "learning_rate": 1.1451187335092347e-06, + "loss": 0.1155, + "num_input_tokens_seen": 215296, + "step": 435 + }, + { + "epoch": 0.058070476441863535, + "grad_norm": 0.09268882125616074, + "learning_rate": 1.158311345646438e-06, + "loss": 0.0203, + "num_input_tokens_seen": 217472, + "step": 440 + }, + { + "epoch": 0.058730368219611986, + "grad_norm": 126.56912994384766, + "learning_rate": 1.1715039577836412e-06, + "loss": 0.0346, + "num_input_tokens_seen": 219968, + "step": 445 + }, + { + "epoch": 0.05939025999736043, + "grad_norm": 0.09806288778781891, + "learning_rate": 1.1846965699208443e-06, + "loss": 0.0218, + "num_input_tokens_seen": 222592, + "step": 450 + }, + { + "epoch": 0.06005015177510888, + "grad_norm": 183.16590881347656, + "learning_rate": 1.1978891820580475e-06, + "loss": 0.522, + "num_input_tokens_seen": 224768, + "step": 455 + }, + { + "epoch": 0.060710043552857335, + "grad_norm": 3.036947250366211, + "learning_rate": 1.2110817941952508e-06, + "loss": 0.2349, + "num_input_tokens_seen": 227264, + "step": 460 + }, + { + "epoch": 0.06136993533060578, + "grad_norm": 18.994815826416016, + "learning_rate": 1.2242744063324536e-06, + "loss": 0.2363, + "num_input_tokens_seen": 229760, + "step": 465 + }, + { + "epoch": 0.06202982710835423, + "grad_norm": 97.5959243774414, + "learning_rate": 1.237467018469657e-06, + "loss": 0.1719, + "num_input_tokens_seen": 232000, + "step": 470 + }, + { + "epoch": 0.06268971888610268, + "grad_norm": 2.0452661514282227, + "learning_rate": 1.2506596306068602e-06, + "loss": 0.1564, + "num_input_tokens_seen": 234176, + "step": 475 + }, + { + "epoch": 0.06334961066385113, + "grad_norm": 0.3037824034690857, + "learning_rate": 1.2638522427440632e-06, + "loss": 0.0993, + "num_input_tokens_seen": 236736, + "step": 480 + }, + { + "epoch": 0.06400950244159957, + "grad_norm": 0.12219711393117905, + "learning_rate": 1.2770448548812665e-06, + "loss": 0.006, + "num_input_tokens_seen": 239104, + "step": 485 + }, + { + "epoch": 0.06466939421934803, + "grad_norm": 166.3263702392578, + "learning_rate": 1.2902374670184698e-06, + "loss": 0.3751, + "num_input_tokens_seen": 241600, + "step": 490 + }, + { + "epoch": 0.06532928599709648, + "grad_norm": 131.08555603027344, + "learning_rate": 1.3034300791556726e-06, + "loss": 0.31, + "num_input_tokens_seen": 244160, + "step": 495 + }, + { + "epoch": 0.06598917777484492, + "grad_norm": 1.1034032106399536, + "learning_rate": 1.316622691292876e-06, + "loss": 0.1775, + "num_input_tokens_seen": 246464, + "step": 500 + }, + { + "epoch": 0.06664906955259338, + "grad_norm": 1.8536452054977417, + "learning_rate": 1.3298153034300792e-06, + "loss": 0.0849, + "num_input_tokens_seen": 248960, + "step": 505 + }, + { + "epoch": 0.06730896133034182, + "grad_norm": 91.25196075439453, + "learning_rate": 1.3430079155672822e-06, + "loss": 0.1716, + "num_input_tokens_seen": 251392, + "step": 510 + }, + { + "epoch": 0.06796885310809027, + "grad_norm": 30.315645217895508, + "learning_rate": 1.3562005277044855e-06, + "loss": 0.2321, + "num_input_tokens_seen": 253888, + "step": 515 + }, + { + "epoch": 0.06862874488583873, + "grad_norm": 20.200546264648438, + "learning_rate": 1.3693931398416888e-06, + "loss": 0.1398, + "num_input_tokens_seen": 256384, + "step": 520 + }, + { + "epoch": 0.06928863666358717, + "grad_norm": 70.2831039428711, + "learning_rate": 1.3825857519788916e-06, + "loss": 0.1866, + "num_input_tokens_seen": 258496, + "step": 525 + }, + { + "epoch": 0.06994852844133562, + "grad_norm": 0.08841226994991302, + "learning_rate": 1.3957783641160949e-06, + "loss": 0.1035, + "num_input_tokens_seen": 260864, + "step": 530 + }, + { + "epoch": 0.07060842021908408, + "grad_norm": 16.285932540893555, + "learning_rate": 1.4089709762532982e-06, + "loss": 0.0497, + "num_input_tokens_seen": 263360, + "step": 535 + }, + { + "epoch": 0.07126831199683252, + "grad_norm": 291.2605285644531, + "learning_rate": 1.4221635883905012e-06, + "loss": 0.3041, + "num_input_tokens_seen": 266112, + "step": 540 + }, + { + "epoch": 0.07192820377458096, + "grad_norm": 41.77130889892578, + "learning_rate": 1.4353562005277045e-06, + "loss": 0.2543, + "num_input_tokens_seen": 268544, + "step": 545 + }, + { + "epoch": 0.07258809555232942, + "grad_norm": 0.281996488571167, + "learning_rate": 1.4485488126649078e-06, + "loss": 0.4179, + "num_input_tokens_seen": 270912, + "step": 550 + }, + { + "epoch": 0.07324798733007787, + "grad_norm": 0.33394086360931396, + "learning_rate": 1.4617414248021108e-06, + "loss": 0.0028, + "num_input_tokens_seen": 273664, + "step": 555 + }, + { + "epoch": 0.07390787910782631, + "grad_norm": 92.83995819091797, + "learning_rate": 1.4749340369393139e-06, + "loss": 0.1789, + "num_input_tokens_seen": 276160, + "step": 560 + }, + { + "epoch": 0.07456777088557477, + "grad_norm": 0.3077968955039978, + "learning_rate": 1.4881266490765171e-06, + "loss": 0.0054, + "num_input_tokens_seen": 278784, + "step": 565 + }, + { + "epoch": 0.07522766266332322, + "grad_norm": 28.540903091430664, + "learning_rate": 1.5013192612137202e-06, + "loss": 0.2245, + "num_input_tokens_seen": 281152, + "step": 570 + }, + { + "epoch": 0.07588755444107166, + "grad_norm": 75.34148406982422, + "learning_rate": 1.5145118733509235e-06, + "loss": 0.2359, + "num_input_tokens_seen": 283456, + "step": 575 + }, + { + "epoch": 0.07654744621882012, + "grad_norm": 2.8185484409332275, + "learning_rate": 1.5277044854881265e-06, + "loss": 0.0789, + "num_input_tokens_seen": 286016, + "step": 580 + }, + { + "epoch": 0.07720733799656856, + "grad_norm": 0.16082888841629028, + "learning_rate": 1.5408970976253298e-06, + "loss": 0.1872, + "num_input_tokens_seen": 288448, + "step": 585 + }, + { + "epoch": 0.07786722977431701, + "grad_norm": 0.02060079760849476, + "learning_rate": 1.5540897097625329e-06, + "loss": 0.1543, + "num_input_tokens_seen": 290816, + "step": 590 + }, + { + "epoch": 0.07852712155206547, + "grad_norm": 66.97010803222656, + "learning_rate": 1.567282321899736e-06, + "loss": 0.2174, + "num_input_tokens_seen": 293504, + "step": 595 + }, + { + "epoch": 0.07918701332981391, + "grad_norm": 0.04142444580793381, + "learning_rate": 1.5804749340369392e-06, + "loss": 0.1323, + "num_input_tokens_seen": 295744, + "step": 600 + }, + { + "epoch": 0.07984690510756236, + "grad_norm": 0.039387296885252, + "learning_rate": 1.5936675461741425e-06, + "loss": 0.0865, + "num_input_tokens_seen": 298112, + "step": 605 + }, + { + "epoch": 0.0805067968853108, + "grad_norm": 93.4574203491211, + "learning_rate": 1.6068601583113455e-06, + "loss": 0.1034, + "num_input_tokens_seen": 300608, + "step": 610 + }, + { + "epoch": 0.08116668866305926, + "grad_norm": 0.054611898958683014, + "learning_rate": 1.6200527704485488e-06, + "loss": 0.0048, + "num_input_tokens_seen": 303360, + "step": 615 + }, + { + "epoch": 0.0818265804408077, + "grad_norm": 4.433136940002441, + "learning_rate": 1.633245382585752e-06, + "loss": 0.0325, + "num_input_tokens_seen": 305920, + "step": 620 + }, + { + "epoch": 0.08248647221855615, + "grad_norm": 1.7903838157653809, + "learning_rate": 1.646437994722955e-06, + "loss": 0.0698, + "num_input_tokens_seen": 308416, + "step": 625 + }, + { + "epoch": 0.08314636399630461, + "grad_norm": 0.04191221296787262, + "learning_rate": 1.6596306068601582e-06, + "loss": 0.1542, + "num_input_tokens_seen": 310848, + "step": 630 + }, + { + "epoch": 0.08380625577405305, + "grad_norm": 60.00360107421875, + "learning_rate": 1.6728232189973614e-06, + "loss": 0.225, + "num_input_tokens_seen": 313408, + "step": 635 + }, + { + "epoch": 0.0844661475518015, + "grad_norm": 77.6712417602539, + "learning_rate": 1.6860158311345645e-06, + "loss": 0.0946, + "num_input_tokens_seen": 315904, + "step": 640 + }, + { + "epoch": 0.08512603932954996, + "grad_norm": 63.06571578979492, + "learning_rate": 1.6992084432717678e-06, + "loss": 0.2463, + "num_input_tokens_seen": 318080, + "step": 645 + }, + { + "epoch": 0.0857859311072984, + "grad_norm": 3.3637969493865967, + "learning_rate": 1.712401055408971e-06, + "loss": 0.0751, + "num_input_tokens_seen": 320256, + "step": 650 + }, + { + "epoch": 0.08644582288504685, + "grad_norm": 0.38727056980133057, + "learning_rate": 1.7255936675461739e-06, + "loss": 0.0116, + "num_input_tokens_seen": 322496, + "step": 655 + }, + { + "epoch": 0.0871057146627953, + "grad_norm": 62.513736724853516, + "learning_rate": 1.7387862796833772e-06, + "loss": 0.1616, + "num_input_tokens_seen": 325120, + "step": 660 + }, + { + "epoch": 0.08776560644054375, + "grad_norm": 270.4856872558594, + "learning_rate": 1.7519788918205804e-06, + "loss": 0.0802, + "num_input_tokens_seen": 327296, + "step": 665 + }, + { + "epoch": 0.0884254982182922, + "grad_norm": 42.6474723815918, + "learning_rate": 1.7651715039577835e-06, + "loss": 0.4002, + "num_input_tokens_seen": 329664, + "step": 670 + }, + { + "epoch": 0.08908538999604065, + "grad_norm": 24.991104125976562, + "learning_rate": 1.7783641160949868e-06, + "loss": 0.0953, + "num_input_tokens_seen": 332416, + "step": 675 + }, + { + "epoch": 0.0897452817737891, + "grad_norm": 0.23048889636993408, + "learning_rate": 1.79155672823219e-06, + "loss": 0.0779, + "num_input_tokens_seen": 334976, + "step": 680 + }, + { + "epoch": 0.09040517355153754, + "grad_norm": 0.02817719615995884, + "learning_rate": 1.8047493403693929e-06, + "loss": 0.0366, + "num_input_tokens_seen": 337472, + "step": 685 + }, + { + "epoch": 0.091065065329286, + "grad_norm": 6.201309680938721, + "learning_rate": 1.8179419525065961e-06, + "loss": 0.1887, + "num_input_tokens_seen": 339904, + "step": 690 + }, + { + "epoch": 0.09172495710703445, + "grad_norm": 85.3891830444336, + "learning_rate": 1.8311345646437994e-06, + "loss": 0.2216, + "num_input_tokens_seen": 342272, + "step": 695 + }, + { + "epoch": 0.09238484888478289, + "grad_norm": 0.08057679235935211, + "learning_rate": 1.8443271767810025e-06, + "loss": 0.197, + "num_input_tokens_seen": 344640, + "step": 700 + }, + { + "epoch": 0.09304474066253135, + "grad_norm": 0.027219658717513084, + "learning_rate": 1.8575197889182057e-06, + "loss": 0.0457, + "num_input_tokens_seen": 347072, + "step": 705 + }, + { + "epoch": 0.0937046324402798, + "grad_norm": 0.05592739209532738, + "learning_rate": 1.870712401055409e-06, + "loss": 0.1862, + "num_input_tokens_seen": 349696, + "step": 710 + }, + { + "epoch": 0.09436452421802824, + "grad_norm": 4.520129680633545, + "learning_rate": 1.883905013192612e-06, + "loss": 0.0762, + "num_input_tokens_seen": 352256, + "step": 715 + }, + { + "epoch": 0.0950244159957767, + "grad_norm": 0.11173778027296066, + "learning_rate": 1.8970976253298151e-06, + "loss": 0.1502, + "num_input_tokens_seen": 355008, + "step": 720 + }, + { + "epoch": 0.09568430777352514, + "grad_norm": 173.77919006347656, + "learning_rate": 1.9102902374670186e-06, + "loss": 0.2955, + "num_input_tokens_seen": 357376, + "step": 725 + }, + { + "epoch": 0.09634419955127359, + "grad_norm": 2.091977119445801, + "learning_rate": 1.9234828496042215e-06, + "loss": 0.1803, + "num_input_tokens_seen": 359680, + "step": 730 + }, + { + "epoch": 0.09700409132902205, + "grad_norm": 0.5139044523239136, + "learning_rate": 1.9366754617414247e-06, + "loss": 0.1343, + "num_input_tokens_seen": 362176, + "step": 735 + }, + { + "epoch": 0.09766398310677049, + "grad_norm": 0.8499874472618103, + "learning_rate": 1.949868073878628e-06, + "loss": 0.0823, + "num_input_tokens_seen": 365056, + "step": 740 + }, + { + "epoch": 0.09832387488451894, + "grad_norm": 0.42520672082901, + "learning_rate": 1.963060686015831e-06, + "loss": 0.3164, + "num_input_tokens_seen": 367488, + "step": 745 + }, + { + "epoch": 0.0989837666622674, + "grad_norm": 0.8814378976821899, + "learning_rate": 1.976253298153034e-06, + "loss": 0.3437, + "num_input_tokens_seen": 369792, + "step": 750 + }, + { + "epoch": 0.09964365844001584, + "grad_norm": 114.21378326416016, + "learning_rate": 1.9894459102902374e-06, + "loss": 0.1097, + "num_input_tokens_seen": 372160, + "step": 755 + }, + { + "epoch": 0.1000395935066649, + "eval_loss": 0.13667261600494385, + "eval_runtime": 7.9292, + "eval_samples_per_second": 849.39, + "eval_steps_per_second": 106.19, + "num_input_tokens_seen": 373504, + "step": 758 + }, + { + "epoch": 0.10030355021776428, + "grad_norm": 2.3556041717529297, + "learning_rate": 1.9999998938723955e-06, + "loss": 0.1005, + "num_input_tokens_seen": 374272, + "step": 760 + }, + { + "epoch": 0.10096344199551274, + "grad_norm": 4.03176212310791, + "learning_rate": 1.9999961794086063e-06, + "loss": 0.0727, + "num_input_tokens_seen": 376704, + "step": 765 + }, + { + "epoch": 0.10162333377326119, + "grad_norm": 250.72093200683594, + "learning_rate": 1.999987158587122e-06, + "loss": 0.287, + "num_input_tokens_seen": 379136, + "step": 770 + }, + { + "epoch": 0.10228322555100963, + "grad_norm": 42.057003021240234, + "learning_rate": 1.9999728314558114e-06, + "loss": 0.1199, + "num_input_tokens_seen": 381568, + "step": 775 + }, + { + "epoch": 0.10294311732875808, + "grad_norm": 0.05412933975458145, + "learning_rate": 1.9999531980906988e-06, + "loss": 0.2967, + "num_input_tokens_seen": 384128, + "step": 780 + }, + { + "epoch": 0.10360300910650654, + "grad_norm": 40.294551849365234, + "learning_rate": 1.999928258595967e-06, + "loss": 0.227, + "num_input_tokens_seen": 386304, + "step": 785 + }, + { + "epoch": 0.10426290088425498, + "grad_norm": 21.820249557495117, + "learning_rate": 1.9998980131039534e-06, + "loss": 0.3706, + "num_input_tokens_seen": 388864, + "step": 790 + }, + { + "epoch": 0.10492279266200343, + "grad_norm": 29.383682250976562, + "learning_rate": 1.999862461775153e-06, + "loss": 0.0609, + "num_input_tokens_seen": 391104, + "step": 795 + }, + { + "epoch": 0.10558268443975188, + "grad_norm": 19.28838539123535, + "learning_rate": 1.999821604798214e-06, + "loss": 0.1122, + "num_input_tokens_seen": 393856, + "step": 800 + }, + { + "epoch": 0.10624257621750033, + "grad_norm": 38.194297790527344, + "learning_rate": 1.999775442389939e-06, + "loss": 0.2655, + "num_input_tokens_seen": 396352, + "step": 805 + }, + { + "epoch": 0.10690246799524877, + "grad_norm": 1.154589295387268, + "learning_rate": 1.9997239747952843e-06, + "loss": 0.1068, + "num_input_tokens_seen": 398592, + "step": 810 + }, + { + "epoch": 0.10756235977299723, + "grad_norm": 97.90460968017578, + "learning_rate": 1.9996672022873546e-06, + "loss": 0.0669, + "num_input_tokens_seen": 401088, + "step": 815 + }, + { + "epoch": 0.10822225155074568, + "grad_norm": 133.7577362060547, + "learning_rate": 1.9996051251674073e-06, + "loss": 0.1053, + "num_input_tokens_seen": 403456, + "step": 820 + }, + { + "epoch": 0.10888214332849412, + "grad_norm": 41.88015365600586, + "learning_rate": 1.999537743764847e-06, + "loss": 0.3053, + "num_input_tokens_seen": 405696, + "step": 825 + }, + { + "epoch": 0.10954203510624258, + "grad_norm": 22.91583251953125, + "learning_rate": 1.999465058437225e-06, + "loss": 0.4762, + "num_input_tokens_seen": 408128, + "step": 830 + }, + { + "epoch": 0.11020192688399102, + "grad_norm": 0.7091745734214783, + "learning_rate": 1.9993870695702364e-06, + "loss": 0.0134, + "num_input_tokens_seen": 411008, + "step": 835 + }, + { + "epoch": 0.11086181866173947, + "grad_norm": 23.488370895385742, + "learning_rate": 1.9993037775777206e-06, + "loss": 0.3147, + "num_input_tokens_seen": 413312, + "step": 840 + }, + { + "epoch": 0.11152171043948793, + "grad_norm": 2.423909902572632, + "learning_rate": 1.999215182901656e-06, + "loss": 0.1734, + "num_input_tokens_seen": 415616, + "step": 845 + }, + { + "epoch": 0.11218160221723637, + "grad_norm": 156.0017852783203, + "learning_rate": 1.9991212860121587e-06, + "loss": 0.23, + "num_input_tokens_seen": 418368, + "step": 850 + }, + { + "epoch": 0.11284149399498482, + "grad_norm": 0.895738959312439, + "learning_rate": 1.999022087407482e-06, + "loss": 0.0658, + "num_input_tokens_seen": 420864, + "step": 855 + }, + { + "epoch": 0.11350138577273328, + "grad_norm": 57.05610275268555, + "learning_rate": 1.998917587614011e-06, + "loss": 0.2781, + "num_input_tokens_seen": 423040, + "step": 860 + }, + { + "epoch": 0.11416127755048172, + "grad_norm": 34.64775848388672, + "learning_rate": 1.9988077871862615e-06, + "loss": 0.3602, + "num_input_tokens_seen": 425344, + "step": 865 + }, + { + "epoch": 0.11482116932823017, + "grad_norm": 0.43117237091064453, + "learning_rate": 1.9986926867068752e-06, + "loss": 0.0011, + "num_input_tokens_seen": 427968, + "step": 870 + }, + { + "epoch": 0.11548106110597862, + "grad_norm": 0.1273239254951477, + "learning_rate": 1.998572286786619e-06, + "loss": 0.3594, + "num_input_tokens_seen": 430592, + "step": 875 + }, + { + "epoch": 0.11614095288372707, + "grad_norm": 9.043426513671875, + "learning_rate": 1.9984465880643807e-06, + "loss": 0.2425, + "num_input_tokens_seen": 433152, + "step": 880 + }, + { + "epoch": 0.11680084466147551, + "grad_norm": 65.71261596679688, + "learning_rate": 1.998315591207165e-06, + "loss": 0.0489, + "num_input_tokens_seen": 435456, + "step": 885 + }, + { + "epoch": 0.11746073643922397, + "grad_norm": 88.8459701538086, + "learning_rate": 1.9981792969100912e-06, + "loss": 0.1876, + "num_input_tokens_seen": 438080, + "step": 890 + }, + { + "epoch": 0.11812062821697242, + "grad_norm": 124.02445983886719, + "learning_rate": 1.9980377058963875e-06, + "loss": 0.2044, + "num_input_tokens_seen": 440640, + "step": 895 + }, + { + "epoch": 0.11878051999472086, + "grad_norm": 1.4761052131652832, + "learning_rate": 1.99789081891739e-06, + "loss": 0.028, + "num_input_tokens_seen": 443008, + "step": 900 + }, + { + "epoch": 0.11944041177246932, + "grad_norm": 110.05660247802734, + "learning_rate": 1.997738636752536e-06, + "loss": 0.1773, + "num_input_tokens_seen": 445312, + "step": 905 + }, + { + "epoch": 0.12010030355021777, + "grad_norm": 0.8630380630493164, + "learning_rate": 1.9975811602093624e-06, + "loss": 0.014, + "num_input_tokens_seen": 447680, + "step": 910 + }, + { + "epoch": 0.12076019532796621, + "grad_norm": 53.049163818359375, + "learning_rate": 1.9974183901234984e-06, + "loss": 0.2574, + "num_input_tokens_seen": 450368, + "step": 915 + }, + { + "epoch": 0.12142008710571467, + "grad_norm": 44.74892044067383, + "learning_rate": 1.997250327358664e-06, + "loss": 0.1599, + "num_input_tokens_seen": 452800, + "step": 920 + }, + { + "epoch": 0.12207997888346311, + "grad_norm": 45.7139892578125, + "learning_rate": 1.997076972806664e-06, + "loss": 0.023, + "num_input_tokens_seen": 455744, + "step": 925 + }, + { + "epoch": 0.12273987066121156, + "grad_norm": 35.15928268432617, + "learning_rate": 1.9968983273873827e-06, + "loss": 0.201, + "num_input_tokens_seen": 458176, + "step": 930 + }, + { + "epoch": 0.12339976243896002, + "grad_norm": 0.17246577143669128, + "learning_rate": 1.99671439204878e-06, + "loss": 0.0808, + "num_input_tokens_seen": 460480, + "step": 935 + }, + { + "epoch": 0.12405965421670846, + "grad_norm": 1.2687770128250122, + "learning_rate": 1.9965251677668873e-06, + "loss": 0.1766, + "num_input_tokens_seen": 462656, + "step": 940 + }, + { + "epoch": 0.1247195459944569, + "grad_norm": 24.687292098999023, + "learning_rate": 1.9963306555458e-06, + "loss": 0.3062, + "num_input_tokens_seen": 465344, + "step": 945 + }, + { + "epoch": 0.12537943777220537, + "grad_norm": 252.84188842773438, + "learning_rate": 1.9961308564176723e-06, + "loss": 0.4272, + "num_input_tokens_seen": 467712, + "step": 950 + }, + { + "epoch": 0.1260393295499538, + "grad_norm": 36.122955322265625, + "learning_rate": 1.9959257714427147e-06, + "loss": 0.223, + "num_input_tokens_seen": 470080, + "step": 955 + }, + { + "epoch": 0.12669922132770225, + "grad_norm": 11.395262718200684, + "learning_rate": 1.995715401709186e-06, + "loss": 0.1762, + "num_input_tokens_seen": 472512, + "step": 960 + }, + { + "epoch": 0.1273591131054507, + "grad_norm": 25.220579147338867, + "learning_rate": 1.995499748333387e-06, + "loss": 0.1271, + "num_input_tokens_seen": 474752, + "step": 965 + }, + { + "epoch": 0.12801900488319914, + "grad_norm": 46.467193603515625, + "learning_rate": 1.9952788124596555e-06, + "loss": 0.1233, + "num_input_tokens_seen": 477440, + "step": 970 + }, + { + "epoch": 0.12867889666094762, + "grad_norm": 19.14841651916504, + "learning_rate": 1.9950525952603617e-06, + "loss": 0.1272, + "num_input_tokens_seen": 480000, + "step": 975 + }, + { + "epoch": 0.12933878843869606, + "grad_norm": 51.99488067626953, + "learning_rate": 1.994821097935899e-06, + "loss": 0.1456, + "num_input_tokens_seen": 482368, + "step": 980 + }, + { + "epoch": 0.1299986802164445, + "grad_norm": 1.0634769201278687, + "learning_rate": 1.9945843217146804e-06, + "loss": 0.0077, + "num_input_tokens_seen": 484544, + "step": 985 + }, + { + "epoch": 0.13065857199419295, + "grad_norm": 0.03618798032402992, + "learning_rate": 1.9943422678531293e-06, + "loss": 0.0852, + "num_input_tokens_seen": 486720, + "step": 990 + }, + { + "epoch": 0.1313184637719414, + "grad_norm": 0.015866678208112717, + "learning_rate": 1.994094937635675e-06, + "loss": 0.0741, + "num_input_tokens_seen": 489344, + "step": 995 + }, + { + "epoch": 0.13197835554968984, + "grad_norm": 197.39834594726562, + "learning_rate": 1.9938423323747457e-06, + "loss": 0.2262, + "num_input_tokens_seen": 491776, + "step": 1000 + }, + { + "epoch": 0.1326382473274383, + "grad_norm": 147.0883026123047, + "learning_rate": 1.99358445341076e-06, + "loss": 0.1184, + "num_input_tokens_seen": 493952, + "step": 1005 + }, + { + "epoch": 0.13329813910518676, + "grad_norm": 78.60313415527344, + "learning_rate": 1.993321302112121e-06, + "loss": 0.2204, + "num_input_tokens_seen": 496320, + "step": 1010 + }, + { + "epoch": 0.1339580308829352, + "grad_norm": 6.261760711669922, + "learning_rate": 1.993052879875209e-06, + "loss": 0.0399, + "num_input_tokens_seen": 498496, + "step": 1015 + }, + { + "epoch": 0.13461792266068365, + "grad_norm": 131.00633239746094, + "learning_rate": 1.992779188124374e-06, + "loss": 0.2953, + "num_input_tokens_seen": 501056, + "step": 1020 + }, + { + "epoch": 0.1352778144384321, + "grad_norm": 81.73246002197266, + "learning_rate": 1.992500228311928e-06, + "loss": 0.1176, + "num_input_tokens_seen": 503296, + "step": 1025 + }, + { + "epoch": 0.13593770621618054, + "grad_norm": 24.69017219543457, + "learning_rate": 1.9922160019181372e-06, + "loss": 0.2695, + "num_input_tokens_seen": 505856, + "step": 1030 + }, + { + "epoch": 0.13659759799392898, + "grad_norm": 0.1977771818637848, + "learning_rate": 1.9919265104512138e-06, + "loss": 0.0981, + "num_input_tokens_seen": 508416, + "step": 1035 + }, + { + "epoch": 0.13725748977167745, + "grad_norm": 66.1187515258789, + "learning_rate": 1.9916317554473094e-06, + "loss": 0.2986, + "num_input_tokens_seen": 511040, + "step": 1040 + }, + { + "epoch": 0.1379173815494259, + "grad_norm": 67.56658935546875, + "learning_rate": 1.9913317384705052e-06, + "loss": 0.115, + "num_input_tokens_seen": 513216, + "step": 1045 + }, + { + "epoch": 0.13857727332717434, + "grad_norm": 32.97856903076172, + "learning_rate": 1.991026461112805e-06, + "loss": 0.0893, + "num_input_tokens_seen": 515456, + "step": 1050 + }, + { + "epoch": 0.1392371651049228, + "grad_norm": 2.204728841781616, + "learning_rate": 1.9907159249941257e-06, + "loss": 0.1591, + "num_input_tokens_seen": 517824, + "step": 1055 + }, + { + "epoch": 0.13989705688267123, + "grad_norm": 0.19428718090057373, + "learning_rate": 1.990400131762289e-06, + "loss": 0.0627, + "num_input_tokens_seen": 520320, + "step": 1060 + }, + { + "epoch": 0.14055694866041968, + "grad_norm": 189.14625549316406, + "learning_rate": 1.9900790830930134e-06, + "loss": 0.1068, + "num_input_tokens_seen": 522752, + "step": 1065 + }, + { + "epoch": 0.14121684043816815, + "grad_norm": 39.105308532714844, + "learning_rate": 1.9897527806899047e-06, + "loss": 0.1066, + "num_input_tokens_seen": 525376, + "step": 1070 + }, + { + "epoch": 0.1418767322159166, + "grad_norm": 0.7390586733818054, + "learning_rate": 1.9894212262844465e-06, + "loss": 0.2544, + "num_input_tokens_seen": 527808, + "step": 1075 + }, + { + "epoch": 0.14253662399366504, + "grad_norm": 0.13609175384044647, + "learning_rate": 1.989084421635992e-06, + "loss": 0.1578, + "num_input_tokens_seen": 530304, + "step": 1080 + }, + { + "epoch": 0.14319651577141349, + "grad_norm": 13.118515968322754, + "learning_rate": 1.988742368531754e-06, + "loss": 0.2733, + "num_input_tokens_seen": 532480, + "step": 1085 + }, + { + "epoch": 0.14385640754916193, + "grad_norm": 2.5871739387512207, + "learning_rate": 1.9883950687867947e-06, + "loss": 0.0745, + "num_input_tokens_seen": 535168, + "step": 1090 + }, + { + "epoch": 0.14451629932691037, + "grad_norm": 127.09754180908203, + "learning_rate": 1.9880425242440187e-06, + "loss": 0.1377, + "num_input_tokens_seen": 537600, + "step": 1095 + }, + { + "epoch": 0.14517619110465885, + "grad_norm": 485.19842529296875, + "learning_rate": 1.9876847367741607e-06, + "loss": 0.0585, + "num_input_tokens_seen": 540096, + "step": 1100 + }, + { + "epoch": 0.1458360828824073, + "grad_norm": 0.17331336438655853, + "learning_rate": 1.987321708275776e-06, + "loss": 0.1719, + "num_input_tokens_seen": 542592, + "step": 1105 + }, + { + "epoch": 0.14649597466015574, + "grad_norm": 0.26521632075309753, + "learning_rate": 1.986953440675231e-06, + "loss": 0.0895, + "num_input_tokens_seen": 544960, + "step": 1110 + }, + { + "epoch": 0.14715586643790418, + "grad_norm": 0.27949467301368713, + "learning_rate": 1.9865799359266925e-06, + "loss": 0.1572, + "num_input_tokens_seen": 547136, + "step": 1115 + }, + { + "epoch": 0.14781575821565263, + "grad_norm": 159.8411102294922, + "learning_rate": 1.986201196012118e-06, + "loss": 0.1272, + "num_input_tokens_seen": 549440, + "step": 1120 + }, + { + "epoch": 0.14847564999340107, + "grad_norm": 87.8428726196289, + "learning_rate": 1.985817222941245e-06, + "loss": 0.2212, + "num_input_tokens_seen": 552064, + "step": 1125 + }, + { + "epoch": 0.14913554177114954, + "grad_norm": 14.358078956604004, + "learning_rate": 1.9854280187515794e-06, + "loss": 0.0754, + "num_input_tokens_seen": 554432, + "step": 1130 + }, + { + "epoch": 0.149795433548898, + "grad_norm": 1.0141674280166626, + "learning_rate": 1.985033585508386e-06, + "loss": 0.0564, + "num_input_tokens_seen": 556800, + "step": 1135 + }, + { + "epoch": 0.15005939025999737, + "eval_loss": 0.16564705967903137, + "eval_runtime": 7.8399, + "eval_samples_per_second": 859.067, + "eval_steps_per_second": 107.399, + "num_input_tokens_seen": 557824, + "step": 1137 + }, + { + "epoch": 0.15045532532664643, + "grad_norm": 257.7950744628906, + "learning_rate": 1.9846339253046766e-06, + "loss": 0.5119, + "num_input_tokens_seen": 559296, + "step": 1140 + }, + { + "epoch": 0.15111521710439488, + "grad_norm": 31.520845413208008, + "learning_rate": 1.984229040261199e-06, + "loss": 0.163, + "num_input_tokens_seen": 562112, + "step": 1145 + }, + { + "epoch": 0.15177510888214332, + "grad_norm": 0.35355716943740845, + "learning_rate": 1.9838189325264263e-06, + "loss": 0.1812, + "num_input_tokens_seen": 564288, + "step": 1150 + }, + { + "epoch": 0.15243500065989177, + "grad_norm": 70.49393463134766, + "learning_rate": 1.983403604276546e-06, + "loss": 0.033, + "num_input_tokens_seen": 566848, + "step": 1155 + }, + { + "epoch": 0.15309489243764024, + "grad_norm": 18.635469436645508, + "learning_rate": 1.9829830577154457e-06, + "loss": 0.3099, + "num_input_tokens_seen": 569152, + "step": 1160 + }, + { + "epoch": 0.15375478421538868, + "grad_norm": 34.90991973876953, + "learning_rate": 1.982557295074705e-06, + "loss": 0.0496, + "num_input_tokens_seen": 571456, + "step": 1165 + }, + { + "epoch": 0.15441467599313713, + "grad_norm": 0.17582400143146515, + "learning_rate": 1.982126318613581e-06, + "loss": 0.0902, + "num_input_tokens_seen": 573824, + "step": 1170 + }, + { + "epoch": 0.15507456777088557, + "grad_norm": 230.71153259277344, + "learning_rate": 1.9816901306189977e-06, + "loss": 0.0556, + "num_input_tokens_seen": 576128, + "step": 1175 + }, + { + "epoch": 0.15573445954863402, + "grad_norm": 0.5229840278625488, + "learning_rate": 1.9812487334055342e-06, + "loss": 0.1048, + "num_input_tokens_seen": 578432, + "step": 1180 + }, + { + "epoch": 0.15639435132638246, + "grad_norm": 0.39622417092323303, + "learning_rate": 1.98080212931541e-06, + "loss": 0.1522, + "num_input_tokens_seen": 580736, + "step": 1185 + }, + { + "epoch": 0.15705424310413094, + "grad_norm": 0.09377877414226532, + "learning_rate": 1.980350320718476e-06, + "loss": 0.0609, + "num_input_tokens_seen": 583040, + "step": 1190 + }, + { + "epoch": 0.15771413488187938, + "grad_norm": 1.1462613344192505, + "learning_rate": 1.9798933100121985e-06, + "loss": 0.0032, + "num_input_tokens_seen": 585344, + "step": 1195 + }, + { + "epoch": 0.15837402665962783, + "grad_norm": 1.4526684284210205, + "learning_rate": 1.97943109962165e-06, + "loss": 0.0896, + "num_input_tokens_seen": 587904, + "step": 1200 + }, + { + "epoch": 0.15903391843737627, + "grad_norm": 173.52330017089844, + "learning_rate": 1.978963691999493e-06, + "loss": 0.1423, + "num_input_tokens_seen": 590208, + "step": 1205 + }, + { + "epoch": 0.15969381021512472, + "grad_norm": 126.84811401367188, + "learning_rate": 1.978491089625969e-06, + "loss": 0.2118, + "num_input_tokens_seen": 592512, + "step": 1210 + }, + { + "epoch": 0.16035370199287316, + "grad_norm": 222.47836303710938, + "learning_rate": 1.9780132950088854e-06, + "loss": 0.2427, + "num_input_tokens_seen": 595072, + "step": 1215 + }, + { + "epoch": 0.1610135937706216, + "grad_norm": 19.530790328979492, + "learning_rate": 1.9775303106836e-06, + "loss": 0.3134, + "num_input_tokens_seen": 597632, + "step": 1220 + }, + { + "epoch": 0.16167348554837008, + "grad_norm": 0.11579433083534241, + "learning_rate": 1.977042139213011e-06, + "loss": 0.117, + "num_input_tokens_seen": 600192, + "step": 1225 + }, + { + "epoch": 0.16233337732611852, + "grad_norm": 0.30019301176071167, + "learning_rate": 1.9765487831875404e-06, + "loss": 0.1205, + "num_input_tokens_seen": 602304, + "step": 1230 + }, + { + "epoch": 0.16299326910386697, + "grad_norm": 1.5647317171096802, + "learning_rate": 1.9760502452251217e-06, + "loss": 0.1485, + "num_input_tokens_seen": 604608, + "step": 1235 + }, + { + "epoch": 0.1636531608816154, + "grad_norm": 12.981266021728516, + "learning_rate": 1.975546527971186e-06, + "loss": 0.1371, + "num_input_tokens_seen": 606976, + "step": 1240 + }, + { + "epoch": 0.16431305265936386, + "grad_norm": 7.285887241363525, + "learning_rate": 1.9750376340986472e-06, + "loss": 0.0801, + "num_input_tokens_seen": 609600, + "step": 1245 + }, + { + "epoch": 0.1649729444371123, + "grad_norm": 49.19084167480469, + "learning_rate": 1.974523566307889e-06, + "loss": 0.2009, + "num_input_tokens_seen": 611840, + "step": 1250 + }, + { + "epoch": 0.16563283621486077, + "grad_norm": 110.00751495361328, + "learning_rate": 1.9740043273267487e-06, + "loss": 0.1902, + "num_input_tokens_seen": 614528, + "step": 1255 + }, + { + "epoch": 0.16629272799260922, + "grad_norm": 0.1264021098613739, + "learning_rate": 1.973479919910505e-06, + "loss": 0.0022, + "num_input_tokens_seen": 617024, + "step": 1260 + }, + { + "epoch": 0.16695261977035766, + "grad_norm": 58.373043060302734, + "learning_rate": 1.972950346841862e-06, + "loss": 0.1153, + "num_input_tokens_seen": 619392, + "step": 1265 + }, + { + "epoch": 0.1676125115481061, + "grad_norm": 7.883070468902588, + "learning_rate": 1.972415610930934e-06, + "loss": 0.1353, + "num_input_tokens_seen": 621888, + "step": 1270 + }, + { + "epoch": 0.16827240332585455, + "grad_norm": 60.600013732910156, + "learning_rate": 1.9718757150152324e-06, + "loss": 0.1096, + "num_input_tokens_seen": 624192, + "step": 1275 + }, + { + "epoch": 0.168932295103603, + "grad_norm": 5.226385116577148, + "learning_rate": 1.9713306619596488e-06, + "loss": 0.0658, + "num_input_tokens_seen": 626624, + "step": 1280 + }, + { + "epoch": 0.16959218688135147, + "grad_norm": 10.980446815490723, + "learning_rate": 1.9707804546564407e-06, + "loss": 0.0575, + "num_input_tokens_seen": 628928, + "step": 1285 + }, + { + "epoch": 0.17025207865909991, + "grad_norm": 0.39055877923965454, + "learning_rate": 1.9702250960252164e-06, + "loss": 0.1254, + "num_input_tokens_seen": 631616, + "step": 1290 + }, + { + "epoch": 0.17091197043684836, + "grad_norm": 0.10477243363857269, + "learning_rate": 1.969664589012918e-06, + "loss": 0.0568, + "num_input_tokens_seen": 634112, + "step": 1295 + }, + { + "epoch": 0.1715718622145968, + "grad_norm": 273.6374206542969, + "learning_rate": 1.9690989365938077e-06, + "loss": 0.1854, + "num_input_tokens_seen": 636416, + "step": 1300 + }, + { + "epoch": 0.17223175399234525, + "grad_norm": 0.025812866166234016, + "learning_rate": 1.9685281417694513e-06, + "loss": 0.0006, + "num_input_tokens_seen": 638848, + "step": 1305 + }, + { + "epoch": 0.1728916457700937, + "grad_norm": 1.0203826427459717, + "learning_rate": 1.967952207568702e-06, + "loss": 0.12, + "num_input_tokens_seen": 641216, + "step": 1310 + }, + { + "epoch": 0.17355153754784217, + "grad_norm": 1.9090206623077393, + "learning_rate": 1.967371137047685e-06, + "loss": 0.0008, + "num_input_tokens_seen": 644032, + "step": 1315 + }, + { + "epoch": 0.1742114293255906, + "grad_norm": 0.15419095754623413, + "learning_rate": 1.966784933289778e-06, + "loss": 0.0887, + "num_input_tokens_seen": 646528, + "step": 1320 + }, + { + "epoch": 0.17487132110333906, + "grad_norm": 0.09177876263856888, + "learning_rate": 1.9661935994056014e-06, + "loss": 0.1307, + "num_input_tokens_seen": 649088, + "step": 1325 + }, + { + "epoch": 0.1755312128810875, + "grad_norm": 0.9890398383140564, + "learning_rate": 1.965597138532996e-06, + "loss": 0.1035, + "num_input_tokens_seen": 651520, + "step": 1330 + }, + { + "epoch": 0.17619110465883595, + "grad_norm": 90.32373046875, + "learning_rate": 1.964995553837009e-06, + "loss": 0.0123, + "num_input_tokens_seen": 654016, + "step": 1335 + }, + { + "epoch": 0.1768509964365844, + "grad_norm": 0.014015772379934788, + "learning_rate": 1.964388848509875e-06, + "loss": 0.0924, + "num_input_tokens_seen": 656320, + "step": 1340 + }, + { + "epoch": 0.17751088821433286, + "grad_norm": 0.044904567301273346, + "learning_rate": 1.9637770257710026e-06, + "loss": 0.1818, + "num_input_tokens_seen": 658880, + "step": 1345 + }, + { + "epoch": 0.1781707799920813, + "grad_norm": 0.15751226246356964, + "learning_rate": 1.9631600888669545e-06, + "loss": 0.001, + "num_input_tokens_seen": 661184, + "step": 1350 + }, + { + "epoch": 0.17883067176982975, + "grad_norm": 0.13751578330993652, + "learning_rate": 1.962538041071431e-06, + "loss": 0.0885, + "num_input_tokens_seen": 663680, + "step": 1355 + }, + { + "epoch": 0.1794905635475782, + "grad_norm": 164.34730529785156, + "learning_rate": 1.961910885685253e-06, + "loss": 0.0377, + "num_input_tokens_seen": 666048, + "step": 1360 + }, + { + "epoch": 0.18015045532532664, + "grad_norm": 1.029883623123169, + "learning_rate": 1.9612786260363436e-06, + "loss": 0.0748, + "num_input_tokens_seen": 668480, + "step": 1365 + }, + { + "epoch": 0.1808103471030751, + "grad_norm": 0.1113181859254837, + "learning_rate": 1.9606412654797116e-06, + "loss": 0.1292, + "num_input_tokens_seen": 671488, + "step": 1370 + }, + { + "epoch": 0.18147023888082353, + "grad_norm": 1.6563535928726196, + "learning_rate": 1.9599988073974332e-06, + "loss": 0.1406, + "num_input_tokens_seen": 673920, + "step": 1375 + }, + { + "epoch": 0.182130130658572, + "grad_norm": 0.45396727323532104, + "learning_rate": 1.959351255198634e-06, + "loss": 0.0929, + "num_input_tokens_seen": 676416, + "step": 1380 + }, + { + "epoch": 0.18279002243632045, + "grad_norm": 0.1408662647008896, + "learning_rate": 1.9586986123194704e-06, + "loss": 0.0006, + "num_input_tokens_seen": 679040, + "step": 1385 + }, + { + "epoch": 0.1834499142140689, + "grad_norm": 0.10570546239614487, + "learning_rate": 1.958040882223112e-06, + "loss": 0.1902, + "num_input_tokens_seen": 681920, + "step": 1390 + }, + { + "epoch": 0.18410980599181734, + "grad_norm": 0.1604253500699997, + "learning_rate": 1.9573780683997235e-06, + "loss": 0.048, + "num_input_tokens_seen": 684416, + "step": 1395 + }, + { + "epoch": 0.18476969776956578, + "grad_norm": 33.932865142822266, + "learning_rate": 1.956710174366445e-06, + "loss": 0.0828, + "num_input_tokens_seen": 686976, + "step": 1400 + }, + { + "epoch": 0.18542958954731423, + "grad_norm": 0.08173060417175293, + "learning_rate": 1.9560372036673764e-06, + "loss": 0.2272, + "num_input_tokens_seen": 689408, + "step": 1405 + }, + { + "epoch": 0.1860894813250627, + "grad_norm": 0.028357749804854393, + "learning_rate": 1.955359159873553e-06, + "loss": 0.0649, + "num_input_tokens_seen": 691712, + "step": 1410 + }, + { + "epoch": 0.18674937310281114, + "grad_norm": 0.021360548213124275, + "learning_rate": 1.954676046582932e-06, + "loss": 0.066, + "num_input_tokens_seen": 694080, + "step": 1415 + }, + { + "epoch": 0.1874092648805596, + "grad_norm": 80.15442657470703, + "learning_rate": 1.9539878674203706e-06, + "loss": 0.2175, + "num_input_tokens_seen": 696640, + "step": 1420 + }, + { + "epoch": 0.18806915665830803, + "grad_norm": 0.01937083899974823, + "learning_rate": 1.9532946260376076e-06, + "loss": 0.0003, + "num_input_tokens_seen": 699136, + "step": 1425 + }, + { + "epoch": 0.18872904843605648, + "grad_norm": 18.852214813232422, + "learning_rate": 1.952596326113244e-06, + "loss": 0.4092, + "num_input_tokens_seen": 701696, + "step": 1430 + }, + { + "epoch": 0.18938894021380492, + "grad_norm": 12.444201469421387, + "learning_rate": 1.9518929713527226e-06, + "loss": 0.2349, + "num_input_tokens_seen": 704384, + "step": 1435 + }, + { + "epoch": 0.1900488319915534, + "grad_norm": 2.0845847129821777, + "learning_rate": 1.9511845654883097e-06, + "loss": 0.0082, + "num_input_tokens_seen": 706560, + "step": 1440 + }, + { + "epoch": 0.19070872376930184, + "grad_norm": 0.3514378070831299, + "learning_rate": 1.9504711122790754e-06, + "loss": 0.1221, + "num_input_tokens_seen": 709248, + "step": 1445 + }, + { + "epoch": 0.19136861554705029, + "grad_norm": 79.33631896972656, + "learning_rate": 1.949752615510871e-06, + "loss": 0.08, + "num_input_tokens_seen": 711296, + "step": 1450 + }, + { + "epoch": 0.19202850732479873, + "grad_norm": 0.0773974359035492, + "learning_rate": 1.949029078996313e-06, + "loss": 0.0655, + "num_input_tokens_seen": 713728, + "step": 1455 + }, + { + "epoch": 0.19268839910254718, + "grad_norm": 15.809504508972168, + "learning_rate": 1.9483005065747584e-06, + "loss": 0.1876, + "num_input_tokens_seen": 716224, + "step": 1460 + }, + { + "epoch": 0.19334829088029562, + "grad_norm": 307.3660583496094, + "learning_rate": 1.947566902112289e-06, + "loss": 0.3791, + "num_input_tokens_seen": 718528, + "step": 1465 + }, + { + "epoch": 0.1940081826580441, + "grad_norm": 17.658618927001953, + "learning_rate": 1.9468282695016863e-06, + "loss": 0.2271, + "num_input_tokens_seen": 720960, + "step": 1470 + }, + { + "epoch": 0.19466807443579254, + "grad_norm": 1.276165246963501, + "learning_rate": 1.946084612662415e-06, + "loss": 0.1805, + "num_input_tokens_seen": 723200, + "step": 1475 + }, + { + "epoch": 0.19532796621354098, + "grad_norm": 104.93605041503906, + "learning_rate": 1.9453359355405987e-06, + "loss": 0.2018, + "num_input_tokens_seen": 725888, + "step": 1480 + }, + { + "epoch": 0.19598785799128943, + "grad_norm": 0.48601382970809937, + "learning_rate": 1.944582242109002e-06, + "loss": 0.0364, + "num_input_tokens_seen": 728256, + "step": 1485 + }, + { + "epoch": 0.19664774976903787, + "grad_norm": 24.217121124267578, + "learning_rate": 1.943823536367006e-06, + "loss": 0.1441, + "num_input_tokens_seen": 730688, + "step": 1490 + }, + { + "epoch": 0.19730764154678632, + "grad_norm": 1.9565227031707764, + "learning_rate": 1.9430598223405913e-06, + "loss": 0.1269, + "num_input_tokens_seen": 732992, + "step": 1495 + }, + { + "epoch": 0.1979675333245348, + "grad_norm": 1.4035013914108276, + "learning_rate": 1.9422911040823125e-06, + "loss": 0.1163, + "num_input_tokens_seen": 735424, + "step": 1500 + }, + { + "epoch": 0.19862742510228323, + "grad_norm": 28.88270378112793, + "learning_rate": 1.941517385671279e-06, + "loss": 0.1995, + "num_input_tokens_seen": 737664, + "step": 1505 + }, + { + "epoch": 0.19928731688003168, + "grad_norm": 0.40199992060661316, + "learning_rate": 1.940738671213134e-06, + "loss": 0.0888, + "num_input_tokens_seen": 740096, + "step": 1510 + }, + { + "epoch": 0.19994720865778012, + "grad_norm": 104.9893798828125, + "learning_rate": 1.93995496484003e-06, + "loss": 0.1883, + "num_input_tokens_seen": 742912, + "step": 1515 + }, + { + "epoch": 0.2000791870133298, + "eval_loss": 0.10974650084972382, + "eval_runtime": 7.9505, + "eval_samples_per_second": 847.113, + "eval_steps_per_second": 105.905, + "num_input_tokens_seen": 743424, + "step": 1516 + }, + { + "epoch": 0.20060710043552857, + "grad_norm": 20.379575729370117, + "learning_rate": 1.9391662707106092e-06, + "loss": 0.1544, + "num_input_tokens_seen": 745536, + "step": 1520 + }, + { + "epoch": 0.201266992213277, + "grad_norm": 0.3665579557418823, + "learning_rate": 1.9383725930099814e-06, + "loss": 0.0053, + "num_input_tokens_seen": 747968, + "step": 1525 + }, + { + "epoch": 0.20192688399102549, + "grad_norm": 207.8310089111328, + "learning_rate": 1.9375739359497e-06, + "loss": 0.2261, + "num_input_tokens_seen": 750464, + "step": 1530 + }, + { + "epoch": 0.20258677576877393, + "grad_norm": 0.281808078289032, + "learning_rate": 1.936770303767741e-06, + "loss": 0.2511, + "num_input_tokens_seen": 752896, + "step": 1535 + }, + { + "epoch": 0.20324666754652237, + "grad_norm": 16.87381362915039, + "learning_rate": 1.9359617007284815e-06, + "loss": 0.1788, + "num_input_tokens_seen": 755648, + "step": 1540 + }, + { + "epoch": 0.20390655932427082, + "grad_norm": 18.007219314575195, + "learning_rate": 1.9351481311226738e-06, + "loss": 0.2098, + "num_input_tokens_seen": 758144, + "step": 1545 + }, + { + "epoch": 0.20456645110201926, + "grad_norm": 3.9224605560302734, + "learning_rate": 1.934329599267426e-06, + "loss": 0.0831, + "num_input_tokens_seen": 760704, + "step": 1550 + }, + { + "epoch": 0.2052263428797677, + "grad_norm": 4.013158798217773, + "learning_rate": 1.933506109506178e-06, + "loss": 0.0039, + "num_input_tokens_seen": 763136, + "step": 1555 + }, + { + "epoch": 0.20588623465751615, + "grad_norm": 8.997451782226562, + "learning_rate": 1.9326776662086765e-06, + "loss": 0.0802, + "num_input_tokens_seen": 766016, + "step": 1560 + }, + { + "epoch": 0.20654612643526463, + "grad_norm": 47.96493911743164, + "learning_rate": 1.9318442737709565e-06, + "loss": 0.2901, + "num_input_tokens_seen": 768512, + "step": 1565 + }, + { + "epoch": 0.20720601821301307, + "grad_norm": 0.5580891966819763, + "learning_rate": 1.9310059366153116e-06, + "loss": 0.1689, + "num_input_tokens_seen": 770816, + "step": 1570 + }, + { + "epoch": 0.20786590999076152, + "grad_norm": 3.661959648132324, + "learning_rate": 1.930162659190277e-06, + "loss": 0.248, + "num_input_tokens_seen": 773312, + "step": 1575 + }, + { + "epoch": 0.20852580176850996, + "grad_norm": 167.700927734375, + "learning_rate": 1.9293144459706007e-06, + "loss": 0.0688, + "num_input_tokens_seen": 775680, + "step": 1580 + }, + { + "epoch": 0.2091856935462584, + "grad_norm": 1471.7938232421875, + "learning_rate": 1.928461301457223e-06, + "loss": 0.1075, + "num_input_tokens_seen": 778048, + "step": 1585 + }, + { + "epoch": 0.20984558532400685, + "grad_norm": 0.19680626690387726, + "learning_rate": 1.92760323017725e-06, + "loss": 0.2795, + "num_input_tokens_seen": 780672, + "step": 1590 + }, + { + "epoch": 0.21050547710175532, + "grad_norm": 0.7471222281455994, + "learning_rate": 1.9267402366839338e-06, + "loss": 0.2294, + "num_input_tokens_seen": 783360, + "step": 1595 + }, + { + "epoch": 0.21116536887950377, + "grad_norm": 105.85987854003906, + "learning_rate": 1.9258723255566433e-06, + "loss": 0.1843, + "num_input_tokens_seen": 785856, + "step": 1600 + }, + { + "epoch": 0.2118252606572522, + "grad_norm": 0.5641558170318604, + "learning_rate": 1.924999501400843e-06, + "loss": 0.1321, + "num_input_tokens_seen": 788480, + "step": 1605 + }, + { + "epoch": 0.21248515243500066, + "grad_norm": 0.07420846074819565, + "learning_rate": 1.924121768848068e-06, + "loss": 0.1504, + "num_input_tokens_seen": 791040, + "step": 1610 + }, + { + "epoch": 0.2131450442127491, + "grad_norm": 0.1806056797504425, + "learning_rate": 1.923239132555899e-06, + "loss": 0.1462, + "num_input_tokens_seen": 793600, + "step": 1615 + }, + { + "epoch": 0.21380493599049755, + "grad_norm": 86.85829162597656, + "learning_rate": 1.9223515972079378e-06, + "loss": 0.1516, + "num_input_tokens_seen": 795968, + "step": 1620 + }, + { + "epoch": 0.21446482776824602, + "grad_norm": 79.25112915039062, + "learning_rate": 1.9214591675137813e-06, + "loss": 0.1019, + "num_input_tokens_seen": 798272, + "step": 1625 + }, + { + "epoch": 0.21512471954599446, + "grad_norm": 345.95281982421875, + "learning_rate": 1.9205618482090003e-06, + "loss": 0.1059, + "num_input_tokens_seen": 801024, + "step": 1630 + }, + { + "epoch": 0.2157846113237429, + "grad_norm": 24.057254791259766, + "learning_rate": 1.91965964405511e-06, + "loss": 0.1862, + "num_input_tokens_seen": 803584, + "step": 1635 + }, + { + "epoch": 0.21644450310149135, + "grad_norm": 159.59852600097656, + "learning_rate": 1.9187525598395457e-06, + "loss": 0.0438, + "num_input_tokens_seen": 805952, + "step": 1640 + }, + { + "epoch": 0.2171043948792398, + "grad_norm": 64.74698638916016, + "learning_rate": 1.9178406003756396e-06, + "loss": 0.1326, + "num_input_tokens_seen": 808512, + "step": 1645 + }, + { + "epoch": 0.21776428665698824, + "grad_norm": 79.24069213867188, + "learning_rate": 1.9169237705025936e-06, + "loss": 0.1071, + "num_input_tokens_seen": 811136, + "step": 1650 + }, + { + "epoch": 0.21842417843473672, + "grad_norm": 0.03825217857956886, + "learning_rate": 1.9160020750854533e-06, + "loss": 0.0347, + "num_input_tokens_seen": 813376, + "step": 1655 + }, + { + "epoch": 0.21908407021248516, + "grad_norm": 208.05564880371094, + "learning_rate": 1.915075519015083e-06, + "loss": 0.1731, + "num_input_tokens_seen": 815872, + "step": 1660 + }, + { + "epoch": 0.2197439619902336, + "grad_norm": 108.54914855957031, + "learning_rate": 1.914144107208139e-06, + "loss": 0.0142, + "num_input_tokens_seen": 818240, + "step": 1665 + }, + { + "epoch": 0.22040385376798205, + "grad_norm": 0.16779685020446777, + "learning_rate": 1.913207844607045e-06, + "loss": 0.0476, + "num_input_tokens_seen": 820736, + "step": 1670 + }, + { + "epoch": 0.2210637455457305, + "grad_norm": 33.12580108642578, + "learning_rate": 1.912266736179964e-06, + "loss": 0.3054, + "num_input_tokens_seen": 823616, + "step": 1675 + }, + { + "epoch": 0.22172363732347894, + "grad_norm": 13.499357223510742, + "learning_rate": 1.9113207869207727e-06, + "loss": 0.2016, + "num_input_tokens_seen": 826112, + "step": 1680 + }, + { + "epoch": 0.2223835291012274, + "grad_norm": 0.33417344093322754, + "learning_rate": 1.9103700018490365e-06, + "loss": 0.1342, + "num_input_tokens_seen": 828672, + "step": 1685 + }, + { + "epoch": 0.22304342087897586, + "grad_norm": 0.9366137385368347, + "learning_rate": 1.9094143860099787e-06, + "loss": 0.163, + "num_input_tokens_seen": 831296, + "step": 1690 + }, + { + "epoch": 0.2237033126567243, + "grad_norm": 101.39453887939453, + "learning_rate": 1.9084539444744594e-06, + "loss": 0.1052, + "num_input_tokens_seen": 833856, + "step": 1695 + }, + { + "epoch": 0.22436320443447275, + "grad_norm": 0.10196679830551147, + "learning_rate": 1.907488682338944e-06, + "loss": 0.1483, + "num_input_tokens_seen": 836480, + "step": 1700 + }, + { + "epoch": 0.2250230962122212, + "grad_norm": 32.67580032348633, + "learning_rate": 1.9065186047254782e-06, + "loss": 0.0834, + "num_input_tokens_seen": 838976, + "step": 1705 + }, + { + "epoch": 0.22568298798996964, + "grad_norm": 0.4758983552455902, + "learning_rate": 1.9055437167816604e-06, + "loss": 0.1598, + "num_input_tokens_seen": 841728, + "step": 1710 + }, + { + "epoch": 0.22634287976771808, + "grad_norm": 0.09636105597019196, + "learning_rate": 1.9045640236806149e-06, + "loss": 0.0044, + "num_input_tokens_seen": 843968, + "step": 1715 + }, + { + "epoch": 0.22700277154546655, + "grad_norm": 265.4130859375, + "learning_rate": 1.903579530620963e-06, + "loss": 0.4454, + "num_input_tokens_seen": 846464, + "step": 1720 + }, + { + "epoch": 0.227662663323215, + "grad_norm": 0.19204720854759216, + "learning_rate": 1.9025902428267975e-06, + "loss": 0.1272, + "num_input_tokens_seen": 849088, + "step": 1725 + }, + { + "epoch": 0.22832255510096344, + "grad_norm": 0.07899138331413269, + "learning_rate": 1.901596165547653e-06, + "loss": 0.0506, + "num_input_tokens_seen": 851712, + "step": 1730 + }, + { + "epoch": 0.2289824468787119, + "grad_norm": 0.2107008397579193, + "learning_rate": 1.9005973040584796e-06, + "loss": 0.1537, + "num_input_tokens_seen": 854208, + "step": 1735 + }, + { + "epoch": 0.22964233865646033, + "grad_norm": 0.8915808796882629, + "learning_rate": 1.8995936636596138e-06, + "loss": 0.1147, + "num_input_tokens_seen": 856576, + "step": 1740 + }, + { + "epoch": 0.23030223043420878, + "grad_norm": 0.37453988194465637, + "learning_rate": 1.8985852496767504e-06, + "loss": 0.1347, + "num_input_tokens_seen": 859008, + "step": 1745 + }, + { + "epoch": 0.23096212221195725, + "grad_norm": 13.8438720703125, + "learning_rate": 1.897572067460916e-06, + "loss": 0.146, + "num_input_tokens_seen": 861440, + "step": 1750 + }, + { + "epoch": 0.2316220139897057, + "grad_norm": 0.8792198300361633, + "learning_rate": 1.8965541223884377e-06, + "loss": 0.1079, + "num_input_tokens_seen": 863936, + "step": 1755 + }, + { + "epoch": 0.23228190576745414, + "grad_norm": 0.31022199988365173, + "learning_rate": 1.8955314198609171e-06, + "loss": 0.0547, + "num_input_tokens_seen": 866176, + "step": 1760 + }, + { + "epoch": 0.23294179754520258, + "grad_norm": 0.3442046344280243, + "learning_rate": 1.8945039653052005e-06, + "loss": 0.0747, + "num_input_tokens_seen": 868480, + "step": 1765 + }, + { + "epoch": 0.23360168932295103, + "grad_norm": 0.8551641702651978, + "learning_rate": 1.8934717641733498e-06, + "loss": 0.1454, + "num_input_tokens_seen": 870976, + "step": 1770 + }, + { + "epoch": 0.23426158110069947, + "grad_norm": 0.31109607219696045, + "learning_rate": 1.8924348219426143e-06, + "loss": 0.2544, + "num_input_tokens_seen": 873088, + "step": 1775 + }, + { + "epoch": 0.23492147287844795, + "grad_norm": 16.480606079101562, + "learning_rate": 1.8913931441154016e-06, + "loss": 0.2463, + "num_input_tokens_seen": 875520, + "step": 1780 + }, + { + "epoch": 0.2355813646561964, + "grad_norm": 45.99843978881836, + "learning_rate": 1.8903467362192482e-06, + "loss": 0.0807, + "num_input_tokens_seen": 877632, + "step": 1785 + }, + { + "epoch": 0.23624125643394484, + "grad_norm": 92.43214416503906, + "learning_rate": 1.8892956038067895e-06, + "loss": 0.1002, + "num_input_tokens_seen": 880000, + "step": 1790 + }, + { + "epoch": 0.23690114821169328, + "grad_norm": 0.566708505153656, + "learning_rate": 1.8882397524557317e-06, + "loss": 0.0187, + "num_input_tokens_seen": 882176, + "step": 1795 + }, + { + "epoch": 0.23756103998944172, + "grad_norm": 0.06913850456476212, + "learning_rate": 1.8871791877688208e-06, + "loss": 0.0792, + "num_input_tokens_seen": 884800, + "step": 1800 + }, + { + "epoch": 0.23822093176719017, + "grad_norm": 19.2426700592041, + "learning_rate": 1.8861139153738143e-06, + "loss": 0.1225, + "num_input_tokens_seen": 887104, + "step": 1805 + }, + { + "epoch": 0.23888082354493864, + "grad_norm": 153.66583251953125, + "learning_rate": 1.8850439409234498e-06, + "loss": 0.0388, + "num_input_tokens_seen": 889408, + "step": 1810 + }, + { + "epoch": 0.2395407153226871, + "grad_norm": 91.53621673583984, + "learning_rate": 1.8839692700954161e-06, + "loss": 0.1219, + "num_input_tokens_seen": 891648, + "step": 1815 + }, + { + "epoch": 0.24020060710043553, + "grad_norm": 456.29779052734375, + "learning_rate": 1.8828899085923234e-06, + "loss": 0.2359, + "num_input_tokens_seen": 894208, + "step": 1820 + }, + { + "epoch": 0.24086049887818398, + "grad_norm": 0.05232629179954529, + "learning_rate": 1.881805862141671e-06, + "loss": 0.0859, + "num_input_tokens_seen": 896704, + "step": 1825 + }, + { + "epoch": 0.24152039065593242, + "grad_norm": 0.039349839091300964, + "learning_rate": 1.8807171364958196e-06, + "loss": 0.0579, + "num_input_tokens_seen": 899264, + "step": 1830 + }, + { + "epoch": 0.24218028243368087, + "grad_norm": 0.08498682081699371, + "learning_rate": 1.879623737431959e-06, + "loss": 0.0186, + "num_input_tokens_seen": 901760, + "step": 1835 + }, + { + "epoch": 0.24284017421142934, + "grad_norm": 7.6966872215271, + "learning_rate": 1.8785256707520778e-06, + "loss": 0.1353, + "num_input_tokens_seen": 903872, + "step": 1840 + }, + { + "epoch": 0.24350006598917778, + "grad_norm": 0.09622366726398468, + "learning_rate": 1.8774229422829325e-06, + "loss": 0.0463, + "num_input_tokens_seen": 906368, + "step": 1845 + }, + { + "epoch": 0.24415995776692623, + "grad_norm": 0.03518239036202431, + "learning_rate": 1.8763155578760181e-06, + "loss": 0.0658, + "num_input_tokens_seen": 908864, + "step": 1850 + }, + { + "epoch": 0.24481984954467467, + "grad_norm": 0.2804614305496216, + "learning_rate": 1.8752035234075336e-06, + "loss": 0.163, + "num_input_tokens_seen": 911040, + "step": 1855 + }, + { + "epoch": 0.24547974132242312, + "grad_norm": 34.17547607421875, + "learning_rate": 1.8740868447783554e-06, + "loss": 0.1979, + "num_input_tokens_seen": 913408, + "step": 1860 + }, + { + "epoch": 0.24613963310017156, + "grad_norm": 65.69808197021484, + "learning_rate": 1.8729655279140012e-06, + "loss": 0.2382, + "num_input_tokens_seen": 915968, + "step": 1865 + }, + { + "epoch": 0.24679952487792003, + "grad_norm": 154.89785766601562, + "learning_rate": 1.8718395787646029e-06, + "loss": 0.1639, + "num_input_tokens_seen": 918528, + "step": 1870 + }, + { + "epoch": 0.24745941665566848, + "grad_norm": 0.06571167707443237, + "learning_rate": 1.870709003304872e-06, + "loss": 0.0099, + "num_input_tokens_seen": 921152, + "step": 1875 + }, + { + "epoch": 0.24811930843341692, + "grad_norm": 0.09134677052497864, + "learning_rate": 1.8695738075340693e-06, + "loss": 0.0006, + "num_input_tokens_seen": 923520, + "step": 1880 + }, + { + "epoch": 0.24877920021116537, + "grad_norm": 0.3240724503993988, + "learning_rate": 1.8684339974759723e-06, + "loss": 0.0253, + "num_input_tokens_seen": 925888, + "step": 1885 + }, + { + "epoch": 0.2494390919889138, + "grad_norm": 18.70522689819336, + "learning_rate": 1.8672895791788445e-06, + "loss": 0.0925, + "num_input_tokens_seen": 928704, + "step": 1890 + }, + { + "epoch": 0.2500989837666623, + "grad_norm": 134.16648864746094, + "learning_rate": 1.8661405587154017e-06, + "loss": 0.2857, + "num_input_tokens_seen": 930944, + "step": 1895 + }, + { + "epoch": 0.2500989837666623, + "eval_loss": 0.13187885284423828, + "eval_runtime": 7.8602, + "eval_samples_per_second": 856.843, + "eval_steps_per_second": 107.121, + "num_input_tokens_seen": 930944, + "step": 1895 + }, + { + "epoch": 0.25075887554441073, + "grad_norm": 169.28016662597656, + "learning_rate": 1.8649869421827808e-06, + "loss": 0.3692, + "num_input_tokens_seen": 933376, + "step": 1900 + }, + { + "epoch": 0.2514187673221592, + "grad_norm": 2.5725350379943848, + "learning_rate": 1.863828735702507e-06, + "loss": 0.0896, + "num_input_tokens_seen": 936000, + "step": 1905 + }, + { + "epoch": 0.2520786590999076, + "grad_norm": 99.35297393798828, + "learning_rate": 1.862665945420462e-06, + "loss": 0.1121, + "num_input_tokens_seen": 938432, + "step": 1910 + }, + { + "epoch": 0.25273855087765607, + "grad_norm": 29.4595947265625, + "learning_rate": 1.8614985775068498e-06, + "loss": 0.1862, + "num_input_tokens_seen": 941312, + "step": 1915 + }, + { + "epoch": 0.2533984426554045, + "grad_norm": 2.1499125957489014, + "learning_rate": 1.860326638156167e-06, + "loss": 0.0727, + "num_input_tokens_seen": 943488, + "step": 1920 + }, + { + "epoch": 0.25405833443315295, + "grad_norm": 32.39081573486328, + "learning_rate": 1.8591501335871653e-06, + "loss": 0.083, + "num_input_tokens_seen": 945856, + "step": 1925 + }, + { + "epoch": 0.2547182262109014, + "grad_norm": 132.70303344726562, + "learning_rate": 1.857969070042824e-06, + "loss": 0.2212, + "num_input_tokens_seen": 948352, + "step": 1930 + }, + { + "epoch": 0.25537811798864984, + "grad_norm": 0.30987945199012756, + "learning_rate": 1.8567834537903116e-06, + "loss": 0.08, + "num_input_tokens_seen": 950976, + "step": 1935 + }, + { + "epoch": 0.2560380097663983, + "grad_norm": 26.0654296875, + "learning_rate": 1.8555932911209565e-06, + "loss": 0.1289, + "num_input_tokens_seen": 953216, + "step": 1940 + }, + { + "epoch": 0.25669790154414673, + "grad_norm": 0.553709089756012, + "learning_rate": 1.8543985883502119e-06, + "loss": 0.0221, + "num_input_tokens_seen": 955648, + "step": 1945 + }, + { + "epoch": 0.25735779332189523, + "grad_norm": 0.7263230681419373, + "learning_rate": 1.8531993518176216e-06, + "loss": 0.0906, + "num_input_tokens_seen": 957888, + "step": 1950 + }, + { + "epoch": 0.2580176850996437, + "grad_norm": 19.012561798095703, + "learning_rate": 1.8519955878867889e-06, + "loss": 0.3163, + "num_input_tokens_seen": 960128, + "step": 1955 + }, + { + "epoch": 0.2586775768773921, + "grad_norm": 0.9245926141738892, + "learning_rate": 1.8507873029453392e-06, + "loss": 0.1495, + "num_input_tokens_seen": 962496, + "step": 1960 + }, + { + "epoch": 0.25933746865514057, + "grad_norm": 16.104307174682617, + "learning_rate": 1.8495745034048896e-06, + "loss": 0.1628, + "num_input_tokens_seen": 965120, + "step": 1965 + }, + { + "epoch": 0.259997360432889, + "grad_norm": 0.15961866080760956, + "learning_rate": 1.8483571957010127e-06, + "loss": 0.045, + "num_input_tokens_seen": 967616, + "step": 1970 + }, + { + "epoch": 0.26065725221063746, + "grad_norm": 0.15467530488967896, + "learning_rate": 1.8471353862932035e-06, + "loss": 0.0574, + "num_input_tokens_seen": 970240, + "step": 1975 + }, + { + "epoch": 0.2613171439883859, + "grad_norm": 5.751570224761963, + "learning_rate": 1.8459090816648444e-06, + "loss": 0.0719, + "num_input_tokens_seen": 972544, + "step": 1980 + }, + { + "epoch": 0.26197703576613435, + "grad_norm": 0.7070101499557495, + "learning_rate": 1.8446782883231713e-06, + "loss": 0.2544, + "num_input_tokens_seen": 974912, + "step": 1985 + }, + { + "epoch": 0.2626369275438828, + "grad_norm": 21.680789947509766, + "learning_rate": 1.8434430127992387e-06, + "loss": 0.4055, + "num_input_tokens_seen": 977088, + "step": 1990 + }, + { + "epoch": 0.26329681932163124, + "grad_norm": 218.16334533691406, + "learning_rate": 1.8422032616478857e-06, + "loss": 0.1845, + "num_input_tokens_seen": 979648, + "step": 1995 + }, + { + "epoch": 0.2639567110993797, + "grad_norm": 2.263739585876465, + "learning_rate": 1.8409590414477001e-06, + "loss": 0.1184, + "num_input_tokens_seen": 982336, + "step": 2000 + }, + { + "epoch": 0.2646166028771281, + "grad_norm": 4.402483940124512, + "learning_rate": 1.839710358800985e-06, + "loss": 0.0071, + "num_input_tokens_seen": 984768, + "step": 2005 + }, + { + "epoch": 0.2652764946548766, + "grad_norm": 1.3311794996261597, + "learning_rate": 1.8384572203337224e-06, + "loss": 0.049, + "num_input_tokens_seen": 987136, + "step": 2010 + }, + { + "epoch": 0.26593638643262507, + "grad_norm": 0.14126527309417725, + "learning_rate": 1.837199632695538e-06, + "loss": 0.1358, + "num_input_tokens_seen": 989824, + "step": 2015 + }, + { + "epoch": 0.2665962782103735, + "grad_norm": 113.8551254272461, + "learning_rate": 1.8359376025596682e-06, + "loss": 0.2944, + "num_input_tokens_seen": 992064, + "step": 2020 + }, + { + "epoch": 0.26725616998812196, + "grad_norm": 35.01311111450195, + "learning_rate": 1.8346711366229215e-06, + "loss": 0.1288, + "num_input_tokens_seen": 994368, + "step": 2025 + }, + { + "epoch": 0.2679160617658704, + "grad_norm": 17.396068572998047, + "learning_rate": 1.8334002416056442e-06, + "loss": 0.181, + "num_input_tokens_seen": 996864, + "step": 2030 + }, + { + "epoch": 0.26857595354361885, + "grad_norm": 0.1548883020877838, + "learning_rate": 1.8321249242516865e-06, + "loss": 0.2285, + "num_input_tokens_seen": 999360, + "step": 2035 + }, + { + "epoch": 0.2692358453213673, + "grad_norm": 51.23111343383789, + "learning_rate": 1.8308451913283638e-06, + "loss": 0.0873, + "num_input_tokens_seen": 1001920, + "step": 2040 + }, + { + "epoch": 0.26989573709911574, + "grad_norm": 0.2864314913749695, + "learning_rate": 1.8295610496264229e-06, + "loss": 0.0305, + "num_input_tokens_seen": 1004224, + "step": 2045 + }, + { + "epoch": 0.2705556288768642, + "grad_norm": 0.4007130563259125, + "learning_rate": 1.828272505960005e-06, + "loss": 0.0393, + "num_input_tokens_seen": 1006528, + "step": 2050 + }, + { + "epoch": 0.27121552065461263, + "grad_norm": 0.32620009779930115, + "learning_rate": 1.8269795671666098e-06, + "loss": 0.1813, + "num_input_tokens_seen": 1008896, + "step": 2055 + }, + { + "epoch": 0.2718754124323611, + "grad_norm": 0.6125988960266113, + "learning_rate": 1.8256822401070591e-06, + "loss": 0.1234, + "num_input_tokens_seen": 1011648, + "step": 2060 + }, + { + "epoch": 0.2725353042101095, + "grad_norm": 31.247455596923828, + "learning_rate": 1.8243805316654611e-06, + "loss": 0.0522, + "num_input_tokens_seen": 1014208, + "step": 2065 + }, + { + "epoch": 0.27319519598785796, + "grad_norm": 155.57479858398438, + "learning_rate": 1.823074448749172e-06, + "loss": 0.1725, + "num_input_tokens_seen": 1016640, + "step": 2070 + }, + { + "epoch": 0.27385508776560646, + "grad_norm": 0.04504437372088432, + "learning_rate": 1.8217639982887623e-06, + "loss": 0.063, + "num_input_tokens_seen": 1019328, + "step": 2075 + }, + { + "epoch": 0.2745149795433549, + "grad_norm": 0.030620688572525978, + "learning_rate": 1.8204491872379769e-06, + "loss": 0.0781, + "num_input_tokens_seen": 1021696, + "step": 2080 + }, + { + "epoch": 0.27517487132110335, + "grad_norm": 0.2540840208530426, + "learning_rate": 1.8191300225737e-06, + "loss": 0.09, + "num_input_tokens_seen": 1024256, + "step": 2085 + }, + { + "epoch": 0.2758347630988518, + "grad_norm": 35.219879150390625, + "learning_rate": 1.8178065112959184e-06, + "loss": 0.2074, + "num_input_tokens_seen": 1026560, + "step": 2090 + }, + { + "epoch": 0.27649465487660024, + "grad_norm": 56.63616943359375, + "learning_rate": 1.8164786604276832e-06, + "loss": 0.2426, + "num_input_tokens_seen": 1029184, + "step": 2095 + }, + { + "epoch": 0.2771545466543487, + "grad_norm": 0.794495701789856, + "learning_rate": 1.8151464770150727e-06, + "loss": 0.1464, + "num_input_tokens_seen": 1031744, + "step": 2100 + }, + { + "epoch": 0.27781443843209713, + "grad_norm": 0.1718120276927948, + "learning_rate": 1.8138099681271558e-06, + "loss": 0.1528, + "num_input_tokens_seen": 1034048, + "step": 2105 + }, + { + "epoch": 0.2784743302098456, + "grad_norm": 0.1188565269112587, + "learning_rate": 1.8124691408559536e-06, + "loss": 0.1601, + "num_input_tokens_seen": 1036544, + "step": 2110 + }, + { + "epoch": 0.279134221987594, + "grad_norm": 0.09950896352529526, + "learning_rate": 1.8111240023164023e-06, + "loss": 0.1008, + "num_input_tokens_seen": 1038848, + "step": 2115 + }, + { + "epoch": 0.27979411376534247, + "grad_norm": 47.676021575927734, + "learning_rate": 1.809774559646316e-06, + "loss": 0.0632, + "num_input_tokens_seen": 1041152, + "step": 2120 + }, + { + "epoch": 0.2804540055430909, + "grad_norm": 19.95380401611328, + "learning_rate": 1.8084208200063469e-06, + "loss": 0.0935, + "num_input_tokens_seen": 1043968, + "step": 2125 + }, + { + "epoch": 0.28111389732083936, + "grad_norm": 20.683349609375, + "learning_rate": 1.8070627905799496e-06, + "loss": 0.2149, + "num_input_tokens_seen": 1046272, + "step": 2130 + }, + { + "epoch": 0.28177378909858786, + "grad_norm": 0.5064588189125061, + "learning_rate": 1.8057004785733413e-06, + "loss": 0.0862, + "num_input_tokens_seen": 1048448, + "step": 2135 + }, + { + "epoch": 0.2824336808763363, + "grad_norm": 2.3065133094787598, + "learning_rate": 1.8043338912154647e-06, + "loss": 0.1758, + "num_input_tokens_seen": 1051072, + "step": 2140 + }, + { + "epoch": 0.28309357265408475, + "grad_norm": 0.986880362033844, + "learning_rate": 1.8029630357579486e-06, + "loss": 0.0486, + "num_input_tokens_seen": 1053312, + "step": 2145 + }, + { + "epoch": 0.2837534644318332, + "grad_norm": 0.09180797636508942, + "learning_rate": 1.8015879194750702e-06, + "loss": 0.0795, + "num_input_tokens_seen": 1055680, + "step": 2150 + }, + { + "epoch": 0.28441335620958164, + "grad_norm": 0.19105878472328186, + "learning_rate": 1.8002085496637165e-06, + "loss": 0.187, + "num_input_tokens_seen": 1057984, + "step": 2155 + }, + { + "epoch": 0.2850732479873301, + "grad_norm": 0.3145781457424164, + "learning_rate": 1.7988249336433448e-06, + "loss": 0.1492, + "num_input_tokens_seen": 1060736, + "step": 2160 + }, + { + "epoch": 0.2857331397650785, + "grad_norm": 0.49677714705467224, + "learning_rate": 1.7974370787559447e-06, + "loss": 0.1319, + "num_input_tokens_seen": 1063424, + "step": 2165 + }, + { + "epoch": 0.28639303154282697, + "grad_norm": 0.031023921445012093, + "learning_rate": 1.796044992365999e-06, + "loss": 0.0575, + "num_input_tokens_seen": 1065728, + "step": 2170 + }, + { + "epoch": 0.2870529233205754, + "grad_norm": 0.07371291518211365, + "learning_rate": 1.794648681860444e-06, + "loss": 0.0009, + "num_input_tokens_seen": 1068160, + "step": 2175 + }, + { + "epoch": 0.28771281509832386, + "grad_norm": 0.030941056087613106, + "learning_rate": 1.7932481546486312e-06, + "loss": 0.2734, + "num_input_tokens_seen": 1070592, + "step": 2180 + }, + { + "epoch": 0.2883727068760723, + "grad_norm": 20.994426727294922, + "learning_rate": 1.791843418162287e-06, + "loss": 0.1758, + "num_input_tokens_seen": 1073280, + "step": 2185 + }, + { + "epoch": 0.28903259865382075, + "grad_norm": 6.4550886154174805, + "learning_rate": 1.7904344798554748e-06, + "loss": 0.0031, + "num_input_tokens_seen": 1075584, + "step": 2190 + }, + { + "epoch": 0.28969249043156925, + "grad_norm": 4.786499977111816, + "learning_rate": 1.789021347204553e-06, + "loss": 0.0927, + "num_input_tokens_seen": 1078016, + "step": 2195 + }, + { + "epoch": 0.2903523822093177, + "grad_norm": 2.4327032566070557, + "learning_rate": 1.7876040277081381e-06, + "loss": 0.1631, + "num_input_tokens_seen": 1080512, + "step": 2200 + }, + { + "epoch": 0.29101227398706614, + "grad_norm": 128.65020751953125, + "learning_rate": 1.7861825288870632e-06, + "loss": 0.0382, + "num_input_tokens_seen": 1082752, + "step": 2205 + }, + { + "epoch": 0.2916721657648146, + "grad_norm": 12.312292098999023, + "learning_rate": 1.7847568582843376e-06, + "loss": 0.3717, + "num_input_tokens_seen": 1085184, + "step": 2210 + }, + { + "epoch": 0.29233205754256303, + "grad_norm": 24.310449600219727, + "learning_rate": 1.7833270234651088e-06, + "loss": 0.1799, + "num_input_tokens_seen": 1087360, + "step": 2215 + }, + { + "epoch": 0.2929919493203115, + "grad_norm": 14.611623764038086, + "learning_rate": 1.781893032016621e-06, + "loss": 0.0596, + "num_input_tokens_seen": 1089984, + "step": 2220 + }, + { + "epoch": 0.2936518410980599, + "grad_norm": 0.6433891654014587, + "learning_rate": 1.7804548915481746e-06, + "loss": 0.0264, + "num_input_tokens_seen": 1092608, + "step": 2225 + }, + { + "epoch": 0.29431173287580836, + "grad_norm": 0.19885502755641937, + "learning_rate": 1.7790126096910865e-06, + "loss": 0.1052, + "num_input_tokens_seen": 1095040, + "step": 2230 + }, + { + "epoch": 0.2949716246535568, + "grad_norm": 12.348299980163574, + "learning_rate": 1.7775661940986492e-06, + "loss": 0.1063, + "num_input_tokens_seen": 1097728, + "step": 2235 + }, + { + "epoch": 0.29563151643130525, + "grad_norm": 1.2165111303329468, + "learning_rate": 1.776115652446091e-06, + "loss": 0.1857, + "num_input_tokens_seen": 1100096, + "step": 2240 + }, + { + "epoch": 0.2962914082090537, + "grad_norm": 149.12095642089844, + "learning_rate": 1.7746609924305336e-06, + "loss": 0.1076, + "num_input_tokens_seen": 1102400, + "step": 2245 + }, + { + "epoch": 0.29695129998680214, + "grad_norm": 0.0535690002143383, + "learning_rate": 1.7732022217709534e-06, + "loss": 0.0825, + "num_input_tokens_seen": 1104960, + "step": 2250 + }, + { + "epoch": 0.2976111917645506, + "grad_norm": 12.77878475189209, + "learning_rate": 1.7717393482081384e-06, + "loss": 0.1648, + "num_input_tokens_seen": 1107520, + "step": 2255 + }, + { + "epoch": 0.2982710835422991, + "grad_norm": 37.477237701416016, + "learning_rate": 1.7702723795046492e-06, + "loss": 0.1223, + "num_input_tokens_seen": 1109952, + "step": 2260 + }, + { + "epoch": 0.29893097532004753, + "grad_norm": 0.3493918478488922, + "learning_rate": 1.7688013234447757e-06, + "loss": 0.0026, + "num_input_tokens_seen": 1112128, + "step": 2265 + }, + { + "epoch": 0.299590867097796, + "grad_norm": 0.07301745563745499, + "learning_rate": 1.7673261878344973e-06, + "loss": 0.1387, + "num_input_tokens_seen": 1114688, + "step": 2270 + }, + { + "epoch": 0.30011878051999474, + "eval_loss": 0.12411058694124222, + "eval_runtime": 7.994, + "eval_samples_per_second": 842.505, + "eval_steps_per_second": 105.329, + "num_input_tokens_seen": 1116800, + "step": 2274 + }, + { + "epoch": 0.3002507588755444, + "grad_norm": 0.08390434831380844, + "learning_rate": 1.7658469805014414e-06, + "loss": 0.1185, + "num_input_tokens_seen": 1117248, + "step": 2275 + }, + { + "epoch": 0.30091065065329287, + "grad_norm": 41.85004806518555, + "learning_rate": 1.7643637092948415e-06, + "loss": 0.1096, + "num_input_tokens_seen": 1119808, + "step": 2280 + }, + { + "epoch": 0.3015705424310413, + "grad_norm": 55.66747283935547, + "learning_rate": 1.7628763820854948e-06, + "loss": 0.2572, + "num_input_tokens_seen": 1122112, + "step": 2285 + }, + { + "epoch": 0.30223043420878976, + "grad_norm": 0.3250507712364197, + "learning_rate": 1.7613850067657216e-06, + "loss": 0.0884, + "num_input_tokens_seen": 1124544, + "step": 2290 + }, + { + "epoch": 0.3028903259865382, + "grad_norm": 0.10577468574047089, + "learning_rate": 1.7598895912493232e-06, + "loss": 0.1247, + "num_input_tokens_seen": 1127104, + "step": 2295 + }, + { + "epoch": 0.30355021776428665, + "grad_norm": 0.9884712100028992, + "learning_rate": 1.7583901434715397e-06, + "loss": 0.0773, + "num_input_tokens_seen": 1129536, + "step": 2300 + }, + { + "epoch": 0.3042101095420351, + "grad_norm": 45.45866394042969, + "learning_rate": 1.7568866713890074e-06, + "loss": 0.1009, + "num_input_tokens_seen": 1131840, + "step": 2305 + }, + { + "epoch": 0.30487000131978353, + "grad_norm": 1.1424263715744019, + "learning_rate": 1.7553791829797175e-06, + "loss": 0.1243, + "num_input_tokens_seen": 1134336, + "step": 2310 + }, + { + "epoch": 0.305529893097532, + "grad_norm": 28.028568267822266, + "learning_rate": 1.7538676862429737e-06, + "loss": 0.3449, + "num_input_tokens_seen": 1136640, + "step": 2315 + }, + { + "epoch": 0.3061897848752805, + "grad_norm": 0.5848109126091003, + "learning_rate": 1.7523521891993486e-06, + "loss": 0.1248, + "num_input_tokens_seen": 1139136, + "step": 2320 + }, + { + "epoch": 0.3068496766530289, + "grad_norm": 0.08309627324342728, + "learning_rate": 1.7508326998906422e-06, + "loss": 0.0367, + "num_input_tokens_seen": 1141568, + "step": 2325 + }, + { + "epoch": 0.30750956843077737, + "grad_norm": 0.08207709342241287, + "learning_rate": 1.7493092263798394e-06, + "loss": 0.0023, + "num_input_tokens_seen": 1143936, + "step": 2330 + }, + { + "epoch": 0.3081694602085258, + "grad_norm": 156.30946350097656, + "learning_rate": 1.7477817767510664e-06, + "loss": 0.0188, + "num_input_tokens_seen": 1146624, + "step": 2335 + }, + { + "epoch": 0.30882935198627426, + "grad_norm": 0.43475231528282166, + "learning_rate": 1.7462503591095484e-06, + "loss": 0.0209, + "num_input_tokens_seen": 1149120, + "step": 2340 + }, + { + "epoch": 0.3094892437640227, + "grad_norm": 0.033984895795583725, + "learning_rate": 1.7447149815815659e-06, + "loss": 0.1152, + "num_input_tokens_seen": 1151488, + "step": 2345 + }, + { + "epoch": 0.31014913554177115, + "grad_norm": 0.023453880101442337, + "learning_rate": 1.7431756523144126e-06, + "loss": 0.1426, + "num_input_tokens_seen": 1153600, + "step": 2350 + }, + { + "epoch": 0.3108090273195196, + "grad_norm": 0.04266361892223358, + "learning_rate": 1.7416323794763512e-06, + "loss": 0.0021, + "num_input_tokens_seen": 1156224, + "step": 2355 + }, + { + "epoch": 0.31146891909726804, + "grad_norm": 0.01946975663304329, + "learning_rate": 1.7400851712565707e-06, + "loss": 0.234, + "num_input_tokens_seen": 1158656, + "step": 2360 + }, + { + "epoch": 0.3121288108750165, + "grad_norm": 0.08395219594240189, + "learning_rate": 1.7385340358651432e-06, + "loss": 0.1276, + "num_input_tokens_seen": 1161408, + "step": 2365 + }, + { + "epoch": 0.3127887026527649, + "grad_norm": 105.1695327758789, + "learning_rate": 1.736978981532979e-06, + "loss": 0.0223, + "num_input_tokens_seen": 1163904, + "step": 2370 + }, + { + "epoch": 0.31344859443051337, + "grad_norm": 0.06841170787811279, + "learning_rate": 1.7354200165117838e-06, + "loss": 0.2808, + "num_input_tokens_seen": 1166208, + "step": 2375 + }, + { + "epoch": 0.3141084862082619, + "grad_norm": 0.11680270731449127, + "learning_rate": 1.733857149074016e-06, + "loss": 0.2086, + "num_input_tokens_seen": 1168512, + "step": 2380 + }, + { + "epoch": 0.3147683779860103, + "grad_norm": 0.2520144581794739, + "learning_rate": 1.7322903875128402e-06, + "loss": 0.2359, + "num_input_tokens_seen": 1171072, + "step": 2385 + }, + { + "epoch": 0.31542826976375876, + "grad_norm": 0.23810061812400818, + "learning_rate": 1.7307197401420858e-06, + "loss": 0.0071, + "num_input_tokens_seen": 1173312, + "step": 2390 + }, + { + "epoch": 0.3160881615415072, + "grad_norm": 0.48759013414382935, + "learning_rate": 1.7291452152962018e-06, + "loss": 0.1059, + "num_input_tokens_seen": 1175744, + "step": 2395 + }, + { + "epoch": 0.31674805331925565, + "grad_norm": 45.06856918334961, + "learning_rate": 1.7275668213302116e-06, + "loss": 0.2033, + "num_input_tokens_seen": 1178112, + "step": 2400 + }, + { + "epoch": 0.3174079450970041, + "grad_norm": 44.76649856567383, + "learning_rate": 1.72598456661967e-06, + "loss": 0.0488, + "num_input_tokens_seen": 1180352, + "step": 2405 + }, + { + "epoch": 0.31806783687475254, + "grad_norm": 0.12351297587156296, + "learning_rate": 1.7243984595606191e-06, + "loss": 0.1241, + "num_input_tokens_seen": 1182528, + "step": 2410 + }, + { + "epoch": 0.318727728652501, + "grad_norm": 3.226271152496338, + "learning_rate": 1.722808508569542e-06, + "loss": 0.0697, + "num_input_tokens_seen": 1185280, + "step": 2415 + }, + { + "epoch": 0.31938762043024943, + "grad_norm": 16.573923110961914, + "learning_rate": 1.72121472208332e-06, + "loss": 0.0766, + "num_input_tokens_seen": 1188032, + "step": 2420 + }, + { + "epoch": 0.3200475122079979, + "grad_norm": 92.98533630371094, + "learning_rate": 1.7196171085591864e-06, + "loss": 0.1857, + "num_input_tokens_seen": 1190464, + "step": 2425 + }, + { + "epoch": 0.3207074039857463, + "grad_norm": 37.98392868041992, + "learning_rate": 1.7180156764746824e-06, + "loss": 0.2532, + "num_input_tokens_seen": 1192960, + "step": 2430 + }, + { + "epoch": 0.32136729576349476, + "grad_norm": 0.12210986018180847, + "learning_rate": 1.7164104343276113e-06, + "loss": 0.0694, + "num_input_tokens_seen": 1195072, + "step": 2435 + }, + { + "epoch": 0.3220271875412432, + "grad_norm": 0.015084991231560707, + "learning_rate": 1.714801390635996e-06, + "loss": 0.0516, + "num_input_tokens_seen": 1197376, + "step": 2440 + }, + { + "epoch": 0.3226870793189917, + "grad_norm": 0.035268671810626984, + "learning_rate": 1.7131885539380297e-06, + "loss": 0.0735, + "num_input_tokens_seen": 1199936, + "step": 2445 + }, + { + "epoch": 0.32334697109674015, + "grad_norm": 33.19987106323242, + "learning_rate": 1.7115719327920335e-06, + "loss": 0.141, + "num_input_tokens_seen": 1202368, + "step": 2450 + }, + { + "epoch": 0.3240068628744886, + "grad_norm": 0.026460843160748482, + "learning_rate": 1.70995153577641e-06, + "loss": 0.0172, + "num_input_tokens_seen": 1204800, + "step": 2455 + }, + { + "epoch": 0.32466675465223704, + "grad_norm": 33.02996826171875, + "learning_rate": 1.7083273714895991e-06, + "loss": 0.0639, + "num_input_tokens_seen": 1207552, + "step": 2460 + }, + { + "epoch": 0.3253266464299855, + "grad_norm": 0.04908216744661331, + "learning_rate": 1.7066994485500298e-06, + "loss": 0.1031, + "num_input_tokens_seen": 1209856, + "step": 2465 + }, + { + "epoch": 0.32598653820773393, + "grad_norm": 0.16728860139846802, + "learning_rate": 1.7050677755960762e-06, + "loss": 0.1125, + "num_input_tokens_seen": 1212352, + "step": 2470 + }, + { + "epoch": 0.3266464299854824, + "grad_norm": 0.5578970313072205, + "learning_rate": 1.7034323612860124e-06, + "loss": 0.0832, + "num_input_tokens_seen": 1214912, + "step": 2475 + }, + { + "epoch": 0.3273063217632308, + "grad_norm": 0.029092831537127495, + "learning_rate": 1.7017932142979645e-06, + "loss": 0.1275, + "num_input_tokens_seen": 1217088, + "step": 2480 + }, + { + "epoch": 0.32796621354097927, + "grad_norm": 0.5877671241760254, + "learning_rate": 1.700150343329866e-06, + "loss": 0.2478, + "num_input_tokens_seen": 1219584, + "step": 2485 + }, + { + "epoch": 0.3286261053187277, + "grad_norm": 62.71138000488281, + "learning_rate": 1.6985037570994113e-06, + "loss": 0.1182, + "num_input_tokens_seen": 1222336, + "step": 2490 + }, + { + "epoch": 0.32928599709647616, + "grad_norm": 0.06207147613167763, + "learning_rate": 1.6968534643440088e-06, + "loss": 0.0913, + "num_input_tokens_seen": 1224832, + "step": 2495 + }, + { + "epoch": 0.3299458888742246, + "grad_norm": 23.29184913635254, + "learning_rate": 1.6951994738207364e-06, + "loss": 0.1998, + "num_input_tokens_seen": 1227392, + "step": 2500 + }, + { + "epoch": 0.3306057806519731, + "grad_norm": 14.910649299621582, + "learning_rate": 1.6935417943062928e-06, + "loss": 0.2007, + "num_input_tokens_seen": 1229952, + "step": 2505 + }, + { + "epoch": 0.33126567242972155, + "grad_norm": 1.2473188638687134, + "learning_rate": 1.6918804345969516e-06, + "loss": 0.0615, + "num_input_tokens_seen": 1232640, + "step": 2510 + }, + { + "epoch": 0.33192556420747, + "grad_norm": 121.41654968261719, + "learning_rate": 1.6902154035085156e-06, + "loss": 0.0479, + "num_input_tokens_seen": 1235200, + "step": 2515 + }, + { + "epoch": 0.33258545598521844, + "grad_norm": 0.5897153615951538, + "learning_rate": 1.688546709876269e-06, + "loss": 0.1243, + "num_input_tokens_seen": 1237632, + "step": 2520 + }, + { + "epoch": 0.3332453477629669, + "grad_norm": 1.850326418876648, + "learning_rate": 1.6868743625549314e-06, + "loss": 0.0662, + "num_input_tokens_seen": 1239936, + "step": 2525 + }, + { + "epoch": 0.3339052395407153, + "grad_norm": 0.34998998045921326, + "learning_rate": 1.6851983704186092e-06, + "loss": 0.0455, + "num_input_tokens_seen": 1242304, + "step": 2530 + }, + { + "epoch": 0.33456513131846377, + "grad_norm": 0.0726654902100563, + "learning_rate": 1.6835187423607503e-06, + "loss": 0.0018, + "num_input_tokens_seen": 1244736, + "step": 2535 + }, + { + "epoch": 0.3352250230962122, + "grad_norm": 0.07731109857559204, + "learning_rate": 1.681835487294096e-06, + "loss": 0.1863, + "num_input_tokens_seen": 1247488, + "step": 2540 + }, + { + "epoch": 0.33588491487396066, + "grad_norm": 0.04418403282761574, + "learning_rate": 1.6801486141506342e-06, + "loss": 0.229, + "num_input_tokens_seen": 1250048, + "step": 2545 + }, + { + "epoch": 0.3365448066517091, + "grad_norm": 133.3740692138672, + "learning_rate": 1.6784581318815514e-06, + "loss": 0.3541, + "num_input_tokens_seen": 1252928, + "step": 2550 + }, + { + "epoch": 0.33720469842945755, + "grad_norm": 0.03932896628975868, + "learning_rate": 1.6767640494571849e-06, + "loss": 0.1596, + "num_input_tokens_seen": 1255488, + "step": 2555 + }, + { + "epoch": 0.337864590207206, + "grad_norm": 33.07372283935547, + "learning_rate": 1.6750663758669767e-06, + "loss": 0.3643, + "num_input_tokens_seen": 1257984, + "step": 2560 + }, + { + "epoch": 0.3385244819849545, + "grad_norm": 0.150083988904953, + "learning_rate": 1.6733651201194245e-06, + "loss": 0.1098, + "num_input_tokens_seen": 1260416, + "step": 2565 + }, + { + "epoch": 0.33918437376270294, + "grad_norm": 19.72997283935547, + "learning_rate": 1.6716602912420342e-06, + "loss": 0.1186, + "num_input_tokens_seen": 1263168, + "step": 2570 + }, + { + "epoch": 0.3398442655404514, + "grad_norm": 0.24268358945846558, + "learning_rate": 1.6699518982812726e-06, + "loss": 0.1177, + "num_input_tokens_seen": 1265600, + "step": 2575 + }, + { + "epoch": 0.34050415731819983, + "grad_norm": 0.06883673369884491, + "learning_rate": 1.6682399503025183e-06, + "loss": 0.0041, + "num_input_tokens_seen": 1268032, + "step": 2580 + }, + { + "epoch": 0.3411640490959483, + "grad_norm": 38.50511932373047, + "learning_rate": 1.666524456390014e-06, + "loss": 0.1831, + "num_input_tokens_seen": 1270336, + "step": 2585 + }, + { + "epoch": 0.3418239408736967, + "grad_norm": 25.056659698486328, + "learning_rate": 1.664805425646819e-06, + "loss": 0.0639, + "num_input_tokens_seen": 1273088, + "step": 2590 + }, + { + "epoch": 0.34248383265144516, + "grad_norm": 0.358341783285141, + "learning_rate": 1.6630828671947606e-06, + "loss": 0.2223, + "num_input_tokens_seen": 1275456, + "step": 2595 + }, + { + "epoch": 0.3431437244291936, + "grad_norm": 0.3967565596103668, + "learning_rate": 1.6613567901743842e-06, + "loss": 0.0484, + "num_input_tokens_seen": 1277888, + "step": 2600 + }, + { + "epoch": 0.34380361620694205, + "grad_norm": 0.4620976448059082, + "learning_rate": 1.6596272037449075e-06, + "loss": 0.0021, + "num_input_tokens_seen": 1280384, + "step": 2605 + }, + { + "epoch": 0.3444635079846905, + "grad_norm": 111.44522094726562, + "learning_rate": 1.6578941170841696e-06, + "loss": 0.0633, + "num_input_tokens_seen": 1282944, + "step": 2610 + }, + { + "epoch": 0.34512339976243894, + "grad_norm": 10.548276901245117, + "learning_rate": 1.6561575393885833e-06, + "loss": 0.0451, + "num_input_tokens_seen": 1285184, + "step": 2615 + }, + { + "epoch": 0.3457832915401874, + "grad_norm": 0.21035003662109375, + "learning_rate": 1.6544174798730864e-06, + "loss": 0.2038, + "num_input_tokens_seen": 1287808, + "step": 2620 + }, + { + "epoch": 0.34644318331793583, + "grad_norm": 0.9157705307006836, + "learning_rate": 1.6526739477710923e-06, + "loss": 0.1932, + "num_input_tokens_seen": 1290432, + "step": 2625 + }, + { + "epoch": 0.34710307509568433, + "grad_norm": 318.77642822265625, + "learning_rate": 1.650926952334441e-06, + "loss": 0.2289, + "num_input_tokens_seen": 1292736, + "step": 2630 + }, + { + "epoch": 0.3477629668734328, + "grad_norm": 0.13021092116832733, + "learning_rate": 1.6491765028333516e-06, + "loss": 0.2947, + "num_input_tokens_seen": 1295104, + "step": 2635 + }, + { + "epoch": 0.3484228586511812, + "grad_norm": 0.7741267681121826, + "learning_rate": 1.6474226085563693e-06, + "loss": 0.0444, + "num_input_tokens_seen": 1297600, + "step": 2640 + }, + { + "epoch": 0.34908275042892967, + "grad_norm": 0.11857028305530548, + "learning_rate": 1.6456652788103215e-06, + "loss": 0.0057, + "num_input_tokens_seen": 1300224, + "step": 2645 + }, + { + "epoch": 0.3497426422066781, + "grad_norm": 0.3336769640445709, + "learning_rate": 1.6439045229202631e-06, + "loss": 0.0494, + "num_input_tokens_seen": 1302528, + "step": 2650 + }, + { + "epoch": 0.3501385772733272, + "eval_loss": 0.13837853074073792, + "eval_runtime": 7.8873, + "eval_samples_per_second": 853.902, + "eval_steps_per_second": 106.754, + "num_input_tokens_seen": 1303872, + "step": 2653 + }, + { + "epoch": 0.35040253398442656, + "grad_norm": 0.26019707322120667, + "learning_rate": 1.6421403502294307e-06, + "loss": 0.1541, + "num_input_tokens_seen": 1305024, + "step": 2655 + }, + { + "epoch": 0.351062425762175, + "grad_norm": 0.39249280095100403, + "learning_rate": 1.6403727700991915e-06, + "loss": 0.1878, + "num_input_tokens_seen": 1307392, + "step": 2660 + }, + { + "epoch": 0.35172231753992345, + "grad_norm": 0.15294888615608215, + "learning_rate": 1.6386017919089933e-06, + "loss": 0.273, + "num_input_tokens_seen": 1310016, + "step": 2665 + }, + { + "epoch": 0.3523822093176719, + "grad_norm": 0.07149966061115265, + "learning_rate": 1.636827425056316e-06, + "loss": 0.0471, + "num_input_tokens_seen": 1312576, + "step": 2670 + }, + { + "epoch": 0.35304210109542034, + "grad_norm": 0.1564963310956955, + "learning_rate": 1.635049678956621e-06, + "loss": 0.1356, + "num_input_tokens_seen": 1315072, + "step": 2675 + }, + { + "epoch": 0.3537019928731688, + "grad_norm": 3.6665759086608887, + "learning_rate": 1.633268563043301e-06, + "loss": 0.125, + "num_input_tokens_seen": 1317504, + "step": 2680 + }, + { + "epoch": 0.3543618846509172, + "grad_norm": 0.23970353603363037, + "learning_rate": 1.63148408676763e-06, + "loss": 0.0021, + "num_input_tokens_seen": 1319680, + "step": 2685 + }, + { + "epoch": 0.3550217764286657, + "grad_norm": 0.059584952890872955, + "learning_rate": 1.6296962595987141e-06, + "loss": 0.001, + "num_input_tokens_seen": 1322240, + "step": 2690 + }, + { + "epoch": 0.35568166820641417, + "grad_norm": 0.21580637991428375, + "learning_rate": 1.6279050910234392e-06, + "loss": 0.1102, + "num_input_tokens_seen": 1324736, + "step": 2695 + }, + { + "epoch": 0.3563415599841626, + "grad_norm": 0.024059053510427475, + "learning_rate": 1.626110590546423e-06, + "loss": 0.0617, + "num_input_tokens_seen": 1327104, + "step": 2700 + }, + { + "epoch": 0.35700145176191106, + "grad_norm": 188.6191864013672, + "learning_rate": 1.6243127676899635e-06, + "loss": 0.2021, + "num_input_tokens_seen": 1329920, + "step": 2705 + }, + { + "epoch": 0.3576613435396595, + "grad_norm": 0.04233895614743233, + "learning_rate": 1.6225116319939884e-06, + "loss": 0.2292, + "num_input_tokens_seen": 1332352, + "step": 2710 + }, + { + "epoch": 0.35832123531740795, + "grad_norm": 79.07254028320312, + "learning_rate": 1.6207071930160044e-06, + "loss": 0.1136, + "num_input_tokens_seen": 1335040, + "step": 2715 + }, + { + "epoch": 0.3589811270951564, + "grad_norm": 0.3499235510826111, + "learning_rate": 1.6188994603310468e-06, + "loss": 0.0427, + "num_input_tokens_seen": 1337472, + "step": 2720 + }, + { + "epoch": 0.35964101887290484, + "grad_norm": 114.59748840332031, + "learning_rate": 1.617088443531628e-06, + "loss": 0.158, + "num_input_tokens_seen": 1339712, + "step": 2725 + }, + { + "epoch": 0.3603009106506533, + "grad_norm": 0.12750740349292755, + "learning_rate": 1.6152741522276882e-06, + "loss": 0.0092, + "num_input_tokens_seen": 1342144, + "step": 2730 + }, + { + "epoch": 0.36096080242840173, + "grad_norm": 0.6062318682670593, + "learning_rate": 1.6134565960465425e-06, + "loss": 0.0433, + "num_input_tokens_seen": 1344512, + "step": 2735 + }, + { + "epoch": 0.3616206942061502, + "grad_norm": 0.28183653950691223, + "learning_rate": 1.6116357846328312e-06, + "loss": 0.1562, + "num_input_tokens_seen": 1346880, + "step": 2740 + }, + { + "epoch": 0.3622805859838986, + "grad_norm": 0.0915948897600174, + "learning_rate": 1.609811727648468e-06, + "loss": 0.0123, + "num_input_tokens_seen": 1349056, + "step": 2745 + }, + { + "epoch": 0.36294047776164706, + "grad_norm": 0.5089015960693359, + "learning_rate": 1.6079844347725882e-06, + "loss": 0.0425, + "num_input_tokens_seen": 1351488, + "step": 2750 + }, + { + "epoch": 0.36360036953939556, + "grad_norm": 0.19435492157936096, + "learning_rate": 1.6061539157014987e-06, + "loss": 0.0654, + "num_input_tokens_seen": 1353920, + "step": 2755 + }, + { + "epoch": 0.364260261317144, + "grad_norm": 0.4347739815711975, + "learning_rate": 1.6043201801486257e-06, + "loss": 0.2615, + "num_input_tokens_seen": 1356352, + "step": 2760 + }, + { + "epoch": 0.36492015309489245, + "grad_norm": 6.802909851074219, + "learning_rate": 1.6024832378444628e-06, + "loss": 0.1949, + "num_input_tokens_seen": 1359104, + "step": 2765 + }, + { + "epoch": 0.3655800448726409, + "grad_norm": 25.862701416015625, + "learning_rate": 1.6006430985365204e-06, + "loss": 0.3066, + "num_input_tokens_seen": 1361536, + "step": 2770 + }, + { + "epoch": 0.36623993665038934, + "grad_norm": 8.995551109313965, + "learning_rate": 1.5987997719892735e-06, + "loss": 0.2606, + "num_input_tokens_seen": 1364160, + "step": 2775 + }, + { + "epoch": 0.3668998284281378, + "grad_norm": 0.2326563000679016, + "learning_rate": 1.5969532679841088e-06, + "loss": 0.005, + "num_input_tokens_seen": 1366656, + "step": 2780 + }, + { + "epoch": 0.36755972020588623, + "grad_norm": 29.3525390625, + "learning_rate": 1.5951035963192752e-06, + "loss": 0.0512, + "num_input_tokens_seen": 1369216, + "step": 2785 + }, + { + "epoch": 0.3682196119836347, + "grad_norm": 3.3923957347869873, + "learning_rate": 1.593250766809829e-06, + "loss": 0.2619, + "num_input_tokens_seen": 1371712, + "step": 2790 + }, + { + "epoch": 0.3688795037613831, + "grad_norm": 47.703060150146484, + "learning_rate": 1.5913947892875842e-06, + "loss": 0.1739, + "num_input_tokens_seen": 1374080, + "step": 2795 + }, + { + "epoch": 0.36953939553913157, + "grad_norm": 0.36688122153282166, + "learning_rate": 1.589535673601059e-06, + "loss": 0.1383, + "num_input_tokens_seen": 1377024, + "step": 2800 + }, + { + "epoch": 0.37019928731688, + "grad_norm": 43.584991455078125, + "learning_rate": 1.587673429615424e-06, + "loss": 0.0587, + "num_input_tokens_seen": 1379392, + "step": 2805 + }, + { + "epoch": 0.37085917909462845, + "grad_norm": 0.4732750356197357, + "learning_rate": 1.5858080672124495e-06, + "loss": 0.1913, + "num_input_tokens_seen": 1381760, + "step": 2810 + }, + { + "epoch": 0.37151907087237696, + "grad_norm": 2.4631268978118896, + "learning_rate": 1.5839395962904536e-06, + "loss": 0.0931, + "num_input_tokens_seen": 1384128, + "step": 2815 + }, + { + "epoch": 0.3721789626501254, + "grad_norm": 0.13429832458496094, + "learning_rate": 1.5820680267642494e-06, + "loss": 0.0094, + "num_input_tokens_seen": 1386496, + "step": 2820 + }, + { + "epoch": 0.37283885442787384, + "grad_norm": 0.12962228059768677, + "learning_rate": 1.5801933685650917e-06, + "loss": 0.0489, + "num_input_tokens_seen": 1388736, + "step": 2825 + }, + { + "epoch": 0.3734987462056223, + "grad_norm": 88.37797546386719, + "learning_rate": 1.5783156316406259e-06, + "loss": 0.0478, + "num_input_tokens_seen": 1391040, + "step": 2830 + }, + { + "epoch": 0.37415863798337073, + "grad_norm": 115.88335418701172, + "learning_rate": 1.5764348259548334e-06, + "loss": 0.2375, + "num_input_tokens_seen": 1393344, + "step": 2835 + }, + { + "epoch": 0.3748185297611192, + "grad_norm": 76.65043640136719, + "learning_rate": 1.5745509614879806e-06, + "loss": 0.0726, + "num_input_tokens_seen": 1395648, + "step": 2840 + }, + { + "epoch": 0.3754784215388676, + "grad_norm": 0.021454842761158943, + "learning_rate": 1.572664048236564e-06, + "loss": 0.3055, + "num_input_tokens_seen": 1398272, + "step": 2845 + }, + { + "epoch": 0.37613831331661607, + "grad_norm": 0.13567005097866058, + "learning_rate": 1.570774096213259e-06, + "loss": 0.0405, + "num_input_tokens_seen": 1400576, + "step": 2850 + }, + { + "epoch": 0.3767982050943645, + "grad_norm": 0.033437322825193405, + "learning_rate": 1.5688811154468649e-06, + "loss": 0.0015, + "num_input_tokens_seen": 1403136, + "step": 2855 + }, + { + "epoch": 0.37745809687211296, + "grad_norm": 0.10280902683734894, + "learning_rate": 1.5669851159822532e-06, + "loss": 0.1948, + "num_input_tokens_seen": 1405504, + "step": 2860 + }, + { + "epoch": 0.3781179886498614, + "grad_norm": 102.37528991699219, + "learning_rate": 1.5650861078803137e-06, + "loss": 0.1405, + "num_input_tokens_seen": 1407808, + "step": 2865 + }, + { + "epoch": 0.37877788042760985, + "grad_norm": 25.63332748413086, + "learning_rate": 1.5631841012179013e-06, + "loss": 0.0803, + "num_input_tokens_seen": 1410304, + "step": 2870 + }, + { + "epoch": 0.37943777220535835, + "grad_norm": 0.2513096034526825, + "learning_rate": 1.5612791060877818e-06, + "loss": 0.0026, + "num_input_tokens_seen": 1412736, + "step": 2875 + }, + { + "epoch": 0.3800976639831068, + "grad_norm": 103.188232421875, + "learning_rate": 1.5593711325985801e-06, + "loss": 0.0403, + "num_input_tokens_seen": 1415488, + "step": 2880 + }, + { + "epoch": 0.38075755576085524, + "grad_norm": 0.05830248445272446, + "learning_rate": 1.5574601908747245e-06, + "loss": 0.213, + "num_input_tokens_seen": 1417856, + "step": 2885 + }, + { + "epoch": 0.3814174475386037, + "grad_norm": 0.040386002510786057, + "learning_rate": 1.5555462910563936e-06, + "loss": 0.077, + "num_input_tokens_seen": 1420096, + "step": 2890 + }, + { + "epoch": 0.3820773393163521, + "grad_norm": 21.231006622314453, + "learning_rate": 1.5536294432994636e-06, + "loss": 0.2334, + "num_input_tokens_seen": 1422656, + "step": 2895 + }, + { + "epoch": 0.38273723109410057, + "grad_norm": 2.1260502338409424, + "learning_rate": 1.5517096577754528e-06, + "loss": 0.0744, + "num_input_tokens_seen": 1425152, + "step": 2900 + }, + { + "epoch": 0.383397122871849, + "grad_norm": 0.10484765470027924, + "learning_rate": 1.5497869446714695e-06, + "loss": 0.0393, + "num_input_tokens_seen": 1427840, + "step": 2905 + }, + { + "epoch": 0.38405701464959746, + "grad_norm": 0.09525975584983826, + "learning_rate": 1.5478613141901558e-06, + "loss": 0.0065, + "num_input_tokens_seen": 1430144, + "step": 2910 + }, + { + "epoch": 0.3847169064273459, + "grad_norm": 0.13482730090618134, + "learning_rate": 1.5459327765496348e-06, + "loss": 0.1329, + "num_input_tokens_seen": 1432448, + "step": 2915 + }, + { + "epoch": 0.38537679820509435, + "grad_norm": 0.25041621923446655, + "learning_rate": 1.5440013419834563e-06, + "loss": 0.0276, + "num_input_tokens_seen": 1434752, + "step": 2920 + }, + { + "epoch": 0.3860366899828428, + "grad_norm": 0.17661698162555695, + "learning_rate": 1.5420670207405419e-06, + "loss": 0.0011, + "num_input_tokens_seen": 1437184, + "step": 2925 + }, + { + "epoch": 0.38669658176059124, + "grad_norm": 0.07189780473709106, + "learning_rate": 1.5401298230851314e-06, + "loss": 0.0935, + "num_input_tokens_seen": 1440000, + "step": 2930 + }, + { + "epoch": 0.3873564735383397, + "grad_norm": 62.480587005615234, + "learning_rate": 1.5381897592967275e-06, + "loss": 0.0716, + "num_input_tokens_seen": 1442624, + "step": 2935 + }, + { + "epoch": 0.3880163653160882, + "grad_norm": 0.13392320275306702, + "learning_rate": 1.5362468396700426e-06, + "loss": 0.0019, + "num_input_tokens_seen": 1445184, + "step": 2940 + }, + { + "epoch": 0.38867625709383663, + "grad_norm": 5.734695911407471, + "learning_rate": 1.5343010745149418e-06, + "loss": 0.2755, + "num_input_tokens_seen": 1447616, + "step": 2945 + }, + { + "epoch": 0.3893361488715851, + "grad_norm": 0.01573280617594719, + "learning_rate": 1.532352474156391e-06, + "loss": 0.0004, + "num_input_tokens_seen": 1450176, + "step": 2950 + }, + { + "epoch": 0.3899960406493335, + "grad_norm": 79.7118148803711, + "learning_rate": 1.5304010489343995e-06, + "loss": 0.5725, + "num_input_tokens_seen": 1452672, + "step": 2955 + }, + { + "epoch": 0.39065593242708196, + "grad_norm": 0.11838354915380478, + "learning_rate": 1.528446809203968e-06, + "loss": 0.2012, + "num_input_tokens_seen": 1455232, + "step": 2960 + }, + { + "epoch": 0.3913158242048304, + "grad_norm": 65.51634216308594, + "learning_rate": 1.526489765335031e-06, + "loss": 0.1031, + "num_input_tokens_seen": 1457792, + "step": 2965 + }, + { + "epoch": 0.39197571598257885, + "grad_norm": 0.2883387804031372, + "learning_rate": 1.5245299277124026e-06, + "loss": 0.1237, + "num_input_tokens_seen": 1460160, + "step": 2970 + }, + { + "epoch": 0.3926356077603273, + "grad_norm": 0.13738037645816803, + "learning_rate": 1.5225673067357218e-06, + "loss": 0.1705, + "num_input_tokens_seen": 1462400, + "step": 2975 + }, + { + "epoch": 0.39329549953807574, + "grad_norm": 9.973140716552734, + "learning_rate": 1.5206019128193981e-06, + "loss": 0.1399, + "num_input_tokens_seen": 1465088, + "step": 2980 + }, + { + "epoch": 0.3939553913158242, + "grad_norm": 0.1793886423110962, + "learning_rate": 1.5186337563925538e-06, + "loss": 0.167, + "num_input_tokens_seen": 1467456, + "step": 2985 + }, + { + "epoch": 0.39461528309357263, + "grad_norm": 0.18464945256710052, + "learning_rate": 1.516662847898971e-06, + "loss": 0.001, + "num_input_tokens_seen": 1470016, + "step": 2990 + }, + { + "epoch": 0.3952751748713211, + "grad_norm": 0.3655398190021515, + "learning_rate": 1.5146891977970349e-06, + "loss": 0.0936, + "num_input_tokens_seen": 1472448, + "step": 2995 + }, + { + "epoch": 0.3959350666490696, + "grad_norm": 0.48678961396217346, + "learning_rate": 1.5127128165596794e-06, + "loss": 0.0271, + "num_input_tokens_seen": 1475072, + "step": 3000 + }, + { + "epoch": 0.396594958426818, + "grad_norm": 0.7548299431800842, + "learning_rate": 1.51073371467433e-06, + "loss": 0.0571, + "num_input_tokens_seen": 1477440, + "step": 3005 + }, + { + "epoch": 0.39725485020456647, + "grad_norm": 1.1893014907836914, + "learning_rate": 1.5087519026428498e-06, + "loss": 0.027, + "num_input_tokens_seen": 1479872, + "step": 3010 + }, + { + "epoch": 0.3979147419823149, + "grad_norm": 24.348011016845703, + "learning_rate": 1.5067673909814818e-06, + "loss": 0.2218, + "num_input_tokens_seen": 1481920, + "step": 3015 + }, + { + "epoch": 0.39857463376006336, + "grad_norm": 0.06322956830263138, + "learning_rate": 1.5047801902207953e-06, + "loss": 0.1557, + "num_input_tokens_seen": 1484992, + "step": 3020 + }, + { + "epoch": 0.3992345255378118, + "grad_norm": 0.24212270975112915, + "learning_rate": 1.5027903109056288e-06, + "loss": 0.2134, + "num_input_tokens_seen": 1487232, + "step": 3025 + }, + { + "epoch": 0.39989441731556025, + "grad_norm": 38.114532470703125, + "learning_rate": 1.5007977635950336e-06, + "loss": 0.1412, + "num_input_tokens_seen": 1489728, + "step": 3030 + }, + { + "epoch": 0.4001583740266596, + "eval_loss": 0.13093648850917816, + "eval_runtime": 7.9673, + "eval_samples_per_second": 845.332, + "eval_steps_per_second": 105.682, + "num_input_tokens_seen": 1490688, + "step": 3032 + }, + { + "epoch": 0.4005543090933087, + "grad_norm": 190.9660186767578, + "learning_rate": 1.498802558862219e-06, + "loss": 0.2057, + "num_input_tokens_seen": 1491968, + "step": 3035 + }, + { + "epoch": 0.40121420087105714, + "grad_norm": 0.09837495535612106, + "learning_rate": 1.496804707294496e-06, + "loss": 0.1003, + "num_input_tokens_seen": 1494336, + "step": 3040 + }, + { + "epoch": 0.4018740926488056, + "grad_norm": 0.6492270827293396, + "learning_rate": 1.4948042194932195e-06, + "loss": 0.065, + "num_input_tokens_seen": 1497472, + "step": 3045 + }, + { + "epoch": 0.402533984426554, + "grad_norm": 0.34846293926239014, + "learning_rate": 1.4928011060737341e-06, + "loss": 0.0242, + "num_input_tokens_seen": 1499968, + "step": 3050 + }, + { + "epoch": 0.40319387620430247, + "grad_norm": 0.09735693782567978, + "learning_rate": 1.4907953776653171e-06, + "loss": 0.0811, + "num_input_tokens_seen": 1502336, + "step": 3055 + }, + { + "epoch": 0.40385376798205097, + "grad_norm": 21.974517822265625, + "learning_rate": 1.4887870449111206e-06, + "loss": 0.1462, + "num_input_tokens_seen": 1504576, + "step": 3060 + }, + { + "epoch": 0.4045136597597994, + "grad_norm": 85.91175079345703, + "learning_rate": 1.486776118468118e-06, + "loss": 0.2155, + "num_input_tokens_seen": 1507136, + "step": 3065 + }, + { + "epoch": 0.40517355153754786, + "grad_norm": 0.19757795333862305, + "learning_rate": 1.4847626090070451e-06, + "loss": 0.0479, + "num_input_tokens_seen": 1509696, + "step": 3070 + }, + { + "epoch": 0.4058334433152963, + "grad_norm": 0.6578057408332825, + "learning_rate": 1.4827465272123439e-06, + "loss": 0.3045, + "num_input_tokens_seen": 1512192, + "step": 3075 + }, + { + "epoch": 0.40649333509304475, + "grad_norm": 0.17303939163684845, + "learning_rate": 1.4807278837821063e-06, + "loss": 0.0134, + "num_input_tokens_seen": 1514752, + "step": 3080 + }, + { + "epoch": 0.4071532268707932, + "grad_norm": 14.41674518585205, + "learning_rate": 1.4787066894280178e-06, + "loss": 0.3, + "num_input_tokens_seen": 1517440, + "step": 3085 + }, + { + "epoch": 0.40781311864854164, + "grad_norm": 0.12199345231056213, + "learning_rate": 1.476682954875299e-06, + "loss": 0.0679, + "num_input_tokens_seen": 1519744, + "step": 3090 + }, + { + "epoch": 0.4084730104262901, + "grad_norm": 29.185821533203125, + "learning_rate": 1.4746566908626506e-06, + "loss": 0.1745, + "num_input_tokens_seen": 1522176, + "step": 3095 + }, + { + "epoch": 0.40913290220403853, + "grad_norm": 1.1170824766159058, + "learning_rate": 1.4726279081421956e-06, + "loss": 0.0519, + "num_input_tokens_seen": 1524352, + "step": 3100 + }, + { + "epoch": 0.409792793981787, + "grad_norm": 35.82356643676758, + "learning_rate": 1.4705966174794216e-06, + "loss": 0.2616, + "num_input_tokens_seen": 1526976, + "step": 3105 + }, + { + "epoch": 0.4104526857595354, + "grad_norm": 0.1983165442943573, + "learning_rate": 1.4685628296531248e-06, + "loss": 0.1047, + "num_input_tokens_seen": 1529152, + "step": 3110 + }, + { + "epoch": 0.41111257753728386, + "grad_norm": 0.7452152371406555, + "learning_rate": 1.466526555455352e-06, + "loss": 0.0288, + "num_input_tokens_seen": 1531648, + "step": 3115 + }, + { + "epoch": 0.4117724693150323, + "grad_norm": 0.30635786056518555, + "learning_rate": 1.4644878056913432e-06, + "loss": 0.0023, + "num_input_tokens_seen": 1533952, + "step": 3120 + }, + { + "epoch": 0.4124323610927808, + "grad_norm": 74.26456451416016, + "learning_rate": 1.4624465911794764e-06, + "loss": 0.165, + "num_input_tokens_seen": 1536640, + "step": 3125 + }, + { + "epoch": 0.41309225287052925, + "grad_norm": 0.07176000624895096, + "learning_rate": 1.4604029227512062e-06, + "loss": 0.0024, + "num_input_tokens_seen": 1539200, + "step": 3130 + }, + { + "epoch": 0.4137521446482777, + "grad_norm": 0.4018791615962982, + "learning_rate": 1.4583568112510108e-06, + "loss": 0.1984, + "num_input_tokens_seen": 1541632, + "step": 3135 + }, + { + "epoch": 0.41441203642602614, + "grad_norm": 15.011775016784668, + "learning_rate": 1.4563082675363302e-06, + "loss": 0.0697, + "num_input_tokens_seen": 1544128, + "step": 3140 + }, + { + "epoch": 0.4150719282037746, + "grad_norm": 0.17546619474887848, + "learning_rate": 1.4542573024775122e-06, + "loss": 0.0009, + "num_input_tokens_seen": 1546368, + "step": 3145 + }, + { + "epoch": 0.41573181998152303, + "grad_norm": 2.7632203102111816, + "learning_rate": 1.4522039269577521e-06, + "loss": 0.3214, + "num_input_tokens_seen": 1548736, + "step": 3150 + }, + { + "epoch": 0.4163917117592715, + "grad_norm": 0.050859030336141586, + "learning_rate": 1.4501481518730372e-06, + "loss": 0.223, + "num_input_tokens_seen": 1551168, + "step": 3155 + }, + { + "epoch": 0.4170516035370199, + "grad_norm": 0.2458106428384781, + "learning_rate": 1.4480899881320868e-06, + "loss": 0.0751, + "num_input_tokens_seen": 1553664, + "step": 3160 + }, + { + "epoch": 0.41771149531476837, + "grad_norm": 129.09617614746094, + "learning_rate": 1.4460294466562956e-06, + "loss": 0.1681, + "num_input_tokens_seen": 1555968, + "step": 3165 + }, + { + "epoch": 0.4183713870925168, + "grad_norm": 0.13649986684322357, + "learning_rate": 1.4439665383796756e-06, + "loss": 0.0974, + "num_input_tokens_seen": 1558208, + "step": 3170 + }, + { + "epoch": 0.41903127887026526, + "grad_norm": 1.2176202535629272, + "learning_rate": 1.4419012742487972e-06, + "loss": 0.003, + "num_input_tokens_seen": 1560640, + "step": 3175 + }, + { + "epoch": 0.4196911706480137, + "grad_norm": 0.7410973310470581, + "learning_rate": 1.4398336652227335e-06, + "loss": 0.0019, + "num_input_tokens_seen": 1563328, + "step": 3180 + }, + { + "epoch": 0.4203510624257622, + "grad_norm": 0.07748635113239288, + "learning_rate": 1.4377637222729986e-06, + "loss": 0.1522, + "num_input_tokens_seen": 1565696, + "step": 3185 + }, + { + "epoch": 0.42101095420351065, + "grad_norm": 0.073076032102108, + "learning_rate": 1.435691456383493e-06, + "loss": 0.1285, + "num_input_tokens_seen": 1568640, + "step": 3190 + }, + { + "epoch": 0.4216708459812591, + "grad_norm": 0.4473647475242615, + "learning_rate": 1.433616878550442e-06, + "loss": 0.128, + "num_input_tokens_seen": 1571328, + "step": 3195 + }, + { + "epoch": 0.42233073775900754, + "grad_norm": 17.642181396484375, + "learning_rate": 1.4315399997823403e-06, + "loss": 0.3784, + "num_input_tokens_seen": 1574016, + "step": 3200 + }, + { + "epoch": 0.422990629536756, + "grad_norm": 14.036954879760742, + "learning_rate": 1.429460831099891e-06, + "loss": 0.2654, + "num_input_tokens_seen": 1576384, + "step": 3205 + }, + { + "epoch": 0.4236505213145044, + "grad_norm": 0.1135653704404831, + "learning_rate": 1.4273793835359492e-06, + "loss": 0.2098, + "num_input_tokens_seen": 1579200, + "step": 3210 + }, + { + "epoch": 0.42431041309225287, + "grad_norm": 34.17720413208008, + "learning_rate": 1.4252956681354631e-06, + "loss": 0.1142, + "num_input_tokens_seen": 1581632, + "step": 3215 + }, + { + "epoch": 0.4249703048700013, + "grad_norm": 0.9577163457870483, + "learning_rate": 1.4232096959554135e-06, + "loss": 0.0092, + "num_input_tokens_seen": 1584064, + "step": 3220 + }, + { + "epoch": 0.42563019664774976, + "grad_norm": 43.000099182128906, + "learning_rate": 1.4211214780647572e-06, + "loss": 0.0457, + "num_input_tokens_seen": 1586752, + "step": 3225 + }, + { + "epoch": 0.4262900884254982, + "grad_norm": 12.291510581970215, + "learning_rate": 1.4190310255443676e-06, + "loss": 0.0764, + "num_input_tokens_seen": 1589248, + "step": 3230 + }, + { + "epoch": 0.42694998020324665, + "grad_norm": 0.037998050451278687, + "learning_rate": 1.4169383494869764e-06, + "loss": 0.0141, + "num_input_tokens_seen": 1591552, + "step": 3235 + }, + { + "epoch": 0.4276098719809951, + "grad_norm": 19.27412223815918, + "learning_rate": 1.414843460997113e-06, + "loss": 0.051, + "num_input_tokens_seen": 1594048, + "step": 3240 + }, + { + "epoch": 0.4282697637587436, + "grad_norm": 3.373072385787964, + "learning_rate": 1.4127463711910483e-06, + "loss": 0.1432, + "num_input_tokens_seen": 1596544, + "step": 3245 + }, + { + "epoch": 0.42892965553649204, + "grad_norm": 1.571363925933838, + "learning_rate": 1.410647091196733e-06, + "loss": 0.1601, + "num_input_tokens_seen": 1599104, + "step": 3250 + }, + { + "epoch": 0.4295895473142405, + "grad_norm": 0.016967564821243286, + "learning_rate": 1.4085456321537402e-06, + "loss": 0.1324, + "num_input_tokens_seen": 1601344, + "step": 3255 + }, + { + "epoch": 0.43024943909198893, + "grad_norm": 12.01763916015625, + "learning_rate": 1.4064420052132056e-06, + "loss": 0.2152, + "num_input_tokens_seen": 1603968, + "step": 3260 + }, + { + "epoch": 0.4309093308697374, + "grad_norm": 43.05500030517578, + "learning_rate": 1.4043362215377696e-06, + "loss": 0.0317, + "num_input_tokens_seen": 1606400, + "step": 3265 + }, + { + "epoch": 0.4315692226474858, + "grad_norm": 0.42787039279937744, + "learning_rate": 1.4022282923015158e-06, + "loss": 0.1258, + "num_input_tokens_seen": 1608960, + "step": 3270 + }, + { + "epoch": 0.43222911442523426, + "grad_norm": 0.7687868475914001, + "learning_rate": 1.4001182286899136e-06, + "loss": 0.0026, + "num_input_tokens_seen": 1611456, + "step": 3275 + }, + { + "epoch": 0.4328890062029827, + "grad_norm": 0.07358451187610626, + "learning_rate": 1.398006041899758e-06, + "loss": 0.0702, + "num_input_tokens_seen": 1613952, + "step": 3280 + }, + { + "epoch": 0.43354889798073115, + "grad_norm": 23.080883026123047, + "learning_rate": 1.3958917431391102e-06, + "loss": 0.1748, + "num_input_tokens_seen": 1616320, + "step": 3285 + }, + { + "epoch": 0.4342087897584796, + "grad_norm": 0.1040918156504631, + "learning_rate": 1.3937753436272388e-06, + "loss": 0.1856, + "num_input_tokens_seen": 1619136, + "step": 3290 + }, + { + "epoch": 0.43486868153622804, + "grad_norm": 174.55502319335938, + "learning_rate": 1.3916568545945597e-06, + "loss": 0.118, + "num_input_tokens_seen": 1621632, + "step": 3295 + }, + { + "epoch": 0.4355285733139765, + "grad_norm": 0.32156044244766235, + "learning_rate": 1.3895362872825764e-06, + "loss": 0.1392, + "num_input_tokens_seen": 1624064, + "step": 3300 + }, + { + "epoch": 0.43618846509172493, + "grad_norm": 0.5658749938011169, + "learning_rate": 1.3874136529438205e-06, + "loss": 0.0494, + "num_input_tokens_seen": 1626496, + "step": 3305 + }, + { + "epoch": 0.43684835686947343, + "grad_norm": 14.565958023071289, + "learning_rate": 1.3852889628417918e-06, + "loss": 0.1045, + "num_input_tokens_seen": 1628800, + "step": 3310 + }, + { + "epoch": 0.4375082486472219, + "grad_norm": 1.4210195541381836, + "learning_rate": 1.3831622282508994e-06, + "loss": 0.104, + "num_input_tokens_seen": 1631232, + "step": 3315 + }, + { + "epoch": 0.4381681404249703, + "grad_norm": 0.14714202284812927, + "learning_rate": 1.3810334604564007e-06, + "loss": 0.0011, + "num_input_tokens_seen": 1633728, + "step": 3320 + }, + { + "epoch": 0.43882803220271877, + "grad_norm": 0.5814191102981567, + "learning_rate": 1.3789026707543423e-06, + "loss": 0.0735, + "num_input_tokens_seen": 1636224, + "step": 3325 + }, + { + "epoch": 0.4394879239804672, + "grad_norm": 0.12930363416671753, + "learning_rate": 1.3767698704514998e-06, + "loss": 0.063, + "num_input_tokens_seen": 1638272, + "step": 3330 + }, + { + "epoch": 0.44014781575821565, + "grad_norm": 0.01950267143547535, + "learning_rate": 1.3746350708653175e-06, + "loss": 0.1941, + "num_input_tokens_seen": 1640512, + "step": 3335 + }, + { + "epoch": 0.4408077075359641, + "grad_norm": 30.412141799926758, + "learning_rate": 1.3724982833238495e-06, + "loss": 0.2224, + "num_input_tokens_seen": 1642944, + "step": 3340 + }, + { + "epoch": 0.44146759931371254, + "grad_norm": 0.06361498683691025, + "learning_rate": 1.370359519165697e-06, + "loss": 0.1334, + "num_input_tokens_seen": 1645376, + "step": 3345 + }, + { + "epoch": 0.442127491091461, + "grad_norm": 120.06082916259766, + "learning_rate": 1.368218789739952e-06, + "loss": 0.0429, + "num_input_tokens_seen": 1647936, + "step": 3350 + }, + { + "epoch": 0.44278738286920943, + "grad_norm": 0.1117718368768692, + "learning_rate": 1.3660761064061337e-06, + "loss": 0.1404, + "num_input_tokens_seen": 1650496, + "step": 3355 + }, + { + "epoch": 0.4434472746469579, + "grad_norm": 0.049969542771577835, + "learning_rate": 1.3639314805341297e-06, + "loss": 0.1065, + "num_input_tokens_seen": 1652992, + "step": 3360 + }, + { + "epoch": 0.4441071664247063, + "grad_norm": 66.16351318359375, + "learning_rate": 1.3617849235041355e-06, + "loss": 0.0935, + "num_input_tokens_seen": 1655488, + "step": 3365 + }, + { + "epoch": 0.4447670582024548, + "grad_norm": 0.091923289000988, + "learning_rate": 1.3596364467065938e-06, + "loss": 0.1084, + "num_input_tokens_seen": 1657984, + "step": 3370 + }, + { + "epoch": 0.44542694998020327, + "grad_norm": 31.401330947875977, + "learning_rate": 1.3574860615421346e-06, + "loss": 0.2514, + "num_input_tokens_seen": 1660736, + "step": 3375 + }, + { + "epoch": 0.4460868417579517, + "grad_norm": 14.01511287689209, + "learning_rate": 1.3553337794215147e-06, + "loss": 0.1354, + "num_input_tokens_seen": 1663104, + "step": 3380 + }, + { + "epoch": 0.44674673353570016, + "grad_norm": 32.54231262207031, + "learning_rate": 1.3531796117655565e-06, + "loss": 0.1002, + "num_input_tokens_seen": 1665344, + "step": 3385 + }, + { + "epoch": 0.4474066253134486, + "grad_norm": 123.50605773925781, + "learning_rate": 1.3510235700050873e-06, + "loss": 0.156, + "num_input_tokens_seen": 1668096, + "step": 3390 + }, + { + "epoch": 0.44806651709119705, + "grad_norm": 14.50474739074707, + "learning_rate": 1.3488656655808801e-06, + "loss": 0.0959, + "num_input_tokens_seen": 1670272, + "step": 3395 + }, + { + "epoch": 0.4487264088689455, + "grad_norm": 33.239410400390625, + "learning_rate": 1.3467059099435912e-06, + "loss": 0.0913, + "num_input_tokens_seen": 1672448, + "step": 3400 + }, + { + "epoch": 0.44938630064669394, + "grad_norm": 0.29679805040359497, + "learning_rate": 1.3445443145537002e-06, + "loss": 0.0055, + "num_input_tokens_seen": 1675200, + "step": 3405 + }, + { + "epoch": 0.4500461924244424, + "grad_norm": 3.9020371437072754, + "learning_rate": 1.3423808908814494e-06, + "loss": 0.0509, + "num_input_tokens_seen": 1677696, + "step": 3410 + }, + { + "epoch": 0.45017817077999206, + "eval_loss": 0.11581598222255707, + "eval_runtime": 7.8583, + "eval_samples_per_second": 857.06, + "eval_steps_per_second": 107.148, + "num_input_tokens_seen": 1678208, + "step": 3411 + }, + { + "epoch": 0.4507060842021908, + "grad_norm": 14.313544273376465, + "learning_rate": 1.3402156504067826e-06, + "loss": 0.0982, + "num_input_tokens_seen": 1680256, + "step": 3415 + }, + { + "epoch": 0.45136597597993927, + "grad_norm": 0.17114846408367157, + "learning_rate": 1.338048604619284e-06, + "loss": 0.0816, + "num_input_tokens_seen": 1682624, + "step": 3420 + }, + { + "epoch": 0.4520258677576877, + "grad_norm": 68.34577178955078, + "learning_rate": 1.3358797650181178e-06, + "loss": 0.0548, + "num_input_tokens_seen": 1685056, + "step": 3425 + }, + { + "epoch": 0.45268575953543616, + "grad_norm": 168.3812713623047, + "learning_rate": 1.3337091431119662e-06, + "loss": 0.1743, + "num_input_tokens_seen": 1687168, + "step": 3430 + }, + { + "epoch": 0.45334565131318466, + "grad_norm": 292.0270690917969, + "learning_rate": 1.3315367504189698e-06, + "loss": 0.263, + "num_input_tokens_seen": 1689216, + "step": 3435 + }, + { + "epoch": 0.4540055430909331, + "grad_norm": 87.19351959228516, + "learning_rate": 1.3293625984666656e-06, + "loss": 0.0704, + "num_input_tokens_seen": 1691776, + "step": 3440 + }, + { + "epoch": 0.45466543486868155, + "grad_norm": 0.12149941176176071, + "learning_rate": 1.3271866987919254e-06, + "loss": 0.0008, + "num_input_tokens_seen": 1694336, + "step": 3445 + }, + { + "epoch": 0.45532532664643, + "grad_norm": 0.1733410805463791, + "learning_rate": 1.325009062940895e-06, + "loss": 0.2066, + "num_input_tokens_seen": 1696640, + "step": 3450 + }, + { + "epoch": 0.45598521842417844, + "grad_norm": 16.03499984741211, + "learning_rate": 1.3228297024689336e-06, + "loss": 0.0826, + "num_input_tokens_seen": 1698880, + "step": 3455 + }, + { + "epoch": 0.4566451102019269, + "grad_norm": 2.5192947387695312, + "learning_rate": 1.3206486289405519e-06, + "loss": 0.1221, + "num_input_tokens_seen": 1701312, + "step": 3460 + }, + { + "epoch": 0.45730500197967533, + "grad_norm": 51.37282180786133, + "learning_rate": 1.3184658539293496e-06, + "loss": 0.1446, + "num_input_tokens_seen": 1703808, + "step": 3465 + }, + { + "epoch": 0.4579648937574238, + "grad_norm": 142.88600158691406, + "learning_rate": 1.3162813890179564e-06, + "loss": 0.132, + "num_input_tokens_seen": 1706304, + "step": 3470 + }, + { + "epoch": 0.4586247855351722, + "grad_norm": 13.749252319335938, + "learning_rate": 1.314095245797969e-06, + "loss": 0.236, + "num_input_tokens_seen": 1708736, + "step": 3475 + }, + { + "epoch": 0.45928467731292066, + "grad_norm": 0.7829024791717529, + "learning_rate": 1.3119074358698891e-06, + "loss": 0.1477, + "num_input_tokens_seen": 1711232, + "step": 3480 + }, + { + "epoch": 0.4599445690906691, + "grad_norm": 1.0132334232330322, + "learning_rate": 1.3097179708430634e-06, + "loss": 0.003, + "num_input_tokens_seen": 1713600, + "step": 3485 + }, + { + "epoch": 0.46060446086841755, + "grad_norm": 0.1129785031080246, + "learning_rate": 1.3075268623356214e-06, + "loss": 0.1998, + "num_input_tokens_seen": 1716224, + "step": 3490 + }, + { + "epoch": 0.46126435264616605, + "grad_norm": 41.71617889404297, + "learning_rate": 1.305334121974412e-06, + "loss": 0.1462, + "num_input_tokens_seen": 1718720, + "step": 3495 + }, + { + "epoch": 0.4619242444239145, + "grad_norm": 30.289953231811523, + "learning_rate": 1.3031397613949448e-06, + "loss": 0.0858, + "num_input_tokens_seen": 1721280, + "step": 3500 + }, + { + "epoch": 0.46258413620166294, + "grad_norm": 70.03472137451172, + "learning_rate": 1.3009437922413266e-06, + "loss": 0.1099, + "num_input_tokens_seen": 1723712, + "step": 3505 + }, + { + "epoch": 0.4632440279794114, + "grad_norm": 112.14954376220703, + "learning_rate": 1.2987462261661994e-06, + "loss": 0.1115, + "num_input_tokens_seen": 1725952, + "step": 3510 + }, + { + "epoch": 0.46390391975715983, + "grad_norm": 0.32890069484710693, + "learning_rate": 1.2965470748306798e-06, + "loss": 0.0017, + "num_input_tokens_seen": 1728512, + "step": 3515 + }, + { + "epoch": 0.4645638115349083, + "grad_norm": 69.49401092529297, + "learning_rate": 1.2943463499042957e-06, + "loss": 0.1338, + "num_input_tokens_seen": 1731008, + "step": 3520 + }, + { + "epoch": 0.4652237033126567, + "grad_norm": 1.0032602548599243, + "learning_rate": 1.2921440630649257e-06, + "loss": 0.0485, + "num_input_tokens_seen": 1733696, + "step": 3525 + }, + { + "epoch": 0.46588359509040517, + "grad_norm": 221.371826171875, + "learning_rate": 1.2899402259987355e-06, + "loss": 0.1013, + "num_input_tokens_seen": 1736256, + "step": 3530 + }, + { + "epoch": 0.4665434868681536, + "grad_norm": 0.41186392307281494, + "learning_rate": 1.287734850400118e-06, + "loss": 0.2473, + "num_input_tokens_seen": 1738944, + "step": 3535 + }, + { + "epoch": 0.46720337864590206, + "grad_norm": 16.863187789916992, + "learning_rate": 1.2855279479716297e-06, + "loss": 0.3237, + "num_input_tokens_seen": 1741568, + "step": 3540 + }, + { + "epoch": 0.4678632704236505, + "grad_norm": 0.3010137379169464, + "learning_rate": 1.283319530423929e-06, + "loss": 0.0027, + "num_input_tokens_seen": 1743808, + "step": 3545 + }, + { + "epoch": 0.46852316220139895, + "grad_norm": 0.09695116430521011, + "learning_rate": 1.2811096094757144e-06, + "loss": 0.0016, + "num_input_tokens_seen": 1746176, + "step": 3550 + }, + { + "epoch": 0.46918305397914745, + "grad_norm": 0.07640713453292847, + "learning_rate": 1.2788981968536612e-06, + "loss": 0.2019, + "num_input_tokens_seen": 1748608, + "step": 3555 + }, + { + "epoch": 0.4698429457568959, + "grad_norm": 0.21313799917697906, + "learning_rate": 1.2766853042923607e-06, + "loss": 0.1542, + "num_input_tokens_seen": 1751040, + "step": 3560 + }, + { + "epoch": 0.47050283753464434, + "grad_norm": 0.6278545260429382, + "learning_rate": 1.2744709435342573e-06, + "loss": 0.0623, + "num_input_tokens_seen": 1753280, + "step": 3565 + }, + { + "epoch": 0.4711627293123928, + "grad_norm": 14.035211563110352, + "learning_rate": 1.2722551263295864e-06, + "loss": 0.2919, + "num_input_tokens_seen": 1755712, + "step": 3570 + }, + { + "epoch": 0.4718226210901412, + "grad_norm": 41.04814910888672, + "learning_rate": 1.2700378644363114e-06, + "loss": 0.1294, + "num_input_tokens_seen": 1757952, + "step": 3575 + }, + { + "epoch": 0.47248251286788967, + "grad_norm": 29.484533309936523, + "learning_rate": 1.2678191696200621e-06, + "loss": 0.0883, + "num_input_tokens_seen": 1760384, + "step": 3580 + }, + { + "epoch": 0.4731424046456381, + "grad_norm": 0.2581002712249756, + "learning_rate": 1.2655990536540717e-06, + "loss": 0.0025, + "num_input_tokens_seen": 1762944, + "step": 3585 + }, + { + "epoch": 0.47380229642338656, + "grad_norm": 33.701026916503906, + "learning_rate": 1.2633775283191144e-06, + "loss": 0.2308, + "num_input_tokens_seen": 1765504, + "step": 3590 + }, + { + "epoch": 0.474462188201135, + "grad_norm": 0.5347998738288879, + "learning_rate": 1.2611546054034436e-06, + "loss": 0.0084, + "num_input_tokens_seen": 1768128, + "step": 3595 + }, + { + "epoch": 0.47512207997888345, + "grad_norm": 0.7026123404502869, + "learning_rate": 1.2589302967027285e-06, + "loss": 0.1521, + "num_input_tokens_seen": 1770624, + "step": 3600 + }, + { + "epoch": 0.4757819717566319, + "grad_norm": 17.028770446777344, + "learning_rate": 1.2567046140199914e-06, + "loss": 0.3261, + "num_input_tokens_seen": 1773248, + "step": 3605 + }, + { + "epoch": 0.47644186353438034, + "grad_norm": 0.5768800377845764, + "learning_rate": 1.2544775691655463e-06, + "loss": 0.1219, + "num_input_tokens_seen": 1775488, + "step": 3610 + }, + { + "epoch": 0.4771017553121288, + "grad_norm": 0.33122268319129944, + "learning_rate": 1.2522491739569346e-06, + "loss": 0.138, + "num_input_tokens_seen": 1777792, + "step": 3615 + }, + { + "epoch": 0.4777616470898773, + "grad_norm": 3.622959852218628, + "learning_rate": 1.250019440218864e-06, + "loss": 0.1041, + "num_input_tokens_seen": 1780352, + "step": 3620 + }, + { + "epoch": 0.47842153886762573, + "grad_norm": 0.5977795124053955, + "learning_rate": 1.247788379783144e-06, + "loss": 0.1707, + "num_input_tokens_seen": 1783168, + "step": 3625 + }, + { + "epoch": 0.4790814306453742, + "grad_norm": 30.13225555419922, + "learning_rate": 1.2455560044886248e-06, + "loss": 0.0886, + "num_input_tokens_seen": 1785920, + "step": 3630 + }, + { + "epoch": 0.4797413224231226, + "grad_norm": 0.14322948455810547, + "learning_rate": 1.2433223261811337e-06, + "loss": 0.1456, + "num_input_tokens_seen": 1788416, + "step": 3635 + }, + { + "epoch": 0.48040121420087106, + "grad_norm": 0.2782398462295532, + "learning_rate": 1.2410873567134115e-06, + "loss": 0.0141, + "num_input_tokens_seen": 1790848, + "step": 3640 + }, + { + "epoch": 0.4810611059786195, + "grad_norm": 10.446566581726074, + "learning_rate": 1.238851107945051e-06, + "loss": 0.0342, + "num_input_tokens_seen": 1793280, + "step": 3645 + }, + { + "epoch": 0.48172099775636795, + "grad_norm": 0.0587058961391449, + "learning_rate": 1.2366135917424341e-06, + "loss": 0.1088, + "num_input_tokens_seen": 1795648, + "step": 3650 + }, + { + "epoch": 0.4823808895341164, + "grad_norm": 18.86115264892578, + "learning_rate": 1.2343748199786665e-06, + "loss": 0.1796, + "num_input_tokens_seen": 1797952, + "step": 3655 + }, + { + "epoch": 0.48304078131186484, + "grad_norm": 0.4261041283607483, + "learning_rate": 1.2321348045335182e-06, + "loss": 0.0595, + "num_input_tokens_seen": 1800192, + "step": 3660 + }, + { + "epoch": 0.4837006730896133, + "grad_norm": 0.32942232489585876, + "learning_rate": 1.2298935572933575e-06, + "loss": 0.1465, + "num_input_tokens_seen": 1802560, + "step": 3665 + }, + { + "epoch": 0.48436056486736173, + "grad_norm": 23.043102264404297, + "learning_rate": 1.2276510901510892e-06, + "loss": 0.1584, + "num_input_tokens_seen": 1805056, + "step": 3670 + }, + { + "epoch": 0.4850204566451102, + "grad_norm": 0.42907005548477173, + "learning_rate": 1.2254074150060915e-06, + "loss": 0.1682, + "num_input_tokens_seen": 1807744, + "step": 3675 + }, + { + "epoch": 0.4856803484228587, + "grad_norm": 46.6706657409668, + "learning_rate": 1.2231625437641535e-06, + "loss": 0.1522, + "num_input_tokens_seen": 1810368, + "step": 3680 + }, + { + "epoch": 0.4863402402006071, + "grad_norm": 0.21515221893787384, + "learning_rate": 1.2209164883374096e-06, + "loss": 0.045, + "num_input_tokens_seen": 1813056, + "step": 3685 + }, + { + "epoch": 0.48700013197835557, + "grad_norm": 0.3806566894054413, + "learning_rate": 1.2186692606442793e-06, + "loss": 0.22, + "num_input_tokens_seen": 1815360, + "step": 3690 + }, + { + "epoch": 0.487660023756104, + "grad_norm": 59.212196350097656, + "learning_rate": 1.216420872609402e-06, + "loss": 0.1641, + "num_input_tokens_seen": 1817920, + "step": 3695 + }, + { + "epoch": 0.48831991553385246, + "grad_norm": 16.957406997680664, + "learning_rate": 1.2141713361635739e-06, + "loss": 0.0635, + "num_input_tokens_seen": 1820288, + "step": 3700 + }, + { + "epoch": 0.4889798073116009, + "grad_norm": 0.02635974995791912, + "learning_rate": 1.2119206632436864e-06, + "loss": 0.1703, + "num_input_tokens_seen": 1822656, + "step": 3705 + }, + { + "epoch": 0.48963969908934935, + "grad_norm": 0.6288211345672607, + "learning_rate": 1.209668865792661e-06, + "loss": 0.0631, + "num_input_tokens_seen": 1824832, + "step": 3710 + }, + { + "epoch": 0.4902995908670978, + "grad_norm": 176.1214599609375, + "learning_rate": 1.207415955759385e-06, + "loss": 0.0998, + "num_input_tokens_seen": 1827200, + "step": 3715 + }, + { + "epoch": 0.49095948264484623, + "grad_norm": 17.406232833862305, + "learning_rate": 1.2051619450986514e-06, + "loss": 0.1581, + "num_input_tokens_seen": 1829632, + "step": 3720 + }, + { + "epoch": 0.4916193744225947, + "grad_norm": 6.454481601715088, + "learning_rate": 1.2029068457710923e-06, + "loss": 0.1271, + "num_input_tokens_seen": 1832192, + "step": 3725 + }, + { + "epoch": 0.4922792662003431, + "grad_norm": 2.918125867843628, + "learning_rate": 1.200650669743117e-06, + "loss": 0.091, + "num_input_tokens_seen": 1834752, + "step": 3730 + }, + { + "epoch": 0.49293915797809157, + "grad_norm": 19.404775619506836, + "learning_rate": 1.1983934289868488e-06, + "loss": 0.116, + "num_input_tokens_seen": 1837248, + "step": 3735 + }, + { + "epoch": 0.49359904975584007, + "grad_norm": 8.872051239013672, + "learning_rate": 1.1961351354800595e-06, + "loss": 0.1431, + "num_input_tokens_seen": 1839680, + "step": 3740 + }, + { + "epoch": 0.4942589415335885, + "grad_norm": 0.526841402053833, + "learning_rate": 1.193875801206109e-06, + "loss": 0.1399, + "num_input_tokens_seen": 1842304, + "step": 3745 + }, + { + "epoch": 0.49491883331133696, + "grad_norm": 0.18063127994537354, + "learning_rate": 1.1916154381538786e-06, + "loss": 0.0471, + "num_input_tokens_seen": 1844480, + "step": 3750 + }, + { + "epoch": 0.4955787250890854, + "grad_norm": 0.19460546970367432, + "learning_rate": 1.1893540583177083e-06, + "loss": 0.1858, + "num_input_tokens_seen": 1846912, + "step": 3755 + }, + { + "epoch": 0.49623861686683385, + "grad_norm": 14.68387508392334, + "learning_rate": 1.187091673697335e-06, + "loss": 0.0801, + "num_input_tokens_seen": 1849024, + "step": 3760 + }, + { + "epoch": 0.4968985086445823, + "grad_norm": 0.8316734433174133, + "learning_rate": 1.184828296297826e-06, + "loss": 0.0691, + "num_input_tokens_seen": 1851712, + "step": 3765 + }, + { + "epoch": 0.49755840042233074, + "grad_norm": 38.36271667480469, + "learning_rate": 1.182563938129518e-06, + "loss": 0.0697, + "num_input_tokens_seen": 1854208, + "step": 3770 + }, + { + "epoch": 0.4982182922000792, + "grad_norm": 0.08225525915622711, + "learning_rate": 1.1802986112079507e-06, + "loss": 0.0893, + "num_input_tokens_seen": 1856704, + "step": 3775 + }, + { + "epoch": 0.4988781839778276, + "grad_norm": 0.5821913480758667, + "learning_rate": 1.1780323275538056e-06, + "loss": 0.0831, + "num_input_tokens_seen": 1858944, + "step": 3780 + }, + { + "epoch": 0.49953807575557607, + "grad_norm": 0.5157123804092407, + "learning_rate": 1.1757650991928393e-06, + "loss": 0.2059, + "num_input_tokens_seen": 1861696, + "step": 3785 + }, + { + "epoch": 0.5001979675333246, + "grad_norm": 0.31598079204559326, + "learning_rate": 1.1734969381558235e-06, + "loss": 0.179, + "num_input_tokens_seen": 1864128, + "step": 3790 + }, + { + "epoch": 0.5001979675333246, + "eval_loss": 0.12760794162750244, + "eval_runtime": 7.9443, + "eval_samples_per_second": 847.779, + "eval_steps_per_second": 105.988, + "num_input_tokens_seen": 1864128, + "step": 3790 + }, + { + "epoch": 0.500857859311073, + "grad_norm": 0.1666107177734375, + "learning_rate": 1.1712278564784774e-06, + "loss": 0.002, + "num_input_tokens_seen": 1866432, + "step": 3795 + }, + { + "epoch": 0.5015177510888215, + "grad_norm": 20.980514526367188, + "learning_rate": 1.1689578662014064e-06, + "loss": 0.0598, + "num_input_tokens_seen": 1868736, + "step": 3800 + }, + { + "epoch": 0.5021776428665699, + "grad_norm": 14.8715181350708, + "learning_rate": 1.1666869793700362e-06, + "loss": 0.3077, + "num_input_tokens_seen": 1871360, + "step": 3805 + }, + { + "epoch": 0.5028375346443184, + "grad_norm": 0.031641654670238495, + "learning_rate": 1.1644152080345515e-06, + "loss": 0.0016, + "num_input_tokens_seen": 1873536, + "step": 3810 + }, + { + "epoch": 0.5034974264220667, + "grad_norm": 28.584814071655273, + "learning_rate": 1.1621425642498289e-06, + "loss": 0.2264, + "num_input_tokens_seen": 1875904, + "step": 3815 + }, + { + "epoch": 0.5041573181998152, + "grad_norm": 405.0102233886719, + "learning_rate": 1.1598690600753759e-06, + "loss": 0.2478, + "num_input_tokens_seen": 1878464, + "step": 3820 + }, + { + "epoch": 0.5048172099775636, + "grad_norm": 34.297298431396484, + "learning_rate": 1.1575947075752644e-06, + "loss": 0.2181, + "num_input_tokens_seen": 1880640, + "step": 3825 + }, + { + "epoch": 0.5054771017553121, + "grad_norm": 145.9020538330078, + "learning_rate": 1.1553195188180691e-06, + "loss": 0.1516, + "num_input_tokens_seen": 1882944, + "step": 3830 + }, + { + "epoch": 0.5061369935330606, + "grad_norm": 1.2247670888900757, + "learning_rate": 1.1530435058768008e-06, + "loss": 0.0694, + "num_input_tokens_seen": 1885248, + "step": 3835 + }, + { + "epoch": 0.506796885310809, + "grad_norm": 19.718626022338867, + "learning_rate": 1.150766680828845e-06, + "loss": 0.0841, + "num_input_tokens_seen": 1887872, + "step": 3840 + }, + { + "epoch": 0.5074567770885575, + "grad_norm": 1.9999217987060547, + "learning_rate": 1.1484890557558955e-06, + "loss": 0.0024, + "num_input_tokens_seen": 1890560, + "step": 3845 + }, + { + "epoch": 0.5081166688663059, + "grad_norm": 19.390962600708008, + "learning_rate": 1.146210642743892e-06, + "loss": 0.076, + "num_input_tokens_seen": 1893056, + "step": 3850 + }, + { + "epoch": 0.5087765606440544, + "grad_norm": 0.07549047470092773, + "learning_rate": 1.1439314538829554e-06, + "loss": 0.0353, + "num_input_tokens_seen": 1895360, + "step": 3855 + }, + { + "epoch": 0.5094364524218028, + "grad_norm": 0.08527141809463501, + "learning_rate": 1.141651501267323e-06, + "loss": 0.0793, + "num_input_tokens_seen": 1897664, + "step": 3860 + }, + { + "epoch": 0.5100963441995513, + "grad_norm": 1.7610729932785034, + "learning_rate": 1.1393707969952847e-06, + "loss": 0.1073, + "num_input_tokens_seen": 1900288, + "step": 3865 + }, + { + "epoch": 0.5107562359772997, + "grad_norm": 0.7622396945953369, + "learning_rate": 1.13708935316912e-06, + "loss": 0.0796, + "num_input_tokens_seen": 1903040, + "step": 3870 + }, + { + "epoch": 0.5114161277550482, + "grad_norm": 0.33791011571884155, + "learning_rate": 1.134807181895032e-06, + "loss": 0.0173, + "num_input_tokens_seen": 1905472, + "step": 3875 + }, + { + "epoch": 0.5120760195327966, + "grad_norm": 0.7325949668884277, + "learning_rate": 1.132524295283084e-06, + "loss": 0.0637, + "num_input_tokens_seen": 1907712, + "step": 3880 + }, + { + "epoch": 0.5127359113105451, + "grad_norm": 0.04774130508303642, + "learning_rate": 1.1302407054471355e-06, + "loss": 0.0912, + "num_input_tokens_seen": 1910080, + "step": 3885 + }, + { + "epoch": 0.5133958030882935, + "grad_norm": 0.2512286305427551, + "learning_rate": 1.1279564245047767e-06, + "loss": 0.2374, + "num_input_tokens_seen": 1912512, + "step": 3890 + }, + { + "epoch": 0.514055694866042, + "grad_norm": 0.08980656415224075, + "learning_rate": 1.1256714645772662e-06, + "loss": 0.1336, + "num_input_tokens_seen": 1914752, + "step": 3895 + }, + { + "epoch": 0.5147155866437905, + "grad_norm": 0.0983128771185875, + "learning_rate": 1.1233858377894647e-06, + "loss": 0.0021, + "num_input_tokens_seen": 1917120, + "step": 3900 + }, + { + "epoch": 0.5153754784215389, + "grad_norm": 74.96298217773438, + "learning_rate": 1.1210995562697722e-06, + "loss": 0.014, + "num_input_tokens_seen": 1919232, + "step": 3905 + }, + { + "epoch": 0.5160353701992874, + "grad_norm": 269.811279296875, + "learning_rate": 1.1188126321500621e-06, + "loss": 0.0559, + "num_input_tokens_seen": 1921856, + "step": 3910 + }, + { + "epoch": 0.5166952619770357, + "grad_norm": 32.522220611572266, + "learning_rate": 1.1165250775656188e-06, + "loss": 0.1515, + "num_input_tokens_seen": 1924224, + "step": 3915 + }, + { + "epoch": 0.5173551537547842, + "grad_norm": 0.08811689168214798, + "learning_rate": 1.1142369046550708e-06, + "loss": 0.0373, + "num_input_tokens_seen": 1926464, + "step": 3920 + }, + { + "epoch": 0.5180150455325326, + "grad_norm": 0.0877578929066658, + "learning_rate": 1.1119481255603289e-06, + "loss": 0.1665, + "num_input_tokens_seen": 1928896, + "step": 3925 + }, + { + "epoch": 0.5186749373102811, + "grad_norm": 58.392852783203125, + "learning_rate": 1.1096587524265197e-06, + "loss": 0.115, + "num_input_tokens_seen": 1931200, + "step": 3930 + }, + { + "epoch": 0.5193348290880295, + "grad_norm": 0.029454190284013748, + "learning_rate": 1.107368797401923e-06, + "loss": 0.0542, + "num_input_tokens_seen": 1933632, + "step": 3935 + }, + { + "epoch": 0.519994720865778, + "grad_norm": 0.17615357041358948, + "learning_rate": 1.1050782726379054e-06, + "loss": 0.0019, + "num_input_tokens_seen": 1935872, + "step": 3940 + }, + { + "epoch": 0.5206546126435264, + "grad_norm": 0.39868056774139404, + "learning_rate": 1.1027871902888566e-06, + "loss": 0.0951, + "num_input_tokens_seen": 1938048, + "step": 3945 + }, + { + "epoch": 0.5213145044212749, + "grad_norm": 66.22596740722656, + "learning_rate": 1.1004955625121257e-06, + "loss": 0.056, + "num_input_tokens_seen": 1940608, + "step": 3950 + }, + { + "epoch": 0.5219743961990233, + "grad_norm": 24.409608840942383, + "learning_rate": 1.0982034014679561e-06, + "loss": 0.2829, + "num_input_tokens_seen": 1943040, + "step": 3955 + }, + { + "epoch": 0.5226342879767718, + "grad_norm": 0.12048153579235077, + "learning_rate": 1.0959107193194206e-06, + "loss": 0.2808, + "num_input_tokens_seen": 1945664, + "step": 3960 + }, + { + "epoch": 0.5232941797545203, + "grad_norm": 0.041272152215242386, + "learning_rate": 1.0936175282323575e-06, + "loss": 0.0046, + "num_input_tokens_seen": 1948032, + "step": 3965 + }, + { + "epoch": 0.5239540715322687, + "grad_norm": 0.2881408929824829, + "learning_rate": 1.091323840375305e-06, + "loss": 0.001, + "num_input_tokens_seen": 1950208, + "step": 3970 + }, + { + "epoch": 0.5246139633100172, + "grad_norm": 57.43034362792969, + "learning_rate": 1.0890296679194378e-06, + "loss": 0.2119, + "num_input_tokens_seen": 1952896, + "step": 3975 + }, + { + "epoch": 0.5252738550877656, + "grad_norm": 0.0778154581785202, + "learning_rate": 1.086735023038502e-06, + "loss": 0.068, + "num_input_tokens_seen": 1955200, + "step": 3980 + }, + { + "epoch": 0.5259337468655141, + "grad_norm": 0.2079089879989624, + "learning_rate": 1.0844399179087512e-06, + "loss": 0.0953, + "num_input_tokens_seen": 1957376, + "step": 3985 + }, + { + "epoch": 0.5265936386432625, + "grad_norm": 0.25119689106941223, + "learning_rate": 1.0821443647088802e-06, + "loss": 0.2058, + "num_input_tokens_seen": 1960064, + "step": 3990 + }, + { + "epoch": 0.527253530421011, + "grad_norm": 0.09684748202562332, + "learning_rate": 1.0798483756199623e-06, + "loss": 0.0652, + "num_input_tokens_seen": 1962624, + "step": 3995 + }, + { + "epoch": 0.5279134221987594, + "grad_norm": 0.08053699135780334, + "learning_rate": 1.0775519628253833e-06, + "loss": 0.0704, + "num_input_tokens_seen": 1965056, + "step": 4000 + }, + { + "epoch": 0.5285733139765079, + "grad_norm": 0.2662527859210968, + "learning_rate": 1.0752551385107772e-06, + "loss": 0.1949, + "num_input_tokens_seen": 1967424, + "step": 4005 + }, + { + "epoch": 0.5292332057542563, + "grad_norm": 18.517011642456055, + "learning_rate": 1.0729579148639621e-06, + "loss": 0.1433, + "num_input_tokens_seen": 1969856, + "step": 4010 + }, + { + "epoch": 0.5298930975320048, + "grad_norm": 0.126367449760437, + "learning_rate": 1.0706603040748747e-06, + "loss": 0.0517, + "num_input_tokens_seen": 1972544, + "step": 4015 + }, + { + "epoch": 0.5305529893097533, + "grad_norm": 0.04751770943403244, + "learning_rate": 1.0683623183355071e-06, + "loss": 0.0448, + "num_input_tokens_seen": 1974912, + "step": 4020 + }, + { + "epoch": 0.5312128810875016, + "grad_norm": 16.610794067382812, + "learning_rate": 1.0660639698398392e-06, + "loss": 0.1542, + "num_input_tokens_seen": 1977216, + "step": 4025 + }, + { + "epoch": 0.5318727728652501, + "grad_norm": 100.28923034667969, + "learning_rate": 1.0637652707837773e-06, + "loss": 0.1436, + "num_input_tokens_seen": 1979648, + "step": 4030 + }, + { + "epoch": 0.5325326646429985, + "grad_norm": 20.682844161987305, + "learning_rate": 1.0614662333650876e-06, + "loss": 0.1039, + "num_input_tokens_seen": 1981888, + "step": 4035 + }, + { + "epoch": 0.533192556420747, + "grad_norm": 19.53425407409668, + "learning_rate": 1.0591668697833311e-06, + "loss": 0.2167, + "num_input_tokens_seen": 1984448, + "step": 4040 + }, + { + "epoch": 0.5338524481984954, + "grad_norm": 67.5270004272461, + "learning_rate": 1.0568671922398005e-06, + "loss": 0.1567, + "num_input_tokens_seen": 1987072, + "step": 4045 + }, + { + "epoch": 0.5345123399762439, + "grad_norm": 1.1474074125289917, + "learning_rate": 1.054567212937454e-06, + "loss": 0.1618, + "num_input_tokens_seen": 1989632, + "step": 4050 + }, + { + "epoch": 0.5351722317539923, + "grad_norm": 0.28706297278404236, + "learning_rate": 1.0522669440808508e-06, + "loss": 0.0367, + "num_input_tokens_seen": 1992192, + "step": 4055 + }, + { + "epoch": 0.5358321235317408, + "grad_norm": 50.1959114074707, + "learning_rate": 1.0499663978760871e-06, + "loss": 0.2607, + "num_input_tokens_seen": 1994624, + "step": 4060 + }, + { + "epoch": 0.5364920153094892, + "grad_norm": 13.985773086547852, + "learning_rate": 1.0476655865307308e-06, + "loss": 0.0821, + "num_input_tokens_seen": 1997056, + "step": 4065 + }, + { + "epoch": 0.5371519070872377, + "grad_norm": 0.9565370082855225, + "learning_rate": 1.0453645222537556e-06, + "loss": 0.0918, + "num_input_tokens_seen": 1999360, + "step": 4070 + }, + { + "epoch": 0.5378117988649861, + "grad_norm": 53.97791290283203, + "learning_rate": 1.0430632172554796e-06, + "loss": 0.0861, + "num_input_tokens_seen": 2001856, + "step": 4075 + }, + { + "epoch": 0.5384716906427346, + "grad_norm": 38.577674865722656, + "learning_rate": 1.0407616837474963e-06, + "loss": 0.1321, + "num_input_tokens_seen": 2004288, + "step": 4080 + }, + { + "epoch": 0.5391315824204831, + "grad_norm": 1.6322799921035767, + "learning_rate": 1.038459933942612e-06, + "loss": 0.0784, + "num_input_tokens_seen": 2006976, + "step": 4085 + }, + { + "epoch": 0.5397914741982315, + "grad_norm": 57.15738296508789, + "learning_rate": 1.036157980054782e-06, + "loss": 0.0603, + "num_input_tokens_seen": 2009280, + "step": 4090 + }, + { + "epoch": 0.54045136597598, + "grad_norm": 201.4349365234375, + "learning_rate": 1.0338558342990431e-06, + "loss": 0.0969, + "num_input_tokens_seen": 2011776, + "step": 4095 + }, + { + "epoch": 0.5411112577537284, + "grad_norm": 15.186023712158203, + "learning_rate": 1.0315535088914508e-06, + "loss": 0.2581, + "num_input_tokens_seen": 2014336, + "step": 4100 + }, + { + "epoch": 0.5417711495314769, + "grad_norm": 22.846664428710938, + "learning_rate": 1.0292510160490146e-06, + "loss": 0.1642, + "num_input_tokens_seen": 2017152, + "step": 4105 + }, + { + "epoch": 0.5424310413092253, + "grad_norm": 21.382556915283203, + "learning_rate": 1.0269483679896308e-06, + "loss": 0.0998, + "num_input_tokens_seen": 2019520, + "step": 4110 + }, + { + "epoch": 0.5430909330869738, + "grad_norm": 50.146427154541016, + "learning_rate": 1.0246455769320211e-06, + "loss": 0.162, + "num_input_tokens_seen": 2021632, + "step": 4115 + }, + { + "epoch": 0.5437508248647221, + "grad_norm": 0.8249346017837524, + "learning_rate": 1.0223426550956647e-06, + "loss": 0.1261, + "num_input_tokens_seen": 2023744, + "step": 4120 + }, + { + "epoch": 0.5444107166424706, + "grad_norm": 1.6365822553634644, + "learning_rate": 1.0200396147007354e-06, + "loss": 0.0762, + "num_input_tokens_seen": 2026048, + "step": 4125 + }, + { + "epoch": 0.545070608420219, + "grad_norm": 0.0482165552675724, + "learning_rate": 1.0177364679680367e-06, + "loss": 0.132, + "num_input_tokens_seen": 2028352, + "step": 4130 + }, + { + "epoch": 0.5457305001979675, + "grad_norm": 0.10031591355800629, + "learning_rate": 1.015433227118935e-06, + "loss": 0.0602, + "num_input_tokens_seen": 2030848, + "step": 4135 + }, + { + "epoch": 0.5463903919757159, + "grad_norm": 0.14653390645980835, + "learning_rate": 1.0131299043752967e-06, + "loss": 0.1337, + "num_input_tokens_seen": 2033344, + "step": 4140 + }, + { + "epoch": 0.5470502837534644, + "grad_norm": 0.3093219995498657, + "learning_rate": 1.0108265119594233e-06, + "loss": 0.0548, + "num_input_tokens_seen": 2035584, + "step": 4145 + }, + { + "epoch": 0.5477101755312129, + "grad_norm": 16.40343475341797, + "learning_rate": 1.0085230620939853e-06, + "loss": 0.0713, + "num_input_tokens_seen": 2038272, + "step": 4150 + }, + { + "epoch": 0.5483700673089613, + "grad_norm": 16.413604736328125, + "learning_rate": 1.0062195670019583e-06, + "loss": 0.0909, + "num_input_tokens_seen": 2040768, + "step": 4155 + }, + { + "epoch": 0.5490299590867098, + "grad_norm": 57.78659439086914, + "learning_rate": 1.0039160389065582e-06, + "loss": 0.1428, + "num_input_tokens_seen": 2043072, + "step": 4160 + }, + { + "epoch": 0.5496898508644582, + "grad_norm": 12.916586875915527, + "learning_rate": 1.0016124900311755e-06, + "loss": 0.1555, + "num_input_tokens_seen": 2045824, + "step": 4165 + }, + { + "epoch": 0.550217764286657, + "eval_loss": 0.09937019646167755, + "eval_runtime": 7.8852, + "eval_samples_per_second": 854.136, + "eval_steps_per_second": 106.783, + "num_input_tokens_seen": 2047552, + "step": 4169 + }, + { + "epoch": 0.5503497426422067, + "grad_norm": 25.078630447387695, + "learning_rate": 9.99308932599311e-07, + "loss": 0.2405, + "num_input_tokens_seen": 2048064, + "step": 4170 + }, + { + "epoch": 0.5510096344199551, + "grad_norm": 0.6139159798622131, + "learning_rate": 9.970053788345112e-07, + "loss": 0.0424, + "num_input_tokens_seen": 2050432, + "step": 4175 + }, + { + "epoch": 0.5516695261977036, + "grad_norm": 0.7848473191261292, + "learning_rate": 9.947018409603036e-07, + "loss": 0.0537, + "num_input_tokens_seen": 2052928, + "step": 4180 + }, + { + "epoch": 0.552329417975452, + "grad_norm": 0.712689995765686, + "learning_rate": 9.923983312001304e-07, + "loss": 0.1485, + "num_input_tokens_seen": 2055424, + "step": 4185 + }, + { + "epoch": 0.5529893097532005, + "grad_norm": 0.20174185931682587, + "learning_rate": 9.900948617772846e-07, + "loss": 0.1457, + "num_input_tokens_seen": 2057536, + "step": 4190 + }, + { + "epoch": 0.5536492015309489, + "grad_norm": 3.5391955375671387, + "learning_rate": 9.877914449148462e-07, + "loss": 0.1713, + "num_input_tokens_seen": 2059840, + "step": 4195 + }, + { + "epoch": 0.5543090933086974, + "grad_norm": 49.72500228881836, + "learning_rate": 9.854880928356157e-07, + "loss": 0.2209, + "num_input_tokens_seen": 2062656, + "step": 4200 + }, + { + "epoch": 0.5549689850864459, + "grad_norm": 0.5038784742355347, + "learning_rate": 9.831848177620493e-07, + "loss": 0.1398, + "num_input_tokens_seen": 2064960, + "step": 4205 + }, + { + "epoch": 0.5556288768641943, + "grad_norm": 33.89471435546875, + "learning_rate": 9.808816319161961e-07, + "loss": 0.2412, + "num_input_tokens_seen": 2067008, + "step": 4210 + }, + { + "epoch": 0.5562887686419428, + "grad_norm": 0.1182156652212143, + "learning_rate": 9.785785475196298e-07, + "loss": 0.0009, + "num_input_tokens_seen": 2069696, + "step": 4215 + }, + { + "epoch": 0.5569486604196912, + "grad_norm": 0.5332831740379333, + "learning_rate": 9.76275576793387e-07, + "loss": 0.0507, + "num_input_tokens_seen": 2072320, + "step": 4220 + }, + { + "epoch": 0.5576085521974397, + "grad_norm": 3.603602886199951, + "learning_rate": 9.739727319579007e-07, + "loss": 0.0016, + "num_input_tokens_seen": 2074752, + "step": 4225 + }, + { + "epoch": 0.558268443975188, + "grad_norm": 2.214005947113037, + "learning_rate": 9.716700252329361e-07, + "loss": 0.1143, + "num_input_tokens_seen": 2077440, + "step": 4230 + }, + { + "epoch": 0.5589283357529365, + "grad_norm": 29.49093246459961, + "learning_rate": 9.693674688375254e-07, + "loss": 0.1856, + "num_input_tokens_seen": 2080000, + "step": 4235 + }, + { + "epoch": 0.5595882275306849, + "grad_norm": 0.3982854187488556, + "learning_rate": 9.67065074989903e-07, + "loss": 0.0667, + "num_input_tokens_seen": 2082560, + "step": 4240 + }, + { + "epoch": 0.5602481193084334, + "grad_norm": 29.326953887939453, + "learning_rate": 9.647628559074415e-07, + "loss": 0.0822, + "num_input_tokens_seen": 2084864, + "step": 4245 + }, + { + "epoch": 0.5609080110861818, + "grad_norm": 0.06176973879337311, + "learning_rate": 9.62460823806585e-07, + "loss": 0.1228, + "num_input_tokens_seen": 2087424, + "step": 4250 + }, + { + "epoch": 0.5615679028639303, + "grad_norm": 38.027488708496094, + "learning_rate": 9.601589909027857e-07, + "loss": 0.2208, + "num_input_tokens_seen": 2090048, + "step": 4255 + }, + { + "epoch": 0.5622277946416787, + "grad_norm": 0.05623474344611168, + "learning_rate": 9.578573694104394e-07, + "loss": 0.0689, + "num_input_tokens_seen": 2092416, + "step": 4260 + }, + { + "epoch": 0.5628876864194272, + "grad_norm": 34.464744567871094, + "learning_rate": 9.555559715428199e-07, + "loss": 0.0788, + "num_input_tokens_seen": 2094656, + "step": 4265 + }, + { + "epoch": 0.5635475781971757, + "grad_norm": 0.2011699080467224, + "learning_rate": 9.532548095120134e-07, + "loss": 0.069, + "num_input_tokens_seen": 2097024, + "step": 4270 + }, + { + "epoch": 0.5642074699749241, + "grad_norm": 0.07516666501760483, + "learning_rate": 9.509538955288564e-07, + "loss": 0.0597, + "num_input_tokens_seen": 2099392, + "step": 4275 + }, + { + "epoch": 0.5648673617526726, + "grad_norm": 1.4651904106140137, + "learning_rate": 9.486532418028672e-07, + "loss": 0.09, + "num_input_tokens_seen": 2102016, + "step": 4280 + }, + { + "epoch": 0.565527253530421, + "grad_norm": 130.39993286132812, + "learning_rate": 9.463528605421844e-07, + "loss": 0.0804, + "num_input_tokens_seen": 2104320, + "step": 4285 + }, + { + "epoch": 0.5661871453081695, + "grad_norm": 36.727294921875, + "learning_rate": 9.440527639535004e-07, + "loss": 0.1016, + "num_input_tokens_seen": 2107136, + "step": 4290 + }, + { + "epoch": 0.5668470370859179, + "grad_norm": 0.16789622604846954, + "learning_rate": 9.417529642419971e-07, + "loss": 0.0533, + "num_input_tokens_seen": 2109888, + "step": 4295 + }, + { + "epoch": 0.5675069288636664, + "grad_norm": 108.9660873413086, + "learning_rate": 9.394534736112815e-07, + "loss": 0.1565, + "num_input_tokens_seen": 2112192, + "step": 4300 + }, + { + "epoch": 0.5681668206414148, + "grad_norm": 0.09434999525547028, + "learning_rate": 9.371543042633192e-07, + "loss": 0.1197, + "num_input_tokens_seen": 2114752, + "step": 4305 + }, + { + "epoch": 0.5688267124191633, + "grad_norm": 0.1492881327867508, + "learning_rate": 9.348554683983722e-07, + "loss": 0.141, + "num_input_tokens_seen": 2117184, + "step": 4310 + }, + { + "epoch": 0.5694866041969117, + "grad_norm": 0.6214476227760315, + "learning_rate": 9.325569782149323e-07, + "loss": 0.1155, + "num_input_tokens_seen": 2119552, + "step": 4315 + }, + { + "epoch": 0.5701464959746602, + "grad_norm": 35.80785369873047, + "learning_rate": 9.302588459096574e-07, + "loss": 0.0744, + "num_input_tokens_seen": 2121920, + "step": 4320 + }, + { + "epoch": 0.5708063877524086, + "grad_norm": 15.295533180236816, + "learning_rate": 9.279610836773064e-07, + "loss": 0.2853, + "num_input_tokens_seen": 2124096, + "step": 4325 + }, + { + "epoch": 0.571466279530157, + "grad_norm": 28.60223388671875, + "learning_rate": 9.256637037106735e-07, + "loss": 0.1079, + "num_input_tokens_seen": 2126528, + "step": 4330 + }, + { + "epoch": 0.5721261713079056, + "grad_norm": 39.715091705322266, + "learning_rate": 9.233667182005259e-07, + "loss": 0.0589, + "num_input_tokens_seen": 2128576, + "step": 4335 + }, + { + "epoch": 0.5727860630856539, + "grad_norm": 1.4454349279403687, + "learning_rate": 9.210701393355361e-07, + "loss": 0.0648, + "num_input_tokens_seen": 2130688, + "step": 4340 + }, + { + "epoch": 0.5734459548634024, + "grad_norm": 71.0278091430664, + "learning_rate": 9.187739793022198e-07, + "loss": 0.1324, + "num_input_tokens_seen": 2133312, + "step": 4345 + }, + { + "epoch": 0.5741058466411508, + "grad_norm": 0.047647565603256226, + "learning_rate": 9.164782502848702e-07, + "loss": 0.0724, + "num_input_tokens_seen": 2135680, + "step": 4350 + }, + { + "epoch": 0.5747657384188993, + "grad_norm": 0.19318842887878418, + "learning_rate": 9.141829644654936e-07, + "loss": 0.1448, + "num_input_tokens_seen": 2138112, + "step": 4355 + }, + { + "epoch": 0.5754256301966477, + "grad_norm": 110.14704132080078, + "learning_rate": 9.118881340237432e-07, + "loss": 0.4271, + "num_input_tokens_seen": 2140352, + "step": 4360 + }, + { + "epoch": 0.5760855219743962, + "grad_norm": 0.10673969238996506, + "learning_rate": 9.095937711368573e-07, + "loss": 0.0894, + "num_input_tokens_seen": 2143040, + "step": 4365 + }, + { + "epoch": 0.5767454137521446, + "grad_norm": 0.09286520630121231, + "learning_rate": 9.072998879795923e-07, + "loss": 0.0716, + "num_input_tokens_seen": 2145280, + "step": 4370 + }, + { + "epoch": 0.5774053055298931, + "grad_norm": 2.3450353145599365, + "learning_rate": 9.050064967241596e-07, + "loss": 0.1048, + "num_input_tokens_seen": 2147904, + "step": 4375 + }, + { + "epoch": 0.5780651973076415, + "grad_norm": 0.20796601474285126, + "learning_rate": 9.027136095401598e-07, + "loss": 0.0838, + "num_input_tokens_seen": 2150400, + "step": 4380 + }, + { + "epoch": 0.57872508908539, + "grad_norm": 0.1643630564212799, + "learning_rate": 9.004212385945187e-07, + "loss": 0.135, + "num_input_tokens_seen": 2153088, + "step": 4385 + }, + { + "epoch": 0.5793849808631385, + "grad_norm": 0.05613645911216736, + "learning_rate": 8.981293960514233e-07, + "loss": 0.0013, + "num_input_tokens_seen": 2155776, + "step": 4390 + }, + { + "epoch": 0.5800448726408869, + "grad_norm": 106.51136779785156, + "learning_rate": 8.958380940722564e-07, + "loss": 0.1661, + "num_input_tokens_seen": 2158400, + "step": 4395 + }, + { + "epoch": 0.5807047644186354, + "grad_norm": 0.41299527883529663, + "learning_rate": 8.935473448155326e-07, + "loss": 0.0766, + "num_input_tokens_seen": 2160704, + "step": 4400 + }, + { + "epoch": 0.5813646561963838, + "grad_norm": 29.65276336669922, + "learning_rate": 8.912571604368324e-07, + "loss": 0.0469, + "num_input_tokens_seen": 2163200, + "step": 4405 + }, + { + "epoch": 0.5820245479741323, + "grad_norm": 49.52018737792969, + "learning_rate": 8.889675530887404e-07, + "loss": 0.1421, + "num_input_tokens_seen": 2165376, + "step": 4410 + }, + { + "epoch": 0.5826844397518807, + "grad_norm": 0.17924949526786804, + "learning_rate": 8.866785349207786e-07, + "loss": 0.0994, + "num_input_tokens_seen": 2167808, + "step": 4415 + }, + { + "epoch": 0.5833443315296292, + "grad_norm": 23.86568260192871, + "learning_rate": 8.843901180793423e-07, + "loss": 0.1332, + "num_input_tokens_seen": 2170112, + "step": 4420 + }, + { + "epoch": 0.5840042233073776, + "grad_norm": 0.38153278827667236, + "learning_rate": 8.821023147076362e-07, + "loss": 0.0005, + "num_input_tokens_seen": 2172480, + "step": 4425 + }, + { + "epoch": 0.5846641150851261, + "grad_norm": 1.3169441223144531, + "learning_rate": 8.798151369456098e-07, + "loss": 0.0432, + "num_input_tokens_seen": 2175104, + "step": 4430 + }, + { + "epoch": 0.5853240068628744, + "grad_norm": 14.025379180908203, + "learning_rate": 8.775285969298931e-07, + "loss": 0.1126, + "num_input_tokens_seen": 2177280, + "step": 4435 + }, + { + "epoch": 0.585983898640623, + "grad_norm": 0.05871421471238136, + "learning_rate": 8.752427067937312e-07, + "loss": 0.0735, + "num_input_tokens_seen": 2179776, + "step": 4440 + }, + { + "epoch": 0.5866437904183713, + "grad_norm": 0.026597043499350548, + "learning_rate": 8.729574786669214e-07, + "loss": 0.0949, + "num_input_tokens_seen": 2182400, + "step": 4445 + }, + { + "epoch": 0.5873036821961198, + "grad_norm": 1.1581672430038452, + "learning_rate": 8.706729246757477e-07, + "loss": 0.0655, + "num_input_tokens_seen": 2185088, + "step": 4450 + }, + { + "epoch": 0.5879635739738683, + "grad_norm": 0.904012143611908, + "learning_rate": 8.683890569429173e-07, + "loss": 0.0697, + "num_input_tokens_seen": 2187776, + "step": 4455 + }, + { + "epoch": 0.5886234657516167, + "grad_norm": 0.04613454267382622, + "learning_rate": 8.661058875874956e-07, + "loss": 0.0006, + "num_input_tokens_seen": 2190016, + "step": 4460 + }, + { + "epoch": 0.5892833575293652, + "grad_norm": 0.06226871907711029, + "learning_rate": 8.638234287248423e-07, + "loss": 0.0008, + "num_input_tokens_seen": 2192320, + "step": 4465 + }, + { + "epoch": 0.5899432493071136, + "grad_norm": 178.02114868164062, + "learning_rate": 8.615416924665464e-07, + "loss": 0.0355, + "num_input_tokens_seen": 2194752, + "step": 4470 + }, + { + "epoch": 0.5906031410848621, + "grad_norm": 0.3306443691253662, + "learning_rate": 8.592606909203629e-07, + "loss": 0.0743, + "num_input_tokens_seen": 2197056, + "step": 4475 + }, + { + "epoch": 0.5912630328626105, + "grad_norm": 0.03277226537466049, + "learning_rate": 8.569804361901485e-07, + "loss": 0.0489, + "num_input_tokens_seen": 2199296, + "step": 4480 + }, + { + "epoch": 0.591922924640359, + "grad_norm": 70.67273712158203, + "learning_rate": 8.547009403757963e-07, + "loss": 0.41, + "num_input_tokens_seen": 2201664, + "step": 4485 + }, + { + "epoch": 0.5925828164181074, + "grad_norm": 15.897239685058594, + "learning_rate": 8.524222155731731e-07, + "loss": 0.227, + "num_input_tokens_seen": 2204288, + "step": 4490 + }, + { + "epoch": 0.5932427081958559, + "grad_norm": 0.5026524662971497, + "learning_rate": 8.501442738740538e-07, + "loss": 0.127, + "num_input_tokens_seen": 2206528, + "step": 4495 + }, + { + "epoch": 0.5939025999736043, + "grad_norm": 0.5848537683486938, + "learning_rate": 8.47867127366058e-07, + "loss": 0.0695, + "num_input_tokens_seen": 2209024, + "step": 4500 + }, + { + "epoch": 0.5945624917513528, + "grad_norm": 0.10000286996364594, + "learning_rate": 8.455907881325858e-07, + "loss": 0.0422, + "num_input_tokens_seen": 2211584, + "step": 4505 + }, + { + "epoch": 0.5952223835291012, + "grad_norm": 19.83750343322754, + "learning_rate": 8.433152682527533e-07, + "loss": 0.1233, + "num_input_tokens_seen": 2213952, + "step": 4510 + }, + { + "epoch": 0.5958822753068497, + "grad_norm": 72.72146606445312, + "learning_rate": 8.410405798013298e-07, + "loss": 0.0951, + "num_input_tokens_seen": 2216192, + "step": 4515 + }, + { + "epoch": 0.5965421670845982, + "grad_norm": 75.5259017944336, + "learning_rate": 8.387667348486712e-07, + "loss": 0.0126, + "num_input_tokens_seen": 2218688, + "step": 4520 + }, + { + "epoch": 0.5972020588623466, + "grad_norm": 0.20401786267757416, + "learning_rate": 8.364937454606585e-07, + "loss": 0.0853, + "num_input_tokens_seen": 2220928, + "step": 4525 + }, + { + "epoch": 0.5978619506400951, + "grad_norm": 0.22834134101867676, + "learning_rate": 8.342216236986329e-07, + "loss": 0.0013, + "num_input_tokens_seen": 2223360, + "step": 4530 + }, + { + "epoch": 0.5985218424178435, + "grad_norm": 0.06765160709619522, + "learning_rate": 8.319503816193305e-07, + "loss": 0.1511, + "num_input_tokens_seen": 2225792, + "step": 4535 + }, + { + "epoch": 0.599181734195592, + "grad_norm": 26.021888732910156, + "learning_rate": 8.296800312748206e-07, + "loss": 0.1163, + "num_input_tokens_seen": 2228288, + "step": 4540 + }, + { + "epoch": 0.5998416259733403, + "grad_norm": 0.4052346646785736, + "learning_rate": 8.274105847124404e-07, + "loss": 0.1894, + "num_input_tokens_seen": 2230848, + "step": 4545 + }, + { + "epoch": 0.6002375610399895, + "eval_loss": 0.1099071353673935, + "eval_runtime": 8.2934, + "eval_samples_per_second": 812.09, + "eval_steps_per_second": 101.526, + "num_input_tokens_seen": 2232448, + "step": 4548 + }, + { + "epoch": 0.6005015177510888, + "grad_norm": 25.49419593811035, + "learning_rate": 8.251420539747311e-07, + "loss": 0.233, + "num_input_tokens_seen": 2233472, + "step": 4550 + }, + { + "epoch": 0.6011614095288372, + "grad_norm": 0.07836712151765823, + "learning_rate": 8.228744510993742e-07, + "loss": 0.2218, + "num_input_tokens_seen": 2236096, + "step": 4555 + }, + { + "epoch": 0.6018213013065857, + "grad_norm": 0.250975102186203, + "learning_rate": 8.206077881191274e-07, + "loss": 0.0831, + "num_input_tokens_seen": 2238720, + "step": 4560 + }, + { + "epoch": 0.6024811930843341, + "grad_norm": 54.536197662353516, + "learning_rate": 8.183420770617614e-07, + "loss": 0.1877, + "num_input_tokens_seen": 2241216, + "step": 4565 + }, + { + "epoch": 0.6031410848620826, + "grad_norm": 28.72020149230957, + "learning_rate": 8.160773299499955e-07, + "loss": 0.0651, + "num_input_tokens_seen": 2243648, + "step": 4570 + }, + { + "epoch": 0.6038009766398311, + "grad_norm": 0.8081544637680054, + "learning_rate": 8.138135588014339e-07, + "loss": 0.0543, + "num_input_tokens_seen": 2246080, + "step": 4575 + }, + { + "epoch": 0.6044608684175795, + "grad_norm": 0.6024172902107239, + "learning_rate": 8.115507756285017e-07, + "loss": 0.0016, + "num_input_tokens_seen": 2248256, + "step": 4580 + }, + { + "epoch": 0.605120760195328, + "grad_norm": 0.1423349827528, + "learning_rate": 8.092889924383819e-07, + "loss": 0.07, + "num_input_tokens_seen": 2250688, + "step": 4585 + }, + { + "epoch": 0.6057806519730764, + "grad_norm": 0.3546024560928345, + "learning_rate": 8.070282212329508e-07, + "loss": 0.0872, + "num_input_tokens_seen": 2253120, + "step": 4590 + }, + { + "epoch": 0.6064405437508249, + "grad_norm": 16.78183937072754, + "learning_rate": 8.047684740087156e-07, + "loss": 0.1869, + "num_input_tokens_seen": 2255360, + "step": 4595 + }, + { + "epoch": 0.6071004355285733, + "grad_norm": 18.29332160949707, + "learning_rate": 8.025097627567481e-07, + "loss": 0.2572, + "num_input_tokens_seen": 2257728, + "step": 4600 + }, + { + "epoch": 0.6077603273063218, + "grad_norm": 0.07837789505720139, + "learning_rate": 8.002520994626247e-07, + "loss": 0.0536, + "num_input_tokens_seen": 2260224, + "step": 4605 + }, + { + "epoch": 0.6084202190840702, + "grad_norm": 0.2844223976135254, + "learning_rate": 7.979954961063596e-07, + "loss": 0.0372, + "num_input_tokens_seen": 2262912, + "step": 4610 + }, + { + "epoch": 0.6090801108618187, + "grad_norm": 64.26956939697266, + "learning_rate": 7.957399646623436e-07, + "loss": 0.2998, + "num_input_tokens_seen": 2265152, + "step": 4615 + }, + { + "epoch": 0.6097400026395671, + "grad_norm": 0.06967580318450928, + "learning_rate": 7.934855170992788e-07, + "loss": 0.0008, + "num_input_tokens_seen": 2267968, + "step": 4620 + }, + { + "epoch": 0.6103998944173156, + "grad_norm": 0.09711959213018417, + "learning_rate": 7.912321653801161e-07, + "loss": 0.0407, + "num_input_tokens_seen": 2270336, + "step": 4625 + }, + { + "epoch": 0.611059786195064, + "grad_norm": 19.1835880279541, + "learning_rate": 7.889799214619919e-07, + "loss": 0.135, + "num_input_tokens_seen": 2273024, + "step": 4630 + }, + { + "epoch": 0.6117196779728125, + "grad_norm": 0.028730077669024467, + "learning_rate": 7.867287972961629e-07, + "loss": 0.0678, + "num_input_tokens_seen": 2275264, + "step": 4635 + }, + { + "epoch": 0.612379569750561, + "grad_norm": 32.42776107788086, + "learning_rate": 7.844788048279453e-07, + "loss": 0.1219, + "num_input_tokens_seen": 2277888, + "step": 4640 + }, + { + "epoch": 0.6130394615283093, + "grad_norm": 0.039022643119096756, + "learning_rate": 7.822299559966494e-07, + "loss": 0.0005, + "num_input_tokens_seen": 2280320, + "step": 4645 + }, + { + "epoch": 0.6136993533060578, + "grad_norm": 0.0474756583571434, + "learning_rate": 7.799822627355171e-07, + "loss": 0.0017, + "num_input_tokens_seen": 2282560, + "step": 4650 + }, + { + "epoch": 0.6143592450838062, + "grad_norm": 0.14449454843997955, + "learning_rate": 7.77735736971659e-07, + "loss": 0.1505, + "num_input_tokens_seen": 2284864, + "step": 4655 + }, + { + "epoch": 0.6150191368615547, + "grad_norm": 0.22011378407478333, + "learning_rate": 7.754903906259889e-07, + "loss": 0.165, + "num_input_tokens_seen": 2287168, + "step": 4660 + }, + { + "epoch": 0.6156790286393031, + "grad_norm": 26.424232482910156, + "learning_rate": 7.732462356131637e-07, + "loss": 0.0716, + "num_input_tokens_seen": 2289600, + "step": 4665 + }, + { + "epoch": 0.6163389204170516, + "grad_norm": 1.7064114809036255, + "learning_rate": 7.710032838415179e-07, + "loss": 0.0317, + "num_input_tokens_seen": 2292160, + "step": 4670 + }, + { + "epoch": 0.6169988121948, + "grad_norm": 0.036719437688589096, + "learning_rate": 7.687615472130016e-07, + "loss": 0.0943, + "num_input_tokens_seen": 2294912, + "step": 4675 + }, + { + "epoch": 0.6176587039725485, + "grad_norm": 0.11287426948547363, + "learning_rate": 7.665210376231165e-07, + "loss": 0.1314, + "num_input_tokens_seen": 2297024, + "step": 4680 + }, + { + "epoch": 0.6183185957502969, + "grad_norm": 12.669684410095215, + "learning_rate": 7.642817669608536e-07, + "loss": 0.1436, + "num_input_tokens_seen": 2299456, + "step": 4685 + }, + { + "epoch": 0.6189784875280454, + "grad_norm": 0.13082663714885712, + "learning_rate": 7.62043747108629e-07, + "loss": 0.013, + "num_input_tokens_seen": 2301568, + "step": 4690 + }, + { + "epoch": 0.6196383793057938, + "grad_norm": 265.1707458496094, + "learning_rate": 7.598069899422221e-07, + "loss": 0.168, + "num_input_tokens_seen": 2303936, + "step": 4695 + }, + { + "epoch": 0.6202982710835423, + "grad_norm": 12.800505638122559, + "learning_rate": 7.575715073307119e-07, + "loss": 0.1745, + "num_input_tokens_seen": 2306176, + "step": 4700 + }, + { + "epoch": 0.6209581628612908, + "grad_norm": 0.4455643892288208, + "learning_rate": 7.55337311136414e-07, + "loss": 0.0901, + "num_input_tokens_seen": 2308736, + "step": 4705 + }, + { + "epoch": 0.6216180546390392, + "grad_norm": 18.547971725463867, + "learning_rate": 7.531044132148183e-07, + "loss": 0.1379, + "num_input_tokens_seen": 2311104, + "step": 4710 + }, + { + "epoch": 0.6222779464167877, + "grad_norm": 23.932079315185547, + "learning_rate": 7.508728254145245e-07, + "loss": 0.049, + "num_input_tokens_seen": 2313536, + "step": 4715 + }, + { + "epoch": 0.6229378381945361, + "grad_norm": 18.262922286987305, + "learning_rate": 7.486425595771817e-07, + "loss": 0.1208, + "num_input_tokens_seen": 2316032, + "step": 4720 + }, + { + "epoch": 0.6235977299722846, + "grad_norm": 12.403181076049805, + "learning_rate": 7.464136275374223e-07, + "loss": 0.205, + "num_input_tokens_seen": 2318656, + "step": 4725 + }, + { + "epoch": 0.624257621750033, + "grad_norm": 14.224221229553223, + "learning_rate": 7.441860411228029e-07, + "loss": 0.1395, + "num_input_tokens_seen": 2321216, + "step": 4730 + }, + { + "epoch": 0.6249175135277815, + "grad_norm": 48.01051712036133, + "learning_rate": 7.419598121537387e-07, + "loss": 0.1494, + "num_input_tokens_seen": 2323648, + "step": 4735 + }, + { + "epoch": 0.6255774053055299, + "grad_norm": 16.137556076049805, + "learning_rate": 7.397349524434424e-07, + "loss": 0.165, + "num_input_tokens_seen": 2326080, + "step": 4740 + }, + { + "epoch": 0.6262372970832784, + "grad_norm": 13.062948226928711, + "learning_rate": 7.375114737978605e-07, + "loss": 0.0572, + "num_input_tokens_seen": 2328512, + "step": 4745 + }, + { + "epoch": 0.6268971888610267, + "grad_norm": 7.66116189956665, + "learning_rate": 7.352893880156106e-07, + "loss": 0.1462, + "num_input_tokens_seen": 2331008, + "step": 4750 + }, + { + "epoch": 0.6275570806387752, + "grad_norm": 1.405522346496582, + "learning_rate": 7.330687068879202e-07, + "loss": 0.0943, + "num_input_tokens_seen": 2333376, + "step": 4755 + }, + { + "epoch": 0.6282169724165237, + "grad_norm": 224.89602661132812, + "learning_rate": 7.308494421985626e-07, + "loss": 0.2447, + "num_input_tokens_seen": 2335872, + "step": 4760 + }, + { + "epoch": 0.6288768641942721, + "grad_norm": 0.1741466373205185, + "learning_rate": 7.286316057237951e-07, + "loss": 0.0016, + "num_input_tokens_seen": 2338432, + "step": 4765 + }, + { + "epoch": 0.6295367559720206, + "grad_norm": 9.092262268066406, + "learning_rate": 7.264152092322963e-07, + "loss": 0.1152, + "num_input_tokens_seen": 2340928, + "step": 4770 + }, + { + "epoch": 0.630196647749769, + "grad_norm": 0.2725062370300293, + "learning_rate": 7.242002644851035e-07, + "loss": 0.1148, + "num_input_tokens_seen": 2343680, + "step": 4775 + }, + { + "epoch": 0.6308565395275175, + "grad_norm": 0.1986101120710373, + "learning_rate": 7.219867832355508e-07, + "loss": 0.0689, + "num_input_tokens_seen": 2346240, + "step": 4780 + }, + { + "epoch": 0.6315164313052659, + "grad_norm": 0.1735810786485672, + "learning_rate": 7.197747772292071e-07, + "loss": 0.0841, + "num_input_tokens_seen": 2348544, + "step": 4785 + }, + { + "epoch": 0.6321763230830144, + "grad_norm": 0.06138006970286369, + "learning_rate": 7.17564258203811e-07, + "loss": 0.2099, + "num_input_tokens_seen": 2350976, + "step": 4790 + }, + { + "epoch": 0.6328362148607628, + "grad_norm": 21.949594497680664, + "learning_rate": 7.153552378892128e-07, + "loss": 0.115, + "num_input_tokens_seen": 2353216, + "step": 4795 + }, + { + "epoch": 0.6334961066385113, + "grad_norm": 0.6890119314193726, + "learning_rate": 7.131477280073091e-07, + "loss": 0.1212, + "num_input_tokens_seen": 2355584, + "step": 4800 + }, + { + "epoch": 0.6341559984162597, + "grad_norm": 0.19981062412261963, + "learning_rate": 7.109417402719813e-07, + "loss": 0.0817, + "num_input_tokens_seen": 2358144, + "step": 4805 + }, + { + "epoch": 0.6348158901940082, + "grad_norm": 49.97908401489258, + "learning_rate": 7.087372863890346e-07, + "loss": 0.029, + "num_input_tokens_seen": 2360896, + "step": 4810 + }, + { + "epoch": 0.6354757819717566, + "grad_norm": 1.2881401777267456, + "learning_rate": 7.065343780561344e-07, + "loss": 0.2463, + "num_input_tokens_seen": 2363264, + "step": 4815 + }, + { + "epoch": 0.6361356737495051, + "grad_norm": 13.928070068359375, + "learning_rate": 7.043330269627448e-07, + "loss": 0.0744, + "num_input_tokens_seen": 2365632, + "step": 4820 + }, + { + "epoch": 0.6367955655272536, + "grad_norm": 0.07533244788646698, + "learning_rate": 7.021332447900671e-07, + "loss": 0.0018, + "num_input_tokens_seen": 2368000, + "step": 4825 + }, + { + "epoch": 0.637455457305002, + "grad_norm": 199.91444396972656, + "learning_rate": 6.999350432109766e-07, + "loss": 0.1116, + "num_input_tokens_seen": 2370560, + "step": 4830 + }, + { + "epoch": 0.6381153490827505, + "grad_norm": 0.0590510219335556, + "learning_rate": 6.977384338899617e-07, + "loss": 0.0011, + "num_input_tokens_seen": 2373120, + "step": 4835 + }, + { + "epoch": 0.6387752408604989, + "grad_norm": 0.12178171426057816, + "learning_rate": 6.955434284830619e-07, + "loss": 0.033, + "num_input_tokens_seen": 2375872, + "step": 4840 + }, + { + "epoch": 0.6394351326382474, + "grad_norm": 0.07356923073530197, + "learning_rate": 6.933500386378056e-07, + "loss": 0.2167, + "num_input_tokens_seen": 2378432, + "step": 4845 + }, + { + "epoch": 0.6400950244159958, + "grad_norm": 209.99586486816406, + "learning_rate": 6.911582759931482e-07, + "loss": 0.213, + "num_input_tokens_seen": 2380800, + "step": 4850 + }, + { + "epoch": 0.6407549161937443, + "grad_norm": 0.01491602510213852, + "learning_rate": 6.889681521794109e-07, + "loss": 0.2747, + "num_input_tokens_seen": 2383744, + "step": 4855 + }, + { + "epoch": 0.6414148079714926, + "grad_norm": 15.076420783996582, + "learning_rate": 6.867796788182181e-07, + "loss": 0.0758, + "num_input_tokens_seen": 2386112, + "step": 4860 + }, + { + "epoch": 0.6420746997492411, + "grad_norm": 13.008954048156738, + "learning_rate": 6.845928675224366e-07, + "loss": 0.1529, + "num_input_tokens_seen": 2388736, + "step": 4865 + }, + { + "epoch": 0.6427345915269895, + "grad_norm": 0.15090730786323547, + "learning_rate": 6.82407729896114e-07, + "loss": 0.0713, + "num_input_tokens_seen": 2391104, + "step": 4870 + }, + { + "epoch": 0.643394483304738, + "grad_norm": 27.68510627746582, + "learning_rate": 6.802242775344163e-07, + "loss": 0.1204, + "num_input_tokens_seen": 2393728, + "step": 4875 + }, + { + "epoch": 0.6440543750824864, + "grad_norm": 0.20335356891155243, + "learning_rate": 6.780425220235674e-07, + "loss": 0.1797, + "num_input_tokens_seen": 2396480, + "step": 4880 + }, + { + "epoch": 0.6447142668602349, + "grad_norm": 0.1165480837225914, + "learning_rate": 6.758624749407859e-07, + "loss": 0.0011, + "num_input_tokens_seen": 2399104, + "step": 4885 + }, + { + "epoch": 0.6453741586379834, + "grad_norm": 15.720735549926758, + "learning_rate": 6.736841478542264e-07, + "loss": 0.0861, + "num_input_tokens_seen": 2401664, + "step": 4890 + }, + { + "epoch": 0.6460340504157318, + "grad_norm": 2.2438161373138428, + "learning_rate": 6.715075523229151e-07, + "loss": 0.0316, + "num_input_tokens_seen": 2404160, + "step": 4895 + }, + { + "epoch": 0.6466939421934803, + "grad_norm": 77.18789672851562, + "learning_rate": 6.693326998966909e-07, + "loss": 0.1035, + "num_input_tokens_seen": 2406592, + "step": 4900 + }, + { + "epoch": 0.6473538339712287, + "grad_norm": 0.05804076045751572, + "learning_rate": 6.671596021161431e-07, + "loss": 0.0014, + "num_input_tokens_seen": 2409088, + "step": 4905 + }, + { + "epoch": 0.6480137257489772, + "grad_norm": 0.07824068516492844, + "learning_rate": 6.649882705125494e-07, + "loss": 0.1158, + "num_input_tokens_seen": 2411584, + "step": 4910 + }, + { + "epoch": 0.6486736175267256, + "grad_norm": 98.59748077392578, + "learning_rate": 6.628187166078163e-07, + "loss": 0.472, + "num_input_tokens_seen": 2414400, + "step": 4915 + }, + { + "epoch": 0.6493335093044741, + "grad_norm": 54.34969711303711, + "learning_rate": 6.606509519144166e-07, + "loss": 0.0382, + "num_input_tokens_seen": 2416640, + "step": 4920 + }, + { + "epoch": 0.6499934010822225, + "grad_norm": 66.13670349121094, + "learning_rate": 6.584849879353289e-07, + "loss": 0.1297, + "num_input_tokens_seen": 2419136, + "step": 4925 + }, + { + "epoch": 0.6502573577933219, + "eval_loss": 0.09970784932374954, + "eval_runtime": 7.9122, + "eval_samples_per_second": 851.219, + "eval_steps_per_second": 106.418, + "num_input_tokens_seen": 2420096, + "step": 4927 + }, + { + "epoch": 0.650653292859971, + "grad_norm": 0.60494065284729, + "learning_rate": 6.563208361639772e-07, + "loss": 0.0423, + "num_input_tokens_seen": 2421440, + "step": 4930 + }, + { + "epoch": 0.6513131846377194, + "grad_norm": 0.06657727062702179, + "learning_rate": 6.541585080841687e-07, + "loss": 0.0187, + "num_input_tokens_seen": 2424000, + "step": 4935 + }, + { + "epoch": 0.6519730764154679, + "grad_norm": 159.46224975585938, + "learning_rate": 6.519980151700332e-07, + "loss": 0.1785, + "num_input_tokens_seen": 2426240, + "step": 4940 + }, + { + "epoch": 0.6526329681932164, + "grad_norm": 0.16553577780723572, + "learning_rate": 6.498393688859629e-07, + "loss": 0.1136, + "num_input_tokens_seen": 2428864, + "step": 4945 + }, + { + "epoch": 0.6532928599709648, + "grad_norm": 0.052161458879709244, + "learning_rate": 6.47682580686551e-07, + "loss": 0.0011, + "num_input_tokens_seen": 2431296, + "step": 4950 + }, + { + "epoch": 0.6539527517487133, + "grad_norm": 0.05444502457976341, + "learning_rate": 6.455276620165307e-07, + "loss": 0.0017, + "num_input_tokens_seen": 2433984, + "step": 4955 + }, + { + "epoch": 0.6546126435264616, + "grad_norm": 0.030169246718287468, + "learning_rate": 6.433746243107152e-07, + "loss": 0.4128, + "num_input_tokens_seen": 2436224, + "step": 4960 + }, + { + "epoch": 0.6552725353042101, + "grad_norm": 0.1023978590965271, + "learning_rate": 6.412234789939359e-07, + "loss": 0.1516, + "num_input_tokens_seen": 2438720, + "step": 4965 + }, + { + "epoch": 0.6559324270819585, + "grad_norm": 0.13813242316246033, + "learning_rate": 6.390742374809832e-07, + "loss": 0.0589, + "num_input_tokens_seen": 2440960, + "step": 4970 + }, + { + "epoch": 0.656592318859707, + "grad_norm": 0.1587606817483902, + "learning_rate": 6.369269111765454e-07, + "loss": 0.0597, + "num_input_tokens_seen": 2443328, + "step": 4975 + }, + { + "epoch": 0.6572522106374554, + "grad_norm": 0.060975294560194016, + "learning_rate": 6.347815114751465e-07, + "loss": 0.1664, + "num_input_tokens_seen": 2445952, + "step": 4980 + }, + { + "epoch": 0.6579121024152039, + "grad_norm": 0.04723791033029556, + "learning_rate": 6.326380497610886e-07, + "loss": 0.1165, + "num_input_tokens_seen": 2448576, + "step": 4985 + }, + { + "epoch": 0.6585719941929523, + "grad_norm": 35.17012405395508, + "learning_rate": 6.304965374083899e-07, + "loss": 0.3173, + "num_input_tokens_seen": 2451136, + "step": 4990 + }, + { + "epoch": 0.6592318859707008, + "grad_norm": 0.23336689174175262, + "learning_rate": 6.283569857807245e-07, + "loss": 0.002, + "num_input_tokens_seen": 2453632, + "step": 4995 + }, + { + "epoch": 0.6598917777484492, + "grad_norm": 0.17793512344360352, + "learning_rate": 6.262194062313615e-07, + "loss": 0.0644, + "num_input_tokens_seen": 2456192, + "step": 5000 + }, + { + "epoch": 0.6605516695261977, + "grad_norm": 0.052415881305933, + "learning_rate": 6.240838101031063e-07, + "loss": 0.0013, + "num_input_tokens_seen": 2458624, + "step": 5005 + }, + { + "epoch": 0.6612115613039462, + "grad_norm": 0.11415770649909973, + "learning_rate": 6.21950208728239e-07, + "loss": 0.0896, + "num_input_tokens_seen": 2460928, + "step": 5010 + }, + { + "epoch": 0.6618714530816946, + "grad_norm": 0.13506917655467987, + "learning_rate": 6.198186134284554e-07, + "loss": 0.1054, + "num_input_tokens_seen": 2463552, + "step": 5015 + }, + { + "epoch": 0.6625313448594431, + "grad_norm": 0.4825565218925476, + "learning_rate": 6.176890355148049e-07, + "loss": 0.0028, + "num_input_tokens_seen": 2465856, + "step": 5020 + }, + { + "epoch": 0.6631912366371915, + "grad_norm": 0.11778873205184937, + "learning_rate": 6.155614862876335e-07, + "loss": 0.0981, + "num_input_tokens_seen": 2468288, + "step": 5025 + }, + { + "epoch": 0.66385112841494, + "grad_norm": 110.11556243896484, + "learning_rate": 6.134359770365214e-07, + "loss": 0.1368, + "num_input_tokens_seen": 2470912, + "step": 5030 + }, + { + "epoch": 0.6645110201926884, + "grad_norm": 0.7118353843688965, + "learning_rate": 6.11312519040224e-07, + "loss": 0.0711, + "num_input_tokens_seen": 2473536, + "step": 5035 + }, + { + "epoch": 0.6651709119704369, + "grad_norm": 0.08325012028217316, + "learning_rate": 6.091911235666125e-07, + "loss": 0.0009, + "num_input_tokens_seen": 2476032, + "step": 5040 + }, + { + "epoch": 0.6658308037481853, + "grad_norm": 0.13275060057640076, + "learning_rate": 6.070718018726124e-07, + "loss": 0.1034, + "num_input_tokens_seen": 2478208, + "step": 5045 + }, + { + "epoch": 0.6664906955259338, + "grad_norm": 0.11056883633136749, + "learning_rate": 6.049545652041459e-07, + "loss": 0.1196, + "num_input_tokens_seen": 2480512, + "step": 5050 + }, + { + "epoch": 0.6671505873036822, + "grad_norm": 0.7402254939079285, + "learning_rate": 6.028394247960709e-07, + "loss": 0.1824, + "num_input_tokens_seen": 2483008, + "step": 5055 + }, + { + "epoch": 0.6678104790814307, + "grad_norm": 0.04158753529191017, + "learning_rate": 6.007263918721221e-07, + "loss": 0.1399, + "num_input_tokens_seen": 2485376, + "step": 5060 + }, + { + "epoch": 0.668470370859179, + "grad_norm": 0.2165919989347458, + "learning_rate": 5.986154776448507e-07, + "loss": 0.07, + "num_input_tokens_seen": 2488064, + "step": 5065 + }, + { + "epoch": 0.6691302626369275, + "grad_norm": 18.02176284790039, + "learning_rate": 5.965066933155656e-07, + "loss": 0.0635, + "num_input_tokens_seen": 2490624, + "step": 5070 + }, + { + "epoch": 0.669790154414676, + "grad_norm": 26.047637939453125, + "learning_rate": 5.944000500742735e-07, + "loss": 0.2914, + "num_input_tokens_seen": 2493248, + "step": 5075 + }, + { + "epoch": 0.6704500461924244, + "grad_norm": 69.23401641845703, + "learning_rate": 5.922955590996195e-07, + "loss": 0.2126, + "num_input_tokens_seen": 2495744, + "step": 5080 + }, + { + "epoch": 0.6711099379701729, + "grad_norm": 0.13096897304058075, + "learning_rate": 5.901932315588281e-07, + "loss": 0.0014, + "num_input_tokens_seen": 2498176, + "step": 5085 + }, + { + "epoch": 0.6717698297479213, + "grad_norm": 19.673627853393555, + "learning_rate": 5.880930786076441e-07, + "loss": 0.1766, + "num_input_tokens_seen": 2500416, + "step": 5090 + }, + { + "epoch": 0.6724297215256698, + "grad_norm": 148.1903533935547, + "learning_rate": 5.859951113902728e-07, + "loss": 0.0912, + "num_input_tokens_seen": 2502848, + "step": 5095 + }, + { + "epoch": 0.6730896133034182, + "grad_norm": 23.524593353271484, + "learning_rate": 5.83899341039321e-07, + "loss": 0.1217, + "num_input_tokens_seen": 2505152, + "step": 5100 + }, + { + "epoch": 0.6737495050811667, + "grad_norm": 23.715028762817383, + "learning_rate": 5.818057786757386e-07, + "loss": 0.1365, + "num_input_tokens_seen": 2507648, + "step": 5105 + }, + { + "epoch": 0.6744093968589151, + "grad_norm": 0.21634319424629211, + "learning_rate": 5.797144354087588e-07, + "loss": 0.1131, + "num_input_tokens_seen": 2510144, + "step": 5110 + }, + { + "epoch": 0.6750692886366636, + "grad_norm": 0.06485975533723831, + "learning_rate": 5.77625322335839e-07, + "loss": 0.0198, + "num_input_tokens_seen": 2513024, + "step": 5115 + }, + { + "epoch": 0.675729180414412, + "grad_norm": 0.3879457116127014, + "learning_rate": 5.755384505426032e-07, + "loss": 0.0733, + "num_input_tokens_seen": 2515072, + "step": 5120 + }, + { + "epoch": 0.6763890721921605, + "grad_norm": 0.26867377758026123, + "learning_rate": 5.734538311027819e-07, + "loss": 0.0013, + "num_input_tokens_seen": 2517376, + "step": 5125 + }, + { + "epoch": 0.677048963969909, + "grad_norm": 0.730602502822876, + "learning_rate": 5.713714750781533e-07, + "loss": 0.003, + "num_input_tokens_seen": 2520064, + "step": 5130 + }, + { + "epoch": 0.6777088557476574, + "grad_norm": 0.5069525241851807, + "learning_rate": 5.692913935184862e-07, + "loss": 0.0716, + "num_input_tokens_seen": 2522688, + "step": 5135 + }, + { + "epoch": 0.6783687475254059, + "grad_norm": 0.17478005588054657, + "learning_rate": 5.672135974614794e-07, + "loss": 0.0165, + "num_input_tokens_seen": 2525184, + "step": 5140 + }, + { + "epoch": 0.6790286393031543, + "grad_norm": 0.08164742588996887, + "learning_rate": 5.651380979327034e-07, + "loss": 0.0008, + "num_input_tokens_seen": 2527552, + "step": 5145 + }, + { + "epoch": 0.6796885310809028, + "grad_norm": 2.0063724517822266, + "learning_rate": 5.630649059455444e-07, + "loss": 0.0435, + "num_input_tokens_seen": 2530240, + "step": 5150 + }, + { + "epoch": 0.6803484228586512, + "grad_norm": 1.745144248008728, + "learning_rate": 5.609940325011413e-07, + "loss": 0.0116, + "num_input_tokens_seen": 2532480, + "step": 5155 + }, + { + "epoch": 0.6810083146363997, + "grad_norm": 0.13738574087619781, + "learning_rate": 5.589254885883325e-07, + "loss": 0.0006, + "num_input_tokens_seen": 2534912, + "step": 5160 + }, + { + "epoch": 0.681668206414148, + "grad_norm": 0.19333359599113464, + "learning_rate": 5.568592851835936e-07, + "loss": 0.0753, + "num_input_tokens_seen": 2537408, + "step": 5165 + }, + { + "epoch": 0.6823280981918965, + "grad_norm": 0.1132221594452858, + "learning_rate": 5.547954332509805e-07, + "loss": 0.2943, + "num_input_tokens_seen": 2539776, + "step": 5170 + }, + { + "epoch": 0.6829879899696449, + "grad_norm": 0.03335703909397125, + "learning_rate": 5.527339437420717e-07, + "loss": 0.001, + "num_input_tokens_seen": 2542208, + "step": 5175 + }, + { + "epoch": 0.6836478817473934, + "grad_norm": 0.27844464778900146, + "learning_rate": 5.506748275959094e-07, + "loss": 0.0691, + "num_input_tokens_seen": 2544704, + "step": 5180 + }, + { + "epoch": 0.6843077735251418, + "grad_norm": 0.07211031764745712, + "learning_rate": 5.48618095738943e-07, + "loss": 0.0527, + "num_input_tokens_seen": 2547072, + "step": 5185 + }, + { + "epoch": 0.6849676653028903, + "grad_norm": 0.14520291984081268, + "learning_rate": 5.465637590849681e-07, + "loss": 0.121, + "num_input_tokens_seen": 2549440, + "step": 5190 + }, + { + "epoch": 0.6856275570806388, + "grad_norm": 43.26601028442383, + "learning_rate": 5.445118285350723e-07, + "loss": 0.1132, + "num_input_tokens_seen": 2552128, + "step": 5195 + }, + { + "epoch": 0.6862874488583872, + "grad_norm": 0.13170602917671204, + "learning_rate": 5.424623149775745e-07, + "loss": 0.0694, + "num_input_tokens_seen": 2554368, + "step": 5200 + }, + { + "epoch": 0.6869473406361357, + "grad_norm": 0.018987668678164482, + "learning_rate": 5.404152292879676e-07, + "loss": 0.1189, + "num_input_tokens_seen": 2556928, + "step": 5205 + }, + { + "epoch": 0.6876072324138841, + "grad_norm": 20.207496643066406, + "learning_rate": 5.38370582328863e-07, + "loss": 0.1717, + "num_input_tokens_seen": 2559360, + "step": 5210 + }, + { + "epoch": 0.6882671241916326, + "grad_norm": 0.22772113978862762, + "learning_rate": 5.363283849499293e-07, + "loss": 0.1758, + "num_input_tokens_seen": 2561856, + "step": 5215 + }, + { + "epoch": 0.688927015969381, + "grad_norm": 17.795719146728516, + "learning_rate": 5.342886479878387e-07, + "loss": 0.1671, + "num_input_tokens_seen": 2564352, + "step": 5220 + }, + { + "epoch": 0.6895869077471295, + "grad_norm": 0.4601105749607086, + "learning_rate": 5.32251382266206e-07, + "loss": 0.0526, + "num_input_tokens_seen": 2566784, + "step": 5225 + }, + { + "epoch": 0.6902467995248779, + "grad_norm": 0.38812679052352905, + "learning_rate": 5.302165985955327e-07, + "loss": 0.1115, + "num_input_tokens_seen": 2569152, + "step": 5230 + }, + { + "epoch": 0.6909066913026264, + "grad_norm": 0.11644639819860458, + "learning_rate": 5.281843077731511e-07, + "loss": 0.0649, + "num_input_tokens_seen": 2571520, + "step": 5235 + }, + { + "epoch": 0.6915665830803748, + "grad_norm": 79.44305419921875, + "learning_rate": 5.26154520583163e-07, + "loss": 0.0934, + "num_input_tokens_seen": 2574080, + "step": 5240 + }, + { + "epoch": 0.6922264748581233, + "grad_norm": 0.16522075235843658, + "learning_rate": 5.241272477963877e-07, + "loss": 0.1196, + "num_input_tokens_seen": 2576320, + "step": 5245 + }, + { + "epoch": 0.6928863666358717, + "grad_norm": 0.037316884845495224, + "learning_rate": 5.221025001703e-07, + "loss": 0.0494, + "num_input_tokens_seen": 2578752, + "step": 5250 + }, + { + "epoch": 0.6935462584136202, + "grad_norm": 19.88916778564453, + "learning_rate": 5.200802884489768e-07, + "loss": 0.1279, + "num_input_tokens_seen": 2581184, + "step": 5255 + }, + { + "epoch": 0.6942061501913687, + "grad_norm": 17.280460357666016, + "learning_rate": 5.180606233630374e-07, + "loss": 0.2016, + "num_input_tokens_seen": 2583872, + "step": 5260 + }, + { + "epoch": 0.694866041969117, + "grad_norm": 0.17049993574619293, + "learning_rate": 5.160435156295879e-07, + "loss": 0.1809, + "num_input_tokens_seen": 2586304, + "step": 5265 + }, + { + "epoch": 0.6955259337468656, + "grad_norm": 0.04596101865172386, + "learning_rate": 5.14028975952165e-07, + "loss": 0.0593, + "num_input_tokens_seen": 2589056, + "step": 5270 + }, + { + "epoch": 0.6961858255246139, + "grad_norm": 13.068889617919922, + "learning_rate": 5.120170150206768e-07, + "loss": 0.0839, + "num_input_tokens_seen": 2591488, + "step": 5275 + }, + { + "epoch": 0.6968457173023624, + "grad_norm": 25.771705627441406, + "learning_rate": 5.100076435113496e-07, + "loss": 0.0112, + "num_input_tokens_seen": 2593792, + "step": 5280 + }, + { + "epoch": 0.6975056090801108, + "grad_norm": 176.9816436767578, + "learning_rate": 5.080008720866673e-07, + "loss": 0.1564, + "num_input_tokens_seen": 2595968, + "step": 5285 + }, + { + "epoch": 0.6981655008578593, + "grad_norm": 14.442154884338379, + "learning_rate": 5.059967113953173e-07, + "loss": 0.2333, + "num_input_tokens_seen": 2598144, + "step": 5290 + }, + { + "epoch": 0.6988253926356077, + "grad_norm": 0.13442066311836243, + "learning_rate": 5.039951720721349e-07, + "loss": 0.0942, + "num_input_tokens_seen": 2600448, + "step": 5295 + }, + { + "epoch": 0.6994852844133562, + "grad_norm": 0.41721171140670776, + "learning_rate": 5.019962647380429e-07, + "loss": 0.0922, + "num_input_tokens_seen": 2602944, + "step": 5300 + }, + { + "epoch": 0.7001451761911046, + "grad_norm": 78.33120727539062, + "learning_rate": 5.000000000000002e-07, + "loss": 0.1829, + "num_input_tokens_seen": 2605120, + "step": 5305 + }, + { + "epoch": 0.7002771545466544, + "eval_loss": 0.09362584352493286, + "eval_runtime": 8.0352, + "eval_samples_per_second": 838.191, + "eval_steps_per_second": 104.789, + "num_input_tokens_seen": 2605504, + "step": 5306 + }, + { + "epoch": 0.7008050679688531, + "grad_norm": 0.36335432529449463, + "learning_rate": 4.980063884509414e-07, + "loss": 0.0412, + "num_input_tokens_seen": 2607296, + "step": 5310 + }, + { + "epoch": 0.7014649597466015, + "grad_norm": 0.11268818378448486, + "learning_rate": 4.960154406697229e-07, + "loss": 0.0804, + "num_input_tokens_seen": 2609728, + "step": 5315 + }, + { + "epoch": 0.70212485152435, + "grad_norm": 14.370553016662598, + "learning_rate": 4.940271672210667e-07, + "loss": 0.2263, + "num_input_tokens_seen": 2612224, + "step": 5320 + }, + { + "epoch": 0.7027847433020985, + "grad_norm": 0.1433858722448349, + "learning_rate": 4.920415786555025e-07, + "loss": 0.0293, + "num_input_tokens_seen": 2614720, + "step": 5325 + }, + { + "epoch": 0.7034446350798469, + "grad_norm": 0.18172575533390045, + "learning_rate": 4.900586855093144e-07, + "loss": 0.2921, + "num_input_tokens_seen": 2617344, + "step": 5330 + }, + { + "epoch": 0.7041045268575954, + "grad_norm": 20.320568084716797, + "learning_rate": 4.880784983044827e-07, + "loss": 0.1245, + "num_input_tokens_seen": 2619584, + "step": 5335 + }, + { + "epoch": 0.7047644186353438, + "grad_norm": 0.19204528629779816, + "learning_rate": 4.861010275486284e-07, + "loss": 0.0299, + "num_input_tokens_seen": 2621888, + "step": 5340 + }, + { + "epoch": 0.7054243104130923, + "grad_norm": 0.053933948278427124, + "learning_rate": 4.8412628373496e-07, + "loss": 0.0976, + "num_input_tokens_seen": 2624512, + "step": 5345 + }, + { + "epoch": 0.7060842021908407, + "grad_norm": 0.2728992700576782, + "learning_rate": 4.821542773422136e-07, + "loss": 0.0023, + "num_input_tokens_seen": 2627008, + "step": 5350 + }, + { + "epoch": 0.7067440939685892, + "grad_norm": 0.5393227934837341, + "learning_rate": 4.801850188346012e-07, + "loss": 0.0019, + "num_input_tokens_seen": 2629440, + "step": 5355 + }, + { + "epoch": 0.7074039857463376, + "grad_norm": 3.791325092315674, + "learning_rate": 4.782185186617523e-07, + "loss": 0.1053, + "num_input_tokens_seen": 2631872, + "step": 5360 + }, + { + "epoch": 0.7080638775240861, + "grad_norm": 0.12838907539844513, + "learning_rate": 4.762547872586603e-07, + "loss": 0.0618, + "num_input_tokens_seen": 2634560, + "step": 5365 + }, + { + "epoch": 0.7087237693018344, + "grad_norm": 14.399864196777344, + "learning_rate": 4.7429383504562605e-07, + "loss": 0.1344, + "num_input_tokens_seen": 2637120, + "step": 5370 + }, + { + "epoch": 0.709383661079583, + "grad_norm": 0.2652495503425598, + "learning_rate": 4.723356724282029e-07, + "loss": 0.0227, + "num_input_tokens_seen": 2639552, + "step": 5375 + }, + { + "epoch": 0.7100435528573315, + "grad_norm": 20.664852142333984, + "learning_rate": 4.703803097971426e-07, + "loss": 0.128, + "num_input_tokens_seen": 2641984, + "step": 5380 + }, + { + "epoch": 0.7107034446350798, + "grad_norm": 11.795884132385254, + "learning_rate": 4.6842775752833763e-07, + "loss": 0.0719, + "num_input_tokens_seen": 2644352, + "step": 5385 + }, + { + "epoch": 0.7113633364128283, + "grad_norm": 0.1572529375553131, + "learning_rate": 4.664780259827689e-07, + "loss": 0.0018, + "num_input_tokens_seen": 2647040, + "step": 5390 + }, + { + "epoch": 0.7120232281905767, + "grad_norm": 0.04447837546467781, + "learning_rate": 4.6453112550644857e-07, + "loss": 0.001, + "num_input_tokens_seen": 2649472, + "step": 5395 + }, + { + "epoch": 0.7126831199683252, + "grad_norm": 0.3557925522327423, + "learning_rate": 4.625870664303663e-07, + "loss": 0.0643, + "num_input_tokens_seen": 2651840, + "step": 5400 + }, + { + "epoch": 0.7133430117460736, + "grad_norm": 0.15744389593601227, + "learning_rate": 4.6064585907043486e-07, + "loss": 0.0024, + "num_input_tokens_seen": 2654464, + "step": 5405 + }, + { + "epoch": 0.7140029035238221, + "grad_norm": 0.013112170621752739, + "learning_rate": 4.587075137274334e-07, + "loss": 0.0598, + "num_input_tokens_seen": 2656576, + "step": 5410 + }, + { + "epoch": 0.7146627953015705, + "grad_norm": 0.7360963821411133, + "learning_rate": 4.5677204068695597e-07, + "loss": 0.0527, + "num_input_tokens_seen": 2659008, + "step": 5415 + }, + { + "epoch": 0.715322687079319, + "grad_norm": 0.024803217500448227, + "learning_rate": 4.5483945021935356e-07, + "loss": 0.037, + "num_input_tokens_seen": 2661632, + "step": 5420 + }, + { + "epoch": 0.7159825788570674, + "grad_norm": 0.0293336883187294, + "learning_rate": 4.5290975257968155e-07, + "loss": 0.1053, + "num_input_tokens_seen": 2664192, + "step": 5425 + }, + { + "epoch": 0.7166424706348159, + "grad_norm": 37.842960357666016, + "learning_rate": 4.509829580076452e-07, + "loss": 0.185, + "num_input_tokens_seen": 2666624, + "step": 5430 + }, + { + "epoch": 0.7173023624125643, + "grad_norm": 0.14816348254680634, + "learning_rate": 4.490590767275442e-07, + "loss": 0.1415, + "num_input_tokens_seen": 2669120, + "step": 5435 + }, + { + "epoch": 0.7179622541903128, + "grad_norm": 0.13981057703495026, + "learning_rate": 4.4713811894822064e-07, + "loss": 0.1221, + "num_input_tokens_seen": 2671552, + "step": 5440 + }, + { + "epoch": 0.7186221459680613, + "grad_norm": 0.21771204471588135, + "learning_rate": 4.4522009486300204e-07, + "loss": 0.0782, + "num_input_tokens_seen": 2674240, + "step": 5445 + }, + { + "epoch": 0.7192820377458097, + "grad_norm": 0.08881372213363647, + "learning_rate": 4.43305014649649e-07, + "loss": 0.0865, + "num_input_tokens_seen": 2676544, + "step": 5450 + }, + { + "epoch": 0.7199419295235582, + "grad_norm": 0.0907829999923706, + "learning_rate": 4.4139288847030155e-07, + "loss": 0.0004, + "num_input_tokens_seen": 2678912, + "step": 5455 + }, + { + "epoch": 0.7206018213013066, + "grad_norm": 0.06906948238611221, + "learning_rate": 4.394837264714233e-07, + "loss": 0.0538, + "num_input_tokens_seen": 2681344, + "step": 5460 + }, + { + "epoch": 0.7212617130790551, + "grad_norm": 0.9202603697776794, + "learning_rate": 4.3757753878375005e-07, + "loss": 0.0013, + "num_input_tokens_seen": 2683776, + "step": 5465 + }, + { + "epoch": 0.7219216048568035, + "grad_norm": 0.03742950037121773, + "learning_rate": 4.3567433552223375e-07, + "loss": 0.0553, + "num_input_tokens_seen": 2686016, + "step": 5470 + }, + { + "epoch": 0.722581496634552, + "grad_norm": 0.49609553813934326, + "learning_rate": 4.3377412678599e-07, + "loss": 0.1592, + "num_input_tokens_seen": 2688128, + "step": 5475 + }, + { + "epoch": 0.7232413884123003, + "grad_norm": 0.0728292167186737, + "learning_rate": 4.318769226582454e-07, + "loss": 0.1678, + "num_input_tokens_seen": 2690368, + "step": 5480 + }, + { + "epoch": 0.7239012801900488, + "grad_norm": 0.5910032391548157, + "learning_rate": 4.299827332062811e-07, + "loss": 0.0807, + "num_input_tokens_seen": 2692992, + "step": 5485 + }, + { + "epoch": 0.7245611719677972, + "grad_norm": 51.44681930541992, + "learning_rate": 4.2809156848138363e-07, + "loss": 0.0951, + "num_input_tokens_seen": 2695424, + "step": 5490 + }, + { + "epoch": 0.7252210637455457, + "grad_norm": 76.25809478759766, + "learning_rate": 4.2620343851878616e-07, + "loss": 0.1498, + "num_input_tokens_seen": 2697856, + "step": 5495 + }, + { + "epoch": 0.7258809555232941, + "grad_norm": 0.06275495141744614, + "learning_rate": 4.2431835333762123e-07, + "loss": 0.0717, + "num_input_tokens_seen": 2700608, + "step": 5500 + }, + { + "epoch": 0.7265408473010426, + "grad_norm": 0.07024704664945602, + "learning_rate": 4.224363229408628e-07, + "loss": 0.0003, + "num_input_tokens_seen": 2703104, + "step": 5505 + }, + { + "epoch": 0.7272007390787911, + "grad_norm": 78.2071533203125, + "learning_rate": 4.205573573152753e-07, + "loss": 0.2012, + "num_input_tokens_seen": 2705344, + "step": 5510 + }, + { + "epoch": 0.7278606308565395, + "grad_norm": 0.2134246826171875, + "learning_rate": 4.18681466431361e-07, + "loss": 0.0556, + "num_input_tokens_seen": 2707520, + "step": 5515 + }, + { + "epoch": 0.728520522634288, + "grad_norm": 0.714931070804596, + "learning_rate": 4.168086602433055e-07, + "loss": 0.0709, + "num_input_tokens_seen": 2709888, + "step": 5520 + }, + { + "epoch": 0.7291804144120364, + "grad_norm": 0.3997064232826233, + "learning_rate": 4.1493894868892676e-07, + "loss": 0.2017, + "num_input_tokens_seen": 2712192, + "step": 5525 + }, + { + "epoch": 0.7298403061897849, + "grad_norm": 0.4337630271911621, + "learning_rate": 4.1307234168962093e-07, + "loss": 0.0165, + "num_input_tokens_seen": 2714368, + "step": 5530 + }, + { + "epoch": 0.7305001979675333, + "grad_norm": 0.09288299828767776, + "learning_rate": 4.112088491503095e-07, + "loss": 0.0494, + "num_input_tokens_seen": 2716608, + "step": 5535 + }, + { + "epoch": 0.7311600897452818, + "grad_norm": 0.06428027153015137, + "learning_rate": 4.0934848095938937e-07, + "loss": 0.0011, + "num_input_tokens_seen": 2718656, + "step": 5540 + }, + { + "epoch": 0.7318199815230302, + "grad_norm": 0.03982330486178398, + "learning_rate": 4.074912469886763e-07, + "loss": 0.097, + "num_input_tokens_seen": 2721152, + "step": 5545 + }, + { + "epoch": 0.7324798733007787, + "grad_norm": 5.011870861053467, + "learning_rate": 4.0563715709335657e-07, + "loss": 0.0014, + "num_input_tokens_seen": 2723264, + "step": 5550 + }, + { + "epoch": 0.7331397650785271, + "grad_norm": 143.84207153320312, + "learning_rate": 4.037862211119315e-07, + "loss": 0.198, + "num_input_tokens_seen": 2725568, + "step": 5555 + }, + { + "epoch": 0.7337996568562756, + "grad_norm": 0.1886509656906128, + "learning_rate": 4.0193844886616715e-07, + "loss": 0.0634, + "num_input_tokens_seen": 2728192, + "step": 5560 + }, + { + "epoch": 0.7344595486340241, + "grad_norm": 46.56074142456055, + "learning_rate": 4.0009385016104137e-07, + "loss": 0.2335, + "num_input_tokens_seen": 2731072, + "step": 5565 + }, + { + "epoch": 0.7351194404117725, + "grad_norm": 0.030098050832748413, + "learning_rate": 3.9825243478469164e-07, + "loss": 0.0761, + "num_input_tokens_seen": 2733440, + "step": 5570 + }, + { + "epoch": 0.735779332189521, + "grad_norm": 11.673151016235352, + "learning_rate": 3.9641421250836484e-07, + "loss": 0.0718, + "num_input_tokens_seen": 2736064, + "step": 5575 + }, + { + "epoch": 0.7364392239672694, + "grad_norm": 70.8289794921875, + "learning_rate": 3.945791930863622e-07, + "loss": 0.0312, + "num_input_tokens_seen": 2738496, + "step": 5580 + }, + { + "epoch": 0.7370991157450179, + "grad_norm": 0.15004687011241913, + "learning_rate": 3.9274738625599137e-07, + "loss": 0.0019, + "num_input_tokens_seen": 2740800, + "step": 5585 + }, + { + "epoch": 0.7377590075227662, + "grad_norm": 3.4134578704833984, + "learning_rate": 3.909188017375112e-07, + "loss": 0.0637, + "num_input_tokens_seen": 2743104, + "step": 5590 + }, + { + "epoch": 0.7384188993005147, + "grad_norm": 0.05561397597193718, + "learning_rate": 3.890934492340819e-07, + "loss": 0.137, + "num_input_tokens_seen": 2745344, + "step": 5595 + }, + { + "epoch": 0.7390787910782631, + "grad_norm": 19.8775577545166, + "learning_rate": 3.872713384317147e-07, + "loss": 0.0649, + "num_input_tokens_seen": 2747520, + "step": 5600 + }, + { + "epoch": 0.7397386828560116, + "grad_norm": 0.08291494101285934, + "learning_rate": 3.8545247899921776e-07, + "loss": 0.1226, + "num_input_tokens_seen": 2750016, + "step": 5605 + }, + { + "epoch": 0.74039857463376, + "grad_norm": 0.08636556565761566, + "learning_rate": 3.8363688058814614e-07, + "loss": 0.123, + "num_input_tokens_seen": 2752704, + "step": 5610 + }, + { + "epoch": 0.7410584664115085, + "grad_norm": 15.197744369506836, + "learning_rate": 3.818245528327526e-07, + "loss": 0.1293, + "num_input_tokens_seen": 2755328, + "step": 5615 + }, + { + "epoch": 0.7417183581892569, + "grad_norm": 14.93408203125, + "learning_rate": 3.8001550534993164e-07, + "loss": 0.0808, + "num_input_tokens_seen": 2757632, + "step": 5620 + }, + { + "epoch": 0.7423782499670054, + "grad_norm": 0.16387708485126495, + "learning_rate": 3.7820974773917413e-07, + "loss": 0.0508, + "num_input_tokens_seen": 2760192, + "step": 5625 + }, + { + "epoch": 0.7430381417447539, + "grad_norm": 0.04745183512568474, + "learning_rate": 3.764072895825117e-07, + "loss": 0.0011, + "num_input_tokens_seen": 2762816, + "step": 5630 + }, + { + "epoch": 0.7436980335225023, + "grad_norm": 13.764304161071777, + "learning_rate": 3.7460814044446934e-07, + "loss": 0.0735, + "num_input_tokens_seen": 2765120, + "step": 5635 + }, + { + "epoch": 0.7443579253002508, + "grad_norm": 0.09650138765573502, + "learning_rate": 3.72812309872012e-07, + "loss": 0.1235, + "num_input_tokens_seen": 2767808, + "step": 5640 + }, + { + "epoch": 0.7450178170779992, + "grad_norm": 0.39747825264930725, + "learning_rate": 3.71019807394495e-07, + "loss": 0.0109, + "num_input_tokens_seen": 2770176, + "step": 5645 + }, + { + "epoch": 0.7456777088557477, + "grad_norm": 0.43890663981437683, + "learning_rate": 3.6923064252361505e-07, + "loss": 0.1873, + "num_input_tokens_seen": 2772672, + "step": 5650 + }, + { + "epoch": 0.7463376006334961, + "grad_norm": 0.17724739015102386, + "learning_rate": 3.674448247533561e-07, + "loss": 0.1134, + "num_input_tokens_seen": 2775104, + "step": 5655 + }, + { + "epoch": 0.7469974924112446, + "grad_norm": 1.322895884513855, + "learning_rate": 3.656623635599432e-07, + "loss": 0.2252, + "num_input_tokens_seen": 2777792, + "step": 5660 + }, + { + "epoch": 0.747657384188993, + "grad_norm": 64.87480163574219, + "learning_rate": 3.6388326840178865e-07, + "loss": 0.1396, + "num_input_tokens_seen": 2780416, + "step": 5665 + }, + { + "epoch": 0.7483172759667415, + "grad_norm": 0.14808109402656555, + "learning_rate": 3.621075487194435e-07, + "loss": 0.0013, + "num_input_tokens_seen": 2783232, + "step": 5670 + }, + { + "epoch": 0.7489771677444899, + "grad_norm": 7.88364839553833, + "learning_rate": 3.603352139355483e-07, + "loss": 0.1226, + "num_input_tokens_seen": 2785664, + "step": 5675 + }, + { + "epoch": 0.7496370595222384, + "grad_norm": 0.24036580324172974, + "learning_rate": 3.58566273454781e-07, + "loss": 0.0986, + "num_input_tokens_seen": 2788224, + "step": 5680 + }, + { + "epoch": 0.7502969512999867, + "grad_norm": 0.09827781468629837, + "learning_rate": 3.5680073666380817e-07, + "loss": 0.0314, + "num_input_tokens_seen": 2790656, + "step": 5685 + }, + { + "epoch": 0.7502969512999867, + "eval_loss": 0.10055803507566452, + "eval_runtime": 7.8216, + "eval_samples_per_second": 861.081, + "eval_steps_per_second": 107.651, + "num_input_tokens_seen": 2790656, + "step": 5685 + }, + { + "epoch": 0.7509568430777352, + "grad_norm": 0.024036020040512085, + "learning_rate": 3.5503861293123514e-07, + "loss": 0.1421, + "num_input_tokens_seen": 2792960, + "step": 5690 + }, + { + "epoch": 0.7516167348554837, + "grad_norm": 0.17825555801391602, + "learning_rate": 3.532799116075571e-07, + "loss": 0.092, + "num_input_tokens_seen": 2795648, + "step": 5695 + }, + { + "epoch": 0.7522766266332321, + "grad_norm": 19.003950119018555, + "learning_rate": 3.5152464202510777e-07, + "loss": 0.104, + "num_input_tokens_seen": 2797696, + "step": 5700 + }, + { + "epoch": 0.7529365184109806, + "grad_norm": 17.081161499023438, + "learning_rate": 3.4977281349801056e-07, + "loss": 0.1443, + "num_input_tokens_seen": 2800192, + "step": 5705 + }, + { + "epoch": 0.753596410188729, + "grad_norm": 0.1098131462931633, + "learning_rate": 3.4802443532213056e-07, + "loss": 0.0584, + "num_input_tokens_seen": 2802560, + "step": 5710 + }, + { + "epoch": 0.7542563019664775, + "grad_norm": 0.023672033101320267, + "learning_rate": 3.4627951677502233e-07, + "loss": 0.2492, + "num_input_tokens_seen": 2804992, + "step": 5715 + }, + { + "epoch": 0.7549161937442259, + "grad_norm": 0.9849115610122681, + "learning_rate": 3.4453806711588397e-07, + "loss": 0.0061, + "num_input_tokens_seen": 2807296, + "step": 5720 + }, + { + "epoch": 0.7555760855219744, + "grad_norm": 0.09603046625852585, + "learning_rate": 3.428000955855054e-07, + "loss": 0.0309, + "num_input_tokens_seen": 2809984, + "step": 5725 + }, + { + "epoch": 0.7562359772997228, + "grad_norm": 0.11034424602985382, + "learning_rate": 3.4106561140621983e-07, + "loss": 0.0018, + "num_input_tokens_seen": 2812736, + "step": 5730 + }, + { + "epoch": 0.7568958690774713, + "grad_norm": 0.09973105043172836, + "learning_rate": 3.393346237818567e-07, + "loss": 0.173, + "num_input_tokens_seen": 2815040, + "step": 5735 + }, + { + "epoch": 0.7575557608552197, + "grad_norm": 47.743797302246094, + "learning_rate": 3.3760714189769015e-07, + "loss": 0.1591, + "num_input_tokens_seen": 2817344, + "step": 5740 + }, + { + "epoch": 0.7582156526329682, + "grad_norm": 0.07995446026325226, + "learning_rate": 3.3588317492039266e-07, + "loss": 0.024, + "num_input_tokens_seen": 2819648, + "step": 5745 + }, + { + "epoch": 0.7588755444107167, + "grad_norm": 40.636417388916016, + "learning_rate": 3.341627319979834e-07, + "loss": 0.1302, + "num_input_tokens_seen": 2822464, + "step": 5750 + }, + { + "epoch": 0.7595354361884651, + "grad_norm": 84.80926513671875, + "learning_rate": 3.324458222597839e-07, + "loss": 0.2033, + "num_input_tokens_seen": 2824896, + "step": 5755 + }, + { + "epoch": 0.7601953279662136, + "grad_norm": 0.16351526975631714, + "learning_rate": 3.307324548163657e-07, + "loss": 0.0718, + "num_input_tokens_seen": 2827648, + "step": 5760 + }, + { + "epoch": 0.760855219743962, + "grad_norm": 1.872399926185608, + "learning_rate": 3.2902263875950374e-07, + "loss": 0.0575, + "num_input_tokens_seen": 2830336, + "step": 5765 + }, + { + "epoch": 0.7615151115217105, + "grad_norm": 14.924793243408203, + "learning_rate": 3.2731638316212894e-07, + "loss": 0.0498, + "num_input_tokens_seen": 2832640, + "step": 5770 + }, + { + "epoch": 0.7621750032994589, + "grad_norm": 0.5178006291389465, + "learning_rate": 3.256136970782782e-07, + "loss": 0.086, + "num_input_tokens_seen": 2834880, + "step": 5775 + }, + { + "epoch": 0.7628348950772074, + "grad_norm": 0.028780991211533546, + "learning_rate": 3.23914589543047e-07, + "loss": 0.1474, + "num_input_tokens_seen": 2837440, + "step": 5780 + }, + { + "epoch": 0.7634947868549558, + "grad_norm": 29.812068939208984, + "learning_rate": 3.2221906957254276e-07, + "loss": 0.0621, + "num_input_tokens_seen": 2839808, + "step": 5785 + }, + { + "epoch": 0.7641546786327043, + "grad_norm": 0.09762804210186005, + "learning_rate": 3.205271461638346e-07, + "loss": 0.1094, + "num_input_tokens_seen": 2842432, + "step": 5790 + }, + { + "epoch": 0.7648145704104526, + "grad_norm": 0.17772820591926575, + "learning_rate": 3.188388282949085e-07, + "loss": 0.1338, + "num_input_tokens_seen": 2845120, + "step": 5795 + }, + { + "epoch": 0.7654744621882011, + "grad_norm": 46.48423385620117, + "learning_rate": 3.171541249246166e-07, + "loss": 0.1247, + "num_input_tokens_seen": 2848000, + "step": 5800 + }, + { + "epoch": 0.7661343539659495, + "grad_norm": 20.354982376098633, + "learning_rate": 3.154730449926316e-07, + "loss": 0.1788, + "num_input_tokens_seen": 2850624, + "step": 5805 + }, + { + "epoch": 0.766794245743698, + "grad_norm": 0.2434767633676529, + "learning_rate": 3.137955974194e-07, + "loss": 0.1394, + "num_input_tokens_seen": 2852992, + "step": 5810 + }, + { + "epoch": 0.7674541375214465, + "grad_norm": 14.338163375854492, + "learning_rate": 3.1212179110609125e-07, + "loss": 0.0413, + "num_input_tokens_seen": 2855424, + "step": 5815 + }, + { + "epoch": 0.7681140292991949, + "grad_norm": 0.05543454736471176, + "learning_rate": 3.104516349345553e-07, + "loss": 0.1604, + "num_input_tokens_seen": 2857984, + "step": 5820 + }, + { + "epoch": 0.7687739210769434, + "grad_norm": 0.143641859292984, + "learning_rate": 3.0878513776727144e-07, + "loss": 0.0702, + "num_input_tokens_seen": 2860672, + "step": 5825 + }, + { + "epoch": 0.7694338128546918, + "grad_norm": 15.186430931091309, + "learning_rate": 3.0712230844730414e-07, + "loss": 0.1228, + "num_input_tokens_seen": 2863040, + "step": 5830 + }, + { + "epoch": 0.7700937046324403, + "grad_norm": 35.79595947265625, + "learning_rate": 3.054631557982539e-07, + "loss": 0.1412, + "num_input_tokens_seen": 2865856, + "step": 5835 + }, + { + "epoch": 0.7707535964101887, + "grad_norm": 0.11609415709972382, + "learning_rate": 3.0380768862421156e-07, + "loss": 0.108, + "num_input_tokens_seen": 2868096, + "step": 5840 + }, + { + "epoch": 0.7714134881879372, + "grad_norm": 0.14167936146259308, + "learning_rate": 3.0215591570971234e-07, + "loss": 0.001, + "num_input_tokens_seen": 2870784, + "step": 5845 + }, + { + "epoch": 0.7720733799656856, + "grad_norm": 0.7140024304389954, + "learning_rate": 3.005078458196868e-07, + "loss": 0.0313, + "num_input_tokens_seen": 2873216, + "step": 5850 + }, + { + "epoch": 0.7727332717434341, + "grad_norm": 0.13905233144760132, + "learning_rate": 2.988634876994175e-07, + "loss": 0.0011, + "num_input_tokens_seen": 2875776, + "step": 5855 + }, + { + "epoch": 0.7733931635211825, + "grad_norm": 0.11488426476716995, + "learning_rate": 2.972228500744898e-07, + "loss": 0.0322, + "num_input_tokens_seen": 2878336, + "step": 5860 + }, + { + "epoch": 0.774053055298931, + "grad_norm": 18.05517578125, + "learning_rate": 2.955859416507467e-07, + "loss": 0.1583, + "num_input_tokens_seen": 2880896, + "step": 5865 + }, + { + "epoch": 0.7747129470766794, + "grad_norm": 0.03384196758270264, + "learning_rate": 2.9395277111424357e-07, + "loss": 0.0666, + "num_input_tokens_seen": 2883648, + "step": 5870 + }, + { + "epoch": 0.7753728388544279, + "grad_norm": 0.047510821372270584, + "learning_rate": 2.9232334713120035e-07, + "loss": 0.0659, + "num_input_tokens_seen": 2885952, + "step": 5875 + }, + { + "epoch": 0.7760327306321764, + "grad_norm": 0.21850033104419708, + "learning_rate": 2.9069767834795655e-07, + "loss": 0.0666, + "num_input_tokens_seen": 2888576, + "step": 5880 + }, + { + "epoch": 0.7766926224099248, + "grad_norm": 1.7232064008712769, + "learning_rate": 2.8907577339092483e-07, + "loss": 0.139, + "num_input_tokens_seen": 2891136, + "step": 5885 + }, + { + "epoch": 0.7773525141876733, + "grad_norm": 0.034715685993433, + "learning_rate": 2.8745764086654654e-07, + "loss": 0.0791, + "num_input_tokens_seen": 2893696, + "step": 5890 + }, + { + "epoch": 0.7780124059654216, + "grad_norm": 0.3917783796787262, + "learning_rate": 2.8584328936124424e-07, + "loss": 0.0014, + "num_input_tokens_seen": 2896512, + "step": 5895 + }, + { + "epoch": 0.7786722977431701, + "grad_norm": 15.660504341125488, + "learning_rate": 2.8423272744137674e-07, + "loss": 0.1734, + "num_input_tokens_seen": 2899008, + "step": 5900 + }, + { + "epoch": 0.7793321895209185, + "grad_norm": 0.46314364671707153, + "learning_rate": 2.82625963653195e-07, + "loss": 0.0576, + "num_input_tokens_seen": 2901376, + "step": 5905 + }, + { + "epoch": 0.779992081298667, + "grad_norm": 12.847580909729004, + "learning_rate": 2.810230065227944e-07, + "loss": 0.192, + "num_input_tokens_seen": 2903872, + "step": 5910 + }, + { + "epoch": 0.7806519730764154, + "grad_norm": 0.09266316145658493, + "learning_rate": 2.7942386455607203e-07, + "loss": 0.0012, + "num_input_tokens_seen": 2906240, + "step": 5915 + }, + { + "epoch": 0.7813118648541639, + "grad_norm": 0.7352420687675476, + "learning_rate": 2.77828546238679e-07, + "loss": 0.068, + "num_input_tokens_seen": 2908736, + "step": 5920 + }, + { + "epoch": 0.7819717566319123, + "grad_norm": 0.6023374199867249, + "learning_rate": 2.762370600359774e-07, + "loss": 0.1235, + "num_input_tokens_seen": 2911104, + "step": 5925 + }, + { + "epoch": 0.7826316484096608, + "grad_norm": 0.05204444006085396, + "learning_rate": 2.7464941439299484e-07, + "loss": 0.0383, + "num_input_tokens_seen": 2913472, + "step": 5930 + }, + { + "epoch": 0.7832915401874093, + "grad_norm": 13.93787670135498, + "learning_rate": 2.7306561773437887e-07, + "loss": 0.1809, + "num_input_tokens_seen": 2915840, + "step": 5935 + }, + { + "epoch": 0.7839514319651577, + "grad_norm": 0.12649060785770416, + "learning_rate": 2.714856784643533e-07, + "loss": 0.0033, + "num_input_tokens_seen": 2918144, + "step": 5940 + }, + { + "epoch": 0.7846113237429062, + "grad_norm": 0.04809973016381264, + "learning_rate": 2.6990960496667313e-07, + "loss": 0.1415, + "num_input_tokens_seen": 2920768, + "step": 5945 + }, + { + "epoch": 0.7852712155206546, + "grad_norm": 0.12313824892044067, + "learning_rate": 2.6833740560457976e-07, + "loss": 0.0698, + "num_input_tokens_seen": 2923136, + "step": 5950 + }, + { + "epoch": 0.7859311072984031, + "grad_norm": 0.06649130582809448, + "learning_rate": 2.6676908872075757e-07, + "loss": 0.0759, + "num_input_tokens_seen": 2925568, + "step": 5955 + }, + { + "epoch": 0.7865909990761515, + "grad_norm": 0.062394797801971436, + "learning_rate": 2.6520466263728836e-07, + "loss": 0.0742, + "num_input_tokens_seen": 2928064, + "step": 5960 + }, + { + "epoch": 0.7872508908539, + "grad_norm": 19.138282775878906, + "learning_rate": 2.636441356556087e-07, + "loss": 0.2564, + "num_input_tokens_seen": 2930368, + "step": 5965 + }, + { + "epoch": 0.7879107826316484, + "grad_norm": 15.425389289855957, + "learning_rate": 2.620875160564645e-07, + "loss": 0.1123, + "num_input_tokens_seen": 2932928, + "step": 5970 + }, + { + "epoch": 0.7885706744093969, + "grad_norm": 35.93429946899414, + "learning_rate": 2.6053481209986715e-07, + "loss": 0.3593, + "num_input_tokens_seen": 2935360, + "step": 5975 + }, + { + "epoch": 0.7892305661871453, + "grad_norm": 0.08447807282209396, + "learning_rate": 2.5898603202505155e-07, + "loss": 0.059, + "num_input_tokens_seen": 2937920, + "step": 5980 + }, + { + "epoch": 0.7898904579648938, + "grad_norm": 0.1833449751138687, + "learning_rate": 2.5744118405042923e-07, + "loss": 0.0823, + "num_input_tokens_seen": 2940224, + "step": 5985 + }, + { + "epoch": 0.7905503497426422, + "grad_norm": 0.16191020607948303, + "learning_rate": 2.559002763735485e-07, + "loss": 0.0012, + "num_input_tokens_seen": 2942848, + "step": 5990 + }, + { + "epoch": 0.7912102415203907, + "grad_norm": 0.1544707715511322, + "learning_rate": 2.543633171710472e-07, + "loss": 0.0604, + "num_input_tokens_seen": 2945344, + "step": 5995 + }, + { + "epoch": 0.7918701332981392, + "grad_norm": 12.624445915222168, + "learning_rate": 2.5283031459861205e-07, + "loss": 0.008, + "num_input_tokens_seen": 2947840, + "step": 6000 + }, + { + "epoch": 0.7925300250758875, + "grad_norm": 0.09669650346040726, + "learning_rate": 2.5130127679093396e-07, + "loss": 0.0374, + "num_input_tokens_seen": 2950144, + "step": 6005 + }, + { + "epoch": 0.793189916853636, + "grad_norm": 110.95389556884766, + "learning_rate": 2.497762118616652e-07, + "loss": 0.0336, + "num_input_tokens_seen": 2952384, + "step": 6010 + }, + { + "epoch": 0.7938498086313844, + "grad_norm": 0.06578873097896576, + "learning_rate": 2.4825512790337745e-07, + "loss": 0.071, + "num_input_tokens_seen": 2955136, + "step": 6015 + }, + { + "epoch": 0.7945097004091329, + "grad_norm": 24.038101196289062, + "learning_rate": 2.467380329875163e-07, + "loss": 0.0369, + "num_input_tokens_seen": 2957824, + "step": 6020 + }, + { + "epoch": 0.7951695921868813, + "grad_norm": 0.2718788683414459, + "learning_rate": 2.452249351643615e-07, + "loss": 0.0014, + "num_input_tokens_seen": 2960256, + "step": 6025 + }, + { + "epoch": 0.7958294839646298, + "grad_norm": 0.3302108943462372, + "learning_rate": 2.437158424629817e-07, + "loss": 0.1182, + "num_input_tokens_seen": 2962944, + "step": 6030 + }, + { + "epoch": 0.7964893757423782, + "grad_norm": 66.44668579101562, + "learning_rate": 2.422107628911929e-07, + "loss": 0.2256, + "num_input_tokens_seen": 2965504, + "step": 6035 + }, + { + "epoch": 0.7971492675201267, + "grad_norm": 0.32538238167762756, + "learning_rate": 2.4070970443551673e-07, + "loss": 0.274, + "num_input_tokens_seen": 2967744, + "step": 6040 + }, + { + "epoch": 0.7978091592978751, + "grad_norm": 0.16842018067836761, + "learning_rate": 2.392126750611362e-07, + "loss": 0.0032, + "num_input_tokens_seen": 2970240, + "step": 6045 + }, + { + "epoch": 0.7984690510756236, + "grad_norm": 14.741007804870605, + "learning_rate": 2.3771968271185538e-07, + "loss": 0.1761, + "num_input_tokens_seen": 2972928, + "step": 6050 + }, + { + "epoch": 0.799128942853372, + "grad_norm": 0.018400076776742935, + "learning_rate": 2.3623073531005579e-07, + "loss": 0.1485, + "num_input_tokens_seen": 2975168, + "step": 6055 + }, + { + "epoch": 0.7997888346311205, + "grad_norm": 0.2021035999059677, + "learning_rate": 2.3474584075665493e-07, + "loss": 0.1396, + "num_input_tokens_seen": 2977408, + "step": 6060 + }, + { + "epoch": 0.8003167480533192, + "eval_loss": 0.09634685516357422, + "eval_runtime": 8.0558, + "eval_samples_per_second": 836.039, + "eval_steps_per_second": 104.52, + "num_input_tokens_seen": 2979456, + "step": 6064 + }, + { + "epoch": 0.800448726408869, + "grad_norm": 0.04960273206233978, + "learning_rate": 2.3326500693106533e-07, + "loss": 0.0051, + "num_input_tokens_seen": 2979968, + "step": 6065 + }, + { + "epoch": 0.8011086181866174, + "grad_norm": 59.42499542236328, + "learning_rate": 2.3178824169114975e-07, + "loss": 0.2232, + "num_input_tokens_seen": 2982528, + "step": 6070 + }, + { + "epoch": 0.8017685099643659, + "grad_norm": 0.30131280422210693, + "learning_rate": 2.303155528731837e-07, + "loss": 0.0557, + "num_input_tokens_seen": 2984832, + "step": 6075 + }, + { + "epoch": 0.8024284017421143, + "grad_norm": 0.18146446347236633, + "learning_rate": 2.2884694829181016e-07, + "loss": 0.0009, + "num_input_tokens_seen": 2987328, + "step": 6080 + }, + { + "epoch": 0.8030882935198628, + "grad_norm": 0.08123955875635147, + "learning_rate": 2.273824357400005e-07, + "loss": 0.0703, + "num_input_tokens_seen": 2989760, + "step": 6085 + }, + { + "epoch": 0.8037481852976112, + "grad_norm": 0.2558766305446625, + "learning_rate": 2.2592202298901174e-07, + "loss": 0.0457, + "num_input_tokens_seen": 2992320, + "step": 6090 + }, + { + "epoch": 0.8044080770753597, + "grad_norm": 0.09454154968261719, + "learning_rate": 2.2446571778834555e-07, + "loss": 0.0022, + "num_input_tokens_seen": 2995136, + "step": 6095 + }, + { + "epoch": 0.805067968853108, + "grad_norm": 0.08113214373588562, + "learning_rate": 2.2301352786570827e-07, + "loss": 0.0008, + "num_input_tokens_seen": 2998016, + "step": 6100 + }, + { + "epoch": 0.8057278606308566, + "grad_norm": 0.04773727431893349, + "learning_rate": 2.215654609269685e-07, + "loss": 0.1533, + "num_input_tokens_seen": 3000832, + "step": 6105 + }, + { + "epoch": 0.8063877524086049, + "grad_norm": 19.62008285522461, + "learning_rate": 2.201215246561161e-07, + "loss": 0.1716, + "num_input_tokens_seen": 3003584, + "step": 6110 + }, + { + "epoch": 0.8070476441863534, + "grad_norm": 36.953800201416016, + "learning_rate": 2.1868172671522357e-07, + "loss": 0.0731, + "num_input_tokens_seen": 3006464, + "step": 6115 + }, + { + "epoch": 0.8077075359641019, + "grad_norm": 0.20668062567710876, + "learning_rate": 2.1724607474440216e-07, + "loss": 0.107, + "num_input_tokens_seen": 3008896, + "step": 6120 + }, + { + "epoch": 0.8083674277418503, + "grad_norm": 25.05734634399414, + "learning_rate": 2.158145763617646e-07, + "loss": 0.1277, + "num_input_tokens_seen": 3011392, + "step": 6125 + }, + { + "epoch": 0.8090273195195988, + "grad_norm": 0.5729929208755493, + "learning_rate": 2.1438723916338198e-07, + "loss": 0.2135, + "num_input_tokens_seen": 3014016, + "step": 6130 + }, + { + "epoch": 0.8096872112973472, + "grad_norm": 0.34563905000686646, + "learning_rate": 2.1296407072324495e-07, + "loss": 0.1745, + "num_input_tokens_seen": 3016576, + "step": 6135 + }, + { + "epoch": 0.8103471030750957, + "grad_norm": 24.23431396484375, + "learning_rate": 2.1154507859322336e-07, + "loss": 0.0661, + "num_input_tokens_seen": 3019008, + "step": 6140 + }, + { + "epoch": 0.8110069948528441, + "grad_norm": 56.11611557006836, + "learning_rate": 2.101302703030252e-07, + "loss": 0.1033, + "num_input_tokens_seen": 3021504, + "step": 6145 + }, + { + "epoch": 0.8116668866305926, + "grad_norm": 0.6069444417953491, + "learning_rate": 2.0871965336015885e-07, + "loss": 0.0688, + "num_input_tokens_seen": 3023552, + "step": 6150 + }, + { + "epoch": 0.812326778408341, + "grad_norm": 319.5021057128906, + "learning_rate": 2.0731323524989031e-07, + "loss": 0.0896, + "num_input_tokens_seen": 3025856, + "step": 6155 + }, + { + "epoch": 0.8129866701860895, + "grad_norm": 10.510120391845703, + "learning_rate": 2.0591102343520616e-07, + "loss": 0.1915, + "num_input_tokens_seen": 3028096, + "step": 6160 + }, + { + "epoch": 0.8136465619638379, + "grad_norm": 25.165172576904297, + "learning_rate": 2.0451302535677206e-07, + "loss": 0.1774, + "num_input_tokens_seen": 3030528, + "step": 6165 + }, + { + "epoch": 0.8143064537415864, + "grad_norm": 142.08734130859375, + "learning_rate": 2.0311924843289396e-07, + "loss": 0.129, + "num_input_tokens_seen": 3033088, + "step": 6170 + }, + { + "epoch": 0.8149663455193348, + "grad_norm": 0.14164146780967712, + "learning_rate": 2.017297000594794e-07, + "loss": 0.0907, + "num_input_tokens_seen": 3035200, + "step": 6175 + }, + { + "epoch": 0.8156262372970833, + "grad_norm": 0.1182747557759285, + "learning_rate": 2.0034438760999696e-07, + "loss": 0.048, + "num_input_tokens_seen": 3037696, + "step": 6180 + }, + { + "epoch": 0.8162861290748318, + "grad_norm": 16.164520263671875, + "learning_rate": 1.9896331843543856e-07, + "loss": 0.1593, + "num_input_tokens_seen": 3040128, + "step": 6185 + }, + { + "epoch": 0.8169460208525802, + "grad_norm": 0.241964653134346, + "learning_rate": 1.975864998642789e-07, + "loss": 0.1511, + "num_input_tokens_seen": 3042560, + "step": 6190 + }, + { + "epoch": 0.8176059126303287, + "grad_norm": 39.79319381713867, + "learning_rate": 1.9621393920243767e-07, + "loss": 0.2786, + "num_input_tokens_seen": 3044800, + "step": 6195 + }, + { + "epoch": 0.8182658044080771, + "grad_norm": 1.3789013624191284, + "learning_rate": 1.9484564373324074e-07, + "loss": 0.062, + "num_input_tokens_seen": 3047040, + "step": 6200 + }, + { + "epoch": 0.8189256961858256, + "grad_norm": 0.04190517216920853, + "learning_rate": 1.934816207173805e-07, + "loss": 0.0633, + "num_input_tokens_seen": 3049600, + "step": 6205 + }, + { + "epoch": 0.819585587963574, + "grad_norm": 0.25988835096359253, + "learning_rate": 1.9212187739287943e-07, + "loss": 0.1436, + "num_input_tokens_seen": 3052416, + "step": 6210 + }, + { + "epoch": 0.8202454797413224, + "grad_norm": 0.2508937418460846, + "learning_rate": 1.907664209750488e-07, + "loss": 0.0028, + "num_input_tokens_seen": 3055040, + "step": 6215 + }, + { + "epoch": 0.8209053715190708, + "grad_norm": 0.35706770420074463, + "learning_rate": 1.8941525865645336e-07, + "loss": 0.0553, + "num_input_tokens_seen": 3057856, + "step": 6220 + }, + { + "epoch": 0.8215652632968193, + "grad_norm": 83.89398193359375, + "learning_rate": 1.8806839760687076e-07, + "loss": 0.209, + "num_input_tokens_seen": 3060160, + "step": 6225 + }, + { + "epoch": 0.8222251550745677, + "grad_norm": 0.15399783849716187, + "learning_rate": 1.867258449732545e-07, + "loss": 0.1147, + "num_input_tokens_seen": 3062592, + "step": 6230 + }, + { + "epoch": 0.8228850468523162, + "grad_norm": 27.60859489440918, + "learning_rate": 1.8538760787969676e-07, + "loss": 0.0562, + "num_input_tokens_seen": 3065088, + "step": 6235 + }, + { + "epoch": 0.8235449386300646, + "grad_norm": 0.4883517026901245, + "learning_rate": 1.8405369342738907e-07, + "loss": 0.0017, + "num_input_tokens_seen": 3067712, + "step": 6240 + }, + { + "epoch": 0.8242048304078131, + "grad_norm": 0.11648905277252197, + "learning_rate": 1.8272410869458598e-07, + "loss": 0.0602, + "num_input_tokens_seen": 3070144, + "step": 6245 + }, + { + "epoch": 0.8248647221855616, + "grad_norm": 0.22444108128547668, + "learning_rate": 1.8139886073656653e-07, + "loss": 0.2637, + "num_input_tokens_seen": 3072448, + "step": 6250 + }, + { + "epoch": 0.82552461396331, + "grad_norm": 0.2944018840789795, + "learning_rate": 1.800779565855971e-07, + "loss": 0.2488, + "num_input_tokens_seen": 3075072, + "step": 6255 + }, + { + "epoch": 0.8261845057410585, + "grad_norm": 0.07640720903873444, + "learning_rate": 1.7876140325089463e-07, + "loss": 0.0066, + "num_input_tokens_seen": 3077376, + "step": 6260 + }, + { + "epoch": 0.8268443975188069, + "grad_norm": 50.32258605957031, + "learning_rate": 1.774492077185883e-07, + "loss": 0.1657, + "num_input_tokens_seen": 3079808, + "step": 6265 + }, + { + "epoch": 0.8275042892965554, + "grad_norm": 0.03833077847957611, + "learning_rate": 1.7614137695168408e-07, + "loss": 0.0009, + "num_input_tokens_seen": 3082560, + "step": 6270 + }, + { + "epoch": 0.8281641810743038, + "grad_norm": 2.642076015472412, + "learning_rate": 1.748379178900261e-07, + "loss": 0.0715, + "num_input_tokens_seen": 3084608, + "step": 6275 + }, + { + "epoch": 0.8288240728520523, + "grad_norm": 98.66949462890625, + "learning_rate": 1.7353883745026055e-07, + "loss": 0.229, + "num_input_tokens_seen": 3087104, + "step": 6280 + }, + { + "epoch": 0.8294839646298007, + "grad_norm": 4.167269706726074, + "learning_rate": 1.722441425257999e-07, + "loss": 0.1264, + "num_input_tokens_seen": 3089408, + "step": 6285 + }, + { + "epoch": 0.8301438564075492, + "grad_norm": 0.2311401516199112, + "learning_rate": 1.7095383998678402e-07, + "loss": 0.0197, + "num_input_tokens_seen": 3091776, + "step": 6290 + }, + { + "epoch": 0.8308037481852976, + "grad_norm": 0.08988851308822632, + "learning_rate": 1.6966793668004653e-07, + "loss": 0.113, + "num_input_tokens_seen": 3094208, + "step": 6295 + }, + { + "epoch": 0.8314636399630461, + "grad_norm": 0.2825041711330414, + "learning_rate": 1.6838643942907625e-07, + "loss": 0.006, + "num_input_tokens_seen": 3096768, + "step": 6300 + }, + { + "epoch": 0.8321235317407946, + "grad_norm": 39.45750427246094, + "learning_rate": 1.671093550339815e-07, + "loss": 0.0423, + "num_input_tokens_seen": 3099456, + "step": 6305 + }, + { + "epoch": 0.832783423518543, + "grad_norm": 414.50775146484375, + "learning_rate": 1.6583669027145542e-07, + "loss": 0.0422, + "num_input_tokens_seen": 3102208, + "step": 6310 + }, + { + "epoch": 0.8334433152962915, + "grad_norm": 0.2666016221046448, + "learning_rate": 1.6456845189473767e-07, + "loss": 0.0013, + "num_input_tokens_seen": 3104896, + "step": 6315 + }, + { + "epoch": 0.8341032070740398, + "grad_norm": 0.1291654258966446, + "learning_rate": 1.6330464663358123e-07, + "loss": 0.0676, + "num_input_tokens_seen": 3107520, + "step": 6320 + }, + { + "epoch": 0.8347630988517883, + "grad_norm": 0.08973629027605057, + "learning_rate": 1.6204528119421346e-07, + "loss": 0.0017, + "num_input_tokens_seen": 3110144, + "step": 6325 + }, + { + "epoch": 0.8354229906295367, + "grad_norm": 0.12144739925861359, + "learning_rate": 1.607903622593042e-07, + "loss": 0.0483, + "num_input_tokens_seen": 3112768, + "step": 6330 + }, + { + "epoch": 0.8360828824072852, + "grad_norm": 0.026064425706863403, + "learning_rate": 1.5953989648792743e-07, + "loss": 0.0005, + "num_input_tokens_seen": 3115328, + "step": 6335 + }, + { + "epoch": 0.8367427741850336, + "grad_norm": 0.3229873478412628, + "learning_rate": 1.5829389051552678e-07, + "loss": 0.0166, + "num_input_tokens_seen": 3117888, + "step": 6340 + }, + { + "epoch": 0.8374026659627821, + "grad_norm": 107.5579833984375, + "learning_rate": 1.5705235095388136e-07, + "loss": 0.0081, + "num_input_tokens_seen": 3120384, + "step": 6345 + }, + { + "epoch": 0.8380625577405305, + "grad_norm": 0.10149043798446655, + "learning_rate": 1.5581528439106907e-07, + "loss": 0.0288, + "num_input_tokens_seen": 3123008, + "step": 6350 + }, + { + "epoch": 0.838722449518279, + "grad_norm": 0.22135783731937408, + "learning_rate": 1.5458269739143292e-07, + "loss": 0.0373, + "num_input_tokens_seen": 3125504, + "step": 6355 + }, + { + "epoch": 0.8393823412960274, + "grad_norm": 1.0634685754776, + "learning_rate": 1.5335459649554538e-07, + "loss": 0.0028, + "num_input_tokens_seen": 3127744, + "step": 6360 + }, + { + "epoch": 0.8400422330737759, + "grad_norm": 0.06553785502910614, + "learning_rate": 1.5213098822017357e-07, + "loss": 0.1164, + "num_input_tokens_seen": 3130048, + "step": 6365 + }, + { + "epoch": 0.8407021248515244, + "grad_norm": 0.2539460361003876, + "learning_rate": 1.50911879058246e-07, + "loss": 0.0148, + "num_input_tokens_seen": 3132480, + "step": 6370 + }, + { + "epoch": 0.8413620166292728, + "grad_norm": 1.5171750783920288, + "learning_rate": 1.4969727547881628e-07, + "loss": 0.0826, + "num_input_tokens_seen": 3135104, + "step": 6375 + }, + { + "epoch": 0.8420219084070213, + "grad_norm": 16.333852767944336, + "learning_rate": 1.4848718392703052e-07, + "loss": 0.1787, + "num_input_tokens_seen": 3137344, + "step": 6380 + }, + { + "epoch": 0.8426818001847697, + "grad_norm": 19.633960723876953, + "learning_rate": 1.472816108240915e-07, + "loss": 0.1727, + "num_input_tokens_seen": 3140096, + "step": 6385 + }, + { + "epoch": 0.8433416919625182, + "grad_norm": 0.48766201734542847, + "learning_rate": 1.46080562567226e-07, + "loss": 0.0868, + "num_input_tokens_seen": 3142400, + "step": 6390 + }, + { + "epoch": 0.8440015837402666, + "grad_norm": 0.19222283363342285, + "learning_rate": 1.4488404552964993e-07, + "loss": 0.0302, + "num_input_tokens_seen": 3144512, + "step": 6395 + }, + { + "epoch": 0.8446614755180151, + "grad_norm": 35.827850341796875, + "learning_rate": 1.4369206606053463e-07, + "loss": 0.0434, + "num_input_tokens_seen": 3146944, + "step": 6400 + }, + { + "epoch": 0.8453213672957635, + "grad_norm": 0.27888330817222595, + "learning_rate": 1.425046304849742e-07, + "loss": 0.0951, + "num_input_tokens_seen": 3149376, + "step": 6405 + }, + { + "epoch": 0.845981259073512, + "grad_norm": 8.114583015441895, + "learning_rate": 1.4132174510395024e-07, + "loss": 0.1082, + "num_input_tokens_seen": 3151744, + "step": 6410 + }, + { + "epoch": 0.8466411508512603, + "grad_norm": 0.21486525237560272, + "learning_rate": 1.4014341619430003e-07, + "loss": 0.0054, + "num_input_tokens_seen": 3154112, + "step": 6415 + }, + { + "epoch": 0.8473010426290088, + "grad_norm": 0.10914035141468048, + "learning_rate": 1.3896965000868188e-07, + "loss": 0.0044, + "num_input_tokens_seen": 3156480, + "step": 6420 + }, + { + "epoch": 0.8479609344067572, + "grad_norm": 135.10137939453125, + "learning_rate": 1.3780045277554276e-07, + "loss": 0.1166, + "num_input_tokens_seen": 3158784, + "step": 6425 + }, + { + "epoch": 0.8486208261845057, + "grad_norm": 0.17047731578350067, + "learning_rate": 1.3663583069908535e-07, + "loss": 0.1708, + "num_input_tokens_seen": 3161152, + "step": 6430 + }, + { + "epoch": 0.8492807179622542, + "grad_norm": 0.020379789173603058, + "learning_rate": 1.3547578995923447e-07, + "loss": 0.0101, + "num_input_tokens_seen": 3163776, + "step": 6435 + }, + { + "epoch": 0.8499406097400026, + "grad_norm": 41.39136505126953, + "learning_rate": 1.3432033671160458e-07, + "loss": 0.171, + "num_input_tokens_seen": 3166272, + "step": 6440 + }, + { + "epoch": 0.8503365448066517, + "eval_loss": 0.10069070011377335, + "eval_runtime": 7.9053, + "eval_samples_per_second": 851.955, + "eval_steps_per_second": 106.51, + "num_input_tokens_seen": 3167488, + "step": 6443 + }, + { + "epoch": 0.8506005015177511, + "grad_norm": 0.44015660881996155, + "learning_rate": 1.3316947708746762e-07, + "loss": 0.0712, + "num_input_tokens_seen": 3168640, + "step": 6445 + }, + { + "epoch": 0.8512603932954995, + "grad_norm": 0.051551755517721176, + "learning_rate": 1.3202321719371967e-07, + "loss": 0.0922, + "num_input_tokens_seen": 3171008, + "step": 6450 + }, + { + "epoch": 0.851920285073248, + "grad_norm": 0.023698126897215843, + "learning_rate": 1.3088156311284893e-07, + "loss": 0.0878, + "num_input_tokens_seen": 3173312, + "step": 6455 + }, + { + "epoch": 0.8525801768509964, + "grad_norm": 0.08452281355857849, + "learning_rate": 1.2974452090290322e-07, + "loss": 0.2677, + "num_input_tokens_seen": 3175808, + "step": 6460 + }, + { + "epoch": 0.8532400686287449, + "grad_norm": 0.07100846618413925, + "learning_rate": 1.2861209659745865e-07, + "loss": 0.0748, + "num_input_tokens_seen": 3178048, + "step": 6465 + }, + { + "epoch": 0.8538999604064933, + "grad_norm": 0.09944210201501846, + "learning_rate": 1.2748429620558654e-07, + "loss": 0.1044, + "num_input_tokens_seen": 3180544, + "step": 6470 + }, + { + "epoch": 0.8545598521842418, + "grad_norm": 13.341742515563965, + "learning_rate": 1.2636112571182167e-07, + "loss": 0.1888, + "num_input_tokens_seen": 3183040, + "step": 6475 + }, + { + "epoch": 0.8552197439619902, + "grad_norm": 0.08588089793920517, + "learning_rate": 1.2524259107613178e-07, + "loss": 0.1613, + "num_input_tokens_seen": 3185664, + "step": 6480 + }, + { + "epoch": 0.8558796357397387, + "grad_norm": 15.565762519836426, + "learning_rate": 1.2412869823388382e-07, + "loss": 0.1552, + "num_input_tokens_seen": 3188672, + "step": 6485 + }, + { + "epoch": 0.8565395275174872, + "grad_norm": 0.09630011022090912, + "learning_rate": 1.2301945309581486e-07, + "loss": 0.0598, + "num_input_tokens_seen": 3191168, + "step": 6490 + }, + { + "epoch": 0.8571994192952356, + "grad_norm": 139.6576690673828, + "learning_rate": 1.2191486154799846e-07, + "loss": 0.116, + "num_input_tokens_seen": 3193664, + "step": 6495 + }, + { + "epoch": 0.8578593110729841, + "grad_norm": 0.07933595776557922, + "learning_rate": 1.208149294518147e-07, + "loss": 0.001, + "num_input_tokens_seen": 3196224, + "step": 6500 + }, + { + "epoch": 0.8585192028507325, + "grad_norm": 0.09007618576288223, + "learning_rate": 1.1971966264391954e-07, + "loss": 0.1906, + "num_input_tokens_seen": 3198784, + "step": 6505 + }, + { + "epoch": 0.859179094628481, + "grad_norm": 0.08821459859609604, + "learning_rate": 1.1862906693621233e-07, + "loss": 0.1289, + "num_input_tokens_seen": 3201472, + "step": 6510 + }, + { + "epoch": 0.8598389864062294, + "grad_norm": 0.09566283971071243, + "learning_rate": 1.1754314811580623e-07, + "loss": 0.1718, + "num_input_tokens_seen": 3203584, + "step": 6515 + }, + { + "epoch": 0.8604988781839779, + "grad_norm": 0.14483189582824707, + "learning_rate": 1.1646191194499655e-07, + "loss": 0.0728, + "num_input_tokens_seen": 3205888, + "step": 6520 + }, + { + "epoch": 0.8611587699617262, + "grad_norm": 5.497840881347656, + "learning_rate": 1.1538536416123168e-07, + "loss": 0.1805, + "num_input_tokens_seen": 3208000, + "step": 6525 + }, + { + "epoch": 0.8618186617394747, + "grad_norm": 0.27670353651046753, + "learning_rate": 1.1431351047708072e-07, + "loss": 0.0119, + "num_input_tokens_seen": 3210240, + "step": 6530 + }, + { + "epoch": 0.8624785535172231, + "grad_norm": 85.52823638916016, + "learning_rate": 1.1324635658020432e-07, + "loss": 0.1218, + "num_input_tokens_seen": 3212672, + "step": 6535 + }, + { + "epoch": 0.8631384452949716, + "grad_norm": 51.2424430847168, + "learning_rate": 1.1218390813332479e-07, + "loss": 0.1695, + "num_input_tokens_seen": 3215360, + "step": 6540 + }, + { + "epoch": 0.86379833707272, + "grad_norm": 0.06896913796663284, + "learning_rate": 1.1112617077419472e-07, + "loss": 0.1279, + "num_input_tokens_seen": 3218112, + "step": 6545 + }, + { + "epoch": 0.8644582288504685, + "grad_norm": 0.21461394429206848, + "learning_rate": 1.1007315011556884e-07, + "loss": 0.0386, + "num_input_tokens_seen": 3220288, + "step": 6550 + }, + { + "epoch": 0.865118120628217, + "grad_norm": 0.17472003400325775, + "learning_rate": 1.0902485174517251e-07, + "loss": 0.0013, + "num_input_tokens_seen": 3222976, + "step": 6555 + }, + { + "epoch": 0.8657780124059654, + "grad_norm": 0.14662866294384003, + "learning_rate": 1.0798128122567285e-07, + "loss": 0.0532, + "num_input_tokens_seen": 3225472, + "step": 6560 + }, + { + "epoch": 0.8664379041837139, + "grad_norm": 115.46258544921875, + "learning_rate": 1.0694244409464992e-07, + "loss": 0.1791, + "num_input_tokens_seen": 3228096, + "step": 6565 + }, + { + "epoch": 0.8670977959614623, + "grad_norm": 0.0434236116707325, + "learning_rate": 1.0590834586456577e-07, + "loss": 0.1216, + "num_input_tokens_seen": 3230720, + "step": 6570 + }, + { + "epoch": 0.8677576877392108, + "grad_norm": 28.532846450805664, + "learning_rate": 1.0487899202273708e-07, + "loss": 0.1303, + "num_input_tokens_seen": 3233088, + "step": 6575 + }, + { + "epoch": 0.8684175795169592, + "grad_norm": 32.79645919799805, + "learning_rate": 1.0385438803130364e-07, + "loss": 0.1208, + "num_input_tokens_seen": 3235712, + "step": 6580 + }, + { + "epoch": 0.8690774712947077, + "grad_norm": 0.07639691233634949, + "learning_rate": 1.0283453932720199e-07, + "loss": 0.1107, + "num_input_tokens_seen": 3238528, + "step": 6585 + }, + { + "epoch": 0.8697373630724561, + "grad_norm": 0.7503368258476257, + "learning_rate": 1.0181945132213476e-07, + "loss": 0.0808, + "num_input_tokens_seen": 3240896, + "step": 6590 + }, + { + "epoch": 0.8703972548502046, + "grad_norm": 0.1267632097005844, + "learning_rate": 1.0080912940254227e-07, + "loss": 0.0017, + "num_input_tokens_seen": 3243392, + "step": 6595 + }, + { + "epoch": 0.871057146627953, + "grad_norm": 0.19074136018753052, + "learning_rate": 9.980357892957492e-08, + "loss": 0.0143, + "num_input_tokens_seen": 3245824, + "step": 6600 + }, + { + "epoch": 0.8717170384057015, + "grad_norm": 2.3936076164245605, + "learning_rate": 9.880280523906337e-08, + "loss": 0.0015, + "num_input_tokens_seen": 3248128, + "step": 6605 + }, + { + "epoch": 0.8723769301834499, + "grad_norm": 17.094982147216797, + "learning_rate": 9.780681364149091e-08, + "loss": 0.1882, + "num_input_tokens_seen": 3250624, + "step": 6610 + }, + { + "epoch": 0.8730368219611984, + "grad_norm": 0.6837690472602844, + "learning_rate": 9.681560942196587e-08, + "loss": 0.108, + "num_input_tokens_seen": 3253312, + "step": 6615 + }, + { + "epoch": 0.8736967137389469, + "grad_norm": 0.05720958858728409, + "learning_rate": 9.582919784019194e-08, + "loss": 0.1163, + "num_input_tokens_seen": 3255488, + "step": 6620 + }, + { + "epoch": 0.8743566055166953, + "grad_norm": 0.04769499972462654, + "learning_rate": 9.484758413044236e-08, + "loss": 0.0734, + "num_input_tokens_seen": 3257664, + "step": 6625 + }, + { + "epoch": 0.8750164972944438, + "grad_norm": 0.1479378342628479, + "learning_rate": 9.387077350153017e-08, + "loss": 0.099, + "num_input_tokens_seen": 3260160, + "step": 6630 + }, + { + "epoch": 0.8756763890721921, + "grad_norm": 18.90147590637207, + "learning_rate": 9.289877113678168e-08, + "loss": 0.0644, + "num_input_tokens_seen": 3262528, + "step": 6635 + }, + { + "epoch": 0.8763362808499406, + "grad_norm": 0.020846739411354065, + "learning_rate": 9.19315821940092e-08, + "loss": 0.0668, + "num_input_tokens_seen": 3265024, + "step": 6640 + }, + { + "epoch": 0.876996172627689, + "grad_norm": 0.25527259707450867, + "learning_rate": 9.096921180548234e-08, + "loss": 0.157, + "num_input_tokens_seen": 3267456, + "step": 6645 + }, + { + "epoch": 0.8776560644054375, + "grad_norm": 0.35352909564971924, + "learning_rate": 9.001166507790259e-08, + "loss": 0.1047, + "num_input_tokens_seen": 3270208, + "step": 6650 + }, + { + "epoch": 0.8783159561831859, + "grad_norm": 21.19246482849121, + "learning_rate": 8.905894709237427e-08, + "loss": 0.1139, + "num_input_tokens_seen": 3272960, + "step": 6655 + }, + { + "epoch": 0.8789758479609344, + "grad_norm": 0.26658570766448975, + "learning_rate": 8.811106290437975e-08, + "loss": 0.083, + "num_input_tokens_seen": 3275136, + "step": 6660 + }, + { + "epoch": 0.8796357397386828, + "grad_norm": 0.2020629346370697, + "learning_rate": 8.716801754375036e-08, + "loss": 0.0826, + "num_input_tokens_seen": 3277696, + "step": 6665 + }, + { + "epoch": 0.8802956315164313, + "grad_norm": 14.342360496520996, + "learning_rate": 8.62298160146413e-08, + "loss": 0.1297, + "num_input_tokens_seen": 3280064, + "step": 6670 + }, + { + "epoch": 0.8809555232941798, + "grad_norm": 0.19681094586849213, + "learning_rate": 8.529646329550466e-08, + "loss": 0.0166, + "num_input_tokens_seen": 3282304, + "step": 6675 + }, + { + "epoch": 0.8816154150719282, + "grad_norm": 0.16262973845005035, + "learning_rate": 8.436796433906235e-08, + "loss": 0.03, + "num_input_tokens_seen": 3284736, + "step": 6680 + }, + { + "epoch": 0.8822753068496767, + "grad_norm": 40.94983673095703, + "learning_rate": 8.344432407228141e-08, + "loss": 0.0714, + "num_input_tokens_seen": 3287168, + "step": 6685 + }, + { + "epoch": 0.8829351986274251, + "grad_norm": 69.14717102050781, + "learning_rate": 8.252554739634577e-08, + "loss": 0.0623, + "num_input_tokens_seen": 3289600, + "step": 6690 + }, + { + "epoch": 0.8835950904051736, + "grad_norm": 0.04172307625412941, + "learning_rate": 8.16116391866316e-08, + "loss": 0.0589, + "num_input_tokens_seen": 3292160, + "step": 6695 + }, + { + "epoch": 0.884254982182922, + "grad_norm": 14.343789100646973, + "learning_rate": 8.070260429268172e-08, + "loss": 0.1393, + "num_input_tokens_seen": 3294592, + "step": 6700 + }, + { + "epoch": 0.8849148739606705, + "grad_norm": 21.479198455810547, + "learning_rate": 7.979844753817855e-08, + "loss": 0.0539, + "num_input_tokens_seen": 3296960, + "step": 6705 + }, + { + "epoch": 0.8855747657384189, + "grad_norm": 22.292438507080078, + "learning_rate": 7.889917372091982e-08, + "loss": 0.0709, + "num_input_tokens_seen": 3299200, + "step": 6710 + }, + { + "epoch": 0.8862346575161674, + "grad_norm": 13.006369590759277, + "learning_rate": 7.800478761279183e-08, + "loss": 0.2047, + "num_input_tokens_seen": 3301568, + "step": 6715 + }, + { + "epoch": 0.8868945492939158, + "grad_norm": 14.817943572998047, + "learning_rate": 7.711529395974592e-08, + "loss": 0.1478, + "num_input_tokens_seen": 3304064, + "step": 6720 + }, + { + "epoch": 0.8875544410716643, + "grad_norm": 0.05923435837030411, + "learning_rate": 7.623069748177135e-08, + "loss": 0.1855, + "num_input_tokens_seen": 3306432, + "step": 6725 + }, + { + "epoch": 0.8882143328494126, + "grad_norm": 0.2706301510334015, + "learning_rate": 7.535100287287111e-08, + "loss": 0.0866, + "num_input_tokens_seen": 3308736, + "step": 6730 + }, + { + "epoch": 0.8888742246271611, + "grad_norm": 0.10623639822006226, + "learning_rate": 7.447621480103783e-08, + "loss": 0.0024, + "num_input_tokens_seen": 3311168, + "step": 6735 + }, + { + "epoch": 0.8895341164049096, + "grad_norm": 31.206645965576172, + "learning_rate": 7.360633790822713e-08, + "loss": 0.2758, + "num_input_tokens_seen": 3313664, + "step": 6740 + }, + { + "epoch": 0.890194008182658, + "grad_norm": 0.22586752474308014, + "learning_rate": 7.274137681033498e-08, + "loss": 0.044, + "num_input_tokens_seen": 3316224, + "step": 6745 + }, + { + "epoch": 0.8908538999604065, + "grad_norm": 0.25102493166923523, + "learning_rate": 7.188133609717184e-08, + "loss": 0.0791, + "num_input_tokens_seen": 3318464, + "step": 6750 + }, + { + "epoch": 0.8915137917381549, + "grad_norm": 0.05701738968491554, + "learning_rate": 7.102622033243843e-08, + "loss": 0.0008, + "num_input_tokens_seen": 3320896, + "step": 6755 + }, + { + "epoch": 0.8921736835159034, + "grad_norm": 0.2995738983154297, + "learning_rate": 7.017603405370276e-08, + "loss": 0.1241, + "num_input_tokens_seen": 3323648, + "step": 6760 + }, + { + "epoch": 0.8928335752936518, + "grad_norm": 0.19232375919818878, + "learning_rate": 6.933078177237429e-08, + "loss": 0.1568, + "num_input_tokens_seen": 3326208, + "step": 6765 + }, + { + "epoch": 0.8934934670714003, + "grad_norm": 0.24058905243873596, + "learning_rate": 6.849046797368108e-08, + "loss": 0.0287, + "num_input_tokens_seen": 3328576, + "step": 6770 + }, + { + "epoch": 0.8941533588491487, + "grad_norm": 4.3670430183410645, + "learning_rate": 6.765509711664574e-08, + "loss": 0.0018, + "num_input_tokens_seen": 3331520, + "step": 6775 + }, + { + "epoch": 0.8948132506268972, + "grad_norm": 0.28316637873649597, + "learning_rate": 6.682467363406174e-08, + "loss": 0.0488, + "num_input_tokens_seen": 3334336, + "step": 6780 + }, + { + "epoch": 0.8954731424046456, + "grad_norm": 0.2006041258573532, + "learning_rate": 6.59992019324701e-08, + "loss": 0.0703, + "num_input_tokens_seen": 3336896, + "step": 6785 + }, + { + "epoch": 0.8961330341823941, + "grad_norm": 12.302181243896484, + "learning_rate": 6.517868639213553e-08, + "loss": 0.0708, + "num_input_tokens_seen": 3339328, + "step": 6790 + }, + { + "epoch": 0.8967929259601425, + "grad_norm": 0.21891701221466064, + "learning_rate": 6.436313136702387e-08, + "loss": 0.0182, + "num_input_tokens_seen": 3341760, + "step": 6795 + }, + { + "epoch": 0.897452817737891, + "grad_norm": 18.251375198364258, + "learning_rate": 6.355254118477815e-08, + "loss": 0.0659, + "num_input_tokens_seen": 3344448, + "step": 6800 + }, + { + "epoch": 0.8981127095156395, + "grad_norm": 0.09570349752902985, + "learning_rate": 6.274692014669602e-08, + "loss": 0.001, + "num_input_tokens_seen": 3347008, + "step": 6805 + }, + { + "epoch": 0.8987726012933879, + "grad_norm": 0.09717115759849548, + "learning_rate": 6.194627252770768e-08, + "loss": 0.0006, + "num_input_tokens_seen": 3349824, + "step": 6810 + }, + { + "epoch": 0.8994324930711364, + "grad_norm": 0.06764009594917297, + "learning_rate": 6.115060257635174e-08, + "loss": 0.0903, + "num_input_tokens_seen": 3352320, + "step": 6815 + }, + { + "epoch": 0.9000923848488848, + "grad_norm": 0.19751790165901184, + "learning_rate": 6.035991451475375e-08, + "loss": 0.0013, + "num_input_tokens_seen": 3354688, + "step": 6820 + }, + { + "epoch": 0.9003563415599841, + "eval_loss": 0.09756959229707718, + "eval_runtime": 8.0458, + "eval_samples_per_second": 837.078, + "eval_steps_per_second": 104.65, + "num_input_tokens_seen": 3355520, + "step": 6822 + }, + { + "epoch": 0.9007522766266333, + "grad_norm": 0.013898173347115517, + "learning_rate": 5.9574212538603505e-08, + "loss": 0.0663, + "num_input_tokens_seen": 3357056, + "step": 6825 + }, + { + "epoch": 0.9014121684043817, + "grad_norm": 26.278072357177734, + "learning_rate": 5.879350081713252e-08, + "loss": 0.066, + "num_input_tokens_seen": 3359488, + "step": 6830 + }, + { + "epoch": 0.9020720601821302, + "grad_norm": 0.15908479690551758, + "learning_rate": 5.8017783493092386e-08, + "loss": 0.2437, + "num_input_tokens_seen": 3361920, + "step": 6835 + }, + { + "epoch": 0.9027319519598785, + "grad_norm": 0.18942204117774963, + "learning_rate": 5.7247064682732104e-08, + "loss": 0.0012, + "num_input_tokens_seen": 3364416, + "step": 6840 + }, + { + "epoch": 0.903391843737627, + "grad_norm": 0.23464049398899078, + "learning_rate": 5.6481348475777566e-08, + "loss": 0.0617, + "num_input_tokens_seen": 3366912, + "step": 6845 + }, + { + "epoch": 0.9040517355153754, + "grad_norm": 0.01882772147655487, + "learning_rate": 5.5720638935407796e-08, + "loss": 0.0012, + "num_input_tokens_seen": 3369088, + "step": 6850 + }, + { + "epoch": 0.9047116272931239, + "grad_norm": 0.01236939337104559, + "learning_rate": 5.49649400982356e-08, + "loss": 0.1105, + "num_input_tokens_seen": 3371520, + "step": 6855 + }, + { + "epoch": 0.9053715190708723, + "grad_norm": 0.031979262828826904, + "learning_rate": 5.421425597428442e-08, + "loss": 0.0005, + "num_input_tokens_seen": 3374080, + "step": 6860 + }, + { + "epoch": 0.9060314108486208, + "grad_norm": 104.13761138916016, + "learning_rate": 5.346859054696784e-08, + "loss": 0.1294, + "num_input_tokens_seen": 3376640, + "step": 6865 + }, + { + "epoch": 0.9066913026263693, + "grad_norm": 0.019581180065870285, + "learning_rate": 5.2727947773068773e-08, + "loss": 0.0709, + "num_input_tokens_seen": 3379072, + "step": 6870 + }, + { + "epoch": 0.9073511944041177, + "grad_norm": 0.8969870805740356, + "learning_rate": 5.199233158271732e-08, + "loss": 0.069, + "num_input_tokens_seen": 3381696, + "step": 6875 + }, + { + "epoch": 0.9080110861818662, + "grad_norm": 15.742879867553711, + "learning_rate": 5.126174587937149e-08, + "loss": 0.2041, + "num_input_tokens_seen": 3384064, + "step": 6880 + }, + { + "epoch": 0.9086709779596146, + "grad_norm": 0.0772380605340004, + "learning_rate": 5.053619453979485e-08, + "loss": 0.0024, + "num_input_tokens_seen": 3386304, + "step": 6885 + }, + { + "epoch": 0.9093308697373631, + "grad_norm": 0.030766058713197708, + "learning_rate": 4.9815681414037025e-08, + "loss": 0.1257, + "num_input_tokens_seen": 3388800, + "step": 6890 + }, + { + "epoch": 0.9099907615151115, + "grad_norm": 0.5838080048561096, + "learning_rate": 4.910021032541334e-08, + "loss": 0.097, + "num_input_tokens_seen": 3391232, + "step": 6895 + }, + { + "epoch": 0.91065065329286, + "grad_norm": 25.251256942749023, + "learning_rate": 4.838978507048319e-08, + "loss": 0.1039, + "num_input_tokens_seen": 3393664, + "step": 6900 + }, + { + "epoch": 0.9113105450706084, + "grad_norm": 0.1599751114845276, + "learning_rate": 4.768440941903207e-08, + "loss": 0.0018, + "num_input_tokens_seen": 3395968, + "step": 6905 + }, + { + "epoch": 0.9119704368483569, + "grad_norm": 0.09924237430095673, + "learning_rate": 4.698408711404944e-08, + "loss": 0.0407, + "num_input_tokens_seen": 3398272, + "step": 6910 + }, + { + "epoch": 0.9126303286261053, + "grad_norm": 22.53904914855957, + "learning_rate": 4.628882187171046e-08, + "loss": 0.0894, + "num_input_tokens_seen": 3400960, + "step": 6915 + }, + { + "epoch": 0.9132902204038538, + "grad_norm": 23.106115341186523, + "learning_rate": 4.559861738135506e-08, + "loss": 0.1429, + "num_input_tokens_seen": 3403520, + "step": 6920 + }, + { + "epoch": 0.9139501121816023, + "grad_norm": 0.8851416110992432, + "learning_rate": 4.491347730546913e-08, + "loss": 0.2526, + "num_input_tokens_seen": 3405952, + "step": 6925 + }, + { + "epoch": 0.9146100039593507, + "grad_norm": 18.905851364135742, + "learning_rate": 4.423340527966512e-08, + "loss": 0.1429, + "num_input_tokens_seen": 3408320, + "step": 6930 + }, + { + "epoch": 0.9152698957370992, + "grad_norm": 0.1432974636554718, + "learning_rate": 4.355840491266205e-08, + "loss": 0.0675, + "num_input_tokens_seen": 3410880, + "step": 6935 + }, + { + "epoch": 0.9159297875148475, + "grad_norm": 0.04884126037359238, + "learning_rate": 4.288847978626686e-08, + "loss": 0.0589, + "num_input_tokens_seen": 3413440, + "step": 6940 + }, + { + "epoch": 0.916589679292596, + "grad_norm": 490.322265625, + "learning_rate": 4.222363345535585e-08, + "loss": 0.0656, + "num_input_tokens_seen": 3416000, + "step": 6945 + }, + { + "epoch": 0.9172495710703444, + "grad_norm": 17.165851593017578, + "learning_rate": 4.1563869447854505e-08, + "loss": 0.1151, + "num_input_tokens_seen": 3418240, + "step": 6950 + }, + { + "epoch": 0.9179094628480929, + "grad_norm": 0.17861710488796234, + "learning_rate": 4.090919126472048e-08, + "loss": 0.1535, + "num_input_tokens_seen": 3420672, + "step": 6955 + }, + { + "epoch": 0.9185693546258413, + "grad_norm": 0.6773964166641235, + "learning_rate": 4.025960237992332e-08, + "loss": 0.0099, + "num_input_tokens_seen": 3422912, + "step": 6960 + }, + { + "epoch": 0.9192292464035898, + "grad_norm": 79.64431762695312, + "learning_rate": 3.961510624042741e-08, + "loss": 0.0129, + "num_input_tokens_seen": 3425408, + "step": 6965 + }, + { + "epoch": 0.9198891381813382, + "grad_norm": 22.402997970581055, + "learning_rate": 3.8975706266172636e-08, + "loss": 0.1038, + "num_input_tokens_seen": 3427776, + "step": 6970 + }, + { + "epoch": 0.9205490299590867, + "grad_norm": 17.22422218322754, + "learning_rate": 3.834140585005696e-08, + "loss": 0.1456, + "num_input_tokens_seen": 3430336, + "step": 6975 + }, + { + "epoch": 0.9212089217368351, + "grad_norm": 35.29188919067383, + "learning_rate": 3.771220835791844e-08, + "loss": 0.192, + "num_input_tokens_seen": 3432896, + "step": 6980 + }, + { + "epoch": 0.9218688135145836, + "grad_norm": 0.24460290372371674, + "learning_rate": 3.708811712851634e-08, + "loss": 0.023, + "num_input_tokens_seen": 3435136, + "step": 6985 + }, + { + "epoch": 0.9225287052923321, + "grad_norm": 0.08124759048223495, + "learning_rate": 3.6469135473514936e-08, + "loss": 0.0816, + "num_input_tokens_seen": 3437824, + "step": 6990 + }, + { + "epoch": 0.9231885970700805, + "grad_norm": 0.0361192487180233, + "learning_rate": 3.5855266677464744e-08, + "loss": 0.0381, + "num_input_tokens_seen": 3440320, + "step": 6995 + }, + { + "epoch": 0.923848488847829, + "grad_norm": 0.23591069877147675, + "learning_rate": 3.524651399778555e-08, + "loss": 0.0565, + "num_input_tokens_seen": 3442880, + "step": 7000 + }, + { + "epoch": 0.9245083806255774, + "grad_norm": 0.06923260539770126, + "learning_rate": 3.4642880664749296e-08, + "loss": 0.0016, + "num_input_tokens_seen": 3445120, + "step": 7005 + }, + { + "epoch": 0.9251682724033259, + "grad_norm": 0.1492045372724533, + "learning_rate": 3.404436988146242e-08, + "loss": 0.1966, + "num_input_tokens_seen": 3447424, + "step": 7010 + }, + { + "epoch": 0.9258281641810743, + "grad_norm": 0.01087052933871746, + "learning_rate": 3.345098482384956e-08, + "loss": 0.0537, + "num_input_tokens_seen": 3449920, + "step": 7015 + }, + { + "epoch": 0.9264880559588228, + "grad_norm": 0.2497768998146057, + "learning_rate": 3.2862728640636105e-08, + "loss": 0.0494, + "num_input_tokens_seen": 3452416, + "step": 7020 + }, + { + "epoch": 0.9271479477365712, + "grad_norm": 18.70515251159668, + "learning_rate": 3.227960445333155e-08, + "loss": 0.1016, + "num_input_tokens_seen": 3454912, + "step": 7025 + }, + { + "epoch": 0.9278078395143197, + "grad_norm": 0.039576705545186996, + "learning_rate": 3.1701615356213295e-08, + "loss": 0.0633, + "num_input_tokens_seen": 3457472, + "step": 7030 + }, + { + "epoch": 0.928467731292068, + "grad_norm": 0.12152862548828125, + "learning_rate": 3.112876441630985e-08, + "loss": 0.0683, + "num_input_tokens_seen": 3459712, + "step": 7035 + }, + { + "epoch": 0.9291276230698166, + "grad_norm": 0.22948475182056427, + "learning_rate": 3.05610546733851e-08, + "loss": 0.0577, + "num_input_tokens_seen": 3462144, + "step": 7040 + }, + { + "epoch": 0.9297875148475649, + "grad_norm": 18.062097549438477, + "learning_rate": 2.99984891399212e-08, + "loss": 0.2195, + "num_input_tokens_seen": 3464512, + "step": 7045 + }, + { + "epoch": 0.9304474066253134, + "grad_norm": 0.03376483917236328, + "learning_rate": 2.9441070801103808e-08, + "loss": 0.0013, + "num_input_tokens_seen": 3466880, + "step": 7050 + }, + { + "epoch": 0.931107298403062, + "grad_norm": 0.17363989353179932, + "learning_rate": 2.8888802614805085e-08, + "loss": 0.1014, + "num_input_tokens_seen": 3469248, + "step": 7055 + }, + { + "epoch": 0.9317671901808103, + "grad_norm": 75.9137191772461, + "learning_rate": 2.8341687511568734e-08, + "loss": 0.2786, + "num_input_tokens_seen": 3471616, + "step": 7060 + }, + { + "epoch": 0.9324270819585588, + "grad_norm": 0.2475104182958603, + "learning_rate": 2.7799728394594547e-08, + "loss": 0.082, + "num_input_tokens_seen": 3474240, + "step": 7065 + }, + { + "epoch": 0.9330869737363072, + "grad_norm": 0.09209995716810226, + "learning_rate": 2.7262928139722198e-08, + "loss": 0.0789, + "num_input_tokens_seen": 3476800, + "step": 7070 + }, + { + "epoch": 0.9337468655140557, + "grad_norm": 0.04198440536856651, + "learning_rate": 2.673128959541693e-08, + "loss": 0.0807, + "num_input_tokens_seen": 3479488, + "step": 7075 + }, + { + "epoch": 0.9344067572918041, + "grad_norm": 0.019190721213817596, + "learning_rate": 2.620481558275367e-08, + "loss": 0.0005, + "num_input_tokens_seen": 3482176, + "step": 7080 + }, + { + "epoch": 0.9350666490695526, + "grad_norm": 16.029815673828125, + "learning_rate": 2.5683508895402382e-08, + "loss": 0.0278, + "num_input_tokens_seen": 3484800, + "step": 7085 + }, + { + "epoch": 0.935726540847301, + "grad_norm": 14.575031280517578, + "learning_rate": 2.5167372299613853e-08, + "loss": 0.1436, + "num_input_tokens_seen": 3487488, + "step": 7090 + }, + { + "epoch": 0.9363864326250495, + "grad_norm": 14.435125350952148, + "learning_rate": 2.4656408534203365e-08, + "loss": 0.2508, + "num_input_tokens_seen": 3489728, + "step": 7095 + }, + { + "epoch": 0.9370463244027979, + "grad_norm": 0.028600651770830154, + "learning_rate": 2.4150620310538273e-08, + "loss": 0.2469, + "num_input_tokens_seen": 3491904, + "step": 7100 + }, + { + "epoch": 0.9377062161805464, + "grad_norm": 15.751771926879883, + "learning_rate": 2.3650010312521673e-08, + "loss": 0.0832, + "num_input_tokens_seen": 3494592, + "step": 7105 + }, + { + "epoch": 0.9383661079582949, + "grad_norm": 0.0997326597571373, + "learning_rate": 2.3154581196579648e-08, + "loss": 0.1798, + "num_input_tokens_seen": 3497088, + "step": 7110 + }, + { + "epoch": 0.9390259997360433, + "grad_norm": 0.07149897515773773, + "learning_rate": 2.2664335591646377e-08, + "loss": 0.0559, + "num_input_tokens_seen": 3499520, + "step": 7115 + }, + { + "epoch": 0.9396858915137918, + "grad_norm": 0.024605661630630493, + "learning_rate": 2.2179276099150158e-08, + "loss": 0.2113, + "num_input_tokens_seen": 3502208, + "step": 7120 + }, + { + "epoch": 0.9403457832915402, + "grad_norm": 81.53313446044922, + "learning_rate": 2.1699405293000182e-08, + "loss": 0.1584, + "num_input_tokens_seen": 3504640, + "step": 7125 + }, + { + "epoch": 0.9410056750692887, + "grad_norm": 0.09356902539730072, + "learning_rate": 2.1224725719572235e-08, + "loss": 0.0448, + "num_input_tokens_seen": 3506944, + "step": 7130 + }, + { + "epoch": 0.9416655668470371, + "grad_norm": 0.28894391655921936, + "learning_rate": 2.0755239897695453e-08, + "loss": 0.0454, + "num_input_tokens_seen": 3509376, + "step": 7135 + }, + { + "epoch": 0.9423254586247856, + "grad_norm": 0.5616478323936462, + "learning_rate": 2.0290950318639256e-08, + "loss": 0.1705, + "num_input_tokens_seen": 3511680, + "step": 7140 + }, + { + "epoch": 0.942985350402534, + "grad_norm": 2.1705074310302734, + "learning_rate": 1.983185944609944e-08, + "loss": 0.0576, + "num_input_tokens_seen": 3514112, + "step": 7145 + }, + { + "epoch": 0.9436452421802825, + "grad_norm": 0.15767821669578552, + "learning_rate": 1.9377969716185994e-08, + "loss": 0.0709, + "num_input_tokens_seen": 3516480, + "step": 7150 + }, + { + "epoch": 0.9443051339580308, + "grad_norm": 0.03708624094724655, + "learning_rate": 1.8929283537408968e-08, + "loss": 0.1222, + "num_input_tokens_seen": 3518720, + "step": 7155 + }, + { + "epoch": 0.9449650257357793, + "grad_norm": 0.16703498363494873, + "learning_rate": 1.848580329066718e-08, + "loss": 0.0012, + "num_input_tokens_seen": 3521216, + "step": 7160 + }, + { + "epoch": 0.9456249175135277, + "grad_norm": 17.98069953918457, + "learning_rate": 1.804753132923431e-08, + "loss": 0.4089, + "num_input_tokens_seen": 3523776, + "step": 7165 + }, + { + "epoch": 0.9462848092912762, + "grad_norm": 0.2615845799446106, + "learning_rate": 1.7614469978746827e-08, + "loss": 0.0013, + "num_input_tokens_seen": 3526272, + "step": 7170 + }, + { + "epoch": 0.9469447010690247, + "grad_norm": 61.300594329833984, + "learning_rate": 1.7186621537192304e-08, + "loss": 0.0095, + "num_input_tokens_seen": 3528576, + "step": 7175 + }, + { + "epoch": 0.9476045928467731, + "grad_norm": 0.127578467130661, + "learning_rate": 1.6763988274896003e-08, + "loss": 0.0009, + "num_input_tokens_seen": 3531136, + "step": 7180 + }, + { + "epoch": 0.9482644846245216, + "grad_norm": 15.952384948730469, + "learning_rate": 1.6346572434509876e-08, + "loss": 0.159, + "num_input_tokens_seen": 3533696, + "step": 7185 + }, + { + "epoch": 0.94892437640227, + "grad_norm": 1.98032808303833, + "learning_rate": 1.5934376231000248e-08, + "loss": 0.1343, + "num_input_tokens_seen": 3536064, + "step": 7190 + }, + { + "epoch": 0.9495842681800185, + "grad_norm": 0.20912101864814758, + "learning_rate": 1.55274018516357e-08, + "loss": 0.0016, + "num_input_tokens_seen": 3538432, + "step": 7195 + }, + { + "epoch": 0.9502441599577669, + "grad_norm": 0.0482788160443306, + "learning_rate": 1.512565145597633e-08, + "loss": 0.0683, + "num_input_tokens_seen": 3541120, + "step": 7200 + }, + { + "epoch": 0.9503761383133166, + "eval_loss": 0.09811879694461823, + "eval_runtime": 7.9135, + "eval_samples_per_second": 851.075, + "eval_steps_per_second": 106.4, + "num_input_tokens_seen": 3541632, + "step": 7201 + }, + { + "epoch": 0.9509040517355154, + "grad_norm": 32.42230987548828, + "learning_rate": 1.47291271758615e-08, + "loss": 0.0802, + "num_input_tokens_seen": 3543680, + "step": 7205 + }, + { + "epoch": 0.9515639435132638, + "grad_norm": 22.951187133789062, + "learning_rate": 1.4337831115398991e-08, + "loss": 0.1379, + "num_input_tokens_seen": 3545984, + "step": 7210 + }, + { + "epoch": 0.9522238352910123, + "grad_norm": 21.046493530273438, + "learning_rate": 1.3951765350953548e-08, + "loss": 0.1338, + "num_input_tokens_seen": 3548544, + "step": 7215 + }, + { + "epoch": 0.9528837270687607, + "grad_norm": 0.031218115240335464, + "learning_rate": 1.3570931931136009e-08, + "loss": 0.0956, + "num_input_tokens_seen": 3551040, + "step": 7220 + }, + { + "epoch": 0.9535436188465092, + "grad_norm": 0.17024770379066467, + "learning_rate": 1.3195332876792532e-08, + "loss": 0.0867, + "num_input_tokens_seen": 3553536, + "step": 7225 + }, + { + "epoch": 0.9542035106242576, + "grad_norm": 0.06077006831765175, + "learning_rate": 1.2824970180993488e-08, + "loss": 0.1628, + "num_input_tokens_seen": 3555712, + "step": 7230 + }, + { + "epoch": 0.9548634024020061, + "grad_norm": 0.11309027671813965, + "learning_rate": 1.2459845809023484e-08, + "loss": 0.1277, + "num_input_tokens_seen": 3558080, + "step": 7235 + }, + { + "epoch": 0.9555232941797546, + "grad_norm": 27.433135986328125, + "learning_rate": 1.2099961698370353e-08, + "loss": 0.3486, + "num_input_tokens_seen": 3560640, + "step": 7240 + }, + { + "epoch": 0.956183185957503, + "grad_norm": 14.181526184082031, + "learning_rate": 1.1745319758715288e-08, + "loss": 0.0935, + "num_input_tokens_seen": 3563392, + "step": 7245 + }, + { + "epoch": 0.9568430777352515, + "grad_norm": 17.118762969970703, + "learning_rate": 1.1395921871922509e-08, + "loss": 0.1487, + "num_input_tokens_seen": 3565824, + "step": 7250 + }, + { + "epoch": 0.9575029695129998, + "grad_norm": 0.10188383609056473, + "learning_rate": 1.105176989202905e-08, + "loss": 0.0008, + "num_input_tokens_seen": 3568256, + "step": 7255 + }, + { + "epoch": 0.9581628612907483, + "grad_norm": 52.97846603393555, + "learning_rate": 1.0712865645235659e-08, + "loss": 0.0075, + "num_input_tokens_seen": 3570752, + "step": 7260 + }, + { + "epoch": 0.9588227530684967, + "grad_norm": 0.1891770213842392, + "learning_rate": 1.0379210929896131e-08, + "loss": 0.0681, + "num_input_tokens_seen": 3572928, + "step": 7265 + }, + { + "epoch": 0.9594826448462452, + "grad_norm": 63.22892761230469, + "learning_rate": 1.0050807516508553e-08, + "loss": 0.1822, + "num_input_tokens_seen": 3575296, + "step": 7270 + }, + { + "epoch": 0.9601425366239936, + "grad_norm": 0.0791056752204895, + "learning_rate": 9.727657147705737e-09, + "loss": 0.0006, + "num_input_tokens_seen": 3577664, + "step": 7275 + }, + { + "epoch": 0.9608024284017421, + "grad_norm": 0.34656962752342224, + "learning_rate": 9.409761538245575e-09, + "loss": 0.2031, + "num_input_tokens_seen": 3580160, + "step": 7280 + }, + { + "epoch": 0.9614623201794905, + "grad_norm": 0.3039737045764923, + "learning_rate": 9.097122375002264e-09, + "loss": 0.1012, + "num_input_tokens_seen": 3582464, + "step": 7285 + }, + { + "epoch": 0.962122211957239, + "grad_norm": 0.30660831928253174, + "learning_rate": 8.789741316957312e-09, + "loss": 0.1369, + "num_input_tokens_seen": 3584896, + "step": 7290 + }, + { + "epoch": 0.9627821037349875, + "grad_norm": 0.5878282189369202, + "learning_rate": 8.487619995190986e-09, + "loss": 0.0152, + "num_input_tokens_seen": 3587584, + "step": 7295 + }, + { + "epoch": 0.9634419955127359, + "grad_norm": 18.56205177307129, + "learning_rate": 8.19076001287311e-09, + "loss": 0.1341, + "num_input_tokens_seen": 3590144, + "step": 7300 + }, + { + "epoch": 0.9641018872904844, + "grad_norm": 0.07710211724042892, + "learning_rate": 7.899162945254945e-09, + "loss": 0.001, + "num_input_tokens_seen": 3592832, + "step": 7305 + }, + { + "epoch": 0.9647617790682328, + "grad_norm": 23.307418823242188, + "learning_rate": 7.612830339660758e-09, + "loss": 0.0999, + "num_input_tokens_seen": 3595456, + "step": 7310 + }, + { + "epoch": 0.9654216708459813, + "grad_norm": 12.40549087524414, + "learning_rate": 7.3317637154796105e-09, + "loss": 0.1011, + "num_input_tokens_seen": 3597888, + "step": 7315 + }, + { + "epoch": 0.9660815626237297, + "grad_norm": 18.231792449951172, + "learning_rate": 7.0559645641572465e-09, + "loss": 0.0699, + "num_input_tokens_seen": 3600384, + "step": 7320 + }, + { + "epoch": 0.9667414544014782, + "grad_norm": 93.2337646484375, + "learning_rate": 6.785434349188102e-09, + "loss": 0.1521, + "num_input_tokens_seen": 3602880, + "step": 7325 + }, + { + "epoch": 0.9674013461792266, + "grad_norm": 0.19403959810733795, + "learning_rate": 6.520174506107867e-09, + "loss": 0.045, + "num_input_tokens_seen": 3605248, + "step": 7330 + }, + { + "epoch": 0.9680612379569751, + "grad_norm": 0.17541255056858063, + "learning_rate": 6.260186442485494e-09, + "loss": 0.001, + "num_input_tokens_seen": 3607808, + "step": 7335 + }, + { + "epoch": 0.9687211297347235, + "grad_norm": 1.3419514894485474, + "learning_rate": 6.005471537915863e-09, + "loss": 0.1172, + "num_input_tokens_seen": 3610112, + "step": 7340 + }, + { + "epoch": 0.969381021512472, + "grad_norm": 35.56879806518555, + "learning_rate": 5.756031144012685e-09, + "loss": 0.0319, + "num_input_tokens_seen": 3612352, + "step": 7345 + }, + { + "epoch": 0.9700409132902204, + "grad_norm": 21.5054874420166, + "learning_rate": 5.511866584400837e-09, + "loss": 0.1853, + "num_input_tokens_seen": 3614848, + "step": 7350 + }, + { + "epoch": 0.9707008050679689, + "grad_norm": 0.22669829428195953, + "learning_rate": 5.2729791547097e-09, + "loss": 0.0038, + "num_input_tokens_seen": 3617408, + "step": 7355 + }, + { + "epoch": 0.9713606968457174, + "grad_norm": 26.995397567749023, + "learning_rate": 5.039370122566389e-09, + "loss": 0.1072, + "num_input_tokens_seen": 3619968, + "step": 7360 + }, + { + "epoch": 0.9720205886234657, + "grad_norm": 5.098914623260498, + "learning_rate": 4.811040727588755e-09, + "loss": 0.099, + "num_input_tokens_seen": 3622016, + "step": 7365 + }, + { + "epoch": 0.9726804804012142, + "grad_norm": 18.19532012939453, + "learning_rate": 4.58799218137873e-09, + "loss": 0.1695, + "num_input_tokens_seen": 3624192, + "step": 7370 + }, + { + "epoch": 0.9733403721789626, + "grad_norm": 0.12403739243745804, + "learning_rate": 4.370225667516325e-09, + "loss": 0.0006, + "num_input_tokens_seen": 3626624, + "step": 7375 + }, + { + "epoch": 0.9740002639567111, + "grad_norm": 14.581175804138184, + "learning_rate": 4.157742341552861e-09, + "loss": 0.1853, + "num_input_tokens_seen": 3628928, + "step": 7380 + }, + { + "epoch": 0.9746601557344595, + "grad_norm": 0.035725370049476624, + "learning_rate": 3.950543331005307e-09, + "loss": 0.1044, + "num_input_tokens_seen": 3631552, + "step": 7385 + }, + { + "epoch": 0.975320047512208, + "grad_norm": 13.293424606323242, + "learning_rate": 3.748629735349839e-09, + "loss": 0.0016, + "num_input_tokens_seen": 3633984, + "step": 7390 + }, + { + "epoch": 0.9759799392899564, + "grad_norm": 0.3222048878669739, + "learning_rate": 3.552002626016293e-09, + "loss": 0.2102, + "num_input_tokens_seen": 3636224, + "step": 7395 + }, + { + "epoch": 0.9766398310677049, + "grad_norm": 0.12731555104255676, + "learning_rate": 3.3606630463824947e-09, + "loss": 0.2375, + "num_input_tokens_seen": 3638656, + "step": 7400 + }, + { + "epoch": 0.9772997228454533, + "grad_norm": 0.33530130982398987, + "learning_rate": 3.174612011768607e-09, + "loss": 0.0009, + "num_input_tokens_seen": 3641408, + "step": 7405 + }, + { + "epoch": 0.9779596146232018, + "grad_norm": 15.725085258483887, + "learning_rate": 2.9938505094316834e-09, + "loss": 0.1826, + "num_input_tokens_seen": 3643840, + "step": 7410 + }, + { + "epoch": 0.9786195064009502, + "grad_norm": 0.08356328308582306, + "learning_rate": 2.8183794985605637e-09, + "loss": 0.0801, + "num_input_tokens_seen": 3646336, + "step": 7415 + }, + { + "epoch": 0.9792793981786987, + "grad_norm": 0.0940588191151619, + "learning_rate": 2.6481999102707654e-09, + "loss": 0.0731, + "num_input_tokens_seen": 3648960, + "step": 7420 + }, + { + "epoch": 0.9799392899564472, + "grad_norm": 0.3441082239151001, + "learning_rate": 2.4833126475994894e-09, + "loss": 0.0011, + "num_input_tokens_seen": 3651200, + "step": 7425 + }, + { + "epoch": 0.9805991817341956, + "grad_norm": 0.3757539689540863, + "learning_rate": 2.3237185855008443e-09, + "loss": 0.0073, + "num_input_tokens_seen": 3653504, + "step": 7430 + }, + { + "epoch": 0.9812590735119441, + "grad_norm": 150.4886474609375, + "learning_rate": 2.1694185708414083e-09, + "loss": 0.2482, + "num_input_tokens_seen": 3656064, + "step": 7435 + }, + { + "epoch": 0.9819189652896925, + "grad_norm": 92.5436019897461, + "learning_rate": 2.0204134223952284e-09, + "loss": 0.2875, + "num_input_tokens_seen": 3658112, + "step": 7440 + }, + { + "epoch": 0.982578857067441, + "grad_norm": 19.585914611816406, + "learning_rate": 1.87670393083994e-09, + "loss": 0.1509, + "num_input_tokens_seen": 3660928, + "step": 7445 + }, + { + "epoch": 0.9832387488451894, + "grad_norm": 39.90876388549805, + "learning_rate": 1.7382908587525447e-09, + "loss": 0.0779, + "num_input_tokens_seen": 3663232, + "step": 7450 + }, + { + "epoch": 0.9838986406229379, + "grad_norm": 0.06113344430923462, + "learning_rate": 1.6051749406049697e-09, + "loss": 0.0016, + "num_input_tokens_seen": 3665600, + "step": 7455 + }, + { + "epoch": 0.9845585324006862, + "grad_norm": 0.033529337495565414, + "learning_rate": 1.4773568827607386e-09, + "loss": 0.0008, + "num_input_tokens_seen": 3668096, + "step": 7460 + }, + { + "epoch": 0.9852184241784347, + "grad_norm": 0.1556025892496109, + "learning_rate": 1.354837363470529e-09, + "loss": 0.0016, + "num_input_tokens_seen": 3670656, + "step": 7465 + }, + { + "epoch": 0.9858783159561831, + "grad_norm": 52.730857849121094, + "learning_rate": 1.23761703286962e-09, + "loss": 0.0971, + "num_input_tokens_seen": 3673024, + "step": 7470 + }, + { + "epoch": 0.9865382077339316, + "grad_norm": 0.017705397680401802, + "learning_rate": 1.1256965129730068e-09, + "loss": 0.0012, + "num_input_tokens_seen": 3675712, + "step": 7475 + }, + { + "epoch": 0.9871980995116801, + "grad_norm": 0.13253773748874664, + "learning_rate": 1.0190763976734018e-09, + "loss": 0.0803, + "num_input_tokens_seen": 3678080, + "step": 7480 + }, + { + "epoch": 0.9878579912894285, + "grad_norm": 19.60429573059082, + "learning_rate": 9.177572527375721e-10, + "loss": 0.114, + "num_input_tokens_seen": 3680448, + "step": 7485 + }, + { + "epoch": 0.988517883067177, + "grad_norm": 19.607324600219727, + "learning_rate": 8.217396158030076e-10, + "loss": 0.0938, + "num_input_tokens_seen": 3682752, + "step": 7490 + }, + { + "epoch": 0.9891777748449254, + "grad_norm": 31.56887435913086, + "learning_rate": 7.310239963755904e-10, + "loss": 0.108, + "num_input_tokens_seen": 3685376, + "step": 7495 + }, + { + "epoch": 0.9898376666226739, + "grad_norm": 0.1998118758201599, + "learning_rate": 6.456108758268186e-10, + "loss": 0.0012, + "num_input_tokens_seen": 3687744, + "step": 7500 + }, + { + "epoch": 0.9904975584004223, + "grad_norm": 113.81692504882812, + "learning_rate": 5.655007073909202e-10, + "loss": 0.1473, + "num_input_tokens_seen": 3690240, + "step": 7505 + }, + { + "epoch": 0.9911574501781708, + "grad_norm": 0.039434801787137985, + "learning_rate": 4.906939161627432e-10, + "loss": 0.0775, + "num_input_tokens_seen": 3692736, + "step": 7510 + }, + { + "epoch": 0.9918173419559192, + "grad_norm": 18.382701873779297, + "learning_rate": 4.2119089909542495e-10, + "loss": 0.2057, + "num_input_tokens_seen": 3695360, + "step": 7515 + }, + { + "epoch": 0.9924772337336677, + "grad_norm": 0.3242112398147583, + "learning_rate": 3.569920249981706e-10, + "loss": 0.0823, + "num_input_tokens_seen": 3697856, + "step": 7520 + }, + { + "epoch": 0.9931371255114161, + "grad_norm": 1.300443172454834, + "learning_rate": 2.980976345344777e-10, + "loss": 0.0409, + "num_input_tokens_seen": 3700224, + "step": 7525 + }, + { + "epoch": 0.9937970172891646, + "grad_norm": 0.07868517935276031, + "learning_rate": 2.445080402202482e-10, + "loss": 0.0481, + "num_input_tokens_seen": 3702592, + "step": 7530 + }, + { + "epoch": 0.994456909066913, + "grad_norm": 0.6571361422538757, + "learning_rate": 1.962235264222345e-10, + "loss": 0.1701, + "num_input_tokens_seen": 3704896, + "step": 7535 + }, + { + "epoch": 0.9951168008446615, + "grad_norm": 0.6455036401748657, + "learning_rate": 1.5324434935615195e-10, + "loss": 0.0378, + "num_input_tokens_seen": 3707264, + "step": 7540 + }, + { + "epoch": 0.99577669262241, + "grad_norm": 15.328804016113281, + "learning_rate": 1.1557073708579057e-10, + "loss": 0.1023, + "num_input_tokens_seen": 3709824, + "step": 7545 + }, + { + "epoch": 0.9964365844001584, + "grad_norm": 0.0523066483438015, + "learning_rate": 8.320288952168297e-11, + "loss": 0.0658, + "num_input_tokens_seen": 3712192, + "step": 7550 + }, + { + "epoch": 0.9970964761779069, + "grad_norm": 49.20591354370117, + "learning_rate": 5.614097841988297e-11, + "loss": 0.1099, + "num_input_tokens_seen": 3714880, + "step": 7555 + }, + { + "epoch": 0.9977563679556553, + "grad_norm": 0.39536726474761963, + "learning_rate": 3.43851473808554e-11, + "loss": 0.0216, + "num_input_tokens_seen": 3717184, + "step": 7560 + }, + { + "epoch": 0.9984162597334038, + "grad_norm": 0.10730185359716415, + "learning_rate": 1.7935511849587192e-11, + "loss": 0.0521, + "num_input_tokens_seen": 3719424, + "step": 7565 + }, + { + "epoch": 0.9990761515111521, + "grad_norm": 0.08098907023668289, + "learning_rate": 6.792159113921947e-12, + "loss": 0.1418, + "num_input_tokens_seen": 3721920, + "step": 7570 + }, + { + "epoch": 0.9997360432889006, + "grad_norm": 14.478204727172852, + "learning_rate": 9.55148304560005e-13, + "loss": 0.0767, + "num_input_tokens_seen": 3724288, + "step": 7575 + }, + { + "epoch": 1.0, + "num_input_tokens_seen": 3725120, + "step": 7577, + "total_flos": 2.175051626840064e+16, + "train_loss": 0.12628782090838944, + "train_runtime": 1516.0655, + "train_samples_per_second": 39.981, + "train_steps_per_second": 4.998 + } + ], + "logging_steps": 5, + "max_steps": 7577, + "num_input_tokens_seen": 3725120, + "num_train_epochs": 1, + "save_steps": 379, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 2.175051626840064e+16, + "train_batch_size": 8, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..a9d6c18 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b1f79715af279a18ec83044418c7aa286e0403bf5c3b4fcf52e9f737b0b959 +size 6289 diff --git a/training_eval_loss.png b/training_eval_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..26743e0b1ee37fc2f0c6cea71052a010e6c76b33 GIT binary patch literal 46316 zcmd?RWmr|+_cppWX@DRiT?R@>OQ%YxAfXZhlG2^hA&P{664IfF;HIU!M5Mc0y1VO) zI^e2PM0d7)6~ ziF0`H8{W>5Y50$jy_A~$Gb=;;*SfX_s3*Gi*5+3B<|cX!js~`NCRUa_>|C7e0(TgU z?d`4Ygg7`X{_iW;t!#}rYBU_$;4bH_AHJ|dp@?*mA9R{{stF2}ul7jt-gBq8<&1f~Cfb)!f;FCN1d20p&NnLU#y7cO2bSt%U$3kbNcL`vs0fqu>3 zXrZUCU$Tfv9~u2XR$x2xm{e-=m;aSu3;o|8bX%ghT3r$b2Gk5&qB=7g%$axRj2nV! zS1lj=Fa^|xDTpl;YmJ(*#f-!M`hR75WoXEENMTgvSX;219c?`N4L>JZbZ^8iL$f5b zY^^eOZ`?Cc!?L7)^oi-t?#gfje2Q88o5g@xc7?Q#4#UjM4BWY5WiSt4N@<|bBDO5H zYk7BdwE5ekFu%aSx`u}LIXRrtK~(kp<8IHgkFvF^5?B)c5`!sE2avEEpIR~ zri@vr6_{T2JQ^OK@5`hP_=#T&4`ZvE!X8-cUqtrrER%3!_x0u z{RXF#o&JN}VXH?EA2P78VA}Y~4`ySRM@qu3J@EY)5z(tjl&Q|h$T)AGbxO#0%54I#J_OzFvFL zeyK0W{qYyJm!!@9bjZo9aLy+xHEnR==UsQ-1q?r}OUt7$n+;?jBS zPvVJ^J1+HQ>W`K>h`{3ZdWgkL@feWP(<`W`kX^fW%?+L@7jyT=&!5ZWFc(cDOU2oxO7qGOll#-G*F%5p`F0cgaqlhX02Tzl`s4>r|u0-1lBKtWfh?N-B{C(~Gyg9(RBLmC2!v z2$NoME6gAFA{jA^0d^+Lgr?KvJM)2@np_2EXF(WKOPpX{)5g};78g~J$o_;+u!Vtv z0TS`{D??X(Y9!uYqIKGze4lEh*;n=o#VIH%-47_+xNJ85y!;$gAuWf5^$pwP*>=&M< zo-AiiHqd*vK;X&4I*N&jP0!6?ufww1L6lsfpzsR`Axf4BG2EJM-4XJfsrtDxcQ75M z;I#N7)z9C*W_&!6+OpWYyj-NIsmW==8{f~*ue!ZGB$~%a#o4_r0oyn+q|kZGaJDs8 z#>q(lnSj@$4zFIl5*RJ2OdM}&A5K$BUf|pH>Dk%MVXG>enFv*tl1x5AcT31k z3eq8TK`_{tWsWm>?PAyyk=h=*139`*uCCq5GDIGS3%65`5+RAWu9m!qcbiyQd17qL z6n5*0Y1iEgnJTidQh!=oGwsHelBJaol8t-Pl;Ej3o@b{n@!1e{gokx3JUn5IVYjak z6HCBHA&rZtq@?VWt_|9uR_uC$X#{IOQ1YC+aN#;9=SO4)4+t|>%B-h;2L;ppg?|fG zR;grZp6@xP#AH2j>}_3ZZEZDJ9Vz+s`?nq^h4FZ$X!rLgH+XpR+V}?6tUSdN1#I3x z@&HdG{TM~U7GG3N_mgT4jhfw7*YNI*bN<3Q+@jUj?s&GMf zq^oiuDQ@{^^Eo1-xlS2+MkXe|E4SqZa6j%ugoV{1g=)GntYqUiHIfR7k5h@hY_1eTc*!zIZ|DQjw78c^bVj)qvEJD+(gs(#g8@0arEMHtLVpJkRv!JH8NF zcGteUxUsuC3y+!k^XW$U?vNRb`b($rpT@??#@mUnpdcW)2l7~+PR$#k5N9a!muYBP z;D$B+S8l77J8|V1wL8XCb$x8Nf;s`k45^*RD^{L2xVcHRwYA4w*F^g=HRi&n!(w8Z zVEHr+4(nog%^w{tmioRhT>xbALR71fhiY?Vc6!>nS6P({64I?FF~4H1DjQ)z4*FMby%6z;se%#|I2(nvOrMs(qoInlo$tW&;07lvsu2BI20Zh!y z*El#rva3#G)~e1Dn4f*WJI^(Im5l7En%YA(HMQhb?MNg6QBya=ybqQ-u%5xoBU4?m zH)htwB@FS4{Gq^%+^Xt?@ABo#2-c7o9e-Ehvh#N#HPNu<4K5OGNEt(ETG!wP+dbc- zH1(^kz0Y30et&muyglPZp1@l9)}NM^>80$dSx6Z>rVnQJ@&MPg@{doimaWZ}E@e$Y z*y1NaatuCcHROR5r$7DY(;fBvKN}v0u=$wT*=OO(TaZ62h6^`_%(86`w@t)Ow!4Ms zn_+lOi@oV3a|y2NdwX-@X9q+Oo;SI;K6P|-xQNn=pYGq_A9K19scGv!&-yA&;!$Yt;g^)ed!NI}uK&}sDe4B-oNZYyi*P(H7Er8PgK>gFs-unLiJJ#LB zlM1H|J*YHJ#~TgQ+eb5t?WAXi{Z-GEm6g+bF~5KPN`r?#XFY3d@xJ>`K40qfC z?4pF`y>TP?x4yRPN`Yyjm^)Puow9OoeIR+d*I^Aly+C2K+%1Rw^+`-(Vq#2U;@ZI2 zk7u`cVBcqKMeUem51OkqH#Nl-&P-3Iefsoi5!Qod7~($_YZ21@RQ?+5-!H%G>jkr_ zATMF0la~&zLqB}*2yM-eU~!Zs zMssw1x=*V1|6aVRSY$Om_RSH>wK{H3q?Su#Ze~V?9Ib$L64m9)Ut;8L!KfVSd~ z?K;G1z|;WBdwx|)sUd`Zt><*I?!D>(jl*Kkqj)iQmx!%kTH(GQL3VR($_46~F|n~r zJ*#=jdj|#LR!~eFhWhn#(^iIyR8!@m|K^`S7FB^eh0qGm=2z%91TR7|QA)|&*w~N{ zIU7GaExM4V?Y^VzGgRujXL(go9Kw#}XeeI5=65 zD+GhLDZR{0f9aR@6+nrAZ6~VHR~31wf}jwpG&mm3xkBnINHA*t%*K*bxi{w8D~8`& zvehQ6Tx~N35b9oQTU*xN39IXDw9#{kmsK9_K5N6N3W+T3MWgU`U$7Q=`!%QXPZC^L zmC!p7qiI|Fzz}!!RZbx~lq*(CmwGxn6dQI9-N-G+D=V6o^i{i!(n|RT<4*>)a&){e zq@}B7XZ_4R$}U#$DGcl!w&9fbsBN zzka_0GRM-Wd|7xnY47;B_RB)^Xbi@vl7DfltS`Jh{N}S0!qd9sB#p><5cY-^c)6>)I2#h)5J%c>h1x30kR7V3&172O~x0xQ-v!Uu8@!jxb1WDkJ?`W_8dHynU>}!%U<&KNh}}lqH_$N zMa;9OzjAcz6qO4ehfKr&AeF%|ucS?X3^KC(0}gU6r)y+^@4{{?2o>^9Z<%pYVB|PD zjPH)PZMC`qXCoyg6)5xsHi0B=`_+-b+!aWr*SWZIhraXx1+H7zfZ{qjZ!ZKSzB{RK z$aNp`hUy9_nOASRs(yibw21T1ZdY*@mH^AqQo$$b06_pr6xP&L?O0^TLpn-+O_wAS zLWhHk+X)loOGrICV0q>_^Ch)uj+ukwHY;l&%qkGA>FrU)NPIdcFNAvmU5W&hpr5P8 z87;TtS$&nyV(8a11<`r{8MNcKTUVffJCu6BtDyxdw5b-e%2sVlJtp6ghekxqMD2Fc zjKAx3_oe!aux5xv`SE1Oo#^)dfxWHK*W)h@G-mc*0t=0fjz)%^hG|+IEn5 z_mw!>TT_sbknr(U_IdM$iG{_MV6HE}eXPP&&~4wkB1Gd#dT$d{Ejdd|cA$gmK5J)x zZiEPMyHI~+6nhr4y=~tR0Yz5v>C@VNZBN31Qu_Xk7j>Ys#Elud?yb&1DBJ)n@8yN6 zt*bj29zVrXG-!MB4ACOy=ZzaW-p9MAb)44m88neff1s$bC>oW1_3GxcRQVaubZibg z#6XeQKRDpBpI1Z_2`JJU*}AQ;z+IUdMJ!WWMnzw)Ep}^pAyWvjRd|-`?fdu0umwfi zK{Wt;wArhwEjSyHsZ|jJ$UGIbzCKyEJX#hBydYI}Z*>$sEYjecpD9-AxS~EI+vHJM zI?EbFCmMr%wC9<^Wiqng1^rsh0asZutw|VJdwcr`|1#c!WLp%rK&2#<$w%f%!|}BcZ3=S8wf64!n2Oi=m&r%Cns0%=nl}76$Yh3Af#UJ8ZU3}f~})Ie3Ncu*D~L^GrgFe zoyA>M%7=f6W&##8*=oG9{A71nzR1AHNI1TVxr)fBO1sp4;f-{%O}RFeT~?_WN9)E* zHAugez_o_H-HiTSp6DP%3-6WvQxsqdC66I73CSCvDU*|vP&uj6#;wi<+xZ6)w({mq z`(`1@e}V7;)|&vF0paf~Tjvrz4oz(B>=woC0?Qv`2#D|JXBzI0NBA9(ydyK&b_dwWiNZjh{X22VC0;-wKxdtx_Ql}9-cn%=_3)4FGgg#|cL zO8d)s?E?T{5dw&aMv$_~x4UG`M@z2)3yh2_+SD%bni4&M7wl8h`@&`MW5GGY#MRv+ ze5usxfq0dXIJskm>mE?p1mwj`y1#D#xJv3@`j_N9V9qB&__BIFtNUQ+uuGPMOaC`P z<>4YLqQK0yL{CMr_5liqiV^U2{bX-k^@v8<;{;yffw{T4Pu>Cb;RxT%P8G5;xq7%n zBI_uSDQ>)oHYPoM<5(G(j zWI!42OqQV?$43GxyL|HkKqw1Eg%KntQ(KkSK%yN_i>V|MKjuVA4k${F$6xd~j1xjb z@9XL5MI;qxwLiD(iU;jhp8A$TLQ8sfC_yD#s}n8pZw%;%`OoX1DE58BOPzh+sNWfiPzQ*WG2)HBZn+*-PiIH|zkTdiwM!&CDaJp*|3L zJF~UL={%2ZJdRfQky6o>B8y0{3tcG}F_^9rJ0qEPt0$E}#aS4iE+#WpQ6ocz^xOtC ze|kVgU41dUhWhGNWrL`UEII;LJ|lM*I}nwNf#ox?vg$)d$v5lIY7*n9*baTR1`@e_ zd_!gr~ZGTyEM>|0x((I~c%__zUtgnT4UCloMrgcw= zRK~=Ad3l*-uVAll;5|XRM+V3iQ2vuKrkQpvS;c=ZJbm^oes& z}BSNRH*N)lJblf>$&saE02W8$~7jS_5@R-X| zCX1*SkmzZkHP(l81$kBYrlt>`tQongSUnih96bW|m%7QyHn}`*6C^$LM<;8cXbePV zz>-2ImOZ&0F>bbgg`1I!!jzH}6ADqnh) zRYjoJAISOEJVafH=q?3>jPe`5i|oZ-AoC+z1}KFh={wN)s_wlkCbU6fwo{56Njx@x zf1Sr8ps0q__pj4{O(ZfgAMbp)kUE%eaz$0knK53-;ku}3Jjf3|P`ZUl)Y!|Gxj~wy z;L^hZHoiPwl?bUk9t!i%KFdA;-9FI4L28TR>c}H=^E-*|yOf|-7;gNn4_f@1soFr2GF>cdJ7L10Z0^$xv&lwS%C}|3WVf6gn&wh+T?%{XphDP z>PTM($Ui3q0ixL<>8czwKSaQ{U+8)VY5FsVwmgEKU5&pcCp!Zo7qIz@Gg|iAs28Jr z^XAR`v2;sNy)#575O zv|O>R$VP+#+>(zwH{f9obNXVoJ+U1yZ4^k(Ag0lXd&B|ye1ptCGzmTe_td#d74LFu zDIHQLGUa2QXYK$R7e>qYH44oqLDa>(W)6a|2|GS^gWf5^P=EaRfkYOKfVCGQe3(3R zJ3T%?vJc#Tq;uF2!ZFWcm=Cr?J%IE0#c&XuxO8jZ3JvF&bl;Leg@5{VPf6)h^1upI z!8jMCn!YfXR^EPVV5NBm&17Qx6WEre3*YhDn@#9u_rsQD zLCeeL?3Md^Lq%5YASXH_iYEv@Q~cS`ltSe2{e35p?I9=O!`w%A8^1jvI)e?$X*nVQ zSqJ!y0Vv#Zv3x-wSs=@r%0OtIxK&(S>{3urD(Ot( zTS-}&jfqKdt}Q-YT1F-vI>e>`k$a#s(D`Ge{%~ih7gC){P;juyj!OjHW3W~O&A3wDeHpg~hLwJ1#gQZE#0Fmb(>pSbLEp4H}I~ zgm^wwG&C8I?9(AJhfg`DDGV>xooZ%i6v?lQS5=vEQuF|tQ_;xMKiHfx)zpjw1&wws z83fE9kZ_WRa`k0;bvV;Nwp~T7wHibytN0thigC~ANhXkcmN*FDJ?@ai9sgjF1b;-3kA9uj*%7AWOD z{Yj<=*lBM=gA6UdWgLjQpG>vu0O~rxhBB3t`+x)qJRlufovJ)MJZ2UTEY{{g)qeu5 zM^%Wu?kyhoLwgu@(a_QIaFGJ^;r@vp~zeE;@MU>AXiy%5Hjd-v{Pii(PcfKlyepB+X%8)VKK z%oqdRz|_g981(1lirqblCy_CaS9(;RjQ6%~L}M}v8+1~iFEdHT@*1{KaP#mi#mU^D zS_Lq#SNrz7`A~kNk{6i{Y-GqoA7Cn6TDtrU^P*u(gNpbE3@cNsv*$W*ZhDY8Y{d0W zza!3UgHD=%U|_nVX|-Lu=p0uK{lKhiYrJsLkc-)UCn{(0z|wp*A{|FZ$4p%50(Fa^ z=I{P}jG$BYJ;imYsMJ~_=2Lbbf7XRPa4dGZuYU?%TjWvjM(QbwWyJUIzOC2$!Ski9 zy}jLFri!ZerA2FVbNbKK&B5iyh@GzR+-2V!4*zG}DO~y^wW6l6>8PIKZ_n(~*IY4T zc7u|2sDGillv#xN=b;HEuC1dL_bBgMvolpIZKECORXK7S8Db~w)D!hWG;3asKhR>o zd_y{4@|olni?Q;OzN-6ge0-MfWOmU^i!#0?ws>G-^5ceV!7Upbo1M052gcV04$w-y zdHZ&Mslo%(-p3?<|Fu(vN+3=vaA66(=C2NWk*N|I7PhgsXSHoBfq1cuUtlm#6%{2A z0mdPu{VEBH@1CtKH?5Gp^=lsFlbz>)QGNxneAUud;~{DQXP0pT+TBth(#C4sfGhkC z|FpLw_J<(#rh?3msGRf5b(Lr|`aiBOx>?PHN(akJZWsSq!0P@VEMS6&VXVy=gV6)g z_vM_X)1^$6K>1YR)VclMdVQ>Fu(PZK+YW^$n-?1UUmHxw-nifha!Vw5Aad;H-aipaVpDzA;4H@Y>xm#C&9)Y!^tc>|9<-z`bN7hT>ZI=r0 zF|jyHqKZv>Ss>dt00pAtGp7h7=P-n30*#2%M=&3-9FdcgUm+)N01+-q__bw0!$_rj zS+}-}=gAH^RB2{t*xL?HArn@rmZ<`EjbN2@Mj;`p3N4NbX*zjjWq3LzB_)CoKvas) zt4}bSx@?9ff*1$W&pNcNunURILEkC{Ztnz`$gIK&1_BIUB7&|uPjtN+8)*>Ih`AMy z(VqfX02I;K+#JTudH>v`_hVUEL62hrK#8>t4Gp8Mms`_{i=z-h4=CIR>Ev#U&7&3c zBL?U@0PyKxgMY*oT#!2Gpdtv)Jpf3Q{zn$R}c{@Vv=OptmqU17F)` zH4i%5<>lp?J=Z7MGb`~Gv-^==G1Oz)VNh0<`m>Fo&-Fy?6y!%(+X?7#nQ!JIvE27Z zYpw$*05tsYM)_~v!~vrKd4XK9EDQyW1P5dqXL!aSH2)yU@dG;nr_B{a<^g%Yt>F|V z`0ZO95)u;7oPo1^`uMRLj0$nVW(DdmK(K-QER$*`8vljfO7>M(*SOPM{}g!8;K?eO zjEoO}Wr#0d_6CIvGCVY9X}thSePy~Z?s+B(vwv#vKeGAgJXV zUxvorU$FGq39TxKpGfNIUC%RYHSKJ87CGu)VlMuvj_4@ncB9m}Ymz6?Y$`>XREv}E z>1P2;%>n*400|JRNDk1>YyJVE$Zr6P-HPu+_~TayK9Hp%4yIbve&HYGv9X^fpo{Xzah_@qu5mJ)kFNc z-x1eN!JCT>+6=MHC5RNeS5&P91_U4$w-+V0jNk~s*8#wEygwCk46ROsKOe85M4+dq z2`xunx;fCdp_CjTyarW%dborrZf#rIKxUEG_R1_;1Ky+9+WDzX1{ftj@X*`0Vx2Dbg=#~6@|s@;0+1Dy%4UeV z)(1qQzd%GD1j{GD9$~O+j(|+CBi05%)Br8~0}$l}oYol-50#*xU;%redL*RlPf<~S z5IY;lm*8tStwR9*{M7k=sCE&H6n`Ha=~$uo=vu7p%pi&6^MQUYg6Iy=#GNePYMTPo z30OOLVq(IDe(IA9-6XV}Uk&A(5YUU!fT#>jhxeVv=JsV-C9_nsZSl8 zJ3t^>d3yEMdE{?|uoPD>Zg14ir=-|LWrmieM)*Mg1|mRi)|bPU9qxXv{}Xb}W*>G3 zTP@FfZv}(MoJk41G7?5_NK$W&pWH;5*KZ3ER^nwQ)3kg}ei0rel1d}za*rA1%s69d z>5mjO7VyMIT-@HhUOO)Fw#u73FM_Rsdvx@hOEWt+T2Xyf@LoDxX2Xs|23!U{Zan*Q zSUPp+_9*-`3`2AVgdNzJIlefUGw(*m6(%aNLx3Vn9>GAT(kata5J|Rd-<}n zAzjk#jIl^<)8FO=1>Km(9N>}9cepJdC!s_NC1zxlREdZLRcL!}ObeBN@$T1tQ-Szr zwVfaC^A}+(1+UgsIsONPWxj{C()21K55R)`cax7|{e$krvfdmjM-p+{8>=Ad5a>LJ zu@hi6NZ_)dAL#$tfhq!Kr%+G_kmgN`ArF!0HZizM5jP|vc+pycVF3|wf~Q8IS4>Kl zuwV_Lh9p6_gwCg?y4oB2MVVvf)GipUusNZ2kV+x8b@>KuC?G3C1vkKn1O5HT%}t*3 zZvc8AUe#Z}eoerBg--N9u}yOKiE5VSBj8q004I^gCo5}ubV8$D7>p@SC3(UsKXZUz zfDdQ=gDt1g9*V441crpKs2rgeHpmv~E4K#Ls(%{}${`|?K}EHNA}Sob0i`Gmj5*(* z#5#dA;{4bDb}<<3&t1ASi}>)M9sIXVcx@WAB^2q^t6ZQl00bYbbQgwZ0yA*RD~LZV zZVL$845%Y|pa&j90Yeg>SyqWJv}Le!K&3$;v5yo?=nYI&f;2S&X&W&MBE8iJR@I;2 z>2FwpTNy(3bc5aiaudY20L5;^W*I7fJYp*Z>vR}k2`TcIzraO0TulA~m6Vpi`6VNw zsl6TgKOX^AfnQS7F+rQiC^YJ&Tyd56@c6KIq>668I7j{X{LD`~zFs3?1$}Of^Sc|@ zQ;XwHSFjhTugtF+!UjUD-GEu;LCFBaFllVdwpLCXo5kSXwt(Aqsmn^4SwH*VsVPCw z;Q(XWmRkJ&K#6o)fE9k}95{4FJPVSNII(;dSfC0LQ&9Xt9Ebq&UR1gXBKQPIL~Vb6 z;eIt3Ka!Wf1(6jMMX_43r**m!;wjL^3+-rM0?Jxwz#@Vl09B;M6VM3cJa&bK zXMjpNuFmFkqw!rTq^yA02b}K)v^|lQ_X*Nm1?|ImwPX%)x&3Kwo`U|R-G~^t;rg;( z%34}l7PNN`W?LAr?HrB9JR(ZMKew5S>*9e&8(-(fT$E-m*5y)Gd9k@Aszv4Q1xef? zF?()&IGqyH4y>biI#d?%q5{g-gOoTu9miZc4&sN*IzBNa<)bQ(6Po@4bvCdNe@h*f z4oCcI@F|)a`f9(+H(*B~ECMh)a4$+Oy|>SVkyZ=T>Lqh4Fk-=F5}-EG%#Gz45rNSH zh|Sd8+*~n;mK-#qE8Qy`@q)|>q{i}0o=O)jWSL83dy2K5)z0?LY4bb8fV)vu>*!S+&at%Ui zC&V!h`|U08#n%qBuZSoip*rZkrg_YSz zZqHi9Tx^mFKba{YRzp=;K35dgqo1*VKkO#)wYRqwNmIt^a#p`HT>z3xX-0{=^DLvTAgSoSCdB^O#0f7 zE6ZY4*p4nRT&r{`-zh{X`g*-1{(5i>4Gs}F|ALtHe*KaJHT;RRG#V` z=^Fs6=Rh6Q1C%xb8+OFDnGF~a)_TVSq79JOa)2@-z3Jo-vBv0BBG9y{*~%1&NVuONI4BS8vRBAuL&F|Kdd(!HV1Z=FAPP6yf@NQ(rZeLR4a zIAEjxpyu;0I)UvT!5yHgBHN0Pf25i*QuAM%YQP8{i})U@Kw8^g>JI_;_2y2$HUgzk z_CmCXeG}=Tb#``Yf?aS&>SXQX|B`=1#Jo2bcG;jZkDm)p1}={F{U2)r*=gW47}7uG3P739s?p3wZG>7PsoEp-M|GF`$#)=NMtlkwtck4ZL6dlNi)I$gqokFe2-@9%&i^A zOS<9}79wC|`r~-f)oNrr5TwjT#+0PVNTHmVumcNr(B`-O8U8)|Iywp8rUm;B z-{o;;3QwQlR7^~*+?S>--x(sOtui`Z2vnLm+1pHotC@)P*6*qklc|7 zTjv2QGk%zc<|VJ}dx7^}-x^kRfunSp@ua_u5i%a%fa4|m`OY;yKCZM_L*ibz#eE+ILDJCIB$R zK=#sw`uXz2nyU5Fc}=~G`M>RpB76?E?CB_R4c;D6kM!{g_i{DDf>6=;$+$_@_Xt zoCHpp`Sa}KwFea3ug*yn6k-26;WXdjjbN8T2XLz4W?G5uqH=z{N@+2_cD?%HcogdN zanoGn1IiKN@v+R6=B!)T6mjppG?otQ;lQIRkSDJj=SVFcC@OxOD!8g#aER)7#hnWh z6f}a?2EKP1QwTePv~O;*ZBuo6XomQSKrz|}odk}xOo9Pt61a<1uwmI-t<;+Sq?ELl z`&u@Fm(l9%iT1SzpO?njQ$ zRq)ZuHags1=p9Q1$>HZu?uH%c;z}o0GdhlMS6XxU1q?Z2|KSo zKz=E~Bwnz7CXK~ui8uI~ws4Si&3ww2{E^50jS%j{UzNK|3rOz5nb3xt-go)I-sU_P z-vB(fA?cn^@l>#IF)R=?7)^rqUKCqj0}d06oNQ6gspq?QwZd%o!!UZq=iKhb*QA~n zptx*fbizlW_D1bzd0U?)p_~wZ?KR#(>-?XJ&=aa*E0_+@h#iOez$OHcz^uIe_+Sf! zF*{ADHNEp&{3;*!qSd`n>Or;h0k4Q(fA(q2x`zHGuY!FU+4>F_as)V%QpAZ9gi-@&!XkC==bO|gvC`1+ zyGYKCWA1+g@~PdiIJEacL4p-Q`p77-r_H>%$UcGSIe>l4hYN$Cxf%#R&7wp<6R=Nd1L>;y*c-pn09*ftHn=s<%W;;GXxW!?nQ|qMTvjgyGvTi z@`V{hy^u_0*0Jb{LVuTwu7yKu;HW}F&;91LYu-=|gh(F1bOLs^Sxy9y468_S*O(ae zQ!vx}fevIdY*8e*O9>kbI^wuzd!A=9AiOw(%~%bNPJkoaE>OJEx5Jq9ILJr^2d&Y; zoA!VhMLo(%5U24pSQ(ci^G#ySE`PoDBj=1EUFz%Oc0xq@^+Lb9u#uy|#fdW8D6EzQ z(O3Y!s;J0FFdrGX!eU`+qlH*V#BSeb7Z4M@sKS&d7HULS~vYWDS6 z7`dCFA6PiIJgKd$?0gvOKA`<3$Y9vt{DT(Nb!_wWu(+l|w#FO(rtIy}BhF73EI^qJXRAQL5!NA*w5ACUp@ zHJ#r7wVO#znTd%b!L)o6{-Cu4VD|3+x)iYM-Nf+UzVe*OBjuCy{^va6w)-CekySsl)6PC zKV!>KfYPq`{GNSH$skdz(;F4n#*9WV@3ptq{7}-vE68+oe^BPl$f;NqofFr4Q_dBg zX)gGAp^K07b2RfEo;*t{7E~U`s`T5c+$N7*$&XiF6gvBd;#@}}FcPYA(|n4jkm=qM#b2Lnt-wY-#^fBi*?&;L@)jV6 zJR@VzTZYjg1?cME+1Q+*b?L^8|b`eU|*trG37xO^p^=gEL7vZe+J&a z_lG){5a`=wd5dIpPvM+Ldpm-q)1PnBGA_+V!8-87gf9{pRCe_?1y zkHyYbq!O)al!#w^BFTrFqKy6PyIR2sDL%_*$1+Pr0wIf0tK_j2^Aw%Xt;Yx*kH-JE zvxDG0TV&H~+S9P(c)Zbib#4nZvw?${p9c@OB77QIndegIFJW0fYJVu?yWg|qF?#)^ z!<00j>CSXSxGWL!Edi6#0FH}eNbV(dVHjEk2#$vi>t0=r_Pcb~7L>o5%0rjYc94NI z-qP#D;xk1ffbd@+P12ZQk;h_2X4CMUa-5rLXj++G%~;(=6&vc@RS&xVP!wAtt^B6u z|C-QG@S<7Y)xC6NJJxr*LbVisSB4+oN?g(&UuiH`rW_TG3%*tl1z1S9S3Xl@Ur>Y{Z% zh9o$8OQV8~t~Qz?aP@60$ZB{4SMFh`@q*89ewXK^(TK-4-uT|agHVV zq$2XctKNq0JYKAM+2=yzH13;}{5SFdzgkG>NL`oK;!V*({eDh>ZDsz8bDdS3?s`>^ zTsxEJ_e%?YgL)}RJ$yYhUDb3FUSpkwZ#tMuQbNz)LADy8Y6}TPDF&67w>Ycouhvyp z(KJ=-WuE0MdH1-99iQApUCdeyQc3>!Ofwksrbx@DsPgnYgX7Z+(#Td9KaUzl9T8i5 zJQD0P#VX$t!kx0}`SkJ?QtNhvzGE;VC#_-`ESh7t11^>h{PedApyoeo&kE6hGQquR zc1{iXmWoMr(9zJ9c(g*9ZY6B{e8=8 zpnz!iw@h~ZR}76jt8ot(jNx48UAV*L0>(F}4+~0{QGLmDI?;o*Rh7d;)fP8|yScVo zT&i~Is(n9u(*!f8@DU2DA?KB!KV-*Z<51psW?1(kfo;6xE=k6jV>X|vI=d?cuHbz3N?d)Ieyu#F5w*Un_R{hyb2LSEjxfYhh3 zEKO!~Mn_B2_2c!hcjy)D5)Z`>-4;e95{p%*Rt|^tIB08@RJDM6NZeT>FRn|33T(O) zu7Tmm5&52)Nz?MZju+XJMI0~V8v7;zmb&iD=u{r?yraEs2RnH4&whgP zYC5Jh424xFH*u+E%!`c~QGSWpn*Y;gCI;>Vy*IG80nW;VqnYsK7Vu>o{y{-fN~B~Q zTABul@D&v#Qc7{`V3#3u6Yg@j7VrewoA?%U&}F z5K7Ga-3#d7zi)dDIAEA?^Ed>n8XHJp=SkK%{qL?b9LB1F_67x~4hnoGH$*EAV;q5p z{i?6u0LS|ku-H!79BnT=c>FkEY7;CqrHj|{{doKtc(Zf3Fd70>^(sCb%tbg}2C>1R zajK8yKJvf*5Rks>v3uZoPfUv`;OUAOVJG7Vta_+k2lDX1EkD#c@RC^|Bu2mrwpT}E zQ)D9n3D+S<3|CGc_!3NlR`UuB^b`cXR3Yiz3-HY(wwkrIwVFG`>XM40Sk*e(qCP@H zvwIdIQS!Ey=Vd(wFH|Q_x%L%TS~*_1D3O?H^v&W?@%Eda>O7IiKI=RNree$;Jy2qI z8_0=+dAIT1546H?3c2v^!oYhX`ddOmF~!9Ki2MTZGj>R`=;t2lb983-XARSlwd)NS z21=2$6ZGTeOagzxS`gw0ATzmQw-J8((((`NJ`3u zd{Gb^dwP1L>0iU@A_spF!2_rf(j-9+fL*v?N*8*EmGy?W`1nFs%zQr8G0W^+Z{J0M z@9!a|Io@|29EQ9i#Z4$KRmgl$7ECZe+Kuj*naE$ik7)obrWdDy(_P# zzkQyX(;`X$szwDH`aer1zTn>z89P@0TUvqOL2v%DJi`%6P=3S!$IU9 za8&mc{~rX%e9nq}mvM5_bOHUG^j#o}3;KjWh>oT|xldn39wk^NV6X4&YT{qGhiW3u zL5A@ahLP64y8qR&4S_LI~+{|A14;_B@EDwR0F1{BTEC_y2Pn7pd#S?oPe`C&^kst zt=Hg}fQ}5dvMY^^jmS4!z?@iuad}VVk0FWL59k2&QqAq`1f8Fbe9w;Q=gNyUIbYla zkRCV#WP_(qEhitk=w{X-o8hgo*nd0VA3hL}-BFV;HDv)R^a>gj!M{F&Hh4FNCq5dU zLqK)+kBvJ>{Rj(!ZeX6xlr%~{Q4Be3{}4`zBj;{t1VcfOB%z}l`x=s2azJfw%&Sv~ z0mQk%&j(*!!Rms#DpjMAo$~VICw)q(W!bjKe_w)Rd<|aVe^Z`V(X_lkNIc5D>LGiG z_g}SJ{c4c(wd#2(c^ko!`k5z}P_lAlkL6TQGJ~II^%C)&KwztAbe33>#UR*u=&Oo2 zzT(}HXvRs?M0_>+U91lDn2`O@tb3W$l0&ewSLiteH|Eno`DAdt{?HD`YnNc+qan>{ z!Pah97yF;j=gY-YQ0WD`S{nbV4AH*}nWKgR?)69NpK9|!A%xgDzsEC?qRe!M$Bren zc(5J0)DHu#G@oU(4)Ed6w{|hSdlwiYoR~LMBxv-l_XZZbOy=^XNDdl$-+NCuI>vp68fB?mw)xl>ksgF#pa>x z4Wu~;1F)1%Avk-EpZ>hitZB=Rynoy^xKl4p0V?lh6q?{_y0?=Fmy^i?u_hOhqOUiS z$0DH(7<3_H9({);PlsEB+RZbs{;`KYrS%g+31R(uPV2~X;u8NZ_4|wzNrMiPjURu0 zTF7ze$V*}Q6=_ZV>2tt6%AKlpL;v>$-@pqFMC(rYwqx6qdO7N@(NCOvI*c#NOaZU- zH3dMLFRlx}htx+JawF96AdmMj?hsaWGUYo+jhZg_^LgrjoaxxhDnpn|lh z?z``(DGPj5pXjnfzJzN|2qu!#m22L&4V|y9EYmTMAP=2$1%ivSy`>shyu z`{?w1VJe)!{Ca+-+dC3!o52DQ=$Jr=yl}mR*!oe)j2tQ|bnbuNHeSW2s*|jGhL7R$ zbj!NcR`!`IpDW2j|HjAJO#fq$n))R7Xjr|9o%YGAlkzh0usRrPRW8g*n4-zj7dP#Y z7noy#*DPkR(jbNwdq*x_PT&=Zi561^)TdKv*ul_jmVb4%QPsmtB|5FC61>r^lFy7-(+vf$Vy1mCwc?{D7@BeTMx&j*$PNWa z?)}G>rYQxtY8y{_kdDq%PDyIfoICw*`P^-EW;f)(efHGy%WL8Pj79SaTr3YKJ+430 z5}idGk{7i=lnXwtiE0afGsyby`^+Y}Nl*#cSQSg!#HEZpUMn9WOwqd^Hf59;@^U_G zzv&_~^MPQpVgH0$r_oWs`Jr$tM-+RYSGHPt_NB?Cq!2BcIZh2h3Q9agrq+CbRc+^W z1C^0XVXqqYTaKn6S~A%r z8i!b*8(U4?vffmg@vZpN}`YZ5fJrN7oIB<_Xy{Q zGhI@d3u>~3(>k~DKJ+22J+U#S8stb>CT^95oBfKG{0PF+f790+cXf93uQsiVIX$1w zU1xoRT$XhmJt25KDOj)Lf2FO@o*K`!2yy;9#&^iG26(&!pODEJnnet+P*z{Fq&UT$ z>y_|&?9bqAX%d2Dn9q+;PQe{ZclW8x@2NQKplG+w)CJ&KT=?r5bk!h~MX@PktHARB zL;t^2)%*0}@Yfc6y&8B8JIaGB4NNtz3?!gOLd{UBvr*V;o!AuAi-93pveAQ08!gw1 z@*lx?jMG7;)`Y`g@O4L1{db>Xn>A(( zgQHBamJomLsbQhw|Har_M^)8!eWM%ckdjckL0SZn?vfG(L>fUFL_k150RR35gcK=mTKUHX2Q~Pr;S2pKOkdJ|-@xNY+ zfxQ2XS2H3>DPCYs2Ghek$xTFL1642_{ATrArB3s*pmL;*181Dz-_uRvxs8A{>1u_H zF;~lg%U)PTVtCS%*F%146Hsv;pfVTIbA$@bkcKiS(B=Rwl`B#7SqQjQQ$R^YoIaqp z^Gb0I2yB@A+cPZxL0tqXlWM8&(!=sI2jriCPW%I?w@V;^1j1cDAhZdR@WjT}b|a-9 z=!_?`lI<5!k&$5KL_)XVf&ARs(gb)nsc#-EpVrpaF&hp@*{5*BS_#cs_~`swJe~9j zjdT&~EARLS?hI4pAy_WJdW4Lij*bpU*ungqnJECyG~nXblnGSS)a27ehT`M@11;11 zpybhS0Sp>U1%eQGX1}^r$q8$*4t8xFiBgQjkINS_>Jq+wzQdRP-Ki)g3||x?ngIR# z$c&rYT}o=|$+^4%7gqlLn=9XK$a-{RPVc$ouA^~F>ZnMD3e!c=SHkTl}EHwY5%TR8V%y1HZW`-Xr0P3#1nC{(Yei_*4! z1`{K?pBG|^Hau=o6Mh!6m4XxXwlHilge3sk_3*akyaH0Ef9|}`)a%*@fxY+<=~QQ? zAd5@Ft?&0`QF)xFo-9|Q#(ytSz_N0pg#B0M5XH|5O`EB3{)JaXSFYdfUi7!ILVh1} z%BE!Rg>4+%^0eXL7TP=6;TEpE0~<+gnKjC~SPvcy13P;bt0q_9qe4vUEepHL%?)#P zRLajXOrfZ%gSt{r2j^huW{%fwDol;XaZYywM*@g{CN2!3w*9c_=79F)GsQoLY_eY9 zX_SD8>5Kmy3hGz9w!Uf1R4y?uA!1+20cexuz63-YSd5k22(ugu^r`hfAz89Az1wbz za${eL(Ba6mq2U+JmjyXlV?~eg8{#MJ-i-n-2f4Gz{`t|6 z3T0_&DH>~M0KtNw!a!_AJqbccG*#8^a2ny^b6?SSvc3anfD4U0zGNqeS8t&Zp;*f9 z8`6_*dz*+2HY2EMY#rVyVR%`4mp_#PkJ{FiLlZr z$1LlDl%1USG79+hPH>d2PFC`PNP%XuIO66&TwdV*f*XQQq%&m8fR!{l5X#E+YPf$OWFef8 zQS#a0%IY&J-gT-#U33)@*7dmRSUA%&s|8Vp;8X;uAZiZIiv{F=u+1-nT4oun_O6Rx z0^SIC+TVNqeS$BB32{b~!c4sSqSt#e^%K_Zjr zrADx&$AUuA1r)(M5SmpAZ0Un!eGh(k<~30dTR-G;0zONE*5)}|Xy-4LB>Up7&X_mL z&=-0%L1epODhShKULx${kq7012+tdct6Gs;sVZ#$wfhD{PdcR>0> zA|++;ME=elJdnMFb7}I3>#4^#`bipxt()N9v9;Vf3&lNj+t0kE4Jh#+4Mx=IbJ1|9 zQ!VXMpaM8@vAK4YkFU@+N&-}>Yh6QlL=WJ(0av5a#bai2N3yxrzruA$U!t_NtN1Nb z>fwaX!GKT`e84>oi;3UpVOx_0185m=vqoDpBz#c-B`kuq+#K{b2nK{WZP&+cz>4!I zN(hm8&GKq^5q|3;1-Z%V*la8opJ5ASdmQLtq35lji8%%ab3nHW7DJ^YLIGQXqy~Xq zKvuN}%RwyAKOkE}{b3{O#b+|L{IJg{D(BW=Blqgcs1)5U%VlXPcXB;0#F&8(VXJb* z`2$)3B=b-liaVVOB(W7yaTkc!Z{HQ_Mf1N|jv~q;ziV015&1Y~Aucw`_-cfpXRv6=U8H^@7m)4u+0V|O9O-=Wk$H)dKv*KG-i?)*6x)5lNlTJWS# zs>-mPKec|xHUcjaOMC|r^ou1+zrkM%Xx1HS;{0k;hH@2cMzRpI;n#EVQnYRa=42bjq zYC0Qs=LIbDZCBWozzGY9v)LsQK=B3z;UJ5<2o9Y@T5FCFD7>|sZFNMFZB);1*B+(- zY`(vmLZi&X(9_?j8inO_mU(_lkV``j2YTU%wjeR0X2 z1)?{O^Ah)k`K7Cq-M6%-*hNuEy3HMqW_c%EF~fBNAn(XB zIgvgRH-&vk{U^L3DHo^g;N3-1K6+B5=zT#>h*(kp68(j2P0JfPBq-gRM0ZJLazyWG zo$&Ea5xrYd+ied-U*-Ng&w$c28jAZ?%osKa()i||vezgmyQB(MS_j@Ty_`sC(>xg* zi~rCJ(vH)Z=>DH6ghRaFt?{wElmt@ch{ZIQZZDxLVs;@r(Y7EwB60;YScOQcBlw_E zr)OtI&+iN<4#(o!(_flNNemy!5ycc=PD>NGdA+(qw%3R={}hB(5hCGW=19+55|CpIjtsP~(2Lf%Yz4Z9Z z<5tRscrUCP=jP`d)n%I6<>T#8{pzP!5}`ocr@i&p9Mq7un?s?unr70q4b=gUv{|88 zZJ$~2KFnB18bX7(44Q87`zJ*9xQs3j&b~o)m3HZE-A?7+_cf}Nt;hR=&RYFAyuYvc zjZDNzs60o0`ZKTlBGI}XpUPyDPtH;OFMND?=fA$)pzTzb6C1p){YnOog8T#tR3g8b ztPB0U#MkQ*zCtn7K=Yg8qoVez>z;_kRVe7_0Hsd~)OLr`)}V`!Hc-`2P=IKhR@UBc zJ9mv}Z|GbQ{%^NqFnd$O@zRQoARf9X#tnGZJ`H);24R-F^IO3*%Gc*SbV-zMhTQ(! zeM55kX+p|{WX*_#3ET#IxCU>KB2#&%ARg0S33dhFemw9b@K<+mL46vGbmED?aTd+; zcW8IvUlDw}MHvwOwbfE%xby2SfCcnrQ~~fypFcY@L!AqK;)Cz5-amzX`O}CsQugZT z>;Mt+H;|d8pZn2{=9}lc34xa-0CKUu#%qFKCAnF*rvbq7)HK0B$nY&};#Bvt{8MFB zZuQvMC#pppH!BMcoS^!QCRNQ@7-G5@z}=N@!zFE zv(`F9E;EZfXO{X@g$V`(BG6Yrjp@I32IR7IIyg9*XD35dy_6mm z=ZNoZoKx7nfwSeW9XVhxRySA5#^SQ`9qCMc2SUThU1knz`5Cx)DkBW+(^AV4&&d_S zj}rTsON;WtylQ3!Le^*d%)a&tUZ?%<*WTXQmDb}VIkd63#C~A% zer4$VS-gt{4M3%}0dx<;z5mzT5r|@<;B-P_dcpV(0`X-yr`+e6i7!7kxl&c5W}2-{ zJb~HVXmgyAH}fpvL~5oN-;Stg`vhJ5?u|NIoq3=kqYd(UU(N)U6&4M@)yUmG?i+#) z4?R7OXO(%le=hdcGlGLpUY~ich=>&WU!!cfwB6%=GWFLGirwrk=1YxGf87AoJ=xt0s{VI$gN2R8FqLub~b;A@mCWQ1*uL z?t&J3ygOavFPUmPmmTub$vf#gt68}xT?u?C*$%Uwy!DE+q#nL;H9annG%8=(HM=kw zx|q6##m@$lV0dkMxTa#2*ZP0J8)$k^1VVTlEkte*BJt-j{{Rk9`=N5`Y3D$U>Q-}J z=yMi|+;#xu2eZO0cq_2VM=tr_@w-Hw|vb+*i9}jN5%-g@3+D zL*8DFZmwTOJ2GHPCK~Y9nZMlk?JEJGT3#RL9u@t`l2f}%CKpr~9YBJpT6Hjd5wj-9 zgC{1z846f}YaS~>>i?%7jNLQfrhs75`_Q3ZmGt%~rMWMdq-m64%87u!3IO`j$hD2! zFvwe1=|cEvq>vAb68X^6*Btp2cD5DLwx9wtf^d9=!lCWfO%~MOa-xNe)z=S?CvhnX zL>j+Fd&7y_!Oi(=CbULWcg`A@T_CiR@5bK1Rxo^cb&JNmEjCdGWTC#zD9n#jaHlVG70E<+WSP;4mpdNM2T}Xw7^%IhclFUODka{7A`FUnkBv4N zYl8vLj&EN*kphQ@m;HK{KjwpjrM5+b8j*-j$&aQAK& z9V@ea47b>w9N-?rPrUgI{jF%AJ1!y^;awqBjB}dRpUpk|>qCOp$7Qn*9Mpy%~~VA(XuI5jFQx z8hwE%LwSeR(dIy1`SHL5LY5#RWVFy^OV4WTKj;|*jZfz-m+0qf$kkchyh?DDVDozM zQ{LU3l6ncdJD1R|Y8MYbRH?>%cj;^r`$ihmoLJ#~r~JK3cK5X{GhvfWllI_wtm9Z; zbo0}>Cq=$k$7&+!=3i5GAF&4JaFg-cf#rhEf+&%&x3dqK9~phca=s6+9+Kg0~{7^LcBaudlD?wEIlmbF~!7 zB=9ue1TPFI4%EPh#mwaaUO_NL6#*XF7<;?qzru6<1HXj9dW=}C!6bE^gJTZd2#-KR z0Mh@0YPu3@rt}#Kh7X*&=wAws91T-Aj1vS=KIvg*Pd{OJ3Tp}kzW5_NretE3>a5e? zmaQ8zQXBPWc3w?#ETJRpib$Q?FNPY0Tbe{hiZa*SzcyR}V&sV{D%|AZp5e$S6K_vH z1_N}fB3e{c- zu^4r*9RK%(tJL6sN4P?acszI!K#U50^T7rmA0&PVJXjO{O56!iFNBCgA-#XuD*Lb7 zh&35B3QrDQCgXfU39@V3A7qX2*C=5;w&XHuKKsMO7z`wU;o09p?y4LjVZx2?pGBUq zmBx5UPN^uGT{C-$m0Xuel%N~EuNC#d^a&7^Q0)!wb_d}J?rvAniJu;)oLZfk6-e>5 zIVj`;L}Qqh&1)D0F}z!k!7?HaW=q5}!u_zs|MO=SK+4EG%Ao&k;?H$| zl4<>+kTeq1*G@KD%1vhmyn00`?rP!Np6qV0-&(mp;%&`z9^L9U?Y=QdFY(~euHEIw zk)7+-f)scujw+K|;H5iBE0~hxEEsk+V-I3o&-#dbYul$`8X1!1{qi??GVJZ5X0K116zQ(4tM?(AVex zD9pUaUvO8?GBdm9R#p+Cj1?%mkfwCN>*?Mx?em4*WYD?HZm7(MJh*5F4fkco?)FJi zq|qQV?V2Mb=W_5++{Ui3Aod*^XN5Wj92=U34qRpDI~DSA1-}5ePqTy$sI;^+IJC4E zake-`zqkfzOyDYWUi_j!Z3YCK0h^OcY5xWO&d9Hf{0k+RjL{d4-@1~)*wE7Rz3-d1 z+YzQK!4Bi~N`L5zi!7Q+xJUm!tJxBd@0DsO8R@9Y(`1pD#Qe^h_V@v zxm{n@AE5%>28!dsYJ13(OFAF_)yC66(R4hXO?F`-{i zd$(PnjPX;SL3l(o=8uL*Z6H%w(0D$x3Cq<4}ze!M>-I-FXMQ;wH4+vJQ`Rl zIi^sp@L0Q&U-21!`;S!C91;g-VK2V9osgypRCw4{uyK}IcQNhBP zK@zbGC>N?i=y@FX!&e|tLXe96?{Wb7Su?}_+d@9LXIF6XfPO$`ChV`bLAd3oA#0Ck zzom`qK1t0O>%SCBX#E3Er5`(o$h)hDV$<7)9b6atLHky_rUs-caZXa<+^P0NsG;3% zjy%108FE2H?uORXv>uMVFF_Z5^mp_DzmxdjmCt+av>=>!810JO4Ao;L6|w1G~kNRIfMq;d2=5iV}y=Wn!s-1?L~ zEAbg>J6iH$#5_Q#t??~9C+BppyFvMOjH<6zd-r{;2otSve%`6lK%Wio%c5zQ99*tz zYX8Qp^HQT^I=!6O!)e*Nbj8uu=m4*~=d_IPUCL3`eaGU_7ue8J^TUGDOcGsmt%tNE zL&)j?glIMs_M56PQM!z=^^qp zkGUjm@;dAd-xhA;niM@_dg{S`#fD~Qd(NxzoXGnYIVXg0_?iLk*w)r2;JI&&R-?G^Ih{o+q=_s{l>!qTl+=Tgl+_1 zr79zfO&EXLRLw5V`Mu*!Wm5m^xMx7^UHvW@0S$)|jMVu&>G=sNjOQ&~^v{a>&D4Ow zF}&UsvPIS;gr26QfgJ%Nuq+MLPRJGrn{`~UZP3_uEC-ZBr`cT^`XxV4nH4VzCQPtz>ezErCfSg%*MtX3$s9kr}vm`(23f4$%uQRne* zwh8#a!wHhU{da^I3=J*Z;5iGrl?BQL@G9=X{ELrZ{Skob0URWHB^D~GiTY(|VQQvP zc0T??33}%lw@A(v|H@CsQct{On$#l9C}Bvs8ITpO+anW-Cph=Seu~sN|6LkKSR{XY zAKokTS9R6q+LVpD6qy+%U%9v{^+Y0URYw69@vSso%a)60uJ?uSM+hL`s}cGR+M1t` z<7f`ysbF4>Mxwi>AY>4ESaSNDBrVB_!~+D#GNPtc{*aRF9NP6nNuYR?KMTUt!XB5s zTL>?0)y44r@;pPwR%}K{G%Op%4AuLet-^MLItQhjcp&2cbM2XH-iN}gKkdBu7RX{M zJ-nbpjDhtcd9q%L#74pT-GP<_$z(xBLUr8_xs}bTi{8n_n^iV->w<6ihY(t7W}4vJ zI9sBkbZV%Q5%tOH9ApSktfnima$o1>k^RN+Ji3y(G~K?Zv(*9qkh?{8Bhm z+9SMGi}Z8|wWEKpPV+WuIf=Ej>*5RKDwF;Ix;PYeY*?=aU;o+~d+#XlR?S@kBOb~F zd~nBLu{3&aI}ljbV#{#2KI?R`lyu>KOX_tPXzfvdxUM%$Ff3aukjmPBC{&&N$$MxK z@yqHmI=bOah6F#_R~)w<{&B~T4G>9wC|}$OLTEWC@^8_oEl>RLS*+eVGS|^Tv?*mG zu|L%if5(XgG8u8Us=)wf?61#XoAc&Te<2;;v zN-}WE>tcOTs;0%;0<(RPalc_$z(k1}bWtdvpmke{m+bXsk5X~|$a$`cAxQC@9aYLD zyg}&{ZajeRD=bXMDpY9m*vvUpUHtgKxQ*wW9u`gN5C@m9%C7i|=%7jj0VokO}INnoWc zBz?(1b#K&8q~Xz*Dv&=h@(2s_v}3= zi1Vhr69@Pl5l;%u-f43D_c*S<<>{Jgspbja#%q-R4&@r5D0CM4hn^$SP3xQb7Kti_ zKalBs?E+4+g3-C8GJVlLHsi-WR-u4kf;jr>w8WHygVUQnvx+VBlP-2EupVGO81HJz zn@MWfY)QnT^@02qUX!|DK5>9#IDt_WFmI%}F6@I@q-~ zf)&$xi;ljNeN3pNNELhI)4%j&U$#)JQZf>dlVJdEXtgijgnGW% zZ~)!9Jja5p%>GPjz6T6FMiIiMxqf<4P+0ke8+UKE7=FE@T=2A^bouzX4Y^}O(M@VP zn&#eS(N9CR;0j#UuHf0L(yVP1ogCx+{tc^EEJ_B{g(G9Nl-Eob035qiQ3Amt7!QQ|pV${Fzx*JU06?^Q>QVd; zcasu_k#G<)9Pn01n5FVuTR8glF#4lWCCexH3NjdgshFPN?G?kZmABSm&7c47gM~${nEabgrVh2 z3BGr=D3*TDjF}fEEFJ4CBf3#8|G%r$G5anyg~}igEeTaSeJP&%?T8YPR(bHwxAQ~d zPHe*U>y^U~YtngR)-F0v8%965eBkp*?E2+lNn*roTR=G>%ofqV^%X^ayU^UJKFmSD zKqS$UYksiS=xq61hl1StvxyqRq~^l*;wB64%DprGQb@?V1P3l%y2t}`6+UZ;gA0Fk zxFKYi0(e~<9QiL=-@&3=qdi5VxxSflrC8n%AQ({DC}@^#M&G&u`(lGE z$N3Hn-Y5DutaEi(OB*ZFUbFa?(MfvJYLTNI2lphr@uTjtFBZkSeH2V+eJ}h89G3s_ zYeR^Ur;8A>5)v_do6H3tusK<3T?3V?OcrB@`r1Xv@9}Q%O>*b`2%$fC3b9xMr3j-A z)1>~1_#M>bG!Vs z4d$1DqfMxraR~~a(IT{L_IpbeS9k^Pbl?9q5fXq;DFEYBf!z!a3NnS*I*3R49uO`q z81n+B>WhT0)#ydc{OqV=*2woSX>pr+mc2q~Yiq!m0s2yRK=rf9PJ{bPA+eN%mY*U( z#-Je@J&hS$Fb6%B*#Bs$5xMy%j z_^^LO(@BTI1K9?3Z`#2sjUzRd1~dxxHr`FpsfInC^_0gFRGpTD*pYgTUn`iW&XtIW zS{zZR@im+ZATeV%t@@C$nh=mo2HATvpt!OEB0Vq;d?|HIbP9KpLI*XIWhfY_A{FVEwcT(r zGb{n1nr8Yqb7DpLb4}sm(2t`L7*~}p2XAV?u8sbC>&@hINQ*<^;Nsd;K!)10LtBP- zPczR`_Rq_8K@~@7i9Z%5Y{f9w?ehl;y^_;(PUnWIN*|$Sl zN9^El^hOw|#7%(@_`k*^Gc&V_y1GNG3q)cf^Nb<(Mh0Yrc2k9rJOJ=lR;aZ|Z!uK| z$dltQek8O8jxV8QE>oK0PFhyDt+BIN921lQ;-J~q1Kzsk%RgA_5k(assx1~Xi zYLAONIwXM;q%BYLPk3PH2ZYYGXFwYZ>5^tv_D#@>wQ}xVi2FATggW^cM9h3JZmcJF zxu}ugup=7@n8l{c?a`QvCz=hlkcpITIzp=m}NPiB1w; z>WzU|zF_FHAdCK_mHMD|Y2yst!0C5}4!?)ZwSkcen#5rY_|Am?A&Edo2MK`M12@(- z0Ek1?F3X}@Fh>#xAhMdE*pX;8)Am!TYv%_zP_KjdaaXk`EP3*8k=3~y;a;oKR>ESR zoVP=BBc)p@rtd5Zi+TAi&3Rkcc5vY)VjyE9pg8}R%7~~^APNu3yK-4lLqRlF8^kHl zo_the1C|5PgIWl@hv04qyHN_GdAjZb0m{1|y4nW$%sgmB!8Zd!-sos$MH9PGxGWXa z4!37gTe0I-u;<~WC9-(sJ{|=vV3pU-rAx7WCDKlJgnujdaUpK|xFk)`zz@G8OJiN2@EXy{NWNiCmu zJXl7K#gRrVYZsnW@Jy~eY}NZc&}^A<@&g1AK9q!eljw~gL42_9fUT?!aty1dy?=u6 z|9>I~s>7^Z@^5nL>zc>C?&juh&UsZRvo_c$Em#Phs-!1RD;qvAo37c9d1j#rA}tL? zTlv)lYP>6`rI-&@mePU{Gx-SGmE@WVA}pglwj_`Qae2rCw&3tM_2|ETiAgK;*ufsFCi4R|8zk& z!qmKrwQA^9u2-{0j}rf(jEScmZvytoXogKei>BVUnspHxN~#DmkiaZQpzeA^x8-5| z6u;2)L`kTF&lggX@;CukD{xCe|8lIS1NOArzp-odofJ?Xj4Xam_}xGuJWO5WE`>+~ zNaq9oeXk`P8m|Pj$xq*kdS9lyxuK&?O6gdLtEabEG3bo1G{oh3@kqZwFzSUu1mxk= zPaF?157I}qc1<+g`&|VAu2m`UF~2;7`LB%KIGvQ0kV`v$MzAB3F72iTb|<#1NvJcx zM+Fu10PpwO)(Nto4{l%>+RN(9Psmi5&G8{6>O2}4Iq0%J#W${oUHUF?y7uL*vHl}Y z+e^9{SO6Q)sPUlmEjLXbpJUP1gvdvn4&K~D`A8+J-$@?6LM~h8h@8Sh5dfBq-_a;` z(1>O6^{9X3HtH$GHgo4`Kd7rcd`6Hs_1(x8k7 z^kjFDk1+>Z?Ai^CMB}?5IjZ=(ay`C;ZaBb)2NEg2;Y;n`!D3YgMtS51iTJMGyC_r#pFOtpJ;xg-_w4I^ z>L)N$2g_r?wbY>gJgjjQNh^q zKrXdrCilEcyWNkEi@``cTc5othTes~3rH{P;Gn`8CKW-E+j9)U>G0caX)= zqK2Zjy_g8?BM;|dc^+1zu_^s|%uGWC%dKI`B;9YRLy+M(JKf9J@&n&DG32kmA|FrO z(Ys4?s-57KDZ7XK?q3-rsY9dnR6)#W@_{~+WKZg2cV47d)jc8eOgd?3lJ$1jQ!Nec z<3_XU$1*Nu4-jx^9?eG%vAJ`I#iaUFpf(2!w;CKkk*L9?Kh*X5y(KRpz5~)9v`20& zZ=F`%WkM%_RD#kS(?GG0?Eb_f$SwO^BjC5OcL7u~zh~#E)VwI-x=Vo7MtT!MXnyKl zTj2V4jk3r!F5CzEkiK8E4+)PPScybFtlwE9GZFiKi{NzV+*K(MESY5#$RAqdrIV>8 zyf`z7zhKw*l^|iM&F(4A*K|cqGoA9s=jTmF{Vo8vf_yph0(_|u@dbF-oI_*jA~@D5 zldLB`SrXQ3C&N85eVl;_WfX__J&+S^ESkJ}QOCbxah~E-Pdu9w%;0NIHy3OE@bgkk zO$PE9Xp!C`$AK`l{#4a}_~Hr=OXJEjHj>Z7>ti#FEpHf$zh!fJpS{_?gvY24{=k2K zYnqUE!KME}F`anfz7}y!$AareiE9hp)BnEP^WS%?=lVg$AX#*R7MTi)gr{4QAn}p7!}(cL`a<2}JN~!bwUe>+5FPIgi6%4^EE3r= zx?TM1;=0e^tv}r56S&YUD~h;Nj^bi})fk^K|8*+q?MRMpbs^kJL1b0s@RG3Pr#?C} z!9^+H*+m#LrQQ|hoy6m#~YadYrwW%s;N^y7y} zga9uL&q-35u3QxiznjgCQX8u2sbzIt8?Zm!LoPFSmqz+zyRhft%I4<*4h+v9;sl_T zL_~4G&*YtPm1iI;ns8SY?(E`-bfk+a3YOj!-|!aLO2#3@Q?_-`$%M6I&%Tn0Xb?8dR?JSh{iL9 z`69{?#vGDXTfydgYr1N_x`QHspkJd}#BgyUOpJ%h*a_W(cZrVi zt1)UpyObqyy8QJcJrF~=S0&Zi zn@rL(j|&l?p&L$cMM5Hxb7(i9tnI8DMLsOR?@b+ih5jn=-shM~2Us-S%m2!6uJMMn100CVgem}WV&Bw0%Q+ae zJKjwuIgLqtqmiCEV$FH3LvvwE`$MS0r@XIHtip~=P-BuD?&a)xJcz2}7cayVLGLNd zGust+6viN%sfzQo&kl@c#)U9VD;aUg!w5pu{|cA~&HbiBqBS|B4oy#EFeZZc8Auxo z%9to4>zrFCjG)VV&mM+PZQid2x@_Zh{qxP5ucv22QYw91i?Qw%JDs%6xcfWKozI~w z|1`qxheFaCk(5P%K1+NqUT%Ipar{5bTS(G)*qJ)p6j0_Z)zs_<+S$NVLxcIrE*^V@^EhLXMuiW<6vBlRT`w;eXgvjI4irms zqwbaWAC;7O)WTt|l)Ht7@c{-y!4w0eG9Mn+hMf40|6Q3|3tBxIUs$lfx=giD_0@WS z38sp*K-TSe)l+7anA`ds5N6Kn<|&iHU@L+4cJ(hdtH1S-toH%r@Z`9un?9I?2r!)h zHyOotr>zw_5;AQ9>@9$YBe0)*k(}L)WU_P7r1q{^4bu`mghJp` zr}9-K&2AA5^{O~U1j>lLx$4N=k!VJ!%S6*mYRtf?I`H;C6wX7 zV_A&m2eBIrQ)1R7-@Lf(2fE0bvV5pSWssa`r}qp`_@XJ4F+{-j3ugCv4Y@+MXI6q( zo?c+{Ao88g+VxnPkbJvE9nkq`5p=uTRto&r{jF=^NRY*$9Iz4M)x-d91SI(AsZhFj z8lAxmx>k&|Ax@D00#|IdGwf&hoi!SgXRZN9AejE0bpy(BLMQ?l{qe__(Uz*L6(X8f zF`@q490g=xU_Q2Et!dE#HuSWE-WgWZHF2sk5+EFMkxRKAaV@H6rjoRFITE}zj0 z^Gw#b*t>W{WF|L?tu`qb@ z=){zMruG>J{0o-EuEhc(w?_g7AM@epK8pIcRyuTo8N8zQ_ziU6?QzA~fv`z9kWCey zuE>4CB-7nLd=|cM)!M@d6xA_Exz5j5>GkqUEE0(wpjCq(^5~mnuK`gJ$e^2TD!7eK zy6DtNt}Liq_@d?F`RL}cU2-yRH;tVk4Uf~E|0osteD`C0iDMD5ga3d2>)v{%j^xkc zd7RLIl3p{lk2NR!eU+dwIPVceD9|8B(Q-y7x)zzolWrAbBcG~=eeC{DeE;r1YeFfR znqzS=WTp8!D1){+)pIL4@$MH&;yK8iL()S~6c?@^jw%zaEB5dhr{w-UyJAy% z112O&Ah>hzv-$YzQh+bR8cV7nEXZFM-RAf)%cAHHRN^i1*b}~0tj1S`N4p2~oxPrp zjPl)3mBS0Relc0Qx00QM;WIb;!0YiB?L$09d{rC+9AyS9dDkEYf$6j`^_#AxK@zW- zndweN9EZ}T)1CHLzE==#T33dRiN2~RX_eNCrj;dSVkDNOxc9|gXPmQqW|kh46%&J$ zK_%et%f2si9$TZ`FOI}>zD^x&*5g$Zh`zI8P?r0+!I>duWxLw=&;^?X_i7ZeTYAni zd7iGRo;?SOp`ppUGc~-u^gh277p^Qy^OT2POmld8Ta;L9%M``J^c!>jTQX{Fc&Td1 zoF;#t`}h`%XbUyRlQJ#zrqp{Krp2Onb!V4KH6vN-wnMf4wBLB@RD}Vau6R11;xO4Sm>YM6mzuA{X^g8Mr68h{+HN{s^!9kwij;m3H zj~SGo%Zc@D5OOS%Dz*e1${%=lJSJ^RrZzM5t~f3^xU9=nHWq-PV1_$Bjekz)H<#XIE<9fT`Ne(sB@8<-*^78ecYq?(C zHgqIQT6>`yO7vQGrj~yEhUn#=&E>>D2RlFU39^V{(DNktn#RybCEGUsTHBrfS@TW) zu<7sLzp_zdu4L*wvVP0% zO;^Bga${JXiYh>ODJ($k(kN|q3zxwi&)fw0VfBB%p#^*`I-Y3ZNe+QSti&XF@{i>2 zKG80`Z?j`|w}VBnVq9y$V{z4ZlaBUH+?FajDz8&4;K(iZK#@E+`{Tb0(R$#BUOApP z(-|{#Wk2Hc*VQvI&GcyV1yujS_v4tQT*=v^wcucn-<$I&-?&@n{(OYGhaR-S*_Aaxe8FGW=#7HEsxHrO9@{NmAc#USUL0uIw~aRqnV5G@ij%2 z$nBn<`9E1Z==09_+-K`Jhp|HYvg*OvT>q|N;Fw%y!aj~3$GNPFfYH|EsjILD3FR~vXct>Q$Aj0qcQ_XCHcn5qU5>6CVp>Vc=1T#P0r4b)_C}( zTK6Vjy^$34b*sI=AiuAQ9g@TIfOhU@zrKTpJx@Wa@Uc~KeM?J(deU!7v~7^qv~RsU z5`$zW94LBQU;x287+ir&(v0Jgg326GvHyXI%9qRk?hbU#8x+M)FFh^1ZJY#cF(e}i~*Fg*J=Ts$T$bt?ry>4}uAmHiTU*SpH;QrR65x5Vt`i<6($l`}r+&u$xz>F8r;8AwNpe-qED zqF`;y?RQ@x@+aoVD`6=7Ob9C%ZnPRT$!l2D{wR%+^7$>L{0hON`4kc9~~RAb`B`#%XwZVmO3a%+7S=oK=_Q&d|<=WvS>Hn>xP z7bsGuGAI1G@9}Kw;#$j;646PkPE`@^X@mjGnLn;kU3pcj*v6!r^({Ku+9Ld|j71Qh zMy0e&45km??a-2%QAr!SUA~v}sI$(l7%mbDilrB`JN?paGi>;3-C?e)GU@hC^36Z@9c?tV_d*CC2!0!W^jenJ z%=V7ps}Vdkm0(3h=i3&f$g|B@2o4u-jiK>>qB!B^^5f2 zZWpUyxmeLg74CCZHoXbj7cWGIu}{6Suc2b@1i)YcW?^AUh~B_LRZTlCEG<2PS>g4b zYUTRVtEr?+X`47i=g*TH_We9Ncvs3-H5UYME3@S1Pg2yZt;@|H*hpj&hHj1?_w?UU zH2+AO+rZZv@+6E=Ew`oK{FhhJXtGMBd)(-JRWZ2`1(&YFU))~W5g6jvBk`V_lR@`y0C(+-w-L6&)UOIT27$Ve|F z3R^%x08zx}8P`)eI5;5l&QPY%WP>H99hMxL2i9|N%z60~6ci}JP$n2l%MY=BytGk4 z+3a7)ojs^Ox&I1m68O3g#zIuh??aj@=*iRgq(2R52p*>(0zb{n8r- zPQ-6le8fUvi*f(lHnm+dT0U0vB^zt)@WGtC16LyD=Zp?ha;%kdj=YLF>E~AnqlM>* zW+}`K)99|Lkl+yQ`X9DcP)*$u#Cu;~r){G82EF#qnwg_}YVW3h>+eQ)OsnFo9^w5A z_LZk=sW^!_c5-Ir*UEcuC1xM&yS;o?Mdiy*Mi@pYWB38U|IU`@GE$N1j7EZ z1O0SLshd&qQqM{E!6?uI$Q)k!KoF?De?sP+G&sIcb75ke(s0%w5^$6>Oz#2+z_s&6 zrbbc-4B_LYE#*r1_z~VwtkBj=Nd-P?)6(+8_ied#*EzntHb7l3X8aIAGmw8&JAEnK zCpjE8jR3{#%~?dVAv-GbKa2{84jjfjdxG*?%WoSF_~SPmkTSpGH`nIQ3>TP-ZE=Ef z(Uv=TRr?k>)zdk(bj@Sf-4v-@m8q`=)+$nYI?QQ2HWzdD$!Q(n#1BgUIwL`z}-X*xGZn5fJQ6$fZ8IfU_B^+Ko;q^Ckb6%Q_`0k{QfpII)#6AsVnGmk)86?sbq%z?d9M@f|4qB9>V5Fay8FR zP9DX&VONk*?`#Z|{+YLUt*JSijV9Vdb>+=No2SYl1YehCpWa}^c-u?cQ7Fg^ht)B; zrS`4z^fQ4g%3O=2_bz|B>iC^ekM)f#FYM7WtZ_1oQ8Hg5Qlp<&TwfI6=s)`s(VZHp zdbfj@!{^(}#p+)i{j_rMC-8^qk<;6aom)?^8rPcegMwCeL;9wjF_2gAJzq|{jGVDK)sAWf5dky359>SWp;ENU;I8@kc1Ze4A9HVKtGyq%_hv-Mypye52u zKNp9It6f31H@o6A*co;M-SqP6 z#cVxZ>XM!VDn{+8_R{Aj%9zqvT3$X$%r%pQwN1B!#k8x)8d{raPag*tY&yL?=A48) zIF;Y@pD*gVju~|vf1yCWe8&QPol;Hg3VB)^91k~MXmi6l+drf#pGX|LXW`$ws_3ju z4F9UeY}wkSrf7rxigWnKyV?%lRHC*TBR_XA^w7}0@fsvh4kg;decek-=xt&cx`k(3 zR9e=@zJJY?>TMX2+-L;O=@1Vt4*tC~KD|6bntZ|ZoX*mz6vL&5L)E=Y^3Pw0t@8@g z@S?rxzMR#4xmLAt)wy}zxp_(a!ui|FO{?0W7n>5vMM9CH1>6m5TXzN~y?}L+8xjIdMrT1b6j=$b@h781VwxNAcXZhQ$9*XJ;OdRom_HO=gKZW9DQoqC_b~C?yf8 zD3qj-=t0IJgfvJ*DPv{IaA&GV#yc8C$wP+Q5D6JGML56R^S+<=J?HcOanA8+{G`42 zy|3$9*IMgZ>-)1aKfcYJDjmYQ+Av-BxIWJY)}6C8Ox;CwVw?AW2&q-yH)@;Tx{>{< zakQPM_g{s@tsVKAM-nUAj%w@9I`M5_7mgLR>U$Qqo297w56;co4uyVmwb3|8`_}}0 z)9xB{|Doq*XVNF_##1-2X67!|a`GLpR+;H2qgy|>=ben#RupL5DXgOQ^$qW-CATNy zj>4@eW^YvNV;HIi6B8C5mp5IOF!8+|d&{Wu)n+lpyRFpBhVU~l_vULV2PBUCDhLMh z$naXtm6O@L8`y;sGG4j`Uku1&TaC|u{gUFwR+ppJQw9og$z_r)KQC|FqSk+5WY~xQ z-%QB;#=hF=Xw6SWEy)L7M`=k3q}(0p__)oi?NYTOr|X^wy~nxEWx6llTe%f}WW2-l zixxgIqiw^P&=?xvaE)&LD1xFJzgeD9xuo(sudK^DwbWFq7(9hzf5kHh35Z<67)&R+ z1~$sz>MA~`Eb=~0Sz%7Zd@4@PdOf)6fxGg%1<{EU^rQt(ZQXyZiKF(2#uoM!sg!Kx zNj2-rrBEBPd|ef9Iu$sY=n=S~=ni{d$MW(Y*F_R;+8(=XO{^AXb`=rsEBGbRH6W(7 z|Max7s$jOc{X|1X!a2IuMcU}-g?s@O3T5h|V(9Yok7_0L)3!T@@wV+T&fik%B|h95n;6WRBudG*R;5HRU|+9RnZj=vo9kb zSYCuVcMDVoO~`&%&e@41&R&B}8O~H)g*X)%84mmP8v{c##|G(||pikk0Fo!e#sXT?}d;F^1c?wxccF8w#m7@pLof5G~?hvutoe`VXjc)Y9z7X;&vHsyKZCZP=&wsZm`>Z<)YRe z4XKfS>uMrOls{x(jeW|{S399pk%#@YG+qkDQwnbKYX!3w&(sxtT*Ibo9fXqj-0NOu zpE~uDT2My>Mg&VyR;8A|+3IU+5iUIQpawBU#8}tJ-q0N$X;fCIFwf~fw~4f7-N{Jo zzM6x5`beYuyJ4^IO3nmOzK^+~6YVc*^#jPPO8A`dISZBAB#{g=Q-|?Y3T^yi zD+CcS1ve`32tKN637Qknkoiy-_WN5cvR3mU%|UEi<4~_w=s6JJS~8aVoRVs0_p#xX zw#20FCtDTry(aB}UvZ3@=+H5J&#Cfo!Bp1hmi?yMuk$`M2);A&yq-$|+=Z$Z|yujN8}$U?e^S*KGN?9lYF52gyU{DvMmvw30R;lH9S zWnStmzY%1pu*1A`8LY0PQDtw6*%7^K-!#b?c(aq^pEIyNhfX?^4bJmVE%g^9ni*xK zq$&j9J#?gTof>f4@QczR`TIT0=xy2^GEuz#0~gJ@QXgLom&w5im#-urk3wM!<`8bh}S!S|QFT6bWMH6`>i&|JxUYLP!EfK*<-YjHw&Xa1I zaWP379akWB90T0bx1CzFWpLb$8){wa>|97@ZE!950>Q*r@83_m-gcgHb7`S7BP&a9@7}%Xp487S^f5LdSgVNpSt= z#Hgr-TTL>U72*vaKVHhu&o9q4Od6Xfg!uWHpB=g0+G>?FTvSv9o$$DT8&!5soqm!r ztd5QZ?(0=528BD!42b#}rhAg=Mfpf&jdpgpY6y#nP*$yCH;T^fo1829`t>A9+k{${ zT~Z3svZ9|VwykA_xC<+Had22gQ7{jql9CeO{o8F1KCGV&AS^O1gmf-!1N>dpZ`y@O z?21iDhy-5WW?Jj;;lr=$>T004JkoLd)~(>jk00-Olelm3;lqcd^zh>BOC2vO!6GZJ zBCFwoy?M>&M?+loH1EG(zoPu7RFOqBq& zCFka@Agd@)$^iy!WL<)WAFD60G23P5eYXFA;@MaQ=tZ;jOTYG!1rWQ8jH)hkiKw90 z_3WLycZH$NEs8M-kBp?DymWlNbE&+!{u%~3qhu5{6j z_r*u4FU4v0H?(keA{h0_X%m#e-Cv&>-%k7eF7p31AWH*+yt>$OC?BqUnfd3R$jt12 zv>D6YP-XpM{e^K(AbE*sX;P9~dp?xMd+}#KMNp76$1)NMiV#$ui#hG$@&fpaVp87g8zs#SijI6><)7lN9G4hd zA-Pop{WiJsxxuvz+esj;<5JdvZ2d!r;vu0ByxDg$W43SoMFj-=(vK~(OWr|WTM1-_ z8hV*u4Un-fU|ee2pZ!rbuOtwOj3UWC<~1-d=m95%*DA*n!q{8OJntSAdOhVha+1yr{`3N#w44HN(0ypkhR7=@ zP{<}{Q^nZSjEr4u6rnS2)P?z(NE9-to_r@nb@{wubb9;gNGJw|o23~>VDgS;=jOgI z)iG^Np;FCY&Lhyya0LXv2p9*d!&?FOiC&|#cko^TOV)1IGcmbNNEV;%R1RUgH`INy zir8f%$hy6xO=&qxu=iBc!Lqh@Cksron|{9+l-wOTvW^Ic_<;9Y6hay8ik8mG23bPy z7uM1ZHg0Y~^@KX>uOQ2;gwfaXH*BuOaUF3S=ntUVwycfaP3o(9za`s}83S7i9B=Sc z^FDCca7RV>8hrz14h5FPkG?c6v9ucPkbOT&!MR(5g#CxcbdNgpSJ!|^B@uN7wp0qL z#rk;qcumhN4T5FAH8T8q57N_Zy=*0mXy*I0WYCRQY%;?-=-7we-xnY+g|rQ?$RIzY zb>*i_^dr+wsY#K^Zl!hWmfyK^2am%|*g-P7VQ30e;IZ4U-@m_XEK5Tz{c{IbU;;BN z6wltl#*_Tu0TZ@}G7t5mj?_a0si{f?VhL1ryUiBT{@z!a6))NfJO(D>3q zwWn_o6#wFX=f}%2IpsLcp}%r=SX+xcdGdtu372@lq#1azL(y|AR@PX{$14LF$fF6c z2*a*i;UI#VR&@IR;6l=GtSgvXN>-KyQ;G(vb$^FMcv37jiX{IDc5&Ztt9M27nKskv zE-^%DI;aUVRQ5{@{j5mpbW{_j@bZ2suuUVEDlTXlUKd?u zdWInINod`)u(F{@TluI~sf`JZJ{IyY8rWWo5N zyC7zccx9#$dtr^6aD1y=>Ow;vfThR;Bfg|XigfsY@ri?2J0 z`@XU!L8WeZHSgX{-u?_79MKhFB{0D&_M4kiAR4mAv2n|4rrXL#ub`rgERuxoVpRPi zoR%G#7ITF=jEvY76&3wkQ}Xj0`j=_T$+2QZ&)3|HjqUs6>JNwa5;Tct9j+}d#eq)2 zryC#P+juaR^n;K##$@kb*kan+b37*}XS3%ZUr$dDKoJpHdttt<^Ga%}6xFpulfuW>t6?s( z4b)Ysb?c0K`}%$wyEoA3BT5A)Uay1?DPMf1O%`5?JQlOQrRDAOOFsv=ARVJjZW#Df z1|A-h4(S@+6R+iJ_USB0(|w1OD(=#|fU*!k=^0P@zNFs|MgBcnIs!B}j@685T$+D$ z%iFDHOjja#csJwX_e*&ena0-ZfLP zR7P%vPDNJ63F>=eVq#`R(^67&!TUUjrO$TXL=IJR(pbv=ZvaoQX!mM6qX+*3P%Ela zQx;vbCi~C!pUZfhn{%gbQ>}7(Iv0mK^}W5HvT<;%oas29l#!V^zQx4H=NX{xj{vOy zy(vN)ry7Pc2HN$dh#DT7W?CEvL0-EeEl&#&87Tz?BN$$an3xj!eZF#C)MGLf@%Y+9 z2+5yOb$l-hA4twZF%}0Of`5E{H-2Yc*|b%cZS~^fOhqIla5$lR4n(~&Jz(Z&(n8SK zVTBML2;fo(F?2t43WYMU2v!G1fFNxI zr0g--Q=UH;jTBJQ!z0@OI$XZ(s8nk9aY8yZ!DjDXu6rhOBNa;*;Ak)q@Y)E}?g^+T zaIpkeSucV|6x23ci!GbmD4HNJEkbSbcG}p8V{NP;aFqE3!_%w_=vvKwqN_a>|&FT-Z)YS*39--4r+%jS~Pg*8qr35f;7@6~%)Iik*#7 zOiT=>Bc|Rx_|m247wg}=(Q|fQi+#aw(jUjef__BAw?}euZ*L;9A%W9qtgHcH*O6pT zv_RIv;cZEA@o^MJ&%#4l|5;E>tfLX(+n_swc0L{?LO@Md^_e(9f|$wuWNvCGWq)SZ zxo7@w=s;=BqS^ra?6UhN%>$}8#I-oGn>cbTIf<6i^XuVH!vSwd>(|rwDD&ow4|ny2 z>7il&xf;yMjrGiE8!*K`I5?fjI zKw~;ALfA`jzvTxG9H4(`9rl8#wh;P9TTsx7&?5-Z+{8~EsR_UD3>d0JlXTkq`&+3{ zkH=B@8U+RRys~LwM5_@XoMDhxuUWGUR=1@*U@HkjhKdI7KCLM}a%c++3njI+#o@^R z7@*t(*bI)B+x&0|?PLK71NH_hd2U2MBK*%?zcU3)6tjz@GzJW*OG|!AUbde8r!&v@ u>HfFq<}3pl|1b+p|9=uE|6?)6FL7Jddz|a%y7`X4myv;qey*O~rT+p=pEM!> literal 0 HcmV?d00001 diff --git a/training_loss.png b/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..279488bcbfe74550e29ae1c771b2caca834e6f53 GIT binary patch literal 48854 zcmeFZ3Gfw?EBsyp5u6*Kj8ha_fKH0YhBlzXN)nZ7&rNgns?JGskOt5`cydj_okoE`@}%yCTzt{&a7$bT+2>aG!`ydr@%;=_{n<%K z)Z{6TOQ&_K4qH7NW=lw%o^I(<$uIx3;g%%zd3tubS9Gz(qs5J?E}xrRo`fTSy4_gm z`5?CU&%Be^u>fj$l1an={~!O4i_munXiDnzqN-M+O zvYVTm&j%^Wr-!TA;1xUDTLYr0t??nYo2v`IhpVgWBI(zsl{OeQQ3UtgYuL`DYZ zlf4%CGM~C$M9$c{rO`NYvVtba_oh;my)!xz09|E7DR z%ael#vu2JlGBMfz_()T+Iu>^4z1gFJgmKX#>;9n5jN9ciq&4x4jTc>ALsklul$7L* zj5wvFr7!fGdZ?w}?5Xq+Q_t3(oPOP7Jk^y2JNTf#qIFr^W0~8}-+$pp^wp!>+!PHB z4RB#T{`;$T%xCWr;1eGZ-slMmBKndbMg?oa!|J(oT|q%%nw^(q;D0;?ISLERuBL;o1RqFy2&rna-m-Tj#~x4J*s8%yW0{#9fLUH%;~oYL(q#Mte)g zeFqDa_q{5!Mu6_cdAi5C9cV_KPWc23D5$O0rD&rD!hu{vnS!>F=GL3$w8a31P9i?xZ(ftBe*o z^Yn)N59dQntF*YW16 z?VFg;oYYjD_x9Qenf2eCred#jD*k>x!`07vfBsy3L&NCHNSO~!Y~EJOdAho~;*P(m zv&&~CZ2HerNe9%|E6fHMH(wHzlw^X`ImyST=;~Tx#8*#58(M#=nw}$KJE-p+&#-BX z@we~a32bd`6WBU*Yn>HKHfGE7ta=4?V{EoJ*OV?@s?9fUW$6xSA}VSKVHhWFfAqzR7bP>r1NXv4 zEb)9iW=n(nxil)>Mao>}4#0;}u*onJQ?Xig#Q9`qau2voB$AMl`bI`lWmhh1S`C(U z{_sMnxBhR6n2n8%fSA|_vUC+nM`^#MrRBo+8&^351ZV`GQP9xPlx(k0+5i1Cd6pstG|pKG^Eonn8QorBx^)rTwvxX#oKQSPg6@d5}S-u7-xCt&I&YM1s#yrAJ+V zKT~RIYRO`Yq?`H1cvGam0mJ=&owvC*hD#kFnQG^%cUr8^oIF{xxwZ%yO!`bE$ZKnT zG>oq*x7>Q!b!E`yQB)KLkM)pAETa3X!y&YInBNq@HJpMCQkEl8S zV{2;@RJez*9tsyOjLsAf|C+gKMv>yBt#j@i&ZhJy9V`=vloWHT)FOp2BjwzJZRI~Y z6ifj@K_6gM;KqC2n@2aSz*BfdeY)FIhyF{UteF>ACDAW`-^P` zA5?j6#BZ|Z=jZb~{kgfizJ8R8izugR{q&s}r?*)UBaOemy`(vGh(K0Wc4>ByX=km~ z+jZso>8Gd!JdTd$fRf6_7CDjRaX|T1`(1C3mDxbG^!oSa9V#{j^+PMm5b_GcRh}sB z9&sw78jks(EdKQAQ&jU$23fC)OScDW{fX@-5?x+s726D0x~)&X`PS28cH4vUf`UR# zQ&W@0?borf^m7WYT&A*$@v!!e4r_NA5233kt~{@C>eeBKO+0q|xCVt9C22VBd*qo4 zC@fqmaTr8lePg3x=et{6k;RVO+EA;LJeM^vIW;v}m(6x>UHR%%7D?wgmRK{J`*RIp z^a7S$+^`cUwkkbV8X;E9ZZKinD{g~jPAJlF*g-Cpk=Y#E%Z7$WZOSIOrUyz7o)12N z_E%=@$3d(nR?jOm^x%o3M~~t`pnGmCAEr1R-nz2hU2Z>qu>yiVBrMEdo3|_BP7L{F{(K6E?* z2=&>@ise4bQhzm9SMeg-;Rs?@S4>1i#Pv`58!MZHtg7vGOIRtx(GP)U78W0%B1OWs zqVNrQ_^_TcQp)ec2l?rt%Kl@AAyRAxJXZ$egw1J(?k}ohWo#c(&j-&#TkY$NfL%Js zBx+T2@TwFJN|1{u|QM=xr>kr2M5P0d=kI?m_o(cuY^@V z81r9*TJ_;k86=%E8@9}a8C4P`4s%|7SOX9(P}*a81Zv8~NLK0j9-~P66%QzU0uH}a z1^~2}+1NBf`9`@o1{F{2Q~TCJ6I)M-JtrNHWW|!`k8whYgK|#CUZ5%eTnpt#0rY-d-PJ-FI7*3r!g^=NL~}`c{8(<5iF8Hu;SS59NmUU*=;iikBp2Az>n9owI8kw zc~C)MRM@b29HOVk$3A@c!0cXe{MM~oB@2yAsA8baM{C6DF)iTg=4Jq`_`uvE+GXqF z!61zS6N8S|s;K!2=+|Jp^Tp2G6*EQsc58o)H|Oi9P$w$wwu$>DyiIwWi>psWcOEb& zgOCXYN(OiVCp67x&z`NqGS9D1<@A3is+(Kv$uru`JMWzhw(Z5_9d-x{tYinT23FY) zt~mZkk+l|K3+Pk$7(ygVQ{7astWe&FQ5gVAg=uERY_MwmZDg{QJNjtknQ4-*d} zlO3eu2-JPiYPRMWo;m>i3nTtihO6_VZ`0Fj0j{CWt?j+_4|6n%XoU=hBF~I~3lC2N zK#E7PvB3aoDq!VYVYx>qCYlJ_yS%0VU>@);PImuuN+pgT2YJjXYBONAINrA?X50cj z71eQ+?R0Z4f4-ked-KL&j?EO}I8*tR;lHjdttLGErf{Yv&FHA8nwCV#*o~DNSEU>9 z^r={-K3ZpFWf@05e%u2etp4&_E_ZXj*zkR!{v18ou#E#06nCLBn-x+vqW;;{+#L4x z%a@bOK|EJ7nT#K*@kohW!^-SvBz9G+?U zPiMx!@=L|Ye5~h9vR8b6k=>{~ozEwkr2Bs_iL$f%+{);*wjjsoFpteudmAkPIcH*< zdm&q&_7^!$s=@DJM;BR>qoeDTU#TqvEt#;Eg_M{Y9j)z`ahcT?<>09Ou@=j#WARst zN_LaKST#$%017yF9se|wZAGnh&bxPpm6erl)udY<8-O$ZCedRXe=>6ZCV9+{)LL0s zoVHC^Sb0}k`fO&nT2>N@Nwo9jW38HC^&d#F6Gtf;8aJkp7U$;_Kr7ZUR^!PY8Hsl!? zL3!qO_T3{v1`ZAmfkSxbp!)vuV)OFyng$Y5&vIi%#O?20w5VC{-sMl(8yg#QRnwdw zZwxoW<=R$ni59D--^}+XqBP_@dbH=)FO#qh;G0Vu!cq~ZpDK%&4 zXKrV^^~d5jp%o@ti-XN%J4HX!#nFpEbe%6OLb z_Gi3%XC*`(zbJtC z=iP@VCMJSWZH1m$0$>RnEGf^poihdysyJ`r*yj zbacX@bK$pzkM~r#37LF}!^Ie1*VS#=QiaAu7U~lc#vVucznE>~LK$RZ|EJ zC%W5=NJ=s?c~4JizQVb;fFF;Fh&5QA@1feUt-pgB4R?qRF}D-kDov1nTBs%ww;6v?Q&VeubCqq#R2)(Z8}ST+ zTR*R>n{?iYZpO{_glc^K6cLMnApxed{9$-__-^^=gxRVT>@;w}CIoR~jP0Q&CiJ7^ zHH0|4Q(!`gE($pLuSagfgTrTXOh`q0AZYGbE`b(mG`Lg|3J!$ar zBoyLibr0xJP{}J+G#(nIw%LAEhZGUF8^M0HCP&%~mMz#6IH~z?4o{?|9m}5h7&W?b zCG}cLMFlgY(0O%rx=QolC5~st+RCc_OiqR0>ZbhKiZ!t$zfJx8s6 zlQVUbqwWwO`RSWAeuU(08MpaV5=1GX`o_t6%K-4n^%2U85l@PwQU~HQc+O6pOoW@ZB`}fASNbGkXi;H)>PQ7OJ1rS z5fw#^h$2V{v{F7y)%5Pr7uXK4NYrm_djX<(d-L>w$6RH_#-u4LW2DC;rDI(Fkskm4 z5MmW`K|I!pke3(383T#g?o$IHD4EJG&jnVZ%kTR0^Wo>R-a|hYJ7nLCnwB_CsViK( zC~@<{r=%72-;2aPuuQcxLCHqCx~#L+J6;I(jY~r>CdLLFKt6a;QWCdfYW3seBP6sT z7=(Dyu-67p47Y}1x8)GPZe91u<5KfA_!X%{m`c*{H-QHN0s>soc@L}kmSt{hYd^n4 zZM^A0Gk(WxR_reM)>=A`6E(}4OoHViU}=7+>4=-2JV`P-Iy!JiOAAkKe6B)9;O^Cw zWoTnB%E}l~j{4y6=cfx=$Dm6M%mDwgty<#(aNpwOmZMpyJilS93Z(?`Hh}hHK-Kcf zy(WQEg#G<{k6W*5AiGIpUA6EHbgcsbtJRxicGf16Po6wUO>rnujhG)G7PP_-0FVXT zm&~k&Dvm%;Z)|^cxpV_Tb`1>;s5Dg62M_x1Y*g=@ulCx?g;Eh~H8&n98_})j%~D|U z^#gQ-Jj-rgpbkjB;CdDTmC*?LA0&D(5NF^35BhDZ6D1e^%(Gmy37Hzg+u}s6<3HU|%sWDr1gQfGgrxH{_5I-`{Ir?lPnE6vh-&WM z3&`3Ka-JVK_vQInL@_~Ns|DFG7ibHtlj8i@FON&Vi| z=Cif2BB{O8+EwK4;V}-G(NkbbHCwr&i#T3^X=@`if>z@KsJoz%=r5O7>(}Dhcmq7I zqZAv^zuimd(U)O5yO_Vs(q<-%B%eG8EvcQ&#h!d)a>Q{}ncH@{#H@OJe*ZQbNgyfFtdPJy#6YmnQw91s^64&mX;IwJa0MQ!OG85h!2H;V{gjn4i-n{@0Vv z!okFZi%T^=0QRv0XnIeX(;2vWIDjoi?2E}TW#P}&*J94ockY^)fWlcN2deWzuW7Qu z$0&|fh?kNLsej*Zl-yqv1eKH&@(e=b2+$5^YqUGmT zJZlRJT4p&Zk7X+eaOMOt+lzPa9<#8pKvL9#Zg6$AtT1D^YR4yQH$H2QC$Fnv4fr^% zCTo8D{26#e$V9*K;gL2d$?%y-->BI9+sxl0EZKelq?L^0C*7BRLo0vucaY``L#cYA^C#SfV9K2)j_P>B%3L&TtB0}(M3({_tO&AZ0N3qw~u z)A6=k>XM3-kI|~c3zJ53seX{0tMEU3Mt!7#UauZtCaMBUzrXosSQ<}mr~{|~pdfj( z=|<*CS3E4%7?RVV7}!DB*!PDAD+BHAoE<#~GPJ1iJq!_=l7C%V0*=40Sq+q2w{w2E zu!s;>_VRBa0`X7o3T{`0{L^mCWFeoayoPBC=`}Xp^Sr2YHTih4dP=`G(-+TV7V|{_ zk&VacDTLf24)~gfK}AOTIFe~}bXXcASi+2(V-|us;Xd(qwpXeb=Dc^9Zf9%PrkwMi zU+%XZhvX*IUz3JKErB|d>oTVcH}j}DyZ`08cVr-D16zJNGW{32<-q;LuN9UDR*mfAe$$?5L^?RgAG}-{j{swNng1qn^Q#ZOoea^B~0e%POy`#Y=*=dk-JYwX!2>%5++nb4)JaK61Kc;Y`ZYB)%=719D1$TGNw0=rDTO{+1_n2@Lf3{gJy?B`MGQ2$(xlWJ9fi5BCVkoHIQUuW z$B!TSb3>I}I)T8)KLUfazI^p+)6!(eqqw+`Veg$mtJgiNYgxt|U$19$R;YM5I0&Jv zftKxH#|KST*AguK zOXmtWt?AZ>P8}lq#%Gr)u&n}cC+hk0FI!zqjEpMktq{+|n_F9M6O>Re3UYQJpPFDd za^ad81qNS3Lqci*Bw76xGx$L8@#nown1fY}(iLq(I02+USdTQKTl77kY(O>%l!v52 zpA@Fz#ShX?JnQ&V>);d?P>?YCzWAl>v_(BhUjGFu$N6&u!5}=~x-- z#Hkyv*-xJ)dwDTj9x4n-vaPS_Y6gZ7$o?^yJE8U?fBrn-%2_CAXuJXv zvg?R1ammWXxp1+e8dM}eGDNlccYiS-fOVu)fM^#i`KYg5RO|SO6Go7kuG4u<@Iea@ zLma}wPsHNXy)o~x&=W`k=Z$j((e1j1#;%MDvLe7v)YkdU+SsFg-*hd_4YS>NbLHn# zUz~nN&qG+C5qOBY$Hy<1jeh4UeVY zzQETst?NLB@gEq_2DJ^t4ls+?9FD1kyK}3Q1pMa;EDoBcziy?wL0u3f!Zy&e`?Ajz z_T1zC&Q`5^f8m0SSv{!J+;mZZjO$?)Ly=HNQI`VcWEBRAg!qd)TXWv1Oa)OK@k7fF zF#F@DPqh%gk78m>@+f~*wF2SygL;x+TSXcu4?1jP=Ssnn?r)E~tZqMOU;=0`(^nW0 z5+Zl~`Xik=ORc4uetJ}5K^H+|8&GAkE0|K6DXv0eLfL@^8l$7W5XDE1A3t6Z_Wk?! zoA;N#DZ0)Sc0-Cj3<)7Yi8NQa!rGOo;SUS(p{Xgjnc>f%`&5=F&w-Kgan3tZZXm9S zJ5Mvri6V&}(HjksEn4UGVRdfpV?>*U5y1)Qk&{6=TXT`Xe&ks zX=(4kqZ|N6FAej=g!uT+Lw0qP>Tl?nVtoxXVnE}%J6AG(K=kCvkf+T*r{_oOdZ9`s zx+KE@CIAK>+)zk9f4(bN1ZxR(RHpg#A+i`_ryHBeFePywsqxJOd@waN)eQRVdpvB`WXkCZmn&n%2JcIxPz_?plZ6d0I?beZqz zH+sY9`N*miL6n15II1jx1O&fUEj6_dyxJvE;gON1NLhmkvNMeTrXd6@Zue&j+~*te z+OQUtkx2qkXgW^7s0RkEi?bQ(8NDDlKBuIjGCdMB`a09L?|o<@xDuFXXlmWv-11;p zW5fpgTJ-kq$6wC5nc0WxU{c=;jXP!r#P&1MpL#$rPIw~M7HcYS`^sHt-qTP_HK2@k zb$7?kbiAP|2Ze4Kko|z?^eKF!O{rg>@zI#@_Ja@FM;KC@{v2{aS{Yh~-OIyzV8;JU>f&(MmoF;LpP!t{glQ?$kt3gYb;`b{ z5rpzs50<;|c|aBvKsIDTb7netunv^&!RepPv2Gg{HZ~?8ov9YVBrj8i%gEo~zZXKy zdF}7dO!-v(LQNj@%-NcSpVPh;#rT>xdsxn{rh3n^d2c@IcLo*6`R|WUnaRm)OmuXO zGEfz#p%kfB(f{JsDSN^K(-9_S<}dE9uDS5((>gAL4M}Gm8h=!gl9E<*r`x_Ml}$B@ zruIBVmnu8{m}hJKpHU>6Y)b_5*~bu0R`T+A8&Ko>mSA;iNS?Ythq9KY1I)8yY-D7l z5vuUvOq1cH*iCiyM%c%h-A9Lylll9Rb6~DvJP>88Y9z45LN+zwD4u9*Ko&W+U$S91i)*M9za zZyBJ9kOy0k@!Hm17+gSEC;@Swpj@BC{3`fcU?Ne$t9Ud5Q4uH?XCH)xjgF7kS?j@2 z1kL9T9X@>a$(liQsrfSe*5UF5fYBK5X=x+% zp$Ba$m4v@NJ;k4$VEU!CwRP70QbewL_a~Tm!dUnT?vMt^HOtez{xIG%K=ldUEjH;# zEzfMwOtA!LH#UUhd1n{MAz`olDk>^mn;j$?pg#9}{HWB`(GeZ~@ZnvQ{4r0S^mGQR zYDX95k>%#5MfYSDo|m=36MbmRS=1592jE0sc69{bR4kafo%H_N&sg=yN%_m&XZ;KM z-s!z=9Z1f)++TPiTEHi55zXIV7G%621IZ$$@iSGLf%gd4F)ps4GFcLidP-QrQP8RB z=Az@{|IFv-8{SjbqGFM_Yaf^}GNM29_)Uu(jvbs}@=EmMPtYpDKSLHB2l|fBOamlY zt=`#?eJ*Z~cj3Z?Rp9%C%6@HBNxy%7{J5h`t#{+G(Jj5x{=ZOA~%;B zTD^^!|6}APdv_=10yID{7^%=1{yr_CirvxEi}b}OHiSu#C?By9%!r;mc`^b6O-1PW z4<0lbhQ%S{O(Qw=<@_wzdY1+re4r`HKz$9~c)M)c!d197^;EULX*O{luECyf47m$nW3Kb0U9qpqLRS+ zQHT7>JDqv+v>W-&?yfF83?TiU2W~*+HfvRGBZZK$-S_8+{*Pw%`+XYZfRarTsKY>L{BL5kBF~^Ik zeB1~CmwAv+USwxSXpye~ABa*qrsI5(nj^sR7I!l+A1&?brzKSBH_51|B6+17TjQ@B z#JV~=IXF4}H(X$l(B9roO-t(sXx9Kn2mozrfKgLoaYCjCwl{`%3_-}dQ+5CB=jP@G zXn|*=tlu7PR$n`lqa!20OqslX)C2y zYW4N?pw))uU$luZ)&LpwC76$38U=%4(^#HmE7B~&0V0?{l2A|t$fu?V@&4n}(8>2H$mxl4wWNPInpUKVg?8OF#XaQnqm0!UnkX=H!;g?f#> zu#q?m6!M$d2w;HDs=`}fIg>1WAb!vZSN_(4knGS+a=uH7aFLTwm8D=#3DC+1Ob^gx z7a*Q74Afz&AOob1rM-SF&lNoi^;vMz9p+%J0K=&d9SUe`yM}b4I7t^?G_sqOY1FBK z3FDnSLqZU$sl2_t9jCe|lfBkY02IEEcI6oVPz>F z{#<-s`mQE9_A}T4;koa9XUw{>J^c?fd;@6xyOII0gk!)BU~cm^GxNvnA|gCMDC9t& z%`W}L814B#vvm-G#$Z3uAQaXwQ)UGSeK<&zV*qoIOoG%;?J~#E@>@U*RK^tt2~X6lmVq+n1zo-U$kCFRw5s#V(3j9DtJ=%?|Ysi}o;ifjge zWI*6!#Ps3K$i#>0I0cg^1vU>kHU?u!vGQaDhe05!%_<%u!&YHloQLKnt={9|V#wBo zIrdh;Y?U5Zzm_3`I%VzF<2&09Kx8V{JI(YgiVsc|e zZtm`A?5lM3>I7a5JZ1b~uzafArAwqiRBSEQ(aNuoxk=sfET?&#>RkpRnAX7z_-B!I zPcCi;vMcJ@v(U0KiMO49c(v?$Z(YZfAST|=M=A4LnmzAG(z2?ms(LYZ(C1U8evm;) z$^uY4BoZM%4Du{MM?yD<(1Wu%xjjWV&hgUw1IIZ6#KVGbjy;hDlJO0H-%VGn`bupS zI_x>X=GJ|R`uglgIXO#1IWfe0V0+8^3=sf^K&=4Ym6`+&@T<}Nh4^tz3hNgowKy4L3 zBk#)5iv&Jn0NamhDa#O>Iotl?{)VXXQO{@q4iwhcr-^DcI3^YB>~gHytiI9<;88Qn0#TH9%YfLBLe3X%duMm?H5*gW3e#=H%?qSKn^h zuRCGuB7a1VzA4`-L2Uumkh8!}dI~M+LA@q^r51{W6{t{9L?a3kF7_Q!#j`&bw7~k) z6nevZ`cMTwJEfN@lc&&alJpluQ+HDdg>H#e5tAQCEn~(OQ(8EVDbu zP0su^yXN!Ev3Ceh{OiKW~E!w;0Sq}kuh%5ZBd922n{_wF}Q}HN*ln?Z(s(f zE#?E{1={XIHrb@&o#G*Pa%f8=ARz$90a34{|B3SPB)4Bj!1?x}yPF>QezvzZ+#>a$ zIf1>H2&&`&uuyPfQBNjL$DhO;&k=TpuO82$E>yLcF2D0<`WGx(Y;8U_V|?e8HKUog z8@HehBJ0)SM5`iHL^Rv$w3O&KZZ1mf;XC((dU z3ebLu`@hpzN>vpr=q4BJ?D&z+vngqa}{ z8?X^@XJBYzp7QoB32HJpEt60Q5FnD%;ermEnJRA=9VrFI0Ut@Ky z%Mq(dS!K7<5LbTh2|e4q^ZWMz=-J?cI>#IPGF2nIDreeJS&O$q;;@V^tLWg$k5AFa znFQ(?EiJ8U@u2t4R!_CJEI1|D&5vCC4!i?7r~!3iSolSM@O|EgO0zqNbDq&e4G-L( z$cK*U!w>}+FA*6zIha>NVJ^~Gc@ajjW5BP`1jWFB16s|A zV`wx9zQBx`neH4m`c0f1NUtjckQ#v(U!Kd+twdO3YYXZrQeOMSK<68h0h!zUpIfL~ zk&Z>wfm<)k#XE93#MXg1Wy7o*6q#} zz^04CKqRi%5Tf8LQO)QqsvH%~T^ax>K1%r&jOz*bln5|c+3Ex4dbbs>2a;=gImkYo zJrZOpmWac?i(V%JFeQOk$8Y0M`<0&pJp?@7=+oP}=YSx4ZLgUIFF$?!7*)j7s;Z=B zJn+4c(1sF#Z{;G0Y(N^&NCb%s9s_973G-~s2ZR7jXC)tv!6_h4+S}EDVl`TAEY)TW zfr4Y*y+|$d2haK3IT_vGEI%W!=?zAv=U4T9;(-D+rX0a44SoRik=2E9*!4P?wFdxS z1O6xez8Xy3#4rN{aiRfq#a!EA8L92n@e)wvkVhIrjc)-oS3^+aN*pI?bzMgZ(_XzA z1y3dc2BBL6JP{_02myc*K(%!crrpR3fo2)=FdXLq2RjrhWEm?J@V+XwK!6lXRHV=h z1jM(4;%?a1NhwP|n zoZxw5meMUK7@*3D!py_Xc)IJC*uO3x?u3^cCSOsb_Gd_G{ht5- zMD_rWKnGl8Wuu|NfyW|$(Cv<^G6UwL+#zuJAN0E0FZEtz!r6_Xp`j}_lr%TapU1~K zjDLq*`Trn!6PdrxD)iA}q8X>)Tv^mI`%`5wKm|ayVr70GDeA;aZ>8~oHUQUyfi3*$ zZhjR%L`h&uVyZOxCDzvT`qu|<=WQq7r?^bf7#XR1;?Fh!p5M9LVW369P)4%+l!C&! zbLT=HJfNlcolfm|;xpzf%8gNFlgAl4LOW=Gy+HF^qb1(@FxY!?y|_a)a3ize6itbMhjRMC_LbzFhh-)W=w4tms1N|$9{iU zGQtwjZIN?;`el*b|ndP zQSz4(C~HZ~so(|tROVCM`kJ|c2%Q+uit`zWrE@4a!e@xvh)};HL0{{iRQo^NMK?$kq*HT~CMh_^ts<*D*Bzk5q@Zv}f2gaYfrJ7$WC&g}mX1420u&=0ot_H9z&YXC zhM*Ve13o1>z#IZVqTg``D)I+e-1nxK>#(Tz0l!bb+uO-Uj`0-w zTIPkCV81zf>{xxT>L@=&9UR#(ODB)pUH{+0M{0@yofdcl#Kelyl z+~}B{X?MY8?1#mpYedvFXpjk|$q3A8pfT`!RD%Z%Ir28bA|q{AiYA+D-kMYFihm02 zKk;k+O?8h$~>mOS}tm8GQ!}fElW#`TO*$UM$N0R zvbf)6p0F2TaMNr6%jN9t1u)c5q4-{Lqm)nE55l8U!a6lgk!(#Pwf?2Fyf8Xxgnuo3 zK9hrC|52BApw|X!W;Fulr(t3Fx+T5#Bl?PY_1UZ=a)0oU))pczp-KdUs|9_HMU8v_ z9}C-+-aFgN)=^4tsfBlgvddi1C-JZtd0gXOIPYdg{C@O8DHvOdmV0|(ck$}wA%Mdu zmw$2jUPEOCipTD6$d_$&$RhT0V>hUI2$AeVorg*Z1A_`)>i%*OB6@tp2jrd&|A`G z(8sI!W7p14?Ikz527l1EPQ35`*>O}3jTnNO@!A>oveOq&PAp}PQ2oZ<0x7@?n4;P( z*muha4WW;Xk2*eDxsW)N@av3i>l7&u_LmM1>H$LsElzpAG%G+AWomQ5-PnIfbZxo) zk`M~F|C$ePP=Y8*aIeftl3{~B?~l`_?FS=#GI>WUUKhNd!)$kv(EDpTar-aWy|oc_ zyi|d`ihBXa9Euu`l#Vfz^< z;24kP0Q4bb(>oRZ9ThTNcR8e-ISy!e19YUuc!38V2;MRpjLx=Of1*!>498KE8Z|ve)RNdAUa=%4i?9YSR%`&)Yei*i&@o$ znhmaHD*iW4z1-Csqpn-T;1=!q? z_f7jX!9xz9dHXjc^q-=Ed)#)K4QAj?sQ%~OvVN&YnpQ|bvG>Au=R_|2o@a&i-unr9 zayO=*%B8*E!xsMuV9PyWjhY6!A<>df&FTI6f`0x`@>K3We}-~Fbc_d=@?gIf?dIDS z8T-0~595B%*}DY14qME$pDxUfORHSxi$XeVfRlMD_+eI_$Pvsbb zKG&dLqad~W*Ta6h5!8;Ru&n$muECUMr?ez_9~VNyg5H6 z&pYdK?Jff(;jo6X#5A9>CrllEfwfU8Efx55?&*HJ6~zFa25Q<@VMG~8IF14~q5Mxd zMX+hS3-9%Rzx}^p7(VO6Dr#Z!m{<0DDbKW9Fa*gJl5qrY8FuS=AA$#65=6O9OiuU+ zk)&mzX9_wZC$hh37f})OWRYvs*An{gUtPLP@X^mV_NFWiRB2Q%-c!Ppez>9hY7edK zLNpnC5-e$dx0TRt6FJD1V7VHq(Q+u<+eH&kW7=?57*3jk2@oCJ0~^|xv0Z3@4vqr2 zhBNj}(6_?jz~TXmEGG&+e5HNVqX-oUxj^9vrqN{kD>QUOxCBD)#ryX+=eL3LN+T)? zW9vhclas4J$MV3M4NjPy$&r|Zre@6jKMOg!gw1EK=S+SHD7q0ocL8*&eJ02~O_+EHX6<$qWn(T;cF4$j{*Xy7F8c9Z`4aKSoOm z4zh=wiV-9-zsjbv>);?^i4WhIGvvr93wm%*jUtTk%cbXl zJLQ3d35pWYiK|KVNKOF7Xbg^;M*6sUO*hBgR8<=$6X5CQw&nB z{JeTqUz}=_WW8Bojw3q53EwyXA~&+n%)tL4igW)9Q16FeV5bL7ogLG!@xi^#$!P*2 z{}A?vhBnmPs^ab^T5jEnxD6NhhK6!t-}UQ0+C$dJrI~=%Dcnn4uxJD;(~_ z(AXQDl(+5+24O|*#tl@HZ4y9*2j79fy&p=oP2f(7BXEQJ!D{k9oQqN6IuDh7E~j!b z?3_mt1yR~wM|uCWL&yjC7@D%E7V#m+_!is^15#69CL{pb4f3|4n}+zpFyziRG&0JA zeuLG3f-?`%rw`|?7~rG_oOYZ?3O;Bc+U&o{mIU4rXYDdA>POq?sgewTdz6C)qG~$61@aS6^{QU61 zeuzE=eRW2I_akfe|Fr!hb@5Yk)9gsY17B1qoD-u#I&`i<9cmwNb_SVSYQe=j`Q?|! zO*r5Qa^=ZG51gkCY#-0U{wY&#S7<*-oVYyySJiW&=69O28!xIlXMTq)7H2rP6Y+x< z1WGL-h77B4B=jJha`lC#U8b!nW7=l=AIN5CzkZCGkB@KHAcmX=;3UK_K+h6sElC+2 zd_?m96;L4LhNB_@S&E!fqEz4N{6AL;{dp%uGl0lPU6d%Hy?{K(IksN1=;$?5`{jTEt&^8I>E{tb}zAwv76I+ za{Z~G@IFDYbH_+9#&ATo&Vdw;rGVlYch=$c<<4;jIx0`>vx_vn!?T2+Am zNJqj3`J0iD-e|8I-EgX-Kf-wYA@bAPBHs_(?qC3;U8D}hK1E1v5w zj@;M*IsZ*%!Z_Vhf$u)2>-&5PHv&z-+2z32W$-_KkrlIJsA;dmqXSFd-pIS@ZUV z)csyg4)8r7z`#s;kDmBJ8-K$`K#A$H3Lo5M#Ryp>=+_nz`7nk@YwZ$n7f=-7)(`s3 zTRbCqv5)KfeDLI4YSs1$8hVs*V{9Kpkid;_uJh{eq0^`$z#a{grnrLrrKtawj#q=` z32@dJ4f)nc8L)CDw298!KfD{kjLm09L!q=-fU9+44%JrWu-PHnm;fN0%pYB8O zu`-}{LlqB(ok1EuBIc#u&=FBz0S#FnFn>sR_ysuT>gVStQMDkdPkG`$ys|H)gTM#P zl33k;b0B9uHV+mABQ!~clN;c@;)@&DK}R@@jgN!zk>cvrtC$>!=!&AfTu>J(e(;F8{4qKjB)xNRaa;~g;xWo?_sh7KBD=e*e6fGYppyl0F%Gpof-6C zjW6Z_KR%EhIKfYM{|mU0Q?8vXsRjtKpc_DWcMpUr5F{SOmj3>g2Pqo9y{Fl_!=kVU z{D&7Km`|<7!PEjhjHb0EzY`oyS5Q=}Yi_SEdAd_j_feTo=$VZfM;c77IsZ57?8J{QXbLp#=4C#TXHwYu@p&p z2n+$aj;iNKIC#TgA|GLXgz#g&&(+IBxv3fz*tKL;?zc9Ftdk9In7@B}`(5H71#0ab za2MepwFG^_PgC~rKG9uUyNUCo!OB~Z6?thLE|@#zx} zx?KrkB%QV~$jJ@t=`fBwP%CND14b=yq7TGr2vTqx@G_;_P?QteBG)=haZCy3Qq1VR z%;({E-&zT5tY#&Q_LwR!Dw8X;~lCdzoUJjvn<||k@1~Uh}I3u_u_V?%)~iQUY3$~vK>z=fQ_)8H^sSp zmGBXM{V*!xwZL1NSKr!gqoP_+H8&L|$Q8l=J%(df#UKvkwdo;v8k4G=E$oMNf6vFomG znBA6yPvW;;KZ_qv#Po+71i`Hafopzn_X&h4(<)7HVTqZO4|Qt(DSs}5*qCI7jS@nI zZc-_6!4R+yE~Qy0iQokv{`em!j3-g(y(XQa;F+lFn%xF79Q8V{e%|J+eB0Rj71J*h zKF(3^33T10M8Jo)iZDJ;33AKa#rv0n zrP%DPC&&(oKfC=CzO9bfDIS|ghds{2mv6W&{z3=HSHbK6u3vw?s?`tEM$l5=3(Hv1 zc|4GX=4!h7YRzavu1c!n3DC#BZz>Tp%{*8kR(a@Ep)zyDSOue(>S@ZNw8J9`ye#~o zTLHYR5hl0f)4Rs5U33e6pIVk$dOj(*L?$by;aLWmHut*=m5=|lm%Y3~gNgp%8(?o! zC7c|Au8cfQ`W=hl(F6Cx{I`_|9m5LI=Eha*tk+ zmOiC4nKPPnm1`oCpH{490^L;N0%n#2rYUsB8IEr8z&Ej2c@6w;uiJFCdc|*h^;AV# zS!C8{Wfzqz7w|0-zMoVR))>q&D9#)WZB(PrZKM?Pne8@|&vaFShRD-ucxM? zBLc6&W7_SSA8_yuzIf}|fGk){zzKw07{%ZVF#ZIyX}ihx;{ea=e%M1>6nv)gqf4tx zlO*1HP0U|k@9LB9C$A5t$ZOjLi#8qjbyexfC-!=;mi69ic9#O$ia%^QJ)lVWzcbM2 zjg`p`VxV6aU~;e`24Ba6#xEcWva}ako&kZzj6s-i!xe{}p6WN1D=M|p_n5A(%agn1 zDfG3`>AFRDj0_VbHkNo4WEwOv7$|i>2OZH@wxLrfU?>!@9g@Oo&|n+PB#5>H&V%E< z6VftZOu|%(Booq(NU^_Xn5Yl_uy$c$@w{Ss%~Hck_V&Y} z>t0H#BzaSLjpG8L#>-yB@i!Sa9rG~*FWtEIR$+(X&PhC@(K&V`y!B)No`b3GML2`6 z>-O_7e1(otTgo})G!YXx#>YoR8@h2^>WD9eeu(X5?4%)4Zk|S%|LxD;&a_jV`i8Ua zi6r{zq#QfPT5?m{)CDu+E4)ZfW!_)y02xOT438OsOlqkc8uY2>KK`dR=hFmHs3hGe$1x0-N| zUhoj1Olr=BO11F!n--c(J*o%`9V5c|Y!lPB(_%?{ndizz(PPi8qk@e{SMo|GG3@n#=V;FIt)%i|GU8m$^A z>R9V!=&f7+Ic-&&kZZ6Im1Ft*#q~hWXGJb^&adQhrG;EiIAq|kLHYY7&lbpIm0iL7!nDnr-dK?Et@|x`-(zIwaulnFM?C!YJD5u zubCQ^4L@>tQl8w?=idH*7`w{0D7$D)cL~xZBHay2BPboxLw7fVbcdwU(h}0$-8CQ} z-Cfd1=h?g;&vibWA24&xJkQ>H-Rq9EE4EIpNYWJMUwAj8?4|t&%V7Nskve8%lUi(J zSPeXlS)-zWbK_`B0XBo0xTwyow#iCePFAcGmG8DNmNkp%V$($(U>*MO9v6&PFav@v zl)5>XuImSwRW_N3CC$otQ}cBziRr{g)zz7k7<9Zf7qv~FDh|TxekT+B9IsL;g7{MJ zpyM}aF5V2S)EvKw{k$kZ)nf@}0+PnE-`;waF0^RFb>y2Z1h9F|l3LW5do#OX6Z8(R zR@&?gqh$Opm&&TA6BN=e|G-k}X&uAz3oT34+HoOPv%<#O|7g=eL^*NK+CE)qm+mN{ z?Z?sRMU3Bj2LXOhPQS~lE4R`=vxGraW{>S$-`SgBZoIPLzDnKg^ENqKzJw^?uUyfOT~rt-0IO!H65FodUH+kniVa5$MgAk$Ce;27Wjbb2mucO_CZdi8)j_b6B>+} z#*BsRwqKHK_1a^d8BFjG6UBEIx?h-~M)n@4(M^(umPmV&JpAe9qLt!v`9hZO)@bU5 zMd2g+n!nzwEb%!1#m#I;k$S1lw-zHyL%u*D9%cdF416iHv(_#GBOV^+&l$dYdDo#( zc+JeJ-h&T0rot%xWL8Df3)5N|a7^3&fMr2Skcu#?ozB)F>)x$WjK+QE;CS9zZp*2Q znyptz;93>pI7rPQP3A?dxT8T`T%s^p$3KL>@znR3C;%L_MBGSYnC@RbX8p0y<}_$B zUG2JeF*PV6O?Bk2CZlc&6)zos{aTcesBX(dS;@39t2*c0w(1x9?DZw^$3Fw`N;UP2 zOw-ei(_$FEYaIJ#N;b25+P<5W@#9|mUl9#YiYOP7((-th`AM%iMMI<+zVRN@HMdaw zIxAwY)8OyAHz7|<;qoDYEQdTFQ1vBAi$aTv=e&*RKMtio?z|@!<$Jc~TxARtuGifR zx>S1V#*tje@O(~V>dQD+;YN)_t+~q0)Kj%S(cH(bbA9U4?I?Z9)SvU)5J*t3mLdQ0 zmb0XCX3XZv9a={aK+p`SDQ%`NopLqSXBao_m9aY5pBDbEspniwGp-X=ni8g{midyD zx!KqfQ%W)ijYobRYyLND`A*dv+sb1j1}r^>{;ltCO-NmM&=9l8wW!NVVUv60?(3ga z7>2A4(KC7mdXmw1+3;u9VHkwuKM{Ad#_9~W2xfbhnJlcabwf+9T zYU)s%+2S>c%gvwgQe|NX)b}$+Z?P~kTFJTm=$wj`N-BiQR1RhrbPh$7IsK6C_}%l! zz!^>|m~@xk%G^pfy37k40BAT_BJ-F_?0PPpduQ!V zh`;?-EH+)>miqCZW+S>?c$XZB-BXVljo6VX&A{#6R-zuRuSn?hR9EZ3^~%o8+WKUh0W}; zY=6Ca=ayhWw<9VNsBG*q{T2Nb)}V%<+~;R-r*}1Ue>~U8XXdNs&f+C==ucH^WhE9t z)V}P4q=De95la=ziesa~K{;LH>E(CUI}Ml2qek{OR2pMrC4JLelCw@lqLafOVy@Iq zj3f@V>9i(u-P0P9r^>~&2}pUh^3%t=v_n=2v>VVbgn?K-7yp=CSB_5!K@Z6cSEcWj^${$%w-Rf$`hLiS-{PyC=!$?DRm zsvmV;08M-3BbV@0iD23C%iaDkPIkY0zrq*GsG zh{deHNJ9X)o5Dz_H>TGSJC$V=+pfU+4JG= z4P!wT@BZ=4N&H{C2{u%XTnlkM)4*OPMe|bnY>|&dZCKgxA1q}pUpPyey)(kC2!R&V z9S+Vr>3mu^6}KhNGy&+LXk;|G_HwDx&60hYNVJ=RhHwC8{wH;yu&h|+ESp;98e@S~ zjQ~+S@AA|ijY-{r58W%dLe)cuEZxp0GQ{90<@ci6{5Z(y8Ge%<*90ZZiUWQT%w1nH zaajKrQ)&K@b8kNcVn z9-^aB_GV4ZC6mg@SfSrUCg`v^!)4@m;}%*6g8GqhU)1g&v_5|QO3I9e#4(OQ zy7R0Pf5Z^Z13{+v>6#4Hb6A5MWf*tCP+v~&TvOM;8Qa%JL3yVBIa>I(6tlmvhvw-J zUZQ=Es&_FF63@D*O`KskjTzsu-d~&eMv%#iHi=~#kG?XlkYak#BFz+H|4WFF0d(;N z1=hSN9M%j2`(bacqn&%NH;fpnhW>&c*D*AynO>!)^-j5KmJ2oaUwTh!6l*Sdqx7wI;+jw^FB=W(_nwM#$C+uM`qXhKsdAMHMeX#R!33DF#1Gnk(;g0D7 z*~YrH33l%*n=fUo~^1cszpmC8qrkf=^Fy&&DRt@9i?OQvzGFne5yZ4(?? zKF3`Y;MR-Zsp@Tuu%&!59i3_7%IJzQ{nsx#zmNcBZ{pM|YcZ>mg1!bjpi*o(%u366 zIn5)FL@@~m(!80u=Cxpoo?>P{UjrldV(BnlR zN*Fuqd4f}|^U+L;94xXQHudU^%7xQEo5X^LZp|j$I^0P+&cvoquIF<9tg1M&{E2X> z=7(A(@TcqBepatFsGBf|>!C-hsJ)w9K44~psW}@1XZC8xmeZzcvi_R*Fgjv(1cIl4 zGYu|ev>bE9YLcXcz~p`o;)O*h6h6aSSaBiuqKf(DPu>su`3PgJq0w(1Fww6Ue&)2( z02sx>1e-#E9QEMQgacug!*zZ+0{0nc`b+Ouc41(e;A7Vm*?KgPU*<< z98?eewSlyXzZdTeN!}8#8ZPnbl!vR#hE(;5OQS%z0%>^Ur)8xy(O@t$`rS)*kI-rO z^$Xq&pvM%}+}HG#iw+yNH*zHQ@vuehd2W9#A~igUs?0hLhkgw69Y5N#VBWA40s{ zr4QeY)Xh{7h-!=;JD3UB*XF%tYW>isMp(nFG%?^S2Z0>?)K6E4Y4TeNdW4fMHvJ+p zAZow#L9_U!Ta-T4c0gX8!)6E7_Sn0BOQDI?MlA+;TU>@jNT9~ORQp#gIUT`Nt>gEM zj_q`Q4L%IFK$>>8pCBLQ|joru3k_(h~IcPU9NoSKDL zsuEdhxQUB|LX~E@QkO}hmIyO1+siJ8Vg9nMs*wM6*QB`L< z`}o}C$vfm3XeMf4kLj1~m+`c{wnp!MU9<3;z}Tjoy$A8G2I?PfdPrF^nu)krrw-=5 zUsU^HUfSDz7gv+uiZ;{u>1zX{u&rKSh?%IMo*11Jg7*r;9BbYw57+F%y$k zS|%Ek)SRMrSHBFQch)grFAe~-bZ-4~Ve764n!Gn%oX+)=^q3ctd3;>*+?PJbHsZA5 zDa-39qe)YF3T!N-Y+~!>uj+a8<-6Dqwg2XW(2S8}Tz4iPm~_ruEYZ+T=D)lhS{By3 zjFCm{X#1f@^0$r?z%-Q?CI9-eubD8r!l7TPd_WQsE1bX|7g=3ulVXR z^y_vvr!=}P%!we4wG}(aB0{FjknT`*(|<61aw-$8kItj+%+$`=LiA4jF1oE(T@G)0b|T z^^hWOdKi5!v?6P`=5CqU`mTMBa^-xdRc@>Gsw1OzSNiTJho7BzS1D50Q+Dtj6z5b^X_? zl($Z0oEflo*J&+fIw+Go6IB7noq!8W`>kQHKli%0JbTt4AgJ{hkMnV1-f;Y>?e;QP z1f2!)viZhA46CPYEBWWz;;8d#`RdXVRF?Mz4}FebPrWgWg+GY@s6+6DQL-~TaF$HR z{ZP#)_cy05Va=_)Oxm_`xhQr+K?%+*!ZI!lDPz$r28N07N?Km_TjbYd(jjm<}A*T zH>$%en6@t4Htt?!-ib0LPJC zr;U|_VJ`&Kicl`55`qsJ*0n8V+PZ`lmPxOmRV_Se@|g>hfKdXfYCvn2eoGCCp@O{WSb7UJ6&juk7)OjAT9-oMoWd9s~J8HYLdv=q6td^LUmtekJ3NWRd!qamklfqk+)Tmp! zRjNSvIomMDrdB;}lANzcN6j7cdbm+4>Pws8V;(jfhB@5+;Ibmv&SE((8>4og^ie$~ zC`XI1C1f{s)>uQgoyZ96xcIimH+??4*bC-M1*t!^~ z%Z3c6g_!Y7KgET*hB`OkZSnc;{8$|QHs^bpWW+wYC@uRWoC?+Z>KbcCv}W+hLcP8b zFZ5J)H7RIq#ccoD`a{fk;{5kdc5O^#>_=E;jadUK-tVDHcLYs_h!msPqVoNdB*)Q+ zzPKL&V*~aazvgn+t?|KJDGMHF(cjcBT#wi~yqIHwCBr4A!}smQ23n3ECQ}w>g2i>Q z!`FuGU;rf>I&{lxLPc)TA_e`~8M1y3oDeN(0Fn-E*3Qe&J8<8}qZN}PviXHy1M+@$ zaWN8)PT^UIU*rX$9I!PufJ2t|Fb9NhK;j(C+?+l>K)BU1zL1%q{A^RfN1(rgzRYs5 zF|1oVCzCh6J`t#;>B){RQ|ldAP(8F?0encH;%xv8$o@WTEFrTMHp?-|($JOK-YlO( zwz-~Lba7rG3CilB;yJ_lr@ek-8qZ)XG_e-<-M+DHqNR^1d|f7!lvLqXxbdM{ zs#4*!gIHWEpuuyuG@OeUW;Z}JJZLxZ?nQSlk$o>wLxK!_La9i}50d`=-Z|(zzISpaMz)V$gZ7j~-8*UM-!hB` zlSGlv-5mv$TE;UfQkmq#b?(hlP;o{>0PQ(sfXrnfUNv%uB-fwu+~R@t9y+c0u$Oyt z+bj}0evu9seq)9bvRj7a=%r=j0L*&v|%pyjmclrlHhKD`?; z$3&urHHBGodE48-&aLsKLw$N$1=)qr?6$HUjceo0KPJ-QWhBjG8u}7DaYI+UvT*dO zd5VX98|$-x*I$*>w6BVF*%gxZuj6kXPO4ZUJ*W3)_fHM?!XUwq3@G3r-=7zzFw3&OT0)64U(wP(@t+3r5M zaecxciYF2I9lLrU>HpxofWeFQuw26oMK94*zvdE1Q#QQ(5|!Eihu4$X>|<%`VVzI@ zArD3AY?rxlR8A*lOz@1_FV&o%3gLEC!uiz}7jee|X3 z6Q+5y3z|@ON=+=tAM6_b5cQXp0q;v_aIhF-!q42Gb_H9I)dcgfnT0RGgorNSM|%$9 ztpNi?rTYqvY@%qkl7laBo7vhmmkQdT!9X@{06UO9ZBcn)^P;AtOtZWVB1(_0x-=Ha z_gSZB^jF!>!K{UP<;}O+l3!_;)lBmfSm}+ybPkVgtl{V~-IB~;tLS9vh@eZFmo3Tr ziFGcVggFVF!qKG_9Rao0Mt-M6qCz3#-ffpy6!oUe8DJEKu&nLybyv4e-3Lok-h#1i zn?W)ybYYB@Orv0au`oM~^qU>m^Z5>mNL4F{ru(h_1ezm#4xAR8ah5Hr-skjsui?sN z#Kpf#W&*tFIIL6g%Gwdk->loMYM3u|=xa&tiK}@8vnz z3A0M;0<0ke2OG~+ccfSI#YIOaL*vwbatY-=csG{VcfUc!r<~X5LKkGb_Lu%4dFn{xuVM@+uPL zFCHdw{Up&6mqJwScev;C^4-0ay7l1@>;6|Lq`jd;qv#ZfEazX(KR5+lY~XZcjw~jY z`-YE85}`Y?7L*)zpYRoDVkBw|9^AeGIl&V+`PE|9^{)Fee~gybjXQozKxNAoRZ^+($~ky}9We9j$|x|4>B(PegeT$fbe5 z*glF+KfHX^oC79pBOkSw#s90Kc_NBm;&;d+1OFUC#y6Y$$6)L8KVz0(ml5J}S!DVY zzs0~g6hd3``9__u=zt=I+C@*~8zdNz)POfv*8BC|$23O*YPh#Yx1gH5XNSA*H#JsL zY0aDNGbbQ%m=0?rs}Yk!EV_}%G^O3lM!-yip;hsbOPe#sR7-V|FO^)yfD=90)rNr| z0>_hmHR7>q;0q}kWG?>DD(3y(*?Qp7alB2gxl}egeW+NTOS2D!aeFws(3T|GoY@5{62i-_9-2gIy9Ko5*NVi znhmC`yDd5*+l$C1vG#&%!QNKw@q#{=0=LhIZ?<+x;>GG=IA!$KXbVs)1XN(QJZ~$9bP-ZVxuQUN)rBW&; z9feEPmSHwiHU%x8B)4GI)N(3h={e}Dm^PgyFd`d0oI~^_e%s#j{HBDE)d~LGkMul@~qEl;a z`2~Bw$*|sI80&0jxh2`38ke0$y;>k5#+|2?M1#Z5e7;-*Z>z|beK6XB4C zorDXWwu_WGEF6=jgn^ZwWuZznsTk5;&5W%=SmmLQq}NthzG}PO^aHk|p2nGIduHC% zu0`;Zha)CZAM)CU2p4bxbWs~OQ+K{Xxd$Gpq=Ym+#utI>fe0DWY1FYYIlaMMBF~$7pD_*)^e!U?I2K?_BBr-NNNMl3x7v{Gs+yEB8L7dtlz_* zS2^k`c=*T5dH-Z!nX4L1vs3DcCg|$L%+vCGeJO7is!qh!=2u~As}C`f?WVv^kb*u; zmnQVS@Q6^{oUdO@bBrw%@iI%8kvL+gwY+)T?Kl~&6Zyk4D4(2mQs6Dd7I3ya7>_(r zNH4g4m42lgTnhgSJm-&C_J^#em+|X$RF27fjHole-fO$RVIPvKx6F|-{;U#|*ER7- z&=h@Pd=4xZ1ts>|eIWo0ZNx<6=@8Z#CY@6f$_7I%W*sBJSlxpv`Sx6VqwZ6$d!N2D zl1y@;y5EN4bJ&T!;|FN*le4^d6B#pBUW%Sg^-S(GhH{yo=y#_P4Y!+Y4(}puv~s2# zlEB7td^7PF!2tO^BVNAe;#1pe&^<3Xn76LIsqt3bqgOfPIBCuPw~j^?N4G)Q$8n2F zmpCB|u80u()LJ{4?9nZiN`5>JRjX17Yr=>x^iDMj1$nf|q&vgyF?-~|Sft4;A@Llk z;WL81K|g9k>ijvJwLiQd`?W_&AK}jZHSJi?cK~` zy}~|4x^kz57&8qcMGsWa`qDYn4x^Qs8IE$CbR;-2-yI5SpdSMEN_f!?F_d%2kyDYd zB5k->O1tf5wf9>fE3|6XU64|rY$!w~M=~9SsZP^d!QXA$%McUT?RxG!%TWZyEhxzq zcOQ84RG=i4N$)2~M#5?d*wG4YRp#O=UwAwK23d!(OrkVJ+cFXEA^^<58Yr!5kg7}$ z(#tUvwcD>i?#?4|#hWatHl6if(+vyIV4GHMZV@R*>(V3o(G0v$ zv!odA-)RduTxI14GC*miuER=0x?VD+Pp`B=H zc;dA`O(QU`-Fy7VWFcL72Pc6S@QvticQK#)!m8%-!)plK*xB1WgF!@?0*;}VlRSml z(^jWbYh-$37W-mKdE-VqUzUP0y; zMN(j;QRmcPiI73N!4bx9ZTK^qC}`eNvvVbp=^#R~jxfe<|KJaLFj`Bckgmg$LH0i= z_*7_<--v*bp*sRo7xx&jXQ;Qo16~ud5#ALnXUB>>=la>&y^=LEEp(ge&^4;jZzb7{ zJKV!C8Q^FKEe7v>oV}~AwTARPsZagHS+V0}*VUziRAX<)Z}tK8xrTt~O7NWx7Wo5$ z==-fGtY>wf1pt}#Lh+rI`Hl9jM*=%WE-uoe(?m)=CpN*Moz!cNNo3p*F&Eh^ z^~FD?$r^JVrbAf7=>^Drh~i!B4YnW2C@2;J32U%;w5$1fKN6B@zjfTp{7^1kDh6;d zYr^EZyB&U;@b|!W&LLY0pfanN>K!DxFL z?Q<@ltVN-uov-bH$u7f`cCl`4^Y0`Sq~>W&v{;OY=7^z1?RmHb8(r#@D{`0BuK^ri zVz;D?{q`D6oad`Uo^PVC@d2fp6Z&_gEHm}fxZi=34_|HLk5pe%{tPN!zLu;y>BAEr z@=`8on~6eNf0xgfCNOtW$g2ejf!cm87aPZvq$q5K2tw2ka!pDB-YzNP-gUd+=!Jzz zRnXa5D%Y2TG1Joeepo0ibh^CEbduzmWnW_{-`t}_sdt08A^sa!VeLz1d)Kvfn9F(_ z^zwPugO*E;0v+uEti885Cy4|SXLt&{Yl^IQR<^43H;uV4-JJ+W00JXu&)>(3x;0gr zMKws)UN9rtifgfV`=1l%xi-{!(oY}Ec<1|YGTinhW3{lBe=?d0#*IA2k4}Cyp=Q!h zH#^~g9@K;~VtPJ|C~V{k%U8$^j>{1BAdJ{kYbEZYjwD17;IEH4bxkzM#8QHl0IzB~N=fC!%%4L}55T zzr;J!q?wKMrKI7ba*d$&DVqG(aGRQ(rP#R`)cnvojofyF2NvKx%~db#1D?~k1+X$s zF4le1)!>kONJyImKmCLsW0@s=2MJJQfv#JrQ8VsC;75fBWgJ>e1G<0z>rM95eQi&f za4`ZLP+bE@h9{Tbf6mE~zf)xBX6a0VC}XFDPQFPNbgm`2Nx)3zef5JdEoqWFyGaa@ z_s{6To!zXNPQXG6p66a3b0@17SZ|rKU5RMLTVtld z?qRewKDx4GxtA?K6RrxEFBNAHaxNf<9&s}rcaA_B)?8C(0I`F53S=k+gt0O7Hd_3bbFgzW^LxAo@_k_CF7l6a2z9?$-w)=}fIy9RIZenZVa<|ejPDv>4>!>E9W=E?W6_NX zDO|NynFl}HF`lIrNIey_&OY136Gbt|cqFls0}E!v6}CRu)<1*YS$>SN-OEJf{Wav+ zlj+)Bkux+X5p+OMpLa1rdo)U5OW5I9sFRwq zLA8-C_h$|lUCtQKib+nF#&v82Gh*cF%AAg+tFOCgm{#WVpl0TYQ){Wz0tGLUbs?4~bKC0Nv-nmIUm7tWf6(0N zG`r(+*JOmY&4NgO2ehcnza7X(MP=@y5-T0o#++8zR6lKt$b3o&E>?@WK6Bs&4~OwO zIqfS_XcHkQ#+An^44R3x#j)2bS_!~ph;>TXWNo^?F8~gMa;%+M)%w_ldh$c|Bv@{~ z#BmiE`pdue(JzndF6V9c8mTUGfZwNby48velB6G}HTWGYh4}+Us%chZ>n*xR=3O1v1`7rF&YFrKwhB) z99SI890=enY|;7|HF7@#Bn{WR&~We9IAGc8|3PyATPVjPNSk@F)Qz*8WTHHL?UBWh zDDJ2YymVl|Gn84OU%rHCq+?4>QdS=|ZH~9{sVFhjVuiO9jHvjjhspwd%{vQW#~HKG z0`Ge>qjaXy@@DE8fl3>;HGn!1QC^v?75HbK*6UG&7v`1son(uTtnc!1$&f*C#Nt;E zdRxJ4LI#q?xouP`;YH1f=1@0@OnTq6-{pN@0?XW-5vwspikWC!iN56)Pu%qPsw@i9 zPrsQQuVSuC`y;Q@^hJreh~!7Mg=+SPh7(S!Da;Xf-(!4?Fw7oXiS>rVJRbR3-$smX zJPDljonGB6&^d)B+LF7?ns7JfW@}-xVWSGZ!QE7yOnty427#65S%zy!h(BG4J?>r) zyq1iUApDsKAmTHEEJPLKt^Xh*>;Zg+$8HFkD6bFQ3&o-MNAiSNJ+R3oEk?5}cKe%T zLM+7)smc!xl)x(?Q8>MtC{_tZ?3km!yk66!@M_6*Kka*&I;u5Y70deF{m|w4s5Wx5 z1%5zw@UAXoYP(?f|+fUq+y#VA|~)BC`V0cWdJ?d$iWMT zQ)b^`AX>bOFv9xujBQ7*Zidf#Y>b&qbW?-(RnH9iFKx4Tq{1sz#19n*_5T85tW_;f z+FLc)xjBetE>Hp&KLvPjZR7%TxBJG23u2&HBLFybnVYIlr(STUqquS*spY9LrVZ-Q=}Qr`Dj z;H(ZVGTPZ#WyR1Dz7*sbclr4pn0wXUxoVAVG^(}0I4rG^sqz)YChCu%7esIER@>x* zVsYJ`o)k;89f&ODR{y1uPgEmUJ5zw-I}V0#BVF{4YPNaq!+zC5^>8{1FU5?v57-V= zQ+W+v)r(pfC(W zi8a=MO2!^Ta3JjJh^hprhMWxO zK58x0_zM7FaL_7xTg#;7PNpqjLc}19xJgmnD6^25mSH@UXX~|wOvu-vNBIkVgM{0f zM*wUJh9}QCk%b)c)a{F-E-!cnGoj~Ns6LY(@@9p{?Iw-ZdYP`1?MSVQG83pD_oHNR z9=!fCKK}cs<>mb*ly9-a!Qly*$>K^f+wQKrbA34jj?^cKLZmufS#2o~_FXJ8#s zTfa7;w)3fuf7jpMbRgiD>f}yW0qPF}z;m);`k5&lo`0Ha>pRSB4*VZJZYB44FK^AE(LShb7rn26<#^3c>&e`CQf61HIg;8A9;twsuNUYlkw>3z9*(|UIe1QiOAsaVD^f)fWqwKZZ z@3dnKiFy!*8c#iAqW1mUs~LfJ>E)z00cy6eg{q}Ho#{rU&W7g)hdI6@o*IPe3>8$p zmP)pysefm&t6+hgYDfvx5##68z0WgroRVW{N&D*IRUF^XTo( zcK z-pdlWHsLlibP|Gq&k_(Il`|H*eZqko-M;mD9W{^24V5%_^s2;uo^5c5Z0y1sSsh@> z2)aqwU%P9GxXy6z(e{PU(LDBM+W-q#qX9d{EDL^$26s``c-3NZZ$xh`eN7DprKI0s z04IQ7lrNCkz$*;Ro##$GY#+QU$8)B&_}hHK+Z2HX17O;o%Cr1jY0 zy^;PLyLKmEKGI;&o=+cc%pWzK>gL3Cv$wf547L%-f82h6w2Py|*tHk{+f^J!x{~Pn z%GvD(24^(h-Ft(h0fcHTF;L0Gy;_;0$xCfjoVVPVr=-Z<;NwS0D!6AQ=nK`=d>sg+x^9Jr-ntuwj zRP2ThxvIjD}V^>L{t+F`Sc8`L~SAQn$x3^}r61U84%5@fZhbd4Is&oDHW^*x`@YaC0qzw;IL zNP_`zPBu0Z_hnUiTmj zI<5>L^dNjO_BwV5x*2pB4YO-7e-B5vxUZOdF=E9`k{MYk)GZ$nv4^w~bDq-9A9%0_ z1_z%u!VG*AID4x>lLyC2 zj1}^c-u(sEtP*ug$HbkiYlHLf%N^Fm+xLhktbOYNt&Ugh6US3~#b|N(M!1n7)CcW4 zAvtpii*gPyn!bXgHdoH+DpC4>TvCRfu|JdoOCF`q*Z#=>r22w<1cnim;sXN$1^v=KNZvZEU)NV*?(JcsO*PO{ja_xj*V+uKQZ>xsc$-<1R-O}@PLxBJm;O#%rZHOE=-U( z$VGbu6t8=D<{Q8jyG5{pJ$?~ zg>2&S&n~{N|DJSbCRzzxpfx12&`L}?1zWVLfuv{rKn5@?Cw)>#?w-%?0S9r;5SI<# zL={xy&zC2w*ROOY&QkdSCIODD2G-RScw?N+!*H`G0y-y1^Nv;`$hDvY?!~a`sLswk z{HPI_iCB$IS)KDt=cZNo;m((!q>qC;Q>`sJDxsjQn`LDe`)CmmV;Cg?z<6=fKtb*& zP)6Ro<9*G5z;})(Oba90lyFfyaaP2#jMZ`AzGIW~HnZGTp6{KsoIN1keMCNm0W5Hz zp!^#W(G2kC)4~_jrx{MekK0rn4CB3U01QO0%21H7M1222dnClE@u#;TjllP*%!9z$ z9&okaj#zZl#q;o)U7?MCuTed%yokAc=)2j8CaPWYcfmtG;Mb4j0?8FM-V(IcuzinY zR>>K44zXo|85bl!82iUV045xtMA*xC!btwGgk6z;t9QYZB|-v7-~U7Z#j0@3W2HaQ z1lO<$Ttsqkv)t>$$Z z<(el-zqsgNg9Z!Djv03GkM^Q`$R{3gYs zdHT!kh`Tb|!w}vh^-148;IM9>=D`A=yXg5{#q2iBp$?Le-^CKADy%aM{dN;)toeVB z=@gQ}X!27LUq#6wWRX^#Oi1fu$~wcY0zS04xkv7h!Ao>9MIukmL_OJLdFNX`VpObt6_B=?wqw@ z?H9&^3>LWpGFi&3EJA>o`K1&WlqDdjBWv;#oFy!p# zIux*V*Z&$3F#PEF=~^h@?f7}aknHwq2$E$p3*?#Sx(b5hog9Or)<`ENb_s+0>Ka0! zjqiX*RLaYgqQMzl^zjD6hrf@KZ7o^^=Nr`3P}Js?eaMz$;CCVq$IdP;PfTf=j@^v4 z>j{g#ysdurWD!PGz`JbxXn1w-Rv%<=Z7Jz2<=b~fm*2!!3PA$N!64qmk%Q2AT70h- zL3d&)XXxYJUi0jSH^HkLiPEox_41J~A3^04U`HZhvHm`F8vBvmTNLAam)H0^6?dtV zS-rK77#EVjb;Sl@G$eBW!XAcs+4qm{92Vy2joEc=%Iv#<)I*Q{SbjZ1Ynxa;BbE|~ zP59y`t3UWc*@_5kWAyBQIS&Z&{5&!G?o*79y80zvcODp?>Y%33(Oz(;I2g^Awgd4L zS6lc4HfnczR-ji4xCTTJ*z*i5#MxgDM;7Y5&0*ss)f+vzsVO<~W?!t=YgNH43=(U| z9DcL<5$kG$)@@6j`&FJPuX}ikt6nHwh{JKX59jZ}7ArtpWHe=DS{B(^^!59iImNl3 z!`j+O!h_li475bvIq)UF&!$tkT1WxY1$xM+s>G~Q@Gfb!goU!F0>QFU(kyL$g3pO- z7!5KclG`I3EFBjF_pua_s)8?g?;zqKkEFHrLYfNYUmO(=)$E(unW~Pn71oow2lv2m6vu>c@jZF^KplMCuYn5$#|1{-S<-(WXbk@i7B_q`zz{@eqYRO4 z65_0T2N(l(MuFjcPRvRq*y^zcX)tbekcsYJkvpA&rEFn}*y*dFF+84W8l@@9L2o}g&Cn9`c={ztN*Fjqu7qX(bvU6LBU>*IY~-E@ZFYE2=4(Z!1Gbi@5J~GGVUkF zvee6`ix>GHM+2Ni1z)!^)2sz%T762jj)P0!0Ga@sik8OZrIF8vuMe=p*Tn3J~fz;Y& z12627xy*2vK&^?>PT`i7tkCxXa}pbljkyF5#&8fuwD?sU|1O(w(ry)%+lx$C-R)+# zToEEEzWp}2SJ1-gih#M^k}8ilX?72BJVzMahar&hh`aif35#)d+O=PQ-d~1Jvv}nQ zSQ@~a!*qk&)$@HCGSxgL!VPVNiGa#7WV=jd7JGV{1;a5xw}^RiAslu0zzv{aLXsM&42QSt~bVvAsl z@q-+uVR(M+D@@=bcc)YIoGGiLWt~NS%J}nE40Iydv#EMt8w@B@Ih&1=Mc$%%g7NvX z53o%(!J1pVDkYPOY4dDofQqzp#S*Pos1b%aFyxL%H6$vlQ3xw1^a#2$4Cr8XZUwYn z_pR}lWPy(}@Mw$m=pVG86EAOxauunG+#>x|7TXoVx;Wc6Mg!Wfs7+ysZWj zqFTdh3rDur;|j%ygm*R4@ox%~3E{9q@GiT8{+7DtUJk`vM4$DK1R6CkEuXe_aWtgf zFvoLLCVh93ylm<5cNA;cx)~-WqwFDdo|}F(Ph##RBh>XU1_Tt~ZK&)uNK>~!9|f{l`xva0=Fot`oKEKQ0Z9$!ChGWp1#kGVAdqo)e@VpIQ073ycrarMTn% zP9?K_Y%aoO8vMTr=t~I92}y*1wpX0T?$Xi`_pOT)c2hTp8rhUPcztF^Z_T-vrxhlS zaLy7Hu8fB3Q0P)gRNSo_A2b9TE07ldsb9FP-rIQPTrf9Mx>Cz}9+$Ghfa9kpO0*d& zAuPqWmtPITsSFH!VQs^MUU+-`tR`;PIDCP$m> zQK^HiVzVY?4BwiI8v%{nYcjQk`oUK;dJ@5a;wopB=J}E4BgVhp8}SL(GL}-|9Ktm= z2_R>ehgIoS#LzW`-mC>Bs4#{UAG}8x;ILQyzWVSc(yr=z8xAiFnDsBEl1%9#b?w+K zRdz@*R9dsXpb|FcK>xM0y>RxGuG<+P@YqXzxq&tJ8SBJFoJyNj<@(u0o?-W&jlKJm z3GG|{M$)e)xJ$k_il}Go8EkCt0l4VKgGv?Zig4@h zRC@yM&G=v^DU`2|7bU`)X!MlFxoDgJ`ByA4yfHf|gZ1d{YObz?NqL5l5eG(bE==7X(y51E~ZYV1NM#x*Z%F zkva8oW{UrqJRNW)4qo`Pg9w-jC61{47eApj{(3pOGKLI#s0p`_*%-JE)()M|O1lV* zFNjFYYzfql=|uoT4%`q?)nXCPF6jZt9Sz)#RZu& z3~+cR&ceHNhWpeN`3x@yEx%CWE*N8(L0TPZ^s{X14L3mNws>Ux~rD83mY zmf=%(a}GO>a&p;$gN~OT2@YSd%*5p5NRqx|f}DP5Bv~;Wt0RIhf7Uw1GBl#vXx< zGYrw@hULVtj*w^cNFTD3hS%}omIYsH5bOb2>8r1G2pQpq!UGIDih_;V`Y)eH+<+f5 z-HS9_9&1#N;+rz%;gRTq{cr2y{k^&N*O9m!@Xya9P**v_fOsMaLZ0zfEJ+vNWr!9t zNOm0V4tm)!C`f1EK}r!gyIj6T6qf~{9W)ez9opi1M_g`eeL^i4eS-IUeeU|M z&RiwPM>5*N-)O2%@F_@mtwjxX*b*w%w*bALX*17lw}=ycgJJ9(yG=EYUlomA>0MDR zglvJGGqd?x`X{fW3yObZfAF=3_Pt$ALhVI0CVC2dY38@aBT2wI5-5D^16rH=3L->? z+!Z0j&^^!QAe~qQ;PdssR=^~Sg2K1>jU>iX>J2|nH!`22ZW54D6`R%k^oExD8B&2Y&Kqy&L&Jk_L^{ z{F0ub&Ly%-fY4c{D=F&yX20$cJ%T>uNc8+ zGM6;4GJEZoas~Tc*<$OWxjOXA zvtEox#MNk%b;p&bhqi%n{rVC4=1vn0o_JSpx>ladd*R6kZR;H1g#;RixfWMvH6?a= zpu`u$va>RRWdGXTgNI~yI?0=ol^|PwZGyk&+5a+JC2zif-OzW31$Kbe8zi_!bA-5* zi{b=?7fK)G(DW(79fzk6HT@Uvu#$bBsSF)*PK>_jSBG>IKr#^A*`|?>=rTH$GQTGW0%NE|eoK$p z*vq26v`N?bTla)uG}El8*+xbK*1I&Nmsr?Ce}nz6D4{yOfAQ`E$B*+n==_xha#Uqp zq^OZ)LgY4M3)2E{h9|-*ab?QSpNrii z_~NJ1`-&UtZODx-a_|K|Srkp*4YQ<39OW%8UXFUK7%BA3OAMiHiJKB(J@!@U!du#V zLeDDl&$DG(vnm!!FbdsbwE$}}GG2{OJ&n6RH05v=1zOj_K&T>H&~rf{iQS#(M0rc6^J-ASar zGo5NIZEIWh*-yTJ{`MY8kC-{k=fT7h`krMNvN2C#`5hYx3w^?4sN5u&#F*y{#Eaa< z*0vb*4&fhPC`LND{q_lCFA?@jJH8VeDq@>w6Od*e5!eWJi0g00|FTJ$_UZPvcxQ?B z)5RxdSY`HeCcaf#{KM#}0yDkanLW*&&K+S~j!K$+-{MO$2V7Sdf~G{fUxJ`mL+mCf z*&)yt`A$j_+v|5S(8`hEnMH_1#6KSrdKe?3p^Rw^wM1zoD%RCmyQ!U*Q3%z`O`y9E zI|OgZf*zlS64jgOTEzSW&x@e1uyKoW zj;7*oZ$qm{j+)k&I7jVhZd#t z{t}V6)7T-l-b~ZSPuI`7w0gI(H6Y@dE4JoG8j7Y5)}JcfHqT+g7-%Zf-_OJ}jC1L8 z44!J$aCGa@+WEF9T3ZGL{U+nciyY!l!8%RZM_k;ENiP*sU;9j#pG~(Xa%YG{(o82P zo2hR$@NK$E!f|j`%#Lp9_^35o=Kh4x+P$MG19O}0K2y!kAeInO>EH)f`Q*n1ScC&4 z7_cZRmZhS!rT3aa2~TdaRzLLp=24W}4fA=%naw-+Lykg2&)7NVw(U!c7%!MOZaUUK z^v$QY^tV=Kn?KxYa(b?0V|JG2K_5SLo4&PDW`26|b^ncdT8? zB(%v|r%X!_*0kB>!px3d6tJM^gN;;RiQ;Yw6I(eCZ7vXPP#A|?izbvg&u2PnN`}W& zTwGS`R&H=FWi8qcq46(k+52PD+Y@bda72%4EKn(h9=);Qc{{p(6S{{Y=KAUZ!uIAj zP+(|_ujwk?-ixx|22F%e8*7Opt$4PQ^`t3AIT zqv==4tP{M&{pPWmb66UB`99&qiE*3|s9IyhwExR8DAE)!-&8g+zY+y$?ckJzz|?dE z63eS;#c7CO2DxH+4vtZ_N#bWN4iVMt7I%Mq^{BEH5 z-qv0kQ>w`$)#5Kn&-XF+;1{bio6Zt_m}zmF*1dcYSZx+Ib-0> zECVhvhPttkl%?2`YFJgEMHO0nD7w!FWlnDcS`iL<8RpRq-gnxA!deO0*;5}-LOLoh zlq#tE{O|Gl&r5Fo?8uTW!;yGy&%9#Fcmt|~kk$d@ECZhT!bU}MaCC$L`Z044@adkZ z85wiF`&`__y0xB^Vw_vjadDP~$yJ8(5)BdWGzXMB|5&{r23D51gTHQ> zNk25wC@nwb)35Q6I-YzpEzUyzL{WcZ_*-Ai`6fxHFb8E8#gwq(%uqaD5#vwn4jImU z8fY~?t1Oy-WQb!aK^ZxoTKdPvx&;b1U+??*fZ>pec8X`9R5O^1MxE2b!@^gVU zh``v!b00?=Po)**pvnnXRwzH{(cd5L4mQ<}uB1CkP372Bl2$gIk3HSs55Xdyexa!F z0;$u7>^f?RDj}AKczagI_gd2zcYkPi^PT2mCe7aPV@wV(;Wkwjoh{w@eGd;J4Ftzy zHl3bu=w(KTCr1bPHze zZFf>h+>A!GGW(zcxn8hL+W45`(hJ&R0?;AUHs2SOAq9i8{WQ$tmNDN4vEF8^7qsH! zc3BY;JMBiwKt{)9k6673y;H#bO`(VOY7xxl#cKBjJ*nfSu*# zD`ZHAfROy#2HTT(?w)nNZ*2lo8<=4?D)%f;)K&X_*FjY{Uq?R~i{d5s7_LWc_KkUp zgqru8@THYsW23G^-NHQ1lFef-=LT7K7H)oiqUl1~sc!b4y{|@$iBwn`%Ka+30uJAt zef^Nbu3emB*KH<b9vvJRI@S^;vO}MEeXaSK_jpN_ zxsi7`x@Z41$X-^PL?Wr{&*aQZICvU+v%2m0vE-I7B@jRtKEE#AboDx3i2+@!hb1Zj z>;UMn;_A}2HuBX~Vg^N5*Cgmza7(61dic{%l<_ZwQBs~yt_LKU!g?AFcpeAIchc{Z zXl(SNwG%e9I~A@Rs)&PW!i`3hz;JI-a=G(1ttbV>KJZaP`@$kU->goR!rrvCx9`(R z6tH?vu5HVIX1#2$4Md5B4l$!n+Jx)su!nFcAvx~Fv#8ZmKBdUobUYdxV~2z_<~#3p zEV#?9#^Y`@D!~$|q(?0kvXIswDHNG`UM$!Ccg%UBg2+rF5&z!P7nT~iZbCE9|8ISox zO4SP@zn>_&RJZHW2nrIjv$Mx`f$pX;tl|*3E23MebI;1AEqLb5LxO_CkXT!uPx7!| z5nv=*BGs;MBF2Lyf)i!%#Hg0cv&G3tt&9Ae6~*sZbJ1PAaZX3*tt+qDOV=?AogzY1 ziln9KpEVsN{07Hw&ta&$Y9m8BX&fq0^8^uG^WiEC4i)C6qSggUUSlSGcNT0@bAg|y ze;IZx8+g4SOgKRw@+1d$4U_Yj3x!6JKSe4Ax#ozlPni2#j0AZ=^g`T)6P7q2>bvPwR_j-O4Dk=nwcF zxqiaI_t!-!*LZ?llF6nWM;e>r#DJg>iZ&$Qgr-}8gPYdl^4O}wU73Qk?y@)q)7j!^ z_uKR^bsg;lEk|Vq*Lf~3RSj3>E*1*U9v`^o_+aiP?@VbXQZW~I_u0?Ii3gPoeKZ-} z+I-t{&ysLNDzX+j94IuG#*9@h8)|Ybbw-c5yF$1<9)092VE1&XhiD;TcpRV0ITa}- z&I!byRsio4k!sd+HYRVB(R9w6zy?ysUfb9E%64rFDu`ePIr#kz){HTpt0rx!#ZlNE z9)0u7l{XG1A-m8 zCKdz^4HZHsGjZ3?)>zV5YYPnWxI?TZ@i@If`uY2|XxkUWU2A)g&mV+L91-xEJQK-y z5uEYd6KSu=5D3;zU*XKUQ8V7IU%=19vpy!f9R0`ABe3h`Q!#z{whp~bb?${R{1M_4C@%I~w?qQVQiWCX!U7<5KcD zto9pEZ%KVPt~CNiW^nQ%Wg|^kcid|mo16O_8b4nA5v4al5QXB}@nuJMAAuI*Zl6;f zKN)f88SNoR)y&J*l%kfOk;SHvLJmp8e2TD*KgdXDN|%Nb#*7(2Ig1PTt{fR5+(@Nv zXAMzUT?*; za@^okWR$_Hb}%{IB~Qf|QK^d}Z^>{cPqWwV?RC0B(J`FoPq%uVCSz1Js}%C|>py;z zrv9CmpFzbrg~*q`YlRot^IGr0aF3r&TLNdIe7_LiFO5UIw2C3Gf}7Si|4EHK#A>;| z#(C5|*J=Ox9#VOO4bPGnMxG#9ew?3b$}#cY`G*5c=eEi7RLb5G-m~PQl*ct8DAH1% zp8Np2q75QKN3OLVB{E1TOkF-oFF^~5jEpSXg9~*sFXWZJK@huvB2jBMMGN|to9%xq z_W_ER`|*k}+}Z@~@Gs_z3kxBRb5#fsc$4)EV=vPG>nDRw@{W&n*0-apo z{j3FCR-yrQNLPve&w*rV=|w{6u=r`|!IwckKOgdFo&UiKWTO54H69{9kp2tp$V_AZ zODxmagVy+95E03IvIzfBo6oZUk03-hrtvS!`_ATH@)i9#FEcNp5l;kzroF4H`YScK zyY^o9XJ_7cN)h;+6pu0q4Wgm1pZOyfeqMAY;A`DV{>8;-nAun@REVLFPOxNVj@h_D z1rBOnDU~O)#xQ%OLbOi>pX#8aHavP&g1oP6Pa!B8$no zgVud10qsK4ux-eeo+^Hm3Vs~t|9w$K2EVc6gUmGVA^Z}cKezmk(~hF)Fi8T!jBL$3 zqbRE^ZQe+Znl(yUdpTR)2<8Vp_>uPFMgGC{z-6lVhXDm={2xd7=l=iah3hu|`Ty;8 ztZd8Gmz!OOX7x-Hz}VfOQ3>RNBb~PK8-OE{H!-1%S9rR=zwh>A_>n<2ukARTBB|A9 zt6g;Z2N$23qEUW*x-P9!AVGl|j_~Hq8=oI<6;a#l9?ex5gvW8TqTAGys+B$glcR5= zFUs1!wY9a@X_3du*7hlA7cY79McwWE$8&>hFmKGqbA`FGRNO@J^gq9%50EHeQ?;~w z3fdnbf-3>oc{uw5J=~Osx3XtY%VomFJn(8e14LN#_tF;zed54iS{K3vig?bo0ZZCd z=iM<_1?sv0{C0My&B6)^_%$YYy*LpRd3fkVlAxfit7|clFTQzI?vcmB%p9}O3>`9G zth0u^aQ*%cnTw~Y%CsvVBdiAYp(B}+I|55AqzAWY#N)CcS^kSHnO|9E$GVykED zNyy5=VnIPcVUZ1-hPvKfnI;hbO|}!1UZ8hUy)wsVx%;)_bUCz8z8A=eX+7&)vYp%!lkfKm$;#uvEy?Bw@LQpTJ!gyoIhabW(9$lq@n@W zTx|e@%Tg<~92*;B*3&Hq3PU|;`Y+(VDc2Nm^XlxEHp>a{Oc$@uwibca*Waa8s#aoU zFp(?V2Vj~-KA|vUuTW7U(bv$#ElieI`hdkU6mB#aGla6d1 z9UbPN3f~2<>2#4M2zXD$#l_*hRzS@4Px$03 z8XHr9p=9;vUQB=x0BbERYsRdDytDHs{pvhX?_QhwqK_XHRJ4FkmcKjo?Hk?4EZ{F7 zOXJS~T4?KZqwo6R?j)*=?=8H5g8=Rx5puZNMr=}}r@ICsgMg6m%ZQgD=tPZblXB_*lA zAN>GUc0XL;hLr2gf$2jIWZ9PE)`N8q5x5&I23ScDX90QpdwV@_vyj}S1pzu#vhwf! zCJ_$2<+~5+I*dRH0pngX8InYFG9i+yiJ{A96adwIhj||80#`=ner5YrQE4d}IL*4>8{0>fY*W+v zZ0R&z!dPJ;U}6>n_Y4#e(qMhd_t}g|Wjz2?YoF1GBToKV=)(P0ZsnI)VFlsb02spgOY!5)bBTmyYMBI z8v~Ue%Ob3E(V`<(R93>kf_GLgMIFL!*wlUG#mH^@N9*NF%#2ZbRy}`z(d_K({#Tz@ zT^br2%}>@kEVAK!hSzZ6!&jud09-n!)t@bKvC``_oh#At)9&_Uh^? zv)&v)MK{5B4FU#qpes9@jLoP;}-ZwUA#OMLM1XnCmf;ns0b-^~XlXKZlI?||J4BxnKeW21o$LIA6N1(#+4 zjVhoU%x9}UR&aq}Am}c^q{-zM6s!l4!JG1h??)f&3P_k=9UAKf2Nf2%uy!X3h-W~{ z!c-7IFmN#ojuz{qzy;p%Y8yC_m1Q&X-A;1?R2V#murV?!x<|hOwtOAXPgBJ&zG*!t zwb%fu+6v49OMp^Zqv26n0icj^ODM4e6pHPNWnc0dqbW z1`-%ZT>6fVjw5NFSI4U=m9uqV{K>$yj_5caVf|{w0|V-&fl7+fJo8{!@iVZf!E`Eh zvA^sm!NP@|=6t`8+}_#Y z=`fkF8PEL!ygW9;LGSN@L*O&fZm^7i3}CLD&Sp-Tq?o<~+BP0eD|1?dTSG`dPzzGO zPgyL}3l>HQP}@YfRc&nl!W}a2K9)y~J{WKi|IwHC7s}D{TvfGj5E@q%#5g2uPN=hFX5;JNrxI_kNAQ6^p zuYn@G9$=T?1*}X=X1{hPG7{o4l&r1eVO@WYT%CF&FjQ*h>%l623Cj18PW6%l0?YUg zkjt^9no=^)UK+OhaD(MEFkDPTqIyX(V#TL1QS3Sxa|OH@3A7vz?Zp|0~-;#?K~lOM2P~t zc@uwjcsxVW($XN1;;Cp*bhH?8aQ}g)J+NBs76em5hY%ouTSf!xABZh@;6NbK_;9PS z+lt5h{`&0t$Tc_)M9*d@8YN_628&2$_*7nxN#@x|Wkp3VNWYpOV;@wv;ZBHOK|B9G z+?DOYJ$g`rKtZ{km6bL8^{bq&E)giUPeE22PIu(V>i^re>f+(yu@0)V@RyW82a*-KrNlYh#Pq9nT3W6l>z|) zHWLuD`D$bM_{_~W3e$nSb{l5`bkG+jphSclmLNHzfu*(&PV9m@(tM@G9q92rJ>h8X z*Qe&W5`knUHN-%ojOg3w251wwm$>k3osf{waxrIkR`B;;(a1$z9nYoxOaUt5fe!xj zrWX{a?xXC@8h4U1!?lY1ArZ-`wlICTY%BI~y=4b>cJA)n|7>~l#o?ukos*NCsw$3% zh)696N+VDJEOZ8n!W-U!b0PxUL?G0{5!)&SH(