From f0ae4d1144c69b5f12ca9290437004a8ba618530 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 16 May 2026 14:31:17 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: rbelanec/train_cola_42_1774791067 Source: Original Platform --- .gitattributes | 36 + README.md | 81 + all_results.json | 13 + config.json | 39 + eval_results.json | 8 + generation_config.json | 12 + model.safetensors | 3 + special_tokens_map.json | 26 + tokenizer.json | 3 + tokenizer_config.json | 2069 ++++++++++ train.yaml | 55 + train_results.json | 9 + trainer_log.jsonl | 982 +++++ trainer_state.json | 7911 +++++++++++++++++++++++++++++++++++++++ training_args.bin | 3 + training_eval_loss.png | Bin 0 -> 40596 bytes training_loss.png | Bin 0 -> 43109 bytes 17 files changed, 11250 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 all_results.json create mode 100644 config.json create mode 100644 eval_results.json create mode 100644 generation_config.json create mode 100644 model.safetensors create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train.yaml create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_eval_loss.png create mode 100644 training_loss.png diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..d023fd2 --- /dev/null +++ b/README.md @@ -0,0 +1,81 @@ +--- +library_name: transformers +license: llama3.2 +base_model: meta-llama/Llama-3.2-1B-Instruct +tags: +- peft-factory +- full +- llama-factory +- generated_from_trainer +model-index: +- name: train_cola_42_1774791067 + results: [] +--- + + + +# train_cola_42_1774791067 + +This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on the cola dataset. +It achieves the following results on the evaluation set: +- Loss: 0.2517 +- Num Input Tokens Seen: 1932608 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 5e-05 +- train_batch_size: 8 +- eval_batch_size: 8 +- seed: 42 +- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 5 + +### Training results + +| Training Loss | Epoch | Step | Validation Loss | Input Tokens Seen | +|:-------------:|:------:|:----:|:---------------:|:-----------------:| +| 0.2682 | 0.2505 | 241 | 0.3847 | 97664 | +| 0.3383 | 0.5010 | 482 | 0.4081 | 194560 | +| 0.2962 | 0.7516 | 723 | 0.2960 | 291712 | +| 0.2807 | 1.0021 | 964 | 0.2739 | 387464 | +| 0.2836 | 1.2526 | 1205 | 0.2581 | 485192 | +| 0.2936 | 1.5031 | 1446 | 0.2570 | 581704 | +| 0.2705 | 1.7536 | 1687 | 0.2560 | 677576 | +| 0.2243 | 2.0042 | 1928 | 0.2575 | 775312 | +| 0.2477 | 2.2547 | 2169 | 0.2924 | 873104 | +| 0.2379 | 2.5052 | 2410 | 0.2577 | 969360 | +| 0.2934 | 2.7557 | 2651 | 0.2561 | 1065232 | +| 0.2209 | 3.0062 | 2892 | 0.2571 | 1162016 | +| 0.2647 | 3.2568 | 3133 | 0.2563 | 1259168 | +| 0.2795 | 3.5073 | 3374 | 0.2642 | 1355552 | +| 0.2751 | 3.7578 | 3615 | 0.2587 | 1453088 | +| 0.279 | 4.0083 | 3856 | 0.2559 | 1549360 | +| 0.2511 | 4.2588 | 4097 | 0.2517 | 1645808 | +| 0.2709 | 4.5094 | 4338 | 0.2577 | 1742960 | +| 0.2582 | 4.7599 | 4579 | 0.2605 | 1839344 | + + +### Framework versions + +- Transformers 4.51.3 +- Pytorch 2.10.0+cu128 +- Datasets 4.0.0 +- Tokenizers 0.21.4 diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..09451bb --- /dev/null +++ b/all_results.json @@ -0,0 +1,13 @@ +{ + "epoch": 5.0, + "eval_loss": 0.2517484128475189, + "eval_runtime": 1.0765, + "eval_samples_per_second": 795.158, + "eval_steps_per_second": 99.395, + "num_input_tokens_seen": 1932608, + "total_flos": 1.1284259767320576e+16, + "train_loss": 0.28020706261022177, + "train_runtime": 1219.1473, + "train_samples_per_second": 31.559, + "train_steps_per_second": 3.945 +} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..5a2b93f --- /dev/null +++ b/config.json @@ -0,0 +1,39 @@ +{ + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "head_dim": 64, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 8192, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "num_attention_heads": 32, + "num_hidden_layers": 16, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 32.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": true, + "torch_dtype": "float32", + "transformers_version": "4.51.3", + "use_cache": false, + "vocab_size": 128256 +} diff --git a/eval_results.json b/eval_results.json new file mode 100644 index 0000000..644a594 --- /dev/null +++ b/eval_results.json @@ -0,0 +1,8 @@ +{ + "epoch": 5.0, + "eval_loss": 0.2517484128475189, + "eval_runtime": 1.0765, + "eval_samples_per_second": 795.158, + "eval_steps_per_second": 99.395, + "num_input_tokens_seen": 1932608 +} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..2b8ae57 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,12 @@ +{ + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "4.51.3" +} diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..ecb65f0 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49453a8a59c41f07303c0305d6cb0bfbf753e3a0717998dae6c48680bac9eb03 +size 4943274328 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..14daf45 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,26 @@ +{ + "additional_special_tokens": [ + { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } + ], + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "<|eot_id|>" +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..1c1d8d5 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..ddc3ce0 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2069 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "additional_special_tokens": [ + "<|eom_id|>" + ], + "bos_token": "<|begin_of_text|>", + "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- if strftime_now is defined %}\n {%- set date_string = strftime_now(\"%d %b %Y\") %}\n {%- else %}\n {%- set date_string = \"26 Jul 2024\" %}\n {%- endif %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message #}\n{{- \"<|start_header_id|>system<|end_header_id|>\\n\\n\" }}\n{%- if tools is not none %}\n {{- \"Environment: ipython\\n\" }}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\\n\" }}\n{{- \"Today Date: \" + date_string + \"\\n\\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\\n\\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\\n\\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {{- \"<|eot_id|>\" }}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\\n\\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}\n{%- endif %}\n", + "clean_up_tokenization_spaces": true, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "pad_token": "<|eot_id|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "PreTrainedTokenizer" +} diff --git a/train.yaml b/train.yaml new file mode 100644 index 0000000..2cf3291 --- /dev/null +++ b/train.yaml @@ -0,0 +1,55 @@ +seed: 42 + +### model +model_name_or_path: meta-llama/Llama-3.2-1B-Instruct +trust_remote_code: true +flash_attn: auto +use_cache: false + +### method +stage: sft +do_train: true +finetuning_type: full + +### dataset +dataset: cola +template: llama3 +cutoff_len: 2048 +overwrite_cache: true +preprocessing_num_workers: 4 +dataloader_num_workers: 4 +packing: false + +### output +output_dir: saves_bts_preliminary/base/llama-3.2-1b-instruct/train_cola_42_1774791067 +logging_steps: 5 +save_steps: 0.05 +overwrite_output_dir: true +save_only_model: false +plot_loss: true +include_num_input_tokens_seen: true +push_to_hub: true +push_to_hub_organization: rbelanec +load_best_model_at_end: true +save_total_limit: 1 + +### train +per_device_train_batch_size: 8 +learning_rate: 5.0e-5 +num_train_epochs: 5 +weight_decay: 1.0e-5 +lr_scheduler_type: cosine +bf16: true +ddp_timeout: 180000000 +resume_from_checkpoint: null +warmup_ratio: 0.1 +optim: adamw_torch +report_to: +- wandb +run_name: base_llama-3.2-1b-instruct_train_cola_42_1774791067 + +### eval +per_device_eval_batch_size: 8 +eval_strategy: steps +eval_steps: 0.05 +val_size: 0.1 \ No newline at end of file diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..eedd4d4 --- /dev/null +++ b/train_results.json @@ -0,0 +1,9 @@ +{ + "epoch": 5.0, + "num_input_tokens_seen": 1932608, + "total_flos": 1.1284259767320576e+16, + "train_loss": 0.28020706261022177, + "train_runtime": 1219.1473, + "train_samples_per_second": 31.559, + "train_steps_per_second": 3.945 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..a8598b6 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,982 @@ +{"current_steps": 5, "total_steps": 4810, "loss": 1.2842, "lr": 4.1580041580041583e-07, "epoch": 0.005197505197505198, "percentage": 0.1, "elapsed_time": "0:00:00", "remaining_time": "0:11:53", "throughput": 2757.56, "total_tokens": 2048} +{"current_steps": 10, "total_steps": 4810, "loss": 0.8545, "lr": 9.355509355509356e-07, "epoch": 0.010395010395010396, "percentage": 0.21, "elapsed_time": "0:00:01", "remaining_time": "0:08:39", "throughput": 3904.41, "total_tokens": 4224} +{"current_steps": 15, "total_steps": 4810, "loss": 0.3278, "lr": 1.4553014553014554e-06, "epoch": 0.015592515592515593, "percentage": 0.31, "elapsed_time": "0:00:01", "remaining_time": "0:07:30", "throughput": 4453.08, "total_tokens": 6272} +{"current_steps": 20, "total_steps": 4810, "loss": 0.365, "lr": 1.975051975051975e-06, "epoch": 0.02079002079002079, "percentage": 0.42, "elapsed_time": "0:00:01", "remaining_time": "0:06:55", "throughput": 4827.17, "total_tokens": 8384} +{"current_steps": 25, "total_steps": 4810, "loss": 0.4433, "lr": 2.494802494802495e-06, "epoch": 0.02598752598752599, "percentage": 0.52, "elapsed_time": "0:00:02", "remaining_time": "0:06:35", "throughput": 5084.42, "total_tokens": 10496} +{"current_steps": 30, "total_steps": 4810, "loss": 0.2526, "lr": 3.014553014553015e-06, "epoch": 0.031185031185031187, "percentage": 0.62, "elapsed_time": "0:00:02", "remaining_time": "0:06:21", "throughput": 5245.81, "total_tokens": 12544} +{"current_steps": 35, "total_steps": 4810, "loss": 0.3051, "lr": 3.5343035343035348e-06, "epoch": 0.036382536382536385, "percentage": 0.73, "elapsed_time": "0:00:02", "remaining_time": "0:06:10", "throughput": 5345.36, "total_tokens": 14528} +{"current_steps": 40, "total_steps": 4810, "loss": 0.5129, "lr": 4.0540540540540545e-06, "epoch": 0.04158004158004158, "percentage": 0.83, "elapsed_time": "0:00:03", "remaining_time": "0:06:03", "throughput": 5443.98, "total_tokens": 16576} +{"current_steps": 45, "total_steps": 4810, "loss": 0.283, "lr": 4.573804573804574e-06, "epoch": 0.04677754677754678, "percentage": 0.94, "elapsed_time": "0:00:03", "remaining_time": "0:05:57", "throughput": 5503.03, "total_tokens": 18560} +{"current_steps": 50, "total_steps": 4810, "loss": 0.454, "lr": 5.093555093555094e-06, "epoch": 0.05197505197505198, "percentage": 1.04, "elapsed_time": "0:00:03", "remaining_time": "0:05:52", "throughput": 5567.22, "total_tokens": 20608} +{"current_steps": 55, "total_steps": 4810, "loss": 0.2518, "lr": 5.613305613305614e-06, "epoch": 0.057172557172557176, "percentage": 1.14, "elapsed_time": "0:00:04", "remaining_time": "0:05:48", "throughput": 5624.89, "total_tokens": 22656} +{"current_steps": 60, "total_steps": 4810, "loss": 0.2538, "lr": 6.1330561330561335e-06, "epoch": 0.062370062370062374, "percentage": 1.25, "elapsed_time": "0:00:04", "remaining_time": "0:05:44", "throughput": 5658.03, "total_tokens": 24640} +{"current_steps": 65, "total_steps": 4810, "loss": 0.3571, "lr": 6.652806652806653e-06, "epoch": 0.06756756756756757, "percentage": 1.35, "elapsed_time": "0:00:04", "remaining_time": "0:05:41", "throughput": 5713.0, "total_tokens": 26752} +{"current_steps": 70, "total_steps": 4810, "loss": 0.3588, "lr": 7.172557172557173e-06, "epoch": 0.07276507276507277, "percentage": 1.46, "elapsed_time": "0:00:05", "remaining_time": "0:05:40", "throughput": 5695.8, "total_tokens": 28608} +{"current_steps": 75, "total_steps": 4810, "loss": 0.2553, "lr": 7.692307692307694e-06, "epoch": 0.07796257796257797, "percentage": 1.56, "elapsed_time": "0:00:05", "remaining_time": "0:05:38", "throughput": 5762.97, "total_tokens": 30912} +{"current_steps": 80, "total_steps": 4810, "loss": 0.3869, "lr": 8.212058212058212e-06, "epoch": 0.08316008316008316, "percentage": 1.66, "elapsed_time": "0:00:05", "remaining_time": "0:05:36", "throughput": 5779.52, "total_tokens": 32896} +{"current_steps": 85, "total_steps": 4810, "loss": 0.3812, "lr": 8.731808731808733e-06, "epoch": 0.08835758835758836, "percentage": 1.77, "elapsed_time": "0:00:06", "remaining_time": "0:05:34", "throughput": 5785.23, "total_tokens": 34816} +{"current_steps": 90, "total_steps": 4810, "loss": 0.735, "lr": 9.251559251559252e-06, "epoch": 0.09355509355509356, "percentage": 1.87, "elapsed_time": "0:00:06", "remaining_time": "0:05:32", "throughput": 5789.57, "total_tokens": 36736} +{"current_steps": 95, "total_steps": 4810, "loss": 0.4027, "lr": 9.771309771309773e-06, "epoch": 0.09875259875259876, "percentage": 1.98, "elapsed_time": "0:00:06", "remaining_time": "0:05:31", "throughput": 5803.2, "total_tokens": 38720} +{"current_steps": 100, "total_steps": 4810, "loss": 0.4605, "lr": 1.0291060291060291e-05, "epoch": 0.10395010395010396, "percentage": 2.08, "elapsed_time": "0:00:06", "remaining_time": "0:05:29", "throughput": 5806.07, "total_tokens": 40640} +{"current_steps": 105, "total_steps": 4810, "loss": 0.2999, "lr": 1.0810810810810812e-05, "epoch": 0.10914760914760915, "percentage": 2.18, "elapsed_time": "0:00:07", "remaining_time": "0:05:28", "throughput": 5825.69, "total_tokens": 42688} +{"current_steps": 110, "total_steps": 4810, "loss": 0.2839, "lr": 1.1330561330561331e-05, "epoch": 0.11434511434511435, "percentage": 2.29, "elapsed_time": "0:00:07", "remaining_time": "0:05:27", "throughput": 5819.07, "total_tokens": 44544} +{"current_steps": 115, "total_steps": 4810, "loss": 0.3329, "lr": 1.1850311850311852e-05, "epoch": 0.11954261954261955, "percentage": 2.39, "elapsed_time": "0:00:07", "remaining_time": "0:05:25", "throughput": 5813.31, "total_tokens": 46400} +{"current_steps": 120, "total_steps": 4810, "loss": 0.2089, "lr": 1.2370062370062372e-05, "epoch": 0.12474012474012475, "percentage": 2.49, "elapsed_time": "0:00:08", "remaining_time": "0:05:24", "throughput": 5831.11, "total_tokens": 48448} +{"current_steps": 125, "total_steps": 4810, "loss": 0.2829, "lr": 1.2889812889812891e-05, "epoch": 0.12993762993762994, "percentage": 2.6, "elapsed_time": "0:00:08", "remaining_time": "0:05:23", "throughput": 5847.65, "total_tokens": 50496} +{"current_steps": 130, "total_steps": 4810, "loss": 0.2434, "lr": 1.3409563409563412e-05, "epoch": 0.13513513513513514, "percentage": 2.7, "elapsed_time": "0:00:08", "remaining_time": "0:05:22", "throughput": 5848.59, "total_tokens": 52416} +{"current_steps": 135, "total_steps": 4810, "loss": 0.3621, "lr": 1.392931392931393e-05, "epoch": 0.14033264033264034, "percentage": 2.81, "elapsed_time": "0:00:09", "remaining_time": "0:05:21", "throughput": 5862.86, "total_tokens": 54464} +{"current_steps": 140, "total_steps": 4810, "loss": 0.3338, "lr": 1.4449064449064451e-05, "epoch": 0.14553014553014554, "percentage": 2.91, "elapsed_time": "0:00:09", "remaining_time": "0:05:20", "throughput": 5869.77, "total_tokens": 56448} +{"current_steps": 145, "total_steps": 4810, "loss": 0.3185, "lr": 1.496881496881497e-05, "epoch": 0.15072765072765074, "percentage": 3.01, "elapsed_time": "0:00:09", "remaining_time": "0:05:19", "throughput": 5869.29, "total_tokens": 58368} +{"current_steps": 150, "total_steps": 4810, "loss": 0.2379, "lr": 1.548856548856549e-05, "epoch": 0.15592515592515593, "percentage": 3.12, "elapsed_time": "0:00:10", "remaining_time": "0:05:19", "throughput": 5893.67, "total_tokens": 60544} +{"current_steps": 155, "total_steps": 4810, "loss": 0.3634, "lr": 1.600831600831601e-05, "epoch": 0.16112266112266113, "percentage": 3.22, "elapsed_time": "0:00:10", "remaining_time": "0:05:18", "throughput": 5905.86, "total_tokens": 62592} +{"current_steps": 160, "total_steps": 4810, "loss": 0.3093, "lr": 1.652806652806653e-05, "epoch": 0.16632016632016633, "percentage": 3.33, "elapsed_time": "0:00:10", "remaining_time": "0:05:17", "throughput": 5911.89, "total_tokens": 64576} +{"current_steps": 165, "total_steps": 4810, "loss": 0.3377, "lr": 1.704781704781705e-05, "epoch": 0.17151767151767153, "percentage": 3.43, "elapsed_time": "0:00:11", "remaining_time": "0:05:16", "throughput": 5927.46, "total_tokens": 66688} +{"current_steps": 170, "total_steps": 4810, "loss": 0.3224, "lr": 1.756756756756757e-05, "epoch": 0.17671517671517672, "percentage": 3.53, "elapsed_time": "0:00:11", "remaining_time": "0:05:16", "throughput": 5919.3, "total_tokens": 68544} +{"current_steps": 175, "total_steps": 4810, "loss": 0.3814, "lr": 1.808731808731809e-05, "epoch": 0.18191268191268192, "percentage": 3.64, "elapsed_time": "0:00:12", "remaining_time": "0:05:27", "throughput": 5710.55, "total_tokens": 70592} +{"current_steps": 180, "total_steps": 4810, "loss": 0.338, "lr": 1.8607068607068607e-05, "epoch": 0.18711018711018712, "percentage": 3.74, "elapsed_time": "0:00:12", "remaining_time": "0:05:26", "throughput": 5718.74, "total_tokens": 72576} +{"current_steps": 185, "total_steps": 4810, "loss": 0.2853, "lr": 1.9126819126819128e-05, "epoch": 0.19230769230769232, "percentage": 3.85, "elapsed_time": "0:00:13", "remaining_time": "0:05:25", "throughput": 5731.48, "total_tokens": 74624} +{"current_steps": 190, "total_steps": 4810, "loss": 0.3374, "lr": 1.964656964656965e-05, "epoch": 0.19750519750519752, "percentage": 3.95, "elapsed_time": "0:00:13", "remaining_time": "0:05:24", "throughput": 5738.89, "total_tokens": 76608} +{"current_steps": 195, "total_steps": 4810, "loss": 0.3221, "lr": 2.016632016632017e-05, "epoch": 0.20270270270270271, "percentage": 4.05, "elapsed_time": "0:00:13", "remaining_time": "0:05:23", "throughput": 5754.71, "total_tokens": 78720} +{"current_steps": 200, "total_steps": 4810, "loss": 0.3944, "lr": 2.068607068607069e-05, "epoch": 0.2079002079002079, "percentage": 4.16, "elapsed_time": "0:00:14", "remaining_time": "0:05:23", "throughput": 5787.47, "total_tokens": 81152} +{"current_steps": 205, "total_steps": 4810, "loss": 0.3755, "lr": 2.1205821205821207e-05, "epoch": 0.2130977130977131, "percentage": 4.26, "elapsed_time": "0:00:14", "remaining_time": "0:05:22", "throughput": 5796.3, "total_tokens": 83200} +{"current_steps": 210, "total_steps": 4810, "loss": 0.2949, "lr": 2.1725571725571728e-05, "epoch": 0.2182952182952183, "percentage": 4.37, "elapsed_time": "0:00:14", "remaining_time": "0:05:21", "throughput": 5799.6, "total_tokens": 85184} +{"current_steps": 215, "total_steps": 4810, "loss": 0.2174, "lr": 2.2245322245322248e-05, "epoch": 0.2234927234927235, "percentage": 4.47, "elapsed_time": "0:00:15", "remaining_time": "0:05:21", "throughput": 5807.71, "total_tokens": 87232} +{"current_steps": 220, "total_steps": 4810, "loss": 0.6706, "lr": 2.276507276507277e-05, "epoch": 0.2286902286902287, "percentage": 4.57, "elapsed_time": "0:00:15", "remaining_time": "0:05:20", "throughput": 5807.19, "total_tokens": 89152} +{"current_steps": 225, "total_steps": 4810, "loss": 0.4387, "lr": 2.3284823284823286e-05, "epoch": 0.2338877338877339, "percentage": 4.68, "elapsed_time": "0:00:15", "remaining_time": "0:05:19", "throughput": 5823.81, "total_tokens": 91328} +{"current_steps": 230, "total_steps": 4810, "loss": 0.3047, "lr": 2.3804573804573807e-05, "epoch": 0.2390852390852391, "percentage": 4.78, "elapsed_time": "0:00:16", "remaining_time": "0:05:18", "throughput": 5827.3, "total_tokens": 93312} +{"current_steps": 235, "total_steps": 4810, "loss": 0.2717, "lr": 2.4324324324324327e-05, "epoch": 0.2442827442827443, "percentage": 4.89, "elapsed_time": "0:00:16", "remaining_time": "0:05:18", "throughput": 5831.51, "total_tokens": 95296} +{"current_steps": 240, "total_steps": 4810, "loss": 0.2682, "lr": 2.4844074844074848e-05, "epoch": 0.2494802494802495, "percentage": 4.99, "elapsed_time": "0:00:16", "remaining_time": "0:05:17", "throughput": 5831.46, "total_tokens": 97216} +{"current_steps": 241, "total_steps": 4810, "eval_loss": 0.38468512892723083, "epoch": 0.2505197505197505, "percentage": 5.01, "elapsed_time": "0:00:18", "remaining_time": "0:05:47", "throughput": 5322.21, "total_tokens": 97664} +{"current_steps": 245, "total_steps": 4810, "loss": 0.344, "lr": 2.5363825363825365e-05, "epoch": 0.25467775467775466, "percentage": 5.09, "elapsed_time": "0:01:24", "remaining_time": "0:26:21", "throughput": 1169.55, "total_tokens": 99264} +{"current_steps": 250, "total_steps": 4810, "loss": 0.3993, "lr": 2.5883575883575882e-05, "epoch": 0.2598752598752599, "percentage": 5.2, "elapsed_time": "0:01:25", "remaining_time": "0:25:53", "throughput": 1187.72, "total_tokens": 101184} +{"current_steps": 255, "total_steps": 4810, "loss": 0.4414, "lr": 2.6403326403326406e-05, "epoch": 0.26507276507276506, "percentage": 5.3, "elapsed_time": "0:01:25", "remaining_time": "0:25:27", "throughput": 1207.94, "total_tokens": 103296} +{"current_steps": 260, "total_steps": 4810, "loss": 0.3322, "lr": 2.6923076923076923e-05, "epoch": 0.2702702702702703, "percentage": 5.41, "elapsed_time": "0:01:25", "remaining_time": "0:25:02", "throughput": 1227.21, "total_tokens": 105344} +{"current_steps": 265, "total_steps": 4810, "loss": 0.3314, "lr": 2.7442827442827447e-05, "epoch": 0.27546777546777546, "percentage": 5.51, "elapsed_time": "0:01:26", "remaining_time": "0:24:37", "throughput": 1246.38, "total_tokens": 107392} +{"current_steps": 270, "total_steps": 4810, "loss": 0.2951, "lr": 2.796257796257796e-05, "epoch": 0.2806652806652807, "percentage": 5.61, "elapsed_time": "0:01:26", "remaining_time": "0:24:14", "throughput": 1265.4, "total_tokens": 109440} +{"current_steps": 275, "total_steps": 4810, "loss": 0.2986, "lr": 2.8482328482328485e-05, "epoch": 0.28586278586278585, "percentage": 5.72, "elapsed_time": "0:01:26", "remaining_time": "0:23:51", "throughput": 1283.53, "total_tokens": 111424} +{"current_steps": 280, "total_steps": 4810, "loss": 0.407, "lr": 2.9002079002079002e-05, "epoch": 0.2910602910602911, "percentage": 5.82, "elapsed_time": "0:01:27", "remaining_time": "0:23:29", "throughput": 1301.55, "total_tokens": 113408} +{"current_steps": 285, "total_steps": 4810, "loss": 0.4506, "lr": 2.9521829521829526e-05, "epoch": 0.29625779625779625, "percentage": 5.93, "elapsed_time": "0:01:27", "remaining_time": "0:23:08", "throughput": 1319.43, "total_tokens": 115392} +{"current_steps": 290, "total_steps": 4810, "loss": 0.4738, "lr": 3.0041580041580043e-05, "epoch": 0.30145530145530147, "percentage": 6.03, "elapsed_time": "0:01:27", "remaining_time": "0:22:48", "throughput": 1337.92, "total_tokens": 117440} +{"current_steps": 295, "total_steps": 4810, "loss": 0.5248, "lr": 3.056133056133057e-05, "epoch": 0.30665280665280664, "percentage": 6.13, "elapsed_time": "0:01:28", "remaining_time": "0:22:28", "throughput": 1355.54, "total_tokens": 119424} +{"current_steps": 300, "total_steps": 4810, "loss": 0.3321, "lr": 3.108108108108108e-05, "epoch": 0.31185031185031187, "percentage": 6.24, "elapsed_time": "0:01:28", "remaining_time": "0:22:09", "throughput": 1372.32, "total_tokens": 121344} +{"current_steps": 305, "total_steps": 4810, "loss": 0.3707, "lr": 3.16008316008316e-05, "epoch": 0.31704781704781704, "percentage": 6.34, "elapsed_time": "0:01:28", "remaining_time": "0:21:50", "throughput": 1388.99, "total_tokens": 123264} +{"current_steps": 310, "total_steps": 4810, "loss": 0.3574, "lr": 3.212058212058212e-05, "epoch": 0.32224532224532226, "percentage": 6.44, "elapsed_time": "0:01:29", "remaining_time": "0:21:32", "throughput": 1405.52, "total_tokens": 125184} +{"current_steps": 315, "total_steps": 4810, "loss": 0.2851, "lr": 3.264033264033264e-05, "epoch": 0.32744282744282743, "percentage": 6.55, "elapsed_time": "0:01:29", "remaining_time": "0:21:15", "throughput": 1424.06, "total_tokens": 127296} +{"current_steps": 320, "total_steps": 4810, "loss": 0.2794, "lr": 3.3160083160083164e-05, "epoch": 0.33264033264033266, "percentage": 6.65, "elapsed_time": "0:01:29", "remaining_time": "0:20:58", "throughput": 1442.47, "total_tokens": 129408} +{"current_steps": 325, "total_steps": 4810, "loss": 0.3015, "lr": 3.3679833679833684e-05, "epoch": 0.33783783783783783, "percentage": 6.76, "elapsed_time": "0:01:30", "remaining_time": "0:20:42", "throughput": 1460.75, "total_tokens": 131520} +{"current_steps": 330, "total_steps": 4810, "loss": 0.2826, "lr": 3.41995841995842e-05, "epoch": 0.34303534303534305, "percentage": 6.86, "elapsed_time": "0:01:30", "remaining_time": "0:20:26", "throughput": 1478.21, "total_tokens": 133568} +{"current_steps": 335, "total_steps": 4810, "loss": 0.3704, "lr": 3.4719334719334725e-05, "epoch": 0.3482328482328482, "percentage": 6.96, "elapsed_time": "0:01:30", "remaining_time": "0:20:11", "throughput": 1495.54, "total_tokens": 135616} +{"current_steps": 340, "total_steps": 4810, "loss": 0.4519, "lr": 3.523908523908524e-05, "epoch": 0.35343035343035345, "percentage": 7.07, "elapsed_time": "0:01:31", "remaining_time": "0:19:56", "throughput": 1512.75, "total_tokens": 137664} +{"current_steps": 345, "total_steps": 4810, "loss": 0.2863, "lr": 3.575883575883576e-05, "epoch": 0.3586278586278586, "percentage": 7.17, "elapsed_time": "0:01:31", "remaining_time": "0:19:41", "throughput": 1528.46, "total_tokens": 139584} +{"current_steps": 350, "total_steps": 4810, "loss": 0.4921, "lr": 3.627858627858628e-05, "epoch": 0.36382536382536385, "percentage": 7.28, "elapsed_time": "0:01:31", "remaining_time": "0:19:27", "throughput": 1544.03, "total_tokens": 141504} +{"current_steps": 355, "total_steps": 4810, "loss": 0.3078, "lr": 3.67983367983368e-05, "epoch": 0.369022869022869, "percentage": 7.38, "elapsed_time": "0:01:31", "remaining_time": "0:19:14", "throughput": 1560.88, "total_tokens": 143552} +{"current_steps": 360, "total_steps": 4810, "loss": 0.252, "lr": 3.731808731808732e-05, "epoch": 0.37422037422037424, "percentage": 7.48, "elapsed_time": "0:01:32", "remaining_time": "0:19:00", "throughput": 1576.94, "total_tokens": 145536} +{"current_steps": 365, "total_steps": 4810, "loss": 0.2894, "lr": 3.783783783783784e-05, "epoch": 0.3794178794178794, "percentage": 7.59, "elapsed_time": "0:01:32", "remaining_time": "0:18:47", "throughput": 1592.2, "total_tokens": 147456} +{"current_steps": 370, "total_steps": 4810, "loss": 0.1779, "lr": 3.8357588357588356e-05, "epoch": 0.38461538461538464, "percentage": 7.69, "elapsed_time": "0:01:32", "remaining_time": "0:18:35", "throughput": 1608.02, "total_tokens": 149440} +{"current_steps": 375, "total_steps": 4810, "loss": 0.4928, "lr": 3.8877338877338883e-05, "epoch": 0.3898128898128898, "percentage": 7.8, "elapsed_time": "0:01:33", "remaining_time": "0:18:22", "throughput": 1623.06, "total_tokens": 151360} +{"current_steps": 380, "total_steps": 4810, "loss": 0.4363, "lr": 3.93970893970894e-05, "epoch": 0.39501039501039503, "percentage": 7.9, "elapsed_time": "0:01:33", "remaining_time": "0:18:10", "throughput": 1638.67, "total_tokens": 153344} +{"current_steps": 385, "total_steps": 4810, "loss": 0.2689, "lr": 3.991683991683992e-05, "epoch": 0.4002079002079002, "percentage": 8.0, "elapsed_time": "0:01:33", "remaining_time": "0:17:59", "throughput": 1653.51, "total_tokens": 155264} +{"current_steps": 390, "total_steps": 4810, "loss": 0.2539, "lr": 4.043659043659044e-05, "epoch": 0.40540540540540543, "percentage": 8.11, "elapsed_time": "0:01:34", "remaining_time": "0:17:47", "throughput": 1668.91, "total_tokens": 157248} +{"current_steps": 395, "total_steps": 4810, "loss": 0.332, "lr": 4.095634095634096e-05, "epoch": 0.4106029106029106, "percentage": 8.21, "elapsed_time": "0:01:34", "remaining_time": "0:17:36", "throughput": 1684.86, "total_tokens": 159296} +{"current_steps": 400, "total_steps": 4810, "loss": 0.3, "lr": 4.147609147609148e-05, "epoch": 0.4158004158004158, "percentage": 8.32, "elapsed_time": "0:01:34", "remaining_time": "0:17:25", "throughput": 1700.71, "total_tokens": 161344} +{"current_steps": 405, "total_steps": 4810, "loss": 0.2376, "lr": 4.1995841995842e-05, "epoch": 0.420997920997921, "percentage": 8.42, "elapsed_time": "0:01:35", "remaining_time": "0:17:15", "throughput": 1715.8, "total_tokens": 163328} +{"current_steps": 410, "total_steps": 4810, "loss": 0.2709, "lr": 4.2515592515592514e-05, "epoch": 0.4261954261954262, "percentage": 8.52, "elapsed_time": "0:01:35", "remaining_time": "0:17:05", "throughput": 1730.79, "total_tokens": 165312} +{"current_steps": 415, "total_steps": 4810, "loss": 0.1471, "lr": 4.303534303534304e-05, "epoch": 0.4313929313929314, "percentage": 8.63, "elapsed_time": "0:01:35", "remaining_time": "0:16:54", "throughput": 1746.32, "total_tokens": 167360} +{"current_steps": 420, "total_steps": 4810, "loss": 0.9994, "lr": 4.3555093555093555e-05, "epoch": 0.4365904365904366, "percentage": 8.73, "elapsed_time": "0:01:36", "remaining_time": "0:16:45", "throughput": 1761.1, "total_tokens": 169344} +{"current_steps": 425, "total_steps": 4810, "loss": 0.603, "lr": 4.407484407484408e-05, "epoch": 0.4417879417879418, "percentage": 8.84, "elapsed_time": "0:01:36", "remaining_time": "0:16:35", "throughput": 1777.09, "total_tokens": 171456} +{"current_steps": 430, "total_steps": 4810, "loss": 0.3054, "lr": 4.4594594594594596e-05, "epoch": 0.446985446985447, "percentage": 8.94, "elapsed_time": "0:01:36", "remaining_time": "0:16:26", "throughput": 1792.97, "total_tokens": 173568} +{"current_steps": 435, "total_steps": 4810, "loss": 0.3208, "lr": 4.511434511434512e-05, "epoch": 0.4521829521829522, "percentage": 9.04, "elapsed_time": "0:01:37", "remaining_time": "0:16:16", "throughput": 1807.43, "total_tokens": 175552} +{"current_steps": 440, "total_steps": 4810, "loss": 0.2942, "lr": 4.563409563409564e-05, "epoch": 0.4573804573804574, "percentage": 9.15, "elapsed_time": "0:01:37", "remaining_time": "0:16:07", "throughput": 1821.82, "total_tokens": 177536} +{"current_steps": 445, "total_steps": 4810, "loss": 0.3005, "lr": 4.615384615384616e-05, "epoch": 0.4625779625779626, "percentage": 9.25, "elapsed_time": "0:01:37", "remaining_time": "0:15:59", "throughput": 1836.74, "total_tokens": 179584} +{"current_steps": 450, "total_steps": 4810, "loss": 1.7773, "lr": 4.667359667359668e-05, "epoch": 0.4677754677754678, "percentage": 9.36, "elapsed_time": "0:01:38", "remaining_time": "0:15:50", "throughput": 1850.96, "total_tokens": 181568} +{"current_steps": 455, "total_steps": 4810, "loss": 0.2889, "lr": 4.71933471933472e-05, "epoch": 0.47297297297297297, "percentage": 9.46, "elapsed_time": "0:01:38", "remaining_time": "0:15:41", "throughput": 1865.07, "total_tokens": 183552} +{"current_steps": 460, "total_steps": 4810, "loss": 0.2556, "lr": 4.771309771309771e-05, "epoch": 0.4781704781704782, "percentage": 9.56, "elapsed_time": "0:01:38", "remaining_time": "0:15:33", "throughput": 1879.73, "total_tokens": 185600} +{"current_steps": 465, "total_steps": 4810, "loss": 0.2378, "lr": 4.823284823284824e-05, "epoch": 0.48336798336798337, "percentage": 9.67, "elapsed_time": "0:01:39", "remaining_time": "0:15:25", "throughput": 1893.65, "total_tokens": 187584} +{"current_steps": 470, "total_steps": 4810, "loss": 0.2859, "lr": 4.8752598752598754e-05, "epoch": 0.4885654885654886, "percentage": 9.77, "elapsed_time": "0:01:39", "remaining_time": "0:15:17", "throughput": 1907.49, "total_tokens": 189568} +{"current_steps": 475, "total_steps": 4810, "loss": 0.2438, "lr": 4.9272349272349275e-05, "epoch": 0.49376299376299376, "percentage": 9.88, "elapsed_time": "0:01:39", "remaining_time": "0:15:09", "throughput": 1922.49, "total_tokens": 191680} +{"current_steps": 480, "total_steps": 4810, "loss": 0.3383, "lr": 4.9792099792099796e-05, "epoch": 0.498960498960499, "percentage": 9.98, "elapsed_time": "0:01:40", "remaining_time": "0:15:02", "throughput": 1936.77, "total_tokens": 193728} +{"current_steps": 482, "total_steps": 4810, "eval_loss": 0.4080815315246582, "epoch": 0.501039501039501, "percentage": 10.02, "elapsed_time": "0:01:42", "remaining_time": "0:15:22", "throughput": 1893.12, "total_tokens": 194560} +{"current_steps": 485, "total_steps": 4810, "loss": 0.381, "lr": 4.999994075155936e-05, "epoch": 0.5041580041580042, "percentage": 10.08, "elapsed_time": "0:02:26", "remaining_time": "0:21:48", "throughput": 1333.87, "total_tokens": 195776} +{"current_steps": 490, "total_steps": 4810, "loss": 0.2916, "lr": 4.999957867877242e-05, "epoch": 0.5093555093555093, "percentage": 10.19, "elapsed_time": "0:02:27", "remaining_time": "0:21:36", "throughput": 1343.99, "total_tokens": 197696} +{"current_steps": 495, "total_steps": 4810, "loss": 0.2766, "lr": 4.999888745376028e-05, "epoch": 0.5145530145530145, "percentage": 10.29, "elapsed_time": "0:02:27", "remaining_time": "0:21:25", "throughput": 1354.51, "total_tokens": 199680} +{"current_steps": 500, "total_steps": 4810, "loss": 0.2596, "lr": 4.9997867085623824e-05, "epoch": 0.5197505197505198, "percentage": 10.4, "elapsed_time": "0:02:27", "remaining_time": "0:21:13", "throughput": 1365.84, "total_tokens": 201792} +{"current_steps": 505, "total_steps": 4810, "loss": 0.2689, "lr": 4.999651758779754e-05, "epoch": 0.524948024948025, "percentage": 10.5, "elapsed_time": "0:02:28", "remaining_time": "0:21:02", "throughput": 1376.7, "total_tokens": 203840} +{"current_steps": 510, "total_steps": 4810, "loss": 0.3363, "lr": 4.999483897804933e-05, "epoch": 0.5301455301455301, "percentage": 10.6, "elapsed_time": "0:02:28", "remaining_time": "0:20:51", "throughput": 1387.08, "total_tokens": 205824} +{"current_steps": 515, "total_steps": 4810, "loss": 0.2583, "lr": 4.999283127848029e-05, "epoch": 0.5353430353430353, "percentage": 10.71, "elapsed_time": "0:02:28", "remaining_time": "0:20:40", "throughput": 1398.29, "total_tokens": 207936} +{"current_steps": 520, "total_steps": 4810, "loss": 0.3915, "lr": 4.999049451552443e-05, "epoch": 0.5405405405405406, "percentage": 10.81, "elapsed_time": "0:02:29", "remaining_time": "0:20:29", "throughput": 1409.0, "total_tokens": 209984} +{"current_steps": 525, "total_steps": 4810, "loss": 0.2461, "lr": 4.9987828719948284e-05, "epoch": 0.5457380457380457, "percentage": 10.91, "elapsed_time": "0:02:29", "remaining_time": "0:20:19", "throughput": 1420.08, "total_tokens": 212096} +{"current_steps": 530, "total_steps": 4810, "loss": 0.2863, "lr": 4.998483392685055e-05, "epoch": 0.5509355509355509, "percentage": 11.02, "elapsed_time": "0:02:29", "remaining_time": "0:20:08", "throughput": 1430.25, "total_tokens": 214080} +{"current_steps": 535, "total_steps": 4810, "loss": 0.3052, "lr": 4.9981510175661606e-05, "epoch": 0.5561330561330561, "percentage": 11.12, "elapsed_time": "0:02:30", "remaining_time": "0:19:58", "throughput": 1440.81, "total_tokens": 216128} +{"current_steps": 540, "total_steps": 4810, "loss": 0.3625, "lr": 4.9977857510143e-05, "epoch": 0.5613305613305614, "percentage": 11.23, "elapsed_time": "0:02:30", "remaining_time": "0:19:48", "throughput": 1451.32, "total_tokens": 218176} +{"current_steps": 545, "total_steps": 4810, "loss": 0.2801, "lr": 4.9973875978386843e-05, "epoch": 0.5665280665280665, "percentage": 11.33, "elapsed_time": "0:02:30", "remaining_time": "0:19:38", "throughput": 1460.95, "total_tokens": 220096} +{"current_steps": 550, "total_steps": 4810, "loss": 0.3041, "lr": 4.996956563281524e-05, "epoch": 0.5717255717255717, "percentage": 11.43, "elapsed_time": "0:02:30", "remaining_time": "0:19:29", "throughput": 1470.96, "total_tokens": 222080} +{"current_steps": 555, "total_steps": 4810, "loss": 0.2498, "lr": 4.996492653017952e-05, "epoch": 0.5769230769230769, "percentage": 11.54, "elapsed_time": "0:02:31", "remaining_time": "0:19:19", "throughput": 1480.53, "total_tokens": 224000} +{"current_steps": 560, "total_steps": 4810, "loss": 0.3224, "lr": 4.995995873155958e-05, "epoch": 0.5821205821205822, "percentage": 11.64, "elapsed_time": "0:02:31", "remaining_time": "0:19:10", "throughput": 1490.44, "total_tokens": 225984} +{"current_steps": 565, "total_steps": 4810, "loss": 0.322, "lr": 4.9954662302362973e-05, "epoch": 0.5873180873180873, "percentage": 11.75, "elapsed_time": "0:02:31", "remaining_time": "0:19:01", "throughput": 1499.45, "total_tokens": 227840} +{"current_steps": 570, "total_steps": 4810, "loss": 0.302, "lr": 4.9949037312324155e-05, "epoch": 0.5925155925155925, "percentage": 11.85, "elapsed_time": "0:02:32", "remaining_time": "0:18:52", "throughput": 1509.26, "total_tokens": 229824} +{"current_steps": 575, "total_steps": 4810, "loss": 0.3875, "lr": 4.9943083835503467e-05, "epoch": 0.5977130977130977, "percentage": 11.95, "elapsed_time": "0:02:32", "remaining_time": "0:18:43", "throughput": 1519.42, "total_tokens": 231872} +{"current_steps": 580, "total_steps": 4810, "loss": 0.314, "lr": 4.993680195028626e-05, "epoch": 0.6029106029106029, "percentage": 12.06, "elapsed_time": "0:02:32", "remaining_time": "0:18:35", "throughput": 1529.47, "total_tokens": 233920} +{"current_steps": 585, "total_steps": 4810, "loss": 0.3189, "lr": 4.9930191739381775e-05, "epoch": 0.6081081081081081, "percentage": 12.16, "elapsed_time": "0:02:33", "remaining_time": "0:18:27", "throughput": 1538.53, "total_tokens": 235840} +{"current_steps": 590, "total_steps": 4810, "loss": 0.3418, "lr": 4.9923253289822116e-05, "epoch": 0.6133056133056133, "percentage": 12.27, "elapsed_time": "0:02:33", "remaining_time": "0:18:18", "throughput": 1549.37, "total_tokens": 238016} +{"current_steps": 595, "total_steps": 4810, "loss": 0.3307, "lr": 4.9915986692961045e-05, "epoch": 0.6185031185031185, "percentage": 12.37, "elapsed_time": "0:02:33", "remaining_time": "0:18:10", "throughput": 1559.36, "total_tokens": 240064} +{"current_steps": 600, "total_steps": 4810, "loss": 0.2835, "lr": 4.9908392044472865e-05, "epoch": 0.6237006237006237, "percentage": 12.47, "elapsed_time": "0:02:34", "remaining_time": "0:18:02", "throughput": 1568.82, "total_tokens": 242048} +{"current_steps": 605, "total_steps": 4810, "loss": 0.2584, "lr": 4.990046944435105e-05, "epoch": 0.6288981288981289, "percentage": 12.58, "elapsed_time": "0:02:34", "remaining_time": "0:17:54", "throughput": 1577.81, "total_tokens": 243968} +{"current_steps": 610, "total_steps": 4810, "loss": 0.2953, "lr": 4.989221899690704e-05, "epoch": 0.6340956340956341, "percentage": 12.68, "elapsed_time": "0:02:34", "remaining_time": "0:17:46", "throughput": 1587.65, "total_tokens": 246016} +{"current_steps": 615, "total_steps": 4810, "loss": 0.3214, "lr": 4.9883640810768764e-05, "epoch": 0.6392931392931392, "percentage": 12.79, "elapsed_time": "0:02:35", "remaining_time": "0:17:39", "throughput": 1597.04, "total_tokens": 248000} +{"current_steps": 620, "total_steps": 4810, "loss": 0.312, "lr": 4.9874734998879316e-05, "epoch": 0.6444906444906445, "percentage": 12.89, "elapsed_time": "0:02:35", "remaining_time": "0:17:31", "throughput": 1606.81, "total_tokens": 250048} +{"current_steps": 625, "total_steps": 4810, "loss": 0.3215, "lr": 4.9865501678495375e-05, "epoch": 0.6496881496881497, "percentage": 12.99, "elapsed_time": "0:02:35", "remaining_time": "0:17:24", "throughput": 1616.56, "total_tokens": 252096} +{"current_steps": 630, "total_steps": 4810, "loss": 0.2892, "lr": 4.98559409711857e-05, "epoch": 0.6548856548856549, "percentage": 13.1, "elapsed_time": "0:02:36", "remaining_time": "0:17:16", "throughput": 1626.24, "total_tokens": 254144} +{"current_steps": 635, "total_steps": 4810, "loss": 0.3016, "lr": 4.984605300282954e-05, "epoch": 0.66008316008316, "percentage": 13.2, "elapsed_time": "0:02:36", "remaining_time": "0:17:09", "throughput": 1635.48, "total_tokens": 256128} +{"current_steps": 640, "total_steps": 4810, "loss": 0.2596, "lr": 4.983583790361497e-05, "epoch": 0.6652806652806653, "percentage": 13.31, "elapsed_time": "0:02:36", "remaining_time": "0:17:02", "throughput": 1644.28, "total_tokens": 258048} +{"current_steps": 645, "total_steps": 4810, "loss": 0.363, "lr": 4.982529580803714e-05, "epoch": 0.6704781704781705, "percentage": 13.41, "elapsed_time": "0:02:37", "remaining_time": "0:16:55", "throughput": 1655.47, "total_tokens": 260352} +{"current_steps": 650, "total_steps": 4810, "loss": 0.2849, "lr": 4.981442685489659e-05, "epoch": 0.6756756756756757, "percentage": 13.51, "elapsed_time": "0:02:37", "remaining_time": "0:16:48", "throughput": 1664.2, "total_tokens": 262272} +{"current_steps": 655, "total_steps": 4810, "loss": 0.2969, "lr": 4.9803231187297304e-05, "epoch": 0.6808731808731808, "percentage": 13.62, "elapsed_time": "0:02:37", "remaining_time": "0:16:41", "throughput": 1673.71, "total_tokens": 264320} +{"current_steps": 660, "total_steps": 4810, "loss": 0.3962, "lr": 4.979170895264494e-05, "epoch": 0.6860706860706861, "percentage": 13.72, "elapsed_time": "0:02:38", "remaining_time": "0:16:35", "throughput": 1682.4, "total_tokens": 266240} +{"current_steps": 665, "total_steps": 4810, "loss": 0.312, "lr": 4.977986030264482e-05, "epoch": 0.6912681912681913, "percentage": 13.83, "elapsed_time": "0:02:38", "remaining_time": "0:16:28", "throughput": 1691.44, "total_tokens": 268224} +{"current_steps": 670, "total_steps": 4810, "loss": 0.2552, "lr": 4.976768539329994e-05, "epoch": 0.6964656964656964, "percentage": 13.93, "elapsed_time": "0:02:38", "remaining_time": "0:16:21", "throughput": 1700.79, "total_tokens": 270272} +{"current_steps": 675, "total_steps": 4810, "loss": 0.312, "lr": 4.975518438490897e-05, "epoch": 0.7016632016632016, "percentage": 14.03, "elapsed_time": "0:02:39", "remaining_time": "0:16:15", "throughput": 1709.69, "total_tokens": 272256} +{"current_steps": 680, "total_steps": 4810, "loss": 0.2889, "lr": 4.9742357442064045e-05, "epoch": 0.7068607068607069, "percentage": 14.14, "elapsed_time": "0:02:39", "remaining_time": "0:16:09", "throughput": 1718.52, "total_tokens": 274240} +{"current_steps": 685, "total_steps": 4810, "loss": 0.2841, "lr": 4.972920473364869e-05, "epoch": 0.7120582120582121, "percentage": 14.24, "elapsed_time": "0:02:39", "remaining_time": "0:16:02", "throughput": 1727.83, "total_tokens": 276288} +{"current_steps": 690, "total_steps": 4810, "loss": 0.3076, "lr": 4.971572643283557e-05, "epoch": 0.7172557172557172, "percentage": 14.35, "elapsed_time": "0:02:40", "remaining_time": "0:15:56", "throughput": 1736.68, "total_tokens": 278272} +{"current_steps": 695, "total_steps": 4810, "loss": 0.285, "lr": 4.970192271708416e-05, "epoch": 0.7224532224532224, "percentage": 14.45, "elapsed_time": "0:02:40", "remaining_time": "0:15:50", "throughput": 1746.31, "total_tokens": 280384} +{"current_steps": 700, "total_steps": 4810, "loss": 0.2376, "lr": 4.968779376813849e-05, "epoch": 0.7276507276507277, "percentage": 14.55, "elapsed_time": "0:02:40", "remaining_time": "0:15:44", "throughput": 1755.12, "total_tokens": 282368} +{"current_steps": 705, "total_steps": 4810, "loss": 0.2787, "lr": 4.967333977202469e-05, "epoch": 0.7328482328482329, "percentage": 14.66, "elapsed_time": "0:02:41", "remaining_time": "0:15:38", "throughput": 1764.26, "total_tokens": 284416} +{"current_steps": 710, "total_steps": 4810, "loss": 0.214, "lr": 4.965856091904855e-05, "epoch": 0.738045738045738, "percentage": 14.76, "elapsed_time": "0:02:41", "remaining_time": "0:15:32", "throughput": 1773.35, "total_tokens": 286464} +{"current_steps": 715, "total_steps": 4810, "loss": 0.2858, "lr": 4.964345740379307e-05, "epoch": 0.7432432432432432, "percentage": 14.86, "elapsed_time": "0:02:41", "remaining_time": "0:15:27", "throughput": 1782.08, "total_tokens": 288448} +{"current_steps": 720, "total_steps": 4810, "loss": 0.2962, "lr": 4.962802942511581e-05, "epoch": 0.7484407484407485, "percentage": 14.97, "elapsed_time": "0:02:42", "remaining_time": "0:15:21", "throughput": 1791.15, "total_tokens": 290496} +{"current_steps": 723, "total_steps": 4810, "eval_loss": 0.29600390791893005, "epoch": 0.7515592515592515, "percentage": 15.03, "elapsed_time": "0:02:45", "remaining_time": "0:15:36", "throughput": 1760.16, "total_tokens": 291712} +{"current_steps": 725, "total_steps": 4810, "loss": 0.3061, "lr": 4.9612277186146335e-05, "epoch": 0.7536382536382537, "percentage": 15.07, "elapsed_time": "0:03:10", "remaining_time": "0:17:54", "throughput": 1533.17, "total_tokens": 292480} +{"current_steps": 730, "total_steps": 4810, "loss": 0.281, "lr": 4.959620089428354e-05, "epoch": 0.7588357588357588, "percentage": 15.18, "elapsed_time": "0:03:11", "remaining_time": "0:17:48", "throughput": 1540.92, "total_tokens": 294464} +{"current_steps": 735, "total_steps": 4810, "loss": 0.2702, "lr": 4.957980076119285e-05, "epoch": 0.764033264033264, "percentage": 15.28, "elapsed_time": "0:03:11", "remaining_time": "0:17:41", "throughput": 1548.64, "total_tokens": 296448} +{"current_steps": 740, "total_steps": 4810, "loss": 0.3146, "lr": 4.956307700280354e-05, "epoch": 0.7692307692307693, "percentage": 15.38, "elapsed_time": "0:03:11", "remaining_time": "0:17:34", "throughput": 1556.34, "total_tokens": 298432} +{"current_steps": 745, "total_steps": 4810, "loss": 0.2567, "lr": 4.954602983930581e-05, "epoch": 0.7744282744282744, "percentage": 15.49, "elapsed_time": "0:03:12", "remaining_time": "0:17:28", "throughput": 1564.35, "total_tokens": 300480} +{"current_steps": 750, "total_steps": 4810, "loss": 0.2488, "lr": 4.95286594951479e-05, "epoch": 0.7796257796257796, "percentage": 15.59, "elapsed_time": "0:03:12", "remaining_time": "0:17:21", "throughput": 1571.67, "total_tokens": 302400} +{"current_steps": 755, "total_steps": 4810, "loss": 0.2852, "lr": 4.9510966199033174e-05, "epoch": 0.7848232848232848, "percentage": 15.7, "elapsed_time": "0:03:12", "remaining_time": "0:17:15", "throughput": 1578.95, "total_tokens": 304320} +{"current_steps": 760, "total_steps": 4810, "loss": 0.2968, "lr": 4.949295018391706e-05, "epoch": 0.7900207900207901, "percentage": 15.8, "elapsed_time": "0:03:13", "remaining_time": "0:17:08", "throughput": 1586.22, "total_tokens": 306240} +{"current_steps": 765, "total_steps": 4810, "loss": 0.2957, "lr": 4.947461168700402e-05, "epoch": 0.7952182952182952, "percentage": 15.9, "elapsed_time": "0:03:13", "remaining_time": "0:17:02", "throughput": 1592.79, "total_tokens": 308032} +{"current_steps": 770, "total_steps": 4810, "loss": 0.2531, "lr": 4.945595094974442e-05, "epoch": 0.8004158004158004, "percentage": 16.01, "elapsed_time": "0:03:13", "remaining_time": "0:16:56", "throughput": 1600.02, "total_tokens": 309952} +{"current_steps": 775, "total_steps": 4810, "loss": 0.2396, "lr": 4.94369682178313e-05, "epoch": 0.8056133056133056, "percentage": 16.11, "elapsed_time": "0:03:14", "remaining_time": "0:16:50", "throughput": 1607.56, "total_tokens": 311936} +{"current_steps": 780, "total_steps": 4810, "loss": 0.3127, "lr": 4.9417663741197236e-05, "epoch": 0.8108108108108109, "percentage": 16.22, "elapsed_time": "0:03:14", "remaining_time": "0:16:44", "throughput": 1615.06, "total_tokens": 313920} +{"current_steps": 785, "total_steps": 4810, "loss": 0.2873, "lr": 4.939803777401095e-05, "epoch": 0.816008316008316, "percentage": 16.32, "elapsed_time": "0:03:14", "remaining_time": "0:16:38", "throughput": 1622.88, "total_tokens": 315968} +{"current_steps": 790, "total_steps": 4810, "loss": 0.263, "lr": 4.937809057467404e-05, "epoch": 0.8212058212058212, "percentage": 16.42, "elapsed_time": "0:03:15", "remaining_time": "0:16:32", "throughput": 1630.33, "total_tokens": 317952} +{"current_steps": 795, "total_steps": 4810, "loss": 0.2762, "lr": 4.935782240581752e-05, "epoch": 0.8264033264033264, "percentage": 16.53, "elapsed_time": "0:03:15", "remaining_time": "0:16:26", "throughput": 1637.42, "total_tokens": 319872} +{"current_steps": 800, "total_steps": 4810, "loss": 0.2759, "lr": 4.9337233534298425e-05, "epoch": 0.8316008316008316, "percentage": 16.63, "elapsed_time": "0:03:15", "remaining_time": "0:16:20", "throughput": 1644.81, "total_tokens": 321856} +{"current_steps": 805, "total_steps": 4810, "loss": 0.2849, "lr": 4.931632423119621e-05, "epoch": 0.8367983367983368, "percentage": 16.74, "elapsed_time": "0:03:16", "remaining_time": "0:16:15", "throughput": 1652.83, "total_tokens": 323968} +{"current_steps": 810, "total_steps": 4810, "loss": 0.2775, "lr": 4.9295094771809285e-05, "epoch": 0.841995841995842, "percentage": 16.84, "elapsed_time": "0:03:16", "remaining_time": "0:16:09", "throughput": 1660.17, "total_tokens": 325952} +{"current_steps": 815, "total_steps": 4810, "loss": 0.1962, "lr": 4.92735454356513e-05, "epoch": 0.8471933471933472, "percentage": 16.94, "elapsed_time": "0:03:16", "remaining_time": "0:16:04", "throughput": 1667.81, "total_tokens": 328000} +{"current_steps": 820, "total_steps": 4810, "loss": 0.2237, "lr": 4.925167650644752e-05, "epoch": 0.8523908523908524, "percentage": 17.05, "elapsed_time": "0:03:16", "remaining_time": "0:15:58", "throughput": 1675.11, "total_tokens": 329984} +{"current_steps": 825, "total_steps": 4810, "loss": 0.3432, "lr": 4.9229488272131067e-05, "epoch": 0.8575883575883576, "percentage": 17.15, "elapsed_time": "0:03:17", "remaining_time": "0:15:55", "throughput": 1678.38, "total_tokens": 331904} +{"current_steps": 830, "total_steps": 4810, "loss": 0.3102, "lr": 4.920698102483912e-05, "epoch": 0.8627858627858628, "percentage": 17.26, "elapsed_time": "0:03:18", "remaining_time": "0:15:49", "throughput": 1685.65, "total_tokens": 333888} +{"current_steps": 835, "total_steps": 4810, "loss": 0.3035, "lr": 4.918415506090911e-05, "epoch": 0.867983367983368, "percentage": 17.36, "elapsed_time": "0:03:18", "remaining_time": "0:15:44", "throughput": 1692.85, "total_tokens": 335872} +{"current_steps": 840, "total_steps": 4810, "loss": 0.2682, "lr": 4.916101068087476e-05, "epoch": 0.8731808731808732, "percentage": 17.46, "elapsed_time": "0:03:18", "remaining_time": "0:15:39", "throughput": 1700.06, "total_tokens": 337856} +{"current_steps": 845, "total_steps": 4810, "loss": 0.2422, "lr": 4.913754818946219e-05, "epoch": 0.8783783783783784, "percentage": 17.57, "elapsed_time": "0:03:19", "remaining_time": "0:15:34", "throughput": 1706.95, "total_tokens": 339776} +{"current_steps": 850, "total_steps": 4810, "loss": 0.1949, "lr": 4.911376789558584e-05, "epoch": 0.8835758835758836, "percentage": 17.67, "elapsed_time": "0:03:19", "remaining_time": "0:15:28", "throughput": 1714.11, "total_tokens": 341760} +{"current_steps": 855, "total_steps": 4810, "loss": 0.3477, "lr": 4.9089670112344456e-05, "epoch": 0.8887733887733887, "percentage": 17.78, "elapsed_time": "0:03:19", "remaining_time": "0:15:23", "throughput": 1720.91, "total_tokens": 343680} +{"current_steps": 860, "total_steps": 4810, "loss": 0.292, "lr": 4.906525515701695e-05, "epoch": 0.893970893970894, "percentage": 17.88, "elapsed_time": "0:03:20", "remaining_time": "0:15:18", "throughput": 1727.68, "total_tokens": 345600} +{"current_steps": 865, "total_steps": 4810, "loss": 0.2896, "lr": 4.904052335105822e-05, "epoch": 0.8991683991683992, "percentage": 17.98, "elapsed_time": "0:03:20", "remaining_time": "0:15:13", "throughput": 1734.39, "total_tokens": 347520} +{"current_steps": 870, "total_steps": 4810, "loss": 0.2644, "lr": 4.90154750200949e-05, "epoch": 0.9043659043659044, "percentage": 18.09, "elapsed_time": "0:03:20", "remaining_time": "0:15:08", "throughput": 1741.73, "total_tokens": 349568} +{"current_steps": 875, "total_steps": 4810, "loss": 0.3212, "lr": 4.8990110493921105e-05, "epoch": 0.9095634095634095, "percentage": 18.19, "elapsed_time": "0:03:21", "remaining_time": "0:15:04", "throughput": 1748.72, "total_tokens": 351552} +{"current_steps": 880, "total_steps": 4810, "loss": 0.2787, "lr": 4.8964430106494075e-05, "epoch": 0.9147609147609148, "percentage": 18.3, "elapsed_time": "0:03:21", "remaining_time": "0:14:59", "throughput": 1755.37, "total_tokens": 353472} +{"current_steps": 885, "total_steps": 4810, "loss": 0.2656, "lr": 4.893843419592977e-05, "epoch": 0.91995841995842, "percentage": 18.4, "elapsed_time": "0:03:21", "remaining_time": "0:14:54", "throughput": 1762.01, "total_tokens": 355392} +{"current_steps": 890, "total_steps": 4810, "loss": 0.2593, "lr": 4.891212310449844e-05, "epoch": 0.9251559251559252, "percentage": 18.5, "elapsed_time": "0:03:22", "remaining_time": "0:14:49", "throughput": 1769.28, "total_tokens": 357440} +{"current_steps": 895, "total_steps": 4810, "loss": 0.2785, "lr": 4.8885497178620095e-05, "epoch": 0.9303534303534303, "percentage": 18.61, "elapsed_time": "0:03:22", "remaining_time": "0:14:45", "throughput": 1776.53, "total_tokens": 359488} +{"current_steps": 900, "total_steps": 4810, "loss": 0.283, "lr": 4.8858556768859944e-05, "epoch": 0.9355509355509356, "percentage": 18.71, "elapsed_time": "0:03:22", "remaining_time": "0:14:40", "throughput": 1783.12, "total_tokens": 361408} +{"current_steps": 905, "total_steps": 4810, "loss": 0.27, "lr": 4.88313022299238e-05, "epoch": 0.9407484407484408, "percentage": 18.81, "elapsed_time": "0:03:23", "remaining_time": "0:14:35", "throughput": 1790.0, "total_tokens": 363392} +{"current_steps": 910, "total_steps": 4810, "loss": 0.2987, "lr": 4.88037339206534e-05, "epoch": 0.9459459459459459, "percentage": 18.92, "elapsed_time": "0:03:23", "remaining_time": "0:14:31", "throughput": 1797.17, "total_tokens": 365440} +{"current_steps": 915, "total_steps": 4810, "loss": 0.2998, "lr": 4.8775852204021665e-05, "epoch": 0.9511434511434511, "percentage": 19.02, "elapsed_time": "0:03:23", "remaining_time": "0:14:26", "throughput": 1804.95, "total_tokens": 367616} +{"current_steps": 920, "total_steps": 4810, "loss": 0.358, "lr": 4.874765744712796e-05, "epoch": 0.9563409563409564, "percentage": 19.13, "elapsed_time": "0:03:24", "remaining_time": "0:14:22", "throughput": 1811.76, "total_tokens": 369600} +{"current_steps": 925, "total_steps": 4810, "loss": 0.2755, "lr": 4.871915002119321e-05, "epoch": 0.9615384615384616, "percentage": 19.23, "elapsed_time": "0:03:24", "remaining_time": "0:14:18", "throughput": 1818.25, "total_tokens": 371520} +{"current_steps": 930, "total_steps": 4810, "loss": 0.3085, "lr": 4.8690330301555045e-05, "epoch": 0.9667359667359667, "percentage": 19.33, "elapsed_time": "0:03:24", "remaining_time": "0:14:13", "throughput": 1825.34, "total_tokens": 373568} +{"current_steps": 935, "total_steps": 4810, "loss": 0.2548, "lr": 4.8661198667662854e-05, "epoch": 0.9719334719334719, "percentage": 19.44, "elapsed_time": "0:03:24", "remaining_time": "0:14:09", "throughput": 1831.78, "total_tokens": 375488} +{"current_steps": 940, "total_steps": 4810, "loss": 0.3274, "lr": 4.86317555030728e-05, "epoch": 0.9771309771309772, "percentage": 19.54, "elapsed_time": "0:03:25", "remaining_time": "0:14:05", "throughput": 1839.74, "total_tokens": 377728} +{"current_steps": 945, "total_steps": 4810, "loss": 0.2924, "lr": 4.8602001195442725e-05, "epoch": 0.9823284823284824, "percentage": 19.65, "elapsed_time": "0:03:25", "remaining_time": "0:14:01", "throughput": 1847.07, "total_tokens": 379840} +{"current_steps": 950, "total_steps": 4810, "loss": 0.2685, "lr": 4.857193613652711e-05, "epoch": 0.9875259875259875, "percentage": 19.75, "elapsed_time": "0:03:25", "remaining_time": "0:13:56", "throughput": 1853.45, "total_tokens": 381760} +{"current_steps": 955, "total_steps": 4810, "loss": 0.2743, "lr": 4.8541560722171855e-05, "epoch": 0.9927234927234927, "percentage": 19.85, "elapsed_time": "0:03:26", "remaining_time": "0:13:52", "throughput": 1860.42, "total_tokens": 383808} +{"current_steps": 960, "total_steps": 4810, "loss": 0.2807, "lr": 4.8510875352309106e-05, "epoch": 0.997920997920998, "percentage": 19.96, "elapsed_time": "0:03:26", "remaining_time": "0:13:48", "throughput": 1867.39, "total_tokens": 385856} +{"current_steps": 964, "total_steps": 4810, "eval_loss": 0.2738620638847351, "epoch": 1.002079002079002, "percentage": 20.04, "elapsed_time": "0:03:27", "remaining_time": "0:13:49", "throughput": 1862.86, "total_tokens": 387464} +{"current_steps": 965, "total_steps": 4810, "loss": 0.2643, "lr": 4.8479880430951995e-05, "epoch": 1.003118503118503, "percentage": 20.06, "elapsed_time": "0:04:47", "remaining_time": "0:19:04", "throughput": 1350.42, "total_tokens": 387848} +{"current_steps": 970, "total_steps": 4810, "loss": 0.2613, "lr": 4.844857636618928e-05, "epoch": 1.0083160083160083, "percentage": 20.17, "elapsed_time": "0:04:47", "remaining_time": "0:18:58", "throughput": 1355.13, "total_tokens": 389640} +{"current_steps": 975, "total_steps": 4810, "loss": 0.2824, "lr": 4.8416963570180025e-05, "epoch": 1.0135135135135136, "percentage": 20.27, "elapsed_time": "0:04:47", "remaining_time": "0:18:52", "throughput": 1360.5, "total_tokens": 391624} +{"current_steps": 980, "total_steps": 4810, "loss": 0.3008, "lr": 4.838504245914812e-05, "epoch": 1.0187110187110187, "percentage": 20.37, "elapsed_time": "0:04:48", "remaining_time": "0:18:46", "throughput": 1366.09, "total_tokens": 393672} +{"current_steps": 985, "total_steps": 4810, "loss": 0.3048, "lr": 4.8352813453376836e-05, "epoch": 1.023908523908524, "percentage": 20.48, "elapsed_time": "0:04:48", "remaining_time": "0:18:40", "throughput": 1371.87, "total_tokens": 395784} +{"current_steps": 990, "total_steps": 4810, "loss": 0.3205, "lr": 4.83202769772033e-05, "epoch": 1.0291060291060292, "percentage": 20.58, "elapsed_time": "0:04:48", "remaining_time": "0:18:34", "throughput": 1377.22, "total_tokens": 397768} +{"current_steps": 995, "total_steps": 4810, "loss": 0.2694, "lr": 4.8287433459012844e-05, "epoch": 1.0343035343035343, "percentage": 20.69, "elapsed_time": "0:04:49", "remaining_time": "0:18:28", "throughput": 1382.77, "total_tokens": 399816} +{"current_steps": 1000, "total_steps": 4810, "loss": 0.3263, "lr": 4.8254283331233464e-05, "epoch": 1.0395010395010396, "percentage": 20.79, "elapsed_time": "0:04:49", "remaining_time": "0:18:22", "throughput": 1388.51, "total_tokens": 401928} +{"current_steps": 1005, "total_steps": 4810, "loss": 0.3028, "lr": 4.822082703033003e-05, "epoch": 1.0446985446985446, "percentage": 20.89, "elapsed_time": "0:04:49", "remaining_time": "0:18:17", "throughput": 1393.82, "total_tokens": 403912} +{"current_steps": 1010, "total_steps": 4810, "loss": 0.2501, "lr": 4.818706499679862e-05, "epoch": 1.04989604989605, "percentage": 21.0, "elapsed_time": "0:04:50", "remaining_time": "0:18:11", "throughput": 1398.9, "total_tokens": 405832} +{"current_steps": 1015, "total_steps": 4810, "loss": 0.339, "lr": 4.815299767516065e-05, "epoch": 1.0550935550935552, "percentage": 21.1, "elapsed_time": "0:04:50", "remaining_time": "0:18:05", "throughput": 1404.4, "total_tokens": 407880} +{"current_steps": 1020, "total_steps": 4810, "loss": 0.2748, "lr": 4.8118625513957074e-05, "epoch": 1.0602910602910602, "percentage": 21.21, "elapsed_time": "0:04:50", "remaining_time": "0:18:00", "throughput": 1410.53, "total_tokens": 410120} +{"current_steps": 1025, "total_steps": 4810, "loss": 0.3246, "lr": 4.808394896574245e-05, "epoch": 1.0654885654885655, "percentage": 21.31, "elapsed_time": "0:04:51", "remaining_time": "0:17:54", "throughput": 1416.01, "total_tokens": 412168} +{"current_steps": 1030, "total_steps": 4810, "loss": 0.2849, "lr": 4.8048968487079e-05, "epoch": 1.0706860706860706, "percentage": 21.41, "elapsed_time": "0:04:51", "remaining_time": "0:17:49", "throughput": 1422.32, "total_tokens": 414472} +{"current_steps": 1035, "total_steps": 4810, "loss": 0.2908, "lr": 4.8013684538530565e-05, "epoch": 1.0758835758835759, "percentage": 21.52, "elapsed_time": "0:04:51", "remaining_time": "0:17:44", "throughput": 1427.78, "total_tokens": 416520} +{"current_steps": 1040, "total_steps": 4810, "loss": 0.2774, "lr": 4.79780975846566e-05, "epoch": 1.0810810810810811, "percentage": 21.62, "elapsed_time": "0:04:52", "remaining_time": "0:17:38", "throughput": 1433.21, "total_tokens": 418568} +{"current_steps": 1045, "total_steps": 4810, "loss": 0.2417, "lr": 4.7942208094006e-05, "epoch": 1.0862785862785862, "percentage": 21.73, "elapsed_time": "0:04:52", "remaining_time": "0:17:33", "throughput": 1438.21, "total_tokens": 420488} +{"current_steps": 1050, "total_steps": 4810, "loss": 0.2736, "lr": 4.790601653911094e-05, "epoch": 1.0914760914760915, "percentage": 21.83, "elapsed_time": "0:04:52", "remaining_time": "0:17:28", "throughput": 1443.4, "total_tokens": 422472} +{"current_steps": 1055, "total_steps": 4810, "loss": 0.3165, "lr": 4.786952339648071e-05, "epoch": 1.0966735966735968, "percentage": 21.93, "elapsed_time": "0:04:53", "remaining_time": "0:17:22", "throughput": 1448.59, "total_tokens": 424456} +{"current_steps": 1060, "total_steps": 4810, "loss": 0.305, "lr": 4.783272914659535e-05, "epoch": 1.1018711018711018, "percentage": 22.04, "elapsed_time": "0:04:53", "remaining_time": "0:17:17", "throughput": 1454.19, "total_tokens": 426568} +{"current_steps": 1065, "total_steps": 4810, "loss": 0.2809, "lr": 4.77956342738994e-05, "epoch": 1.107068607068607, "percentage": 22.14, "elapsed_time": "0:04:53", "remaining_time": "0:17:12", "throughput": 1459.35, "total_tokens": 428552} +{"current_steps": 1070, "total_steps": 4810, "loss": 0.2758, "lr": 4.775823926679548e-05, "epoch": 1.1122661122661124, "percentage": 22.25, "elapsed_time": "0:04:53", "remaining_time": "0:17:07", "throughput": 1464.27, "total_tokens": 430472} +{"current_steps": 1075, "total_steps": 4810, "loss": 0.2657, "lr": 4.77205446176379e-05, "epoch": 1.1174636174636174, "percentage": 22.35, "elapsed_time": "0:04:54", "remaining_time": "0:17:02", "throughput": 1468.97, "total_tokens": 432328} +{"current_steps": 1080, "total_steps": 4810, "loss": 0.2881, "lr": 4.768255082272611e-05, "epoch": 1.1226611226611227, "percentage": 22.45, "elapsed_time": "0:04:54", "remaining_time": "0:16:57", "throughput": 1474.52, "total_tokens": 434440} +{"current_steps": 1085, "total_steps": 4810, "loss": 0.2938, "lr": 4.764425838229824e-05, "epoch": 1.1278586278586278, "percentage": 22.56, "elapsed_time": "0:04:54", "remaining_time": "0:16:52", "throughput": 1479.85, "total_tokens": 436488} +{"current_steps": 1090, "total_steps": 4810, "loss": 0.4153, "lr": 4.760566780052445e-05, "epoch": 1.133056133056133, "percentage": 22.66, "elapsed_time": "0:04:55", "remaining_time": "0:16:47", "throughput": 1484.95, "total_tokens": 438472} +{"current_steps": 1095, "total_steps": 4810, "loss": 0.3296, "lr": 4.7566779585500347e-05, "epoch": 1.1382536382536383, "percentage": 22.77, "elapsed_time": "0:04:55", "remaining_time": "0:16:42", "throughput": 1490.05, "total_tokens": 440456} +{"current_steps": 1100, "total_steps": 4810, "loss": 0.3082, "lr": 4.7527594249240264e-05, "epoch": 1.1434511434511434, "percentage": 22.87, "elapsed_time": "0:04:55", "remaining_time": "0:16:38", "throughput": 1495.12, "total_tokens": 442440} +{"current_steps": 1105, "total_steps": 4810, "loss": 0.3109, "lr": 4.748811230767051e-05, "epoch": 1.1486486486486487, "percentage": 22.97, "elapsed_time": "0:04:56", "remaining_time": "0:16:33", "throughput": 1500.18, "total_tokens": 444424} +{"current_steps": 1110, "total_steps": 4810, "loss": 0.2754, "lr": 4.744833428062262e-05, "epoch": 1.1538461538461537, "percentage": 23.08, "elapsed_time": "0:04:56", "remaining_time": "0:16:28", "throughput": 1504.81, "total_tokens": 446280} +{"current_steps": 1115, "total_steps": 4810, "loss": 0.286, "lr": 4.740826069182645e-05, "epoch": 1.159043659043659, "percentage": 23.18, "elapsed_time": "0:04:56", "remaining_time": "0:16:23", "throughput": 1509.85, "total_tokens": 448264} +{"current_steps": 1120, "total_steps": 4810, "loss": 0.2806, "lr": 4.736789206890332e-05, "epoch": 1.1642411642411643, "percentage": 23.28, "elapsed_time": "0:04:57", "remaining_time": "0:16:19", "throughput": 1515.31, "total_tokens": 450376} +{"current_steps": 1125, "total_steps": 4810, "loss": 0.2575, "lr": 4.732722894335909e-05, "epoch": 1.1694386694386694, "percentage": 23.39, "elapsed_time": "0:04:57", "remaining_time": "0:16:14", "throughput": 1520.98, "total_tokens": 452552} +{"current_steps": 1130, "total_steps": 4810, "loss": 0.2989, "lr": 4.7286271850577105e-05, "epoch": 1.1746361746361746, "percentage": 23.49, "elapsed_time": "0:04:57", "remaining_time": "0:16:10", "throughput": 1526.2, "total_tokens": 454600} +{"current_steps": 1135, "total_steps": 4810, "loss": 0.5214, "lr": 4.724502132981119e-05, "epoch": 1.17983367983368, "percentage": 23.6, "elapsed_time": "0:04:58", "remaining_time": "0:16:05", "throughput": 1531.41, "total_tokens": 456648} +{"current_steps": 1140, "total_steps": 4810, "loss": 0.3325, "lr": 4.7203477924178506e-05, "epoch": 1.185031185031185, "percentage": 23.7, "elapsed_time": "0:04:58", "remaining_time": "0:16:00", "throughput": 1536.4, "total_tokens": 458632} +{"current_steps": 1145, "total_steps": 4810, "loss": 0.2795, "lr": 4.7161642180652464e-05, "epoch": 1.1902286902286903, "percentage": 23.8, "elapsed_time": "0:04:58", "remaining_time": "0:15:56", "throughput": 1541.59, "total_tokens": 460680} +{"current_steps": 1150, "total_steps": 4810, "loss": 0.2697, "lr": 4.7119514650055476e-05, "epoch": 1.1954261954261955, "percentage": 23.91, "elapsed_time": "0:04:59", "remaining_time": "0:15:52", "throughput": 1546.76, "total_tokens": 462728} +{"current_steps": 1155, "total_steps": 4810, "loss": 0.2429, "lr": 4.7077095887051686e-05, "epoch": 1.2006237006237006, "percentage": 24.01, "elapsed_time": "0:04:59", "remaining_time": "0:15:47", "throughput": 1551.93, "total_tokens": 464776} +{"current_steps": 1160, "total_steps": 4810, "loss": 0.2844, "lr": 4.7034386450139735e-05, "epoch": 1.2058212058212059, "percentage": 24.12, "elapsed_time": "0:04:59", "remaining_time": "0:15:43", "throughput": 1556.65, "total_tokens": 466696} +{"current_steps": 1165, "total_steps": 4810, "loss": 0.259, "lr": 4.699138690164533e-05, "epoch": 1.211018711018711, "percentage": 24.22, "elapsed_time": "0:05:00", "remaining_time": "0:15:39", "throughput": 1561.37, "total_tokens": 468616} +{"current_steps": 1170, "total_steps": 4810, "loss": 0.2734, "lr": 4.694809780771391e-05, "epoch": 1.2162162162162162, "percentage": 24.32, "elapsed_time": "0:05:00", "remaining_time": "0:15:34", "throughput": 1566.71, "total_tokens": 470728} +{"current_steps": 1175, "total_steps": 4810, "loss": 0.2763, "lr": 4.690451973830313e-05, "epoch": 1.2214137214137215, "percentage": 24.43, "elapsed_time": "0:05:00", "remaining_time": "0:15:30", "throughput": 1571.84, "total_tokens": 472776} +{"current_steps": 1180, "total_steps": 4810, "loss": 0.2615, "lr": 4.6860653267175416e-05, "epoch": 1.2266112266112266, "percentage": 24.53, "elapsed_time": "0:05:01", "remaining_time": "0:15:26", "throughput": 1576.95, "total_tokens": 474824} +{"current_steps": 1185, "total_steps": 4810, "loss": 0.2894, "lr": 4.681649897189036e-05, "epoch": 1.2318087318087318, "percentage": 24.64, "elapsed_time": "0:05:01", "remaining_time": "0:15:22", "throughput": 1581.63, "total_tokens": 476744} +{"current_steps": 1190, "total_steps": 4810, "loss": 0.2065, "lr": 4.677205743379713e-05, "epoch": 1.237006237006237, "percentage": 24.74, "elapsed_time": "0:05:01", "remaining_time": "0:15:17", "throughput": 1586.92, "total_tokens": 478856} +{"current_steps": 1195, "total_steps": 4810, "loss": 0.4129, "lr": 4.672732923802685e-05, "epoch": 1.2422037422037422, "percentage": 24.84, "elapsed_time": "0:05:02", "remaining_time": "0:15:13", "throughput": 1591.58, "total_tokens": 480776} +{"current_steps": 1200, "total_steps": 4810, "loss": 0.2716, "lr": 4.668231497348484e-05, "epoch": 1.2474012474012475, "percentage": 24.95, "elapsed_time": "0:05:02", "remaining_time": "0:15:09", "throughput": 1597.07, "total_tokens": 482952} +{"current_steps": 1205, "total_steps": 4810, "loss": 0.2836, "lr": 4.663701523284291e-05, "epoch": 1.2525987525987525, "percentage": 25.05, "elapsed_time": "0:05:02", "remaining_time": "0:15:05", "throughput": 1602.75, "total_tokens": 485192} +{"current_steps": 1205, "total_steps": 4810, "eval_loss": 0.2581372559070587, "epoch": 1.2525987525987525, "percentage": 25.05, "elapsed_time": "0:05:04", "remaining_time": "0:15:10", "throughput": 1594.6, "total_tokens": 485192} +{"current_steps": 1210, "total_steps": 4810, "loss": 0.2541, "lr": 4.6591430612531515e-05, "epoch": 1.2577962577962578, "percentage": 25.16, "elapsed_time": "0:05:38", "remaining_time": "0:16:45", "throughput": 1440.85, "total_tokens": 487112} +{"current_steps": 1215, "total_steps": 4810, "loss": 0.3056, "lr": 4.6545561712731954e-05, "epoch": 1.262993762993763, "percentage": 25.26, "elapsed_time": "0:05:38", "remaining_time": "0:16:41", "throughput": 1445.51, "total_tokens": 489160} +{"current_steps": 1220, "total_steps": 4810, "loss": 0.2656, "lr": 4.649940913736841e-05, "epoch": 1.2681912681912682, "percentage": 25.36, "elapsed_time": "0:05:38", "remaining_time": "0:16:36", "throughput": 1449.79, "total_tokens": 491080} +{"current_steps": 1225, "total_steps": 4810, "loss": 0.2917, "lr": 4.645297349410005e-05, "epoch": 1.2733887733887734, "percentage": 25.47, "elapsed_time": "0:05:39", "remaining_time": "0:16:32", "throughput": 1454.25, "total_tokens": 493064} +{"current_steps": 1230, "total_steps": 4810, "loss": 0.2878, "lr": 4.640625539431298e-05, "epoch": 1.2785862785862787, "percentage": 25.57, "elapsed_time": "0:05:39", "remaining_time": "0:16:27", "throughput": 1458.51, "total_tokens": 494984} +{"current_steps": 1235, "total_steps": 4810, "loss": 0.2686, "lr": 4.635925545311224e-05, "epoch": 1.2837837837837838, "percentage": 25.68, "elapsed_time": "0:05:39", "remaining_time": "0:16:23", "throughput": 1462.97, "total_tokens": 496968} +{"current_steps": 1240, "total_steps": 4810, "loss": 0.2747, "lr": 4.6311974289313646e-05, "epoch": 1.288981288981289, "percentage": 25.78, "elapsed_time": "0:05:40", "remaining_time": "0:16:18", "throughput": 1467.03, "total_tokens": 498824} +{"current_steps": 1245, "total_steps": 4810, "loss": 0.2269, "lr": 4.6264412525435716e-05, "epoch": 1.2941787941787941, "percentage": 25.88, "elapsed_time": "0:05:40", "remaining_time": "0:16:14", "throughput": 1471.46, "total_tokens": 500808} +{"current_steps": 1250, "total_steps": 4810, "loss": 0.2595, "lr": 4.6216570787691423e-05, "epoch": 1.2993762993762994, "percentage": 25.99, "elapsed_time": "0:05:40", "remaining_time": "0:16:10", "throughput": 1476.07, "total_tokens": 502856} +{"current_steps": 1255, "total_steps": 4810, "loss": 0.2367, "lr": 4.6168449705979956e-05, "epoch": 1.3045738045738045, "percentage": 26.09, "elapsed_time": "0:05:40", "remaining_time": "0:16:05", "throughput": 1480.09, "total_tokens": 504712} +{"current_steps": 1260, "total_steps": 4810, "loss": 0.3177, "lr": 4.612004991387843e-05, "epoch": 1.3097713097713097, "percentage": 26.2, "elapsed_time": "0:05:41", "remaining_time": "0:16:01", "throughput": 1484.5, "total_tokens": 506696} +{"current_steps": 1265, "total_steps": 4810, "loss": 0.2562, "lr": 4.6071372048633566e-05, "epoch": 1.314968814968815, "percentage": 26.3, "elapsed_time": "0:05:41", "remaining_time": "0:15:57", "throughput": 1488.88, "total_tokens": 508680} +{"current_steps": 1270, "total_steps": 4810, "loss": 0.291, "lr": 4.6022416751153255e-05, "epoch": 1.32016632016632, "percentage": 26.4, "elapsed_time": "0:05:41", "remaining_time": "0:15:53", "throughput": 1493.46, "total_tokens": 510728} +{"current_steps": 1275, "total_steps": 4810, "loss": 0.2441, "lr": 4.5973184665998186e-05, "epoch": 1.3253638253638254, "percentage": 26.51, "elapsed_time": "0:05:42", "remaining_time": "0:15:49", "throughput": 1497.83, "total_tokens": 512712} +{"current_steps": 1280, "total_steps": 4810, "loss": 0.2674, "lr": 4.5923676441373287e-05, "epoch": 1.3305613305613306, "percentage": 26.61, "elapsed_time": "0:05:42", "remaining_time": "0:15:44", "throughput": 1502.2, "total_tokens": 514696} +{"current_steps": 1285, "total_steps": 4810, "loss": 0.2628, "lr": 4.5873892729119225e-05, "epoch": 1.3357588357588357, "percentage": 26.72, "elapsed_time": "0:05:42", "remaining_time": "0:15:40", "throughput": 1506.93, "total_tokens": 516808} +{"current_steps": 1290, "total_steps": 4810, "loss": 0.208, "lr": 4.582383418470386e-05, "epoch": 1.340956340956341, "percentage": 26.82, "elapsed_time": "0:05:43", "remaining_time": "0:15:36", "throughput": 1511.28, "total_tokens": 518792} +{"current_steps": 1295, "total_steps": 4810, "loss": 0.2791, "lr": 4.577350146721353e-05, "epoch": 1.3461538461538463, "percentage": 26.92, "elapsed_time": "0:05:43", "remaining_time": "0:15:32", "throughput": 1515.81, "total_tokens": 520840} +{"current_steps": 1300, "total_steps": 4810, "loss": 0.2367, "lr": 4.5722895239344435e-05, "epoch": 1.3513513513513513, "percentage": 27.03, "elapsed_time": "0:05:43", "remaining_time": "0:15:28", "throughput": 1519.95, "total_tokens": 522760} +{"current_steps": 1305, "total_steps": 4810, "loss": 0.2853, "lr": 4.567201616739393e-05, "epoch": 1.3565488565488566, "percentage": 27.13, "elapsed_time": "0:05:44", "remaining_time": "0:15:24", "throughput": 1524.65, "total_tokens": 524872} +{"current_steps": 1310, "total_steps": 4810, "loss": 0.2922, "lr": 4.562086492125167e-05, "epoch": 1.3617463617463619, "percentage": 27.23, "elapsed_time": "0:05:44", "remaining_time": "0:15:20", "throughput": 1529.15, "total_tokens": 526920} +{"current_steps": 1315, "total_steps": 4810, "loss": 0.2892, "lr": 4.556944217439088e-05, "epoch": 1.366943866943867, "percentage": 27.34, "elapsed_time": "0:05:44", "remaining_time": "0:15:16", "throughput": 1533.64, "total_tokens": 528968} +{"current_steps": 1320, "total_steps": 4810, "loss": 0.2689, "lr": 4.5517748603859435e-05, "epoch": 1.3721413721413722, "percentage": 27.44, "elapsed_time": "0:05:45", "remaining_time": "0:15:12", "throughput": 1537.76, "total_tokens": 530888} +{"current_steps": 1325, "total_steps": 4810, "loss": 0.2348, "lr": 4.546578489027095e-05, "epoch": 1.3773388773388773, "percentage": 27.55, "elapsed_time": "0:05:45", "remaining_time": "0:15:08", "throughput": 1542.06, "total_tokens": 532872} +{"current_steps": 1330, "total_steps": 4810, "loss": 0.2971, "lr": 4.541355171779582e-05, "epoch": 1.3825363825363826, "percentage": 27.65, "elapsed_time": "0:05:45", "remaining_time": "0:15:05", "throughput": 1546.54, "total_tokens": 534920} +{"current_steps": 1335, "total_steps": 4810, "loss": 0.2582, "lr": 4.5361049774152256e-05, "epoch": 1.3877338877338876, "percentage": 27.75, "elapsed_time": "0:05:46", "remaining_time": "0:15:01", "throughput": 1550.64, "total_tokens": 536840} +{"current_steps": 1340, "total_steps": 4810, "loss": 0.2788, "lr": 4.530827975059715e-05, "epoch": 1.392931392931393, "percentage": 27.86, "elapsed_time": "0:05:46", "remaining_time": "0:14:57", "throughput": 1554.74, "total_tokens": 538760} +{"current_steps": 1345, "total_steps": 4810, "loss": 0.2367, "lr": 4.5255242341917055e-05, "epoch": 1.3981288981288982, "percentage": 27.96, "elapsed_time": "0:05:46", "remaining_time": "0:14:53", "throughput": 1558.83, "total_tokens": 540680} +{"current_steps": 1350, "total_steps": 4810, "loss": 0.2864, "lr": 4.5201938246418976e-05, "epoch": 1.4033264033264032, "percentage": 28.07, "elapsed_time": "0:05:47", "remaining_time": "0:14:49", "throughput": 1563.09, "total_tokens": 542664} +{"current_steps": 1355, "total_steps": 4810, "loss": 0.1771, "lr": 4.51483681659212e-05, "epoch": 1.4085239085239085, "percentage": 28.17, "elapsed_time": "0:05:47", "remaining_time": "0:14:46", "throughput": 1567.53, "total_tokens": 544712} +{"current_steps": 1360, "total_steps": 4810, "loss": 0.3864, "lr": 4.509453280574407e-05, "epoch": 1.4137214137214138, "percentage": 28.27, "elapsed_time": "0:05:47", "remaining_time": "0:14:42", "throughput": 1572.14, "total_tokens": 546824} +{"current_steps": 1365, "total_steps": 4810, "loss": 0.2952, "lr": 4.504043287470068e-05, "epoch": 1.4189189189189189, "percentage": 28.38, "elapsed_time": "0:05:48", "remaining_time": "0:14:38", "throughput": 1576.74, "total_tokens": 548936} +{"current_steps": 1370, "total_steps": 4810, "loss": 0.3433, "lr": 4.498606908508754e-05, "epoch": 1.4241164241164241, "percentage": 28.48, "elapsed_time": "0:05:48", "remaining_time": "0:14:34", "throughput": 1580.97, "total_tokens": 550920} +{"current_steps": 1375, "total_steps": 4810, "loss": 0.2757, "lr": 4.4931442152675185e-05, "epoch": 1.4293139293139294, "percentage": 28.59, "elapsed_time": "0:05:48", "remaining_time": "0:14:31", "throughput": 1585.2, "total_tokens": 552904} +{"current_steps": 1380, "total_steps": 4810, "loss": 0.3025, "lr": 4.487655279669881e-05, "epoch": 1.4345114345114345, "percentage": 28.69, "elapsed_time": "0:05:49", "remaining_time": "0:14:27", "throughput": 1589.23, "total_tokens": 554824} +{"current_steps": 1385, "total_steps": 4810, "loss": 0.2663, "lr": 4.482140173984875e-05, "epoch": 1.4397089397089398, "percentage": 28.79, "elapsed_time": "0:05:49", "remaining_time": "0:14:24", "throughput": 1593.62, "total_tokens": 556872} +{"current_steps": 1390, "total_steps": 4810, "loss": 0.2717, "lr": 4.476598970826094e-05, "epoch": 1.444906444906445, "percentage": 28.9, "elapsed_time": "0:05:49", "remaining_time": "0:14:20", "throughput": 1598.18, "total_tokens": 558984} +{"current_steps": 1395, "total_steps": 4810, "loss": 0.2791, "lr": 4.4710317431507434e-05, "epoch": 1.45010395010395, "percentage": 29.0, "elapsed_time": "0:05:50", "remaining_time": "0:14:17", "throughput": 1602.37, "total_tokens": 560968} +{"current_steps": 1400, "total_steps": 4810, "loss": 0.2617, "lr": 4.465438564258673e-05, "epoch": 1.4553014553014554, "percentage": 29.11, "elapsed_time": "0:05:50", "remaining_time": "0:14:13", "throughput": 1606.56, "total_tokens": 562952} +{"current_steps": 1405, "total_steps": 4810, "loss": 0.2452, "lr": 4.4598195077914145e-05, "epoch": 1.4604989604989604, "percentage": 29.21, "elapsed_time": "0:05:50", "remaining_time": "0:14:10", "throughput": 1611.0, "total_tokens": 565064} +{"current_steps": 1410, "total_steps": 4810, "loss": 0.2761, "lr": 4.454174647731213e-05, "epoch": 1.4656964656964657, "percentage": 29.31, "elapsed_time": "0:05:51", "remaining_time": "0:14:06", "throughput": 1615.35, "total_tokens": 567112} +{"current_steps": 1415, "total_steps": 4810, "loss": 0.2875, "lr": 4.4485040584000514e-05, "epoch": 1.4708939708939708, "percentage": 29.42, "elapsed_time": "0:05:51", "remaining_time": "0:14:03", "throughput": 1619.69, "total_tokens": 569160} +{"current_steps": 1420, "total_steps": 4810, "loss": 0.2782, "lr": 4.442807814458672e-05, "epoch": 1.476091476091476, "percentage": 29.52, "elapsed_time": "0:05:51", "remaining_time": "0:13:59", "throughput": 1624.37, "total_tokens": 571336} +{"current_steps": 1425, "total_steps": 4810, "loss": 0.25, "lr": 4.437085990905591e-05, "epoch": 1.4812889812889813, "percentage": 29.63, "elapsed_time": "0:05:52", "remaining_time": "0:13:56", "throughput": 1628.69, "total_tokens": 573384} +{"current_steps": 1430, "total_steps": 4810, "loss": 0.2596, "lr": 4.431338663076119e-05, "epoch": 1.4864864864864864, "percentage": 29.73, "elapsed_time": "0:05:52", "remaining_time": "0:13:52", "throughput": 1632.65, "total_tokens": 575304} +{"current_steps": 1435, "total_steps": 4810, "loss": 0.2788, "lr": 4.4255659066413595e-05, "epoch": 1.4916839916839917, "percentage": 29.83, "elapsed_time": "0:05:52", "remaining_time": "0:13:49", "throughput": 1636.42, "total_tokens": 577160} +{"current_steps": 1440, "total_steps": 4810, "loss": 0.2892, "lr": 4.419767797607219e-05, "epoch": 1.496881496881497, "percentage": 29.94, "elapsed_time": "0:05:53", "remaining_time": "0:13:47", "throughput": 1638.89, "total_tokens": 579208} +{"current_steps": 1445, "total_steps": 4810, "loss": 0.2936, "lr": 4.413944412313405e-05, "epoch": 1.502079002079002, "percentage": 30.04, "elapsed_time": "0:05:53", "remaining_time": "0:13:43", "throughput": 1643.18, "total_tokens": 581256} +{"current_steps": 1446, "total_steps": 4810, "eval_loss": 0.25699949264526367, "epoch": 1.503118503118503, "percentage": 30.06, "elapsed_time": "0:05:55", "remaining_time": "0:13:46", "throughput": 1636.61, "total_tokens": 581704} +{"current_steps": 1450, "total_steps": 4810, "loss": 0.2702, "lr": 4.4080958274324155e-05, "epoch": 1.5072765072765073, "percentage": 30.15, "elapsed_time": "0:07:05", "remaining_time": "0:16:24", "throughput": 1372.36, "total_tokens": 583304} +{"current_steps": 1455, "total_steps": 4810, "loss": 0.2252, "lr": 4.40222211996854e-05, "epoch": 1.5124740124740126, "percentage": 30.25, "elapsed_time": "0:07:05", "remaining_time": "0:16:20", "throughput": 1375.81, "total_tokens": 585224} +{"current_steps": 1460, "total_steps": 4810, "loss": 0.4066, "lr": 4.396323367256836e-05, "epoch": 1.5176715176715176, "percentage": 30.35, "elapsed_time": "0:07:05", "remaining_time": "0:16:16", "throughput": 1379.55, "total_tokens": 587272} +{"current_steps": 1465, "total_steps": 4810, "loss": 0.2413, "lr": 4.390399646962117e-05, "epoch": 1.5228690228690227, "percentage": 30.46, "elapsed_time": "0:07:06", "remaining_time": "0:16:12", "throughput": 1383.28, "total_tokens": 589320} +{"current_steps": 1470, "total_steps": 4810, "loss": 0.2593, "lr": 4.384451037077924e-05, "epoch": 1.5280665280665282, "percentage": 30.56, "elapsed_time": "0:07:06", "remaining_time": "0:16:08", "throughput": 1386.86, "total_tokens": 591304} +{"current_steps": 1475, "total_steps": 4810, "loss": 0.2499, "lr": 4.378477615925505e-05, "epoch": 1.5332640332640333, "percentage": 30.67, "elapsed_time": "0:07:06", "remaining_time": "0:16:04", "throughput": 1390.27, "total_tokens": 593224} +{"current_steps": 1480, "total_steps": 4810, "loss": 0.2672, "lr": 4.372479462152781e-05, "epoch": 1.5384615384615383, "percentage": 30.77, "elapsed_time": "0:07:07", "remaining_time": "0:16:00", "throughput": 1394.12, "total_tokens": 595336} +{"current_steps": 1485, "total_steps": 4810, "loss": 0.2898, "lr": 4.366456654733308e-05, "epoch": 1.5436590436590436, "percentage": 30.87, "elapsed_time": "0:07:07", "remaining_time": "0:15:56", "throughput": 1397.52, "total_tokens": 597256} +{"current_steps": 1490, "total_steps": 4810, "loss": 0.2852, "lr": 4.360409272965242e-05, "epoch": 1.5488565488565489, "percentage": 30.98, "elapsed_time": "0:07:07", "remaining_time": "0:15:53", "throughput": 1401.21, "total_tokens": 599304} +{"current_steps": 1495, "total_steps": 4810, "loss": 0.2828, "lr": 4.3543373964702907e-05, "epoch": 1.554054054054054, "percentage": 31.08, "elapsed_time": "0:07:08", "remaining_time": "0:15:49", "throughput": 1404.74, "total_tokens": 601288} +{"current_steps": 1500, "total_steps": 4810, "loss": 0.2597, "lr": 4.348241105192668e-05, "epoch": 1.5592515592515592, "percentage": 31.19, "elapsed_time": "0:07:08", "remaining_time": "0:15:45", "throughput": 1408.27, "total_tokens": 603272} +{"current_steps": 1505, "total_steps": 4810, "loss": 0.2584, "lr": 4.34212047939804e-05, "epoch": 1.5644490644490645, "percentage": 31.29, "elapsed_time": "0:07:08", "remaining_time": "0:15:41", "throughput": 1411.8, "total_tokens": 605256} +{"current_steps": 1510, "total_steps": 4810, "loss": 0.2713, "lr": 4.335975599672469e-05, "epoch": 1.5696465696465696, "percentage": 31.39, "elapsed_time": "0:07:09", "remaining_time": "0:15:37", "throughput": 1415.48, "total_tokens": 607304} +{"current_steps": 1515, "total_steps": 4810, "loss": 0.2702, "lr": 4.329806546921353e-05, "epoch": 1.5748440748440748, "percentage": 31.5, "elapsed_time": "0:07:09", "remaining_time": "0:15:33", "throughput": 1418.85, "total_tokens": 609224} +{"current_steps": 1520, "total_steps": 4810, "loss": 0.2648, "lr": 4.323613402368357e-05, "epoch": 1.5800415800415801, "percentage": 31.6, "elapsed_time": "0:07:09", "remaining_time": "0:15:30", "throughput": 1422.67, "total_tokens": 611336} +{"current_steps": 1525, "total_steps": 4810, "loss": 0.2879, "lr": 4.317396247554347e-05, "epoch": 1.5852390852390852, "percentage": 31.7, "elapsed_time": "0:07:10", "remaining_time": "0:15:26", "throughput": 1426.18, "total_tokens": 613320} +{"current_steps": 1530, "total_steps": 4810, "loss": 0.2953, "lr": 4.311155164336318e-05, "epoch": 1.5904365904365905, "percentage": 31.81, "elapsed_time": "0:07:10", "remaining_time": "0:15:22", "throughput": 1429.38, "total_tokens": 615176} +{"current_steps": 1535, "total_steps": 4810, "loss": 0.2754, "lr": 4.3048902348863116e-05, "epoch": 1.5956340956340958, "percentage": 31.91, "elapsed_time": "0:07:10", "remaining_time": "0:15:18", "throughput": 1433.04, "total_tokens": 617224} +{"current_steps": 1540, "total_steps": 4810, "loss": 0.2785, "lr": 4.298601541690336e-05, "epoch": 1.6008316008316008, "percentage": 32.02, "elapsed_time": "0:07:11", "remaining_time": "0:15:15", "throughput": 1436.53, "total_tokens": 619208} +{"current_steps": 1545, "total_steps": 4810, "loss": 0.278, "lr": 4.292289167547281e-05, "epoch": 1.6060291060291059, "percentage": 32.12, "elapsed_time": "0:07:11", "remaining_time": "0:15:11", "throughput": 1440.02, "total_tokens": 621192} +{"current_steps": 1550, "total_steps": 4810, "loss": 0.2618, "lr": 4.285953195567827e-05, "epoch": 1.6112266112266114, "percentage": 32.22, "elapsed_time": "0:07:11", "remaining_time": "0:15:07", "throughput": 1443.5, "total_tokens": 623176} +{"current_steps": 1555, "total_steps": 4810, "loss": 0.2506, "lr": 4.2795937091733515e-05, "epoch": 1.6164241164241164, "percentage": 32.33, "elapsed_time": "0:07:12", "remaining_time": "0:15:04", "throughput": 1446.97, "total_tokens": 625160} +{"current_steps": 1560, "total_steps": 4810, "loss": 0.3095, "lr": 4.27321079209483e-05, "epoch": 1.6216216216216215, "percentage": 32.43, "elapsed_time": "0:07:12", "remaining_time": "0:15:00", "throughput": 1450.45, "total_tokens": 627144} +{"current_steps": 1565, "total_steps": 4810, "loss": 0.2951, "lr": 4.266804528371732e-05, "epoch": 1.6268191268191268, "percentage": 32.54, "elapsed_time": "0:07:12", "remaining_time": "0:14:57", "throughput": 1454.07, "total_tokens": 629192} +{"current_steps": 1570, "total_steps": 4810, "loss": 0.2796, "lr": 4.260375002350917e-05, "epoch": 1.632016632016632, "percentage": 32.64, "elapsed_time": "0:07:13", "remaining_time": "0:14:53", "throughput": 1457.68, "total_tokens": 631240} +{"current_steps": 1575, "total_steps": 4810, "loss": 0.2407, "lr": 4.253922298685525e-05, "epoch": 1.637214137214137, "percentage": 32.74, "elapsed_time": "0:07:13", "remaining_time": "0:14:50", "throughput": 1461.14, "total_tokens": 633224} +{"current_steps": 1580, "total_steps": 4810, "loss": 0.2386, "lr": 4.247446502333858e-05, "epoch": 1.6424116424116424, "percentage": 32.85, "elapsed_time": "0:07:13", "remaining_time": "0:14:46", "throughput": 1464.6, "total_tokens": 635208} +{"current_steps": 1585, "total_steps": 4810, "loss": 0.2872, "lr": 4.2409476985582644e-05, "epoch": 1.6476091476091477, "percentage": 32.95, "elapsed_time": "0:07:14", "remaining_time": "0:14:43", "throughput": 1468.2, "total_tokens": 637256} +{"current_steps": 1590, "total_steps": 4810, "loss": 0.2806, "lr": 4.234425972924014e-05, "epoch": 1.6528066528066527, "percentage": 33.06, "elapsed_time": "0:07:14", "remaining_time": "0:14:39", "throughput": 1471.5, "total_tokens": 639176} +{"current_steps": 1595, "total_steps": 4810, "loss": 0.2715, "lr": 4.227881411298175e-05, "epoch": 1.658004158004158, "percentage": 33.16, "elapsed_time": "0:07:14", "remaining_time": "0:14:36", "throughput": 1475.08, "total_tokens": 641224} +{"current_steps": 1600, "total_steps": 4810, "loss": 0.2872, "lr": 4.221314099848481e-05, "epoch": 1.6632016632016633, "percentage": 33.26, "elapsed_time": "0:07:15", "remaining_time": "0:14:32", "throughput": 1478.37, "total_tokens": 643144} +{"current_steps": 1605, "total_steps": 4810, "loss": 0.2204, "lr": 4.2147241250421944e-05, "epoch": 1.6683991683991684, "percentage": 33.37, "elapsed_time": "0:07:15", "remaining_time": "0:14:29", "throughput": 1481.35, "total_tokens": 644936} +{"current_steps": 1610, "total_steps": 4810, "loss": 0.2557, "lr": 4.208111573644975e-05, "epoch": 1.6735966735966736, "percentage": 33.47, "elapsed_time": "0:07:15", "remaining_time": "0:14:25", "throughput": 1484.92, "total_tokens": 646984} +{"current_steps": 1615, "total_steps": 4810, "loss": 0.2777, "lr": 4.201476532719728e-05, "epoch": 1.678794178794179, "percentage": 33.58, "elapsed_time": "0:07:16", "remaining_time": "0:14:22", "throughput": 1488.49, "total_tokens": 649032} +{"current_steps": 1620, "total_steps": 4810, "loss": 0.2778, "lr": 4.194819089625466e-05, "epoch": 1.683991683991684, "percentage": 33.68, "elapsed_time": "0:07:16", "remaining_time": "0:14:19", "throughput": 1492.05, "total_tokens": 651080} +{"current_steps": 1625, "total_steps": 4810, "loss": 0.2953, "lr": 4.188139332016154e-05, "epoch": 1.689189189189189, "percentage": 33.78, "elapsed_time": "0:07:16", "remaining_time": "0:14:15", "throughput": 1495.31, "total_tokens": 653000} +{"current_steps": 1630, "total_steps": 4810, "loss": 0.2955, "lr": 4.1814373478395586e-05, "epoch": 1.6943866943866945, "percentage": 33.89, "elapsed_time": "0:07:17", "remaining_time": "0:14:12", "throughput": 1498.56, "total_tokens": 654920} +{"current_steps": 1635, "total_steps": 4810, "loss": 0.2599, "lr": 4.174713225336086e-05, "epoch": 1.6995841995841996, "percentage": 33.99, "elapsed_time": "0:07:17", "remaining_time": "0:14:09", "throughput": 1501.95, "total_tokens": 656904} +{"current_steps": 1640, "total_steps": 4810, "loss": 0.2986, "lr": 4.1679670530376244e-05, "epoch": 1.7047817047817047, "percentage": 34.1, "elapsed_time": "0:07:17", "remaining_time": "0:14:06", "throughput": 1505.49, "total_tokens": 658952} +{"current_steps": 1645, "total_steps": 4810, "loss": 0.264, "lr": 4.161198919766375e-05, "epoch": 1.70997920997921, "percentage": 34.2, "elapsed_time": "0:07:18", "remaining_time": "0:14:02", "throughput": 1508.73, "total_tokens": 660872} +{"current_steps": 1650, "total_steps": 4810, "loss": 0.2337, "lr": 4.154408914633685e-05, "epoch": 1.7151767151767152, "percentage": 34.3, "elapsed_time": "0:07:18", "remaining_time": "0:13:59", "throughput": 1512.11, "total_tokens": 662856} +{"current_steps": 1655, "total_steps": 4810, "loss": 0.2968, "lr": 4.147597127038873e-05, "epoch": 1.7203742203742203, "percentage": 34.41, "elapsed_time": "0:07:18", "remaining_time": "0:13:56", "throughput": 1515.63, "total_tokens": 664904} +{"current_steps": 1660, "total_steps": 4810, "loss": 0.2433, "lr": 4.140763646668052e-05, "epoch": 1.7255717255717256, "percentage": 34.51, "elapsed_time": "0:07:19", "remaining_time": "0:13:53", "throughput": 1518.99, "total_tokens": 666888} +{"current_steps": 1665, "total_steps": 4810, "loss": 0.3127, "lr": 4.1339085634929485e-05, "epoch": 1.7307692307692308, "percentage": 34.62, "elapsed_time": "0:07:19", "remaining_time": "0:13:49", "throughput": 1522.51, "total_tokens": 668936} +{"current_steps": 1670, "total_steps": 4810, "loss": 0.2454, "lr": 4.12703196776972e-05, "epoch": 1.735966735966736, "percentage": 34.72, "elapsed_time": "0:07:19", "remaining_time": "0:13:46", "throughput": 1525.72, "total_tokens": 670856} +{"current_steps": 1675, "total_steps": 4810, "loss": 0.3639, "lr": 4.120133950037763e-05, "epoch": 1.7411642411642412, "percentage": 34.82, "elapsed_time": "0:07:20", "remaining_time": "0:13:43", "throughput": 1529.07, "total_tokens": 672840} +{"current_steps": 1680, "total_steps": 4810, "loss": 0.2468, "lr": 4.113214601118524e-05, "epoch": 1.7463617463617465, "percentage": 34.93, "elapsed_time": "0:07:20", "remaining_time": "0:13:40", "throughput": 1532.42, "total_tokens": 674824} +{"current_steps": 1685, "total_steps": 4810, "loss": 0.2705, "lr": 4.1062740121143016e-05, "epoch": 1.7515592515592515, "percentage": 35.03, "elapsed_time": "0:07:20", "remaining_time": "0:13:37", "throughput": 1535.76, "total_tokens": 676808} +{"current_steps": 1687, "total_steps": 4810, "eval_loss": 0.25601524114608765, "epoch": 1.7536382536382535, "percentage": 35.07, "elapsed_time": "0:07:21", "remaining_time": "0:13:38", "throughput": 1533.39, "total_tokens": 677576} +{"current_steps": 1690, "total_steps": 4810, "loss": 0.2969, "lr": 4.099312274407048e-05, "epoch": 1.7567567567567568, "percentage": 35.14, "elapsed_time": "0:08:12", "remaining_time": "0:15:10", "throughput": 1376.94, "total_tokens": 678728} +{"current_steps": 1695, "total_steps": 4810, "loss": 0.2874, "lr": 4.0923294796571676e-05, "epoch": 1.761954261954262, "percentage": 35.24, "elapsed_time": "0:08:13", "remaining_time": "0:15:06", "throughput": 1380.18, "total_tokens": 680776} +{"current_steps": 1700, "total_steps": 4810, "loss": 0.2651, "lr": 4.085325719802307e-05, "epoch": 1.7671517671517671, "percentage": 35.34, "elapsed_time": "0:08:13", "remaining_time": "0:15:02", "throughput": 1383.8, "total_tokens": 683016} +{"current_steps": 1705, "total_steps": 4810, "loss": 0.2924, "lr": 4.078301087056144e-05, "epoch": 1.7723492723492722, "percentage": 35.45, "elapsed_time": "0:08:13", "remaining_time": "0:14:59", "throughput": 1387.41, "total_tokens": 685256} +{"current_steps": 1710, "total_steps": 4810, "loss": 0.2762, "lr": 4.0712556739071795e-05, "epoch": 1.7775467775467777, "percentage": 35.55, "elapsed_time": "0:08:14", "remaining_time": "0:14:55", "throughput": 1390.63, "total_tokens": 687304} +{"current_steps": 1715, "total_steps": 4810, "loss": 0.2888, "lr": 4.064189573117512e-05, "epoch": 1.7827442827442828, "percentage": 35.65, "elapsed_time": "0:08:14", "remaining_time": "0:14:52", "throughput": 1393.59, "total_tokens": 689224} +{"current_steps": 1720, "total_steps": 4810, "loss": 0.2282, "lr": 4.0571028777216214e-05, "epoch": 1.7879417879417878, "percentage": 35.76, "elapsed_time": "0:08:14", "remaining_time": "0:14:49", "throughput": 1397.04, "total_tokens": 691400} +{"current_steps": 1725, "total_steps": 4810, "loss": 0.187, "lr": 4.049995681025143e-05, "epoch": 1.793139293139293, "percentage": 35.86, "elapsed_time": "0:08:15", "remaining_time": "0:14:45", "throughput": 1400.0, "total_tokens": 693320} +{"current_steps": 1730, "total_steps": 4810, "loss": 0.4406, "lr": 4.0428680766036384e-05, "epoch": 1.7983367983367984, "percentage": 35.97, "elapsed_time": "0:08:15", "remaining_time": "0:14:42", "throughput": 1403.34, "total_tokens": 695432} +{"current_steps": 1735, "total_steps": 4810, "loss": 0.3552, "lr": 4.035720158301363e-05, "epoch": 1.8035343035343034, "percentage": 36.07, "elapsed_time": "0:08:15", "remaining_time": "0:14:38", "throughput": 1406.67, "total_tokens": 697544} +{"current_steps": 1740, "total_steps": 4810, "loss": 0.3263, "lr": 4.028552020230031e-05, "epoch": 1.8087318087318087, "percentage": 36.17, "elapsed_time": "0:08:16", "remaining_time": "0:14:35", "throughput": 1409.87, "total_tokens": 699592} +{"current_steps": 1745, "total_steps": 4810, "loss": 0.2859, "lr": 4.0213637567675774e-05, "epoch": 1.813929313929314, "percentage": 36.28, "elapsed_time": "0:08:16", "remaining_time": "0:14:32", "throughput": 1412.94, "total_tokens": 701576} +{"current_steps": 1750, "total_steps": 4810, "loss": 0.2657, "lr": 4.0141554625569125e-05, "epoch": 1.819126819126819, "percentage": 36.38, "elapsed_time": "0:08:16", "remaining_time": "0:14:28", "throughput": 1416.26, "total_tokens": 703688} +{"current_steps": 1755, "total_steps": 4810, "loss": 0.2842, "lr": 4.0069272325046816e-05, "epoch": 1.8243243243243243, "percentage": 36.49, "elapsed_time": "0:08:17", "remaining_time": "0:14:25", "throughput": 1419.45, "total_tokens": 705736} +{"current_steps": 1760, "total_steps": 4810, "loss": 0.2479, "lr": 3.999679161780005e-05, "epoch": 1.8295218295218296, "percentage": 36.59, "elapsed_time": "0:08:17", "remaining_time": "0:14:22", "throughput": 1422.51, "total_tokens": 707720} +{"current_steps": 1765, "total_steps": 4810, "loss": 0.3132, "lr": 3.99241134581324e-05, "epoch": 1.8347193347193347, "percentage": 36.69, "elapsed_time": "0:08:17", "remaining_time": "0:14:18", "throughput": 1425.94, "total_tokens": 709896} +{"current_steps": 1770, "total_steps": 4810, "loss": 0.2661, "lr": 3.985123880294708e-05, "epoch": 1.83991683991684, "percentage": 36.8, "elapsed_time": "0:08:18", "remaining_time": "0:14:15", "throughput": 1429.13, "total_tokens": 711944} +{"current_steps": 1775, "total_steps": 4810, "loss": 0.2664, "lr": 3.9778168611734456e-05, "epoch": 1.8451143451143452, "percentage": 36.9, "elapsed_time": "0:08:18", "remaining_time": "0:14:12", "throughput": 1432.3, "total_tokens": 713992} +{"current_steps": 1780, "total_steps": 4810, "loss": 0.2443, "lr": 3.970490384655939e-05, "epoch": 1.8503118503118503, "percentage": 37.01, "elapsed_time": "0:08:18", "remaining_time": "0:14:09", "throughput": 1435.35, "total_tokens": 715976} +{"current_steps": 1785, "total_steps": 4810, "loss": 0.2659, "lr": 3.963144547204856e-05, "epoch": 1.8555093555093554, "percentage": 37.11, "elapsed_time": "0:08:19", "remaining_time": "0:14:05", "throughput": 1438.53, "total_tokens": 718024} +{"current_steps": 1790, "total_steps": 4810, "loss": 0.2441, "lr": 3.955779445537776e-05, "epoch": 1.8607068607068609, "percentage": 37.21, "elapsed_time": "0:08:19", "remaining_time": "0:14:02", "throughput": 1441.69, "total_tokens": 720072} +{"current_steps": 1795, "total_steps": 4810, "loss": 0.279, "lr": 3.948395176625918e-05, "epoch": 1.865904365904366, "percentage": 37.32, "elapsed_time": "0:08:19", "remaining_time": "0:13:59", "throughput": 1444.85, "total_tokens": 722120} +{"current_steps": 1800, "total_steps": 4810, "loss": 0.2851, "lr": 3.9409918376928604e-05, "epoch": 1.871101871101871, "percentage": 37.42, "elapsed_time": "0:08:20", "remaining_time": "0:13:56", "throughput": 1448.02, "total_tokens": 724168} +{"current_steps": 1805, "total_steps": 4810, "loss": 0.2928, "lr": 3.933569526213268e-05, "epoch": 1.8762993762993763, "percentage": 37.53, "elapsed_time": "0:08:20", "remaining_time": "0:13:53", "throughput": 1451.3, "total_tokens": 726280} +{"current_steps": 1810, "total_steps": 4810, "loss": 0.2677, "lr": 3.926128339911599e-05, "epoch": 1.8814968814968815, "percentage": 37.63, "elapsed_time": "0:08:20", "remaining_time": "0:13:49", "throughput": 1454.33, "total_tokens": 728264} +{"current_steps": 1815, "total_steps": 4810, "loss": 0.2924, "lr": 3.918668376760827e-05, "epoch": 1.8866943866943866, "percentage": 37.73, "elapsed_time": "0:08:21", "remaining_time": "0:13:46", "throughput": 1457.48, "total_tokens": 730312} +{"current_steps": 1820, "total_steps": 4810, "loss": 0.2771, "lr": 3.9111897349811454e-05, "epoch": 1.8918918918918919, "percentage": 37.84, "elapsed_time": "0:08:21", "remaining_time": "0:13:43", "throughput": 1460.5, "total_tokens": 732296} +{"current_steps": 1825, "total_steps": 4810, "loss": 0.2412, "lr": 3.903692513038677e-05, "epoch": 1.8970893970893972, "percentage": 37.94, "elapsed_time": "0:08:21", "remaining_time": "0:13:40", "throughput": 1463.12, "total_tokens": 734088} +{"current_steps": 1830, "total_steps": 4810, "loss": 0.2897, "lr": 3.896176809644178e-05, "epoch": 1.9022869022869022, "percentage": 38.05, "elapsed_time": "0:08:22", "remaining_time": "0:13:37", "throughput": 1465.63, "total_tokens": 736072} +{"current_steps": 1835, "total_steps": 4810, "loss": 0.3063, "lr": 3.8886427237517344e-05, "epoch": 1.9074844074844075, "percentage": 38.15, "elapsed_time": "0:08:22", "remaining_time": "0:13:34", "throughput": 1468.76, "total_tokens": 738120} +{"current_steps": 1840, "total_steps": 4810, "loss": 0.3038, "lr": 3.881090354557463e-05, "epoch": 1.9126819126819128, "percentage": 38.25, "elapsed_time": "0:08:22", "remaining_time": "0:13:31", "throughput": 1471.89, "total_tokens": 740168} +{"current_steps": 1845, "total_steps": 4810, "loss": 0.2716, "lr": 3.8735198014982064e-05, "epoch": 1.9178794178794178, "percentage": 38.36, "elapsed_time": "0:08:23", "remaining_time": "0:13:28", "throughput": 1475.14, "total_tokens": 742280} +{"current_steps": 1850, "total_steps": 4810, "loss": 0.2834, "lr": 3.865931164250219e-05, "epoch": 1.9230769230769231, "percentage": 38.46, "elapsed_time": "0:08:23", "remaining_time": "0:13:25", "throughput": 1478.14, "total_tokens": 744328} +{"current_steps": 1855, "total_steps": 4810, "loss": 0.2845, "lr": 3.8583245427278584e-05, "epoch": 1.9282744282744284, "percentage": 38.57, "elapsed_time": "0:08:23", "remaining_time": "0:13:22", "throughput": 1481.39, "total_tokens": 746440} +{"current_steps": 1860, "total_steps": 4810, "loss": 0.3004, "lr": 3.850700037082268e-05, "epoch": 1.9334719334719335, "percentage": 38.67, "elapsed_time": "0:08:24", "remaining_time": "0:13:19", "throughput": 1484.5, "total_tokens": 748488} +{"current_steps": 1865, "total_steps": 4810, "loss": 0.2696, "lr": 3.8430577477000595e-05, "epoch": 1.9386694386694385, "percentage": 38.77, "elapsed_time": "0:08:24", "remaining_time": "0:13:16", "throughput": 1487.23, "total_tokens": 750344} +{"current_steps": 1870, "total_steps": 4810, "loss": 0.2567, "lr": 3.835397775201991e-05, "epoch": 1.943866943866944, "percentage": 38.88, "elapsed_time": "0:08:24", "remaining_time": "0:13:13", "throughput": 1490.21, "total_tokens": 752328} +{"current_steps": 1875, "total_steps": 4810, "loss": 0.269, "lr": 3.827720220441642e-05, "epoch": 1.949064449064449, "percentage": 38.98, "elapsed_time": "0:08:25", "remaining_time": "0:13:10", "throughput": 1493.19, "total_tokens": 754312} +{"current_steps": 1880, "total_steps": 4810, "loss": 0.2816, "lr": 3.8200251845040855e-05, "epoch": 1.9542619542619541, "percentage": 39.09, "elapsed_time": "0:08:25", "remaining_time": "0:13:07", "throughput": 1496.03, "total_tokens": 756232} +{"current_steps": 1885, "total_steps": 4810, "loss": 0.2706, "lr": 3.812312768704557e-05, "epoch": 1.9594594594594594, "percentage": 39.19, "elapsed_time": "0:08:25", "remaining_time": "0:13:04", "throughput": 1499.12, "total_tokens": 758280} +{"current_steps": 1890, "total_steps": 4810, "loss": 0.2412, "lr": 3.8045830745871195e-05, "epoch": 1.9646569646569647, "percentage": 39.29, "elapsed_time": "0:08:26", "remaining_time": "0:13:01", "throughput": 1502.21, "total_tokens": 760328} +{"current_steps": 1895, "total_steps": 4810, "loss": 0.2593, "lr": 3.7968362039233316e-05, "epoch": 1.9698544698544698, "percentage": 39.4, "elapsed_time": "0:08:26", "remaining_time": "0:12:59", "throughput": 1505.04, "total_tokens": 762248} +{"current_steps": 1900, "total_steps": 4810, "loss": 0.2765, "lr": 3.789072258710898e-05, "epoch": 1.975051975051975, "percentage": 39.5, "elapsed_time": "0:08:26", "remaining_time": "0:12:56", "throughput": 1507.87, "total_tokens": 764168} +{"current_steps": 1905, "total_steps": 4810, "loss": 0.2703, "lr": 3.781291341172338e-05, "epoch": 1.9802494802494803, "percentage": 39.6, "elapsed_time": "0:08:27", "remaining_time": "0:12:53", "throughput": 1510.95, "total_tokens": 766216} +{"current_steps": 1910, "total_steps": 4810, "loss": 0.2418, "lr": 3.7734935537536276e-05, "epoch": 1.9854469854469854, "percentage": 39.71, "elapsed_time": "0:08:27", "remaining_time": "0:12:50", "throughput": 1514.02, "total_tokens": 768264} +{"current_steps": 1915, "total_steps": 4810, "loss": 0.2502, "lr": 3.7656789991228636e-05, "epoch": 1.9906444906444907, "percentage": 39.81, "elapsed_time": "0:08:27", "remaining_time": "0:12:47", "throughput": 1516.84, "total_tokens": 770184} +{"current_steps": 1920, "total_steps": 4810, "loss": 0.2432, "lr": 3.7578477801689e-05, "epoch": 1.995841995841996, "percentage": 39.92, "elapsed_time": "0:08:28", "remaining_time": "0:12:44", "throughput": 1519.78, "total_tokens": 772168} +{"current_steps": 1925, "total_steps": 4810, "loss": 0.2243, "lr": 3.7500000000000003e-05, "epoch": 2.001039501039501, "percentage": 40.02, "elapsed_time": "0:08:28", "remaining_time": "0:12:42", "throughput": 1522.47, "total_tokens": 774160} +{"current_steps": 1928, "total_steps": 4810, "eval_loss": 0.2575376331806183, "epoch": 2.004158004158004, "percentage": 40.08, "elapsed_time": "0:08:29", "remaining_time": "0:12:41", "throughput": 1521.1, "total_tokens": 775312} +{"current_steps": 1930, "total_steps": 4810, "loss": 0.26, "lr": 3.742135761942479e-05, "epoch": 2.006237006237006, "percentage": 40.12, "elapsed_time": "0:09:37", "remaining_time": "0:14:21", "throughput": 1344.97, "total_tokens": 776144} +{"current_steps": 1935, "total_steps": 4810, "loss": 0.2814, "lr": 3.734255169539337e-05, "epoch": 2.0114345114345116, "percentage": 40.23, "elapsed_time": "0:09:37", "remaining_time": "0:14:17", "throughput": 1347.66, "total_tokens": 778128} +{"current_steps": 1940, "total_steps": 4810, "loss": 0.2911, "lr": 3.7263583265489074e-05, "epoch": 2.0166320166320166, "percentage": 40.33, "elapsed_time": "0:09:37", "remaining_time": "0:14:14", "throughput": 1350.46, "total_tokens": 780176} +{"current_steps": 1945, "total_steps": 4810, "loss": 0.2723, "lr": 3.718445336943478e-05, "epoch": 2.0218295218295217, "percentage": 40.44, "elapsed_time": "0:09:38", "remaining_time": "0:14:11", "throughput": 1353.14, "total_tokens": 782160} +{"current_steps": 1950, "total_steps": 4810, "loss": 0.3159, "lr": 3.710516304907931e-05, "epoch": 2.027027027027027, "percentage": 40.54, "elapsed_time": "0:09:38", "remaining_time": "0:14:08", "throughput": 1355.92, "total_tokens": 784208} +{"current_steps": 1955, "total_steps": 4810, "loss": 0.2713, "lr": 3.702571334838365e-05, "epoch": 2.0322245322245323, "percentage": 40.64, "elapsed_time": "0:09:38", "remaining_time": "0:14:05", "throughput": 1358.71, "total_tokens": 786256} +{"current_steps": 1960, "total_steps": 4810, "loss": 0.2491, "lr": 3.694610531340729e-05, "epoch": 2.0374220374220373, "percentage": 40.75, "elapsed_time": "0:09:38", "remaining_time": "0:14:01", "throughput": 1361.39, "total_tokens": 788240} +{"current_steps": 1965, "total_steps": 4810, "loss": 0.2663, "lr": 3.6866339992294344e-05, "epoch": 2.042619542619543, "percentage": 40.85, "elapsed_time": "0:09:39", "remaining_time": "0:13:58", "throughput": 1364.18, "total_tokens": 790288} +{"current_steps": 1970, "total_steps": 4810, "loss": 0.2681, "lr": 3.6786418435259854e-05, "epoch": 2.047817047817048, "percentage": 40.96, "elapsed_time": "0:09:39", "remaining_time": "0:13:55", "throughput": 1366.85, "total_tokens": 792272} +{"current_steps": 1975, "total_steps": 4810, "loss": 0.2757, "lr": 3.670634169457587e-05, "epoch": 2.053014553014553, "percentage": 41.06, "elapsed_time": "0:09:39", "remaining_time": "0:13:52", "throughput": 1369.73, "total_tokens": 794384} +{"current_steps": 1980, "total_steps": 4810, "loss": 0.2727, "lr": 3.662611082455766e-05, "epoch": 2.0582120582120584, "percentage": 41.16, "elapsed_time": "0:09:40", "remaining_time": "0:13:49", "throughput": 1372.4, "total_tokens": 796368} +{"current_steps": 1985, "total_steps": 4810, "loss": 0.2711, "lr": 3.654572688154979e-05, "epoch": 2.0634095634095635, "percentage": 41.27, "elapsed_time": "0:09:40", "remaining_time": "0:13:46", "throughput": 1375.28, "total_tokens": 798480} +{"current_steps": 1990, "total_steps": 4810, "loss": 0.2843, "lr": 3.646519092391227e-05, "epoch": 2.0686070686070686, "percentage": 41.37, "elapsed_time": "0:09:40", "remaining_time": "0:13:43", "throughput": 1378.04, "total_tokens": 800528} +{"current_steps": 1995, "total_steps": 4810, "loss": 0.2917, "lr": 3.6384504012006544e-05, "epoch": 2.0738045738045736, "percentage": 41.48, "elapsed_time": "0:09:41", "remaining_time": "0:13:40", "throughput": 1381.13, "total_tokens": 802768} +{"current_steps": 2000, "total_steps": 4810, "loss": 0.2846, "lr": 3.6303667208181575e-05, "epoch": 2.079002079002079, "percentage": 41.58, "elapsed_time": "0:09:41", "remaining_time": "0:13:37", "throughput": 1383.78, "total_tokens": 804752} +{"current_steps": 2005, "total_steps": 4810, "loss": 0.2932, "lr": 3.622268157675986e-05, "epoch": 2.084199584199584, "percentage": 41.68, "elapsed_time": "0:09:41", "remaining_time": "0:13:34", "throughput": 1386.32, "total_tokens": 806672} +{"current_steps": 2010, "total_steps": 4810, "loss": 0.2602, "lr": 3.614154818402339e-05, "epoch": 2.0893970893970892, "percentage": 41.79, "elapsed_time": "0:09:42", "remaining_time": "0:13:31", "throughput": 1388.97, "total_tokens": 808656} +{"current_steps": 2015, "total_steps": 4810, "loss": 0.2402, "lr": 3.606026809819966e-05, "epoch": 2.0945945945945947, "percentage": 41.89, "elapsed_time": "0:09:42", "remaining_time": "0:13:28", "throughput": 1391.62, "total_tokens": 810640} +{"current_steps": 2020, "total_steps": 4810, "loss": 0.2832, "lr": 3.597884238944752e-05, "epoch": 2.0997920997921, "percentage": 42.0, "elapsed_time": "0:09:42", "remaining_time": "0:13:25", "throughput": 1394.37, "total_tokens": 812688} +{"current_steps": 2025, "total_steps": 4810, "loss": 0.262, "lr": 3.5897272129843194e-05, "epoch": 2.104989604989605, "percentage": 42.1, "elapsed_time": "0:09:43", "remaining_time": "0:13:22", "throughput": 1397.22, "total_tokens": 814800} +{"current_steps": 2030, "total_steps": 4810, "loss": 0.2348, "lr": 3.581555839336606e-05, "epoch": 2.1101871101871104, "percentage": 42.2, "elapsed_time": "0:09:43", "remaining_time": "0:13:19", "throughput": 1400.07, "total_tokens": 816912} +{"current_steps": 2035, "total_steps": 4810, "loss": 0.2981, "lr": 3.57337022558846e-05, "epoch": 2.1153846153846154, "percentage": 42.31, "elapsed_time": "0:09:43", "remaining_time": "0:13:16", "throughput": 1402.7, "total_tokens": 818896} +{"current_steps": 2040, "total_steps": 4810, "loss": 0.2857, "lr": 3.565170479514214e-05, "epoch": 2.1205821205821205, "percentage": 42.41, "elapsed_time": "0:09:44", "remaining_time": "0:13:13", "throughput": 1405.33, "total_tokens": 820880} +{"current_steps": 2045, "total_steps": 4810, "loss": 0.2745, "lr": 3.5569567090742764e-05, "epoch": 2.125779625779626, "percentage": 42.52, "elapsed_time": "0:09:44", "remaining_time": "0:13:10", "throughput": 1407.96, "total_tokens": 822864} +{"current_steps": 2050, "total_steps": 4810, "loss": 0.2705, "lr": 3.548729022413701e-05, "epoch": 2.130977130977131, "percentage": 42.62, "elapsed_time": "0:09:44", "remaining_time": "0:13:07", "throughput": 1410.91, "total_tokens": 825040} +{"current_steps": 2055, "total_steps": 4810, "loss": 0.2397, "lr": 3.540487527860769e-05, "epoch": 2.136174636174636, "percentage": 42.72, "elapsed_time": "0:09:45", "remaining_time": "0:13:04", "throughput": 1413.53, "total_tokens": 827024} +{"current_steps": 2060, "total_steps": 4810, "loss": 0.2921, "lr": 3.53223233392556e-05, "epoch": 2.141372141372141, "percentage": 42.83, "elapsed_time": "0:09:45", "remaining_time": "0:13:01", "throughput": 1416.36, "total_tokens": 829136} +{"current_steps": 2065, "total_steps": 4810, "loss": 0.274, "lr": 3.523963549298525e-05, "epoch": 2.1465696465696467, "percentage": 42.93, "elapsed_time": "0:09:45", "remaining_time": "0:12:58", "throughput": 1419.08, "total_tokens": 831184} +{"current_steps": 2070, "total_steps": 4810, "loss": 0.3599, "lr": 3.51568128284905e-05, "epoch": 2.1517671517671517, "percentage": 43.04, "elapsed_time": "0:09:46", "remaining_time": "0:12:55", "throughput": 1421.69, "total_tokens": 833168} +{"current_steps": 2075, "total_steps": 4810, "loss": 0.2991, "lr": 3.5073856436240334e-05, "epoch": 2.156964656964657, "percentage": 43.14, "elapsed_time": "0:09:46", "remaining_time": "0:12:52", "throughput": 1424.41, "total_tokens": 835216} +{"current_steps": 2080, "total_steps": 4810, "loss": 0.2711, "lr": 3.499076740846438e-05, "epoch": 2.1621621621621623, "percentage": 43.24, "elapsed_time": "0:09:46", "remaining_time": "0:12:50", "throughput": 1426.91, "total_tokens": 837136} +{"current_steps": 2085, "total_steps": 4810, "loss": 0.263, "lr": 3.490754683913863e-05, "epoch": 2.1673596673596673, "percentage": 43.35, "elapsed_time": "0:09:46", "remaining_time": "0:12:47", "throughput": 1429.51, "total_tokens": 839120} +{"current_steps": 2090, "total_steps": 4810, "loss": 0.2114, "lr": 3.482419582397095e-05, "epoch": 2.1725571725571724, "percentage": 43.45, "elapsed_time": "0:09:47", "remaining_time": "0:12:44", "throughput": 1432.12, "total_tokens": 841104} +{"current_steps": 2095, "total_steps": 4810, "loss": 0.3437, "lr": 3.474071546038673e-05, "epoch": 2.177754677754678, "percentage": 43.56, "elapsed_time": "0:09:47", "remaining_time": "0:12:41", "throughput": 1434.83, "total_tokens": 843152} +{"current_steps": 2100, "total_steps": 4810, "loss": 0.2665, "lr": 3.46571068475144e-05, "epoch": 2.182952182952183, "percentage": 43.66, "elapsed_time": "0:09:47", "remaining_time": "0:12:38", "throughput": 1437.42, "total_tokens": 845136} +{"current_steps": 2105, "total_steps": 4810, "loss": 0.2736, "lr": 3.4573371086170936e-05, "epoch": 2.188149688149688, "percentage": 43.76, "elapsed_time": "0:09:48", "remaining_time": "0:12:35", "throughput": 1440.01, "total_tokens": 847120} +{"current_steps": 2110, "total_steps": 4810, "loss": 0.2967, "lr": 3.4489509278847414e-05, "epoch": 2.1933471933471935, "percentage": 43.87, "elapsed_time": "0:09:48", "remaining_time": "0:12:33", "throughput": 1442.71, "total_tokens": 849168} +{"current_steps": 2115, "total_steps": 4810, "loss": 0.2804, "lr": 3.4405522529694454e-05, "epoch": 2.1985446985446986, "percentage": 43.97, "elapsed_time": "0:09:48", "remaining_time": "0:12:30", "throughput": 1445.3, "total_tokens": 851152} +{"current_steps": 2120, "total_steps": 4810, "loss": 0.2789, "lr": 3.432141194450772e-05, "epoch": 2.2037422037422036, "percentage": 44.07, "elapsed_time": "0:09:49", "remaining_time": "0:12:27", "throughput": 1447.67, "total_tokens": 853008} +{"current_steps": 2125, "total_steps": 4810, "loss": 0.2593, "lr": 3.4237178630713314e-05, "epoch": 2.208939708939709, "percentage": 44.18, "elapsed_time": "0:09:49", "remaining_time": "0:12:24", "throughput": 1450.47, "total_tokens": 855120} +{"current_steps": 2130, "total_steps": 4810, "loss": 0.3184, "lr": 3.415282369735324e-05, "epoch": 2.214137214137214, "percentage": 44.28, "elapsed_time": "0:09:49", "remaining_time": "0:12:22", "throughput": 1453.26, "total_tokens": 857232} +{"current_steps": 2135, "total_steps": 4810, "loss": 0.2697, "lr": 3.4068348255070763e-05, "epoch": 2.2193347193347193, "percentage": 44.39, "elapsed_time": "0:09:50", "remaining_time": "0:12:19", "throughput": 1456.05, "total_tokens": 859344} +{"current_steps": 2140, "total_steps": 4810, "loss": 0.2666, "lr": 3.3983753416095845e-05, "epoch": 2.2245322245322248, "percentage": 44.49, "elapsed_time": "0:09:50", "remaining_time": "0:12:16", "throughput": 1458.62, "total_tokens": 861328} +{"current_steps": 2145, "total_steps": 4810, "loss": 0.2807, "lr": 3.389904029423041e-05, "epoch": 2.22972972972973, "percentage": 44.59, "elapsed_time": "0:09:50", "remaining_time": "0:12:14", "throughput": 1461.3, "total_tokens": 863376} +{"current_steps": 2150, "total_steps": 4810, "loss": 0.277, "lr": 3.381421000483378e-05, "epoch": 2.234927234927235, "percentage": 44.7, "elapsed_time": "0:09:51", "remaining_time": "0:12:11", "throughput": 1463.97, "total_tokens": 865424} +{"current_steps": 2155, "total_steps": 4810, "loss": 0.2884, "lr": 3.37292636648079e-05, "epoch": 2.24012474012474, "percentage": 44.8, "elapsed_time": "0:09:51", "remaining_time": "0:12:08", "throughput": 1466.64, "total_tokens": 867472} +{"current_steps": 2160, "total_steps": 4810, "loss": 0.259, "lr": 3.36442023925827e-05, "epoch": 2.2453222453222454, "percentage": 44.91, "elapsed_time": "0:09:51", "remaining_time": "0:12:06", "throughput": 1469.42, "total_tokens": 869584} +{"current_steps": 2165, "total_steps": 4810, "loss": 0.2477, "lr": 3.3559027308101345e-05, "epoch": 2.2505197505197505, "percentage": 45.01, "elapsed_time": "0:09:52", "remaining_time": "0:12:03", "throughput": 1471.97, "total_tokens": 871568} +{"current_steps": 2169, "total_steps": 4810, "eval_loss": 0.2923731505870819, "epoch": 2.2546777546777546, "percentage": 45.09, "elapsed_time": "0:09:54", "remaining_time": "0:12:04", "throughput": 1468.33, "total_tokens": 873104} +{"current_steps": 2170, "total_steps": 4810, "loss": 0.3482, "lr": 3.3473739532805467e-05, "epoch": 2.2557172557172556, "percentage": 45.11, "elapsed_time": "0:10:28", "remaining_time": "0:12:44", "throughput": 1390.87, "total_tokens": 873488} +{"current_steps": 2175, "total_steps": 4810, "loss": 0.26, "lr": 3.3388340189620424e-05, "epoch": 2.260914760914761, "percentage": 45.22, "elapsed_time": "0:10:28", "remaining_time": "0:12:41", "throughput": 1393.31, "total_tokens": 875472} +{"current_steps": 2180, "total_steps": 4810, "loss": 0.2554, "lr": 3.330283040294053e-05, "epoch": 2.266112266112266, "percentage": 45.32, "elapsed_time": "0:10:28", "remaining_time": "0:12:38", "throughput": 1395.65, "total_tokens": 877392} +{"current_steps": 2185, "total_steps": 4810, "loss": 0.2621, "lr": 3.321721129861422e-05, "epoch": 2.271309771309771, "percentage": 45.43, "elapsed_time": "0:10:28", "remaining_time": "0:12:35", "throughput": 1398.28, "total_tokens": 879504} +{"current_steps": 2190, "total_steps": 4810, "loss": 0.29, "lr": 3.3131484003929246e-05, "epoch": 2.2765072765072767, "percentage": 45.53, "elapsed_time": "0:10:29", "remaining_time": "0:12:32", "throughput": 1400.51, "total_tokens": 881360} +{"current_steps": 2195, "total_steps": 4810, "loss": 0.2916, "lr": 3.3045649647597815e-05, "epoch": 2.2817047817047817, "percentage": 45.63, "elapsed_time": "0:10:29", "remaining_time": "0:12:30", "throughput": 1402.84, "total_tokens": 883280} +{"current_steps": 2200, "total_steps": 4810, "loss": 0.2572, "lr": 3.2959709359741744e-05, "epoch": 2.286902286902287, "percentage": 45.74, "elapsed_time": "0:10:29", "remaining_time": "0:12:27", "throughput": 1405.37, "total_tokens": 885328} +{"current_steps": 2205, "total_steps": 4810, "loss": 0.3062, "lr": 3.2873664271877584e-05, "epoch": 2.2920997920997923, "percentage": 45.84, "elapsed_time": "0:10:30", "remaining_time": "0:12:24", "throughput": 1407.8, "total_tokens": 887312} +{"current_steps": 2210, "total_steps": 4810, "loss": 0.2672, "lr": 3.278751551690172e-05, "epoch": 2.2972972972972974, "percentage": 45.95, "elapsed_time": "0:10:30", "remaining_time": "0:12:21", "throughput": 1410.22, "total_tokens": 889296} +{"current_steps": 2215, "total_steps": 4810, "loss": 0.2647, "lr": 3.270126422907544e-05, "epoch": 2.3024948024948024, "percentage": 46.05, "elapsed_time": "0:10:30", "remaining_time": "0:12:19", "throughput": 1412.84, "total_tokens": 891408} +{"current_steps": 2220, "total_steps": 4810, "loss": 0.2884, "lr": 3.261491154401001e-05, "epoch": 2.3076923076923075, "percentage": 46.15, "elapsed_time": "0:10:31", "remaining_time": "0:12:16", "throughput": 1415.25, "total_tokens": 893392} +{"current_steps": 2225, "total_steps": 4810, "loss": 0.2719, "lr": 3.2528458598651734e-05, "epoch": 2.312889812889813, "percentage": 46.26, "elapsed_time": "0:10:31", "remaining_time": "0:12:13", "throughput": 1417.77, "total_tokens": 895440} +{"current_steps": 2230, "total_steps": 4810, "loss": 0.2718, "lr": 3.244190653126696e-05, "epoch": 2.318087318087318, "percentage": 46.36, "elapsed_time": "0:10:31", "remaining_time": "0:12:11", "throughput": 1420.48, "total_tokens": 897616} +{"current_steps": 2235, "total_steps": 4810, "loss": 0.2636, "lr": 3.2355256481427145e-05, "epoch": 2.323284823284823, "percentage": 46.47, "elapsed_time": "0:10:32", "remaining_time": "0:12:08", "throughput": 1422.78, "total_tokens": 899536} +{"current_steps": 2240, "total_steps": 4810, "loss": 0.2544, "lr": 3.226850958999375e-05, "epoch": 2.3284823284823286, "percentage": 46.57, "elapsed_time": "0:10:32", "remaining_time": "0:12:05", "throughput": 1425.39, "total_tokens": 901648} +{"current_steps": 2245, "total_steps": 4810, "loss": 0.2258, "lr": 3.2181666999103324e-05, "epoch": 2.3336798336798337, "percentage": 46.67, "elapsed_time": "0:10:32", "remaining_time": "0:12:03", "throughput": 1427.9, "total_tokens": 903696} +{"current_steps": 2250, "total_steps": 4810, "loss": 0.3054, "lr": 3.209472985215243e-05, "epoch": 2.3388773388773387, "percentage": 46.78, "elapsed_time": "0:10:33", "remaining_time": "0:12:00", "throughput": 1430.1, "total_tokens": 905552} +{"current_steps": 2255, "total_steps": 4810, "loss": 0.3446, "lr": 3.2007699293782555e-05, "epoch": 2.3440748440748442, "percentage": 46.88, "elapsed_time": "0:10:33", "remaining_time": "0:11:57", "throughput": 1432.39, "total_tokens": 907472} +{"current_steps": 2260, "total_steps": 4810, "loss": 0.2495, "lr": 3.1920576469865115e-05, "epoch": 2.3492723492723493, "percentage": 46.99, "elapsed_time": "0:10:33", "remaining_time": "0:11:55", "throughput": 1434.92, "total_tokens": 909584} +{"current_steps": 2265, "total_steps": 4810, "loss": 0.2754, "lr": 3.183336252748627e-05, "epoch": 2.3544698544698544, "percentage": 47.09, "elapsed_time": "0:10:34", "remaining_time": "0:11:52", "throughput": 1437.42, "total_tokens": 911632} +{"current_steps": 2270, "total_steps": 4810, "loss": 0.2604, "lr": 3.1746058614931916e-05, "epoch": 2.35966735966736, "percentage": 47.19, "elapsed_time": "0:10:34", "remaining_time": "0:11:50", "throughput": 1439.81, "total_tokens": 913616} +{"current_steps": 2275, "total_steps": 4810, "loss": 0.2711, "lr": 3.16586658816725e-05, "epoch": 2.364864864864865, "percentage": 47.3, "elapsed_time": "0:10:34", "remaining_time": "0:11:47", "throughput": 1442.39, "total_tokens": 915728} +{"current_steps": 2280, "total_steps": 4810, "loss": 0.2566, "lr": 3.157118547834793e-05, "epoch": 2.37006237006237, "percentage": 47.4, "elapsed_time": "0:10:35", "remaining_time": "0:11:44", "throughput": 1444.87, "total_tokens": 917776} +{"current_steps": 2285, "total_steps": 4810, "loss": 0.2684, "lr": 3.148361855675237e-05, "epoch": 2.375259875259875, "percentage": 47.51, "elapsed_time": "0:10:35", "remaining_time": "0:11:42", "throughput": 1447.56, "total_tokens": 919952} +{"current_steps": 2290, "total_steps": 4810, "loss": 0.2294, "lr": 3.139596626981916e-05, "epoch": 2.3804573804573805, "percentage": 47.61, "elapsed_time": "0:10:35", "remaining_time": "0:11:39", "throughput": 1449.84, "total_tokens": 921872} +{"current_steps": 2295, "total_steps": 4810, "loss": 0.2603, "lr": 3.130822977160554e-05, "epoch": 2.3856548856548856, "percentage": 47.71, "elapsed_time": "0:10:36", "remaining_time": "0:11:37", "throughput": 1452.23, "total_tokens": 923856} +{"current_steps": 2300, "total_steps": 4810, "loss": 0.3942, "lr": 3.122041021727755e-05, "epoch": 2.390852390852391, "percentage": 47.82, "elapsed_time": "0:10:36", "remaining_time": "0:11:34", "throughput": 1454.81, "total_tokens": 925968} +{"current_steps": 2305, "total_steps": 4810, "loss": 0.3128, "lr": 3.1132508763094715e-05, "epoch": 2.396049896049896, "percentage": 47.92, "elapsed_time": "0:10:36", "remaining_time": "0:11:32", "throughput": 1457.09, "total_tokens": 927888} +{"current_steps": 2310, "total_steps": 4810, "loss": 0.2467, "lr": 3.104452656639492e-05, "epoch": 2.401247401247401, "percentage": 48.02, "elapsed_time": "0:10:37", "remaining_time": "0:11:29", "throughput": 1459.36, "total_tokens": 929808} +{"current_steps": 2315, "total_steps": 4810, "loss": 0.1963, "lr": 3.0956464785579124e-05, "epoch": 2.4064449064449063, "percentage": 48.13, "elapsed_time": "0:10:37", "remaining_time": "0:11:27", "throughput": 1461.62, "total_tokens": 931728} +{"current_steps": 2320, "total_steps": 4810, "loss": 0.3533, "lr": 3.0868324580096114e-05, "epoch": 2.4116424116424118, "percentage": 48.23, "elapsed_time": "0:10:37", "remaining_time": "0:11:24", "throughput": 1464.19, "total_tokens": 933840} +{"current_steps": 2325, "total_steps": 4810, "loss": 0.2936, "lr": 3.078010711042723e-05, "epoch": 2.416839916839917, "percentage": 48.34, "elapsed_time": "0:10:38", "remaining_time": "0:11:22", "throughput": 1466.56, "total_tokens": 935824} +{"current_steps": 2330, "total_steps": 4810, "loss": 0.274, "lr": 3.0691813538071105e-05, "epoch": 2.422037422037422, "percentage": 48.44, "elapsed_time": "0:10:38", "remaining_time": "0:11:19", "throughput": 1469.02, "total_tokens": 937872} +{"current_steps": 2335, "total_steps": 4810, "loss": 0.3378, "lr": 3.0603445025528376e-05, "epoch": 2.4272349272349274, "percentage": 48.54, "elapsed_time": "0:10:38", "remaining_time": "0:11:17", "throughput": 1471.58, "total_tokens": 939984} +{"current_steps": 2340, "total_steps": 4810, "loss": 0.2418, "lr": 3.051500273628633e-05, "epoch": 2.4324324324324325, "percentage": 48.65, "elapsed_time": "0:10:39", "remaining_time": "0:11:14", "throughput": 1473.94, "total_tokens": 941968} +{"current_steps": 2345, "total_steps": 4810, "loss": 0.2943, "lr": 3.0426487834803657e-05, "epoch": 2.4376299376299375, "percentage": 48.75, "elapsed_time": "0:10:39", "remaining_time": "0:11:12", "throughput": 1476.3, "total_tokens": 943952} +{"current_steps": 2350, "total_steps": 4810, "loss": 0.2435, "lr": 3.0337901486495073e-05, "epoch": 2.442827442827443, "percentage": 48.86, "elapsed_time": "0:10:39", "remaining_time": "0:11:09", "throughput": 1478.55, "total_tokens": 945872} +{"current_steps": 2355, "total_steps": 4810, "loss": 0.267, "lr": 3.0249244857715976e-05, "epoch": 2.448024948024948, "percentage": 48.96, "elapsed_time": "0:10:40", "remaining_time": "0:11:07", "throughput": 1480.91, "total_tokens": 947856} +{"current_steps": 2360, "total_steps": 4810, "loss": 0.2452, "lr": 3.01605191157471e-05, "epoch": 2.453222453222453, "percentage": 49.06, "elapsed_time": "0:10:40", "remaining_time": "0:11:04", "throughput": 1483.26, "total_tokens": 949840} +{"current_steps": 2365, "total_steps": 4810, "loss": 0.2342, "lr": 3.007172542877915e-05, "epoch": 2.4584199584199586, "percentage": 49.17, "elapsed_time": "0:10:40", "remaining_time": "0:11:02", "throughput": 1485.49, "total_tokens": 951760} +{"current_steps": 2370, "total_steps": 4810, "loss": 0.3294, "lr": 2.998286496589742e-05, "epoch": 2.4636174636174637, "percentage": 49.27, "elapsed_time": "0:10:41", "remaining_time": "0:10:59", "throughput": 1487.73, "total_tokens": 953680} +{"current_steps": 2375, "total_steps": 4810, "loss": 0.2417, "lr": 2.9893938897066393e-05, "epoch": 2.4688149688149688, "percentage": 49.38, "elapsed_time": "0:10:41", "remaining_time": "0:10:57", "throughput": 1489.95, "total_tokens": 955600} +{"current_steps": 2380, "total_steps": 4810, "loss": 0.2781, "lr": 2.9804948393114324e-05, "epoch": 2.474012474012474, "percentage": 49.48, "elapsed_time": "0:10:41", "remaining_time": "0:10:55", "throughput": 1492.09, "total_tokens": 957456} +{"current_steps": 2385, "total_steps": 4810, "loss": 0.2721, "lr": 2.9715894625717866e-05, "epoch": 2.4792099792099793, "percentage": 49.58, "elapsed_time": "0:10:42", "remaining_time": "0:10:52", "throughput": 1494.52, "total_tokens": 959504} +{"current_steps": 2390, "total_steps": 4810, "loss": 0.277, "lr": 2.9626778767386604e-05, "epoch": 2.4844074844074844, "percentage": 49.69, "elapsed_time": "0:10:42", "remaining_time": "0:10:50", "throughput": 1496.85, "total_tokens": 961488} +{"current_steps": 2395, "total_steps": 4810, "loss": 0.2759, "lr": 2.953760199144764e-05, "epoch": 2.4896049896049894, "percentage": 49.79, "elapsed_time": "0:10:42", "remaining_time": "0:10:48", "throughput": 1499.07, "total_tokens": 963408} +{"current_steps": 2400, "total_steps": 4810, "loss": 0.2633, "lr": 2.9448365472030115e-05, "epoch": 2.494802494802495, "percentage": 49.9, "elapsed_time": "0:10:42", "remaining_time": "0:10:45", "throughput": 1501.4, "total_tokens": 965392} +{"current_steps": 2405, "total_steps": 4810, "loss": 0.2744, "lr": 2.935907038404981e-05, "epoch": 2.5, "percentage": 50.0, "elapsed_time": "0:10:43", "remaining_time": "0:10:43", "throughput": 1503.81, "total_tokens": 967440} +{"current_steps": 2410, "total_steps": 4810, "loss": 0.2379, "lr": 2.92697179031936e-05, "epoch": 2.505197505197505, "percentage": 50.1, "elapsed_time": "0:10:43", "remaining_time": "0:10:40", "throughput": 1506.02, "total_tokens": 969360} +{"current_steps": 2410, "total_steps": 4810, "eval_loss": 0.2576568126678467, "epoch": 2.505197505197505, "percentage": 50.1, "elapsed_time": "0:10:44", "remaining_time": "0:10:42", "throughput": 1503.49, "total_tokens": 969360} +{"current_steps": 2415, "total_steps": 4810, "loss": 0.2923, "lr": 2.9180309205904027e-05, "epoch": 2.51039501039501, "percentage": 50.21, "elapsed_time": "0:11:35", "remaining_time": "0:11:29", "throughput": 1397.45, "total_tokens": 971472} +{"current_steps": 2420, "total_steps": 4810, "loss": 0.296, "lr": 2.9090845469363805e-05, "epoch": 2.5155925155925156, "percentage": 50.31, "elapsed_time": "0:11:35", "remaining_time": "0:11:26", "throughput": 1399.64, "total_tokens": 973456} +{"current_steps": 2425, "total_steps": 4810, "loss": 0.2911, "lr": 2.9001327871480294e-05, "epoch": 2.5207900207900207, "percentage": 50.42, "elapsed_time": "0:11:35", "remaining_time": "0:11:24", "throughput": 1401.92, "total_tokens": 975504} +{"current_steps": 2430, "total_steps": 4810, "loss": 0.285, "lr": 2.8911757590870027e-05, "epoch": 2.525987525987526, "percentage": 50.52, "elapsed_time": "0:11:36", "remaining_time": "0:11:21", "throughput": 1404.2, "total_tokens": 977552} +{"current_steps": 2435, "total_steps": 4810, "loss": 0.2552, "lr": 2.8822135806843154e-05, "epoch": 2.5311850311850312, "percentage": 50.62, "elapsed_time": "0:11:36", "remaining_time": "0:11:19", "throughput": 1406.38, "total_tokens": 979536} +{"current_steps": 2440, "total_steps": 4810, "loss": 0.2906, "lr": 2.8732463699387968e-05, "epoch": 2.5363825363825363, "percentage": 50.73, "elapsed_time": "0:11:36", "remaining_time": "0:11:16", "throughput": 1408.66, "total_tokens": 981584} +{"current_steps": 2445, "total_steps": 4810, "loss": 0.2795, "lr": 2.8642742449155284e-05, "epoch": 2.5415800415800414, "percentage": 50.83, "elapsed_time": "0:11:37", "remaining_time": "0:11:14", "throughput": 1410.85, "total_tokens": 983632} +{"current_steps": 2450, "total_steps": 4810, "loss": 0.228, "lr": 2.855297323744301e-05, "epoch": 2.546777546777547, "percentage": 50.94, "elapsed_time": "0:11:37", "remaining_time": "0:11:11", "throughput": 1413.12, "total_tokens": 985680} +{"current_steps": 2455, "total_steps": 4810, "loss": 0.2414, "lr": 2.8463157246180468e-05, "epoch": 2.551975051975052, "percentage": 51.04, "elapsed_time": "0:11:37", "remaining_time": "0:11:09", "throughput": 1415.3, "total_tokens": 987664} +{"current_steps": 2460, "total_steps": 4810, "loss": 0.2636, "lr": 2.8373295657912945e-05, "epoch": 2.5571725571725574, "percentage": 51.14, "elapsed_time": "0:11:38", "remaining_time": "0:11:06", "throughput": 1417.47, "total_tokens": 989648} +{"current_steps": 2465, "total_steps": 4810, "loss": 0.2691, "lr": 2.828338965578603e-05, "epoch": 2.5623700623700625, "percentage": 51.25, "elapsed_time": "0:11:38", "remaining_time": "0:11:04", "throughput": 1419.73, "total_tokens": 991696} +{"current_steps": 2470, "total_steps": 4810, "loss": 0.2598, "lr": 2.8193440423530114e-05, "epoch": 2.5675675675675675, "percentage": 51.35, "elapsed_time": "0:11:38", "remaining_time": "0:11:02", "throughput": 1421.81, "total_tokens": 993616} +{"current_steps": 2475, "total_steps": 4810, "loss": 0.2688, "lr": 2.810344914544475e-05, "epoch": 2.5727650727650726, "percentage": 51.46, "elapsed_time": "0:11:39", "remaining_time": "0:10:59", "throughput": 1424.07, "total_tokens": 995664} +{"current_steps": 2480, "total_steps": 4810, "loss": 0.295, "lr": 2.8013417006383076e-05, "epoch": 2.577962577962578, "percentage": 51.56, "elapsed_time": "0:11:39", "remaining_time": "0:10:57", "throughput": 1426.24, "total_tokens": 997648} +{"current_steps": 2485, "total_steps": 4810, "loss": 0.2802, "lr": 2.792334519173624e-05, "epoch": 2.583160083160083, "percentage": 51.66, "elapsed_time": "0:11:39", "remaining_time": "0:10:54", "throughput": 1428.49, "total_tokens": 999696} +{"current_steps": 2490, "total_steps": 4810, "loss": 0.2897, "lr": 2.7833234887417743e-05, "epoch": 2.5883575883575882, "percentage": 51.77, "elapsed_time": "0:11:40", "remaining_time": "0:10:52", "throughput": 1430.65, "total_tokens": 1001680} +{"current_steps": 2495, "total_steps": 4810, "loss": 0.2723, "lr": 2.7743087279847868e-05, "epoch": 2.5935550935550937, "percentage": 51.87, "elapsed_time": "0:11:40", "remaining_time": "0:10:49", "throughput": 1432.9, "total_tokens": 1003728} +{"current_steps": 2500, "total_steps": 4810, "loss": 0.2874, "lr": 2.765290355593805e-05, "epoch": 2.598752598752599, "percentage": 51.98, "elapsed_time": "0:11:40", "remaining_time": "0:10:47", "throughput": 1434.87, "total_tokens": 1005584} +{"current_steps": 2505, "total_steps": 4810, "loss": 0.2405, "lr": 2.7562684903075238e-05, "epoch": 2.603950103950104, "percentage": 52.08, "elapsed_time": "0:11:41", "remaining_time": "0:10:45", "throughput": 1437.21, "total_tokens": 1007696} +{"current_steps": 2510, "total_steps": 4810, "loss": 0.2737, "lr": 2.7472432509106248e-05, "epoch": 2.609147609147609, "percentage": 52.18, "elapsed_time": "0:11:41", "remaining_time": "0:10:42", "throughput": 1439.36, "total_tokens": 1009680} +{"current_steps": 2515, "total_steps": 4810, "loss": 0.2753, "lr": 2.7382147562322174e-05, "epoch": 2.6143451143451144, "percentage": 52.29, "elapsed_time": "0:11:41", "remaining_time": "0:10:40", "throughput": 1441.61, "total_tokens": 1011728} +{"current_steps": 2520, "total_steps": 4810, "loss": 0.2553, "lr": 2.729183125144269e-05, "epoch": 2.6195426195426195, "percentage": 52.39, "elapsed_time": "0:11:42", "remaining_time": "0:10:38", "throughput": 1443.94, "total_tokens": 1013840} +{"current_steps": 2525, "total_steps": 4810, "loss": 0.2564, "lr": 2.7201484765600426e-05, "epoch": 2.624740124740125, "percentage": 52.49, "elapsed_time": "0:11:42", "remaining_time": "0:10:35", "throughput": 1446.08, "total_tokens": 1015824} +{"current_steps": 2530, "total_steps": 4810, "loss": 0.277, "lr": 2.7111109294325297e-05, "epoch": 2.62993762993763, "percentage": 52.6, "elapsed_time": "0:11:42", "remaining_time": "0:10:33", "throughput": 1448.13, "total_tokens": 1017744} +{"current_steps": 2535, "total_steps": 4810, "loss": 0.2439, "lr": 2.702070602752887e-05, "epoch": 2.635135135135135, "percentage": 52.7, "elapsed_time": "0:11:43", "remaining_time": "0:10:31", "throughput": 1450.27, "total_tokens": 1019728} +{"current_steps": 2540, "total_steps": 4810, "loss": 0.2958, "lr": 2.693027615548864e-05, "epoch": 2.64033264033264, "percentage": 52.81, "elapsed_time": "0:11:43", "remaining_time": "0:10:28", "throughput": 1452.6, "total_tokens": 1021840} +{"current_steps": 2545, "total_steps": 4810, "loss": 0.2809, "lr": 2.6839820868832433e-05, "epoch": 2.6455301455301456, "percentage": 52.91, "elapsed_time": "0:11:43", "remaining_time": "0:10:26", "throughput": 1454.73, "total_tokens": 1023824} +{"current_steps": 2550, "total_steps": 4810, "loss": 0.2583, "lr": 2.6749341358522674e-05, "epoch": 2.6507276507276507, "percentage": 53.01, "elapsed_time": "0:11:44", "remaining_time": "0:10:24", "throughput": 1456.6, "total_tokens": 1025616} +{"current_steps": 2555, "total_steps": 4810, "loss": 0.2494, "lr": 2.665883881584072e-05, "epoch": 2.6559251559251558, "percentage": 53.12, "elapsed_time": "0:11:44", "remaining_time": "0:10:21", "throughput": 1458.82, "total_tokens": 1027664} +{"current_steps": 2560, "total_steps": 4810, "loss": 0.2477, "lr": 2.6568314432371183e-05, "epoch": 2.6611226611226613, "percentage": 53.22, "elapsed_time": "0:11:44", "remaining_time": "0:10:19", "throughput": 1460.95, "total_tokens": 1029648} +{"current_steps": 2565, "total_steps": 4810, "loss": 0.2402, "lr": 2.6477769399986245e-05, "epoch": 2.6663201663201663, "percentage": 53.33, "elapsed_time": "0:11:45", "remaining_time": "0:10:17", "throughput": 1463.08, "total_tokens": 1031632} +{"current_steps": 2570, "total_steps": 4810, "loss": 0.2583, "lr": 2.6387204910829956e-05, "epoch": 2.6715176715176714, "percentage": 53.43, "elapsed_time": "0:11:45", "remaining_time": "0:10:14", "throughput": 1465.03, "total_tokens": 1033488} +{"current_steps": 2575, "total_steps": 4810, "loss": 0.2162, "lr": 2.629662215730253e-05, "epoch": 2.6767151767151764, "percentage": 53.53, "elapsed_time": "0:11:45", "remaining_time": "0:10:12", "throughput": 1467.25, "total_tokens": 1035536} +{"current_steps": 2580, "total_steps": 4810, "loss": 0.2652, "lr": 2.6206022332044667e-05, "epoch": 2.681912681912682, "percentage": 53.64, "elapsed_time": "0:11:46", "remaining_time": "0:10:10", "throughput": 1469.46, "total_tokens": 1037584} +{"current_steps": 2585, "total_steps": 4810, "loss": 0.2401, "lr": 2.6115406627921825e-05, "epoch": 2.687110187110187, "percentage": 53.74, "elapsed_time": "0:11:46", "remaining_time": "0:10:08", "throughput": 1471.58, "total_tokens": 1039568} +{"current_steps": 2590, "total_steps": 4810, "loss": 0.2416, "lr": 2.6024776238008543e-05, "epoch": 2.6923076923076925, "percentage": 53.85, "elapsed_time": "0:11:46", "remaining_time": "0:10:05", "throughput": 1473.79, "total_tokens": 1041616} +{"current_steps": 2595, "total_steps": 4810, "loss": 0.2479, "lr": 2.593413235557271e-05, "epoch": 2.6975051975051976, "percentage": 53.95, "elapsed_time": "0:11:47", "remaining_time": "0:10:03", "throughput": 1476.0, "total_tokens": 1043664} +{"current_steps": 2600, "total_steps": 4810, "loss": 0.2624, "lr": 2.5843476174059872e-05, "epoch": 2.7027027027027026, "percentage": 54.05, "elapsed_time": "0:11:47", "remaining_time": "0:10:01", "throughput": 1477.94, "total_tokens": 1045520} +{"current_steps": 2605, "total_steps": 4810, "loss": 0.2519, "lr": 2.5752808887077477e-05, "epoch": 2.7079002079002077, "percentage": 54.16, "elapsed_time": "0:11:47", "remaining_time": "0:09:59", "throughput": 1479.87, "total_tokens": 1047376} +{"current_steps": 2610, "total_steps": 4810, "loss": 0.2347, "lr": 2.5662131688379242e-05, "epoch": 2.713097713097713, "percentage": 54.26, "elapsed_time": "0:11:48", "remaining_time": "0:09:56", "throughput": 1481.98, "total_tokens": 1049360} +{"current_steps": 2615, "total_steps": 4810, "loss": 0.2785, "lr": 2.5571445771849327e-05, "epoch": 2.7182952182952183, "percentage": 54.37, "elapsed_time": "0:11:48", "remaining_time": "0:09:54", "throughput": 1484.09, "total_tokens": 1051344} +{"current_steps": 2620, "total_steps": 4810, "loss": 0.2622, "lr": 2.548075233148674e-05, "epoch": 2.7234927234927238, "percentage": 54.47, "elapsed_time": "0:11:48", "remaining_time": "0:09:52", "throughput": 1486.11, "total_tokens": 1053264} +{"current_steps": 2625, "total_steps": 4810, "loss": 0.2798, "lr": 2.5390052561389478e-05, "epoch": 2.728690228690229, "percentage": 54.57, "elapsed_time": "0:11:49", "remaining_time": "0:09:50", "throughput": 1488.21, "total_tokens": 1055248} +{"current_steps": 2630, "total_steps": 4810, "loss": 0.2568, "lr": 2.529934765573893e-05, "epoch": 2.733887733887734, "percentage": 54.68, "elapsed_time": "0:11:49", "remaining_time": "0:09:48", "throughput": 1490.13, "total_tokens": 1057104} +{"current_steps": 2635, "total_steps": 4810, "loss": 0.2622, "lr": 2.520863880878408e-05, "epoch": 2.739085239085239, "percentage": 54.78, "elapsed_time": "0:11:49", "remaining_time": "0:09:45", "throughput": 1492.14, "total_tokens": 1059024} +{"current_steps": 2640, "total_steps": 4810, "loss": 0.2707, "lr": 2.511792721482581e-05, "epoch": 2.7442827442827444, "percentage": 54.89, "elapsed_time": "0:11:50", "remaining_time": "0:09:43", "throughput": 1494.15, "total_tokens": 1060944} +{"current_steps": 2645, "total_steps": 4810, "loss": 0.2525, "lr": 2.502721406820116e-05, "epoch": 2.7494802494802495, "percentage": 54.99, "elapsed_time": "0:11:50", "remaining_time": "0:09:41", "throughput": 1496.34, "total_tokens": 1062992} +{"current_steps": 2650, "total_steps": 4810, "loss": 0.2934, "lr": 2.4936500563267627e-05, "epoch": 2.7546777546777546, "percentage": 55.09, "elapsed_time": "0:11:50", "remaining_time": "0:09:39", "throughput": 1498.26, "total_tokens": 1064848} +{"current_steps": 2651, "total_steps": 4810, "eval_loss": 0.2561495900154114, "epoch": 2.7557172557172556, "percentage": 55.11, "elapsed_time": "0:11:51", "remaining_time": "0:09:39", "throughput": 1496.46, "total_tokens": 1065232} +{"current_steps": 2655, "total_steps": 4810, "loss": 0.2493, "lr": 2.4845787894387425e-05, "epoch": 2.75987525987526, "percentage": 55.2, "elapsed_time": "0:12:35", "remaining_time": "0:10:13", "throughput": 1411.33, "total_tokens": 1066832} +{"current_steps": 2660, "total_steps": 4810, "loss": 0.2661, "lr": 2.4755077255911743e-05, "epoch": 2.765072765072765, "percentage": 55.3, "elapsed_time": "0:12:36", "remaining_time": "0:10:11", "throughput": 1413.43, "total_tokens": 1068880} +{"current_steps": 2665, "total_steps": 4810, "loss": 0.2398, "lr": 2.4664369842165068e-05, "epoch": 2.77027027027027, "percentage": 55.41, "elapsed_time": "0:12:36", "remaining_time": "0:10:08", "throughput": 1415.46, "total_tokens": 1070864} +{"current_steps": 2670, "total_steps": 4810, "loss": 0.2523, "lr": 2.4573666847429384e-05, "epoch": 2.7754677754677752, "percentage": 55.51, "elapsed_time": "0:12:36", "remaining_time": "0:10:06", "throughput": 1417.47, "total_tokens": 1072848} +{"current_steps": 2675, "total_steps": 4810, "loss": 0.3167, "lr": 2.4482969465928543e-05, "epoch": 2.7806652806652807, "percentage": 55.61, "elapsed_time": "0:12:37", "remaining_time": "0:10:04", "throughput": 1419.49, "total_tokens": 1074832} +{"current_steps": 2680, "total_steps": 4810, "loss": 0.2951, "lr": 2.4392278891812455e-05, "epoch": 2.785862785862786, "percentage": 55.72, "elapsed_time": "0:12:37", "remaining_time": "0:10:02", "throughput": 1421.67, "total_tokens": 1076944} +{"current_steps": 2685, "total_steps": 4810, "loss": 0.2844, "lr": 2.430159631914141e-05, "epoch": 2.7910602910602913, "percentage": 55.82, "elapsed_time": "0:12:37", "remaining_time": "0:09:59", "throughput": 1423.52, "total_tokens": 1078800} +{"current_steps": 2690, "total_steps": 4810, "loss": 0.2706, "lr": 2.4210922941870367e-05, "epoch": 2.7962577962577964, "percentage": 55.93, "elapsed_time": "0:12:38", "remaining_time": "0:09:57", "throughput": 1425.7, "total_tokens": 1080912} +{"current_steps": 2695, "total_steps": 4810, "loss": 0.244, "lr": 2.41202599538332e-05, "epoch": 2.8014553014553014, "percentage": 56.03, "elapsed_time": "0:12:38", "remaining_time": "0:09:55", "throughput": 1427.79, "total_tokens": 1082960} +{"current_steps": 2700, "total_steps": 4810, "loss": 0.2877, "lr": 2.402960854872697e-05, "epoch": 2.8066528066528065, "percentage": 56.13, "elapsed_time": "0:12:38", "remaining_time": "0:09:52", "throughput": 1429.89, "total_tokens": 1085008} +{"current_steps": 2705, "total_steps": 4810, "loss": 0.1818, "lr": 2.39389699200963e-05, "epoch": 2.811850311850312, "percentage": 56.24, "elapsed_time": "0:12:39", "remaining_time": "0:09:50", "throughput": 1432.15, "total_tokens": 1087184} +{"current_steps": 2710, "total_steps": 4810, "loss": 0.2384, "lr": 2.384834526131752e-05, "epoch": 2.817047817047817, "percentage": 56.34, "elapsed_time": "0:12:39", "remaining_time": "0:09:48", "throughput": 1434.07, "total_tokens": 1089104} +{"current_steps": 2715, "total_steps": 4810, "loss": 0.2707, "lr": 2.3757735765583083e-05, "epoch": 2.822245322245322, "percentage": 56.44, "elapsed_time": "0:12:39", "remaining_time": "0:09:46", "throughput": 1435.99, "total_tokens": 1091024} +{"current_steps": 2720, "total_steps": 4810, "loss": 0.2399, "lr": 2.366714262588577e-05, "epoch": 2.8274428274428276, "percentage": 56.55, "elapsed_time": "0:12:40", "remaining_time": "0:09:44", "throughput": 1437.99, "total_tokens": 1093008} +{"current_steps": 2725, "total_steps": 4810, "loss": 0.2595, "lr": 2.3576567035003027e-05, "epoch": 2.8326403326403327, "percentage": 56.65, "elapsed_time": "0:12:40", "remaining_time": "0:09:41", "throughput": 1439.99, "total_tokens": 1094992} +{"current_steps": 2730, "total_steps": 4810, "loss": 0.2918, "lr": 2.3486010185481248e-05, "epoch": 2.8378378378378377, "percentage": 56.76, "elapsed_time": "0:12:40", "remaining_time": "0:09:39", "throughput": 1442.08, "total_tokens": 1097040} +{"current_steps": 2735, "total_steps": 4810, "loss": 0.274, "lr": 2.3395473269620056e-05, "epoch": 2.8430353430353428, "percentage": 56.86, "elapsed_time": "0:12:41", "remaining_time": "0:09:37", "throughput": 1443.99, "total_tokens": 1098960} +{"current_steps": 2740, "total_steps": 4810, "loss": 0.2749, "lr": 2.330495747945665e-05, "epoch": 2.8482328482328483, "percentage": 56.96, "elapsed_time": "0:12:41", "remaining_time": "0:09:35", "throughput": 1446.31, "total_tokens": 1101200} +{"current_steps": 2745, "total_steps": 4810, "loss": 0.2766, "lr": 2.321446400675005e-05, "epoch": 2.8534303534303533, "percentage": 57.07, "elapsed_time": "0:12:41", "remaining_time": "0:09:33", "throughput": 1448.23, "total_tokens": 1103120} +{"current_steps": 2750, "total_steps": 4810, "loss": 0.255, "lr": 2.3123994042965453e-05, "epoch": 2.858627858627859, "percentage": 57.17, "elapsed_time": "0:12:42", "remaining_time": "0:09:30", "throughput": 1450.3, "total_tokens": 1105168} +{"current_steps": 2755, "total_steps": 4810, "loss": 0.2452, "lr": 2.3033548779258535e-05, "epoch": 2.863825363825364, "percentage": 57.28, "elapsed_time": "0:12:42", "remaining_time": "0:09:28", "throughput": 1452.29, "total_tokens": 1107152} +{"current_steps": 2760, "total_steps": 4810, "loss": 0.3016, "lr": 2.294312940645975e-05, "epoch": 2.869022869022869, "percentage": 57.38, "elapsed_time": "0:12:42", "remaining_time": "0:09:26", "throughput": 1454.36, "total_tokens": 1109200} +{"current_steps": 2765, "total_steps": 4810, "loss": 0.282, "lr": 2.2852737115058682e-05, "epoch": 2.874220374220374, "percentage": 57.48, "elapsed_time": "0:12:42", "remaining_time": "0:09:24", "throughput": 1456.43, "total_tokens": 1111248} +{"current_steps": 2770, "total_steps": 4810, "loss": 0.2753, "lr": 2.276237309518834e-05, "epoch": 2.8794178794178795, "percentage": 57.59, "elapsed_time": "0:12:43", "remaining_time": "0:09:22", "throughput": 1458.42, "total_tokens": 1113232} +{"current_steps": 2775, "total_steps": 4810, "loss": 0.268, "lr": 2.2672038536609487e-05, "epoch": 2.8846153846153846, "percentage": 57.69, "elapsed_time": "0:12:43", "remaining_time": "0:09:20", "throughput": 1460.4, "total_tokens": 1115216} +{"current_steps": 2780, "total_steps": 4810, "loss": 0.2816, "lr": 2.2581734628695034e-05, "epoch": 2.88981288981289, "percentage": 57.8, "elapsed_time": "0:12:43", "remaining_time": "0:09:17", "throughput": 1462.47, "total_tokens": 1117264} +{"current_steps": 2785, "total_steps": 4810, "loss": 0.2795, "lr": 2.2491462560414287e-05, "epoch": 2.895010395010395, "percentage": 57.9, "elapsed_time": "0:12:44", "remaining_time": "0:09:15", "throughput": 1464.61, "total_tokens": 1119376} +{"current_steps": 2790, "total_steps": 4810, "loss": 0.283, "lr": 2.2401223520317362e-05, "epoch": 2.9002079002079, "percentage": 58.0, "elapsed_time": "0:12:44", "remaining_time": "0:09:13", "throughput": 1466.68, "total_tokens": 1121424} +{"current_steps": 2795, "total_steps": 4810, "loss": 0.2663, "lr": 2.2311018696519532e-05, "epoch": 2.9054054054054053, "percentage": 58.11, "elapsed_time": "0:12:44", "remaining_time": "0:09:11", "throughput": 1468.74, "total_tokens": 1123472} +{"current_steps": 2800, "total_steps": 4810, "loss": 0.218, "lr": 2.222084927668553e-05, "epoch": 2.9106029106029108, "percentage": 58.21, "elapsed_time": "0:12:45", "remaining_time": "0:09:09", "throughput": 1470.88, "total_tokens": 1125584} +{"current_steps": 2805, "total_steps": 4810, "loss": 0.2474, "lr": 2.2130716448014e-05, "epoch": 2.915800415800416, "percentage": 58.32, "elapsed_time": "0:12:45", "remaining_time": "0:09:07", "throughput": 1472.85, "total_tokens": 1127568} +{"current_steps": 2810, "total_steps": 4810, "loss": 0.3308, "lr": 2.204062139722176e-05, "epoch": 2.920997920997921, "percentage": 58.42, "elapsed_time": "0:12:45", "remaining_time": "0:09:05", "throughput": 1474.83, "total_tokens": 1129552} +{"current_steps": 2815, "total_steps": 4810, "loss": 0.2914, "lr": 2.1950565310528266e-05, "epoch": 2.9261954261954264, "percentage": 58.52, "elapsed_time": "0:12:46", "remaining_time": "0:09:03", "throughput": 1476.71, "total_tokens": 1131472} +{"current_steps": 2820, "total_steps": 4810, "loss": 0.3008, "lr": 2.186054937363996e-05, "epoch": 2.9313929313929314, "percentage": 58.63, "elapsed_time": "0:12:46", "remaining_time": "0:09:00", "throughput": 1478.6, "total_tokens": 1133392} +{"current_steps": 2825, "total_steps": 4810, "loss": 0.2747, "lr": 2.1770574771734642e-05, "epoch": 2.9365904365904365, "percentage": 58.73, "elapsed_time": "0:12:46", "remaining_time": "0:08:58", "throughput": 1480.65, "total_tokens": 1135440} +{"current_steps": 2830, "total_steps": 4810, "loss": 0.2694, "lr": 2.168064268944591e-05, "epoch": 2.9417879417879416, "percentage": 58.84, "elapsed_time": "0:12:47", "remaining_time": "0:08:56", "throughput": 1482.59, "total_tokens": 1137424} +{"current_steps": 2835, "total_steps": 4810, "loss": 0.2574, "lr": 2.159075431084751e-05, "epoch": 2.946985446985447, "percentage": 58.94, "elapsed_time": "0:12:47", "remaining_time": "0:08:54", "throughput": 1484.56, "total_tokens": 1139408} +{"current_steps": 2840, "total_steps": 4810, "loss": 0.2677, "lr": 2.1500910819437766e-05, "epoch": 2.952182952182952, "percentage": 59.04, "elapsed_time": "0:12:47", "remaining_time": "0:08:52", "throughput": 1486.6, "total_tokens": 1141456} +{"current_steps": 2845, "total_steps": 4810, "loss": 0.2513, "lr": 2.141111339812405e-05, "epoch": 2.9573804573804576, "percentage": 59.15, "elapsed_time": "0:12:48", "remaining_time": "0:08:50", "throughput": 1488.56, "total_tokens": 1143440} +{"current_steps": 2850, "total_steps": 4810, "loss": 0.256, "lr": 2.1321363229207096e-05, "epoch": 2.9625779625779627, "percentage": 59.25, "elapsed_time": "0:12:48", "remaining_time": "0:08:48", "throughput": 1490.44, "total_tokens": 1145360} +{"current_steps": 2855, "total_steps": 4810, "loss": 0.2779, "lr": 2.123166149436556e-05, "epoch": 2.9677754677754677, "percentage": 59.36, "elapsed_time": "0:12:48", "remaining_time": "0:08:46", "throughput": 1492.32, "total_tokens": 1147280} +{"current_steps": 2860, "total_steps": 4810, "loss": 0.2814, "lr": 2.114200937464035e-05, "epoch": 2.972972972972973, "percentage": 59.46, "elapsed_time": "0:12:49", "remaining_time": "0:08:44", "throughput": 1494.2, "total_tokens": 1149200} +{"current_steps": 2865, "total_steps": 4810, "loss": 0.2671, "lr": 2.1052408050419152e-05, "epoch": 2.9781704781704783, "percentage": 59.56, "elapsed_time": "0:12:49", "remaining_time": "0:08:42", "throughput": 1496.15, "total_tokens": 1151184} +{"current_steps": 2870, "total_steps": 4810, "loss": 0.2391, "lr": 2.0962858701420866e-05, "epoch": 2.9833679833679834, "percentage": 59.67, "elapsed_time": "0:12:49", "remaining_time": "0:08:40", "throughput": 1498.19, "total_tokens": 1153232} +{"current_steps": 2875, "total_steps": 4810, "loss": 0.251, "lr": 2.0873362506680057e-05, "epoch": 2.9885654885654884, "percentage": 59.77, "elapsed_time": "0:12:50", "remaining_time": "0:08:38", "throughput": 1500.14, "total_tokens": 1155216} +{"current_steps": 2880, "total_steps": 4810, "loss": 0.2661, "lr": 2.078392064453144e-05, "epoch": 2.993762993762994, "percentage": 59.88, "elapsed_time": "0:12:50", "remaining_time": "0:08:36", "throughput": 1502.17, "total_tokens": 1157264} +{"current_steps": 2885, "total_steps": 4810, "loss": 0.2609, "lr": 2.0694534292594392e-05, "epoch": 2.998960498960499, "percentage": 59.98, "elapsed_time": "0:12:50", "remaining_time": "0:08:34", "throughput": 1504.21, "total_tokens": 1159312} +{"current_steps": 2890, "total_steps": 4810, "loss": 0.2209, "lr": 2.0605204627757403e-05, "epoch": 3.004158004158004, "percentage": 60.08, "elapsed_time": "0:12:51", "remaining_time": "0:08:32", "throughput": 1505.85, "total_tokens": 1161248} +{"current_steps": 2892, "total_steps": 4810, "eval_loss": 0.257083535194397, "epoch": 3.006237006237006, "percentage": 60.12, "elapsed_time": "0:12:52", "remaining_time": "0:08:32", "throughput": 1504.54, "total_tokens": 1162016} +{"current_steps": 2895, "total_steps": 4810, "loss": 0.2146, "lr": 2.051593282616262e-05, "epoch": 3.0093555093555096, "percentage": 60.19, "elapsed_time": "0:13:26", "remaining_time": "0:08:53", "throughput": 1442.55, "total_tokens": 1163168} +{"current_steps": 2900, "total_steps": 4810, "loss": 0.2637, "lr": 2.0426720063190335e-05, "epoch": 3.0145530145530146, "percentage": 60.29, "elapsed_time": "0:13:26", "remaining_time": "0:08:51", "throughput": 1444.35, "total_tokens": 1165088} +{"current_steps": 2905, "total_steps": 4810, "loss": 0.2303, "lr": 2.033756751344352e-05, "epoch": 3.0197505197505197, "percentage": 60.4, "elapsed_time": "0:13:26", "remaining_time": "0:08:49", "throughput": 1446.31, "total_tokens": 1167136} +{"current_steps": 2910, "total_steps": 4810, "loss": 0.2915, "lr": 2.0248476350732368e-05, "epoch": 3.024948024948025, "percentage": 60.5, "elapsed_time": "0:13:27", "remaining_time": "0:08:47", "throughput": 1448.19, "total_tokens": 1169120} +{"current_steps": 2915, "total_steps": 4810, "loss": 0.3333, "lr": 2.0159447748058805e-05, "epoch": 3.0301455301455302, "percentage": 60.6, "elapsed_time": "0:13:27", "remaining_time": "0:08:45", "throughput": 1449.99, "total_tokens": 1171040} +{"current_steps": 2920, "total_steps": 4810, "loss": 0.2142, "lr": 2.0070482877601127e-05, "epoch": 3.0353430353430353, "percentage": 60.71, "elapsed_time": "0:13:27", "remaining_time": "0:08:42", "throughput": 1451.87, "total_tokens": 1173024} +{"current_steps": 2925, "total_steps": 4810, "loss": 0.2912, "lr": 1.998158291069845e-05, "epoch": 3.0405405405405403, "percentage": 60.81, "elapsed_time": "0:13:28", "remaining_time": "0:08:40", "throughput": 1453.66, "total_tokens": 1174944} +{"current_steps": 2930, "total_steps": 4810, "loss": 0.2799, "lr": 1.9892749017835384e-05, "epoch": 3.045738045738046, "percentage": 60.91, "elapsed_time": "0:13:28", "remaining_time": "0:08:38", "throughput": 1455.7, "total_tokens": 1177056} +{"current_steps": 2935, "total_steps": 4810, "loss": 0.318, "lr": 1.9803982368626583e-05, "epoch": 3.050935550935551, "percentage": 61.02, "elapsed_time": "0:13:28", "remaining_time": "0:08:36", "throughput": 1457.49, "total_tokens": 1178976} +{"current_steps": 2940, "total_steps": 4810, "loss": 0.2836, "lr": 1.9715284131801353e-05, "epoch": 3.056133056133056, "percentage": 61.12, "elapsed_time": "0:13:29", "remaining_time": "0:08:34", "throughput": 1459.44, "total_tokens": 1181024} +{"current_steps": 2945, "total_steps": 4810, "loss": 0.2515, "lr": 1.9626655475188238e-05, "epoch": 3.0613305613305615, "percentage": 61.23, "elapsed_time": "0:13:29", "remaining_time": "0:08:32", "throughput": 1461.31, "total_tokens": 1183008} +{"current_steps": 2950, "total_steps": 4810, "loss": 0.2949, "lr": 1.953809756569971e-05, "epoch": 3.0665280665280665, "percentage": 61.33, "elapsed_time": "0:13:29", "remaining_time": "0:08:30", "throughput": 1463.26, "total_tokens": 1185056} +{"current_steps": 2955, "total_steps": 4810, "loss": 0.2646, "lr": 1.9449611569316717e-05, "epoch": 3.0717255717255716, "percentage": 61.43, "elapsed_time": "0:13:30", "remaining_time": "0:08:28", "throughput": 1465.05, "total_tokens": 1186976} +{"current_steps": 2960, "total_steps": 4810, "loss": 0.3027, "lr": 1.9361198651073408e-05, "epoch": 3.076923076923077, "percentage": 61.54, "elapsed_time": "0:13:30", "remaining_time": "0:08:26", "throughput": 1466.91, "total_tokens": 1188960} +{"current_steps": 2965, "total_steps": 4810, "loss": 0.2629, "lr": 1.9272859975041754e-05, "epoch": 3.082120582120582, "percentage": 61.64, "elapsed_time": "0:13:30", "remaining_time": "0:08:24", "throughput": 1468.78, "total_tokens": 1190944} +{"current_steps": 2970, "total_steps": 4810, "loss": 0.2261, "lr": 1.918459670431622e-05, "epoch": 3.087318087318087, "percentage": 61.75, "elapsed_time": "0:13:31", "remaining_time": "0:08:22", "throughput": 1470.59, "total_tokens": 1192928} +{"current_steps": 2975, "total_steps": 4810, "loss": 0.239, "lr": 1.9096410000998475e-05, "epoch": 3.0925155925155927, "percentage": 61.85, "elapsed_time": "0:13:31", "remaining_time": "0:08:20", "throughput": 1472.36, "total_tokens": 1194848} +{"current_steps": 2980, "total_steps": 4810, "loss": 0.2484, "lr": 1.900830102618206e-05, "epoch": 3.0977130977130978, "percentage": 61.95, "elapsed_time": "0:13:31", "remaining_time": "0:08:18", "throughput": 1474.14, "total_tokens": 1196768} +{"current_steps": 2985, "total_steps": 4810, "loss": 0.2739, "lr": 1.892027093993716e-05, "epoch": 3.102910602910603, "percentage": 62.06, "elapsed_time": "0:13:32", "remaining_time": "0:08:16", "throughput": 1475.91, "total_tokens": 1198688} +{"current_steps": 2990, "total_steps": 4810, "loss": 0.2701, "lr": 1.8832320901295227e-05, "epoch": 3.108108108108108, "percentage": 62.16, "elapsed_time": "0:13:32", "remaining_time": "0:08:14", "throughput": 1477.76, "total_tokens": 1200672} +{"current_steps": 2995, "total_steps": 4810, "loss": 0.29, "lr": 1.8744452068233825e-05, "epoch": 3.1133056133056134, "percentage": 62.27, "elapsed_time": "0:13:32", "remaining_time": "0:08:12", "throughput": 1479.69, "total_tokens": 1202720} +{"current_steps": 3000, "total_steps": 4810, "loss": 0.2816, "lr": 1.8656665597661333e-05, "epoch": 3.1185031185031185, "percentage": 62.37, "elapsed_time": "0:13:33", "remaining_time": "0:08:10", "throughput": 1481.62, "total_tokens": 1204768} +{"current_steps": 3005, "total_steps": 4810, "loss": 0.2677, "lr": 1.85689626454017e-05, "epoch": 3.1237006237006235, "percentage": 62.47, "elapsed_time": "0:13:33", "remaining_time": "0:08:08", "throughput": 1483.7, "total_tokens": 1206944} +{"current_steps": 3010, "total_steps": 4810, "loss": 0.2308, "lr": 1.8481344366179284e-05, "epoch": 3.128898128898129, "percentage": 62.58, "elapsed_time": "0:13:33", "remaining_time": "0:08:06", "throughput": 1485.7, "total_tokens": 1209056} +{"current_steps": 3015, "total_steps": 4810, "loss": 0.2745, "lr": 1.839381191360358e-05, "epoch": 3.134095634095634, "percentage": 62.68, "elapsed_time": "0:13:34", "remaining_time": "0:08:04", "throughput": 1487.47, "total_tokens": 1210976} +{"current_steps": 3020, "total_steps": 4810, "loss": 0.2645, "lr": 1.8306366440154066e-05, "epoch": 3.139293139293139, "percentage": 62.79, "elapsed_time": "0:13:34", "remaining_time": "0:08:02", "throughput": 1489.39, "total_tokens": 1213024} +{"current_steps": 3025, "total_steps": 4810, "loss": 0.2854, "lr": 1.821900909716504e-05, "epoch": 3.1444906444906446, "percentage": 62.89, "elapsed_time": "0:13:34", "remaining_time": "0:08:00", "throughput": 1491.39, "total_tokens": 1215136} +{"current_steps": 3030, "total_steps": 4810, "loss": 0.2667, "lr": 1.8131741034810435e-05, "epoch": 3.1496881496881497, "percentage": 62.99, "elapsed_time": "0:13:35", "remaining_time": "0:07:58", "throughput": 1493.15, "total_tokens": 1217056} +{"current_steps": 3035, "total_steps": 4810, "loss": 0.2799, "lr": 1.8044563402088684e-05, "epoch": 3.1548856548856548, "percentage": 63.1, "elapsed_time": "0:13:35", "remaining_time": "0:07:56", "throughput": 1495.14, "total_tokens": 1219168} +{"current_steps": 3040, "total_steps": 4810, "loss": 0.2724, "lr": 1.795747734680762e-05, "epoch": 3.1600831600831603, "percentage": 63.2, "elapsed_time": "0:13:35", "remaining_time": "0:07:54", "throughput": 1496.9, "total_tokens": 1221088} +{"current_steps": 3045, "total_steps": 4810, "loss": 0.2666, "lr": 1.7870484015569306e-05, "epoch": 3.1652806652806653, "percentage": 63.31, "elapsed_time": "0:13:36", "remaining_time": "0:07:53", "throughput": 1498.97, "total_tokens": 1223264} +{"current_steps": 3050, "total_steps": 4810, "loss": 0.2586, "lr": 1.7783584553755006e-05, "epoch": 3.1704781704781704, "percentage": 63.41, "elapsed_time": "0:13:36", "remaining_time": "0:07:51", "throughput": 1501.03, "total_tokens": 1225440} +{"current_steps": 3055, "total_steps": 4810, "loss": 0.2519, "lr": 1.769678010551003e-05, "epoch": 3.175675675675676, "percentage": 63.51, "elapsed_time": "0:13:36", "remaining_time": "0:07:49", "throughput": 1502.87, "total_tokens": 1227424} +{"current_steps": 3060, "total_steps": 4810, "loss": 0.241, "lr": 1.761007181372874e-05, "epoch": 3.180873180873181, "percentage": 63.62, "elapsed_time": "0:13:37", "remaining_time": "0:07:47", "throughput": 1504.63, "total_tokens": 1229344} +{"current_steps": 3065, "total_steps": 4810, "loss": 0.2406, "lr": 1.7523460820039464e-05, "epoch": 3.186070686070686, "percentage": 63.72, "elapsed_time": "0:13:37", "remaining_time": "0:07:45", "throughput": 1506.62, "total_tokens": 1231456} +{"current_steps": 3070, "total_steps": 4810, "loss": 0.3145, "lr": 1.7436948264789466e-05, "epoch": 3.1912681912681915, "percentage": 63.83, "elapsed_time": "0:13:37", "remaining_time": "0:07:43", "throughput": 1508.46, "total_tokens": 1233440} +{"current_steps": 3075, "total_steps": 4810, "loss": 0.2568, "lr": 1.7350535287029957e-05, "epoch": 3.1964656964656966, "percentage": 63.93, "elapsed_time": "0:13:38", "remaining_time": "0:07:41", "throughput": 1510.45, "total_tokens": 1235552} +{"current_steps": 3080, "total_steps": 4810, "loss": 0.2696, "lr": 1.7264223024501064e-05, "epoch": 3.2016632016632016, "percentage": 64.03, "elapsed_time": "0:13:38", "remaining_time": "0:07:39", "throughput": 1512.28, "total_tokens": 1237536} +{"current_steps": 3085, "total_steps": 4810, "loss": 0.2861, "lr": 1.717801261361685e-05, "epoch": 3.2068607068607067, "percentage": 64.14, "elapsed_time": "0:13:38", "remaining_time": "0:07:37", "throughput": 1514.19, "total_tokens": 1239584} +{"current_steps": 3090, "total_steps": 4810, "loss": 0.2501, "lr": 1.7091905189450423e-05, "epoch": 3.212058212058212, "percentage": 64.24, "elapsed_time": "0:13:38", "remaining_time": "0:07:35", "throughput": 1515.94, "total_tokens": 1241504} +{"current_steps": 3095, "total_steps": 4810, "loss": 0.2578, "lr": 1.700590188571887e-05, "epoch": 3.2172557172557172, "percentage": 64.35, "elapsed_time": "0:13:39", "remaining_time": "0:07:33", "throughput": 1517.85, "total_tokens": 1243552} +{"current_steps": 3100, "total_steps": 4810, "loss": 0.3075, "lr": 1.6920003834768438e-05, "epoch": 3.2224532224532223, "percentage": 64.45, "elapsed_time": "0:13:39", "remaining_time": "0:07:32", "throughput": 1519.75, "total_tokens": 1245600} +{"current_steps": 3105, "total_steps": 4810, "loss": 0.2389, "lr": 1.6834212167559575e-05, "epoch": 3.227650727650728, "percentage": 64.55, "elapsed_time": "0:13:39", "remaining_time": "0:07:30", "throughput": 1521.73, "total_tokens": 1247712} +{"current_steps": 3110, "total_steps": 4810, "loss": 0.26, "lr": 1.674852801365203e-05, "epoch": 3.232848232848233, "percentage": 64.66, "elapsed_time": "0:13:40", "remaining_time": "0:07:28", "throughput": 1523.55, "total_tokens": 1249696} +{"current_steps": 3115, "total_steps": 4810, "loss": 0.3027, "lr": 1.6662952501190033e-05, "epoch": 3.238045738045738, "percentage": 64.76, "elapsed_time": "0:13:40", "remaining_time": "0:07:26", "throughput": 1525.53, "total_tokens": 1251808} +{"current_steps": 3120, "total_steps": 4810, "loss": 0.2315, "lr": 1.6577486756887374e-05, "epoch": 3.2432432432432434, "percentage": 64.86, "elapsed_time": "0:13:40", "remaining_time": "0:07:24", "throughput": 1527.27, "total_tokens": 1253728} +{"current_steps": 3125, "total_steps": 4810, "loss": 0.249, "lr": 1.649213190601261e-05, "epoch": 3.2484407484407485, "percentage": 64.97, "elapsed_time": "0:13:41", "remaining_time": "0:07:22", "throughput": 1529.25, "total_tokens": 1255840} +{"current_steps": 3130, "total_steps": 4810, "loss": 0.2647, "lr": 1.640688907237425e-05, "epoch": 3.2536382536382535, "percentage": 65.07, "elapsed_time": "0:13:41", "remaining_time": "0:07:20", "throughput": 1531.14, "total_tokens": 1257888} +{"current_steps": 3133, "total_steps": 4810, "eval_loss": 0.2563324272632599, "epoch": 3.2567567567567566, "percentage": 65.14, "elapsed_time": "0:13:42", "remaining_time": "0:07:20", "throughput": 1530.42, "total_tokens": 1259168} +{"current_steps": 3135, "total_steps": 4810, "loss": 0.2584, "lr": 1.632175937830594e-05, "epoch": 3.258835758835759, "percentage": 65.18, "elapsed_time": "0:14:31", "remaining_time": "0:07:45", "throughput": 1445.42, "total_tokens": 1259936} +{"current_steps": 3140, "total_steps": 4810, "loss": 0.2355, "lr": 1.6236743944651703e-05, "epoch": 3.264033264033264, "percentage": 65.28, "elapsed_time": "0:14:31", "remaining_time": "0:07:43", "throughput": 1447.38, "total_tokens": 1262112} +{"current_steps": 3145, "total_steps": 4810, "loss": 0.2481, "lr": 1.615184389075117e-05, "epoch": 3.269230769230769, "percentage": 65.38, "elapsed_time": "0:14:32", "remaining_time": "0:07:41", "throughput": 1448.91, "total_tokens": 1263904} +{"current_steps": 3150, "total_steps": 4810, "loss": 0.2607, "lr": 1.6067060334424835e-05, "epoch": 3.274428274428274, "percentage": 65.49, "elapsed_time": "0:14:32", "remaining_time": "0:07:39", "throughput": 1450.72, "total_tokens": 1265952} +{"current_steps": 3155, "total_steps": 4810, "loss": 0.3119, "lr": 1.5982394391959382e-05, "epoch": 3.2796257796257797, "percentage": 65.59, "elapsed_time": "0:14:32", "remaining_time": "0:07:37", "throughput": 1452.39, "total_tokens": 1267872} +{"current_steps": 3160, "total_steps": 4810, "loss": 0.2925, "lr": 1.58978471780929e-05, "epoch": 3.284823284823285, "percentage": 65.7, "elapsed_time": "0:14:33", "remaining_time": "0:07:35", "throughput": 1454.05, "total_tokens": 1269792} +{"current_steps": 3165, "total_steps": 4810, "loss": 0.2586, "lr": 1.581341980600033e-05, "epoch": 3.29002079002079, "percentage": 65.8, "elapsed_time": "0:14:33", "remaining_time": "0:07:34", "throughput": 1455.79, "total_tokens": 1271776} +{"current_steps": 3170, "total_steps": 4810, "loss": 0.2671, "lr": 1.5729113387278673e-05, "epoch": 3.2952182952182953, "percentage": 65.9, "elapsed_time": "0:14:33", "remaining_time": "0:07:32", "throughput": 1457.53, "total_tokens": 1273760} +{"current_steps": 3175, "total_steps": 4810, "loss": 0.2864, "lr": 1.5644929031932454e-05, "epoch": 3.3004158004158004, "percentage": 66.01, "elapsed_time": "0:14:34", "remaining_time": "0:07:30", "throughput": 1459.34, "total_tokens": 1275808} +{"current_steps": 3180, "total_steps": 4810, "loss": 0.2666, "lr": 1.5560867848359077e-05, "epoch": 3.3056133056133055, "percentage": 66.11, "elapsed_time": "0:14:34", "remaining_time": "0:07:28", "throughput": 1461.07, "total_tokens": 1277792} +{"current_steps": 3185, "total_steps": 4810, "loss": 0.2648, "lr": 1.547693094333421e-05, "epoch": 3.310810810810811, "percentage": 66.22, "elapsed_time": "0:14:34", "remaining_time": "0:07:26", "throughput": 1462.81, "total_tokens": 1279776} +{"current_steps": 3190, "total_steps": 4810, "loss": 0.2586, "lr": 1.539311942199725e-05, "epoch": 3.316008316008316, "percentage": 66.32, "elapsed_time": "0:14:35", "remaining_time": "0:07:24", "throughput": 1464.54, "total_tokens": 1281760} +{"current_steps": 3195, "total_steps": 4810, "loss": 0.2391, "lr": 1.5309434387836735e-05, "epoch": 3.321205821205821, "percentage": 66.42, "elapsed_time": "0:14:35", "remaining_time": "0:07:22", "throughput": 1466.27, "total_tokens": 1283744} +{"current_steps": 3200, "total_steps": 4810, "loss": 0.2907, "lr": 1.5225876942675842e-05, "epoch": 3.3264033264033266, "percentage": 66.53, "elapsed_time": "0:14:35", "remaining_time": "0:07:20", "throughput": 1468.07, "total_tokens": 1285792} +{"current_steps": 3205, "total_steps": 4810, "loss": 0.2942, "lr": 1.5142448186657878e-05, "epoch": 3.3316008316008316, "percentage": 66.63, "elapsed_time": "0:14:36", "remaining_time": "0:07:18", "throughput": 1469.8, "total_tokens": 1287776} +{"current_steps": 3210, "total_steps": 4810, "loss": 0.3321, "lr": 1.505914921823178e-05, "epoch": 3.3367983367983367, "percentage": 66.74, "elapsed_time": "0:14:36", "remaining_time": "0:07:16", "throughput": 1471.45, "total_tokens": 1289696} +{"current_steps": 3215, "total_steps": 4810, "loss": 0.2486, "lr": 1.4975981134137659e-05, "epoch": 3.3419958419958418, "percentage": 66.84, "elapsed_time": "0:14:36", "remaining_time": "0:07:14", "throughput": 1473.18, "total_tokens": 1291680} +{"current_steps": 3220, "total_steps": 4810, "loss": 0.2502, "lr": 1.489294502939238e-05, "epoch": 3.3471933471933473, "percentage": 66.94, "elapsed_time": "0:14:37", "remaining_time": "0:07:13", "throughput": 1474.76, "total_tokens": 1293536} +{"current_steps": 3225, "total_steps": 4810, "loss": 0.2878, "lr": 1.4810041997275092e-05, "epoch": 3.3523908523908523, "percentage": 67.05, "elapsed_time": "0:14:37", "remaining_time": "0:07:11", "throughput": 1476.7, "total_tokens": 1295712} +{"current_steps": 3230, "total_steps": 4810, "loss": 0.2824, "lr": 1.4727273129312918e-05, "epoch": 3.357588357588358, "percentage": 67.15, "elapsed_time": "0:14:37", "remaining_time": "0:07:09", "throughput": 1478.49, "total_tokens": 1297760} +{"current_steps": 3235, "total_steps": 4810, "loss": 0.2772, "lr": 1.4644639515266483e-05, "epoch": 3.362785862785863, "percentage": 67.26, "elapsed_time": "0:14:38", "remaining_time": "0:07:07", "throughput": 1480.28, "total_tokens": 1299808} +{"current_steps": 3240, "total_steps": 4810, "loss": 0.2602, "lr": 1.4562142243115644e-05, "epoch": 3.367983367983368, "percentage": 67.36, "elapsed_time": "0:14:38", "remaining_time": "0:07:05", "throughput": 1482.15, "total_tokens": 1301920} +{"current_steps": 3245, "total_steps": 4810, "loss": 0.2737, "lr": 1.4479782399045152e-05, "epoch": 3.373180873180873, "percentage": 67.46, "elapsed_time": "0:14:38", "remaining_time": "0:07:03", "throughput": 1483.86, "total_tokens": 1303904} +{"current_steps": 3250, "total_steps": 4810, "loss": 0.2683, "lr": 1.4397561067430298e-05, "epoch": 3.3783783783783785, "percentage": 67.57, "elapsed_time": "0:14:39", "remaining_time": "0:07:01", "throughput": 1485.58, "total_tokens": 1305888} +{"current_steps": 3255, "total_steps": 4810, "loss": 0.261, "lr": 1.4315479330822712e-05, "epoch": 3.3835758835758836, "percentage": 67.67, "elapsed_time": "0:14:39", "remaining_time": "0:07:00", "throughput": 1487.51, "total_tokens": 1308064} +{"current_steps": 3260, "total_steps": 4810, "loss": 0.2702, "lr": 1.4233538269936042e-05, "epoch": 3.3887733887733886, "percentage": 67.78, "elapsed_time": "0:14:39", "remaining_time": "0:06:58", "throughput": 1489.23, "total_tokens": 1310048} +{"current_steps": 3265, "total_steps": 4810, "loss": 0.2761, "lr": 1.415173896363178e-05, "epoch": 3.393970893970894, "percentage": 67.88, "elapsed_time": "0:14:40", "remaining_time": "0:06:56", "throughput": 1490.86, "total_tokens": 1311968} +{"current_steps": 3270, "total_steps": 4810, "loss": 0.2631, "lr": 1.4070082488905034e-05, "epoch": 3.399168399168399, "percentage": 67.98, "elapsed_time": "0:14:40", "remaining_time": "0:06:54", "throughput": 1492.49, "total_tokens": 1313888} +{"current_steps": 3275, "total_steps": 4810, "loss": 0.2702, "lr": 1.3988569920870314e-05, "epoch": 3.4043659043659042, "percentage": 68.09, "elapsed_time": "0:14:40", "remaining_time": "0:06:52", "throughput": 1494.41, "total_tokens": 1316064} +{"current_steps": 3280, "total_steps": 4810, "loss": 0.2643, "lr": 1.3907202332747454e-05, "epoch": 3.4095634095634098, "percentage": 68.19, "elapsed_time": "0:14:40", "remaining_time": "0:06:50", "throughput": 1496.19, "total_tokens": 1318112} +{"current_steps": 3285, "total_steps": 4810, "loss": 0.2877, "lr": 1.3825980795847402e-05, "epoch": 3.414760914760915, "percentage": 68.3, "elapsed_time": "0:14:41", "remaining_time": "0:06:49", "throughput": 1497.74, "total_tokens": 1319968} +{"current_steps": 3290, "total_steps": 4810, "loss": 0.271, "lr": 1.3744906379558165e-05, "epoch": 3.41995841995842, "percentage": 68.4, "elapsed_time": "0:14:41", "remaining_time": "0:06:47", "throughput": 1499.52, "total_tokens": 1322016} +{"current_steps": 3295, "total_steps": 4810, "loss": 0.2729, "lr": 1.3663980151330732e-05, "epoch": 3.4251559251559254, "percentage": 68.5, "elapsed_time": "0:14:41", "remaining_time": "0:06:45", "throughput": 1501.14, "total_tokens": 1323936} +{"current_steps": 3300, "total_steps": 4810, "loss": 0.261, "lr": 1.3583203176664961e-05, "epoch": 3.4303534303534304, "percentage": 68.61, "elapsed_time": "0:14:42", "remaining_time": "0:06:43", "throughput": 1502.84, "total_tokens": 1325920} +{"current_steps": 3305, "total_steps": 4810, "loss": 0.2498, "lr": 1.350257651909562e-05, "epoch": 3.4355509355509355, "percentage": 68.71, "elapsed_time": "0:14:42", "remaining_time": "0:06:41", "throughput": 1504.47, "total_tokens": 1327840} +{"current_steps": 3310, "total_steps": 4810, "loss": 0.2384, "lr": 1.3422101240178365e-05, "epoch": 3.4407484407484406, "percentage": 68.81, "elapsed_time": "0:14:42", "remaining_time": "0:06:40", "throughput": 1506.09, "total_tokens": 1329760} +{"current_steps": 3315, "total_steps": 4810, "loss": 0.2789, "lr": 1.3341778399475713e-05, "epoch": 3.445945945945946, "percentage": 68.92, "elapsed_time": "0:14:43", "remaining_time": "0:06:38", "throughput": 1507.78, "total_tokens": 1331744} +{"current_steps": 3320, "total_steps": 4810, "loss": 0.26, "lr": 1.3261609054543179e-05, "epoch": 3.451143451143451, "percentage": 69.02, "elapsed_time": "0:14:43", "remaining_time": "0:06:36", "throughput": 1509.55, "total_tokens": 1333792} +{"current_steps": 3325, "total_steps": 4810, "loss": 0.2975, "lr": 1.3181594260915262e-05, "epoch": 3.456340956340956, "percentage": 69.13, "elapsed_time": "0:14:43", "remaining_time": "0:06:34", "throughput": 1511.24, "total_tokens": 1335776} +{"current_steps": 3330, "total_steps": 4810, "loss": 0.2479, "lr": 1.3101735072091622e-05, "epoch": 3.4615384615384617, "percentage": 69.23, "elapsed_time": "0:14:44", "remaining_time": "0:06:32", "throughput": 1513.0, "total_tokens": 1337824} +{"current_steps": 3335, "total_steps": 4810, "loss": 0.223, "lr": 1.3022032539523176e-05, "epoch": 3.4667359667359667, "percentage": 69.33, "elapsed_time": "0:14:44", "remaining_time": "0:06:31", "throughput": 1514.76, "total_tokens": 1339872} +{"current_steps": 3340, "total_steps": 4810, "loss": 0.2543, "lr": 1.2942487712598234e-05, "epoch": 3.471933471933472, "percentage": 69.44, "elapsed_time": "0:14:44", "remaining_time": "0:06:29", "throughput": 1516.52, "total_tokens": 1341920} +{"current_steps": 3345, "total_steps": 4810, "loss": 0.2449, "lr": 1.2863101638628717e-05, "epoch": 3.4771309771309773, "percentage": 69.54, "elapsed_time": "0:14:45", "remaining_time": "0:06:27", "throughput": 1518.21, "total_tokens": 1343904} +{"current_steps": 3350, "total_steps": 4810, "loss": 0.2881, "lr": 1.2783875362836373e-05, "epoch": 3.4823284823284824, "percentage": 69.65, "elapsed_time": "0:14:45", "remaining_time": "0:06:25", "throughput": 1519.96, "total_tokens": 1345952} +{"current_steps": 3355, "total_steps": 4810, "loss": 0.2574, "lr": 1.2704809928338956e-05, "epoch": 3.4875259875259874, "percentage": 69.75, "elapsed_time": "0:14:45", "remaining_time": "0:06:24", "throughput": 1521.86, "total_tokens": 1348128} +{"current_steps": 3360, "total_steps": 4810, "loss": 0.2915, "lr": 1.2625906376136581e-05, "epoch": 3.492723492723493, "percentage": 69.85, "elapsed_time": "0:14:46", "remaining_time": "0:06:22", "throughput": 1523.47, "total_tokens": 1350048} +{"current_steps": 3365, "total_steps": 4810, "loss": 0.2653, "lr": 1.2547165745097928e-05, "epoch": 3.497920997920998, "percentage": 69.96, "elapsed_time": "0:14:46", "remaining_time": "0:06:20", "throughput": 1525.08, "total_tokens": 1351968} +{"current_steps": 3370, "total_steps": 4810, "loss": 0.2795, "lr": 1.2468589071946632e-05, "epoch": 3.503118503118503, "percentage": 70.06, "elapsed_time": "0:14:46", "remaining_time": "0:06:18", "throughput": 1526.76, "total_tokens": 1353952} +{"current_steps": 3374, "total_steps": 4810, "eval_loss": 0.2641850709915161, "epoch": 3.507276507276507, "percentage": 70.15, "elapsed_time": "0:14:48", "remaining_time": "0:06:17", "throughput": 1526.35, "total_tokens": 1355552} +{"current_steps": 3375, "total_steps": 4810, "loss": 0.2673, "lr": 1.2390177391247614e-05, "epoch": 3.508316008316008, "percentage": 70.17, "elapsed_time": "0:15:15", "remaining_time": "0:06:29", "throughput": 1480.51, "total_tokens": 1356000} +{"current_steps": 3380, "total_steps": 4810, "loss": 0.2527, "lr": 1.2311931735393417e-05, "epoch": 3.5135135135135136, "percentage": 70.27, "elapsed_time": "0:15:16", "remaining_time": "0:06:27", "throughput": 1482.15, "total_tokens": 1357984} +{"current_steps": 3385, "total_steps": 4810, "loss": 0.2635, "lr": 1.2233853134590697e-05, "epoch": 3.5187110187110187, "percentage": 70.37, "elapsed_time": "0:15:16", "remaining_time": "0:06:25", "throughput": 1483.73, "total_tokens": 1359904} +{"current_steps": 3390, "total_steps": 4810, "loss": 0.2737, "lr": 1.215594261684656e-05, "epoch": 3.523908523908524, "percentage": 70.48, "elapsed_time": "0:15:16", "remaining_time": "0:06:24", "throughput": 1485.44, "total_tokens": 1361952} +{"current_steps": 3395, "total_steps": 4810, "loss": 0.2521, "lr": 1.2078201207955123e-05, "epoch": 3.529106029106029, "percentage": 70.58, "elapsed_time": "0:15:17", "remaining_time": "0:06:22", "throughput": 1487.16, "total_tokens": 1364000} +{"current_steps": 3400, "total_steps": 4810, "loss": 0.246, "lr": 1.2000629931483947e-05, "epoch": 3.5343035343035343, "percentage": 70.69, "elapsed_time": "0:15:17", "remaining_time": "0:06:20", "throughput": 1488.94, "total_tokens": 1366112} +{"current_steps": 3405, "total_steps": 4810, "loss": 0.3136, "lr": 1.1923229808760564e-05, "epoch": 3.5395010395010393, "percentage": 70.79, "elapsed_time": "0:15:17", "remaining_time": "0:06:18", "throughput": 1490.58, "total_tokens": 1368096} +{"current_steps": 3410, "total_steps": 4810, "loss": 0.2365, "lr": 1.1846001858859054e-05, "epoch": 3.544698544698545, "percentage": 70.89, "elapsed_time": "0:15:18", "remaining_time": "0:06:16", "throughput": 1492.36, "total_tokens": 1370208} +{"current_steps": 3415, "total_steps": 4810, "loss": 0.2545, "lr": 1.1768947098586628e-05, "epoch": 3.54989604989605, "percentage": 71.0, "elapsed_time": "0:15:18", "remaining_time": "0:06:15", "throughput": 1494.0, "total_tokens": 1372192} +{"current_steps": 3420, "total_steps": 4810, "loss": 0.2743, "lr": 1.1692066542470201e-05, "epoch": 3.555093555093555, "percentage": 71.1, "elapsed_time": "0:15:18", "remaining_time": "0:06:13", "throughput": 1495.71, "total_tokens": 1374240} +{"current_steps": 3425, "total_steps": 4810, "loss": 0.2821, "lr": 1.1615361202743088e-05, "epoch": 3.5602910602910605, "percentage": 71.21, "elapsed_time": "0:15:19", "remaining_time": "0:06:11", "throughput": 1497.28, "total_tokens": 1376160} +{"current_steps": 3430, "total_steps": 4810, "loss": 0.2579, "lr": 1.1538832089331628e-05, "epoch": 3.5654885654885655, "percentage": 71.31, "elapsed_time": "0:15:19", "remaining_time": "0:06:09", "throughput": 1498.99, "total_tokens": 1378208} +{"current_steps": 3435, "total_steps": 4810, "loss": 0.2526, "lr": 1.1462480209841928e-05, "epoch": 3.5706860706860706, "percentage": 71.41, "elapsed_time": "0:15:19", "remaining_time": "0:06:08", "throughput": 1500.62, "total_tokens": 1380192} +{"current_steps": 3440, "total_steps": 4810, "loss": 0.2369, "lr": 1.138630656954658e-05, "epoch": 3.5758835758835756, "percentage": 71.52, "elapsed_time": "0:15:20", "remaining_time": "0:06:06", "throughput": 1502.46, "total_tokens": 1382368} +{"current_steps": 3445, "total_steps": 4810, "loss": 0.3155, "lr": 1.1310312171371393e-05, "epoch": 3.581081081081081, "percentage": 71.62, "elapsed_time": "0:15:20", "remaining_time": "0:06:04", "throughput": 1504.37, "total_tokens": 1384608} +{"current_steps": 3450, "total_steps": 4810, "loss": 0.2615, "lr": 1.1234498015882261e-05, "epoch": 3.586278586278586, "percentage": 71.73, "elapsed_time": "0:15:20", "remaining_time": "0:06:02", "throughput": 1506.0, "total_tokens": 1386592} +{"current_steps": 3455, "total_steps": 4810, "loss": 0.2614, "lr": 1.1158865101271906e-05, "epoch": 3.5914760914760917, "percentage": 71.83, "elapsed_time": "0:15:21", "remaining_time": "0:06:01", "throughput": 1507.49, "total_tokens": 1388448} +{"current_steps": 3460, "total_steps": 4810, "loss": 0.2222, "lr": 1.1083414423346807e-05, "epoch": 3.5966735966735968, "percentage": 71.93, "elapsed_time": "0:15:21", "remaining_time": "0:05:59", "throughput": 1509.26, "total_tokens": 1390560} +{"current_steps": 3465, "total_steps": 4810, "loss": 0.3213, "lr": 1.1008146975514059e-05, "epoch": 3.601871101871102, "percentage": 72.04, "elapsed_time": "0:15:21", "remaining_time": "0:05:57", "throughput": 1511.1, "total_tokens": 1392736} +{"current_steps": 3470, "total_steps": 4810, "loss": 0.2762, "lr": 1.0933063748768254e-05, "epoch": 3.607068607068607, "percentage": 72.14, "elapsed_time": "0:15:22", "remaining_time": "0:05:56", "throughput": 1512.71, "total_tokens": 1394720} +{"current_steps": 3475, "total_steps": 4810, "loss": 0.23, "lr": 1.0858165731678513e-05, "epoch": 3.6122661122661124, "percentage": 72.25, "elapsed_time": "0:15:22", "remaining_time": "0:05:54", "throughput": 1514.27, "total_tokens": 1396640} +{"current_steps": 3480, "total_steps": 4810, "loss": 0.3322, "lr": 1.0783453910375424e-05, "epoch": 3.6174636174636174, "percentage": 72.35, "elapsed_time": "0:15:22", "remaining_time": "0:05:52", "throughput": 1516.03, "total_tokens": 1398752} +{"current_steps": 3485, "total_steps": 4810, "loss": 0.2494, "lr": 1.0708929268538034e-05, "epoch": 3.6226611226611225, "percentage": 72.45, "elapsed_time": "0:15:22", "remaining_time": "0:05:50", "throughput": 1517.72, "total_tokens": 1400800} +{"current_steps": 3490, "total_steps": 4810, "loss": 0.2596, "lr": 1.0634592787380965e-05, "epoch": 3.627858627858628, "percentage": 72.56, "elapsed_time": "0:15:23", "remaining_time": "0:05:49", "throughput": 1519.28, "total_tokens": 1402720} +{"current_steps": 3495, "total_steps": 4810, "loss": 0.2563, "lr": 1.0560445445641423e-05, "epoch": 3.633056133056133, "percentage": 72.66, "elapsed_time": "0:15:23", "remaining_time": "0:05:47", "throughput": 1520.9, "total_tokens": 1404704} +{"current_steps": 3500, "total_steps": 4810, "loss": 0.2589, "lr": 1.048648821956637e-05, "epoch": 3.638253638253638, "percentage": 72.77, "elapsed_time": "0:15:23", "remaining_time": "0:05:45", "throughput": 1522.38, "total_tokens": 1406560} +{"current_steps": 3505, "total_steps": 4810, "loss": 0.2386, "lr": 1.0412722082899644e-05, "epoch": 3.643451143451143, "percentage": 72.87, "elapsed_time": "0:15:24", "remaining_time": "0:05:44", "throughput": 1524.0, "total_tokens": 1408544} +{"current_steps": 3510, "total_steps": 4810, "loss": 0.2512, "lr": 1.033914800686912e-05, "epoch": 3.6486486486486487, "percentage": 72.97, "elapsed_time": "0:15:24", "remaining_time": "0:05:42", "throughput": 1525.55, "total_tokens": 1410464} +{"current_steps": 3515, "total_steps": 4810, "loss": 0.2277, "lr": 1.0265766960173965e-05, "epoch": 3.6538461538461537, "percentage": 73.08, "elapsed_time": "0:15:24", "remaining_time": "0:05:40", "throughput": 1527.17, "total_tokens": 1412448} +{"current_steps": 3520, "total_steps": 4810, "loss": 0.2869, "lr": 1.019257990897185e-05, "epoch": 3.6590436590436592, "percentage": 73.18, "elapsed_time": "0:15:25", "remaining_time": "0:05:39", "throughput": 1529.05, "total_tokens": 1414688} +{"current_steps": 3525, "total_steps": 4810, "loss": 0.2914, "lr": 1.0119587816866258e-05, "epoch": 3.6642411642411643, "percentage": 73.28, "elapsed_time": "0:15:25", "remaining_time": "0:05:37", "throughput": 1530.66, "total_tokens": 1416672} +{"current_steps": 3530, "total_steps": 4810, "loss": 0.2836, "lr": 1.0046791644893758e-05, "epoch": 3.6694386694386694, "percentage": 73.39, "elapsed_time": "0:15:25", "remaining_time": "0:05:35", "throughput": 1532.2, "total_tokens": 1418592} +{"current_steps": 3535, "total_steps": 4810, "loss": 0.2675, "lr": 9.974192351511368e-06, "epoch": 3.6746361746361744, "percentage": 73.49, "elapsed_time": "0:15:26", "remaining_time": "0:05:34", "throughput": 1533.8, "total_tokens": 1420576} +{"current_steps": 3540, "total_steps": 4810, "loss": 0.2679, "lr": 9.901790892583974e-06, "epoch": 3.67983367983368, "percentage": 73.6, "elapsed_time": "0:15:26", "remaining_time": "0:05:32", "throughput": 1535.41, "total_tokens": 1422560} +{"current_steps": 3545, "total_steps": 4810, "loss": 0.2697, "lr": 9.829588221371694e-06, "epoch": 3.685031185031185, "percentage": 73.7, "elapsed_time": "0:15:26", "remaining_time": "0:05:30", "throughput": 1537.08, "total_tokens": 1424608} +{"current_steps": 3550, "total_steps": 4810, "loss": 0.2612, "lr": 9.757585288517328e-06, "epoch": 3.6902286902286905, "percentage": 73.8, "elapsed_time": "0:15:27", "remaining_time": "0:05:29", "throughput": 1538.89, "total_tokens": 1426784} +{"current_steps": 3555, "total_steps": 4810, "loss": 0.2501, "lr": 9.6857830420339e-06, "epoch": 3.6954261954261955, "percentage": 73.91, "elapsed_time": "0:15:27", "remaining_time": "0:05:27", "throughput": 1540.63, "total_tokens": 1428896} +{"current_steps": 3560, "total_steps": 4810, "loss": 0.2586, "lr": 9.614182427292077e-06, "epoch": 3.7006237006237006, "percentage": 74.01, "elapsed_time": "0:15:27", "remaining_time": "0:05:25", "throughput": 1542.23, "total_tokens": 1430880} +{"current_steps": 3565, "total_steps": 4810, "loss": 0.2484, "lr": 9.54278438700785e-06, "epoch": 3.7058212058212057, "percentage": 74.12, "elapsed_time": "0:15:28", "remaining_time": "0:05:24", "throughput": 1543.83, "total_tokens": 1432864} +{"current_steps": 3570, "total_steps": 4810, "loss": 0.287, "lr": 9.471589861229998e-06, "epoch": 3.711018711018711, "percentage": 74.22, "elapsed_time": "0:15:28", "remaining_time": "0:05:22", "throughput": 1545.49, "total_tokens": 1434912} +{"current_steps": 3575, "total_steps": 4810, "loss": 0.3025, "lr": 9.400599787327773e-06, "epoch": 3.7162162162162162, "percentage": 74.32, "elapsed_time": "0:15:28", "remaining_time": "0:05:20", "throughput": 1547.02, "total_tokens": 1436832} +{"current_steps": 3580, "total_steps": 4810, "loss": 0.2433, "lr": 9.329815099978568e-06, "epoch": 3.7214137214137213, "percentage": 74.43, "elapsed_time": "0:15:29", "remaining_time": "0:05:19", "throughput": 1548.55, "total_tokens": 1438752} +{"current_steps": 3585, "total_steps": 4810, "loss": 0.3809, "lr": 9.259236731155582e-06, "epoch": 3.726611226611227, "percentage": 74.53, "elapsed_time": "0:15:29", "remaining_time": "0:05:17", "throughput": 1550.08, "total_tokens": 1440672} +{"current_steps": 3590, "total_steps": 4810, "loss": 0.2221, "lr": 9.18886561011557e-06, "epoch": 3.731808731808732, "percentage": 74.64, "elapsed_time": "0:15:29", "remaining_time": "0:05:15", "throughput": 1551.81, "total_tokens": 1442784} +{"current_steps": 3595, "total_steps": 4810, "loss": 0.2622, "lr": 9.118702663386584e-06, "epoch": 3.737006237006237, "percentage": 74.74, "elapsed_time": "0:15:30", "remaining_time": "0:05:14", "throughput": 1553.6, "total_tokens": 1444960} +{"current_steps": 3600, "total_steps": 4810, "loss": 0.3094, "lr": 9.048748814755784e-06, "epoch": 3.742203742203742, "percentage": 74.84, "elapsed_time": "0:15:30", "remaining_time": "0:05:12", "throughput": 1555.13, "total_tokens": 1446880} +{"current_steps": 3605, "total_steps": 4810, "loss": 0.2723, "lr": 8.979004985257294e-06, "epoch": 3.7474012474012475, "percentage": 74.95, "elapsed_time": "0:15:30", "remaining_time": "0:05:11", "throughput": 1556.85, "total_tokens": 1448992} +{"current_steps": 3610, "total_steps": 4810, "loss": 0.2755, "lr": 8.909472093160065e-06, "epoch": 3.7525987525987525, "percentage": 75.05, "elapsed_time": "0:15:31", "remaining_time": "0:05:09", "throughput": 1558.44, "total_tokens": 1450976} +{"current_steps": 3615, "total_steps": 4810, "loss": 0.2751, "lr": 8.840151053955773e-06, "epoch": 3.757796257796258, "percentage": 75.16, "elapsed_time": "0:15:31", "remaining_time": "0:05:07", "throughput": 1560.17, "total_tokens": 1453088} +{"current_steps": 3615, "total_steps": 4810, "eval_loss": 0.25871533155441284, "epoch": 3.757796257796258, "percentage": 75.16, "elapsed_time": "0:15:32", "remaining_time": "0:05:08", "throughput": 1558.41, "total_tokens": 1453088} +{"current_steps": 3620, "total_steps": 4810, "loss": 0.2834, "lr": 8.771042780346766e-06, "epoch": 3.762993762993763, "percentage": 75.26, "elapsed_time": "0:16:11", "remaining_time": "0:05:19", "throughput": 1497.07, "total_tokens": 1455136} +{"current_steps": 3625, "total_steps": 4810, "loss": 0.2472, "lr": 8.702148182234043e-06, "epoch": 3.768191268191268, "percentage": 75.36, "elapsed_time": "0:16:12", "remaining_time": "0:05:17", "throughput": 1498.62, "total_tokens": 1457120} +{"current_steps": 3630, "total_steps": 4810, "loss": 0.2772, "lr": 8.633468166705336e-06, "epoch": 3.773388773388773, "percentage": 75.47, "elapsed_time": "0:16:12", "remaining_time": "0:05:16", "throughput": 1500.23, "total_tokens": 1459168} +{"current_steps": 3635, "total_steps": 4810, "loss": 0.2651, "lr": 8.565003638023065e-06, "epoch": 3.7785862785862787, "percentage": 75.57, "elapsed_time": "0:16:12", "remaining_time": "0:05:14", "throughput": 1501.78, "total_tokens": 1461152} +{"current_steps": 3640, "total_steps": 4810, "loss": 0.2756, "lr": 8.496755497612492e-06, "epoch": 3.7837837837837838, "percentage": 75.68, "elapsed_time": "0:16:13", "remaining_time": "0:05:12", "throughput": 1503.32, "total_tokens": 1463136} +{"current_steps": 3645, "total_steps": 4810, "loss": 0.2693, "lr": 8.42872464404986e-06, "epoch": 3.788981288981289, "percentage": 75.78, "elapsed_time": "0:16:13", "remaining_time": "0:05:11", "throughput": 1504.86, "total_tokens": 1465120} +{"current_steps": 3650, "total_steps": 4810, "loss": 0.2816, "lr": 8.360911973050537e-06, "epoch": 3.7941787941787943, "percentage": 75.88, "elapsed_time": "0:16:13", "remaining_time": "0:05:09", "throughput": 1506.4, "total_tokens": 1467104} +{"current_steps": 3655, "total_steps": 4810, "loss": 0.2571, "lr": 8.293318377457241e-06, "epoch": 3.7993762993762994, "percentage": 75.99, "elapsed_time": "0:16:14", "remaining_time": "0:05:07", "throughput": 1508.01, "total_tokens": 1469152} +{"current_steps": 3660, "total_steps": 4810, "loss": 0.268, "lr": 8.225944747228257e-06, "epoch": 3.8045738045738045, "percentage": 76.09, "elapsed_time": "0:16:14", "remaining_time": "0:05:06", "throughput": 1509.67, "total_tokens": 1471264} +{"current_steps": 3665, "total_steps": 4810, "loss": 0.2128, "lr": 8.158791969425738e-06, "epoch": 3.8097713097713095, "percentage": 76.2, "elapsed_time": "0:16:14", "remaining_time": "0:05:04", "throughput": 1511.21, "total_tokens": 1473248} +{"current_steps": 3670, "total_steps": 4810, "loss": 0.3101, "lr": 8.091860928204049e-06, "epoch": 3.814968814968815, "percentage": 76.3, "elapsed_time": "0:16:15", "remaining_time": "0:05:02", "throughput": 1512.87, "total_tokens": 1475360} +{"current_steps": 3675, "total_steps": 4810, "loss": 0.3044, "lr": 8.025152504798078e-06, "epoch": 3.82016632016632, "percentage": 76.4, "elapsed_time": "0:16:15", "remaining_time": "0:05:01", "throughput": 1514.54, "total_tokens": 1477472} +{"current_steps": 3680, "total_steps": 4810, "loss": 0.2471, "lr": 7.958667577511683e-06, "epoch": 3.8253638253638256, "percentage": 76.51, "elapsed_time": "0:16:15", "remaining_time": "0:04:59", "throughput": 1515.93, "total_tokens": 1479328} +{"current_steps": 3685, "total_steps": 4810, "loss": 0.2552, "lr": 7.892407021706063e-06, "epoch": 3.8305613305613306, "percentage": 76.61, "elapsed_time": "0:16:16", "remaining_time": "0:04:58", "throughput": 1517.4, "total_tokens": 1481248} +{"current_steps": 3690, "total_steps": 4810, "loss": 0.3112, "lr": 7.826371709788313e-06, "epoch": 3.8357588357588357, "percentage": 76.72, "elapsed_time": "0:16:16", "remaining_time": "0:04:56", "throughput": 1518.86, "total_tokens": 1483168} +{"current_steps": 3695, "total_steps": 4810, "loss": 0.2585, "lr": 7.760562511199882e-06, "epoch": 3.8409563409563408, "percentage": 76.82, "elapsed_time": "0:16:16", "remaining_time": "0:04:54", "throughput": 1520.39, "total_tokens": 1485152} +{"current_steps": 3700, "total_steps": 4810, "loss": 0.2673, "lr": 7.694980292405122e-06, "epoch": 3.8461538461538463, "percentage": 76.92, "elapsed_time": "0:16:17", "remaining_time": "0:04:53", "throughput": 1521.98, "total_tokens": 1487200} +{"current_steps": 3705, "total_steps": 4810, "loss": 0.2763, "lr": 7.629625916879932e-06, "epoch": 3.8513513513513513, "percentage": 77.03, "elapsed_time": "0:16:17", "remaining_time": "0:04:51", "throughput": 1523.5, "total_tokens": 1489184} +{"current_steps": 3710, "total_steps": 4810, "loss": 0.278, "lr": 7.564500245100325e-06, "epoch": 3.856548856548857, "percentage": 77.13, "elapsed_time": "0:16:17", "remaining_time": "0:04:49", "throughput": 1525.03, "total_tokens": 1491168} +{"current_steps": 3715, "total_steps": 4810, "loss": 0.2727, "lr": 7.499604134531149e-06, "epoch": 3.861746361746362, "percentage": 77.23, "elapsed_time": "0:16:18", "remaining_time": "0:04:48", "throughput": 1526.62, "total_tokens": 1493216} +{"current_steps": 3720, "total_steps": 4810, "loss": 0.2667, "lr": 7.434938439614781e-06, "epoch": 3.866943866943867, "percentage": 77.34, "elapsed_time": "0:16:18", "remaining_time": "0:04:46", "throughput": 1528.14, "total_tokens": 1495200} +{"current_steps": 3725, "total_steps": 4810, "loss": 0.2707, "lr": 7.370504011759855e-06, "epoch": 3.872141372141372, "percentage": 77.44, "elapsed_time": "0:16:18", "remaining_time": "0:04:45", "throughput": 1529.66, "total_tokens": 1497184} +{"current_steps": 3730, "total_steps": 4810, "loss": 0.2656, "lr": 7.306301699330065e-06, "epoch": 3.8773388773388775, "percentage": 77.55, "elapsed_time": "0:16:19", "remaining_time": "0:04:43", "throughput": 1531.05, "total_tokens": 1499040} +{"current_steps": 3735, "total_steps": 4810, "loss": 0.2423, "lr": 7.242332347633052e-06, "epoch": 3.8825363825363826, "percentage": 77.65, "elapsed_time": "0:16:19", "remaining_time": "0:04:41", "throughput": 1532.57, "total_tokens": 1501024} +{"current_steps": 3740, "total_steps": 4810, "loss": 0.2487, "lr": 7.178596798909159e-06, "epoch": 3.8877338877338876, "percentage": 77.75, "elapsed_time": "0:16:19", "remaining_time": "0:04:40", "throughput": 1534.15, "total_tokens": 1503072} +{"current_steps": 3745, "total_steps": 4810, "loss": 0.2847, "lr": 7.115095892320456e-06, "epoch": 3.892931392931393, "percentage": 77.86, "elapsed_time": "0:16:20", "remaining_time": "0:04:38", "throughput": 1535.86, "total_tokens": 1505248} +{"current_steps": 3750, "total_steps": 4810, "loss": 0.2334, "lr": 7.051830463939604e-06, "epoch": 3.898128898128898, "percentage": 77.96, "elapsed_time": "0:16:20", "remaining_time": "0:04:37", "throughput": 1537.44, "total_tokens": 1507296} +{"current_steps": 3755, "total_steps": 4810, "loss": 0.2595, "lr": 6.98880134673891e-06, "epoch": 3.9033264033264032, "percentage": 78.07, "elapsed_time": "0:16:20", "remaining_time": "0:04:35", "throughput": 1539.02, "total_tokens": 1509344} +{"current_steps": 3760, "total_steps": 4810, "loss": 0.2098, "lr": 6.926009370579334e-06, "epoch": 3.9085239085239083, "percentage": 78.17, "elapsed_time": "0:16:21", "remaining_time": "0:04:33", "throughput": 1540.66, "total_tokens": 1511456} +{"current_steps": 3765, "total_steps": 4810, "loss": 0.2277, "lr": 6.8634553621995416e-06, "epoch": 3.913721413721414, "percentage": 78.27, "elapsed_time": "0:16:21", "remaining_time": "0:04:32", "throughput": 1542.17, "total_tokens": 1513440} +{"current_steps": 3770, "total_steps": 4810, "loss": 0.3251, "lr": 6.80114014520507e-06, "epoch": 3.918918918918919, "percentage": 78.38, "elapsed_time": "0:16:21", "remaining_time": "0:04:30", "throughput": 1543.74, "total_tokens": 1515488} +{"current_steps": 3775, "total_steps": 4810, "loss": 0.2604, "lr": 6.739064540057424e-06, "epoch": 3.9241164241164244, "percentage": 78.48, "elapsed_time": "0:16:22", "remaining_time": "0:04:29", "throughput": 1545.19, "total_tokens": 1517408} +{"current_steps": 3780, "total_steps": 4810, "loss": 0.2458, "lr": 6.677229364063328e-06, "epoch": 3.9293139293139294, "percentage": 78.59, "elapsed_time": "0:16:22", "remaining_time": "0:04:27", "throughput": 1546.7, "total_tokens": 1519392} +{"current_steps": 3785, "total_steps": 4810, "loss": 0.2596, "lr": 6.615635431363942e-06, "epoch": 3.9345114345114345, "percentage": 78.69, "elapsed_time": "0:16:22", "remaining_time": "0:04:26", "throughput": 1548.27, "total_tokens": 1521440} +{"current_steps": 3790, "total_steps": 4810, "loss": 0.2766, "lr": 6.554283552924118e-06, "epoch": 3.9397089397089395, "percentage": 78.79, "elapsed_time": "0:16:22", "remaining_time": "0:04:24", "throughput": 1549.84, "total_tokens": 1523488} +{"current_steps": 3795, "total_steps": 4810, "loss": 0.2551, "lr": 6.493174536521768e-06, "epoch": 3.944906444906445, "percentage": 78.9, "elapsed_time": "0:16:23", "remaining_time": "0:04:22", "throughput": 1551.48, "total_tokens": 1525600} +{"current_steps": 3800, "total_steps": 4810, "loss": 0.2612, "lr": 6.4323091867372095e-06, "epoch": 3.95010395010395, "percentage": 79.0, "elapsed_time": "0:16:23", "remaining_time": "0:04:21", "throughput": 1552.98, "total_tokens": 1527584} +{"current_steps": 3805, "total_steps": 4810, "loss": 0.2575, "lr": 6.371688304942544e-06, "epoch": 3.955301455301455, "percentage": 79.11, "elapsed_time": "0:16:23", "remaining_time": "0:04:19", "throughput": 1554.42, "total_tokens": 1529504} +{"current_steps": 3810, "total_steps": 4810, "loss": 0.2897, "lr": 6.311312689291166e-06, "epoch": 3.9604989604989607, "percentage": 79.21, "elapsed_time": "0:16:24", "remaining_time": "0:04:18", "throughput": 1555.86, "total_tokens": 1531424} +{"current_steps": 3815, "total_steps": 4810, "loss": 0.2366, "lr": 6.251183134707184e-06, "epoch": 3.9656964656964657, "percentage": 79.31, "elapsed_time": "0:16:24", "remaining_time": "0:04:16", "throughput": 1557.36, "total_tokens": 1533408} +{"current_steps": 3820, "total_steps": 4810, "loss": 0.2668, "lr": 6.191300432875017e-06, "epoch": 3.970893970893971, "percentage": 79.42, "elapsed_time": "0:16:24", "remaining_time": "0:04:15", "throughput": 1558.87, "total_tokens": 1535392} +{"current_steps": 3825, "total_steps": 4810, "loss": 0.1661, "lr": 6.13166537222894e-06, "epoch": 3.976091476091476, "percentage": 79.52, "elapsed_time": "0:16:25", "remaining_time": "0:04:13", "throughput": 1560.3, "total_tokens": 1537312} +{"current_steps": 3830, "total_steps": 4810, "loss": 0.28, "lr": 6.072278737942691e-06, "epoch": 3.9812889812889813, "percentage": 79.63, "elapsed_time": "0:16:25", "remaining_time": "0:04:12", "throughput": 1561.87, "total_tokens": 1539360} +{"current_steps": 3835, "total_steps": 4810, "loss": 0.3038, "lr": 6.0131413119191685e-06, "epoch": 3.9864864864864864, "percentage": 79.73, "elapsed_time": "0:16:25", "remaining_time": "0:04:10", "throughput": 1563.3, "total_tokens": 1541280} +{"current_steps": 3840, "total_steps": 4810, "loss": 0.2598, "lr": 5.954253872780102e-06, "epoch": 3.991683991683992, "percentage": 79.83, "elapsed_time": "0:16:26", "remaining_time": "0:04:09", "throughput": 1564.67, "total_tokens": 1543136} +{"current_steps": 3845, "total_steps": 4810, "loss": 0.2387, "lr": 5.8956171958558266e-06, "epoch": 3.996881496881497, "percentage": 79.94, "elapsed_time": "0:16:26", "remaining_time": "0:04:07", "throughput": 1566.17, "total_tokens": 1545120} +{"current_steps": 3850, "total_steps": 4810, "loss": 0.2258, "lr": 5.8372320531750655e-06, "epoch": 4.002079002079002, "percentage": 80.04, "elapsed_time": "0:16:26", "remaining_time": "0:04:06", "throughput": 1567.44, "total_tokens": 1547056} +{"current_steps": 3855, "total_steps": 4810, "loss": 0.279, "lr": 5.77909921345475e-06, "epoch": 4.007276507276507, "percentage": 80.15, "elapsed_time": "0:16:27", "remaining_time": "0:04:04", "throughput": 1568.87, "total_tokens": 1548976} +{"current_steps": 3856, "total_steps": 4810, "eval_loss": 0.25588732957839966, "epoch": 4.008316008316008, "percentage": 80.17, "elapsed_time": "0:16:28", "remaining_time": "0:04:04", "throughput": 1567.47, "total_tokens": 1549360} +{"current_steps": 3860, "total_steps": 4810, "loss": 0.2636, "lr": 5.721219442089926e-06, "epoch": 4.012474012474012, "percentage": 80.25, "elapsed_time": "0:16:53", "remaining_time": "0:04:09", "throughput": 1529.55, "total_tokens": 1550960} +{"current_steps": 3865, "total_steps": 4810, "loss": 0.2772, "lr": 5.663593501143663e-06, "epoch": 4.017671517671518, "percentage": 80.35, "elapsed_time": "0:16:54", "remaining_time": "0:04:08", "throughput": 1531.0, "total_tokens": 1552944} +{"current_steps": 3870, "total_steps": 4810, "loss": 0.2654, "lr": 5.6062221493370035e-06, "epoch": 4.022869022869023, "percentage": 80.46, "elapsed_time": "0:16:54", "remaining_time": "0:04:06", "throughput": 1532.51, "total_tokens": 1554992} +{"current_steps": 3875, "total_steps": 4810, "loss": 0.2682, "lr": 5.549106142039018e-06, "epoch": 4.028066528066528, "percentage": 80.56, "elapsed_time": "0:16:55", "remaining_time": "0:04:04", "throughput": 1534.07, "total_tokens": 1557104} +{"current_steps": 3880, "total_steps": 4810, "loss": 0.2818, "lr": 5.492246231256798e-06, "epoch": 4.033264033264033, "percentage": 80.67, "elapsed_time": "0:16:55", "remaining_time": "0:04:03", "throughput": 1535.52, "total_tokens": 1559088} +{"current_steps": 3885, "total_steps": 4810, "loss": 0.2739, "lr": 5.435643165625614e-06, "epoch": 4.038461538461538, "percentage": 80.77, "elapsed_time": "0:16:55", "remaining_time": "0:04:01", "throughput": 1536.9, "total_tokens": 1561008} +{"current_steps": 3890, "total_steps": 4810, "loss": 0.273, "lr": 5.379297690399035e-06, "epoch": 4.043659043659043, "percentage": 80.87, "elapsed_time": "0:16:56", "remaining_time": "0:04:00", "throughput": 1538.41, "total_tokens": 1563056} +{"current_steps": 3895, "total_steps": 4810, "loss": 0.2571, "lr": 5.3232105474390895e-06, "epoch": 4.048856548856548, "percentage": 80.98, "elapsed_time": "0:16:56", "remaining_time": "0:03:58", "throughput": 1539.85, "total_tokens": 1565040} +{"current_steps": 3900, "total_steps": 4810, "loss": 0.2529, "lr": 5.267382475206548e-06, "epoch": 4.054054054054054, "percentage": 81.08, "elapsed_time": "0:16:56", "remaining_time": "0:03:57", "throughput": 1541.29, "total_tokens": 1567024} +{"current_steps": 3905, "total_steps": 4810, "loss": 0.264, "lr": 5.2118142087511705e-06, "epoch": 4.0592515592515594, "percentage": 81.19, "elapsed_time": "0:16:57", "remaining_time": "0:03:55", "throughput": 1542.85, "total_tokens": 1569136} +{"current_steps": 3910, "total_steps": 4810, "loss": 0.2638, "lr": 5.156506479702019e-06, "epoch": 4.0644490644490645, "percentage": 81.29, "elapsed_time": "0:16:57", "remaining_time": "0:03:54", "throughput": 1544.3, "total_tokens": 1571120} +{"current_steps": 3915, "total_steps": 4810, "loss": 0.2652, "lr": 5.101460016257859e-06, "epoch": 4.06964656964657, "percentage": 81.39, "elapsed_time": "0:16:57", "remaining_time": "0:03:52", "throughput": 1545.7, "total_tokens": 1573040} +{"current_steps": 3920, "total_steps": 4810, "loss": 0.2582, "lr": 5.0466755431775316e-06, "epoch": 4.074844074844075, "percentage": 81.5, "elapsed_time": "0:16:58", "remaining_time": "0:03:51", "throughput": 1547.04, "total_tokens": 1574896} +{"current_steps": 3925, "total_steps": 4810, "loss": 0.2618, "lr": 4.992153781770448e-06, "epoch": 4.08004158004158, "percentage": 81.6, "elapsed_time": "0:16:58", "remaining_time": "0:03:49", "throughput": 1548.5, "total_tokens": 1576880} +{"current_steps": 3930, "total_steps": 4810, "loss": 0.2455, "lr": 4.937895449887075e-06, "epoch": 4.085239085239086, "percentage": 81.7, "elapsed_time": "0:16:58", "remaining_time": "0:03:48", "throughput": 1549.96, "total_tokens": 1578864} +{"current_steps": 3935, "total_steps": 4810, "loss": 0.2813, "lr": 4.883901261909465e-06, "epoch": 4.090436590436591, "percentage": 81.81, "elapsed_time": "0:16:58", "remaining_time": "0:03:46", "throughput": 1551.42, "total_tokens": 1580848} +{"current_steps": 3940, "total_steps": 4810, "loss": 0.2815, "lr": 4.8301719287419e-06, "epoch": 4.095634095634096, "percentage": 81.91, "elapsed_time": "0:16:59", "remaining_time": "0:03:45", "throughput": 1552.75, "total_tokens": 1582704} +{"current_steps": 3945, "total_steps": 4810, "loss": 0.2796, "lr": 4.776708157801463e-06, "epoch": 4.100831600831601, "percentage": 82.02, "elapsed_time": "0:16:59", "remaining_time": "0:03:43", "throughput": 1554.34, "total_tokens": 1584816} +{"current_steps": 3950, "total_steps": 4810, "loss": 0.2491, "lr": 4.7235106530088085e-06, "epoch": 4.106029106029106, "percentage": 82.12, "elapsed_time": "0:16:59", "remaining_time": "0:03:42", "throughput": 1555.79, "total_tokens": 1586800} +{"current_steps": 3955, "total_steps": 4810, "loss": 0.2528, "lr": 4.670580114778813e-06, "epoch": 4.111226611226611, "percentage": 82.22, "elapsed_time": "0:17:00", "remaining_time": "0:03:40", "throughput": 1557.19, "total_tokens": 1588720} +{"current_steps": 3960, "total_steps": 4810, "loss": 0.2732, "lr": 4.617917240011394e-06, "epoch": 4.116424116424117, "percentage": 82.33, "elapsed_time": "0:17:00", "remaining_time": "0:03:39", "throughput": 1558.52, "total_tokens": 1590576} +{"current_steps": 3965, "total_steps": 4810, "loss": 0.2573, "lr": 4.565522722082336e-06, "epoch": 4.121621621621622, "percentage": 82.43, "elapsed_time": "0:17:00", "remaining_time": "0:03:37", "throughput": 1559.91, "total_tokens": 1592496} +{"current_steps": 3970, "total_steps": 4810, "loss": 0.2638, "lr": 4.513397250834159e-06, "epoch": 4.126819126819127, "percentage": 82.54, "elapsed_time": "0:17:01", "remaining_time": "0:03:36", "throughput": 1561.43, "total_tokens": 1594544} +{"current_steps": 3975, "total_steps": 4810, "loss": 0.2925, "lr": 4.461541512567011e-06, "epoch": 4.132016632016632, "percentage": 82.64, "elapsed_time": "0:17:01", "remaining_time": "0:03:34", "throughput": 1562.76, "total_tokens": 1596400} +{"current_steps": 3980, "total_steps": 4810, "loss": 0.2786, "lr": 4.409956190029674e-06, "epoch": 4.137214137214137, "percentage": 82.74, "elapsed_time": "0:17:01", "remaining_time": "0:03:33", "throughput": 1564.15, "total_tokens": 1598320} +{"current_steps": 3985, "total_steps": 4810, "loss": 0.2286, "lr": 4.358641962410537e-06, "epoch": 4.142411642411642, "percentage": 82.85, "elapsed_time": "0:17:02", "remaining_time": "0:03:31", "throughput": 1565.65, "total_tokens": 1600368} +{"current_steps": 3990, "total_steps": 4810, "loss": 0.2986, "lr": 4.307599505328672e-06, "epoch": 4.147609147609147, "percentage": 82.95, "elapsed_time": "0:17:02", "remaining_time": "0:03:30", "throughput": 1567.1, "total_tokens": 1602352} +{"current_steps": 3995, "total_steps": 4810, "loss": 0.2363, "lr": 4.256829490824949e-06, "epoch": 4.152806652806653, "percentage": 83.06, "elapsed_time": "0:17:02", "remaining_time": "0:03:28", "throughput": 1568.54, "total_tokens": 1604336} +{"current_steps": 4000, "total_steps": 4810, "loss": 0.2652, "lr": 4.206332587353149e-06, "epoch": 4.158004158004158, "percentage": 83.16, "elapsed_time": "0:17:03", "remaining_time": "0:03:27", "throughput": 1569.92, "total_tokens": 1606256} +{"current_steps": 4005, "total_steps": 4810, "loss": 0.2641, "lr": 4.1561094597712155e-06, "epoch": 4.163201663201663, "percentage": 83.26, "elapsed_time": "0:17:03", "remaining_time": "0:03:25", "throughput": 1571.42, "total_tokens": 1608304} +{"current_steps": 4010, "total_steps": 4810, "loss": 0.2415, "lr": 4.106160769332443e-06, "epoch": 4.168399168399168, "percentage": 83.37, "elapsed_time": "0:17:03", "remaining_time": "0:03:24", "throughput": 1573.04, "total_tokens": 1610480} +{"current_steps": 4015, "total_steps": 4810, "loss": 0.2449, "lr": 4.056487173676843e-06, "epoch": 4.173596673596673, "percentage": 83.47, "elapsed_time": "0:17:04", "remaining_time": "0:03:22", "throughput": 1574.54, "total_tokens": 1612528} +{"current_steps": 4020, "total_steps": 4810, "loss": 0.2742, "lr": 4.007089326822405e-06, "epoch": 4.1787941787941785, "percentage": 83.58, "elapsed_time": "0:17:04", "remaining_time": "0:03:21", "throughput": 1576.04, "total_tokens": 1614576} +{"current_steps": 4025, "total_steps": 4810, "loss": 0.264, "lr": 3.957967879156533e-06, "epoch": 4.183991683991684, "percentage": 83.68, "elapsed_time": "0:17:04", "remaining_time": "0:03:19", "throughput": 1577.54, "total_tokens": 1616624} +{"current_steps": 4030, "total_steps": 4810, "loss": 0.2548, "lr": 3.909123477427487e-06, "epoch": 4.1891891891891895, "percentage": 83.78, "elapsed_time": "0:17:05", "remaining_time": "0:03:18", "throughput": 1579.03, "total_tokens": 1618672} +{"current_steps": 4035, "total_steps": 4810, "loss": 0.2113, "lr": 3.860556764735842e-06, "epoch": 4.1943866943866945, "percentage": 83.89, "elapsed_time": "0:17:05", "remaining_time": "0:03:16", "throughput": 1580.59, "total_tokens": 1620784} +{"current_steps": 4040, "total_steps": 4810, "loss": 0.3261, "lr": 3.812268380526046e-06, "epoch": 4.1995841995842, "percentage": 83.99, "elapsed_time": "0:17:05", "remaining_time": "0:03:15", "throughput": 1582.02, "total_tokens": 1622768} +{"current_steps": 4045, "total_steps": 4810, "loss": 0.2481, "lr": 3.764258960577971e-06, "epoch": 4.204781704781705, "percentage": 84.1, "elapsed_time": "0:17:06", "remaining_time": "0:03:14", "throughput": 1583.39, "total_tokens": 1624688} +{"current_steps": 4050, "total_steps": 4810, "loss": 0.2599, "lr": 3.7165291369985618e-06, "epoch": 4.20997920997921, "percentage": 84.2, "elapsed_time": "0:17:06", "remaining_time": "0:03:12", "throughput": 1584.82, "total_tokens": 1626672} +{"current_steps": 4055, "total_steps": 4810, "loss": 0.258, "lr": 3.6690795382135186e-06, "epoch": 4.215176715176715, "percentage": 84.3, "elapsed_time": "0:17:06", "remaining_time": "0:03:11", "throughput": 1586.43, "total_tokens": 1628848} +{"current_steps": 4060, "total_steps": 4810, "loss": 0.2809, "lr": 3.6219107889590155e-06, "epoch": 4.220374220374221, "percentage": 84.41, "elapsed_time": "0:17:07", "remaining_time": "0:03:09", "throughput": 1587.86, "total_tokens": 1630832} +{"current_steps": 4065, "total_steps": 4810, "loss": 0.2292, "lr": 3.575023510273462e-06, "epoch": 4.225571725571726, "percentage": 84.51, "elapsed_time": "0:17:07", "remaining_time": "0:03:08", "throughput": 1589.34, "total_tokens": 1632880} +{"current_steps": 4070, "total_steps": 4810, "loss": 0.2871, "lr": 3.5284183194893488e-06, "epoch": 4.230769230769231, "percentage": 84.62, "elapsed_time": "0:17:07", "remaining_time": "0:03:06", "throughput": 1590.88, "total_tokens": 1634992} +{"current_steps": 4075, "total_steps": 4810, "loss": 0.2634, "lr": 3.48209583022511e-06, "epoch": 4.235966735966736, "percentage": 84.72, "elapsed_time": "0:17:08", "remaining_time": "0:03:05", "throughput": 1592.24, "total_tokens": 1636912} +{"current_steps": 4080, "total_steps": 4810, "loss": 0.2477, "lr": 3.4360566523770426e-06, "epoch": 4.241164241164241, "percentage": 84.82, "elapsed_time": "0:17:08", "remaining_time": "0:03:04", "throughput": 1593.59, "total_tokens": 1638832} +{"current_steps": 4085, "total_steps": 4810, "loss": 0.2351, "lr": 3.3903013921112755e-06, "epoch": 4.246361746361746, "percentage": 84.93, "elapsed_time": "0:17:08", "remaining_time": "0:03:02", "throughput": 1595.25, "total_tokens": 1641072} +{"current_steps": 4090, "total_steps": 4810, "loss": 0.2808, "lr": 3.3448306518557795e-06, "epoch": 4.251559251559252, "percentage": 85.03, "elapsed_time": "0:17:09", "remaining_time": "0:03:01", "throughput": 1596.61, "total_tokens": 1642992} +{"current_steps": 4095, "total_steps": 4810, "loss": 0.2511, "lr": 3.299645030292467e-06, "epoch": 4.256756756756757, "percentage": 85.14, "elapsed_time": "0:17:09", "remaining_time": "0:02:59", "throughput": 1598.09, "total_tokens": 1645040} +{"current_steps": 4097, "total_steps": 4810, "eval_loss": 0.2517484128475189, "epoch": 4.258835758835759, "percentage": 85.18, "elapsed_time": "0:17:10", "remaining_time": "0:02:59", "throughput": 1597.01, "total_tokens": 1645808} +{"current_steps": 4100, "total_steps": 4810, "loss": 0.2495, "lr": 3.2547451223492786e-06, "epoch": 4.261954261954262, "percentage": 85.24, "elapsed_time": "0:17:59", "remaining_time": "0:03:06", "throughput": 1526.33, "total_tokens": 1647024} +{"current_steps": 4105, "total_steps": 4810, "loss": 0.2774, "lr": 3.2101315191923663e-06, "epoch": 4.267151767151767, "percentage": 85.34, "elapsed_time": "0:17:59", "remaining_time": "0:03:05", "throughput": 1527.71, "total_tokens": 1649008} +{"current_steps": 4110, "total_steps": 4810, "loss": 0.2208, "lr": 3.165804808218292e-06, "epoch": 4.272349272349272, "percentage": 85.45, "elapsed_time": "0:17:59", "remaining_time": "0:03:03", "throughput": 1529.14, "total_tokens": 1651056} +{"current_steps": 4115, "total_steps": 4810, "loss": 0.2601, "lr": 3.1217655730463093e-06, "epoch": 4.277546777546777, "percentage": 85.55, "elapsed_time": "0:18:00", "remaining_time": "0:03:02", "throughput": 1530.58, "total_tokens": 1653104} +{"current_steps": 4120, "total_steps": 4810, "loss": 0.2427, "lr": 3.078014393510695e-06, "epoch": 4.282744282744282, "percentage": 85.65, "elapsed_time": "0:18:00", "remaining_time": "0:03:00", "throughput": 1532.18, "total_tokens": 1655344} +{"current_steps": 4125, "total_steps": 4810, "loss": 0.2959, "lr": 3.0345518456530665e-06, "epoch": 4.287941787941788, "percentage": 85.76, "elapsed_time": "0:18:00", "remaining_time": "0:02:59", "throughput": 1533.62, "total_tokens": 1657392} +{"current_steps": 4130, "total_steps": 4810, "loss": 0.2807, "lr": 2.991378501714856e-06, "epoch": 4.293139293139293, "percentage": 85.86, "elapsed_time": "0:18:01", "remaining_time": "0:02:57", "throughput": 1534.93, "total_tokens": 1659312} +{"current_steps": 4135, "total_steps": 4810, "loss": 0.2579, "lr": 2.9484949301297166e-06, "epoch": 4.298336798336798, "percentage": 85.97, "elapsed_time": "0:18:01", "remaining_time": "0:02:56", "throughput": 1536.42, "total_tokens": 1661424} +{"current_steps": 4140, "total_steps": 4810, "loss": 0.2498, "lr": 2.9059016955160916e-06, "epoch": 4.303534303534303, "percentage": 86.07, "elapsed_time": "0:18:01", "remaining_time": "0:02:55", "throughput": 1537.79, "total_tokens": 1663408} +{"current_steps": 4145, "total_steps": 4810, "loss": 0.226, "lr": 2.8635993586697553e-06, "epoch": 4.3087318087318085, "percentage": 86.17, "elapsed_time": "0:18:02", "remaining_time": "0:02:53", "throughput": 1539.11, "total_tokens": 1665328} +{"current_steps": 4150, "total_steps": 4810, "loss": 0.2687, "lr": 2.8215884765564193e-06, "epoch": 4.313929313929314, "percentage": 86.28, "elapsed_time": "0:18:02", "remaining_time": "0:02:52", "throughput": 1540.48, "total_tokens": 1667312} +{"current_steps": 4155, "total_steps": 4810, "loss": 0.1693, "lr": 2.7798696023044163e-06, "epoch": 4.3191268191268195, "percentage": 86.38, "elapsed_time": "0:18:02", "remaining_time": "0:02:50", "throughput": 1541.85, "total_tokens": 1669296} +{"current_steps": 4160, "total_steps": 4810, "loss": 0.2217, "lr": 2.73844328519742e-06, "epoch": 4.324324324324325, "percentage": 86.49, "elapsed_time": "0:18:02", "remaining_time": "0:02:49", "throughput": 1543.21, "total_tokens": 1671280} +{"current_steps": 4165, "total_steps": 4810, "loss": 0.2814, "lr": 2.6973100706672e-06, "epoch": 4.32952182952183, "percentage": 86.59, "elapsed_time": "0:18:03", "remaining_time": "0:02:47", "throughput": 1544.76, "total_tokens": 1673456} +{"current_steps": 4170, "total_steps": 4810, "loss": 0.2523, "lr": 2.656470500286451e-06, "epoch": 4.334719334719335, "percentage": 86.69, "elapsed_time": "0:18:03", "remaining_time": "0:02:46", "throughput": 1546.18, "total_tokens": 1675504} +{"current_steps": 4175, "total_steps": 4810, "loss": 0.228, "lr": 2.615925111761647e-06, "epoch": 4.33991683991684, "percentage": 86.8, "elapsed_time": "0:18:03", "remaining_time": "0:02:44", "throughput": 1547.55, "total_tokens": 1677488} +{"current_steps": 4180, "total_steps": 4810, "loss": 0.2399, "lr": 2.5756744389259734e-06, "epoch": 4.345114345114345, "percentage": 86.9, "elapsed_time": "0:18:04", "remaining_time": "0:02:43", "throughput": 1548.98, "total_tokens": 1679536} +{"current_steps": 4185, "total_steps": 4810, "loss": 0.2345, "lr": 2.535719011732321e-06, "epoch": 4.350311850311851, "percentage": 87.01, "elapsed_time": "0:18:04", "remaining_time": "0:02:41", "throughput": 1550.34, "total_tokens": 1681520} +{"current_steps": 4190, "total_steps": 4810, "loss": 0.2726, "lr": 2.49605935624625e-06, "epoch": 4.355509355509356, "percentage": 87.11, "elapsed_time": "0:18:04", "remaining_time": "0:02:40", "throughput": 1551.77, "total_tokens": 1683568} +{"current_steps": 4195, "total_steps": 4810, "loss": 0.236, "lr": 2.4566959946391243e-06, "epoch": 4.360706860706861, "percentage": 87.21, "elapsed_time": "0:18:05", "remaining_time": "0:02:39", "throughput": 1553.07, "total_tokens": 1685488} +{"current_steps": 4200, "total_steps": 4810, "loss": 0.2476, "lr": 2.417629445181194e-06, "epoch": 4.365904365904366, "percentage": 87.32, "elapsed_time": "0:18:05", "remaining_time": "0:02:37", "throughput": 1554.38, "total_tokens": 1687408} +{"current_steps": 4205, "total_steps": 4810, "loss": 0.2325, "lr": 2.378860222234794e-06, "epoch": 4.371101871101871, "percentage": 87.42, "elapsed_time": "0:18:05", "remaining_time": "0:02:36", "throughput": 1555.85, "total_tokens": 1689520} +{"current_steps": 4210, "total_steps": 4810, "loss": 0.2749, "lr": 2.3403888362475782e-06, "epoch": 4.376299376299376, "percentage": 87.53, "elapsed_time": "0:18:06", "remaining_time": "0:02:34", "throughput": 1557.27, "total_tokens": 1691568} +{"current_steps": 4215, "total_steps": 4810, "loss": 0.2235, "lr": 2.3022157937457627e-06, "epoch": 4.381496881496881, "percentage": 87.63, "elapsed_time": "0:18:06", "remaining_time": "0:02:33", "throughput": 1558.69, "total_tokens": 1693616} +{"current_steps": 4220, "total_steps": 4810, "loss": 0.2369, "lr": 2.2643415973275016e-06, "epoch": 4.386694386694387, "percentage": 87.73, "elapsed_time": "0:18:06", "remaining_time": "0:02:31", "throughput": 1560.05, "total_tokens": 1695600} +{"current_steps": 4225, "total_steps": 4810, "loss": 0.285, "lr": 2.2267667456562307e-06, "epoch": 4.391891891891892, "percentage": 87.84, "elapsed_time": "0:18:07", "remaining_time": "0:02:30", "throughput": 1561.41, "total_tokens": 1697584} +{"current_steps": 4230, "total_steps": 4810, "loss": 0.2273, "lr": 2.1894917334541354e-06, "epoch": 4.397089397089397, "percentage": 87.94, "elapsed_time": "0:18:07", "remaining_time": "0:02:29", "throughput": 1562.77, "total_tokens": 1699568} +{"current_steps": 4235, "total_steps": 4810, "loss": 0.2953, "lr": 2.15251705149562e-06, "epoch": 4.402286902286902, "percentage": 88.05, "elapsed_time": "0:18:07", "remaining_time": "0:02:27", "throughput": 1564.3, "total_tokens": 1701744} +{"current_steps": 4240, "total_steps": 4810, "loss": 0.2404, "lr": 2.11584318660083e-06, "epoch": 4.407484407484407, "percentage": 88.15, "elapsed_time": "0:18:08", "remaining_time": "0:02:26", "throughput": 1565.54, "total_tokens": 1703600} +{"current_steps": 4245, "total_steps": 4810, "loss": 0.3067, "lr": 2.0794706216292813e-06, "epoch": 4.412681912681912, "percentage": 88.25, "elapsed_time": "0:18:08", "remaining_time": "0:02:24", "throughput": 1567.01, "total_tokens": 1705712} +{"current_steps": 4250, "total_steps": 4810, "loss": 0.2088, "lr": 2.043399835473475e-06, "epoch": 4.417879417879418, "percentage": 88.36, "elapsed_time": "0:18:08", "remaining_time": "0:02:23", "throughput": 1568.36, "total_tokens": 1707696} +{"current_steps": 4255, "total_steps": 4810, "loss": 0.2195, "lr": 2.0076313030525844e-06, "epoch": 4.423076923076923, "percentage": 88.46, "elapsed_time": "0:18:09", "remaining_time": "0:02:22", "throughput": 1569.77, "total_tokens": 1709744} +{"current_steps": 4260, "total_steps": 4810, "loss": 0.2399, "lr": 1.972165495306241e-06, "epoch": 4.428274428274428, "percentage": 88.57, "elapsed_time": "0:18:09", "remaining_time": "0:02:20", "throughput": 1571.18, "total_tokens": 1711792} +{"current_steps": 4265, "total_steps": 4810, "loss": 0.2491, "lr": 1.937002879188285e-06, "epoch": 4.4334719334719335, "percentage": 88.67, "elapsed_time": "0:18:09", "remaining_time": "0:02:19", "throughput": 1572.65, "total_tokens": 1713904} +{"current_steps": 4270, "total_steps": 4810, "loss": 0.2257, "lr": 1.9021439176606564e-06, "epoch": 4.4386694386694385, "percentage": 88.77, "elapsed_time": "0:18:10", "remaining_time": "0:02:17", "throughput": 1573.94, "total_tokens": 1715824} +{"current_steps": 4275, "total_steps": 4810, "loss": 0.2438, "lr": 1.8675890696872838e-06, "epoch": 4.443866943866944, "percentage": 88.88, "elapsed_time": "0:18:10", "remaining_time": "0:02:16", "throughput": 1575.29, "total_tokens": 1717808} +{"current_steps": 4280, "total_steps": 4810, "loss": 0.2773, "lr": 1.8333387902280314e-06, "epoch": 4.4490644490644495, "percentage": 88.98, "elapsed_time": "0:18:10", "remaining_time": "0:02:15", "throughput": 1576.69, "total_tokens": 1719856} +{"current_steps": 4285, "total_steps": 4810, "loss": 0.2193, "lr": 1.7993935302327292e-06, "epoch": 4.454261954261955, "percentage": 89.09, "elapsed_time": "0:18:11", "remaining_time": "0:02:13", "throughput": 1577.99, "total_tokens": 1721776} +{"current_steps": 4290, "total_steps": 4810, "loss": 0.238, "lr": 1.7657537366352338e-06, "epoch": 4.45945945945946, "percentage": 89.19, "elapsed_time": "0:18:11", "remaining_time": "0:02:12", "throughput": 1579.22, "total_tokens": 1723632} +{"current_steps": 4295, "total_steps": 4810, "loss": 0.1772, "lr": 1.732419852347511e-06, "epoch": 4.464656964656965, "percentage": 89.29, "elapsed_time": "0:18:11", "remaining_time": "0:02:10", "throughput": 1580.45, "total_tokens": 1725488} +{"current_steps": 4300, "total_steps": 4810, "loss": 0.2837, "lr": 1.699392316253856e-06, "epoch": 4.46985446985447, "percentage": 89.4, "elapsed_time": "0:18:12", "remaining_time": "0:02:09", "throughput": 1581.91, "total_tokens": 1727600} +{"current_steps": 4305, "total_steps": 4810, "loss": 0.2494, "lr": 1.666671563205069e-06, "epoch": 4.475051975051975, "percentage": 89.5, "elapsed_time": "0:18:12", "remaining_time": "0:02:08", "throughput": 1583.37, "total_tokens": 1729712} +{"current_steps": 4310, "total_steps": 4810, "loss": 0.269, "lr": 1.6342580240127582e-06, "epoch": 4.48024948024948, "percentage": 89.6, "elapsed_time": "0:18:12", "remaining_time": "0:02:06", "throughput": 1584.71, "total_tokens": 1731696} +{"current_steps": 4315, "total_steps": 4810, "loss": 0.2551, "lr": 1.6021521254436678e-06, "epoch": 4.485446985446986, "percentage": 89.71, "elapsed_time": "0:18:13", "remaining_time": "0:02:05", "throughput": 1586.11, "total_tokens": 1733744} +{"current_steps": 4320, "total_steps": 4810, "loss": 0.2408, "lr": 1.5703542902140294e-06, "epoch": 4.490644490644491, "percentage": 89.81, "elapsed_time": "0:18:13", "remaining_time": "0:02:04", "throughput": 1587.46, "total_tokens": 1735728} +{"current_steps": 4325, "total_steps": 4810, "loss": 0.1891, "lr": 1.5388649369840357e-06, "epoch": 4.495841995841996, "percentage": 89.92, "elapsed_time": "0:18:13", "remaining_time": "0:02:02", "throughput": 1588.86, "total_tokens": 1737776} +{"current_steps": 4330, "total_steps": 4810, "loss": 0.2684, "lr": 1.5076844803522922e-06, "epoch": 4.501039501039501, "percentage": 90.02, "elapsed_time": "0:18:14", "remaining_time": "0:02:01", "throughput": 1590.26, "total_tokens": 1739824} +{"current_steps": 4335, "total_steps": 4810, "loss": 0.2709, "lr": 1.476813330850388e-06, "epoch": 4.506237006237006, "percentage": 90.12, "elapsed_time": "0:18:14", "remaining_time": "0:01:59", "throughput": 1591.54, "total_tokens": 1741744} +{"current_steps": 4338, "total_steps": 4810, "eval_loss": 0.2577267587184906, "epoch": 4.509355509355509, "percentage": 90.19, "elapsed_time": "0:18:15", "remaining_time": "0:01:59", "throughput": 1590.85, "total_tokens": 1742960} +{"current_steps": 4340, "total_steps": 4810, "loss": 0.2731, "lr": 1.4462518949374838e-06, "epoch": 4.511434511434511, "percentage": 90.23, "elapsed_time": "0:18:39", "remaining_time": "0:02:01", "throughput": 1558.23, "total_tokens": 1743728} +{"current_steps": 4345, "total_steps": 4810, "loss": 0.2431, "lr": 1.4160005749949328e-06, "epoch": 4.516632016632016, "percentage": 90.33, "elapsed_time": "0:18:39", "remaining_time": "0:01:59", "throughput": 1559.72, "total_tokens": 1745904} +{"current_steps": 4350, "total_steps": 4810, "loss": 0.2649, "lr": 1.386059769321027e-06, "epoch": 4.521829521829522, "percentage": 90.44, "elapsed_time": "0:18:39", "remaining_time": "0:01:58", "throughput": 1560.96, "total_tokens": 1747824} +{"current_steps": 4355, "total_steps": 4810, "loss": 0.2569, "lr": 1.3564298721257223e-06, "epoch": 4.527027027027027, "percentage": 90.54, "elapsed_time": "0:18:40", "remaining_time": "0:01:57", "throughput": 1562.34, "total_tokens": 1749872} +{"current_steps": 4360, "total_steps": 4810, "loss": 0.1998, "lr": 1.3271112735254498e-06, "epoch": 4.532224532224532, "percentage": 90.64, "elapsed_time": "0:18:40", "remaining_time": "0:01:55", "throughput": 1563.6, "total_tokens": 1751792} +{"current_steps": 4365, "total_steps": 4810, "loss": 0.251, "lr": 1.298104359538005e-06, "epoch": 4.537422037422037, "percentage": 90.75, "elapsed_time": "0:18:40", "remaining_time": "0:01:54", "throughput": 1564.91, "total_tokens": 1753776} +{"current_steps": 4370, "total_steps": 4810, "loss": 0.2705, "lr": 1.269409512077427e-06, "epoch": 4.542619542619542, "percentage": 90.85, "elapsed_time": "0:18:41", "remaining_time": "0:01:52", "throughput": 1566.28, "total_tokens": 1755824} +{"current_steps": 4375, "total_steps": 4810, "loss": 0.202, "lr": 1.241027108949e-06, "epoch": 4.547817047817047, "percentage": 90.96, "elapsed_time": "0:18:41", "remaining_time": "0:01:51", "throughput": 1567.77, "total_tokens": 1758000} +{"current_steps": 4380, "total_steps": 4810, "loss": 0.2565, "lr": 1.2129575238442715e-06, "epoch": 4.553014553014553, "percentage": 91.06, "elapsed_time": "0:18:41", "remaining_time": "0:01:50", "throughput": 1569.08, "total_tokens": 1759984} +{"current_steps": 4385, "total_steps": 4810, "loss": 0.2607, "lr": 1.185201126336122e-06, "epoch": 4.558212058212058, "percentage": 91.16, "elapsed_time": "0:18:41", "remaining_time": "0:01:48", "throughput": 1570.38, "total_tokens": 1761968} +{"current_steps": 4390, "total_steps": 4810, "loss": 0.2392, "lr": 1.1577582818739135e-06, "epoch": 4.5634095634095635, "percentage": 91.27, "elapsed_time": "0:18:42", "remaining_time": "0:01:47", "throughput": 1571.74, "total_tokens": 1764016} +{"current_steps": 4395, "total_steps": 4810, "loss": 0.2808, "lr": 1.1306293517786614e-06, "epoch": 4.5686070686070686, "percentage": 91.37, "elapsed_time": "0:18:42", "remaining_time": "0:01:46", "throughput": 1572.99, "total_tokens": 1765936} +{"current_steps": 4400, "total_steps": 4810, "loss": 0.1891, "lr": 1.1038146932383004e-06, "epoch": 4.573804573804574, "percentage": 91.48, "elapsed_time": "0:18:42", "remaining_time": "0:01:44", "throughput": 1574.35, "total_tokens": 1767984} +{"current_steps": 4405, "total_steps": 4810, "loss": 0.2029, "lr": 1.0773146593029637e-06, "epoch": 4.579002079002079, "percentage": 91.58, "elapsed_time": "0:18:43", "remaining_time": "0:01:43", "throughput": 1575.6, "total_tokens": 1769904} +{"current_steps": 4410, "total_steps": 4810, "loss": 0.2743, "lr": 1.0511295988803294e-06, "epoch": 4.584199584199585, "percentage": 91.68, "elapsed_time": "0:18:43", "remaining_time": "0:01:41", "throughput": 1576.89, "total_tokens": 1771888} +{"current_steps": 4415, "total_steps": 4810, "loss": 0.2115, "lr": 1.0252598567310451e-06, "epoch": 4.58939708939709, "percentage": 91.79, "elapsed_time": "0:18:43", "remaining_time": "0:01:40", "throughput": 1578.25, "total_tokens": 1773936} +{"current_steps": 4420, "total_steps": 4810, "loss": 0.2778, "lr": 9.99705773464185e-07, "epoch": 4.594594594594595, "percentage": 91.89, "elapsed_time": "0:18:44", "remaining_time": "0:01:39", "throughput": 1579.61, "total_tokens": 1775984} +{"current_steps": 4425, "total_steps": 4810, "loss": 0.2428, "lr": 9.744676855327483e-07, "epoch": 4.5997920997921, "percentage": 92.0, "elapsed_time": "0:18:44", "remaining_time": "0:01:37", "throughput": 1580.79, "total_tokens": 1777840} +{"current_steps": 4430, "total_steps": 4810, "loss": 0.2124, "lr": 9.495459252292504e-07, "epoch": 4.604989604989605, "percentage": 92.1, "elapsed_time": "0:18:44", "remaining_time": "0:01:36", "throughput": 1582.08, "total_tokens": 1779824} +{"current_steps": 4435, "total_steps": 4810, "loss": 0.1939, "lr": 9.249408206813332e-07, "epoch": 4.61018711018711, "percentage": 92.2, "elapsed_time": "0:18:45", "remaining_time": "0:01:35", "throughput": 1583.43, "total_tokens": 1781872} +{"current_steps": 4440, "total_steps": 4810, "loss": 0.2364, "lr": 9.006526958474509e-07, "epoch": 4.615384615384615, "percentage": 92.31, "elapsed_time": "0:18:45", "remaining_time": "0:01:33", "throughput": 1584.84, "total_tokens": 1783984} +{"current_steps": 4445, "total_steps": 4810, "loss": 0.2023, "lr": 8.766818705126134e-07, "epoch": 4.620582120582121, "percentage": 92.41, "elapsed_time": "0:18:45", "remaining_time": "0:01:32", "throughput": 1586.18, "total_tokens": 1786032} +{"current_steps": 4450, "total_steps": 4810, "loss": 0.2455, "lr": 8.530286602841525e-07, "epoch": 4.625779625779626, "percentage": 92.52, "elapsed_time": "0:18:46", "remaining_time": "0:01:31", "throughput": 1587.47, "total_tokens": 1788016} +{"current_steps": 4455, "total_steps": 4810, "loss": 0.2154, "lr": 8.296933765875897e-07, "epoch": 4.630977130977131, "percentage": 92.62, "elapsed_time": "0:18:46", "remaining_time": "0:01:29", "throughput": 1588.82, "total_tokens": 1790064} +{"current_steps": 4460, "total_steps": 4810, "loss": 0.2046, "lr": 8.066763266625282e-07, "epoch": 4.636174636174636, "percentage": 92.72, "elapsed_time": "0:18:46", "remaining_time": "0:01:28", "throughput": 1590.05, "total_tokens": 1791984} +{"current_steps": 4465, "total_steps": 4810, "loss": 0.1884, "lr": 7.839778135586007e-07, "epoch": 4.641372141372141, "percentage": 92.83, "elapsed_time": "0:18:47", "remaining_time": "0:01:27", "throughput": 1591.29, "total_tokens": 1793904} +{"current_steps": 4470, "total_steps": 4810, "loss": 0.223, "lr": 7.615981361314889e-07, "epoch": 4.646569646569646, "percentage": 92.93, "elapsed_time": "0:18:47", "remaining_time": "0:01:25", "throughput": 1592.58, "total_tokens": 1795888} +{"current_steps": 4475, "total_steps": 4810, "loss": 0.3424, "lr": 7.3953758903898e-07, "epoch": 4.651767151767151, "percentage": 93.04, "elapsed_time": "0:18:47", "remaining_time": "0:01:24", "throughput": 1593.87, "total_tokens": 1797872} +{"current_steps": 4480, "total_steps": 4810, "loss": 0.2152, "lr": 7.177964627370997e-07, "epoch": 4.656964656964657, "percentage": 93.14, "elapsed_time": "0:18:48", "remaining_time": "0:01:23", "throughput": 1595.23, "total_tokens": 1799920} +{"current_steps": 4485, "total_steps": 4810, "loss": 0.2628, "lr": 6.963750434762745e-07, "epoch": 4.662162162162162, "percentage": 93.24, "elapsed_time": "0:18:48", "remaining_time": "0:01:21", "throughput": 1596.41, "total_tokens": 1801776} +{"current_steps": 4490, "total_steps": 4810, "loss": 0.2974, "lr": 6.752736132975696e-07, "epoch": 4.667359667359667, "percentage": 93.35, "elapsed_time": "0:18:48", "remaining_time": "0:01:20", "throughput": 1597.75, "total_tokens": 1803824} +{"current_steps": 4495, "total_steps": 4810, "loss": 0.1697, "lr": 6.54492450028979e-07, "epoch": 4.672557172557172, "percentage": 93.45, "elapsed_time": "0:18:49", "remaining_time": "0:01:19", "throughput": 1598.98, "total_tokens": 1805744} +{"current_steps": 4500, "total_steps": 4810, "loss": 0.2489, "lr": 6.340318272817474e-07, "epoch": 4.6777546777546775, "percentage": 93.56, "elapsed_time": "0:18:49", "remaining_time": "0:01:17", "throughput": 1600.27, "total_tokens": 1807728} +{"current_steps": 4505, "total_steps": 4810, "loss": 0.255, "lr": 6.138920144468124e-07, "epoch": 4.682952182952183, "percentage": 93.66, "elapsed_time": "0:18:49", "remaining_time": "0:01:16", "throughput": 1601.55, "total_tokens": 1809712} +{"current_steps": 4510, "total_steps": 4810, "loss": 0.2946, "lr": 5.94073276691201e-07, "epoch": 4.6881496881496885, "percentage": 93.76, "elapsed_time": "0:18:50", "remaining_time": "0:01:15", "throughput": 1602.78, "total_tokens": 1811632} +{"current_steps": 4515, "total_steps": 4810, "loss": 0.2011, "lr": 5.745758749545749e-07, "epoch": 4.6933471933471935, "percentage": 93.87, "elapsed_time": "0:18:50", "remaining_time": "0:01:13", "throughput": 1604.01, "total_tokens": 1813552} +{"current_steps": 4520, "total_steps": 4810, "loss": 0.2354, "lr": 5.554000659457881e-07, "epoch": 4.698544698544699, "percentage": 93.97, "elapsed_time": "0:18:50", "remaining_time": "0:01:12", "throughput": 1605.4, "total_tokens": 1815664} +{"current_steps": 4525, "total_steps": 4810, "loss": 0.2284, "lr": 5.365461021395096e-07, "epoch": 4.703742203742204, "percentage": 94.07, "elapsed_time": "0:18:51", "remaining_time": "0:01:11", "throughput": 1606.68, "total_tokens": 1817648} +{"current_steps": 4530, "total_steps": 4810, "loss": 0.2259, "lr": 5.180142317728815e-07, "epoch": 4.708939708939709, "percentage": 94.18, "elapsed_time": "0:18:51", "remaining_time": "0:01:09", "throughput": 1608.02, "total_tokens": 1819696} +{"current_steps": 4535, "total_steps": 4810, "loss": 0.269, "lr": 4.998046988422766e-07, "epoch": 4.714137214137214, "percentage": 94.28, "elapsed_time": "0:18:51", "remaining_time": "0:01:08", "throughput": 1609.3, "total_tokens": 1821680} +{"current_steps": 4540, "total_steps": 4810, "loss": 0.2786, "lr": 4.819177431000604e-07, "epoch": 4.71933471933472, "percentage": 94.39, "elapsed_time": "0:18:52", "remaining_time": "0:01:07", "throughput": 1610.64, "total_tokens": 1823728} +{"current_steps": 4545, "total_steps": 4810, "loss": 0.3228, "lr": 4.6435360005145644e-07, "epoch": 4.724532224532225, "percentage": 94.49, "elapsed_time": "0:18:52", "remaining_time": "0:01:06", "throughput": 1611.92, "total_tokens": 1825712} +{"current_steps": 4550, "total_steps": 4810, "loss": 0.2664, "lr": 4.4711250095143267e-07, "epoch": 4.72972972972973, "percentage": 94.59, "elapsed_time": "0:18:52", "remaining_time": "0:01:04", "throughput": 1613.25, "total_tokens": 1827760} +{"current_steps": 4555, "total_steps": 4810, "loss": 0.2014, "lr": 4.30194672801662e-07, "epoch": 4.734927234927235, "percentage": 94.7, "elapsed_time": "0:18:53", "remaining_time": "0:01:03", "throughput": 1614.47, "total_tokens": 1829680} +{"current_steps": 4560, "total_steps": 4810, "loss": 0.2992, "lr": 4.136003383475251e-07, "epoch": 4.74012474012474, "percentage": 94.8, "elapsed_time": "0:18:53", "remaining_time": "0:01:02", "throughput": 1615.81, "total_tokens": 1831728} +{"current_steps": 4565, "total_steps": 4810, "loss": 0.2033, "lr": 3.9732971607519265e-07, "epoch": 4.745322245322245, "percentage": 94.91, "elapsed_time": "0:18:53", "remaining_time": "0:01:00", "throughput": 1617.02, "total_tokens": 1833648} +{"current_steps": 4570, "total_steps": 4810, "loss": 0.2388, "lr": 3.8138302020873373e-07, "epoch": 4.75051975051975, "percentage": 95.01, "elapsed_time": "0:18:54", "remaining_time": "0:00:59", "throughput": 1618.36, "total_tokens": 1835696} +{"current_steps": 4575, "total_steps": 4810, "loss": 0.2582, "lr": 3.6576046070730675e-07, "epoch": 4.755717255717256, "percentage": 95.11, "elapsed_time": "0:18:54", "remaining_time": "0:00:58", "throughput": 1619.75, "total_tokens": 1837808} +{"current_steps": 4579, "total_steps": 4810, "eval_loss": 0.2604904770851135, "epoch": 4.75987525987526, "percentage": 95.2, "elapsed_time": "0:18:55", "remaining_time": "0:00:57", "throughput": 1619.22, "total_tokens": 1839344} +{"current_steps": 4580, "total_steps": 4810, "loss": 0.2365, "lr": 3.5046224326238107e-07, "epoch": 4.760914760914761, "percentage": 95.22, "elapsed_time": "0:19:38", "remaining_time": "0:00:59", "throughput": 1561.72, "total_tokens": 1839728} +{"current_steps": 4585, "total_steps": 4810, "loss": 0.2569, "lr": 3.3548856929505047e-07, "epoch": 4.766112266112266, "percentage": 95.32, "elapsed_time": "0:19:38", "remaining_time": "0:00:57", "throughput": 1563.03, "total_tokens": 1841776} +{"current_steps": 4590, "total_steps": 4810, "loss": 0.2548, "lr": 3.208396359533572e-07, "epoch": 4.771309771309771, "percentage": 95.43, "elapsed_time": "0:19:38", "remaining_time": "0:00:56", "throughput": 1564.22, "total_tokens": 1843696} +{"current_steps": 4595, "total_steps": 4810, "loss": 0.2391, "lr": 3.065156361097138e-07, "epoch": 4.776507276507276, "percentage": 95.53, "elapsed_time": "0:19:38", "remaining_time": "0:00:55", "throughput": 1565.52, "total_tokens": 1845744} +{"current_steps": 4600, "total_steps": 4810, "loss": 0.2364, "lr": 2.925167583583577e-07, "epoch": 4.781704781704782, "percentage": 95.63, "elapsed_time": "0:19:39", "remaining_time": "0:00:53", "throughput": 1566.82, "total_tokens": 1847792} +{"current_steps": 4605, "total_steps": 4810, "loss": 0.2843, "lr": 2.7884318701285885e-07, "epoch": 4.786902286902287, "percentage": 95.74, "elapsed_time": "0:19:39", "remaining_time": "0:00:52", "throughput": 1568.06, "total_tokens": 1849776} +{"current_steps": 4610, "total_steps": 4810, "loss": 0.2187, "lr": 2.6549510210371607e-07, "epoch": 4.792099792099792, "percentage": 95.84, "elapsed_time": "0:19:39", "remaining_time": "0:00:51", "throughput": 1569.52, "total_tokens": 1852016} +{"current_steps": 4615, "total_steps": 4810, "loss": 0.246, "lr": 2.524726793759591e-07, "epoch": 4.797297297297297, "percentage": 95.95, "elapsed_time": "0:19:40", "remaining_time": "0:00:49", "throughput": 1570.82, "total_tokens": 1854064} +{"current_steps": 4620, "total_steps": 4810, "loss": 0.2382, "lr": 2.397760902868612e-07, "epoch": 4.802494802494802, "percentage": 96.05, "elapsed_time": "0:19:40", "remaining_time": "0:00:48", "throughput": 1572.11, "total_tokens": 1856112} +{"current_steps": 4625, "total_steps": 4810, "loss": 0.2361, "lr": 2.274055020036553e-07, "epoch": 4.8076923076923075, "percentage": 96.15, "elapsed_time": "0:19:40", "remaining_time": "0:00:47", "throughput": 1573.35, "total_tokens": 1858096} +{"current_steps": 4630, "total_steps": 4810, "loss": 0.2671, "lr": 2.1536107740135482e-07, "epoch": 4.8128898128898125, "percentage": 96.26, "elapsed_time": "0:19:41", "remaining_time": "0:00:45", "throughput": 1574.76, "total_tokens": 1860272} +{"current_steps": 4635, "total_steps": 4810, "loss": 0.2501, "lr": 2.0364297506060003e-07, "epoch": 4.8180873180873185, "percentage": 96.36, "elapsed_time": "0:19:41", "remaining_time": "0:00:44", "throughput": 1576.0, "total_tokens": 1862256} +{"current_steps": 4640, "total_steps": 4810, "loss": 0.1984, "lr": 1.922513492655653e-07, "epoch": 4.8232848232848236, "percentage": 96.47, "elapsed_time": "0:19:41", "remaining_time": "0:00:43", "throughput": 1577.29, "total_tokens": 1864304} +{"current_steps": 4645, "total_steps": 4810, "loss": 0.2677, "lr": 1.8118635000194396e-07, "epoch": 4.828482328482329, "percentage": 96.57, "elapsed_time": "0:19:42", "remaining_time": "0:00:41", "throughput": 1578.48, "total_tokens": 1866224} +{"current_steps": 4650, "total_steps": 4810, "loss": 0.2349, "lr": 1.704481229549526e-07, "epoch": 4.833679833679834, "percentage": 96.67, "elapsed_time": "0:19:42", "remaining_time": "0:00:40", "throughput": 1579.82, "total_tokens": 1868336} +{"current_steps": 4655, "total_steps": 4810, "loss": 0.2927, "lr": 1.6003680950742728e-07, "epoch": 4.838877338877339, "percentage": 96.78, "elapsed_time": "0:19:42", "remaining_time": "0:00:39", "throughput": 1581.17, "total_tokens": 1870448} +{"current_steps": 4660, "total_steps": 4810, "loss": 0.2206, "lr": 1.4995254673795812e-07, "epoch": 4.844074844074844, "percentage": 96.88, "elapsed_time": "0:19:43", "remaining_time": "0:00:38", "throughput": 1582.35, "total_tokens": 1872368} +{"current_steps": 4665, "total_steps": 4810, "loss": 0.2374, "lr": 1.4019546741908251e-07, "epoch": 4.849272349272349, "percentage": 96.99, "elapsed_time": "0:19:43", "remaining_time": "0:00:36", "throughput": 1583.7, "total_tokens": 1874480} +{"current_steps": 4670, "total_steps": 4810, "loss": 0.2712, "lr": 1.3076570001553934e-07, "epoch": 4.854469854469855, "percentage": 97.09, "elapsed_time": "0:19:43", "remaining_time": "0:00:35", "throughput": 1584.93, "total_tokens": 1876464} +{"current_steps": 4675, "total_steps": 4810, "loss": 0.2406, "lr": 1.216633686825841e-07, "epoch": 4.85966735966736, "percentage": 97.19, "elapsed_time": "0:19:44", "remaining_time": "0:00:34", "throughput": 1586.17, "total_tokens": 1878448} +{"current_steps": 4680, "total_steps": 4810, "loss": 0.2743, "lr": 1.1288859326433477e-07, "epoch": 4.864864864864865, "percentage": 97.3, "elapsed_time": "0:19:44", "remaining_time": "0:00:32", "throughput": 1587.4, "total_tokens": 1880432} +{"current_steps": 4685, "total_steps": 4810, "loss": 0.2828, "lr": 1.0444148929221464e-07, "epoch": 4.87006237006237, "percentage": 97.4, "elapsed_time": "0:19:44", "remaining_time": "0:00:31", "throughput": 1588.74, "total_tokens": 1882544} +{"current_steps": 4690, "total_steps": 4810, "loss": 0.274, "lr": 9.63221679834203e-08, "epoch": 4.875259875259875, "percentage": 97.51, "elapsed_time": "0:19:45", "remaining_time": "0:00:30", "throughput": 1589.98, "total_tokens": 1884528} +{"current_steps": 4695, "total_steps": 4810, "loss": 0.2457, "lr": 8.853073623946162e-08, "epoch": 4.88045738045738, "percentage": 97.61, "elapsed_time": "0:19:45", "remaining_time": "0:00:29", "throughput": 1591.32, "total_tokens": 1886640} +{"current_steps": 4700, "total_steps": 4810, "loss": 0.2663, "lr": 8.106729664475176e-08, "epoch": 4.885654885654886, "percentage": 97.71, "elapsed_time": "0:19:45", "remaining_time": "0:00:27", "throughput": 1592.6, "total_tokens": 1888688} +{"current_steps": 4705, "total_steps": 4810, "loss": 0.2572, "lr": 7.393194746525279e-08, "epoch": 4.890852390852391, "percentage": 97.82, "elapsed_time": "0:19:46", "remaining_time": "0:00:26", "throughput": 1593.89, "total_tokens": 1890736} +{"current_steps": 4710, "total_steps": 4810, "loss": 0.2399, "lr": 6.712478264719601e-08, "epoch": 4.896049896049896, "percentage": 97.92, "elapsed_time": "0:19:46", "remaining_time": "0:00:25", "throughput": 1595.12, "total_tokens": 1892720} +{"current_steps": 4715, "total_steps": 4810, "loss": 0.2267, "lr": 6.064589181582481e-08, "epoch": 4.901247401247401, "percentage": 98.02, "elapsed_time": "0:19:46", "remaining_time": "0:00:23", "throughput": 1596.35, "total_tokens": 1894704} +{"current_steps": 4720, "total_steps": 4810, "loss": 0.2652, "lr": 5.4495360274231524e-08, "epoch": 4.906444906444906, "percentage": 98.13, "elapsed_time": "0:19:47", "remaining_time": "0:00:22", "throughput": 1597.52, "total_tokens": 1896624} +{"current_steps": 4725, "total_steps": 4810, "loss": 0.2254, "lr": 4.867326900223068e-08, "epoch": 4.911642411642411, "percentage": 98.23, "elapsed_time": "0:19:47", "remaining_time": "0:00:21", "throughput": 1598.7, "total_tokens": 1898544} +{"current_steps": 4730, "total_steps": 4810, "loss": 0.2342, "lr": 4.317969465527927e-08, "epoch": 4.916839916839917, "percentage": 98.34, "elapsed_time": "0:19:47", "remaining_time": "0:00:20", "throughput": 1599.98, "total_tokens": 1900592} +{"current_steps": 4735, "total_steps": 4810, "loss": 0.2151, "lr": 3.8014709563488625e-08, "epoch": 4.922037422037422, "percentage": 98.44, "elapsed_time": "0:19:48", "remaining_time": "0:00:18", "throughput": 1601.2, "total_tokens": 1902576} +{"current_steps": 4740, "total_steps": 4810, "loss": 0.2368, "lr": 3.317838173066135e-08, "epoch": 4.927234927234927, "percentage": 98.54, "elapsed_time": "0:19:48", "remaining_time": "0:00:17", "throughput": 1602.48, "total_tokens": 1904624} +{"current_steps": 4745, "total_steps": 4810, "loss": 0.2662, "lr": 2.8670774833386426e-08, "epoch": 4.9324324324324325, "percentage": 98.65, "elapsed_time": "0:19:48", "remaining_time": "0:00:16", "throughput": 1603.82, "total_tokens": 1906736} +{"current_steps": 4750, "total_steps": 4810, "loss": 0.221, "lr": 2.449194822022327e-08, "epoch": 4.9376299376299375, "percentage": 98.75, "elapsed_time": "0:19:49", "remaining_time": "0:00:15", "throughput": 1604.93, "total_tokens": 1908592} +{"current_steps": 4755, "total_steps": 4810, "loss": 0.2286, "lr": 2.064195691089954e-08, "epoch": 4.942827442827443, "percentage": 98.86, "elapsed_time": "0:19:49", "remaining_time": "0:00:13", "throughput": 1606.16, "total_tokens": 1910576} +{"current_steps": 4760, "total_steps": 4810, "loss": 0.2104, "lr": 1.712085159559784e-08, "epoch": 4.948024948024948, "percentage": 98.96, "elapsed_time": "0:19:49", "remaining_time": "0:00:12", "throughput": 1607.43, "total_tokens": 1912624} +{"current_steps": 4765, "total_steps": 4810, "loss": 0.2802, "lr": 1.3928678634289593e-08, "epoch": 4.953222453222454, "percentage": 99.06, "elapsed_time": "0:19:50", "remaining_time": "0:00:11", "throughput": 1608.66, "total_tokens": 1914608} +{"current_steps": 4770, "total_steps": 4810, "loss": 0.2125, "lr": 1.1065480056110522e-08, "epoch": 4.958419958419959, "percentage": 99.17, "elapsed_time": "0:19:50", "remaining_time": "0:00:09", "throughput": 1609.88, "total_tokens": 1916592} +{"current_steps": 4775, "total_steps": 4810, "loss": 0.2162, "lr": 8.531293558824982e-09, "epoch": 4.963617463617464, "percentage": 99.27, "elapsed_time": "0:19:50", "remaining_time": "0:00:08", "throughput": 1611.2, "total_tokens": 1918704} +{"current_steps": 4780, "total_steps": 4810, "loss": 0.2508, "lr": 6.326152508320804e-09, "epoch": 4.968814968814969, "percentage": 99.38, "elapsed_time": "0:19:51", "remaining_time": "0:00:07", "throughput": 1612.36, "total_tokens": 1920624} +{"current_steps": 4785, "total_steps": 4810, "loss": 0.2453, "lr": 4.450085938170756e-09, "epoch": 4.974012474012474, "percentage": 99.48, "elapsed_time": "0:19:51", "remaining_time": "0:00:06", "throughput": 1613.47, "total_tokens": 1922480} +{"current_steps": 4790, "total_steps": 4810, "loss": 0.2758, "lr": 2.9031185492522926e-09, "epoch": 4.979209979209979, "percentage": 99.58, "elapsed_time": "0:19:51", "remaining_time": "0:00:04", "throughput": 1614.69, "total_tokens": 1924464} +{"current_steps": 4795, "total_steps": 4810, "loss": 0.2275, "lr": 1.6852707094172636e-09, "epoch": 4.984407484407484, "percentage": 99.69, "elapsed_time": "0:19:52", "remaining_time": "0:00:03", "throughput": 1615.9, "total_tokens": 1926448} +{"current_steps": 4800, "total_steps": 4810, "loss": 0.2635, "lr": 7.965584532282355e-10, "epoch": 4.98960498960499, "percentage": 99.79, "elapsed_time": "0:19:52", "remaining_time": "0:00:02", "throughput": 1617.23, "total_tokens": 1928560} +{"current_steps": 4805, "total_steps": 4810, "loss": 0.2384, "lr": 2.3699348174754945e-10, "epoch": 4.994802494802495, "percentage": 99.9, "elapsed_time": "0:19:52", "remaining_time": "0:00:01", "throughput": 1618.45, "total_tokens": 1930544} +{"current_steps": 4810, "total_steps": 4810, "loss": 0.2943, "lr": 6.583162381890162e-12, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:19:53", "remaining_time": "0:00:00", "throughput": 1619.66, "total_tokens": 1932608} +{"current_steps": 4810, "total_steps": 4810, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:20:17", "remaining_time": "0:00:00", "throughput": 1587.52, "total_tokens": 1932608} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..9228bf6 --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,7911 @@ +{ + "best_global_step": 4097, + "best_metric": 0.2517484128475189, + "best_model_checkpoint": "saves_bts_preliminary/base/llama-3.2-1b-instruct/train_cola_42_1774791067/checkpoint-4097", + "epoch": 5.0, + "eval_steps": 241, + "global_step": 4810, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.005197505197505198, + "grad_norm": 434.86285400390625, + "learning_rate": 4.1580041580041583e-07, + "loss": 1.2842, + "num_input_tokens_seen": 2048, + "step": 5 + }, + { + "epoch": 0.010395010395010396, + "grad_norm": 175.30227661132812, + "learning_rate": 9.355509355509356e-07, + "loss": 0.8545, + "num_input_tokens_seen": 4224, + "step": 10 + }, + { + "epoch": 0.015592515592515593, + "grad_norm": 26.521507263183594, + "learning_rate": 1.4553014553014554e-06, + "loss": 0.3278, + "num_input_tokens_seen": 6272, + "step": 15 + }, + { + "epoch": 0.02079002079002079, + "grad_norm": 86.457275390625, + "learning_rate": 1.975051975051975e-06, + "loss": 0.365, + "num_input_tokens_seen": 8384, + "step": 20 + }, + { + "epoch": 0.02598752598752599, + "grad_norm": 55.42351150512695, + "learning_rate": 2.494802494802495e-06, + "loss": 0.4433, + "num_input_tokens_seen": 10496, + "step": 25 + }, + { + "epoch": 0.031185031185031187, + "grad_norm": 22.866464614868164, + "learning_rate": 3.014553014553015e-06, + "loss": 0.2526, + "num_input_tokens_seen": 12544, + "step": 30 + }, + { + "epoch": 0.036382536382536385, + "grad_norm": 34.69972229003906, + "learning_rate": 3.5343035343035348e-06, + "loss": 0.3051, + "num_input_tokens_seen": 14528, + "step": 35 + }, + { + "epoch": 0.04158004158004158, + "grad_norm": 62.158714294433594, + "learning_rate": 4.0540540540540545e-06, + "loss": 0.5129, + "num_input_tokens_seen": 16576, + "step": 40 + }, + { + "epoch": 0.04677754677754678, + "grad_norm": 24.736021041870117, + "learning_rate": 4.573804573804574e-06, + "loss": 0.283, + "num_input_tokens_seen": 18560, + "step": 45 + }, + { + "epoch": 0.05197505197505198, + "grad_norm": 103.87641906738281, + "learning_rate": 5.093555093555094e-06, + "loss": 0.454, + "num_input_tokens_seen": 20608, + "step": 50 + }, + { + "epoch": 0.057172557172557176, + "grad_norm": 85.98382568359375, + "learning_rate": 5.613305613305614e-06, + "loss": 0.2518, + "num_input_tokens_seen": 22656, + "step": 55 + }, + { + "epoch": 0.062370062370062374, + "grad_norm": 15.937103271484375, + "learning_rate": 6.1330561330561335e-06, + "loss": 0.2538, + "num_input_tokens_seen": 24640, + "step": 60 + }, + { + "epoch": 0.06756756756756757, + "grad_norm": 71.92253112792969, + "learning_rate": 6.652806652806653e-06, + "loss": 0.3571, + "num_input_tokens_seen": 26752, + "step": 65 + }, + { + "epoch": 0.07276507276507277, + "grad_norm": 41.08773422241211, + "learning_rate": 7.172557172557173e-06, + "loss": 0.3588, + "num_input_tokens_seen": 28608, + "step": 70 + }, + { + "epoch": 0.07796257796257797, + "grad_norm": 39.851627349853516, + "learning_rate": 7.692307692307694e-06, + "loss": 0.2553, + "num_input_tokens_seen": 30912, + "step": 75 + }, + { + "epoch": 0.08316008316008316, + "grad_norm": 39.69013595581055, + "learning_rate": 8.212058212058212e-06, + "loss": 0.3869, + "num_input_tokens_seen": 32896, + "step": 80 + }, + { + "epoch": 0.08835758835758836, + "grad_norm": 15.486207962036133, + "learning_rate": 8.731808731808733e-06, + "loss": 0.3812, + "num_input_tokens_seen": 34816, + "step": 85 + }, + { + "epoch": 0.09355509355509356, + "grad_norm": 54.213748931884766, + "learning_rate": 9.251559251559252e-06, + "loss": 0.735, + "num_input_tokens_seen": 36736, + "step": 90 + }, + { + "epoch": 0.09875259875259876, + "grad_norm": 33.433189392089844, + "learning_rate": 9.771309771309773e-06, + "loss": 0.4027, + "num_input_tokens_seen": 38720, + "step": 95 + }, + { + "epoch": 0.10395010395010396, + "grad_norm": 45.393463134765625, + "learning_rate": 1.0291060291060291e-05, + "loss": 0.4605, + "num_input_tokens_seen": 40640, + "step": 100 + }, + { + "epoch": 0.10914760914760915, + "grad_norm": 4.37235164642334, + "learning_rate": 1.0810810810810812e-05, + "loss": 0.2999, + "num_input_tokens_seen": 42688, + "step": 105 + }, + { + "epoch": 0.11434511434511435, + "grad_norm": 41.325050354003906, + "learning_rate": 1.1330561330561331e-05, + "loss": 0.2839, + "num_input_tokens_seen": 44544, + "step": 110 + }, + { + "epoch": 0.11954261954261955, + "grad_norm": 19.053668975830078, + "learning_rate": 1.1850311850311852e-05, + "loss": 0.3329, + "num_input_tokens_seen": 46400, + "step": 115 + }, + { + "epoch": 0.12474012474012475, + "grad_norm": 11.979599952697754, + "learning_rate": 1.2370062370062372e-05, + "loss": 0.2089, + "num_input_tokens_seen": 48448, + "step": 120 + }, + { + "epoch": 0.12993762993762994, + "grad_norm": 20.051830291748047, + "learning_rate": 1.2889812889812891e-05, + "loss": 0.2829, + "num_input_tokens_seen": 50496, + "step": 125 + }, + { + "epoch": 0.13513513513513514, + "grad_norm": 41.367645263671875, + "learning_rate": 1.3409563409563412e-05, + "loss": 0.2434, + "num_input_tokens_seen": 52416, + "step": 130 + }, + { + "epoch": 0.14033264033264034, + "grad_norm": 97.8139419555664, + "learning_rate": 1.392931392931393e-05, + "loss": 0.3621, + "num_input_tokens_seen": 54464, + "step": 135 + }, + { + "epoch": 0.14553014553014554, + "grad_norm": 25.77781867980957, + "learning_rate": 1.4449064449064451e-05, + "loss": 0.3338, + "num_input_tokens_seen": 56448, + "step": 140 + }, + { + "epoch": 0.15072765072765074, + "grad_norm": 22.036914825439453, + "learning_rate": 1.496881496881497e-05, + "loss": 0.3185, + "num_input_tokens_seen": 58368, + "step": 145 + }, + { + "epoch": 0.15592515592515593, + "grad_norm": 13.202033996582031, + "learning_rate": 1.548856548856549e-05, + "loss": 0.2379, + "num_input_tokens_seen": 60544, + "step": 150 + }, + { + "epoch": 0.16112266112266113, + "grad_norm": 27.529069900512695, + "learning_rate": 1.600831600831601e-05, + "loss": 0.3634, + "num_input_tokens_seen": 62592, + "step": 155 + }, + { + "epoch": 0.16632016632016633, + "grad_norm": 25.028240203857422, + "learning_rate": 1.652806652806653e-05, + "loss": 0.3093, + "num_input_tokens_seen": 64576, + "step": 160 + }, + { + "epoch": 0.17151767151767153, + "grad_norm": 10.42611026763916, + "learning_rate": 1.704781704781705e-05, + "loss": 0.3377, + "num_input_tokens_seen": 66688, + "step": 165 + }, + { + "epoch": 0.17671517671517672, + "grad_norm": 4.2057390213012695, + "learning_rate": 1.756756756756757e-05, + "loss": 0.3224, + "num_input_tokens_seen": 68544, + "step": 170 + }, + { + "epoch": 0.18191268191268192, + "grad_norm": 36.7962532043457, + "learning_rate": 1.808731808731809e-05, + "loss": 0.3814, + "num_input_tokens_seen": 70592, + "step": 175 + }, + { + "epoch": 0.18711018711018712, + "grad_norm": 9.922293663024902, + "learning_rate": 1.8607068607068607e-05, + "loss": 0.338, + "num_input_tokens_seen": 72576, + "step": 180 + }, + { + "epoch": 0.19230769230769232, + "grad_norm": 2.9066672325134277, + "learning_rate": 1.9126819126819128e-05, + "loss": 0.2853, + "num_input_tokens_seen": 74624, + "step": 185 + }, + { + "epoch": 0.19750519750519752, + "grad_norm": 30.27046775817871, + "learning_rate": 1.964656964656965e-05, + "loss": 0.3374, + "num_input_tokens_seen": 76608, + "step": 190 + }, + { + "epoch": 0.20270270270270271, + "grad_norm": 17.140790939331055, + "learning_rate": 2.016632016632017e-05, + "loss": 0.3221, + "num_input_tokens_seen": 78720, + "step": 195 + }, + { + "epoch": 0.2079002079002079, + "grad_norm": 75.4980239868164, + "learning_rate": 2.068607068607069e-05, + "loss": 0.3944, + "num_input_tokens_seen": 81152, + "step": 200 + }, + { + "epoch": 0.2130977130977131, + "grad_norm": 10.222508430480957, + "learning_rate": 2.1205821205821207e-05, + "loss": 0.3755, + "num_input_tokens_seen": 83200, + "step": 205 + }, + { + "epoch": 0.2182952182952183, + "grad_norm": 9.712939262390137, + "learning_rate": 2.1725571725571728e-05, + "loss": 0.2949, + "num_input_tokens_seen": 85184, + "step": 210 + }, + { + "epoch": 0.2234927234927235, + "grad_norm": 20.923433303833008, + "learning_rate": 2.2245322245322248e-05, + "loss": 0.2174, + "num_input_tokens_seen": 87232, + "step": 215 + }, + { + "epoch": 0.2286902286902287, + "grad_norm": 27.973743438720703, + "learning_rate": 2.276507276507277e-05, + "loss": 0.6706, + "num_input_tokens_seen": 89152, + "step": 220 + }, + { + "epoch": 0.2338877338877339, + "grad_norm": 23.218599319458008, + "learning_rate": 2.3284823284823286e-05, + "loss": 0.4387, + "num_input_tokens_seen": 91328, + "step": 225 + }, + { + "epoch": 0.2390852390852391, + "grad_norm": 3.9333198070526123, + "learning_rate": 2.3804573804573807e-05, + "loss": 0.3047, + "num_input_tokens_seen": 93312, + "step": 230 + }, + { + "epoch": 0.2442827442827443, + "grad_norm": 3.1809186935424805, + "learning_rate": 2.4324324324324327e-05, + "loss": 0.2717, + "num_input_tokens_seen": 95296, + "step": 235 + }, + { + "epoch": 0.2494802494802495, + "grad_norm": 15.368531227111816, + "learning_rate": 2.4844074844074848e-05, + "loss": 0.2682, + "num_input_tokens_seen": 97216, + "step": 240 + }, + { + "epoch": 0.2505197505197505, + "eval_loss": 0.38468512892723083, + "eval_runtime": 1.6403, + "eval_samples_per_second": 521.872, + "eval_steps_per_second": 65.234, + "num_input_tokens_seen": 97664, + "step": 241 + }, + { + "epoch": 0.25467775467775466, + "grad_norm": 2.458040952682495, + "learning_rate": 2.5363825363825365e-05, + "loss": 0.344, + "num_input_tokens_seen": 99264, + "step": 245 + }, + { + "epoch": 0.2598752598752599, + "grad_norm": 26.132585525512695, + "learning_rate": 2.5883575883575882e-05, + "loss": 0.3993, + "num_input_tokens_seen": 101184, + "step": 250 + }, + { + "epoch": 0.26507276507276506, + "grad_norm": 28.206130981445312, + "learning_rate": 2.6403326403326406e-05, + "loss": 0.4414, + "num_input_tokens_seen": 103296, + "step": 255 + }, + { + "epoch": 0.2702702702702703, + "grad_norm": 6.235988140106201, + "learning_rate": 2.6923076923076923e-05, + "loss": 0.3322, + "num_input_tokens_seen": 105344, + "step": 260 + }, + { + "epoch": 0.27546777546777546, + "grad_norm": 5.716452121734619, + "learning_rate": 2.7442827442827447e-05, + "loss": 0.3314, + "num_input_tokens_seen": 107392, + "step": 265 + }, + { + "epoch": 0.2806652806652807, + "grad_norm": 13.819499969482422, + "learning_rate": 2.796257796257796e-05, + "loss": 0.2951, + "num_input_tokens_seen": 109440, + "step": 270 + }, + { + "epoch": 0.28586278586278585, + "grad_norm": 27.50826644897461, + "learning_rate": 2.8482328482328485e-05, + "loss": 0.2986, + "num_input_tokens_seen": 111424, + "step": 275 + }, + { + "epoch": 0.2910602910602911, + "grad_norm": 24.54796600341797, + "learning_rate": 2.9002079002079002e-05, + "loss": 0.407, + "num_input_tokens_seen": 113408, + "step": 280 + }, + { + "epoch": 0.29625779625779625, + "grad_norm": 1.7183665037155151, + "learning_rate": 2.9521829521829526e-05, + "loss": 0.4506, + "num_input_tokens_seen": 115392, + "step": 285 + }, + { + "epoch": 0.30145530145530147, + "grad_norm": 38.75688552856445, + "learning_rate": 3.0041580041580043e-05, + "loss": 0.4738, + "num_input_tokens_seen": 117440, + "step": 290 + }, + { + "epoch": 0.30665280665280664, + "grad_norm": 20.901853561401367, + "learning_rate": 3.056133056133057e-05, + "loss": 0.5248, + "num_input_tokens_seen": 119424, + "step": 295 + }, + { + "epoch": 0.31185031185031187, + "grad_norm": 37.667694091796875, + "learning_rate": 3.108108108108108e-05, + "loss": 0.3321, + "num_input_tokens_seen": 121344, + "step": 300 + }, + { + "epoch": 0.31704781704781704, + "grad_norm": 21.214815139770508, + "learning_rate": 3.16008316008316e-05, + "loss": 0.3707, + "num_input_tokens_seen": 123264, + "step": 305 + }, + { + "epoch": 0.32224532224532226, + "grad_norm": 3.6351711750030518, + "learning_rate": 3.212058212058212e-05, + "loss": 0.3574, + "num_input_tokens_seen": 125184, + "step": 310 + }, + { + "epoch": 0.32744282744282743, + "grad_norm": 2.756866216659546, + "learning_rate": 3.264033264033264e-05, + "loss": 0.2851, + "num_input_tokens_seen": 127296, + "step": 315 + }, + { + "epoch": 0.33264033264033266, + "grad_norm": 8.542179107666016, + "learning_rate": 3.3160083160083164e-05, + "loss": 0.2794, + "num_input_tokens_seen": 129408, + "step": 320 + }, + { + "epoch": 0.33783783783783783, + "grad_norm": 5.599982738494873, + "learning_rate": 3.3679833679833684e-05, + "loss": 0.3015, + "num_input_tokens_seen": 131520, + "step": 325 + }, + { + "epoch": 0.34303534303534305, + "grad_norm": 0.6099509000778198, + "learning_rate": 3.41995841995842e-05, + "loss": 0.2826, + "num_input_tokens_seen": 133568, + "step": 330 + }, + { + "epoch": 0.3482328482328482, + "grad_norm": 10.96675968170166, + "learning_rate": 3.4719334719334725e-05, + "loss": 0.3704, + "num_input_tokens_seen": 135616, + "step": 335 + }, + { + "epoch": 0.35343035343035345, + "grad_norm": 36.376678466796875, + "learning_rate": 3.523908523908524e-05, + "loss": 0.4519, + "num_input_tokens_seen": 137664, + "step": 340 + }, + { + "epoch": 0.3586278586278586, + "grad_norm": 23.873687744140625, + "learning_rate": 3.575883575883576e-05, + "loss": 0.2863, + "num_input_tokens_seen": 139584, + "step": 345 + }, + { + "epoch": 0.36382536382536385, + "grad_norm": 3.04746675491333, + "learning_rate": 3.627858627858628e-05, + "loss": 0.4921, + "num_input_tokens_seen": 141504, + "step": 350 + }, + { + "epoch": 0.369022869022869, + "grad_norm": 22.159381866455078, + "learning_rate": 3.67983367983368e-05, + "loss": 0.3078, + "num_input_tokens_seen": 143552, + "step": 355 + }, + { + "epoch": 0.37422037422037424, + "grad_norm": 4.239355564117432, + "learning_rate": 3.731808731808732e-05, + "loss": 0.252, + "num_input_tokens_seen": 145536, + "step": 360 + }, + { + "epoch": 0.3794178794178794, + "grad_norm": 33.11611557006836, + "learning_rate": 3.783783783783784e-05, + "loss": 0.2894, + "num_input_tokens_seen": 147456, + "step": 365 + }, + { + "epoch": 0.38461538461538464, + "grad_norm": 3.5446720123291016, + "learning_rate": 3.8357588357588356e-05, + "loss": 0.1779, + "num_input_tokens_seen": 149440, + "step": 370 + }, + { + "epoch": 0.3898128898128898, + "grad_norm": 17.057636260986328, + "learning_rate": 3.8877338877338883e-05, + "loss": 0.4928, + "num_input_tokens_seen": 151360, + "step": 375 + }, + { + "epoch": 0.39501039501039503, + "grad_norm": 11.648699760437012, + "learning_rate": 3.93970893970894e-05, + "loss": 0.4363, + "num_input_tokens_seen": 153344, + "step": 380 + }, + { + "epoch": 0.4002079002079002, + "grad_norm": 6.347674369812012, + "learning_rate": 3.991683991683992e-05, + "loss": 0.2689, + "num_input_tokens_seen": 155264, + "step": 385 + }, + { + "epoch": 0.40540540540540543, + "grad_norm": 14.731024742126465, + "learning_rate": 4.043659043659044e-05, + "loss": 0.2539, + "num_input_tokens_seen": 157248, + "step": 390 + }, + { + "epoch": 0.4106029106029106, + "grad_norm": 11.619532585144043, + "learning_rate": 4.095634095634096e-05, + "loss": 0.332, + "num_input_tokens_seen": 159296, + "step": 395 + }, + { + "epoch": 0.4158004158004158, + "grad_norm": 20.94300079345703, + "learning_rate": 4.147609147609148e-05, + "loss": 0.3, + "num_input_tokens_seen": 161344, + "step": 400 + }, + { + "epoch": 0.420997920997921, + "grad_norm": 4.039135456085205, + "learning_rate": 4.1995841995842e-05, + "loss": 0.2376, + "num_input_tokens_seen": 163328, + "step": 405 + }, + { + "epoch": 0.4261954261954262, + "grad_norm": 9.615825653076172, + "learning_rate": 4.2515592515592514e-05, + "loss": 0.2709, + "num_input_tokens_seen": 165312, + "step": 410 + }, + { + "epoch": 0.4313929313929314, + "grad_norm": 4.961127758026123, + "learning_rate": 4.303534303534304e-05, + "loss": 0.1471, + "num_input_tokens_seen": 167360, + "step": 415 + }, + { + "epoch": 0.4365904365904366, + "grad_norm": 55.59805679321289, + "learning_rate": 4.3555093555093555e-05, + "loss": 0.9994, + "num_input_tokens_seen": 169344, + "step": 420 + }, + { + "epoch": 0.4417879417879418, + "grad_norm": 7.878658294677734, + "learning_rate": 4.407484407484408e-05, + "loss": 0.603, + "num_input_tokens_seen": 171456, + "step": 425 + }, + { + "epoch": 0.446985446985447, + "grad_norm": 5.158046722412109, + "learning_rate": 4.4594594594594596e-05, + "loss": 0.3054, + "num_input_tokens_seen": 173568, + "step": 430 + }, + { + "epoch": 0.4521829521829522, + "grad_norm": 1.331925630569458, + "learning_rate": 4.511434511434512e-05, + "loss": 0.3208, + "num_input_tokens_seen": 175552, + "step": 435 + }, + { + "epoch": 0.4573804573804574, + "grad_norm": 7.393728733062744, + "learning_rate": 4.563409563409564e-05, + "loss": 0.2942, + "num_input_tokens_seen": 177536, + "step": 440 + }, + { + "epoch": 0.4625779625779626, + "grad_norm": 15.99036693572998, + "learning_rate": 4.615384615384616e-05, + "loss": 0.3005, + "num_input_tokens_seen": 179584, + "step": 445 + }, + { + "epoch": 0.4677754677754678, + "grad_norm": 1.2690688371658325, + "learning_rate": 4.667359667359668e-05, + "loss": 1.7773, + "num_input_tokens_seen": 181568, + "step": 450 + }, + { + "epoch": 0.47297297297297297, + "grad_norm": 3.469167709350586, + "learning_rate": 4.71933471933472e-05, + "loss": 0.2889, + "num_input_tokens_seen": 183552, + "step": 455 + }, + { + "epoch": 0.4781704781704782, + "grad_norm": 90.938232421875, + "learning_rate": 4.771309771309771e-05, + "loss": 0.2556, + "num_input_tokens_seen": 185600, + "step": 460 + }, + { + "epoch": 0.48336798336798337, + "grad_norm": 2.4140217304229736, + "learning_rate": 4.823284823284824e-05, + "loss": 0.2378, + "num_input_tokens_seen": 187584, + "step": 465 + }, + { + "epoch": 0.4885654885654886, + "grad_norm": 4.565840721130371, + "learning_rate": 4.8752598752598754e-05, + "loss": 0.2859, + "num_input_tokens_seen": 189568, + "step": 470 + }, + { + "epoch": 0.49376299376299376, + "grad_norm": 12.585880279541016, + "learning_rate": 4.9272349272349275e-05, + "loss": 0.2438, + "num_input_tokens_seen": 191680, + "step": 475 + }, + { + "epoch": 0.498960498960499, + "grad_norm": 3.2450168132781982, + "learning_rate": 4.9792099792099796e-05, + "loss": 0.3383, + "num_input_tokens_seen": 193728, + "step": 480 + }, + { + "epoch": 0.501039501039501, + "eval_loss": 0.4080815315246582, + "eval_runtime": 2.6441, + "eval_samples_per_second": 323.736, + "eval_steps_per_second": 40.467, + "num_input_tokens_seen": 194560, + "step": 482 + }, + { + "epoch": 0.5041580041580042, + "grad_norm": 29.770891189575195, + "learning_rate": 4.999994075155936e-05, + "loss": 0.381, + "num_input_tokens_seen": 195776, + "step": 485 + }, + { + "epoch": 0.5093555093555093, + "grad_norm": 19.471193313598633, + "learning_rate": 4.999957867877242e-05, + "loss": 0.2916, + "num_input_tokens_seen": 197696, + "step": 490 + }, + { + "epoch": 0.5145530145530145, + "grad_norm": 29.544788360595703, + "learning_rate": 4.999888745376028e-05, + "loss": 0.2766, + "num_input_tokens_seen": 199680, + "step": 495 + }, + { + "epoch": 0.5197505197505198, + "grad_norm": 11.05797290802002, + "learning_rate": 4.9997867085623824e-05, + "loss": 0.2596, + "num_input_tokens_seen": 201792, + "step": 500 + }, + { + "epoch": 0.524948024948025, + "grad_norm": 3.8948936462402344, + "learning_rate": 4.999651758779754e-05, + "loss": 0.2689, + "num_input_tokens_seen": 203840, + "step": 505 + }, + { + "epoch": 0.5301455301455301, + "grad_norm": 18.150039672851562, + "learning_rate": 4.999483897804933e-05, + "loss": 0.3363, + "num_input_tokens_seen": 205824, + "step": 510 + }, + { + "epoch": 0.5353430353430353, + "grad_norm": 1.8224319219589233, + "learning_rate": 4.999283127848029e-05, + "loss": 0.2583, + "num_input_tokens_seen": 207936, + "step": 515 + }, + { + "epoch": 0.5405405405405406, + "grad_norm": 9.910496711730957, + "learning_rate": 4.999049451552443e-05, + "loss": 0.3915, + "num_input_tokens_seen": 209984, + "step": 520 + }, + { + "epoch": 0.5457380457380457, + "grad_norm": 0.8137359619140625, + "learning_rate": 4.9987828719948284e-05, + "loss": 0.2461, + "num_input_tokens_seen": 212096, + "step": 525 + }, + { + "epoch": 0.5509355509355509, + "grad_norm": 2.0492968559265137, + "learning_rate": 4.998483392685055e-05, + "loss": 0.2863, + "num_input_tokens_seen": 214080, + "step": 530 + }, + { + "epoch": 0.5561330561330561, + "grad_norm": 24.322450637817383, + "learning_rate": 4.9981510175661606e-05, + "loss": 0.3052, + "num_input_tokens_seen": 216128, + "step": 535 + }, + { + "epoch": 0.5613305613305614, + "grad_norm": 28.344161987304688, + "learning_rate": 4.9977857510143e-05, + "loss": 0.3625, + "num_input_tokens_seen": 218176, + "step": 540 + }, + { + "epoch": 0.5665280665280665, + "grad_norm": 11.159996032714844, + "learning_rate": 4.9973875978386843e-05, + "loss": 0.2801, + "num_input_tokens_seen": 220096, + "step": 545 + }, + { + "epoch": 0.5717255717255717, + "grad_norm": 14.94636058807373, + "learning_rate": 4.996956563281524e-05, + "loss": 0.3041, + "num_input_tokens_seen": 222080, + "step": 550 + }, + { + "epoch": 0.5769230769230769, + "grad_norm": 8.506303787231445, + "learning_rate": 4.996492653017952e-05, + "loss": 0.2498, + "num_input_tokens_seen": 224000, + "step": 555 + }, + { + "epoch": 0.5821205821205822, + "grad_norm": 18.009078979492188, + "learning_rate": 4.995995873155958e-05, + "loss": 0.3224, + "num_input_tokens_seen": 225984, + "step": 560 + }, + { + "epoch": 0.5873180873180873, + "grad_norm": 19.32984733581543, + "learning_rate": 4.9954662302362973e-05, + "loss": 0.322, + "num_input_tokens_seen": 227840, + "step": 565 + }, + { + "epoch": 0.5925155925155925, + "grad_norm": 18.17301368713379, + "learning_rate": 4.9949037312324155e-05, + "loss": 0.302, + "num_input_tokens_seen": 229824, + "step": 570 + }, + { + "epoch": 0.5977130977130977, + "grad_norm": 14.943294525146484, + "learning_rate": 4.9943083835503467e-05, + "loss": 0.3875, + "num_input_tokens_seen": 231872, + "step": 575 + }, + { + "epoch": 0.6029106029106029, + "grad_norm": 12.56007194519043, + "learning_rate": 4.993680195028626e-05, + "loss": 0.314, + "num_input_tokens_seen": 233920, + "step": 580 + }, + { + "epoch": 0.6081081081081081, + "grad_norm": 12.372591972351074, + "learning_rate": 4.9930191739381775e-05, + "loss": 0.3189, + "num_input_tokens_seen": 235840, + "step": 585 + }, + { + "epoch": 0.6133056133056133, + "grad_norm": 11.213384628295898, + "learning_rate": 4.9923253289822116e-05, + "loss": 0.3418, + "num_input_tokens_seen": 238016, + "step": 590 + }, + { + "epoch": 0.6185031185031185, + "grad_norm": 12.969761848449707, + "learning_rate": 4.9915986692961045e-05, + "loss": 0.3307, + "num_input_tokens_seen": 240064, + "step": 595 + }, + { + "epoch": 0.6237006237006237, + "grad_norm": 1.1426069736480713, + "learning_rate": 4.9908392044472865e-05, + "loss": 0.2835, + "num_input_tokens_seen": 242048, + "step": 600 + }, + { + "epoch": 0.6288981288981289, + "grad_norm": 7.80474853515625, + "learning_rate": 4.990046944435105e-05, + "loss": 0.2584, + "num_input_tokens_seen": 243968, + "step": 605 + }, + { + "epoch": 0.6340956340956341, + "grad_norm": 1.6327171325683594, + "learning_rate": 4.989221899690704e-05, + "loss": 0.2953, + "num_input_tokens_seen": 246016, + "step": 610 + }, + { + "epoch": 0.6392931392931392, + "grad_norm": 16.204669952392578, + "learning_rate": 4.9883640810768764e-05, + "loss": 0.3214, + "num_input_tokens_seen": 248000, + "step": 615 + }, + { + "epoch": 0.6444906444906445, + "grad_norm": 0.29481250047683716, + "learning_rate": 4.9874734998879316e-05, + "loss": 0.312, + "num_input_tokens_seen": 250048, + "step": 620 + }, + { + "epoch": 0.6496881496881497, + "grad_norm": 18.51386833190918, + "learning_rate": 4.9865501678495375e-05, + "loss": 0.3215, + "num_input_tokens_seen": 252096, + "step": 625 + }, + { + "epoch": 0.6548856548856549, + "grad_norm": 5.452864646911621, + "learning_rate": 4.98559409711857e-05, + "loss": 0.2892, + "num_input_tokens_seen": 254144, + "step": 630 + }, + { + "epoch": 0.66008316008316, + "grad_norm": 11.4102783203125, + "learning_rate": 4.984605300282954e-05, + "loss": 0.3016, + "num_input_tokens_seen": 256128, + "step": 635 + }, + { + "epoch": 0.6652806652806653, + "grad_norm": 8.976471900939941, + "learning_rate": 4.983583790361497e-05, + "loss": 0.2596, + "num_input_tokens_seen": 258048, + "step": 640 + }, + { + "epoch": 0.6704781704781705, + "grad_norm": 27.530433654785156, + "learning_rate": 4.982529580803714e-05, + "loss": 0.363, + "num_input_tokens_seen": 260352, + "step": 645 + }, + { + "epoch": 0.6756756756756757, + "grad_norm": 12.061158180236816, + "learning_rate": 4.981442685489659e-05, + "loss": 0.2849, + "num_input_tokens_seen": 262272, + "step": 650 + }, + { + "epoch": 0.6808731808731808, + "grad_norm": 13.447040557861328, + "learning_rate": 4.9803231187297304e-05, + "loss": 0.2969, + "num_input_tokens_seen": 264320, + "step": 655 + }, + { + "epoch": 0.6860706860706861, + "grad_norm": 33.57612228393555, + "learning_rate": 4.979170895264494e-05, + "loss": 0.3962, + "num_input_tokens_seen": 266240, + "step": 660 + }, + { + "epoch": 0.6912681912681913, + "grad_norm": 4.9110002517700195, + "learning_rate": 4.977986030264482e-05, + "loss": 0.312, + "num_input_tokens_seen": 268224, + "step": 665 + }, + { + "epoch": 0.6964656964656964, + "grad_norm": 0.21739044785499573, + "learning_rate": 4.976768539329994e-05, + "loss": 0.2552, + "num_input_tokens_seen": 270272, + "step": 670 + }, + { + "epoch": 0.7016632016632016, + "grad_norm": 8.439529418945312, + "learning_rate": 4.975518438490897e-05, + "loss": 0.312, + "num_input_tokens_seen": 272256, + "step": 675 + }, + { + "epoch": 0.7068607068607069, + "grad_norm": 10.565657615661621, + "learning_rate": 4.9742357442064045e-05, + "loss": 0.2889, + "num_input_tokens_seen": 274240, + "step": 680 + }, + { + "epoch": 0.7120582120582121, + "grad_norm": 19.482200622558594, + "learning_rate": 4.972920473364869e-05, + "loss": 0.2841, + "num_input_tokens_seen": 276288, + "step": 685 + }, + { + "epoch": 0.7172557172557172, + "grad_norm": 21.85175132751465, + "learning_rate": 4.971572643283557e-05, + "loss": 0.3076, + "num_input_tokens_seen": 278272, + "step": 690 + }, + { + "epoch": 0.7224532224532224, + "grad_norm": 7.696235656738281, + "learning_rate": 4.970192271708416e-05, + "loss": 0.285, + "num_input_tokens_seen": 280384, + "step": 695 + }, + { + "epoch": 0.7276507276507277, + "grad_norm": 4.778509616851807, + "learning_rate": 4.968779376813849e-05, + "loss": 0.2376, + "num_input_tokens_seen": 282368, + "step": 700 + }, + { + "epoch": 0.7328482328482329, + "grad_norm": 9.415769577026367, + "learning_rate": 4.967333977202469e-05, + "loss": 0.2787, + "num_input_tokens_seen": 284416, + "step": 705 + }, + { + "epoch": 0.738045738045738, + "grad_norm": 4.963840484619141, + "learning_rate": 4.965856091904855e-05, + "loss": 0.214, + "num_input_tokens_seen": 286464, + "step": 710 + }, + { + "epoch": 0.7432432432432432, + "grad_norm": 12.690200805664062, + "learning_rate": 4.964345740379307e-05, + "loss": 0.2858, + "num_input_tokens_seen": 288448, + "step": 715 + }, + { + "epoch": 0.7484407484407485, + "grad_norm": 15.548615455627441, + "learning_rate": 4.962802942511581e-05, + "loss": 0.2962, + "num_input_tokens_seen": 290496, + "step": 720 + }, + { + "epoch": 0.7515592515592515, + "eval_loss": 0.29600390791893005, + "eval_runtime": 3.3797, + "eval_samples_per_second": 253.278, + "eval_steps_per_second": 31.66, + "num_input_tokens_seen": 291712, + "step": 723 + }, + { + "epoch": 0.7536382536382537, + "grad_norm": 7.057698726654053, + "learning_rate": 4.9612277186146335e-05, + "loss": 0.3061, + "num_input_tokens_seen": 292480, + "step": 725 + }, + { + "epoch": 0.7588357588357588, + "grad_norm": 17.72517204284668, + "learning_rate": 4.959620089428354e-05, + "loss": 0.281, + "num_input_tokens_seen": 294464, + "step": 730 + }, + { + "epoch": 0.764033264033264, + "grad_norm": 1.6551860570907593, + "learning_rate": 4.957980076119285e-05, + "loss": 0.2702, + "num_input_tokens_seen": 296448, + "step": 735 + }, + { + "epoch": 0.7692307692307693, + "grad_norm": 9.719671249389648, + "learning_rate": 4.956307700280354e-05, + "loss": 0.3146, + "num_input_tokens_seen": 298432, + "step": 740 + }, + { + "epoch": 0.7744282744282744, + "grad_norm": 8.770389556884766, + "learning_rate": 4.954602983930581e-05, + "loss": 0.2567, + "num_input_tokens_seen": 300480, + "step": 745 + }, + { + "epoch": 0.7796257796257796, + "grad_norm": 7.721967697143555, + "learning_rate": 4.95286594951479e-05, + "loss": 0.2488, + "num_input_tokens_seen": 302400, + "step": 750 + }, + { + "epoch": 0.7848232848232848, + "grad_norm": 7.888345241546631, + "learning_rate": 4.9510966199033174e-05, + "loss": 0.2852, + "num_input_tokens_seen": 304320, + "step": 755 + }, + { + "epoch": 0.7900207900207901, + "grad_norm": 8.099255561828613, + "learning_rate": 4.949295018391706e-05, + "loss": 0.2968, + "num_input_tokens_seen": 306240, + "step": 760 + }, + { + "epoch": 0.7952182952182952, + "grad_norm": 7.542270183563232, + "learning_rate": 4.947461168700402e-05, + "loss": 0.2957, + "num_input_tokens_seen": 308032, + "step": 765 + }, + { + "epoch": 0.8004158004158004, + "grad_norm": 4.36430025100708, + "learning_rate": 4.945595094974442e-05, + "loss": 0.2531, + "num_input_tokens_seen": 309952, + "step": 770 + }, + { + "epoch": 0.8056133056133056, + "grad_norm": 11.39189624786377, + "learning_rate": 4.94369682178313e-05, + "loss": 0.2396, + "num_input_tokens_seen": 311936, + "step": 775 + }, + { + "epoch": 0.8108108108108109, + "grad_norm": 3.859365224838257, + "learning_rate": 4.9417663741197236e-05, + "loss": 0.3127, + "num_input_tokens_seen": 313920, + "step": 780 + }, + { + "epoch": 0.816008316008316, + "grad_norm": 10.639534950256348, + "learning_rate": 4.939803777401095e-05, + "loss": 0.2873, + "num_input_tokens_seen": 315968, + "step": 785 + }, + { + "epoch": 0.8212058212058212, + "grad_norm": 8.708645820617676, + "learning_rate": 4.937809057467404e-05, + "loss": 0.263, + "num_input_tokens_seen": 317952, + "step": 790 + }, + { + "epoch": 0.8264033264033264, + "grad_norm": 3.0771279335021973, + "learning_rate": 4.935782240581752e-05, + "loss": 0.2762, + "num_input_tokens_seen": 319872, + "step": 795 + }, + { + "epoch": 0.8316008316008316, + "grad_norm": 9.068258285522461, + "learning_rate": 4.9337233534298425e-05, + "loss": 0.2759, + "num_input_tokens_seen": 321856, + "step": 800 + }, + { + "epoch": 0.8367983367983368, + "grad_norm": 11.020606994628906, + "learning_rate": 4.931632423119621e-05, + "loss": 0.2849, + "num_input_tokens_seen": 323968, + "step": 805 + }, + { + "epoch": 0.841995841995842, + "grad_norm": 11.716889381408691, + "learning_rate": 4.9295094771809285e-05, + "loss": 0.2775, + "num_input_tokens_seen": 325952, + "step": 810 + }, + { + "epoch": 0.8471933471933472, + "grad_norm": 2.4100873470306396, + "learning_rate": 4.92735454356513e-05, + "loss": 0.1962, + "num_input_tokens_seen": 328000, + "step": 815 + }, + { + "epoch": 0.8523908523908524, + "grad_norm": 18.39780044555664, + "learning_rate": 4.925167650644752e-05, + "loss": 0.2237, + "num_input_tokens_seen": 329984, + "step": 820 + }, + { + "epoch": 0.8575883575883576, + "grad_norm": 31.814456939697266, + "learning_rate": 4.9229488272131067e-05, + "loss": 0.3432, + "num_input_tokens_seen": 331904, + "step": 825 + }, + { + "epoch": 0.8627858627858628, + "grad_norm": 13.310869216918945, + "learning_rate": 4.920698102483912e-05, + "loss": 0.3102, + "num_input_tokens_seen": 333888, + "step": 830 + }, + { + "epoch": 0.867983367983368, + "grad_norm": 1.8199642896652222, + "learning_rate": 4.918415506090911e-05, + "loss": 0.3035, + "num_input_tokens_seen": 335872, + "step": 835 + }, + { + "epoch": 0.8731808731808732, + "grad_norm": 14.503442764282227, + "learning_rate": 4.916101068087476e-05, + "loss": 0.2682, + "num_input_tokens_seen": 337856, + "step": 840 + }, + { + "epoch": 0.8783783783783784, + "grad_norm": 1.1979509592056274, + "learning_rate": 4.913754818946219e-05, + "loss": 0.2422, + "num_input_tokens_seen": 339776, + "step": 845 + }, + { + "epoch": 0.8835758835758836, + "grad_norm": 5.467031478881836, + "learning_rate": 4.911376789558584e-05, + "loss": 0.1949, + "num_input_tokens_seen": 341760, + "step": 850 + }, + { + "epoch": 0.8887733887733887, + "grad_norm": 26.362804412841797, + "learning_rate": 4.9089670112344456e-05, + "loss": 0.3477, + "num_input_tokens_seen": 343680, + "step": 855 + }, + { + "epoch": 0.893970893970894, + "grad_norm": 13.462319374084473, + "learning_rate": 4.906525515701695e-05, + "loss": 0.292, + "num_input_tokens_seen": 345600, + "step": 860 + }, + { + "epoch": 0.8991683991683992, + "grad_norm": 15.104516983032227, + "learning_rate": 4.904052335105822e-05, + "loss": 0.2896, + "num_input_tokens_seen": 347520, + "step": 865 + }, + { + "epoch": 0.9043659043659044, + "grad_norm": 2.1453566551208496, + "learning_rate": 4.90154750200949e-05, + "loss": 0.2644, + "num_input_tokens_seen": 349568, + "step": 870 + }, + { + "epoch": 0.9095634095634095, + "grad_norm": 30.04273223876953, + "learning_rate": 4.8990110493921105e-05, + "loss": 0.3212, + "num_input_tokens_seen": 351552, + "step": 875 + }, + { + "epoch": 0.9147609147609148, + "grad_norm": 9.758408546447754, + "learning_rate": 4.8964430106494075e-05, + "loss": 0.2787, + "num_input_tokens_seen": 353472, + "step": 880 + }, + { + "epoch": 0.91995841995842, + "grad_norm": 2.3094310760498047, + "learning_rate": 4.893843419592977e-05, + "loss": 0.2656, + "num_input_tokens_seen": 355392, + "step": 885 + }, + { + "epoch": 0.9251559251559252, + "grad_norm": 2.449030876159668, + "learning_rate": 4.891212310449844e-05, + "loss": 0.2593, + "num_input_tokens_seen": 357440, + "step": 890 + }, + { + "epoch": 0.9303534303534303, + "grad_norm": 5.086390972137451, + "learning_rate": 4.8885497178620095e-05, + "loss": 0.2785, + "num_input_tokens_seen": 359488, + "step": 895 + }, + { + "epoch": 0.9355509355509356, + "grad_norm": 12.254743576049805, + "learning_rate": 4.8858556768859944e-05, + "loss": 0.283, + "num_input_tokens_seen": 361408, + "step": 900 + }, + { + "epoch": 0.9407484407484408, + "grad_norm": 8.048048973083496, + "learning_rate": 4.88313022299238e-05, + "loss": 0.27, + "num_input_tokens_seen": 363392, + "step": 905 + }, + { + "epoch": 0.9459459459459459, + "grad_norm": 13.520707130432129, + "learning_rate": 4.88037339206534e-05, + "loss": 0.2987, + "num_input_tokens_seen": 365440, + "step": 910 + }, + { + "epoch": 0.9511434511434511, + "grad_norm": 18.515222549438477, + "learning_rate": 4.8775852204021665e-05, + "loss": 0.2998, + "num_input_tokens_seen": 367616, + "step": 915 + }, + { + "epoch": 0.9563409563409564, + "grad_norm": 25.785511016845703, + "learning_rate": 4.874765744712796e-05, + "loss": 0.358, + "num_input_tokens_seen": 369600, + "step": 920 + }, + { + "epoch": 0.9615384615384616, + "grad_norm": 8.675851821899414, + "learning_rate": 4.871915002119321e-05, + "loss": 0.2755, + "num_input_tokens_seen": 371520, + "step": 925 + }, + { + "epoch": 0.9667359667359667, + "grad_norm": 0.7464810013771057, + "learning_rate": 4.8690330301555045e-05, + "loss": 0.3085, + "num_input_tokens_seen": 373568, + "step": 930 + }, + { + "epoch": 0.9719334719334719, + "grad_norm": 21.288469314575195, + "learning_rate": 4.8661198667662854e-05, + "loss": 0.2548, + "num_input_tokens_seen": 375488, + "step": 935 + }, + { + "epoch": 0.9771309771309772, + "grad_norm": 15.424735069274902, + "learning_rate": 4.86317555030728e-05, + "loss": 0.3274, + "num_input_tokens_seen": 377728, + "step": 940 + }, + { + "epoch": 0.9823284823284824, + "grad_norm": 11.471841812133789, + "learning_rate": 4.8602001195442725e-05, + "loss": 0.2924, + "num_input_tokens_seen": 379840, + "step": 945 + }, + { + "epoch": 0.9875259875259875, + "grad_norm": 12.289169311523438, + "learning_rate": 4.857193613652711e-05, + "loss": 0.2685, + "num_input_tokens_seen": 381760, + "step": 950 + }, + { + "epoch": 0.9927234927234927, + "grad_norm": 2.2855138778686523, + "learning_rate": 4.8541560722171855e-05, + "loss": 0.2743, + "num_input_tokens_seen": 383808, + "step": 955 + }, + { + "epoch": 0.997920997920998, + "grad_norm": 14.171538352966309, + "learning_rate": 4.8510875352309106e-05, + "loss": 0.2807, + "num_input_tokens_seen": 385856, + "step": 960 + }, + { + "epoch": 1.002079002079002, + "eval_loss": 0.2738620638847351, + "eval_runtime": 1.0463, + "eval_samples_per_second": 818.137, + "eval_steps_per_second": 102.267, + "num_input_tokens_seen": 387464, + "step": 964 + }, + { + "epoch": 1.003118503118503, + "grad_norm": 1.732373833656311, + "learning_rate": 4.8479880430951995e-05, + "loss": 0.2643, + "num_input_tokens_seen": 387848, + "step": 965 + }, + { + "epoch": 1.0083160083160083, + "grad_norm": 9.852456092834473, + "learning_rate": 4.844857636618928e-05, + "loss": 0.2613, + "num_input_tokens_seen": 389640, + "step": 970 + }, + { + "epoch": 1.0135135135135136, + "grad_norm": 13.70590877532959, + "learning_rate": 4.8416963570180025e-05, + "loss": 0.2824, + "num_input_tokens_seen": 391624, + "step": 975 + }, + { + "epoch": 1.0187110187110187, + "grad_norm": 10.222359657287598, + "learning_rate": 4.838504245914812e-05, + "loss": 0.3008, + "num_input_tokens_seen": 393672, + "step": 980 + }, + { + "epoch": 1.023908523908524, + "grad_norm": 24.265884399414062, + "learning_rate": 4.8352813453376836e-05, + "loss": 0.3048, + "num_input_tokens_seen": 395784, + "step": 985 + }, + { + "epoch": 1.0291060291060292, + "grad_norm": 20.11310577392578, + "learning_rate": 4.83202769772033e-05, + "loss": 0.3205, + "num_input_tokens_seen": 397768, + "step": 990 + }, + { + "epoch": 1.0343035343035343, + "grad_norm": 19.961780548095703, + "learning_rate": 4.8287433459012844e-05, + "loss": 0.2694, + "num_input_tokens_seen": 399816, + "step": 995 + }, + { + "epoch": 1.0395010395010396, + "grad_norm": 3.684941530227661, + "learning_rate": 4.8254283331233464e-05, + "loss": 0.3263, + "num_input_tokens_seen": 401928, + "step": 1000 + }, + { + "epoch": 1.0446985446985446, + "grad_norm": 1.1775870323181152, + "learning_rate": 4.822082703033003e-05, + "loss": 0.3028, + "num_input_tokens_seen": 403912, + "step": 1005 + }, + { + "epoch": 1.04989604989605, + "grad_norm": 7.7064595222473145, + "learning_rate": 4.818706499679862e-05, + "loss": 0.2501, + "num_input_tokens_seen": 405832, + "step": 1010 + }, + { + "epoch": 1.0550935550935552, + "grad_norm": 20.951908111572266, + "learning_rate": 4.815299767516065e-05, + "loss": 0.339, + "num_input_tokens_seen": 407880, + "step": 1015 + }, + { + "epoch": 1.0602910602910602, + "grad_norm": 0.5823318958282471, + "learning_rate": 4.8118625513957074e-05, + "loss": 0.2748, + "num_input_tokens_seen": 410120, + "step": 1020 + }, + { + "epoch": 1.0654885654885655, + "grad_norm": 5.90387487411499, + "learning_rate": 4.808394896574245e-05, + "loss": 0.3246, + "num_input_tokens_seen": 412168, + "step": 1025 + }, + { + "epoch": 1.0706860706860706, + "grad_norm": 13.779071807861328, + "learning_rate": 4.8048968487079e-05, + "loss": 0.2849, + "num_input_tokens_seen": 414472, + "step": 1030 + }, + { + "epoch": 1.0758835758835759, + "grad_norm": 15.818516731262207, + "learning_rate": 4.8013684538530565e-05, + "loss": 0.2908, + "num_input_tokens_seen": 416520, + "step": 1035 + }, + { + "epoch": 1.0810810810810811, + "grad_norm": 11.890518188476562, + "learning_rate": 4.79780975846566e-05, + "loss": 0.2774, + "num_input_tokens_seen": 418568, + "step": 1040 + }, + { + "epoch": 1.0862785862785862, + "grad_norm": 7.704615592956543, + "learning_rate": 4.7942208094006e-05, + "loss": 0.2417, + "num_input_tokens_seen": 420488, + "step": 1045 + }, + { + "epoch": 1.0914760914760915, + "grad_norm": 2.7734618186950684, + "learning_rate": 4.790601653911094e-05, + "loss": 0.2736, + "num_input_tokens_seen": 422472, + "step": 1050 + }, + { + "epoch": 1.0966735966735968, + "grad_norm": 12.339665412902832, + "learning_rate": 4.786952339648071e-05, + "loss": 0.3165, + "num_input_tokens_seen": 424456, + "step": 1055 + }, + { + "epoch": 1.1018711018711018, + "grad_norm": 3.863492250442505, + "learning_rate": 4.783272914659535e-05, + "loss": 0.305, + "num_input_tokens_seen": 426568, + "step": 1060 + }, + { + "epoch": 1.107068607068607, + "grad_norm": 5.703735828399658, + "learning_rate": 4.77956342738994e-05, + "loss": 0.2809, + "num_input_tokens_seen": 428552, + "step": 1065 + }, + { + "epoch": 1.1122661122661124, + "grad_norm": 5.661115646362305, + "learning_rate": 4.775823926679548e-05, + "loss": 0.2758, + "num_input_tokens_seen": 430472, + "step": 1070 + }, + { + "epoch": 1.1174636174636174, + "grad_norm": 5.488950729370117, + "learning_rate": 4.77205446176379e-05, + "loss": 0.2657, + "num_input_tokens_seen": 432328, + "step": 1075 + }, + { + "epoch": 1.1226611226611227, + "grad_norm": 10.569025993347168, + "learning_rate": 4.768255082272611e-05, + "loss": 0.2881, + "num_input_tokens_seen": 434440, + "step": 1080 + }, + { + "epoch": 1.1278586278586278, + "grad_norm": 3.0698752403259277, + "learning_rate": 4.764425838229824e-05, + "loss": 0.2938, + "num_input_tokens_seen": 436488, + "step": 1085 + }, + { + "epoch": 1.133056133056133, + "grad_norm": 23.730390548706055, + "learning_rate": 4.760566780052445e-05, + "loss": 0.4153, + "num_input_tokens_seen": 438472, + "step": 1090 + }, + { + "epoch": 1.1382536382536383, + "grad_norm": 0.6121450066566467, + "learning_rate": 4.7566779585500347e-05, + "loss": 0.3296, + "num_input_tokens_seen": 440456, + "step": 1095 + }, + { + "epoch": 1.1434511434511434, + "grad_norm": 4.771881103515625, + "learning_rate": 4.7527594249240264e-05, + "loss": 0.3082, + "num_input_tokens_seen": 442440, + "step": 1100 + }, + { + "epoch": 1.1486486486486487, + "grad_norm": 7.00406551361084, + "learning_rate": 4.748811230767051e-05, + "loss": 0.3109, + "num_input_tokens_seen": 444424, + "step": 1105 + }, + { + "epoch": 1.1538461538461537, + "grad_norm": 0.35836905241012573, + "learning_rate": 4.744833428062262e-05, + "loss": 0.2754, + "num_input_tokens_seen": 446280, + "step": 1110 + }, + { + "epoch": 1.159043659043659, + "grad_norm": 12.108142852783203, + "learning_rate": 4.740826069182645e-05, + "loss": 0.286, + "num_input_tokens_seen": 448264, + "step": 1115 + }, + { + "epoch": 1.1642411642411643, + "grad_norm": 2.960707902908325, + "learning_rate": 4.736789206890332e-05, + "loss": 0.2806, + "num_input_tokens_seen": 450376, + "step": 1120 + }, + { + "epoch": 1.1694386694386694, + "grad_norm": 1.6544653177261353, + "learning_rate": 4.732722894335909e-05, + "loss": 0.2575, + "num_input_tokens_seen": 452552, + "step": 1125 + }, + { + "epoch": 1.1746361746361746, + "grad_norm": 4.431951999664307, + "learning_rate": 4.7286271850577105e-05, + "loss": 0.2989, + "num_input_tokens_seen": 454600, + "step": 1130 + }, + { + "epoch": 1.17983367983368, + "grad_norm": 27.89082145690918, + "learning_rate": 4.724502132981119e-05, + "loss": 0.5214, + "num_input_tokens_seen": 456648, + "step": 1135 + }, + { + "epoch": 1.185031185031185, + "grad_norm": 12.9546480178833, + "learning_rate": 4.7203477924178506e-05, + "loss": 0.3325, + "num_input_tokens_seen": 458632, + "step": 1140 + }, + { + "epoch": 1.1902286902286903, + "grad_norm": 10.19326114654541, + "learning_rate": 4.7161642180652464e-05, + "loss": 0.2795, + "num_input_tokens_seen": 460680, + "step": 1145 + }, + { + "epoch": 1.1954261954261955, + "grad_norm": 11.509027481079102, + "learning_rate": 4.7119514650055476e-05, + "loss": 0.2697, + "num_input_tokens_seen": 462728, + "step": 1150 + }, + { + "epoch": 1.2006237006237006, + "grad_norm": 11.531643867492676, + "learning_rate": 4.7077095887051686e-05, + "loss": 0.2429, + "num_input_tokens_seen": 464776, + "step": 1155 + }, + { + "epoch": 1.2058212058212059, + "grad_norm": 2.4489336013793945, + "learning_rate": 4.7034386450139735e-05, + "loss": 0.2844, + "num_input_tokens_seen": 466696, + "step": 1160 + }, + { + "epoch": 1.211018711018711, + "grad_norm": 10.006536483764648, + "learning_rate": 4.699138690164533e-05, + "loss": 0.259, + "num_input_tokens_seen": 468616, + "step": 1165 + }, + { + "epoch": 1.2162162162162162, + "grad_norm": 5.630403995513916, + "learning_rate": 4.694809780771391e-05, + "loss": 0.2734, + "num_input_tokens_seen": 470728, + "step": 1170 + }, + { + "epoch": 1.2214137214137215, + "grad_norm": 9.379544258117676, + "learning_rate": 4.690451973830313e-05, + "loss": 0.2763, + "num_input_tokens_seen": 472776, + "step": 1175 + }, + { + "epoch": 1.2266112266112266, + "grad_norm": 4.9165167808532715, + "learning_rate": 4.6860653267175416e-05, + "loss": 0.2615, + "num_input_tokens_seen": 474824, + "step": 1180 + }, + { + "epoch": 1.2318087318087318, + "grad_norm": 7.163639068603516, + "learning_rate": 4.681649897189036e-05, + "loss": 0.2894, + "num_input_tokens_seen": 476744, + "step": 1185 + }, + { + "epoch": 1.237006237006237, + "grad_norm": 3.139596939086914, + "learning_rate": 4.677205743379713e-05, + "loss": 0.2065, + "num_input_tokens_seen": 478856, + "step": 1190 + }, + { + "epoch": 1.2422037422037422, + "grad_norm": 18.728031158447266, + "learning_rate": 4.672732923802685e-05, + "loss": 0.4129, + "num_input_tokens_seen": 480776, + "step": 1195 + }, + { + "epoch": 1.2474012474012475, + "grad_norm": 21.870121002197266, + "learning_rate": 4.668231497348484e-05, + "loss": 0.2716, + "num_input_tokens_seen": 482952, + "step": 1200 + }, + { + "epoch": 1.2525987525987525, + "grad_norm": 7.45676851272583, + "learning_rate": 4.663701523284291e-05, + "loss": 0.2836, + "num_input_tokens_seen": 485192, + "step": 1205 + }, + { + "epoch": 1.2525987525987525, + "eval_loss": 0.2581372559070587, + "eval_runtime": 1.5453, + "eval_samples_per_second": 553.946, + "eval_steps_per_second": 69.243, + "num_input_tokens_seen": 485192, + "step": 1205 + }, + { + "epoch": 1.2577962577962578, + "grad_norm": 19.655874252319336, + "learning_rate": 4.6591430612531515e-05, + "loss": 0.2541, + "num_input_tokens_seen": 487112, + "step": 1210 + }, + { + "epoch": 1.262993762993763, + "grad_norm": 11.319998741149902, + "learning_rate": 4.6545561712731954e-05, + "loss": 0.3056, + "num_input_tokens_seen": 489160, + "step": 1215 + }, + { + "epoch": 1.2681912681912682, + "grad_norm": 6.425257205963135, + "learning_rate": 4.649940913736841e-05, + "loss": 0.2656, + "num_input_tokens_seen": 491080, + "step": 1220 + }, + { + "epoch": 1.2733887733887734, + "grad_norm": 7.79650354385376, + "learning_rate": 4.645297349410005e-05, + "loss": 0.2917, + "num_input_tokens_seen": 493064, + "step": 1225 + }, + { + "epoch": 1.2785862785862787, + "grad_norm": 8.849406242370605, + "learning_rate": 4.640625539431298e-05, + "loss": 0.2878, + "num_input_tokens_seen": 494984, + "step": 1230 + }, + { + "epoch": 1.2837837837837838, + "grad_norm": 10.014208793640137, + "learning_rate": 4.635925545311224e-05, + "loss": 0.2686, + "num_input_tokens_seen": 496968, + "step": 1235 + }, + { + "epoch": 1.288981288981289, + "grad_norm": 3.8225860595703125, + "learning_rate": 4.6311974289313646e-05, + "loss": 0.2747, + "num_input_tokens_seen": 498824, + "step": 1240 + }, + { + "epoch": 1.2941787941787941, + "grad_norm": 9.505216598510742, + "learning_rate": 4.6264412525435716e-05, + "loss": 0.2269, + "num_input_tokens_seen": 500808, + "step": 1245 + }, + { + "epoch": 1.2993762993762994, + "grad_norm": 12.160257339477539, + "learning_rate": 4.6216570787691423e-05, + "loss": 0.2595, + "num_input_tokens_seen": 502856, + "step": 1250 + }, + { + "epoch": 1.3045738045738045, + "grad_norm": 2.7872188091278076, + "learning_rate": 4.6168449705979956e-05, + "loss": 0.2367, + "num_input_tokens_seen": 504712, + "step": 1255 + }, + { + "epoch": 1.3097713097713097, + "grad_norm": 1.930995225906372, + "learning_rate": 4.612004991387843e-05, + "loss": 0.3177, + "num_input_tokens_seen": 506696, + "step": 1260 + }, + { + "epoch": 1.314968814968815, + "grad_norm": 0.9595280289649963, + "learning_rate": 4.6071372048633566e-05, + "loss": 0.2562, + "num_input_tokens_seen": 508680, + "step": 1265 + }, + { + "epoch": 1.32016632016632, + "grad_norm": 1.0570541620254517, + "learning_rate": 4.6022416751153255e-05, + "loss": 0.291, + "num_input_tokens_seen": 510728, + "step": 1270 + }, + { + "epoch": 1.3253638253638254, + "grad_norm": 3.702086925506592, + "learning_rate": 4.5973184665998186e-05, + "loss": 0.2441, + "num_input_tokens_seen": 512712, + "step": 1275 + }, + { + "epoch": 1.3305613305613306, + "grad_norm": 0.28220054507255554, + "learning_rate": 4.5923676441373287e-05, + "loss": 0.2674, + "num_input_tokens_seen": 514696, + "step": 1280 + }, + { + "epoch": 1.3357588357588357, + "grad_norm": 4.1724724769592285, + "learning_rate": 4.5873892729119225e-05, + "loss": 0.2628, + "num_input_tokens_seen": 516808, + "step": 1285 + }, + { + "epoch": 1.340956340956341, + "grad_norm": 5.697893142700195, + "learning_rate": 4.582383418470386e-05, + "loss": 0.208, + "num_input_tokens_seen": 518792, + "step": 1290 + }, + { + "epoch": 1.3461538461538463, + "grad_norm": 14.32170581817627, + "learning_rate": 4.577350146721353e-05, + "loss": 0.2791, + "num_input_tokens_seen": 520840, + "step": 1295 + }, + { + "epoch": 1.3513513513513513, + "grad_norm": 5.778555393218994, + "learning_rate": 4.5722895239344435e-05, + "loss": 0.2367, + "num_input_tokens_seen": 522760, + "step": 1300 + }, + { + "epoch": 1.3565488565488566, + "grad_norm": 10.224639892578125, + "learning_rate": 4.567201616739393e-05, + "loss": 0.2853, + "num_input_tokens_seen": 524872, + "step": 1305 + }, + { + "epoch": 1.3617463617463619, + "grad_norm": 10.455507278442383, + "learning_rate": 4.562086492125167e-05, + "loss": 0.2922, + "num_input_tokens_seen": 526920, + "step": 1310 + }, + { + "epoch": 1.366943866943867, + "grad_norm": 1.0684677362442017, + "learning_rate": 4.556944217439088e-05, + "loss": 0.2892, + "num_input_tokens_seen": 528968, + "step": 1315 + }, + { + "epoch": 1.3721413721413722, + "grad_norm": 8.995451927185059, + "learning_rate": 4.5517748603859435e-05, + "loss": 0.2689, + "num_input_tokens_seen": 530888, + "step": 1320 + }, + { + "epoch": 1.3773388773388773, + "grad_norm": 9.848129272460938, + "learning_rate": 4.546578489027095e-05, + "loss": 0.2348, + "num_input_tokens_seen": 532872, + "step": 1325 + }, + { + "epoch": 1.3825363825363826, + "grad_norm": 12.437982559204102, + "learning_rate": 4.541355171779582e-05, + "loss": 0.2971, + "num_input_tokens_seen": 534920, + "step": 1330 + }, + { + "epoch": 1.3877338877338876, + "grad_norm": 4.1738667488098145, + "learning_rate": 4.5361049774152256e-05, + "loss": 0.2582, + "num_input_tokens_seen": 536840, + "step": 1335 + }, + { + "epoch": 1.392931392931393, + "grad_norm": 11.655598640441895, + "learning_rate": 4.530827975059715e-05, + "loss": 0.2788, + "num_input_tokens_seen": 538760, + "step": 1340 + }, + { + "epoch": 1.3981288981288982, + "grad_norm": 16.621856689453125, + "learning_rate": 4.5255242341917055e-05, + "loss": 0.2367, + "num_input_tokens_seen": 540680, + "step": 1345 + }, + { + "epoch": 1.4033264033264032, + "grad_norm": 13.314364433288574, + "learning_rate": 4.5201938246418976e-05, + "loss": 0.2864, + "num_input_tokens_seen": 542664, + "step": 1350 + }, + { + "epoch": 1.4085239085239085, + "grad_norm": 0.3170285224914551, + "learning_rate": 4.51483681659212e-05, + "loss": 0.1771, + "num_input_tokens_seen": 544712, + "step": 1355 + }, + { + "epoch": 1.4137214137214138, + "grad_norm": 14.410113334655762, + "learning_rate": 4.509453280574407e-05, + "loss": 0.3864, + "num_input_tokens_seen": 546824, + "step": 1360 + }, + { + "epoch": 1.4189189189189189, + "grad_norm": 9.504006385803223, + "learning_rate": 4.504043287470068e-05, + "loss": 0.2952, + "num_input_tokens_seen": 548936, + "step": 1365 + }, + { + "epoch": 1.4241164241164241, + "grad_norm": 19.96672248840332, + "learning_rate": 4.498606908508754e-05, + "loss": 0.3433, + "num_input_tokens_seen": 550920, + "step": 1370 + }, + { + "epoch": 1.4293139293139294, + "grad_norm": 3.9341182708740234, + "learning_rate": 4.4931442152675185e-05, + "loss": 0.2757, + "num_input_tokens_seen": 552904, + "step": 1375 + }, + { + "epoch": 1.4345114345114345, + "grad_norm": 13.74646282196045, + "learning_rate": 4.487655279669881e-05, + "loss": 0.3025, + "num_input_tokens_seen": 554824, + "step": 1380 + }, + { + "epoch": 1.4397089397089398, + "grad_norm": 2.631537914276123, + "learning_rate": 4.482140173984875e-05, + "loss": 0.2663, + "num_input_tokens_seen": 556872, + "step": 1385 + }, + { + "epoch": 1.444906444906445, + "grad_norm": 6.440622329711914, + "learning_rate": 4.476598970826094e-05, + "loss": 0.2717, + "num_input_tokens_seen": 558984, + "step": 1390 + }, + { + "epoch": 1.45010395010395, + "grad_norm": 17.752002716064453, + "learning_rate": 4.4710317431507434e-05, + "loss": 0.2791, + "num_input_tokens_seen": 560968, + "step": 1395 + }, + { + "epoch": 1.4553014553014554, + "grad_norm": 5.554246425628662, + "learning_rate": 4.465438564258673e-05, + "loss": 0.2617, + "num_input_tokens_seen": 562952, + "step": 1400 + }, + { + "epoch": 1.4604989604989604, + "grad_norm": 5.866454601287842, + "learning_rate": 4.4598195077914145e-05, + "loss": 0.2452, + "num_input_tokens_seen": 565064, + "step": 1405 + }, + { + "epoch": 1.4656964656964657, + "grad_norm": 3.3153018951416016, + "learning_rate": 4.454174647731213e-05, + "loss": 0.2761, + "num_input_tokens_seen": 567112, + "step": 1410 + }, + { + "epoch": 1.4708939708939708, + "grad_norm": 20.00400733947754, + "learning_rate": 4.4485040584000514e-05, + "loss": 0.2875, + "num_input_tokens_seen": 569160, + "step": 1415 + }, + { + "epoch": 1.476091476091476, + "grad_norm": 12.827857971191406, + "learning_rate": 4.442807814458672e-05, + "loss": 0.2782, + "num_input_tokens_seen": 571336, + "step": 1420 + }, + { + "epoch": 1.4812889812889813, + "grad_norm": 1.1996235847473145, + "learning_rate": 4.437085990905591e-05, + "loss": 0.25, + "num_input_tokens_seen": 573384, + "step": 1425 + }, + { + "epoch": 1.4864864864864864, + "grad_norm": 1.4895740747451782, + "learning_rate": 4.431338663076119e-05, + "loss": 0.2596, + "num_input_tokens_seen": 575304, + "step": 1430 + }, + { + "epoch": 1.4916839916839917, + "grad_norm": 2.120258331298828, + "learning_rate": 4.4255659066413595e-05, + "loss": 0.2788, + "num_input_tokens_seen": 577160, + "step": 1435 + }, + { + "epoch": 1.496881496881497, + "grad_norm": 1.543442726135254, + "learning_rate": 4.419767797607219e-05, + "loss": 0.2892, + "num_input_tokens_seen": 579208, + "step": 1440 + }, + { + "epoch": 1.502079002079002, + "grad_norm": 7.000278472900391, + "learning_rate": 4.413944412313405e-05, + "loss": 0.2936, + "num_input_tokens_seen": 581256, + "step": 1445 + }, + { + "epoch": 1.503118503118503, + "eval_loss": 0.25699949264526367, + "eval_runtime": 1.6561, + "eval_samples_per_second": 516.892, + "eval_steps_per_second": 64.612, + "num_input_tokens_seen": 581704, + "step": 1446 + }, + { + "epoch": 1.5072765072765073, + "grad_norm": 8.624284744262695, + "learning_rate": 4.4080958274324155e-05, + "loss": 0.2702, + "num_input_tokens_seen": 583304, + "step": 1450 + }, + { + "epoch": 1.5124740124740126, + "grad_norm": 1.7187201976776123, + "learning_rate": 4.40222211996854e-05, + "loss": 0.2252, + "num_input_tokens_seen": 585224, + "step": 1455 + }, + { + "epoch": 1.5176715176715176, + "grad_norm": 13.548686981201172, + "learning_rate": 4.396323367256836e-05, + "loss": 0.4066, + "num_input_tokens_seen": 587272, + "step": 1460 + }, + { + "epoch": 1.5228690228690227, + "grad_norm": 4.836349010467529, + "learning_rate": 4.390399646962117e-05, + "loss": 0.2413, + "num_input_tokens_seen": 589320, + "step": 1465 + }, + { + "epoch": 1.5280665280665282, + "grad_norm": 16.470077514648438, + "learning_rate": 4.384451037077924e-05, + "loss": 0.2593, + "num_input_tokens_seen": 591304, + "step": 1470 + }, + { + "epoch": 1.5332640332640333, + "grad_norm": 19.7336483001709, + "learning_rate": 4.378477615925505e-05, + "loss": 0.2499, + "num_input_tokens_seen": 593224, + "step": 1475 + }, + { + "epoch": 1.5384615384615383, + "grad_norm": 11.778541564941406, + "learning_rate": 4.372479462152781e-05, + "loss": 0.2672, + "num_input_tokens_seen": 595336, + "step": 1480 + }, + { + "epoch": 1.5436590436590436, + "grad_norm": 10.281831741333008, + "learning_rate": 4.366456654733308e-05, + "loss": 0.2898, + "num_input_tokens_seen": 597256, + "step": 1485 + }, + { + "epoch": 1.5488565488565489, + "grad_norm": 1.1301134824752808, + "learning_rate": 4.360409272965242e-05, + "loss": 0.2852, + "num_input_tokens_seen": 599304, + "step": 1490 + }, + { + "epoch": 1.554054054054054, + "grad_norm": 13.930249214172363, + "learning_rate": 4.3543373964702907e-05, + "loss": 0.2828, + "num_input_tokens_seen": 601288, + "step": 1495 + }, + { + "epoch": 1.5592515592515592, + "grad_norm": 6.923305988311768, + "learning_rate": 4.348241105192668e-05, + "loss": 0.2597, + "num_input_tokens_seen": 603272, + "step": 1500 + }, + { + "epoch": 1.5644490644490645, + "grad_norm": 6.9845356941223145, + "learning_rate": 4.34212047939804e-05, + "loss": 0.2584, + "num_input_tokens_seen": 605256, + "step": 1505 + }, + { + "epoch": 1.5696465696465696, + "grad_norm": 14.034126281738281, + "learning_rate": 4.335975599672469e-05, + "loss": 0.2713, + "num_input_tokens_seen": 607304, + "step": 1510 + }, + { + "epoch": 1.5748440748440748, + "grad_norm": 1.7358630895614624, + "learning_rate": 4.329806546921353e-05, + "loss": 0.2702, + "num_input_tokens_seen": 609224, + "step": 1515 + }, + { + "epoch": 1.5800415800415801, + "grad_norm": 7.067193031311035, + "learning_rate": 4.323613402368357e-05, + "loss": 0.2648, + "num_input_tokens_seen": 611336, + "step": 1520 + }, + { + "epoch": 1.5852390852390852, + "grad_norm": 2.2806382179260254, + "learning_rate": 4.317396247554347e-05, + "loss": 0.2879, + "num_input_tokens_seen": 613320, + "step": 1525 + }, + { + "epoch": 1.5904365904365905, + "grad_norm": 7.832094669342041, + "learning_rate": 4.311155164336318e-05, + "loss": 0.2953, + "num_input_tokens_seen": 615176, + "step": 1530 + }, + { + "epoch": 1.5956340956340958, + "grad_norm": 5.03207540512085, + "learning_rate": 4.3048902348863116e-05, + "loss": 0.2754, + "num_input_tokens_seen": 617224, + "step": 1535 + }, + { + "epoch": 1.6008316008316008, + "grad_norm": 9.225286483764648, + "learning_rate": 4.298601541690336e-05, + "loss": 0.2785, + "num_input_tokens_seen": 619208, + "step": 1540 + }, + { + "epoch": 1.6060291060291059, + "grad_norm": 8.74346923828125, + "learning_rate": 4.292289167547281e-05, + "loss": 0.278, + "num_input_tokens_seen": 621192, + "step": 1545 + }, + { + "epoch": 1.6112266112266114, + "grad_norm": 7.021914005279541, + "learning_rate": 4.285953195567827e-05, + "loss": 0.2618, + "num_input_tokens_seen": 623176, + "step": 1550 + }, + { + "epoch": 1.6164241164241164, + "grad_norm": 1.7642489671707153, + "learning_rate": 4.2795937091733515e-05, + "loss": 0.2506, + "num_input_tokens_seen": 625160, + "step": 1555 + }, + { + "epoch": 1.6216216216216215, + "grad_norm": 19.76347541809082, + "learning_rate": 4.27321079209483e-05, + "loss": 0.3095, + "num_input_tokens_seen": 627144, + "step": 1560 + }, + { + "epoch": 1.6268191268191268, + "grad_norm": 3.08026385307312, + "learning_rate": 4.266804528371732e-05, + "loss": 0.2951, + "num_input_tokens_seen": 629192, + "step": 1565 + }, + { + "epoch": 1.632016632016632, + "grad_norm": 6.732242584228516, + "learning_rate": 4.260375002350917e-05, + "loss": 0.2796, + "num_input_tokens_seen": 631240, + "step": 1570 + }, + { + "epoch": 1.637214137214137, + "grad_norm": 9.543598175048828, + "learning_rate": 4.253922298685525e-05, + "loss": 0.2407, + "num_input_tokens_seen": 633224, + "step": 1575 + }, + { + "epoch": 1.6424116424116424, + "grad_norm": 12.409037590026855, + "learning_rate": 4.247446502333858e-05, + "loss": 0.2386, + "num_input_tokens_seen": 635208, + "step": 1580 + }, + { + "epoch": 1.6476091476091477, + "grad_norm": 1.7029387950897217, + "learning_rate": 4.2409476985582644e-05, + "loss": 0.2872, + "num_input_tokens_seen": 637256, + "step": 1585 + }, + { + "epoch": 1.6528066528066527, + "grad_norm": 8.404769897460938, + "learning_rate": 4.234425972924014e-05, + "loss": 0.2806, + "num_input_tokens_seen": 639176, + "step": 1590 + }, + { + "epoch": 1.658004158004158, + "grad_norm": 3.5066511631011963, + "learning_rate": 4.227881411298175e-05, + "loss": 0.2715, + "num_input_tokens_seen": 641224, + "step": 1595 + }, + { + "epoch": 1.6632016632016633, + "grad_norm": 0.08306021988391876, + "learning_rate": 4.221314099848481e-05, + "loss": 0.2872, + "num_input_tokens_seen": 643144, + "step": 1600 + }, + { + "epoch": 1.6683991683991684, + "grad_norm": 3.17313551902771, + "learning_rate": 4.2147241250421944e-05, + "loss": 0.2204, + "num_input_tokens_seen": 644936, + "step": 1605 + }, + { + "epoch": 1.6735966735966736, + "grad_norm": 7.495476722717285, + "learning_rate": 4.208111573644975e-05, + "loss": 0.2557, + "num_input_tokens_seen": 646984, + "step": 1610 + }, + { + "epoch": 1.678794178794179, + "grad_norm": 11.988297462463379, + "learning_rate": 4.201476532719728e-05, + "loss": 0.2777, + "num_input_tokens_seen": 649032, + "step": 1615 + }, + { + "epoch": 1.683991683991684, + "grad_norm": 9.61047649383545, + "learning_rate": 4.194819089625466e-05, + "loss": 0.2778, + "num_input_tokens_seen": 651080, + "step": 1620 + }, + { + "epoch": 1.689189189189189, + "grad_norm": 12.550249099731445, + "learning_rate": 4.188139332016154e-05, + "loss": 0.2953, + "num_input_tokens_seen": 653000, + "step": 1625 + }, + { + "epoch": 1.6943866943866945, + "grad_norm": 9.836450576782227, + "learning_rate": 4.1814373478395586e-05, + "loss": 0.2955, + "num_input_tokens_seen": 654920, + "step": 1630 + }, + { + "epoch": 1.6995841995841996, + "grad_norm": 4.831801414489746, + "learning_rate": 4.174713225336086e-05, + "loss": 0.2599, + "num_input_tokens_seen": 656904, + "step": 1635 + }, + { + "epoch": 1.7047817047817047, + "grad_norm": 23.776752471923828, + "learning_rate": 4.1679670530376244e-05, + "loss": 0.2986, + "num_input_tokens_seen": 658952, + "step": 1640 + }, + { + "epoch": 1.70997920997921, + "grad_norm": 8.714804649353027, + "learning_rate": 4.161198919766375e-05, + "loss": 0.264, + "num_input_tokens_seen": 660872, + "step": 1645 + }, + { + "epoch": 1.7151767151767152, + "grad_norm": 7.620249271392822, + "learning_rate": 4.154408914633685e-05, + "loss": 0.2337, + "num_input_tokens_seen": 662856, + "step": 1650 + }, + { + "epoch": 1.7203742203742203, + "grad_norm": 12.147835731506348, + "learning_rate": 4.147597127038873e-05, + "loss": 0.2968, + "num_input_tokens_seen": 664904, + "step": 1655 + }, + { + "epoch": 1.7255717255717256, + "grad_norm": 4.487679481506348, + "learning_rate": 4.140763646668052e-05, + "loss": 0.2433, + "num_input_tokens_seen": 666888, + "step": 1660 + }, + { + "epoch": 1.7307692307692308, + "grad_norm": 4.300174236297607, + "learning_rate": 4.1339085634929485e-05, + "loss": 0.3127, + "num_input_tokens_seen": 668936, + "step": 1665 + }, + { + "epoch": 1.735966735966736, + "grad_norm": 5.227227687835693, + "learning_rate": 4.12703196776972e-05, + "loss": 0.2454, + "num_input_tokens_seen": 670856, + "step": 1670 + }, + { + "epoch": 1.7411642411642412, + "grad_norm": 3.5631868839263916, + "learning_rate": 4.120133950037763e-05, + "loss": 0.3639, + "num_input_tokens_seen": 672840, + "step": 1675 + }, + { + "epoch": 1.7463617463617465, + "grad_norm": 3.815650701522827, + "learning_rate": 4.113214601118524e-05, + "loss": 0.2468, + "num_input_tokens_seen": 674824, + "step": 1680 + }, + { + "epoch": 1.7515592515592515, + "grad_norm": 8.337157249450684, + "learning_rate": 4.1062740121143016e-05, + "loss": 0.2705, + "num_input_tokens_seen": 676808, + "step": 1685 + }, + { + "epoch": 1.7536382536382535, + "eval_loss": 0.25601524114608765, + "eval_runtime": 1.0768, + "eval_samples_per_second": 794.918, + "eval_steps_per_second": 99.365, + "num_input_tokens_seen": 677576, + "step": 1687 + }, + { + "epoch": 1.7567567567567568, + "grad_norm": 5.897716999053955, + "learning_rate": 4.099312274407048e-05, + "loss": 0.2969, + "num_input_tokens_seen": 678728, + "step": 1690 + }, + { + "epoch": 1.761954261954262, + "grad_norm": 8.0389404296875, + "learning_rate": 4.0923294796571676e-05, + "loss": 0.2874, + "num_input_tokens_seen": 680776, + "step": 1695 + }, + { + "epoch": 1.7671517671517671, + "grad_norm": 8.596820831298828, + "learning_rate": 4.085325719802307e-05, + "loss": 0.2651, + "num_input_tokens_seen": 683016, + "step": 1700 + }, + { + "epoch": 1.7723492723492722, + "grad_norm": 9.364229202270508, + "learning_rate": 4.078301087056144e-05, + "loss": 0.2924, + "num_input_tokens_seen": 685256, + "step": 1705 + }, + { + "epoch": 1.7775467775467777, + "grad_norm": 17.756505966186523, + "learning_rate": 4.0712556739071795e-05, + "loss": 0.2762, + "num_input_tokens_seen": 687304, + "step": 1710 + }, + { + "epoch": 1.7827442827442828, + "grad_norm": 16.004009246826172, + "learning_rate": 4.064189573117512e-05, + "loss": 0.2888, + "num_input_tokens_seen": 689224, + "step": 1715 + }, + { + "epoch": 1.7879417879417878, + "grad_norm": 15.74494457244873, + "learning_rate": 4.0571028777216214e-05, + "loss": 0.2282, + "num_input_tokens_seen": 691400, + "step": 1720 + }, + { + "epoch": 1.793139293139293, + "grad_norm": 2.8662827014923096, + "learning_rate": 4.049995681025143e-05, + "loss": 0.187, + "num_input_tokens_seen": 693320, + "step": 1725 + }, + { + "epoch": 1.7983367983367984, + "grad_norm": 8.626184463500977, + "learning_rate": 4.0428680766036384e-05, + "loss": 0.4406, + "num_input_tokens_seen": 695432, + "step": 1730 + }, + { + "epoch": 1.8035343035343034, + "grad_norm": 3.6228630542755127, + "learning_rate": 4.035720158301363e-05, + "loss": 0.3552, + "num_input_tokens_seen": 697544, + "step": 1735 + }, + { + "epoch": 1.8087318087318087, + "grad_norm": 34.01264953613281, + "learning_rate": 4.028552020230031e-05, + "loss": 0.3263, + "num_input_tokens_seen": 699592, + "step": 1740 + }, + { + "epoch": 1.813929313929314, + "grad_norm": 5.828328609466553, + "learning_rate": 4.0213637567675774e-05, + "loss": 0.2859, + "num_input_tokens_seen": 701576, + "step": 1745 + }, + { + "epoch": 1.819126819126819, + "grad_norm": 6.004729747772217, + "learning_rate": 4.0141554625569125e-05, + "loss": 0.2657, + "num_input_tokens_seen": 703688, + "step": 1750 + }, + { + "epoch": 1.8243243243243243, + "grad_norm": 4.201369285583496, + "learning_rate": 4.0069272325046816e-05, + "loss": 0.2842, + "num_input_tokens_seen": 705736, + "step": 1755 + }, + { + "epoch": 1.8295218295218296, + "grad_norm": 12.624285697937012, + "learning_rate": 3.999679161780005e-05, + "loss": 0.2479, + "num_input_tokens_seen": 707720, + "step": 1760 + }, + { + "epoch": 1.8347193347193347, + "grad_norm": 4.109714031219482, + "learning_rate": 3.99241134581324e-05, + "loss": 0.3132, + "num_input_tokens_seen": 709896, + "step": 1765 + }, + { + "epoch": 1.83991683991684, + "grad_norm": 5.0265302658081055, + "learning_rate": 3.985123880294708e-05, + "loss": 0.2661, + "num_input_tokens_seen": 711944, + "step": 1770 + }, + { + "epoch": 1.8451143451143452, + "grad_norm": 6.782411575317383, + "learning_rate": 3.9778168611734456e-05, + "loss": 0.2664, + "num_input_tokens_seen": 713992, + "step": 1775 + }, + { + "epoch": 1.8503118503118503, + "grad_norm": 1.0791548490524292, + "learning_rate": 3.970490384655939e-05, + "loss": 0.2443, + "num_input_tokens_seen": 715976, + "step": 1780 + }, + { + "epoch": 1.8555093555093554, + "grad_norm": 8.595144271850586, + "learning_rate": 3.963144547204856e-05, + "loss": 0.2659, + "num_input_tokens_seen": 718024, + "step": 1785 + }, + { + "epoch": 1.8607068607068609, + "grad_norm": 6.319913387298584, + "learning_rate": 3.955779445537776e-05, + "loss": 0.2441, + "num_input_tokens_seen": 720072, + "step": 1790 + }, + { + "epoch": 1.865904365904366, + "grad_norm": 16.376117706298828, + "learning_rate": 3.948395176625918e-05, + "loss": 0.279, + "num_input_tokens_seen": 722120, + "step": 1795 + }, + { + "epoch": 1.871101871101871, + "grad_norm": 12.614494323730469, + "learning_rate": 3.9409918376928604e-05, + "loss": 0.2851, + "num_input_tokens_seen": 724168, + "step": 1800 + }, + { + "epoch": 1.8762993762993763, + "grad_norm": 0.3612583577632904, + "learning_rate": 3.933569526213268e-05, + "loss": 0.2928, + "num_input_tokens_seen": 726280, + "step": 1805 + }, + { + "epoch": 1.8814968814968815, + "grad_norm": 5.5901103019714355, + "learning_rate": 3.926128339911599e-05, + "loss": 0.2677, + "num_input_tokens_seen": 728264, + "step": 1810 + }, + { + "epoch": 1.8866943866943866, + "grad_norm": 19.419448852539062, + "learning_rate": 3.918668376760827e-05, + "loss": 0.2924, + "num_input_tokens_seen": 730312, + "step": 1815 + }, + { + "epoch": 1.8918918918918919, + "grad_norm": 19.855844497680664, + "learning_rate": 3.9111897349811454e-05, + "loss": 0.2771, + "num_input_tokens_seen": 732296, + "step": 1820 + }, + { + "epoch": 1.8970893970893972, + "grad_norm": 0.2629048228263855, + "learning_rate": 3.903692513038677e-05, + "loss": 0.2412, + "num_input_tokens_seen": 734088, + "step": 1825 + }, + { + "epoch": 1.9022869022869022, + "grad_norm": 10.053337097167969, + "learning_rate": 3.896176809644178e-05, + "loss": 0.2897, + "num_input_tokens_seen": 736072, + "step": 1830 + }, + { + "epoch": 1.9074844074844075, + "grad_norm": 14.880932807922363, + "learning_rate": 3.8886427237517344e-05, + "loss": 0.3063, + "num_input_tokens_seen": 738120, + "step": 1835 + }, + { + "epoch": 1.9126819126819128, + "grad_norm": 7.023550510406494, + "learning_rate": 3.881090354557463e-05, + "loss": 0.3038, + "num_input_tokens_seen": 740168, + "step": 1840 + }, + { + "epoch": 1.9178794178794178, + "grad_norm": 14.33624267578125, + "learning_rate": 3.8735198014982064e-05, + "loss": 0.2716, + "num_input_tokens_seen": 742280, + "step": 1845 + }, + { + "epoch": 1.9230769230769231, + "grad_norm": 3.6817572116851807, + "learning_rate": 3.865931164250219e-05, + "loss": 0.2834, + "num_input_tokens_seen": 744328, + "step": 1850 + }, + { + "epoch": 1.9282744282744284, + "grad_norm": 6.452430248260498, + "learning_rate": 3.8583245427278584e-05, + "loss": 0.2845, + "num_input_tokens_seen": 746440, + "step": 1855 + }, + { + "epoch": 1.9334719334719335, + "grad_norm": 5.071720123291016, + "learning_rate": 3.850700037082268e-05, + "loss": 0.3004, + "num_input_tokens_seen": 748488, + "step": 1860 + }, + { + "epoch": 1.9386694386694385, + "grad_norm": 7.624428749084473, + "learning_rate": 3.8430577477000595e-05, + "loss": 0.2696, + "num_input_tokens_seen": 750344, + "step": 1865 + }, + { + "epoch": 1.943866943866944, + "grad_norm": 11.881917953491211, + "learning_rate": 3.835397775201991e-05, + "loss": 0.2567, + "num_input_tokens_seen": 752328, + "step": 1870 + }, + { + "epoch": 1.949064449064449, + "grad_norm": 3.7098724842071533, + "learning_rate": 3.827720220441642e-05, + "loss": 0.269, + "num_input_tokens_seen": 754312, + "step": 1875 + }, + { + "epoch": 1.9542619542619541, + "grad_norm": 8.87547492980957, + "learning_rate": 3.8200251845040855e-05, + "loss": 0.2816, + "num_input_tokens_seen": 756232, + "step": 1880 + }, + { + "epoch": 1.9594594594594594, + "grad_norm": 4.694116592407227, + "learning_rate": 3.812312768704557e-05, + "loss": 0.2706, + "num_input_tokens_seen": 758280, + "step": 1885 + }, + { + "epoch": 1.9646569646569647, + "grad_norm": 0.5913885235786438, + "learning_rate": 3.8045830745871195e-05, + "loss": 0.2412, + "num_input_tokens_seen": 760328, + "step": 1890 + }, + { + "epoch": 1.9698544698544698, + "grad_norm": 0.12654490768909454, + "learning_rate": 3.7968362039233316e-05, + "loss": 0.2593, + "num_input_tokens_seen": 762248, + "step": 1895 + }, + { + "epoch": 1.975051975051975, + "grad_norm": 25.26936149597168, + "learning_rate": 3.789072258710898e-05, + "loss": 0.2765, + "num_input_tokens_seen": 764168, + "step": 1900 + }, + { + "epoch": 1.9802494802494803, + "grad_norm": 13.081347465515137, + "learning_rate": 3.781291341172338e-05, + "loss": 0.2703, + "num_input_tokens_seen": 766216, + "step": 1905 + }, + { + "epoch": 1.9854469854469854, + "grad_norm": 5.589529037475586, + "learning_rate": 3.7734935537536276e-05, + "loss": 0.2418, + "num_input_tokens_seen": 768264, + "step": 1910 + }, + { + "epoch": 1.9906444906444907, + "grad_norm": 10.241774559020996, + "learning_rate": 3.7656789991228636e-05, + "loss": 0.2502, + "num_input_tokens_seen": 770184, + "step": 1915 + }, + { + "epoch": 1.995841995841996, + "grad_norm": 2.5858964920043945, + "learning_rate": 3.7578477801689e-05, + "loss": 0.2432, + "num_input_tokens_seen": 772168, + "step": 1920 + }, + { + "epoch": 2.001039501039501, + "grad_norm": 3.724403142929077, + "learning_rate": 3.7500000000000003e-05, + "loss": 0.2243, + "num_input_tokens_seen": 774160, + "step": 1925 + }, + { + "epoch": 2.004158004158004, + "eval_loss": 0.2575376331806183, + "eval_runtime": 1.0513, + "eval_samples_per_second": 814.265, + "eval_steps_per_second": 101.783, + "num_input_tokens_seen": 775312, + "step": 1928 + }, + { + "epoch": 2.006237006237006, + "grad_norm": 8.0248384475708, + "learning_rate": 3.742135761942479e-05, + "loss": 0.26, + "num_input_tokens_seen": 776144, + "step": 1930 + }, + { + "epoch": 2.0114345114345116, + "grad_norm": 8.558785438537598, + "learning_rate": 3.734255169539337e-05, + "loss": 0.2814, + "num_input_tokens_seen": 778128, + "step": 1935 + }, + { + "epoch": 2.0166320166320166, + "grad_norm": 29.213605880737305, + "learning_rate": 3.7263583265489074e-05, + "loss": 0.2911, + "num_input_tokens_seen": 780176, + "step": 1940 + }, + { + "epoch": 2.0218295218295217, + "grad_norm": 2.797147274017334, + "learning_rate": 3.718445336943478e-05, + "loss": 0.2723, + "num_input_tokens_seen": 782160, + "step": 1945 + }, + { + "epoch": 2.027027027027027, + "grad_norm": 11.302480697631836, + "learning_rate": 3.710516304907931e-05, + "loss": 0.3159, + "num_input_tokens_seen": 784208, + "step": 1950 + }, + { + "epoch": 2.0322245322245323, + "grad_norm": 10.434552192687988, + "learning_rate": 3.702571334838365e-05, + "loss": 0.2713, + "num_input_tokens_seen": 786256, + "step": 1955 + }, + { + "epoch": 2.0374220374220373, + "grad_norm": 18.884937286376953, + "learning_rate": 3.694610531340729e-05, + "loss": 0.2491, + "num_input_tokens_seen": 788240, + "step": 1960 + }, + { + "epoch": 2.042619542619543, + "grad_norm": 7.0856404304504395, + "learning_rate": 3.6866339992294344e-05, + "loss": 0.2663, + "num_input_tokens_seen": 790288, + "step": 1965 + }, + { + "epoch": 2.047817047817048, + "grad_norm": 8.749947547912598, + "learning_rate": 3.6786418435259854e-05, + "loss": 0.2681, + "num_input_tokens_seen": 792272, + "step": 1970 + }, + { + "epoch": 2.053014553014553, + "grad_norm": 7.0498785972595215, + "learning_rate": 3.670634169457587e-05, + "loss": 0.2757, + "num_input_tokens_seen": 794384, + "step": 1975 + }, + { + "epoch": 2.0582120582120584, + "grad_norm": 1.3708738088607788, + "learning_rate": 3.662611082455766e-05, + "loss": 0.2727, + "num_input_tokens_seen": 796368, + "step": 1980 + }, + { + "epoch": 2.0634095634095635, + "grad_norm": 17.901782989501953, + "learning_rate": 3.654572688154979e-05, + "loss": 0.2711, + "num_input_tokens_seen": 798480, + "step": 1985 + }, + { + "epoch": 2.0686070686070686, + "grad_norm": 3.3067057132720947, + "learning_rate": 3.646519092391227e-05, + "loss": 0.2843, + "num_input_tokens_seen": 800528, + "step": 1990 + }, + { + "epoch": 2.0738045738045736, + "grad_norm": 10.808554649353027, + "learning_rate": 3.6384504012006544e-05, + "loss": 0.2917, + "num_input_tokens_seen": 802768, + "step": 1995 + }, + { + "epoch": 2.079002079002079, + "grad_norm": 15.788969039916992, + "learning_rate": 3.6303667208181575e-05, + "loss": 0.2846, + "num_input_tokens_seen": 804752, + "step": 2000 + }, + { + "epoch": 2.084199584199584, + "grad_norm": 7.7113847732543945, + "learning_rate": 3.622268157675986e-05, + "loss": 0.2932, + "num_input_tokens_seen": 806672, + "step": 2005 + }, + { + "epoch": 2.0893970893970892, + "grad_norm": 1.0900391340255737, + "learning_rate": 3.614154818402339e-05, + "loss": 0.2602, + "num_input_tokens_seen": 808656, + "step": 2010 + }, + { + "epoch": 2.0945945945945947, + "grad_norm": 8.559063911437988, + "learning_rate": 3.606026809819966e-05, + "loss": 0.2402, + "num_input_tokens_seen": 810640, + "step": 2015 + }, + { + "epoch": 2.0997920997921, + "grad_norm": 13.94715690612793, + "learning_rate": 3.597884238944752e-05, + "loss": 0.2832, + "num_input_tokens_seen": 812688, + "step": 2020 + }, + { + "epoch": 2.104989604989605, + "grad_norm": 10.943618774414062, + "learning_rate": 3.5897272129843194e-05, + "loss": 0.262, + "num_input_tokens_seen": 814800, + "step": 2025 + }, + { + "epoch": 2.1101871101871104, + "grad_norm": 8.191487312316895, + "learning_rate": 3.581555839336606e-05, + "loss": 0.2348, + "num_input_tokens_seen": 816912, + "step": 2030 + }, + { + "epoch": 2.1153846153846154, + "grad_norm": 8.54643440246582, + "learning_rate": 3.57337022558846e-05, + "loss": 0.2981, + "num_input_tokens_seen": 818896, + "step": 2035 + }, + { + "epoch": 2.1205821205821205, + "grad_norm": 0.22179275751113892, + "learning_rate": 3.565170479514214e-05, + "loss": 0.2857, + "num_input_tokens_seen": 820880, + "step": 2040 + }, + { + "epoch": 2.125779625779626, + "grad_norm": 8.135652542114258, + "learning_rate": 3.5569567090742764e-05, + "loss": 0.2745, + "num_input_tokens_seen": 822864, + "step": 2045 + }, + { + "epoch": 2.130977130977131, + "grad_norm": 1.2629114389419556, + "learning_rate": 3.548729022413701e-05, + "loss": 0.2705, + "num_input_tokens_seen": 825040, + "step": 2050 + }, + { + "epoch": 2.136174636174636, + "grad_norm": 2.5352609157562256, + "learning_rate": 3.540487527860769e-05, + "loss": 0.2397, + "num_input_tokens_seen": 827024, + "step": 2055 + }, + { + "epoch": 2.141372141372141, + "grad_norm": 5.771927356719971, + "learning_rate": 3.53223233392556e-05, + "loss": 0.2921, + "num_input_tokens_seen": 829136, + "step": 2060 + }, + { + "epoch": 2.1465696465696467, + "grad_norm": 14.170849800109863, + "learning_rate": 3.523963549298525e-05, + "loss": 0.274, + "num_input_tokens_seen": 831184, + "step": 2065 + }, + { + "epoch": 2.1517671517671517, + "grad_norm": 35.1840705871582, + "learning_rate": 3.51568128284905e-05, + "loss": 0.3599, + "num_input_tokens_seen": 833168, + "step": 2070 + }, + { + "epoch": 2.156964656964657, + "grad_norm": 3.5509274005889893, + "learning_rate": 3.5073856436240334e-05, + "loss": 0.2991, + "num_input_tokens_seen": 835216, + "step": 2075 + }, + { + "epoch": 2.1621621621621623, + "grad_norm": 11.091768264770508, + "learning_rate": 3.499076740846438e-05, + "loss": 0.2711, + "num_input_tokens_seen": 837136, + "step": 2080 + }, + { + "epoch": 2.1673596673596673, + "grad_norm": 10.117902755737305, + "learning_rate": 3.490754683913863e-05, + "loss": 0.263, + "num_input_tokens_seen": 839120, + "step": 2085 + }, + { + "epoch": 2.1725571725571724, + "grad_norm": 8.886628150939941, + "learning_rate": 3.482419582397095e-05, + "loss": 0.2114, + "num_input_tokens_seen": 841104, + "step": 2090 + }, + { + "epoch": 2.177754677754678, + "grad_norm": 3.9707517623901367, + "learning_rate": 3.474071546038673e-05, + "loss": 0.3437, + "num_input_tokens_seen": 843152, + "step": 2095 + }, + { + "epoch": 2.182952182952183, + "grad_norm": 7.44064474105835, + "learning_rate": 3.46571068475144e-05, + "loss": 0.2665, + "num_input_tokens_seen": 845136, + "step": 2100 + }, + { + "epoch": 2.188149688149688, + "grad_norm": 15.758981704711914, + "learning_rate": 3.4573371086170936e-05, + "loss": 0.2736, + "num_input_tokens_seen": 847120, + "step": 2105 + }, + { + "epoch": 2.1933471933471935, + "grad_norm": 6.210805892944336, + "learning_rate": 3.4489509278847414e-05, + "loss": 0.2967, + "num_input_tokens_seen": 849168, + "step": 2110 + }, + { + "epoch": 2.1985446985446986, + "grad_norm": 5.870239734649658, + "learning_rate": 3.4405522529694454e-05, + "loss": 0.2804, + "num_input_tokens_seen": 851152, + "step": 2115 + }, + { + "epoch": 2.2037422037422036, + "grad_norm": 0.2958710789680481, + "learning_rate": 3.432141194450772e-05, + "loss": 0.2789, + "num_input_tokens_seen": 853008, + "step": 2120 + }, + { + "epoch": 2.208939708939709, + "grad_norm": 2.236769199371338, + "learning_rate": 3.4237178630713314e-05, + "loss": 0.2593, + "num_input_tokens_seen": 855120, + "step": 2125 + }, + { + "epoch": 2.214137214137214, + "grad_norm": 13.610929489135742, + "learning_rate": 3.415282369735324e-05, + "loss": 0.3184, + "num_input_tokens_seen": 857232, + "step": 2130 + }, + { + "epoch": 2.2193347193347193, + "grad_norm": 23.174781799316406, + "learning_rate": 3.4068348255070763e-05, + "loss": 0.2697, + "num_input_tokens_seen": 859344, + "step": 2135 + }, + { + "epoch": 2.2245322245322248, + "grad_norm": 5.864615440368652, + "learning_rate": 3.3983753416095845e-05, + "loss": 0.2666, + "num_input_tokens_seen": 861328, + "step": 2140 + }, + { + "epoch": 2.22972972972973, + "grad_norm": 4.22444486618042, + "learning_rate": 3.389904029423041e-05, + "loss": 0.2807, + "num_input_tokens_seen": 863376, + "step": 2145 + }, + { + "epoch": 2.234927234927235, + "grad_norm": 10.534299850463867, + "learning_rate": 3.381421000483378e-05, + "loss": 0.277, + "num_input_tokens_seen": 865424, + "step": 2150 + }, + { + "epoch": 2.24012474012474, + "grad_norm": 19.86652946472168, + "learning_rate": 3.37292636648079e-05, + "loss": 0.2884, + "num_input_tokens_seen": 867472, + "step": 2155 + }, + { + "epoch": 2.2453222453222454, + "grad_norm": 1.5927962064743042, + "learning_rate": 3.36442023925827e-05, + "loss": 0.259, + "num_input_tokens_seen": 869584, + "step": 2160 + }, + { + "epoch": 2.2505197505197505, + "grad_norm": 13.930359840393066, + "learning_rate": 3.3559027308101345e-05, + "loss": 0.2477, + "num_input_tokens_seen": 871568, + "step": 2165 + }, + { + "epoch": 2.2546777546777546, + "eval_loss": 0.2923731505870819, + "eval_runtime": 2.2896, + "eval_samples_per_second": 373.867, + "eval_steps_per_second": 46.733, + "num_input_tokens_seen": 873104, + "step": 2169 + }, + { + "epoch": 2.2557172557172556, + "grad_norm": 13.714078903198242, + "learning_rate": 3.3473739532805467e-05, + "loss": 0.3482, + "num_input_tokens_seen": 873488, + "step": 2170 + }, + { + "epoch": 2.260914760914761, + "grad_norm": 6.342438697814941, + "learning_rate": 3.3388340189620424e-05, + "loss": 0.26, + "num_input_tokens_seen": 875472, + "step": 2175 + }, + { + "epoch": 2.266112266112266, + "grad_norm": 13.85311222076416, + "learning_rate": 3.330283040294053e-05, + "loss": 0.2554, + "num_input_tokens_seen": 877392, + "step": 2180 + }, + { + "epoch": 2.271309771309771, + "grad_norm": 4.5571370124816895, + "learning_rate": 3.321721129861422e-05, + "loss": 0.2621, + "num_input_tokens_seen": 879504, + "step": 2185 + }, + { + "epoch": 2.2765072765072767, + "grad_norm": 12.646343231201172, + "learning_rate": 3.3131484003929246e-05, + "loss": 0.29, + "num_input_tokens_seen": 881360, + "step": 2190 + }, + { + "epoch": 2.2817047817047817, + "grad_norm": 2.4754276275634766, + "learning_rate": 3.3045649647597815e-05, + "loss": 0.2916, + "num_input_tokens_seen": 883280, + "step": 2195 + }, + { + "epoch": 2.286902286902287, + "grad_norm": 9.653176307678223, + "learning_rate": 3.2959709359741744e-05, + "loss": 0.2572, + "num_input_tokens_seen": 885328, + "step": 2200 + }, + { + "epoch": 2.2920997920997923, + "grad_norm": 16.368059158325195, + "learning_rate": 3.2873664271877584e-05, + "loss": 0.3062, + "num_input_tokens_seen": 887312, + "step": 2205 + }, + { + "epoch": 2.2972972972972974, + "grad_norm": 11.021875381469727, + "learning_rate": 3.278751551690172e-05, + "loss": 0.2672, + "num_input_tokens_seen": 889296, + "step": 2210 + }, + { + "epoch": 2.3024948024948024, + "grad_norm": 8.907588958740234, + "learning_rate": 3.270126422907544e-05, + "loss": 0.2647, + "num_input_tokens_seen": 891408, + "step": 2215 + }, + { + "epoch": 2.3076923076923075, + "grad_norm": 9.290825843811035, + "learning_rate": 3.261491154401001e-05, + "loss": 0.2884, + "num_input_tokens_seen": 893392, + "step": 2220 + }, + { + "epoch": 2.312889812889813, + "grad_norm": 4.591054916381836, + "learning_rate": 3.2528458598651734e-05, + "loss": 0.2719, + "num_input_tokens_seen": 895440, + "step": 2225 + }, + { + "epoch": 2.318087318087318, + "grad_norm": 14.931044578552246, + "learning_rate": 3.244190653126696e-05, + "loss": 0.2718, + "num_input_tokens_seen": 897616, + "step": 2230 + }, + { + "epoch": 2.323284823284823, + "grad_norm": 5.752501487731934, + "learning_rate": 3.2355256481427145e-05, + "loss": 0.2636, + "num_input_tokens_seen": 899536, + "step": 2235 + }, + { + "epoch": 2.3284823284823286, + "grad_norm": 10.545312881469727, + "learning_rate": 3.226850958999375e-05, + "loss": 0.2544, + "num_input_tokens_seen": 901648, + "step": 2240 + }, + { + "epoch": 2.3336798336798337, + "grad_norm": 0.47291961312294006, + "learning_rate": 3.2181666999103324e-05, + "loss": 0.2258, + "num_input_tokens_seen": 903696, + "step": 2245 + }, + { + "epoch": 2.3388773388773387, + "grad_norm": 12.981254577636719, + "learning_rate": 3.209472985215243e-05, + "loss": 0.3054, + "num_input_tokens_seen": 905552, + "step": 2250 + }, + { + "epoch": 2.3440748440748442, + "grad_norm": 6.684492588043213, + "learning_rate": 3.2007699293782555e-05, + "loss": 0.3446, + "num_input_tokens_seen": 907472, + "step": 2255 + }, + { + "epoch": 2.3492723492723493, + "grad_norm": 4.928536891937256, + "learning_rate": 3.1920576469865115e-05, + "loss": 0.2495, + "num_input_tokens_seen": 909584, + "step": 2260 + }, + { + "epoch": 2.3544698544698544, + "grad_norm": 6.033250331878662, + "learning_rate": 3.183336252748627e-05, + "loss": 0.2754, + "num_input_tokens_seen": 911632, + "step": 2265 + }, + { + "epoch": 2.35966735966736, + "grad_norm": 2.3870551586151123, + "learning_rate": 3.1746058614931916e-05, + "loss": 0.2604, + "num_input_tokens_seen": 913616, + "step": 2270 + }, + { + "epoch": 2.364864864864865, + "grad_norm": 18.541162490844727, + "learning_rate": 3.16586658816725e-05, + "loss": 0.2711, + "num_input_tokens_seen": 915728, + "step": 2275 + }, + { + "epoch": 2.37006237006237, + "grad_norm": 13.122420310974121, + "learning_rate": 3.157118547834793e-05, + "loss": 0.2566, + "num_input_tokens_seen": 917776, + "step": 2280 + }, + { + "epoch": 2.375259875259875, + "grad_norm": 12.414369583129883, + "learning_rate": 3.148361855675237e-05, + "loss": 0.2684, + "num_input_tokens_seen": 919952, + "step": 2285 + }, + { + "epoch": 2.3804573804573805, + "grad_norm": 7.519947052001953, + "learning_rate": 3.139596626981916e-05, + "loss": 0.2294, + "num_input_tokens_seen": 921872, + "step": 2290 + }, + { + "epoch": 2.3856548856548856, + "grad_norm": 8.675261497497559, + "learning_rate": 3.130822977160554e-05, + "loss": 0.2603, + "num_input_tokens_seen": 923856, + "step": 2295 + }, + { + "epoch": 2.390852390852391, + "grad_norm": 5.88022518157959, + "learning_rate": 3.122041021727755e-05, + "loss": 0.3942, + "num_input_tokens_seen": 925968, + "step": 2300 + }, + { + "epoch": 2.396049896049896, + "grad_norm": 14.03941535949707, + "learning_rate": 3.1132508763094715e-05, + "loss": 0.3128, + "num_input_tokens_seen": 927888, + "step": 2305 + }, + { + "epoch": 2.401247401247401, + "grad_norm": 15.206921577453613, + "learning_rate": 3.104452656639492e-05, + "loss": 0.2467, + "num_input_tokens_seen": 929808, + "step": 2310 + }, + { + "epoch": 2.4064449064449063, + "grad_norm": 1.0389469861984253, + "learning_rate": 3.0956464785579124e-05, + "loss": 0.1963, + "num_input_tokens_seen": 931728, + "step": 2315 + }, + { + "epoch": 2.4116424116424118, + "grad_norm": 9.624686241149902, + "learning_rate": 3.0868324580096114e-05, + "loss": 0.3533, + "num_input_tokens_seen": 933840, + "step": 2320 + }, + { + "epoch": 2.416839916839917, + "grad_norm": 1.1855783462524414, + "learning_rate": 3.078010711042723e-05, + "loss": 0.2936, + "num_input_tokens_seen": 935824, + "step": 2325 + }, + { + "epoch": 2.422037422037422, + "grad_norm": 4.064991474151611, + "learning_rate": 3.0691813538071105e-05, + "loss": 0.274, + "num_input_tokens_seen": 937872, + "step": 2330 + }, + { + "epoch": 2.4272349272349274, + "grad_norm": 26.271160125732422, + "learning_rate": 3.0603445025528376e-05, + "loss": 0.3378, + "num_input_tokens_seen": 939984, + "step": 2335 + }, + { + "epoch": 2.4324324324324325, + "grad_norm": 12.682053565979004, + "learning_rate": 3.051500273628633e-05, + "loss": 0.2418, + "num_input_tokens_seen": 941968, + "step": 2340 + }, + { + "epoch": 2.4376299376299375, + "grad_norm": 3.6713008880615234, + "learning_rate": 3.0426487834803657e-05, + "loss": 0.2943, + "num_input_tokens_seen": 943952, + "step": 2345 + }, + { + "epoch": 2.442827442827443, + "grad_norm": 19.096328735351562, + "learning_rate": 3.0337901486495073e-05, + "loss": 0.2435, + "num_input_tokens_seen": 945872, + "step": 2350 + }, + { + "epoch": 2.448024948024948, + "grad_norm": 4.218629360198975, + "learning_rate": 3.0249244857715976e-05, + "loss": 0.267, + "num_input_tokens_seen": 947856, + "step": 2355 + }, + { + "epoch": 2.453222453222453, + "grad_norm": 0.270999550819397, + "learning_rate": 3.01605191157471e-05, + "loss": 0.2452, + "num_input_tokens_seen": 949840, + "step": 2360 + }, + { + "epoch": 2.4584199584199586, + "grad_norm": 1.739176630973816, + "learning_rate": 3.007172542877915e-05, + "loss": 0.2342, + "num_input_tokens_seen": 951760, + "step": 2365 + }, + { + "epoch": 2.4636174636174637, + "grad_norm": 13.98282241821289, + "learning_rate": 2.998286496589742e-05, + "loss": 0.3294, + "num_input_tokens_seen": 953680, + "step": 2370 + }, + { + "epoch": 2.4688149688149688, + "grad_norm": 9.587896347045898, + "learning_rate": 2.9893938897066393e-05, + "loss": 0.2417, + "num_input_tokens_seen": 955600, + "step": 2375 + }, + { + "epoch": 2.474012474012474, + "grad_norm": 6.101572036743164, + "learning_rate": 2.9804948393114324e-05, + "loss": 0.2781, + "num_input_tokens_seen": 957456, + "step": 2380 + }, + { + "epoch": 2.4792099792099793, + "grad_norm": 5.505262851715088, + "learning_rate": 2.9715894625717866e-05, + "loss": 0.2721, + "num_input_tokens_seen": 959504, + "step": 2385 + }, + { + "epoch": 2.4844074844074844, + "grad_norm": 0.05719423666596413, + "learning_rate": 2.9626778767386604e-05, + "loss": 0.277, + "num_input_tokens_seen": 961488, + "step": 2390 + }, + { + "epoch": 2.4896049896049894, + "grad_norm": 17.471576690673828, + "learning_rate": 2.953760199144764e-05, + "loss": 0.2759, + "num_input_tokens_seen": 963408, + "step": 2395 + }, + { + "epoch": 2.494802494802495, + "grad_norm": 12.931529998779297, + "learning_rate": 2.9448365472030115e-05, + "loss": 0.2633, + "num_input_tokens_seen": 965392, + "step": 2400 + }, + { + "epoch": 2.5, + "grad_norm": 8.689949989318848, + "learning_rate": 2.935907038404981e-05, + "loss": 0.2744, + "num_input_tokens_seen": 967440, + "step": 2405 + }, + { + "epoch": 2.505197505197505, + "grad_norm": 1.9627736806869507, + "learning_rate": 2.92697179031936e-05, + "loss": 0.2379, + "num_input_tokens_seen": 969360, + "step": 2410 + }, + { + "epoch": 2.505197505197505, + "eval_loss": 0.2576568126678467, + "eval_runtime": 1.0822, + "eval_samples_per_second": 790.985, + "eval_steps_per_second": 98.873, + "num_input_tokens_seen": 969360, + "step": 2410 + }, + { + "epoch": 2.51039501039501, + "grad_norm": 0.891659140586853, + "learning_rate": 2.9180309205904027e-05, + "loss": 0.2923, + "num_input_tokens_seen": 971472, + "step": 2415 + }, + { + "epoch": 2.5155925155925156, + "grad_norm": 2.514449119567871, + "learning_rate": 2.9090845469363805e-05, + "loss": 0.296, + "num_input_tokens_seen": 973456, + "step": 2420 + }, + { + "epoch": 2.5207900207900207, + "grad_norm": 19.587871551513672, + "learning_rate": 2.9001327871480294e-05, + "loss": 0.2911, + "num_input_tokens_seen": 975504, + "step": 2425 + }, + { + "epoch": 2.525987525987526, + "grad_norm": 16.2788143157959, + "learning_rate": 2.8911757590870027e-05, + "loss": 0.285, + "num_input_tokens_seen": 977552, + "step": 2430 + }, + { + "epoch": 2.5311850311850312, + "grad_norm": 21.12313461303711, + "learning_rate": 2.8822135806843154e-05, + "loss": 0.2552, + "num_input_tokens_seen": 979536, + "step": 2435 + }, + { + "epoch": 2.5363825363825363, + "grad_norm": 1.4399539232254028, + "learning_rate": 2.8732463699387968e-05, + "loss": 0.2906, + "num_input_tokens_seen": 981584, + "step": 2440 + }, + { + "epoch": 2.5415800415800414, + "grad_norm": 13.594979286193848, + "learning_rate": 2.8642742449155284e-05, + "loss": 0.2795, + "num_input_tokens_seen": 983632, + "step": 2445 + }, + { + "epoch": 2.546777546777547, + "grad_norm": 16.668123245239258, + "learning_rate": 2.855297323744301e-05, + "loss": 0.228, + "num_input_tokens_seen": 985680, + "step": 2450 + }, + { + "epoch": 2.551975051975052, + "grad_norm": 1.3556967973709106, + "learning_rate": 2.8463157246180468e-05, + "loss": 0.2414, + "num_input_tokens_seen": 987664, + "step": 2455 + }, + { + "epoch": 2.5571725571725574, + "grad_norm": 8.519729614257812, + "learning_rate": 2.8373295657912945e-05, + "loss": 0.2636, + "num_input_tokens_seen": 989648, + "step": 2460 + }, + { + "epoch": 2.5623700623700625, + "grad_norm": 2.2857918739318848, + "learning_rate": 2.828338965578603e-05, + "loss": 0.2691, + "num_input_tokens_seen": 991696, + "step": 2465 + }, + { + "epoch": 2.5675675675675675, + "grad_norm": 5.966533184051514, + "learning_rate": 2.8193440423530114e-05, + "loss": 0.2598, + "num_input_tokens_seen": 993616, + "step": 2470 + }, + { + "epoch": 2.5727650727650726, + "grad_norm": 2.139225482940674, + "learning_rate": 2.810344914544475e-05, + "loss": 0.2688, + "num_input_tokens_seen": 995664, + "step": 2475 + }, + { + "epoch": 2.577962577962578, + "grad_norm": 1.0499998331069946, + "learning_rate": 2.8013417006383076e-05, + "loss": 0.295, + "num_input_tokens_seen": 997648, + "step": 2480 + }, + { + "epoch": 2.583160083160083, + "grad_norm": 8.98536205291748, + "learning_rate": 2.792334519173624e-05, + "loss": 0.2802, + "num_input_tokens_seen": 999696, + "step": 2485 + }, + { + "epoch": 2.5883575883575882, + "grad_norm": 9.025850296020508, + "learning_rate": 2.7833234887417743e-05, + "loss": 0.2897, + "num_input_tokens_seen": 1001680, + "step": 2490 + }, + { + "epoch": 2.5935550935550937, + "grad_norm": 4.961789131164551, + "learning_rate": 2.7743087279847868e-05, + "loss": 0.2723, + "num_input_tokens_seen": 1003728, + "step": 2495 + }, + { + "epoch": 2.598752598752599, + "grad_norm": 11.652027130126953, + "learning_rate": 2.765290355593805e-05, + "loss": 0.2874, + "num_input_tokens_seen": 1005584, + "step": 2500 + }, + { + "epoch": 2.603950103950104, + "grad_norm": 16.368242263793945, + "learning_rate": 2.7562684903075238e-05, + "loss": 0.2405, + "num_input_tokens_seen": 1007696, + "step": 2505 + }, + { + "epoch": 2.609147609147609, + "grad_norm": 12.281315803527832, + "learning_rate": 2.7472432509106248e-05, + "loss": 0.2737, + "num_input_tokens_seen": 1009680, + "step": 2510 + }, + { + "epoch": 2.6143451143451144, + "grad_norm": 16.369632720947266, + "learning_rate": 2.7382147562322174e-05, + "loss": 0.2753, + "num_input_tokens_seen": 1011728, + "step": 2515 + }, + { + "epoch": 2.6195426195426195, + "grad_norm": 3.395531177520752, + "learning_rate": 2.729183125144269e-05, + "loss": 0.2553, + "num_input_tokens_seen": 1013840, + "step": 2520 + }, + { + "epoch": 2.624740124740125, + "grad_norm": 7.065828323364258, + "learning_rate": 2.7201484765600426e-05, + "loss": 0.2564, + "num_input_tokens_seen": 1015824, + "step": 2525 + }, + { + "epoch": 2.62993762993763, + "grad_norm": 2.8372550010681152, + "learning_rate": 2.7111109294325297e-05, + "loss": 0.277, + "num_input_tokens_seen": 1017744, + "step": 2530 + }, + { + "epoch": 2.635135135135135, + "grad_norm": 12.833436012268066, + "learning_rate": 2.702070602752887e-05, + "loss": 0.2439, + "num_input_tokens_seen": 1019728, + "step": 2535 + }, + { + "epoch": 2.64033264033264, + "grad_norm": 0.17026355862617493, + "learning_rate": 2.693027615548864e-05, + "loss": 0.2958, + "num_input_tokens_seen": 1021840, + "step": 2540 + }, + { + "epoch": 2.6455301455301456, + "grad_norm": 10.469789505004883, + "learning_rate": 2.6839820868832433e-05, + "loss": 0.2809, + "num_input_tokens_seen": 1023824, + "step": 2545 + }, + { + "epoch": 2.6507276507276507, + "grad_norm": 10.419620513916016, + "learning_rate": 2.6749341358522674e-05, + "loss": 0.2583, + "num_input_tokens_seen": 1025616, + "step": 2550 + }, + { + "epoch": 2.6559251559251558, + "grad_norm": 3.5157597064971924, + "learning_rate": 2.665883881584072e-05, + "loss": 0.2494, + "num_input_tokens_seen": 1027664, + "step": 2555 + }, + { + "epoch": 2.6611226611226613, + "grad_norm": 1.5977754592895508, + "learning_rate": 2.6568314432371183e-05, + "loss": 0.2477, + "num_input_tokens_seen": 1029648, + "step": 2560 + }, + { + "epoch": 2.6663201663201663, + "grad_norm": 1.0980393886566162, + "learning_rate": 2.6477769399986245e-05, + "loss": 0.2402, + "num_input_tokens_seen": 1031632, + "step": 2565 + }, + { + "epoch": 2.6715176715176714, + "grad_norm": 8.981844902038574, + "learning_rate": 2.6387204910829956e-05, + "loss": 0.2583, + "num_input_tokens_seen": 1033488, + "step": 2570 + }, + { + "epoch": 2.6767151767151764, + "grad_norm": 3.0374419689178467, + "learning_rate": 2.629662215730253e-05, + "loss": 0.2162, + "num_input_tokens_seen": 1035536, + "step": 2575 + }, + { + "epoch": 2.681912681912682, + "grad_norm": 5.767524242401123, + "learning_rate": 2.6206022332044667e-05, + "loss": 0.2652, + "num_input_tokens_seen": 1037584, + "step": 2580 + }, + { + "epoch": 2.687110187110187, + "grad_norm": 0.40257641673088074, + "learning_rate": 2.6115406627921825e-05, + "loss": 0.2401, + "num_input_tokens_seen": 1039568, + "step": 2585 + }, + { + "epoch": 2.6923076923076925, + "grad_norm": 1.3719632625579834, + "learning_rate": 2.6024776238008543e-05, + "loss": 0.2416, + "num_input_tokens_seen": 1041616, + "step": 2590 + }, + { + "epoch": 2.6975051975051976, + "grad_norm": 0.23526664078235626, + "learning_rate": 2.593413235557271e-05, + "loss": 0.2479, + "num_input_tokens_seen": 1043664, + "step": 2595 + }, + { + "epoch": 2.7027027027027026, + "grad_norm": 5.976350784301758, + "learning_rate": 2.5843476174059872e-05, + "loss": 0.2624, + "num_input_tokens_seen": 1045520, + "step": 2600 + }, + { + "epoch": 2.7079002079002077, + "grad_norm": 1.9363540410995483, + "learning_rate": 2.5752808887077477e-05, + "loss": 0.2519, + "num_input_tokens_seen": 1047376, + "step": 2605 + }, + { + "epoch": 2.713097713097713, + "grad_norm": 0.9820289611816406, + "learning_rate": 2.5662131688379242e-05, + "loss": 0.2347, + "num_input_tokens_seen": 1049360, + "step": 2610 + }, + { + "epoch": 2.7182952182952183, + "grad_norm": 6.348036766052246, + "learning_rate": 2.5571445771849327e-05, + "loss": 0.2785, + "num_input_tokens_seen": 1051344, + "step": 2615 + }, + { + "epoch": 2.7234927234927238, + "grad_norm": 2.1040618419647217, + "learning_rate": 2.548075233148674e-05, + "loss": 0.2622, + "num_input_tokens_seen": 1053264, + "step": 2620 + }, + { + "epoch": 2.728690228690229, + "grad_norm": 3.914247989654541, + "learning_rate": 2.5390052561389478e-05, + "loss": 0.2798, + "num_input_tokens_seen": 1055248, + "step": 2625 + }, + { + "epoch": 2.733887733887734, + "grad_norm": 10.045319557189941, + "learning_rate": 2.529934765573893e-05, + "loss": 0.2568, + "num_input_tokens_seen": 1057104, + "step": 2630 + }, + { + "epoch": 2.739085239085239, + "grad_norm": 6.609117031097412, + "learning_rate": 2.520863880878408e-05, + "loss": 0.2622, + "num_input_tokens_seen": 1059024, + "step": 2635 + }, + { + "epoch": 2.7442827442827444, + "grad_norm": 8.553672790527344, + "learning_rate": 2.511792721482581e-05, + "loss": 0.2707, + "num_input_tokens_seen": 1060944, + "step": 2640 + }, + { + "epoch": 2.7494802494802495, + "grad_norm": 6.869534969329834, + "learning_rate": 2.502721406820116e-05, + "loss": 0.2525, + "num_input_tokens_seen": 1062992, + "step": 2645 + }, + { + "epoch": 2.7546777546777546, + "grad_norm": 8.741276741027832, + "learning_rate": 2.4936500563267627e-05, + "loss": 0.2934, + "num_input_tokens_seen": 1064848, + "step": 2650 + }, + { + "epoch": 2.7557172557172556, + "eval_loss": 0.2561495900154114, + "eval_runtime": 1.071, + "eval_samples_per_second": 799.235, + "eval_steps_per_second": 99.904, + "num_input_tokens_seen": 1065232, + "step": 2651 + }, + { + "epoch": 2.75987525987526, + "grad_norm": 10.544535636901855, + "learning_rate": 2.4845787894387425e-05, + "loss": 0.2493, + "num_input_tokens_seen": 1066832, + "step": 2655 + }, + { + "epoch": 2.765072765072765, + "grad_norm": 7.622214317321777, + "learning_rate": 2.4755077255911743e-05, + "loss": 0.2661, + "num_input_tokens_seen": 1068880, + "step": 2660 + }, + { + "epoch": 2.77027027027027, + "grad_norm": 7.094521522521973, + "learning_rate": 2.4664369842165068e-05, + "loss": 0.2398, + "num_input_tokens_seen": 1070864, + "step": 2665 + }, + { + "epoch": 2.7754677754677752, + "grad_norm": 9.394824981689453, + "learning_rate": 2.4573666847429384e-05, + "loss": 0.2523, + "num_input_tokens_seen": 1072848, + "step": 2670 + }, + { + "epoch": 2.7806652806652807, + "grad_norm": 5.644352436065674, + "learning_rate": 2.4482969465928543e-05, + "loss": 0.3167, + "num_input_tokens_seen": 1074832, + "step": 2675 + }, + { + "epoch": 2.785862785862786, + "grad_norm": 11.34897232055664, + "learning_rate": 2.4392278891812455e-05, + "loss": 0.2951, + "num_input_tokens_seen": 1076944, + "step": 2680 + }, + { + "epoch": 2.7910602910602913, + "grad_norm": 4.7796196937561035, + "learning_rate": 2.430159631914141e-05, + "loss": 0.2844, + "num_input_tokens_seen": 1078800, + "step": 2685 + }, + { + "epoch": 2.7962577962577964, + "grad_norm": 6.175029277801514, + "learning_rate": 2.4210922941870367e-05, + "loss": 0.2706, + "num_input_tokens_seen": 1080912, + "step": 2690 + }, + { + "epoch": 2.8014553014553014, + "grad_norm": 2.2498137950897217, + "learning_rate": 2.41202599538332e-05, + "loss": 0.244, + "num_input_tokens_seen": 1082960, + "step": 2695 + }, + { + "epoch": 2.8066528066528065, + "grad_norm": 14.539408683776855, + "learning_rate": 2.402960854872697e-05, + "loss": 0.2877, + "num_input_tokens_seen": 1085008, + "step": 2700 + }, + { + "epoch": 2.811850311850312, + "grad_norm": 6.818408489227295, + "learning_rate": 2.39389699200963e-05, + "loss": 0.1818, + "num_input_tokens_seen": 1087184, + "step": 2705 + }, + { + "epoch": 2.817047817047817, + "grad_norm": 8.152698516845703, + "learning_rate": 2.384834526131752e-05, + "loss": 0.2384, + "num_input_tokens_seen": 1089104, + "step": 2710 + }, + { + "epoch": 2.822245322245322, + "grad_norm": 0.4875684976577759, + "learning_rate": 2.3757735765583083e-05, + "loss": 0.2707, + "num_input_tokens_seen": 1091024, + "step": 2715 + }, + { + "epoch": 2.8274428274428276, + "grad_norm": 0.5857343077659607, + "learning_rate": 2.366714262588577e-05, + "loss": 0.2399, + "num_input_tokens_seen": 1093008, + "step": 2720 + }, + { + "epoch": 2.8326403326403327, + "grad_norm": 0.10867218673229218, + "learning_rate": 2.3576567035003027e-05, + "loss": 0.2595, + "num_input_tokens_seen": 1094992, + "step": 2725 + }, + { + "epoch": 2.8378378378378377, + "grad_norm": 5.911508083343506, + "learning_rate": 2.3486010185481248e-05, + "loss": 0.2918, + "num_input_tokens_seen": 1097040, + "step": 2730 + }, + { + "epoch": 2.8430353430353428, + "grad_norm": 12.04796314239502, + "learning_rate": 2.3395473269620056e-05, + "loss": 0.274, + "num_input_tokens_seen": 1098960, + "step": 2735 + }, + { + "epoch": 2.8482328482328483, + "grad_norm": 15.308754920959473, + "learning_rate": 2.330495747945665e-05, + "loss": 0.2749, + "num_input_tokens_seen": 1101200, + "step": 2740 + }, + { + "epoch": 2.8534303534303533, + "grad_norm": 16.627357482910156, + "learning_rate": 2.321446400675005e-05, + "loss": 0.2766, + "num_input_tokens_seen": 1103120, + "step": 2745 + }, + { + "epoch": 2.858627858627859, + "grad_norm": 20.289390563964844, + "learning_rate": 2.3123994042965453e-05, + "loss": 0.255, + "num_input_tokens_seen": 1105168, + "step": 2750 + }, + { + "epoch": 2.863825363825364, + "grad_norm": 8.598325729370117, + "learning_rate": 2.3033548779258535e-05, + "loss": 0.2452, + "num_input_tokens_seen": 1107152, + "step": 2755 + }, + { + "epoch": 2.869022869022869, + "grad_norm": 13.070589065551758, + "learning_rate": 2.294312940645975e-05, + "loss": 0.3016, + "num_input_tokens_seen": 1109200, + "step": 2760 + }, + { + "epoch": 2.874220374220374, + "grad_norm": 2.4811654090881348, + "learning_rate": 2.2852737115058682e-05, + "loss": 0.282, + "num_input_tokens_seen": 1111248, + "step": 2765 + }, + { + "epoch": 2.8794178794178795, + "grad_norm": 9.034327507019043, + "learning_rate": 2.276237309518834e-05, + "loss": 0.2753, + "num_input_tokens_seen": 1113232, + "step": 2770 + }, + { + "epoch": 2.8846153846153846, + "grad_norm": 0.18150383234024048, + "learning_rate": 2.2672038536609487e-05, + "loss": 0.268, + "num_input_tokens_seen": 1115216, + "step": 2775 + }, + { + "epoch": 2.88981288981289, + "grad_norm": 4.699392318725586, + "learning_rate": 2.2581734628695034e-05, + "loss": 0.2816, + "num_input_tokens_seen": 1117264, + "step": 2780 + }, + { + "epoch": 2.895010395010395, + "grad_norm": 4.98245906829834, + "learning_rate": 2.2491462560414287e-05, + "loss": 0.2795, + "num_input_tokens_seen": 1119376, + "step": 2785 + }, + { + "epoch": 2.9002079002079, + "grad_norm": 7.173026084899902, + "learning_rate": 2.2401223520317362e-05, + "loss": 0.283, + "num_input_tokens_seen": 1121424, + "step": 2790 + }, + { + "epoch": 2.9054054054054053, + "grad_norm": 1.0886781215667725, + "learning_rate": 2.2311018696519532e-05, + "loss": 0.2663, + "num_input_tokens_seen": 1123472, + "step": 2795 + }, + { + "epoch": 2.9106029106029108, + "grad_norm": 3.959348440170288, + "learning_rate": 2.222084927668553e-05, + "loss": 0.218, + "num_input_tokens_seen": 1125584, + "step": 2800 + }, + { + "epoch": 2.915800415800416, + "grad_norm": 18.90048599243164, + "learning_rate": 2.2130716448014e-05, + "loss": 0.2474, + "num_input_tokens_seen": 1127568, + "step": 2805 + }, + { + "epoch": 2.920997920997921, + "grad_norm": 19.015106201171875, + "learning_rate": 2.204062139722176e-05, + "loss": 0.3308, + "num_input_tokens_seen": 1129552, + "step": 2810 + }, + { + "epoch": 2.9261954261954264, + "grad_norm": 3.917026996612549, + "learning_rate": 2.1950565310528266e-05, + "loss": 0.2914, + "num_input_tokens_seen": 1131472, + "step": 2815 + }, + { + "epoch": 2.9313929313929314, + "grad_norm": 11.03906536102295, + "learning_rate": 2.186054937363996e-05, + "loss": 0.3008, + "num_input_tokens_seen": 1133392, + "step": 2820 + }, + { + "epoch": 2.9365904365904365, + "grad_norm": 9.081315040588379, + "learning_rate": 2.1770574771734642e-05, + "loss": 0.2747, + "num_input_tokens_seen": 1135440, + "step": 2825 + }, + { + "epoch": 2.9417879417879416, + "grad_norm": 1.4751437902450562, + "learning_rate": 2.168064268944591e-05, + "loss": 0.2694, + "num_input_tokens_seen": 1137424, + "step": 2830 + }, + { + "epoch": 2.946985446985447, + "grad_norm": 0.2908379137516022, + "learning_rate": 2.159075431084751e-05, + "loss": 0.2574, + "num_input_tokens_seen": 1139408, + "step": 2835 + }, + { + "epoch": 2.952182952182952, + "grad_norm": 6.697641372680664, + "learning_rate": 2.1500910819437766e-05, + "loss": 0.2677, + "num_input_tokens_seen": 1141456, + "step": 2840 + }, + { + "epoch": 2.9573804573804576, + "grad_norm": 0.9215155243873596, + "learning_rate": 2.141111339812405e-05, + "loss": 0.2513, + "num_input_tokens_seen": 1143440, + "step": 2845 + }, + { + "epoch": 2.9625779625779627, + "grad_norm": 0.976637601852417, + "learning_rate": 2.1321363229207096e-05, + "loss": 0.256, + "num_input_tokens_seen": 1145360, + "step": 2850 + }, + { + "epoch": 2.9677754677754677, + "grad_norm": 13.551946640014648, + "learning_rate": 2.123166149436556e-05, + "loss": 0.2779, + "num_input_tokens_seen": 1147280, + "step": 2855 + }, + { + "epoch": 2.972972972972973, + "grad_norm": 11.918627738952637, + "learning_rate": 2.114200937464035e-05, + "loss": 0.2814, + "num_input_tokens_seen": 1149200, + "step": 2860 + }, + { + "epoch": 2.9781704781704783, + "grad_norm": 19.893056869506836, + "learning_rate": 2.1052408050419152e-05, + "loss": 0.2671, + "num_input_tokens_seen": 1151184, + "step": 2865 + }, + { + "epoch": 2.9833679833679834, + "grad_norm": 12.081989288330078, + "learning_rate": 2.0962858701420866e-05, + "loss": 0.2391, + "num_input_tokens_seen": 1153232, + "step": 2870 + }, + { + "epoch": 2.9885654885654884, + "grad_norm": 9.680088996887207, + "learning_rate": 2.0873362506680057e-05, + "loss": 0.251, + "num_input_tokens_seen": 1155216, + "step": 2875 + }, + { + "epoch": 2.993762993762994, + "grad_norm": 7.104877471923828, + "learning_rate": 2.078392064453144e-05, + "loss": 0.2661, + "num_input_tokens_seen": 1157264, + "step": 2880 + }, + { + "epoch": 2.998960498960499, + "grad_norm": 0.48920291662216187, + "learning_rate": 2.0694534292594392e-05, + "loss": 0.2609, + "num_input_tokens_seen": 1159312, + "step": 2885 + }, + { + "epoch": 3.004158004158004, + "grad_norm": 7.250494003295898, + "learning_rate": 2.0605204627757403e-05, + "loss": 0.2209, + "num_input_tokens_seen": 1161248, + "step": 2890 + }, + { + "epoch": 3.006237006237006, + "eval_loss": 0.257083535194397, + "eval_runtime": 1.0821, + "eval_samples_per_second": 791.084, + "eval_steps_per_second": 98.885, + "num_input_tokens_seen": 1162016, + "step": 2892 + }, + { + "epoch": 3.0093555093555096, + "grad_norm": 14.574300765991211, + "learning_rate": 2.051593282616262e-05, + "loss": 0.2146, + "num_input_tokens_seen": 1163168, + "step": 2895 + }, + { + "epoch": 3.0145530145530146, + "grad_norm": 15.882224082946777, + "learning_rate": 2.0426720063190335e-05, + "loss": 0.2637, + "num_input_tokens_seen": 1165088, + "step": 2900 + }, + { + "epoch": 3.0197505197505197, + "grad_norm": 17.72052574157715, + "learning_rate": 2.033756751344352e-05, + "loss": 0.2303, + "num_input_tokens_seen": 1167136, + "step": 2905 + }, + { + "epoch": 3.024948024948025, + "grad_norm": 6.26023530960083, + "learning_rate": 2.0248476350732368e-05, + "loss": 0.2915, + "num_input_tokens_seen": 1169120, + "step": 2910 + }, + { + "epoch": 3.0301455301455302, + "grad_norm": 10.183695793151855, + "learning_rate": 2.0159447748058805e-05, + "loss": 0.3333, + "num_input_tokens_seen": 1171040, + "step": 2915 + }, + { + "epoch": 3.0353430353430353, + "grad_norm": 5.654576778411865, + "learning_rate": 2.0070482877601127e-05, + "loss": 0.2142, + "num_input_tokens_seen": 1173024, + "step": 2920 + }, + { + "epoch": 3.0405405405405403, + "grad_norm": 6.201435565948486, + "learning_rate": 1.998158291069845e-05, + "loss": 0.2912, + "num_input_tokens_seen": 1174944, + "step": 2925 + }, + { + "epoch": 3.045738045738046, + "grad_norm": 6.677492141723633, + "learning_rate": 1.9892749017835384e-05, + "loss": 0.2799, + "num_input_tokens_seen": 1177056, + "step": 2930 + }, + { + "epoch": 3.050935550935551, + "grad_norm": 22.7122859954834, + "learning_rate": 1.9803982368626583e-05, + "loss": 0.318, + "num_input_tokens_seen": 1178976, + "step": 2935 + }, + { + "epoch": 3.056133056133056, + "grad_norm": 8.921732902526855, + "learning_rate": 1.9715284131801353e-05, + "loss": 0.2836, + "num_input_tokens_seen": 1181024, + "step": 2940 + }, + { + "epoch": 3.0613305613305615, + "grad_norm": 1.3563765287399292, + "learning_rate": 1.9626655475188238e-05, + "loss": 0.2515, + "num_input_tokens_seen": 1183008, + "step": 2945 + }, + { + "epoch": 3.0665280665280665, + "grad_norm": 9.756816864013672, + "learning_rate": 1.953809756569971e-05, + "loss": 0.2949, + "num_input_tokens_seen": 1185056, + "step": 2950 + }, + { + "epoch": 3.0717255717255716, + "grad_norm": 10.324029922485352, + "learning_rate": 1.9449611569316717e-05, + "loss": 0.2646, + "num_input_tokens_seen": 1186976, + "step": 2955 + }, + { + "epoch": 3.076923076923077, + "grad_norm": 1.5440117120742798, + "learning_rate": 1.9361198651073408e-05, + "loss": 0.3027, + "num_input_tokens_seen": 1188960, + "step": 2960 + }, + { + "epoch": 3.082120582120582, + "grad_norm": 11.017732620239258, + "learning_rate": 1.9272859975041754e-05, + "loss": 0.2629, + "num_input_tokens_seen": 1190944, + "step": 2965 + }, + { + "epoch": 3.087318087318087, + "grad_norm": 19.006444931030273, + "learning_rate": 1.918459670431622e-05, + "loss": 0.2261, + "num_input_tokens_seen": 1192928, + "step": 2970 + }, + { + "epoch": 3.0925155925155927, + "grad_norm": 7.811370849609375, + "learning_rate": 1.9096410000998475e-05, + "loss": 0.239, + "num_input_tokens_seen": 1194848, + "step": 2975 + }, + { + "epoch": 3.0977130977130978, + "grad_norm": 1.5552674531936646, + "learning_rate": 1.900830102618206e-05, + "loss": 0.2484, + "num_input_tokens_seen": 1196768, + "step": 2980 + }, + { + "epoch": 3.102910602910603, + "grad_norm": 9.481167793273926, + "learning_rate": 1.892027093993716e-05, + "loss": 0.2739, + "num_input_tokens_seen": 1198688, + "step": 2985 + }, + { + "epoch": 3.108108108108108, + "grad_norm": 8.231619834899902, + "learning_rate": 1.8832320901295227e-05, + "loss": 0.2701, + "num_input_tokens_seen": 1200672, + "step": 2990 + }, + { + "epoch": 3.1133056133056134, + "grad_norm": 9.055398941040039, + "learning_rate": 1.8744452068233825e-05, + "loss": 0.29, + "num_input_tokens_seen": 1202720, + "step": 2995 + }, + { + "epoch": 3.1185031185031185, + "grad_norm": 1.7919214963912964, + "learning_rate": 1.8656665597661333e-05, + "loss": 0.2816, + "num_input_tokens_seen": 1204768, + "step": 3000 + }, + { + "epoch": 3.1237006237006235, + "grad_norm": 9.331473350524902, + "learning_rate": 1.85689626454017e-05, + "loss": 0.2677, + "num_input_tokens_seen": 1206944, + "step": 3005 + }, + { + "epoch": 3.128898128898129, + "grad_norm": 9.339173316955566, + "learning_rate": 1.8481344366179284e-05, + "loss": 0.2308, + "num_input_tokens_seen": 1209056, + "step": 3010 + }, + { + "epoch": 3.134095634095634, + "grad_norm": 0.4089166224002838, + "learning_rate": 1.839381191360358e-05, + "loss": 0.2745, + "num_input_tokens_seen": 1210976, + "step": 3015 + }, + { + "epoch": 3.139293139293139, + "grad_norm": 13.044018745422363, + "learning_rate": 1.8306366440154066e-05, + "loss": 0.2645, + "num_input_tokens_seen": 1213024, + "step": 3020 + }, + { + "epoch": 3.1444906444906446, + "grad_norm": 3.4399261474609375, + "learning_rate": 1.821900909716504e-05, + "loss": 0.2854, + "num_input_tokens_seen": 1215136, + "step": 3025 + }, + { + "epoch": 3.1496881496881497, + "grad_norm": 16.901412963867188, + "learning_rate": 1.8131741034810435e-05, + "loss": 0.2667, + "num_input_tokens_seen": 1217056, + "step": 3030 + }, + { + "epoch": 3.1548856548856548, + "grad_norm": 4.719562530517578, + "learning_rate": 1.8044563402088684e-05, + "loss": 0.2799, + "num_input_tokens_seen": 1219168, + "step": 3035 + }, + { + "epoch": 3.1600831600831603, + "grad_norm": 0.4354883134365082, + "learning_rate": 1.795747734680762e-05, + "loss": 0.2724, + "num_input_tokens_seen": 1221088, + "step": 3040 + }, + { + "epoch": 3.1652806652806653, + "grad_norm": 4.838202953338623, + "learning_rate": 1.7870484015569306e-05, + "loss": 0.2666, + "num_input_tokens_seen": 1223264, + "step": 3045 + }, + { + "epoch": 3.1704781704781704, + "grad_norm": 0.40550848841667175, + "learning_rate": 1.7783584553755006e-05, + "loss": 0.2586, + "num_input_tokens_seen": 1225440, + "step": 3050 + }, + { + "epoch": 3.175675675675676, + "grad_norm": 8.755316734313965, + "learning_rate": 1.769678010551003e-05, + "loss": 0.2519, + "num_input_tokens_seen": 1227424, + "step": 3055 + }, + { + "epoch": 3.180873180873181, + "grad_norm": 8.232521057128906, + "learning_rate": 1.761007181372874e-05, + "loss": 0.241, + "num_input_tokens_seen": 1229344, + "step": 3060 + }, + { + "epoch": 3.186070686070686, + "grad_norm": 7.669497013092041, + "learning_rate": 1.7523460820039464e-05, + "loss": 0.2406, + "num_input_tokens_seen": 1231456, + "step": 3065 + }, + { + "epoch": 3.1912681912681915, + "grad_norm": 12.419413566589355, + "learning_rate": 1.7436948264789466e-05, + "loss": 0.3145, + "num_input_tokens_seen": 1233440, + "step": 3070 + }, + { + "epoch": 3.1964656964656966, + "grad_norm": 2.3379440307617188, + "learning_rate": 1.7350535287029957e-05, + "loss": 0.2568, + "num_input_tokens_seen": 1235552, + "step": 3075 + }, + { + "epoch": 3.2016632016632016, + "grad_norm": 10.220464706420898, + "learning_rate": 1.7264223024501064e-05, + "loss": 0.2696, + "num_input_tokens_seen": 1237536, + "step": 3080 + }, + { + "epoch": 3.2068607068607067, + "grad_norm": 17.75920867919922, + "learning_rate": 1.717801261361685e-05, + "loss": 0.2861, + "num_input_tokens_seen": 1239584, + "step": 3085 + }, + { + "epoch": 3.212058212058212, + "grad_norm": 7.69419002532959, + "learning_rate": 1.7091905189450423e-05, + "loss": 0.2501, + "num_input_tokens_seen": 1241504, + "step": 3090 + }, + { + "epoch": 3.2172557172557172, + "grad_norm": 6.530004501342773, + "learning_rate": 1.700590188571887e-05, + "loss": 0.2578, + "num_input_tokens_seen": 1243552, + "step": 3095 + }, + { + "epoch": 3.2224532224532223, + "grad_norm": 2.1304476261138916, + "learning_rate": 1.6920003834768438e-05, + "loss": 0.3075, + "num_input_tokens_seen": 1245600, + "step": 3100 + }, + { + "epoch": 3.227650727650728, + "grad_norm": 19.96734046936035, + "learning_rate": 1.6834212167559575e-05, + "loss": 0.2389, + "num_input_tokens_seen": 1247712, + "step": 3105 + }, + { + "epoch": 3.232848232848233, + "grad_norm": 12.024674415588379, + "learning_rate": 1.674852801365203e-05, + "loss": 0.26, + "num_input_tokens_seen": 1249696, + "step": 3110 + }, + { + "epoch": 3.238045738045738, + "grad_norm": 6.835387229919434, + "learning_rate": 1.6662952501190033e-05, + "loss": 0.3027, + "num_input_tokens_seen": 1251808, + "step": 3115 + }, + { + "epoch": 3.2432432432432434, + "grad_norm": 8.725172996520996, + "learning_rate": 1.6577486756887374e-05, + "loss": 0.2315, + "num_input_tokens_seen": 1253728, + "step": 3120 + }, + { + "epoch": 3.2484407484407485, + "grad_norm": 0.420453816652298, + "learning_rate": 1.649213190601261e-05, + "loss": 0.249, + "num_input_tokens_seen": 1255840, + "step": 3125 + }, + { + "epoch": 3.2536382536382535, + "grad_norm": 8.639700889587402, + "learning_rate": 1.640688907237425e-05, + "loss": 0.2647, + "num_input_tokens_seen": 1257888, + "step": 3130 + }, + { + "epoch": 3.2567567567567566, + "eval_loss": 0.2563324272632599, + "eval_runtime": 1.0592, + "eval_samples_per_second": 808.124, + "eval_steps_per_second": 101.015, + "num_input_tokens_seen": 1259168, + "step": 3133 + }, + { + "epoch": 3.258835758835759, + "grad_norm": 13.672746658325195, + "learning_rate": 1.632175937830594e-05, + "loss": 0.2584, + "num_input_tokens_seen": 1259936, + "step": 3135 + }, + { + "epoch": 3.264033264033264, + "grad_norm": 14.988076210021973, + "learning_rate": 1.6236743944651703e-05, + "loss": 0.2355, + "num_input_tokens_seen": 1262112, + "step": 3140 + }, + { + "epoch": 3.269230769230769, + "grad_norm": 4.268918037414551, + "learning_rate": 1.615184389075117e-05, + "loss": 0.2481, + "num_input_tokens_seen": 1263904, + "step": 3145 + }, + { + "epoch": 3.274428274428274, + "grad_norm": 2.765204429626465, + "learning_rate": 1.6067060334424835e-05, + "loss": 0.2607, + "num_input_tokens_seen": 1265952, + "step": 3150 + }, + { + "epoch": 3.2796257796257797, + "grad_norm": 18.85066795349121, + "learning_rate": 1.5982394391959382e-05, + "loss": 0.3119, + "num_input_tokens_seen": 1267872, + "step": 3155 + }, + { + "epoch": 3.284823284823285, + "grad_norm": 2.8350369930267334, + "learning_rate": 1.58978471780929e-05, + "loss": 0.2925, + "num_input_tokens_seen": 1269792, + "step": 3160 + }, + { + "epoch": 3.29002079002079, + "grad_norm": 6.0720438957214355, + "learning_rate": 1.581341980600033e-05, + "loss": 0.2586, + "num_input_tokens_seen": 1271776, + "step": 3165 + }, + { + "epoch": 3.2952182952182953, + "grad_norm": 15.48050308227539, + "learning_rate": 1.5729113387278673e-05, + "loss": 0.2671, + "num_input_tokens_seen": 1273760, + "step": 3170 + }, + { + "epoch": 3.3004158004158004, + "grad_norm": 4.232337951660156, + "learning_rate": 1.5644929031932454e-05, + "loss": 0.2864, + "num_input_tokens_seen": 1275808, + "step": 3175 + }, + { + "epoch": 3.3056133056133055, + "grad_norm": 4.032689094543457, + "learning_rate": 1.5560867848359077e-05, + "loss": 0.2666, + "num_input_tokens_seen": 1277792, + "step": 3180 + }, + { + "epoch": 3.310810810810811, + "grad_norm": 3.819479465484619, + "learning_rate": 1.547693094333421e-05, + "loss": 0.2648, + "num_input_tokens_seen": 1279776, + "step": 3185 + }, + { + "epoch": 3.316008316008316, + "grad_norm": 5.751096725463867, + "learning_rate": 1.539311942199725e-05, + "loss": 0.2586, + "num_input_tokens_seen": 1281760, + "step": 3190 + }, + { + "epoch": 3.321205821205821, + "grad_norm": 5.748921871185303, + "learning_rate": 1.5309434387836735e-05, + "loss": 0.2391, + "num_input_tokens_seen": 1283744, + "step": 3195 + }, + { + "epoch": 3.3264033264033266, + "grad_norm": 4.8532915115356445, + "learning_rate": 1.5225876942675842e-05, + "loss": 0.2907, + "num_input_tokens_seen": 1285792, + "step": 3200 + }, + { + "epoch": 3.3316008316008316, + "grad_norm": 2.2807741165161133, + "learning_rate": 1.5142448186657878e-05, + "loss": 0.2942, + "num_input_tokens_seen": 1287776, + "step": 3205 + }, + { + "epoch": 3.3367983367983367, + "grad_norm": 0.5820121169090271, + "learning_rate": 1.505914921823178e-05, + "loss": 0.3321, + "num_input_tokens_seen": 1289696, + "step": 3210 + }, + { + "epoch": 3.3419958419958418, + "grad_norm": 2.5034902095794678, + "learning_rate": 1.4975981134137659e-05, + "loss": 0.2486, + "num_input_tokens_seen": 1291680, + "step": 3215 + }, + { + "epoch": 3.3471933471933473, + "grad_norm": 1.1145634651184082, + "learning_rate": 1.489294502939238e-05, + "loss": 0.2502, + "num_input_tokens_seen": 1293536, + "step": 3220 + }, + { + "epoch": 3.3523908523908523, + "grad_norm": 7.527857780456543, + "learning_rate": 1.4810041997275092e-05, + "loss": 0.2878, + "num_input_tokens_seen": 1295712, + "step": 3225 + }, + { + "epoch": 3.357588357588358, + "grad_norm": 12.356915473937988, + "learning_rate": 1.4727273129312918e-05, + "loss": 0.2824, + "num_input_tokens_seen": 1297760, + "step": 3230 + }, + { + "epoch": 3.362785862785863, + "grad_norm": 4.496915817260742, + "learning_rate": 1.4644639515266483e-05, + "loss": 0.2772, + "num_input_tokens_seen": 1299808, + "step": 3235 + }, + { + "epoch": 3.367983367983368, + "grad_norm": 2.9005799293518066, + "learning_rate": 1.4562142243115644e-05, + "loss": 0.2602, + "num_input_tokens_seen": 1301920, + "step": 3240 + }, + { + "epoch": 3.373180873180873, + "grad_norm": 1.413136601448059, + "learning_rate": 1.4479782399045152e-05, + "loss": 0.2737, + "num_input_tokens_seen": 1303904, + "step": 3245 + }, + { + "epoch": 3.3783783783783785, + "grad_norm": 15.236632347106934, + "learning_rate": 1.4397561067430298e-05, + "loss": 0.2683, + "num_input_tokens_seen": 1305888, + "step": 3250 + }, + { + "epoch": 3.3835758835758836, + "grad_norm": 13.490982055664062, + "learning_rate": 1.4315479330822712e-05, + "loss": 0.261, + "num_input_tokens_seen": 1308064, + "step": 3255 + }, + { + "epoch": 3.3887733887733886, + "grad_norm": 4.421963691711426, + "learning_rate": 1.4233538269936042e-05, + "loss": 0.2702, + "num_input_tokens_seen": 1310048, + "step": 3260 + }, + { + "epoch": 3.393970893970894, + "grad_norm": 10.610108375549316, + "learning_rate": 1.415173896363178e-05, + "loss": 0.2761, + "num_input_tokens_seen": 1311968, + "step": 3265 + }, + { + "epoch": 3.399168399168399, + "grad_norm": 4.008954048156738, + "learning_rate": 1.4070082488905034e-05, + "loss": 0.2631, + "num_input_tokens_seen": 1313888, + "step": 3270 + }, + { + "epoch": 3.4043659043659042, + "grad_norm": 2.906602144241333, + "learning_rate": 1.3988569920870314e-05, + "loss": 0.2702, + "num_input_tokens_seen": 1316064, + "step": 3275 + }, + { + "epoch": 3.4095634095634098, + "grad_norm": 12.885231018066406, + "learning_rate": 1.3907202332747454e-05, + "loss": 0.2643, + "num_input_tokens_seen": 1318112, + "step": 3280 + }, + { + "epoch": 3.414760914760915, + "grad_norm": 0.1723124235868454, + "learning_rate": 1.3825980795847402e-05, + "loss": 0.2877, + "num_input_tokens_seen": 1319968, + "step": 3285 + }, + { + "epoch": 3.41995841995842, + "grad_norm": 7.7092390060424805, + "learning_rate": 1.3744906379558165e-05, + "loss": 0.271, + "num_input_tokens_seen": 1322016, + "step": 3290 + }, + { + "epoch": 3.4251559251559254, + "grad_norm": 1.4101628065109253, + "learning_rate": 1.3663980151330732e-05, + "loss": 0.2729, + "num_input_tokens_seen": 1323936, + "step": 3295 + }, + { + "epoch": 3.4303534303534304, + "grad_norm": 1.401780128479004, + "learning_rate": 1.3583203176664961e-05, + "loss": 0.261, + "num_input_tokens_seen": 1325920, + "step": 3300 + }, + { + "epoch": 3.4355509355509355, + "grad_norm": 21.787748336791992, + "learning_rate": 1.350257651909562e-05, + "loss": 0.2498, + "num_input_tokens_seen": 1327840, + "step": 3305 + }, + { + "epoch": 3.4407484407484406, + "grad_norm": 8.913102149963379, + "learning_rate": 1.3422101240178365e-05, + "loss": 0.2384, + "num_input_tokens_seen": 1329760, + "step": 3310 + }, + { + "epoch": 3.445945945945946, + "grad_norm": 2.156329870223999, + "learning_rate": 1.3341778399475713e-05, + "loss": 0.2789, + "num_input_tokens_seen": 1331744, + "step": 3315 + }, + { + "epoch": 3.451143451143451, + "grad_norm": 6.306075096130371, + "learning_rate": 1.3261609054543179e-05, + "loss": 0.26, + "num_input_tokens_seen": 1333792, + "step": 3320 + }, + { + "epoch": 3.456340956340956, + "grad_norm": 8.915762901306152, + "learning_rate": 1.3181594260915262e-05, + "loss": 0.2975, + "num_input_tokens_seen": 1335776, + "step": 3325 + }, + { + "epoch": 3.4615384615384617, + "grad_norm": 2.6008245944976807, + "learning_rate": 1.3101735072091622e-05, + "loss": 0.2479, + "num_input_tokens_seen": 1337824, + "step": 3330 + }, + { + "epoch": 3.4667359667359667, + "grad_norm": 10.535400390625, + "learning_rate": 1.3022032539523176e-05, + "loss": 0.223, + "num_input_tokens_seen": 1339872, + "step": 3335 + }, + { + "epoch": 3.471933471933472, + "grad_norm": 7.183012008666992, + "learning_rate": 1.2942487712598234e-05, + "loss": 0.2543, + "num_input_tokens_seen": 1341920, + "step": 3340 + }, + { + "epoch": 3.4771309771309773, + "grad_norm": 8.969158172607422, + "learning_rate": 1.2863101638628717e-05, + "loss": 0.2449, + "num_input_tokens_seen": 1343904, + "step": 3345 + }, + { + "epoch": 3.4823284823284824, + "grad_norm": 14.45447826385498, + "learning_rate": 1.2783875362836373e-05, + "loss": 0.2881, + "num_input_tokens_seen": 1345952, + "step": 3350 + }, + { + "epoch": 3.4875259875259874, + "grad_norm": 5.68330717086792, + "learning_rate": 1.2704809928338956e-05, + "loss": 0.2574, + "num_input_tokens_seen": 1348128, + "step": 3355 + }, + { + "epoch": 3.492723492723493, + "grad_norm": 4.9651079177856445, + "learning_rate": 1.2625906376136581e-05, + "loss": 0.2915, + "num_input_tokens_seen": 1350048, + "step": 3360 + }, + { + "epoch": 3.497920997920998, + "grad_norm": 0.1253027617931366, + "learning_rate": 1.2547165745097928e-05, + "loss": 0.2653, + "num_input_tokens_seen": 1351968, + "step": 3365 + }, + { + "epoch": 3.503118503118503, + "grad_norm": 7.796263217926025, + "learning_rate": 1.2468589071946632e-05, + "loss": 0.2795, + "num_input_tokens_seen": 1353952, + "step": 3370 + }, + { + "epoch": 3.507276507276507, + "eval_loss": 0.2641850709915161, + "eval_runtime": 1.0564, + "eval_samples_per_second": 810.335, + "eval_steps_per_second": 101.292, + "num_input_tokens_seen": 1355552, + "step": 3374 + }, + { + "epoch": 3.508316008316008, + "grad_norm": 0.7158005237579346, + "learning_rate": 1.2390177391247614e-05, + "loss": 0.2673, + "num_input_tokens_seen": 1356000, + "step": 3375 + }, + { + "epoch": 3.5135135135135136, + "grad_norm": 2.2780776023864746, + "learning_rate": 1.2311931735393417e-05, + "loss": 0.2527, + "num_input_tokens_seen": 1357984, + "step": 3380 + }, + { + "epoch": 3.5187110187110187, + "grad_norm": 2.900038957595825, + "learning_rate": 1.2233853134590697e-05, + "loss": 0.2635, + "num_input_tokens_seen": 1359904, + "step": 3385 + }, + { + "epoch": 3.523908523908524, + "grad_norm": 9.76952075958252, + "learning_rate": 1.215594261684656e-05, + "loss": 0.2737, + "num_input_tokens_seen": 1361952, + "step": 3390 + }, + { + "epoch": 3.529106029106029, + "grad_norm": 0.9151262044906616, + "learning_rate": 1.2078201207955123e-05, + "loss": 0.2521, + "num_input_tokens_seen": 1364000, + "step": 3395 + }, + { + "epoch": 3.5343035343035343, + "grad_norm": 7.289126873016357, + "learning_rate": 1.2000629931483947e-05, + "loss": 0.246, + "num_input_tokens_seen": 1366112, + "step": 3400 + }, + { + "epoch": 3.5395010395010393, + "grad_norm": 7.83226203918457, + "learning_rate": 1.1923229808760564e-05, + "loss": 0.3136, + "num_input_tokens_seen": 1368096, + "step": 3405 + }, + { + "epoch": 3.544698544698545, + "grad_norm": 0.7650713324546814, + "learning_rate": 1.1846001858859054e-05, + "loss": 0.2365, + "num_input_tokens_seen": 1370208, + "step": 3410 + }, + { + "epoch": 3.54989604989605, + "grad_norm": 8.69223403930664, + "learning_rate": 1.1768947098586628e-05, + "loss": 0.2545, + "num_input_tokens_seen": 1372192, + "step": 3415 + }, + { + "epoch": 3.555093555093555, + "grad_norm": 8.523820877075195, + "learning_rate": 1.1692066542470201e-05, + "loss": 0.2743, + "num_input_tokens_seen": 1374240, + "step": 3420 + }, + { + "epoch": 3.5602910602910605, + "grad_norm": 13.287330627441406, + "learning_rate": 1.1615361202743088e-05, + "loss": 0.2821, + "num_input_tokens_seen": 1376160, + "step": 3425 + }, + { + "epoch": 3.5654885654885655, + "grad_norm": 6.943297386169434, + "learning_rate": 1.1538832089331628e-05, + "loss": 0.2579, + "num_input_tokens_seen": 1378208, + "step": 3430 + }, + { + "epoch": 3.5706860706860706, + "grad_norm": 9.258183479309082, + "learning_rate": 1.1462480209841928e-05, + "loss": 0.2526, + "num_input_tokens_seen": 1380192, + "step": 3435 + }, + { + "epoch": 3.5758835758835756, + "grad_norm": 0.5721746683120728, + "learning_rate": 1.138630656954658e-05, + "loss": 0.2369, + "num_input_tokens_seen": 1382368, + "step": 3440 + }, + { + "epoch": 3.581081081081081, + "grad_norm": 7.4510297775268555, + "learning_rate": 1.1310312171371393e-05, + "loss": 0.3155, + "num_input_tokens_seen": 1384608, + "step": 3445 + }, + { + "epoch": 3.586278586278586, + "grad_norm": 17.350297927856445, + "learning_rate": 1.1234498015882261e-05, + "loss": 0.2615, + "num_input_tokens_seen": 1386592, + "step": 3450 + }, + { + "epoch": 3.5914760914760917, + "grad_norm": 5.5357513427734375, + "learning_rate": 1.1158865101271906e-05, + "loss": 0.2614, + "num_input_tokens_seen": 1388448, + "step": 3455 + }, + { + "epoch": 3.5966735966735968, + "grad_norm": 7.910511016845703, + "learning_rate": 1.1083414423346807e-05, + "loss": 0.2222, + "num_input_tokens_seen": 1390560, + "step": 3460 + }, + { + "epoch": 3.601871101871102, + "grad_norm": 13.7831392288208, + "learning_rate": 1.1008146975514059e-05, + "loss": 0.3213, + "num_input_tokens_seen": 1392736, + "step": 3465 + }, + { + "epoch": 3.607068607068607, + "grad_norm": 0.9229243397712708, + "learning_rate": 1.0933063748768254e-05, + "loss": 0.2762, + "num_input_tokens_seen": 1394720, + "step": 3470 + }, + { + "epoch": 3.6122661122661124, + "grad_norm": 8.663399696350098, + "learning_rate": 1.0858165731678513e-05, + "loss": 0.23, + "num_input_tokens_seen": 1396640, + "step": 3475 + }, + { + "epoch": 3.6174636174636174, + "grad_norm": 13.28499984741211, + "learning_rate": 1.0783453910375424e-05, + "loss": 0.3322, + "num_input_tokens_seen": 1398752, + "step": 3480 + }, + { + "epoch": 3.6226611226611225, + "grad_norm": 8.6603364944458, + "learning_rate": 1.0708929268538034e-05, + "loss": 0.2494, + "num_input_tokens_seen": 1400800, + "step": 3485 + }, + { + "epoch": 3.627858627858628, + "grad_norm": 16.12564468383789, + "learning_rate": 1.0634592787380965e-05, + "loss": 0.2596, + "num_input_tokens_seen": 1402720, + "step": 3490 + }, + { + "epoch": 3.633056133056133, + "grad_norm": 7.862550735473633, + "learning_rate": 1.0560445445641423e-05, + "loss": 0.2563, + "num_input_tokens_seen": 1404704, + "step": 3495 + }, + { + "epoch": 3.638253638253638, + "grad_norm": 0.07106157392263412, + "learning_rate": 1.048648821956637e-05, + "loss": 0.2589, + "num_input_tokens_seen": 1406560, + "step": 3500 + }, + { + "epoch": 3.643451143451143, + "grad_norm": 0.42181286215782166, + "learning_rate": 1.0412722082899644e-05, + "loss": 0.2386, + "num_input_tokens_seen": 1408544, + "step": 3505 + }, + { + "epoch": 3.6486486486486487, + "grad_norm": 0.11339768022298813, + "learning_rate": 1.033914800686912e-05, + "loss": 0.2512, + "num_input_tokens_seen": 1410464, + "step": 3510 + }, + { + "epoch": 3.6538461538461537, + "grad_norm": 16.115554809570312, + "learning_rate": 1.0265766960173965e-05, + "loss": 0.2277, + "num_input_tokens_seen": 1412448, + "step": 3515 + }, + { + "epoch": 3.6590436590436592, + "grad_norm": 18.590940475463867, + "learning_rate": 1.019257990897185e-05, + "loss": 0.2869, + "num_input_tokens_seen": 1414688, + "step": 3520 + }, + { + "epoch": 3.6642411642411643, + "grad_norm": 5.8544158935546875, + "learning_rate": 1.0119587816866258e-05, + "loss": 0.2914, + "num_input_tokens_seen": 1416672, + "step": 3525 + }, + { + "epoch": 3.6694386694386694, + "grad_norm": 8.909049034118652, + "learning_rate": 1.0046791644893758e-05, + "loss": 0.2836, + "num_input_tokens_seen": 1418592, + "step": 3530 + }, + { + "epoch": 3.6746361746361744, + "grad_norm": 5.8211212158203125, + "learning_rate": 9.974192351511368e-06, + "loss": 0.2675, + "num_input_tokens_seen": 1420576, + "step": 3535 + }, + { + "epoch": 3.67983367983368, + "grad_norm": 7.190529823303223, + "learning_rate": 9.901790892583974e-06, + "loss": 0.2679, + "num_input_tokens_seen": 1422560, + "step": 3540 + }, + { + "epoch": 3.685031185031185, + "grad_norm": 6.408370018005371, + "learning_rate": 9.829588221371694e-06, + "loss": 0.2697, + "num_input_tokens_seen": 1424608, + "step": 3545 + }, + { + "epoch": 3.6902286902286905, + "grad_norm": 3.801816940307617, + "learning_rate": 9.757585288517328e-06, + "loss": 0.2612, + "num_input_tokens_seen": 1426784, + "step": 3550 + }, + { + "epoch": 3.6954261954261955, + "grad_norm": 2.5229806900024414, + "learning_rate": 9.6857830420339e-06, + "loss": 0.2501, + "num_input_tokens_seen": 1428896, + "step": 3555 + }, + { + "epoch": 3.7006237006237006, + "grad_norm": 7.06850004196167, + "learning_rate": 9.614182427292077e-06, + "loss": 0.2586, + "num_input_tokens_seen": 1430880, + "step": 3560 + }, + { + "epoch": 3.7058212058212057, + "grad_norm": 6.542532920837402, + "learning_rate": 9.54278438700785e-06, + "loss": 0.2484, + "num_input_tokens_seen": 1432864, + "step": 3565 + }, + { + "epoch": 3.711018711018711, + "grad_norm": 15.00790023803711, + "learning_rate": 9.471589861229998e-06, + "loss": 0.287, + "num_input_tokens_seen": 1434912, + "step": 3570 + }, + { + "epoch": 3.7162162162162162, + "grad_norm": 3.730722188949585, + "learning_rate": 9.400599787327773e-06, + "loss": 0.3025, + "num_input_tokens_seen": 1436832, + "step": 3575 + }, + { + "epoch": 3.7214137214137213, + "grad_norm": 0.24840876460075378, + "learning_rate": 9.329815099978568e-06, + "loss": 0.2433, + "num_input_tokens_seen": 1438752, + "step": 3580 + }, + { + "epoch": 3.726611226611227, + "grad_norm": 12.727954864501953, + "learning_rate": 9.259236731155582e-06, + "loss": 0.3809, + "num_input_tokens_seen": 1440672, + "step": 3585 + }, + { + "epoch": 3.731808731808732, + "grad_norm": 3.5419039726257324, + "learning_rate": 9.18886561011557e-06, + "loss": 0.2221, + "num_input_tokens_seen": 1442784, + "step": 3590 + }, + { + "epoch": 3.737006237006237, + "grad_norm": 4.471946716308594, + "learning_rate": 9.118702663386584e-06, + "loss": 0.2622, + "num_input_tokens_seen": 1444960, + "step": 3595 + }, + { + "epoch": 3.742203742203742, + "grad_norm": 7.390607833862305, + "learning_rate": 9.048748814755784e-06, + "loss": 0.3094, + "num_input_tokens_seen": 1446880, + "step": 3600 + }, + { + "epoch": 3.7474012474012475, + "grad_norm": 0.6072008013725281, + "learning_rate": 8.979004985257294e-06, + "loss": 0.2723, + "num_input_tokens_seen": 1448992, + "step": 3605 + }, + { + "epoch": 3.7525987525987525, + "grad_norm": 5.596619606018066, + "learning_rate": 8.909472093160065e-06, + "loss": 0.2755, + "num_input_tokens_seen": 1450976, + "step": 3610 + }, + { + "epoch": 3.757796257796258, + "grad_norm": 4.79258394241333, + "learning_rate": 8.840151053955773e-06, + "loss": 0.2751, + "num_input_tokens_seen": 1453088, + "step": 3615 + }, + { + "epoch": 3.757796257796258, + "eval_loss": 0.25871533155441284, + "eval_runtime": 1.0494, + "eval_samples_per_second": 815.737, + "eval_steps_per_second": 101.967, + "num_input_tokens_seen": 1453088, + "step": 3615 + }, + { + "epoch": 3.762993762993763, + "grad_norm": 9.075246810913086, + "learning_rate": 8.771042780346766e-06, + "loss": 0.2834, + "num_input_tokens_seen": 1455136, + "step": 3620 + }, + { + "epoch": 3.768191268191268, + "grad_norm": 3.0494143962860107, + "learning_rate": 8.702148182234043e-06, + "loss": 0.2472, + "num_input_tokens_seen": 1457120, + "step": 3625 + }, + { + "epoch": 3.773388773388773, + "grad_norm": 3.5605342388153076, + "learning_rate": 8.633468166705336e-06, + "loss": 0.2772, + "num_input_tokens_seen": 1459168, + "step": 3630 + }, + { + "epoch": 3.7785862785862787, + "grad_norm": 3.971622943878174, + "learning_rate": 8.565003638023065e-06, + "loss": 0.2651, + "num_input_tokens_seen": 1461152, + "step": 3635 + }, + { + "epoch": 3.7837837837837838, + "grad_norm": 2.8847694396972656, + "learning_rate": 8.496755497612492e-06, + "loss": 0.2756, + "num_input_tokens_seen": 1463136, + "step": 3640 + }, + { + "epoch": 3.788981288981289, + "grad_norm": 9.094311714172363, + "learning_rate": 8.42872464404986e-06, + "loss": 0.2693, + "num_input_tokens_seen": 1465120, + "step": 3645 + }, + { + "epoch": 3.7941787941787943, + "grad_norm": 3.9456887245178223, + "learning_rate": 8.360911973050537e-06, + "loss": 0.2816, + "num_input_tokens_seen": 1467104, + "step": 3650 + }, + { + "epoch": 3.7993762993762994, + "grad_norm": 9.080158233642578, + "learning_rate": 8.293318377457241e-06, + "loss": 0.2571, + "num_input_tokens_seen": 1469152, + "step": 3655 + }, + { + "epoch": 3.8045738045738045, + "grad_norm": 3.958771228790283, + "learning_rate": 8.225944747228257e-06, + "loss": 0.268, + "num_input_tokens_seen": 1471264, + "step": 3660 + }, + { + "epoch": 3.8097713097713095, + "grad_norm": 8.621827125549316, + "learning_rate": 8.158791969425738e-06, + "loss": 0.2128, + "num_input_tokens_seen": 1473248, + "step": 3665 + }, + { + "epoch": 3.814968814968815, + "grad_norm": 14.013006210327148, + "learning_rate": 8.091860928204049e-06, + "loss": 0.3101, + "num_input_tokens_seen": 1475360, + "step": 3670 + }, + { + "epoch": 3.82016632016632, + "grad_norm": 11.601419448852539, + "learning_rate": 8.025152504798078e-06, + "loss": 0.3044, + "num_input_tokens_seen": 1477472, + "step": 3675 + }, + { + "epoch": 3.8253638253638256, + "grad_norm": 3.5920257568359375, + "learning_rate": 7.958667577511683e-06, + "loss": 0.2471, + "num_input_tokens_seen": 1479328, + "step": 3680 + }, + { + "epoch": 3.8305613305613306, + "grad_norm": 11.748164176940918, + "learning_rate": 7.892407021706063e-06, + "loss": 0.2552, + "num_input_tokens_seen": 1481248, + "step": 3685 + }, + { + "epoch": 3.8357588357588357, + "grad_norm": 11.761496543884277, + "learning_rate": 7.826371709788313e-06, + "loss": 0.3112, + "num_input_tokens_seen": 1483168, + "step": 3690 + }, + { + "epoch": 3.8409563409563408, + "grad_norm": 2.8758435249328613, + "learning_rate": 7.760562511199882e-06, + "loss": 0.2585, + "num_input_tokens_seen": 1485152, + "step": 3695 + }, + { + "epoch": 3.8461538461538463, + "grad_norm": 3.748758554458618, + "learning_rate": 7.694980292405122e-06, + "loss": 0.2673, + "num_input_tokens_seen": 1487200, + "step": 3700 + }, + { + "epoch": 3.8513513513513513, + "grad_norm": 5.409223556518555, + "learning_rate": 7.629625916879932e-06, + "loss": 0.2763, + "num_input_tokens_seen": 1489184, + "step": 3705 + }, + { + "epoch": 3.856548856548857, + "grad_norm": 13.337824821472168, + "learning_rate": 7.564500245100325e-06, + "loss": 0.278, + "num_input_tokens_seen": 1491168, + "step": 3710 + }, + { + "epoch": 3.861746361746362, + "grad_norm": 1.357743740081787, + "learning_rate": 7.499604134531149e-06, + "loss": 0.2727, + "num_input_tokens_seen": 1493216, + "step": 3715 + }, + { + "epoch": 3.866943866943867, + "grad_norm": 0.9974175095558167, + "learning_rate": 7.434938439614781e-06, + "loss": 0.2667, + "num_input_tokens_seen": 1495200, + "step": 3720 + }, + { + "epoch": 3.872141372141372, + "grad_norm": 1.3982412815093994, + "learning_rate": 7.370504011759855e-06, + "loss": 0.2707, + "num_input_tokens_seen": 1497184, + "step": 3725 + }, + { + "epoch": 3.8773388773388775, + "grad_norm": 2.715106248855591, + "learning_rate": 7.306301699330065e-06, + "loss": 0.2656, + "num_input_tokens_seen": 1499040, + "step": 3730 + }, + { + "epoch": 3.8825363825363826, + "grad_norm": 10.939849853515625, + "learning_rate": 7.242332347633052e-06, + "loss": 0.2423, + "num_input_tokens_seen": 1501024, + "step": 3735 + }, + { + "epoch": 3.8877338877338876, + "grad_norm": 8.844660758972168, + "learning_rate": 7.178596798909159e-06, + "loss": 0.2487, + "num_input_tokens_seen": 1503072, + "step": 3740 + }, + { + "epoch": 3.892931392931393, + "grad_norm": 0.9195927381515503, + "learning_rate": 7.115095892320456e-06, + "loss": 0.2847, + "num_input_tokens_seen": 1505248, + "step": 3745 + }, + { + "epoch": 3.898128898128898, + "grad_norm": 15.075143814086914, + "learning_rate": 7.051830463939604e-06, + "loss": 0.2334, + "num_input_tokens_seen": 1507296, + "step": 3750 + }, + { + "epoch": 3.9033264033264032, + "grad_norm": 5.580709934234619, + "learning_rate": 6.98880134673891e-06, + "loss": 0.2595, + "num_input_tokens_seen": 1509344, + "step": 3755 + }, + { + "epoch": 3.9085239085239083, + "grad_norm": 5.476256370544434, + "learning_rate": 6.926009370579334e-06, + "loss": 0.2098, + "num_input_tokens_seen": 1511456, + "step": 3760 + }, + { + "epoch": 3.913721413721414, + "grad_norm": 3.832021713256836, + "learning_rate": 6.8634553621995416e-06, + "loss": 0.2277, + "num_input_tokens_seen": 1513440, + "step": 3765 + }, + { + "epoch": 3.918918918918919, + "grad_norm": 15.132575035095215, + "learning_rate": 6.80114014520507e-06, + "loss": 0.3251, + "num_input_tokens_seen": 1515488, + "step": 3770 + }, + { + "epoch": 3.9241164241164244, + "grad_norm": 5.868591785430908, + "learning_rate": 6.739064540057424e-06, + "loss": 0.2604, + "num_input_tokens_seen": 1517408, + "step": 3775 + }, + { + "epoch": 3.9293139293139294, + "grad_norm": 11.784462928771973, + "learning_rate": 6.677229364063328e-06, + "loss": 0.2458, + "num_input_tokens_seen": 1519392, + "step": 3780 + }, + { + "epoch": 3.9345114345114345, + "grad_norm": 3.2488772869110107, + "learning_rate": 6.615635431363942e-06, + "loss": 0.2596, + "num_input_tokens_seen": 1521440, + "step": 3785 + }, + { + "epoch": 3.9397089397089395, + "grad_norm": 3.991219997406006, + "learning_rate": 6.554283552924118e-06, + "loss": 0.2766, + "num_input_tokens_seen": 1523488, + "step": 3790 + }, + { + "epoch": 3.944906444906445, + "grad_norm": 2.877652168273926, + "learning_rate": 6.493174536521768e-06, + "loss": 0.2551, + "num_input_tokens_seen": 1525600, + "step": 3795 + }, + { + "epoch": 3.95010395010395, + "grad_norm": 10.219852447509766, + "learning_rate": 6.4323091867372095e-06, + "loss": 0.2612, + "num_input_tokens_seen": 1527584, + "step": 3800 + }, + { + "epoch": 3.955301455301455, + "grad_norm": 9.425738334655762, + "learning_rate": 6.371688304942544e-06, + "loss": 0.2575, + "num_input_tokens_seen": 1529504, + "step": 3805 + }, + { + "epoch": 3.9604989604989607, + "grad_norm": 13.004129409790039, + "learning_rate": 6.311312689291166e-06, + "loss": 0.2897, + "num_input_tokens_seen": 1531424, + "step": 3810 + }, + { + "epoch": 3.9656964656964657, + "grad_norm": 7.159772872924805, + "learning_rate": 6.251183134707184e-06, + "loss": 0.2366, + "num_input_tokens_seen": 1533408, + "step": 3815 + }, + { + "epoch": 3.970893970893971, + "grad_norm": 6.52066707611084, + "learning_rate": 6.191300432875017e-06, + "loss": 0.2668, + "num_input_tokens_seen": 1535392, + "step": 3820 + }, + { + "epoch": 3.976091476091476, + "grad_norm": 13.160318374633789, + "learning_rate": 6.13166537222894e-06, + "loss": 0.1661, + "num_input_tokens_seen": 1537312, + "step": 3825 + }, + { + "epoch": 3.9812889812889813, + "grad_norm": 16.36733055114746, + "learning_rate": 6.072278737942691e-06, + "loss": 0.28, + "num_input_tokens_seen": 1539360, + "step": 3830 + }, + { + "epoch": 3.9864864864864864, + "grad_norm": 4.4265875816345215, + "learning_rate": 6.0131413119191685e-06, + "loss": 0.3038, + "num_input_tokens_seen": 1541280, + "step": 3835 + }, + { + "epoch": 3.991683991683992, + "grad_norm": 4.7540717124938965, + "learning_rate": 5.954253872780102e-06, + "loss": 0.2598, + "num_input_tokens_seen": 1543136, + "step": 3840 + }, + { + "epoch": 3.996881496881497, + "grad_norm": 1.5352482795715332, + "learning_rate": 5.8956171958558266e-06, + "loss": 0.2387, + "num_input_tokens_seen": 1545120, + "step": 3845 + }, + { + "epoch": 4.002079002079002, + "grad_norm": 0.05950174108147621, + "learning_rate": 5.8372320531750655e-06, + "loss": 0.2258, + "num_input_tokens_seen": 1547056, + "step": 3850 + }, + { + "epoch": 4.007276507276507, + "grad_norm": 9.390141487121582, + "learning_rate": 5.77909921345475e-06, + "loss": 0.279, + "num_input_tokens_seen": 1548976, + "step": 3855 + }, + { + "epoch": 4.008316008316008, + "eval_loss": 0.25588732957839966, + "eval_runtime": 1.0892, + "eval_samples_per_second": 785.884, + "eval_steps_per_second": 98.235, + "num_input_tokens_seen": 1549360, + "step": 3856 + }, + { + "epoch": 4.012474012474012, + "grad_norm": 4.292252063751221, + "learning_rate": 5.721219442089926e-06, + "loss": 0.2636, + "num_input_tokens_seen": 1550960, + "step": 3860 + }, + { + "epoch": 4.017671517671518, + "grad_norm": 3.9697649478912354, + "learning_rate": 5.663593501143663e-06, + "loss": 0.2772, + "num_input_tokens_seen": 1552944, + "step": 3865 + }, + { + "epoch": 4.022869022869023, + "grad_norm": 1.579316258430481, + "learning_rate": 5.6062221493370035e-06, + "loss": 0.2654, + "num_input_tokens_seen": 1554992, + "step": 3870 + }, + { + "epoch": 4.028066528066528, + "grad_norm": 14.188766479492188, + "learning_rate": 5.549106142039018e-06, + "loss": 0.2682, + "num_input_tokens_seen": 1557104, + "step": 3875 + }, + { + "epoch": 4.033264033264033, + "grad_norm": 7.652184963226318, + "learning_rate": 5.492246231256798e-06, + "loss": 0.2818, + "num_input_tokens_seen": 1559088, + "step": 3880 + }, + { + "epoch": 4.038461538461538, + "grad_norm": 7.617486953735352, + "learning_rate": 5.435643165625614e-06, + "loss": 0.2739, + "num_input_tokens_seen": 1561008, + "step": 3885 + }, + { + "epoch": 4.043659043659043, + "grad_norm": 14.909598350524902, + "learning_rate": 5.379297690399035e-06, + "loss": 0.273, + "num_input_tokens_seen": 1563056, + "step": 3890 + }, + { + "epoch": 4.048856548856548, + "grad_norm": 13.364591598510742, + "learning_rate": 5.3232105474390895e-06, + "loss": 0.2571, + "num_input_tokens_seen": 1565040, + "step": 3895 + }, + { + "epoch": 4.054054054054054, + "grad_norm": 4.7986159324646, + "learning_rate": 5.267382475206548e-06, + "loss": 0.2529, + "num_input_tokens_seen": 1567024, + "step": 3900 + }, + { + "epoch": 4.0592515592515594, + "grad_norm": 4.830848693847656, + "learning_rate": 5.2118142087511705e-06, + "loss": 0.264, + "num_input_tokens_seen": 1569136, + "step": 3905 + }, + { + "epoch": 4.0644490644490645, + "grad_norm": 11.776159286499023, + "learning_rate": 5.156506479702019e-06, + "loss": 0.2638, + "num_input_tokens_seen": 1571120, + "step": 3910 + }, + { + "epoch": 4.06964656964657, + "grad_norm": 0.2953391969203949, + "learning_rate": 5.101460016257859e-06, + "loss": 0.2652, + "num_input_tokens_seen": 1573040, + "step": 3915 + }, + { + "epoch": 4.074844074844075, + "grad_norm": 0.2401997148990631, + "learning_rate": 5.0466755431775316e-06, + "loss": 0.2582, + "num_input_tokens_seen": 1574896, + "step": 3920 + }, + { + "epoch": 4.08004158004158, + "grad_norm": 0.6011865139007568, + "learning_rate": 4.992153781770448e-06, + "loss": 0.2618, + "num_input_tokens_seen": 1576880, + "step": 3925 + }, + { + "epoch": 4.085239085239086, + "grad_norm": 12.98713493347168, + "learning_rate": 4.937895449887075e-06, + "loss": 0.2455, + "num_input_tokens_seen": 1578864, + "step": 3930 + }, + { + "epoch": 4.090436590436591, + "grad_norm": 13.129234313964844, + "learning_rate": 4.883901261909465e-06, + "loss": 0.2813, + "num_input_tokens_seen": 1580848, + "step": 3935 + }, + { + "epoch": 4.095634095634096, + "grad_norm": 11.796737670898438, + "learning_rate": 4.8301719287419e-06, + "loss": 0.2815, + "num_input_tokens_seen": 1582704, + "step": 3940 + }, + { + "epoch": 4.100831600831601, + "grad_norm": 9.959646224975586, + "learning_rate": 4.776708157801463e-06, + "loss": 0.2796, + "num_input_tokens_seen": 1584816, + "step": 3945 + }, + { + "epoch": 4.106029106029106, + "grad_norm": 11.752809524536133, + "learning_rate": 4.7235106530088085e-06, + "loss": 0.2491, + "num_input_tokens_seen": 1586800, + "step": 3950 + }, + { + "epoch": 4.111226611226611, + "grad_norm": 5.360927104949951, + "learning_rate": 4.670580114778813e-06, + "loss": 0.2528, + "num_input_tokens_seen": 1588720, + "step": 3955 + }, + { + "epoch": 4.116424116424117, + "grad_norm": 5.705671310424805, + "learning_rate": 4.617917240011394e-06, + "loss": 0.2732, + "num_input_tokens_seen": 1590576, + "step": 3960 + }, + { + "epoch": 4.121621621621622, + "grad_norm": 1.100892186164856, + "learning_rate": 4.565522722082336e-06, + "loss": 0.2573, + "num_input_tokens_seen": 1592496, + "step": 3965 + }, + { + "epoch": 4.126819126819127, + "grad_norm": 1.0973014831542969, + "learning_rate": 4.513397250834159e-06, + "loss": 0.2638, + "num_input_tokens_seen": 1594544, + "step": 3970 + }, + { + "epoch": 4.132016632016632, + "grad_norm": 8.093790054321289, + "learning_rate": 4.461541512567011e-06, + "loss": 0.2925, + "num_input_tokens_seen": 1596400, + "step": 3975 + }, + { + "epoch": 4.137214137214137, + "grad_norm": 0.3267320990562439, + "learning_rate": 4.409956190029674e-06, + "loss": 0.2786, + "num_input_tokens_seen": 1598320, + "step": 3980 + }, + { + "epoch": 4.142411642411642, + "grad_norm": 0.30618995428085327, + "learning_rate": 4.358641962410537e-06, + "loss": 0.2286, + "num_input_tokens_seen": 1600368, + "step": 3985 + }, + { + "epoch": 4.147609147609147, + "grad_norm": 12.98468017578125, + "learning_rate": 4.307599505328672e-06, + "loss": 0.2986, + "num_input_tokens_seen": 1602352, + "step": 3990 + }, + { + "epoch": 4.152806652806653, + "grad_norm": 0.18394550681114197, + "learning_rate": 4.256829490824949e-06, + "loss": 0.2363, + "num_input_tokens_seen": 1604336, + "step": 3995 + }, + { + "epoch": 4.158004158004158, + "grad_norm": 6.980307102203369, + "learning_rate": 4.206332587353149e-06, + "loss": 0.2652, + "num_input_tokens_seen": 1606256, + "step": 4000 + }, + { + "epoch": 4.163201663201663, + "grad_norm": 0.6148359775543213, + "learning_rate": 4.1561094597712155e-06, + "loss": 0.2641, + "num_input_tokens_seen": 1608304, + "step": 4005 + }, + { + "epoch": 4.168399168399168, + "grad_norm": 9.185464859008789, + "learning_rate": 4.106160769332443e-06, + "loss": 0.2415, + "num_input_tokens_seen": 1610480, + "step": 4010 + }, + { + "epoch": 4.173596673596673, + "grad_norm": 0.5142713189125061, + "learning_rate": 4.056487173676843e-06, + "loss": 0.2449, + "num_input_tokens_seen": 1612528, + "step": 4015 + }, + { + "epoch": 4.1787941787941785, + "grad_norm": 15.734733581542969, + "learning_rate": 4.007089326822405e-06, + "loss": 0.2742, + "num_input_tokens_seen": 1614576, + "step": 4020 + }, + { + "epoch": 4.183991683991684, + "grad_norm": 1.1118292808532715, + "learning_rate": 3.957967879156533e-06, + "loss": 0.264, + "num_input_tokens_seen": 1616624, + "step": 4025 + }, + { + "epoch": 4.1891891891891895, + "grad_norm": 12.48095989227295, + "learning_rate": 3.909123477427487e-06, + "loss": 0.2548, + "num_input_tokens_seen": 1618672, + "step": 4030 + }, + { + "epoch": 4.1943866943866945, + "grad_norm": 5.244612693786621, + "learning_rate": 3.860556764735842e-06, + "loss": 0.2113, + "num_input_tokens_seen": 1620784, + "step": 4035 + }, + { + "epoch": 4.1995841995842, + "grad_norm": 21.30678367614746, + "learning_rate": 3.812268380526046e-06, + "loss": 0.3261, + "num_input_tokens_seen": 1622768, + "step": 4040 + }, + { + "epoch": 4.204781704781705, + "grad_norm": 8.002152442932129, + "learning_rate": 3.764258960577971e-06, + "loss": 0.2481, + "num_input_tokens_seen": 1624688, + "step": 4045 + }, + { + "epoch": 4.20997920997921, + "grad_norm": 2.3525662422180176, + "learning_rate": 3.7165291369985618e-06, + "loss": 0.2599, + "num_input_tokens_seen": 1626672, + "step": 4050 + }, + { + "epoch": 4.215176715176715, + "grad_norm": 4.8225202560424805, + "learning_rate": 3.6690795382135186e-06, + "loss": 0.258, + "num_input_tokens_seen": 1628848, + "step": 4055 + }, + { + "epoch": 4.220374220374221, + "grad_norm": 1.9619829654693604, + "learning_rate": 3.6219107889590155e-06, + "loss": 0.2809, + "num_input_tokens_seen": 1630832, + "step": 4060 + }, + { + "epoch": 4.225571725571726, + "grad_norm": 20.82301139831543, + "learning_rate": 3.575023510273462e-06, + "loss": 0.2292, + "num_input_tokens_seen": 1632880, + "step": 4065 + }, + { + "epoch": 4.230769230769231, + "grad_norm": 1.0340510606765747, + "learning_rate": 3.5284183194893488e-06, + "loss": 0.2871, + "num_input_tokens_seen": 1634992, + "step": 4070 + }, + { + "epoch": 4.235966735966736, + "grad_norm": 12.200738906860352, + "learning_rate": 3.48209583022511e-06, + "loss": 0.2634, + "num_input_tokens_seen": 1636912, + "step": 4075 + }, + { + "epoch": 4.241164241164241, + "grad_norm": 14.348763465881348, + "learning_rate": 3.4360566523770426e-06, + "loss": 0.2477, + "num_input_tokens_seen": 1638832, + "step": 4080 + }, + { + "epoch": 4.246361746361746, + "grad_norm": 3.283851385116577, + "learning_rate": 3.3903013921112755e-06, + "loss": 0.2351, + "num_input_tokens_seen": 1641072, + "step": 4085 + }, + { + "epoch": 4.251559251559252, + "grad_norm": 1.4203660488128662, + "learning_rate": 3.3448306518557795e-06, + "loss": 0.2808, + "num_input_tokens_seen": 1642992, + "step": 4090 + }, + { + "epoch": 4.256756756756757, + "grad_norm": 5.4867753982543945, + "learning_rate": 3.299645030292467e-06, + "loss": 0.2511, + "num_input_tokens_seen": 1645040, + "step": 4095 + }, + { + "epoch": 4.258835758835759, + "eval_loss": 0.2517484128475189, + "eval_runtime": 1.069, + "eval_samples_per_second": 800.752, + "eval_steps_per_second": 100.094, + "num_input_tokens_seen": 1645808, + "step": 4097 + }, + { + "epoch": 4.261954261954262, + "grad_norm": 15.803162574768066, + "learning_rate": 3.2547451223492786e-06, + "loss": 0.2495, + "num_input_tokens_seen": 1647024, + "step": 4100 + }, + { + "epoch": 4.267151767151767, + "grad_norm": 6.709695816040039, + "learning_rate": 3.2101315191923663e-06, + "loss": 0.2774, + "num_input_tokens_seen": 1649008, + "step": 4105 + }, + { + "epoch": 4.272349272349272, + "grad_norm": 12.675971984863281, + "learning_rate": 3.165804808218292e-06, + "loss": 0.2208, + "num_input_tokens_seen": 1651056, + "step": 4110 + }, + { + "epoch": 4.277546777546777, + "grad_norm": 20.12381935119629, + "learning_rate": 3.1217655730463093e-06, + "loss": 0.2601, + "num_input_tokens_seen": 1653104, + "step": 4115 + }, + { + "epoch": 4.282744282744282, + "grad_norm": 5.935137748718262, + "learning_rate": 3.078014393510695e-06, + "loss": 0.2427, + "num_input_tokens_seen": 1655344, + "step": 4120 + }, + { + "epoch": 4.287941787941788, + "grad_norm": 3.3360893726348877, + "learning_rate": 3.0345518456530665e-06, + "loss": 0.2959, + "num_input_tokens_seen": 1657392, + "step": 4125 + }, + { + "epoch": 4.293139293139293, + "grad_norm": 8.30186653137207, + "learning_rate": 2.991378501714856e-06, + "loss": 0.2807, + "num_input_tokens_seen": 1659312, + "step": 4130 + }, + { + "epoch": 4.298336798336798, + "grad_norm": 7.54670524597168, + "learning_rate": 2.9484949301297166e-06, + "loss": 0.2579, + "num_input_tokens_seen": 1661424, + "step": 4135 + }, + { + "epoch": 4.303534303534303, + "grad_norm": 14.763995170593262, + "learning_rate": 2.9059016955160916e-06, + "loss": 0.2498, + "num_input_tokens_seen": 1663408, + "step": 4140 + }, + { + "epoch": 4.3087318087318085, + "grad_norm": 1.220461368560791, + "learning_rate": 2.8635993586697553e-06, + "loss": 0.226, + "num_input_tokens_seen": 1665328, + "step": 4145 + }, + { + "epoch": 4.313929313929314, + "grad_norm": 23.395973205566406, + "learning_rate": 2.8215884765564193e-06, + "loss": 0.2687, + "num_input_tokens_seen": 1667312, + "step": 4150 + }, + { + "epoch": 4.3191268191268195, + "grad_norm": 4.078779697418213, + "learning_rate": 2.7798696023044163e-06, + "loss": 0.1693, + "num_input_tokens_seen": 1669296, + "step": 4155 + }, + { + "epoch": 4.324324324324325, + "grad_norm": 5.839596748352051, + "learning_rate": 2.73844328519742e-06, + "loss": 0.2217, + "num_input_tokens_seen": 1671280, + "step": 4160 + }, + { + "epoch": 4.32952182952183, + "grad_norm": 21.18253517150879, + "learning_rate": 2.6973100706672e-06, + "loss": 0.2814, + "num_input_tokens_seen": 1673456, + "step": 4165 + }, + { + "epoch": 4.334719334719335, + "grad_norm": 6.5861101150512695, + "learning_rate": 2.656470500286451e-06, + "loss": 0.2523, + "num_input_tokens_seen": 1675504, + "step": 4170 + }, + { + "epoch": 4.33991683991684, + "grad_norm": 6.993749618530273, + "learning_rate": 2.615925111761647e-06, + "loss": 0.228, + "num_input_tokens_seen": 1677488, + "step": 4175 + }, + { + "epoch": 4.345114345114345, + "grad_norm": 11.91810417175293, + "learning_rate": 2.5756744389259734e-06, + "loss": 0.2399, + "num_input_tokens_seen": 1679536, + "step": 4180 + }, + { + "epoch": 4.350311850311851, + "grad_norm": 4.944723606109619, + "learning_rate": 2.535719011732321e-06, + "loss": 0.2345, + "num_input_tokens_seen": 1681520, + "step": 4185 + }, + { + "epoch": 4.355509355509356, + "grad_norm": 18.20621681213379, + "learning_rate": 2.49605935624625e-06, + "loss": 0.2726, + "num_input_tokens_seen": 1683568, + "step": 4190 + }, + { + "epoch": 4.360706860706861, + "grad_norm": 8.823187828063965, + "learning_rate": 2.4566959946391243e-06, + "loss": 0.236, + "num_input_tokens_seen": 1685488, + "step": 4195 + }, + { + "epoch": 4.365904365904366, + "grad_norm": 8.236385345458984, + "learning_rate": 2.417629445181194e-06, + "loss": 0.2476, + "num_input_tokens_seen": 1687408, + "step": 4200 + }, + { + "epoch": 4.371101871101871, + "grad_norm": 3.388185739517212, + "learning_rate": 2.378860222234794e-06, + "loss": 0.2325, + "num_input_tokens_seen": 1689520, + "step": 4205 + }, + { + "epoch": 4.376299376299376, + "grad_norm": 2.7209372520446777, + "learning_rate": 2.3403888362475782e-06, + "loss": 0.2749, + "num_input_tokens_seen": 1691568, + "step": 4210 + }, + { + "epoch": 4.381496881496881, + "grad_norm": 7.729001045227051, + "learning_rate": 2.3022157937457627e-06, + "loss": 0.2235, + "num_input_tokens_seen": 1693616, + "step": 4215 + }, + { + "epoch": 4.386694386694387, + "grad_norm": 9.053695678710938, + "learning_rate": 2.2643415973275016e-06, + "loss": 0.2369, + "num_input_tokens_seen": 1695600, + "step": 4220 + }, + { + "epoch": 4.391891891891892, + "grad_norm": 4.420502662658691, + "learning_rate": 2.2267667456562307e-06, + "loss": 0.285, + "num_input_tokens_seen": 1697584, + "step": 4225 + }, + { + "epoch": 4.397089397089397, + "grad_norm": 3.5097815990448, + "learning_rate": 2.1894917334541354e-06, + "loss": 0.2273, + "num_input_tokens_seen": 1699568, + "step": 4230 + }, + { + "epoch": 4.402286902286902, + "grad_norm": 23.638469696044922, + "learning_rate": 2.15251705149562e-06, + "loss": 0.2953, + "num_input_tokens_seen": 1701744, + "step": 4235 + }, + { + "epoch": 4.407484407484407, + "grad_norm": 4.72571325302124, + "learning_rate": 2.11584318660083e-06, + "loss": 0.2404, + "num_input_tokens_seen": 1703600, + "step": 4240 + }, + { + "epoch": 4.412681912681912, + "grad_norm": 6.068181991577148, + "learning_rate": 2.0794706216292813e-06, + "loss": 0.3067, + "num_input_tokens_seen": 1705712, + "step": 4245 + }, + { + "epoch": 4.417879417879418, + "grad_norm": 10.372715950012207, + "learning_rate": 2.043399835473475e-06, + "loss": 0.2088, + "num_input_tokens_seen": 1707696, + "step": 4250 + }, + { + "epoch": 4.423076923076923, + "grad_norm": 4.278080463409424, + "learning_rate": 2.0076313030525844e-06, + "loss": 0.2195, + "num_input_tokens_seen": 1709744, + "step": 4255 + }, + { + "epoch": 4.428274428274428, + "grad_norm": 9.075408935546875, + "learning_rate": 1.972165495306241e-06, + "loss": 0.2399, + "num_input_tokens_seen": 1711792, + "step": 4260 + }, + { + "epoch": 4.4334719334719335, + "grad_norm": 4.037149429321289, + "learning_rate": 1.937002879188285e-06, + "loss": 0.2491, + "num_input_tokens_seen": 1713904, + "step": 4265 + }, + { + "epoch": 4.4386694386694385, + "grad_norm": 7.768908977508545, + "learning_rate": 1.9021439176606564e-06, + "loss": 0.2257, + "num_input_tokens_seen": 1715824, + "step": 4270 + }, + { + "epoch": 4.443866943866944, + "grad_norm": 4.410028457641602, + "learning_rate": 1.8675890696872838e-06, + "loss": 0.2438, + "num_input_tokens_seen": 1717808, + "step": 4275 + }, + { + "epoch": 4.4490644490644495, + "grad_norm": 4.74402379989624, + "learning_rate": 1.8333387902280314e-06, + "loss": 0.2773, + "num_input_tokens_seen": 1719856, + "step": 4280 + }, + { + "epoch": 4.454261954261955, + "grad_norm": 6.120370864868164, + "learning_rate": 1.7993935302327292e-06, + "loss": 0.2193, + "num_input_tokens_seen": 1721776, + "step": 4285 + }, + { + "epoch": 4.45945945945946, + "grad_norm": 10.760017395019531, + "learning_rate": 1.7657537366352338e-06, + "loss": 0.238, + "num_input_tokens_seen": 1723632, + "step": 4290 + }, + { + "epoch": 4.464656964656965, + "grad_norm": 6.990230083465576, + "learning_rate": 1.732419852347511e-06, + "loss": 0.1772, + "num_input_tokens_seen": 1725488, + "step": 4295 + }, + { + "epoch": 4.46985446985447, + "grad_norm": 15.208341598510742, + "learning_rate": 1.699392316253856e-06, + "loss": 0.2837, + "num_input_tokens_seen": 1727600, + "step": 4300 + }, + { + "epoch": 4.475051975051975, + "grad_norm": 16.286996841430664, + "learning_rate": 1.666671563205069e-06, + "loss": 0.2494, + "num_input_tokens_seen": 1729712, + "step": 4305 + }, + { + "epoch": 4.48024948024948, + "grad_norm": 2.84039306640625, + "learning_rate": 1.6342580240127582e-06, + "loss": 0.269, + "num_input_tokens_seen": 1731696, + "step": 4310 + }, + { + "epoch": 4.485446985446986, + "grad_norm": 15.725839614868164, + "learning_rate": 1.6021521254436678e-06, + "loss": 0.2551, + "num_input_tokens_seen": 1733744, + "step": 4315 + }, + { + "epoch": 4.490644490644491, + "grad_norm": 4.358521461486816, + "learning_rate": 1.5703542902140294e-06, + "loss": 0.2408, + "num_input_tokens_seen": 1735728, + "step": 4320 + }, + { + "epoch": 4.495841995841996, + "grad_norm": 14.235426902770996, + "learning_rate": 1.5388649369840357e-06, + "loss": 0.1891, + "num_input_tokens_seen": 1737776, + "step": 4325 + }, + { + "epoch": 4.501039501039501, + "grad_norm": 7.304314136505127, + "learning_rate": 1.5076844803522922e-06, + "loss": 0.2684, + "num_input_tokens_seen": 1739824, + "step": 4330 + }, + { + "epoch": 4.506237006237006, + "grad_norm": 18.58903694152832, + "learning_rate": 1.476813330850388e-06, + "loss": 0.2709, + "num_input_tokens_seen": 1741744, + "step": 4335 + }, + { + "epoch": 4.509355509355509, + "eval_loss": 0.2577267587184906, + "eval_runtime": 1.0636, + "eval_samples_per_second": 804.851, + "eval_steps_per_second": 100.606, + "num_input_tokens_seen": 1742960, + "step": 4338 + }, + { + "epoch": 4.511434511434511, + "grad_norm": 18.499958038330078, + "learning_rate": 1.4462518949374838e-06, + "loss": 0.2731, + "num_input_tokens_seen": 1743728, + "step": 4340 + }, + { + "epoch": 4.516632016632016, + "grad_norm": 4.451554298400879, + "learning_rate": 1.4160005749949328e-06, + "loss": 0.2431, + "num_input_tokens_seen": 1745904, + "step": 4345 + }, + { + "epoch": 4.521829521829522, + "grad_norm": 5.922986030578613, + "learning_rate": 1.386059769321027e-06, + "loss": 0.2649, + "num_input_tokens_seen": 1747824, + "step": 4350 + }, + { + "epoch": 4.527027027027027, + "grad_norm": 11.740480422973633, + "learning_rate": 1.3564298721257223e-06, + "loss": 0.2569, + "num_input_tokens_seen": 1749872, + "step": 4355 + }, + { + "epoch": 4.532224532224532, + "grad_norm": 10.447465896606445, + "learning_rate": 1.3271112735254498e-06, + "loss": 0.1998, + "num_input_tokens_seen": 1751792, + "step": 4360 + }, + { + "epoch": 4.537422037422037, + "grad_norm": 5.754942893981934, + "learning_rate": 1.298104359538005e-06, + "loss": 0.251, + "num_input_tokens_seen": 1753776, + "step": 4365 + }, + { + "epoch": 4.542619542619542, + "grad_norm": 8.049335479736328, + "learning_rate": 1.269409512077427e-06, + "loss": 0.2705, + "num_input_tokens_seen": 1755824, + "step": 4370 + }, + { + "epoch": 4.547817047817047, + "grad_norm": 4.818149089813232, + "learning_rate": 1.241027108949e-06, + "loss": 0.202, + "num_input_tokens_seen": 1758000, + "step": 4375 + }, + { + "epoch": 4.553014553014553, + "grad_norm": 10.757091522216797, + "learning_rate": 1.2129575238442715e-06, + "loss": 0.2565, + "num_input_tokens_seen": 1759984, + "step": 4380 + }, + { + "epoch": 4.558212058212058, + "grad_norm": 23.19622230529785, + "learning_rate": 1.185201126336122e-06, + "loss": 0.2607, + "num_input_tokens_seen": 1761968, + "step": 4385 + }, + { + "epoch": 4.5634095634095635, + "grad_norm": 6.780999660491943, + "learning_rate": 1.1577582818739135e-06, + "loss": 0.2392, + "num_input_tokens_seen": 1764016, + "step": 4390 + }, + { + "epoch": 4.5686070686070686, + "grad_norm": 6.052558422088623, + "learning_rate": 1.1306293517786614e-06, + "loss": 0.2808, + "num_input_tokens_seen": 1765936, + "step": 4395 + }, + { + "epoch": 4.573804573804574, + "grad_norm": 11.568082809448242, + "learning_rate": 1.1038146932383004e-06, + "loss": 0.1891, + "num_input_tokens_seen": 1767984, + "step": 4400 + }, + { + "epoch": 4.579002079002079, + "grad_norm": 17.461746215820312, + "learning_rate": 1.0773146593029637e-06, + "loss": 0.2029, + "num_input_tokens_seen": 1769904, + "step": 4405 + }, + { + "epoch": 4.584199584199585, + "grad_norm": 9.160344123840332, + "learning_rate": 1.0511295988803294e-06, + "loss": 0.2743, + "num_input_tokens_seen": 1771888, + "step": 4410 + }, + { + "epoch": 4.58939708939709, + "grad_norm": 8.415828704833984, + "learning_rate": 1.0252598567310451e-06, + "loss": 0.2115, + "num_input_tokens_seen": 1773936, + "step": 4415 + }, + { + "epoch": 4.594594594594595, + "grad_norm": 17.489177703857422, + "learning_rate": 9.99705773464185e-07, + "loss": 0.2778, + "num_input_tokens_seen": 1775984, + "step": 4420 + }, + { + "epoch": 4.5997920997921, + "grad_norm": 11.403511047363281, + "learning_rate": 9.744676855327483e-07, + "loss": 0.2428, + "num_input_tokens_seen": 1777840, + "step": 4425 + }, + { + "epoch": 4.604989604989605, + "grad_norm": 23.2257022857666, + "learning_rate": 9.495459252292504e-07, + "loss": 0.2124, + "num_input_tokens_seen": 1779824, + "step": 4430 + }, + { + "epoch": 4.61018711018711, + "grad_norm": 4.646495342254639, + "learning_rate": 9.249408206813332e-07, + "loss": 0.1939, + "num_input_tokens_seen": 1781872, + "step": 4435 + }, + { + "epoch": 4.615384615384615, + "grad_norm": 3.444089412689209, + "learning_rate": 9.006526958474509e-07, + "loss": 0.2364, + "num_input_tokens_seen": 1783984, + "step": 4440 + }, + { + "epoch": 4.620582120582121, + "grad_norm": 18.236093521118164, + "learning_rate": 8.766818705126134e-07, + "loss": 0.2023, + "num_input_tokens_seen": 1786032, + "step": 4445 + }, + { + "epoch": 4.625779625779626, + "grad_norm": 7.719527244567871, + "learning_rate": 8.530286602841525e-07, + "loss": 0.2455, + "num_input_tokens_seen": 1788016, + "step": 4450 + }, + { + "epoch": 4.630977130977131, + "grad_norm": 6.857132911682129, + "learning_rate": 8.296933765875897e-07, + "loss": 0.2154, + "num_input_tokens_seen": 1790064, + "step": 4455 + }, + { + "epoch": 4.636174636174636, + "grad_norm": 10.924470901489258, + "learning_rate": 8.066763266625282e-07, + "loss": 0.2046, + "num_input_tokens_seen": 1791984, + "step": 4460 + }, + { + "epoch": 4.641372141372141, + "grad_norm": 3.512413740158081, + "learning_rate": 7.839778135586007e-07, + "loss": 0.1884, + "num_input_tokens_seen": 1793904, + "step": 4465 + }, + { + "epoch": 4.646569646569646, + "grad_norm": 20.026166915893555, + "learning_rate": 7.615981361314889e-07, + "loss": 0.223, + "num_input_tokens_seen": 1795888, + "step": 4470 + }, + { + "epoch": 4.651767151767151, + "grad_norm": 13.404367446899414, + "learning_rate": 7.3953758903898e-07, + "loss": 0.3424, + "num_input_tokens_seen": 1797872, + "step": 4475 + }, + { + "epoch": 4.656964656964657, + "grad_norm": 8.044845581054688, + "learning_rate": 7.177964627370997e-07, + "loss": 0.2152, + "num_input_tokens_seen": 1799920, + "step": 4480 + }, + { + "epoch": 4.662162162162162, + "grad_norm": 6.080995082855225, + "learning_rate": 6.963750434762745e-07, + "loss": 0.2628, + "num_input_tokens_seen": 1801776, + "step": 4485 + }, + { + "epoch": 4.667359667359667, + "grad_norm": 7.769125461578369, + "learning_rate": 6.752736132975696e-07, + "loss": 0.2974, + "num_input_tokens_seen": 1803824, + "step": 4490 + }, + { + "epoch": 4.672557172557172, + "grad_norm": 9.061914443969727, + "learning_rate": 6.54492450028979e-07, + "loss": 0.1697, + "num_input_tokens_seen": 1805744, + "step": 4495 + }, + { + "epoch": 4.6777546777546775, + "grad_norm": 8.759089469909668, + "learning_rate": 6.340318272817474e-07, + "loss": 0.2489, + "num_input_tokens_seen": 1807728, + "step": 4500 + }, + { + "epoch": 4.682952182952183, + "grad_norm": 14.477424621582031, + "learning_rate": 6.138920144468124e-07, + "loss": 0.255, + "num_input_tokens_seen": 1809712, + "step": 4505 + }, + { + "epoch": 4.6881496881496885, + "grad_norm": 16.341243743896484, + "learning_rate": 5.94073276691201e-07, + "loss": 0.2946, + "num_input_tokens_seen": 1811632, + "step": 4510 + }, + { + "epoch": 4.6933471933471935, + "grad_norm": 4.825214385986328, + "learning_rate": 5.745758749545749e-07, + "loss": 0.2011, + "num_input_tokens_seen": 1813552, + "step": 4515 + }, + { + "epoch": 4.698544698544699, + "grad_norm": 6.129444122314453, + "learning_rate": 5.554000659457881e-07, + "loss": 0.2354, + "num_input_tokens_seen": 1815664, + "step": 4520 + }, + { + "epoch": 4.703742203742204, + "grad_norm": 4.319976806640625, + "learning_rate": 5.365461021395096e-07, + "loss": 0.2284, + "num_input_tokens_seen": 1817648, + "step": 4525 + }, + { + "epoch": 4.708939708939709, + "grad_norm": 4.276791572570801, + "learning_rate": 5.180142317728815e-07, + "loss": 0.2259, + "num_input_tokens_seen": 1819696, + "step": 4530 + }, + { + "epoch": 4.714137214137214, + "grad_norm": 10.404797554016113, + "learning_rate": 4.998046988422766e-07, + "loss": 0.269, + "num_input_tokens_seen": 1821680, + "step": 4535 + }, + { + "epoch": 4.71933471933472, + "grad_norm": 11.949972152709961, + "learning_rate": 4.819177431000604e-07, + "loss": 0.2786, + "num_input_tokens_seen": 1823728, + "step": 4540 + }, + { + "epoch": 4.724532224532225, + "grad_norm": 9.46826171875, + "learning_rate": 4.6435360005145644e-07, + "loss": 0.3228, + "num_input_tokens_seen": 1825712, + "step": 4545 + }, + { + "epoch": 4.72972972972973, + "grad_norm": 13.263773918151855, + "learning_rate": 4.4711250095143267e-07, + "loss": 0.2664, + "num_input_tokens_seen": 1827760, + "step": 4550 + }, + { + "epoch": 4.734927234927235, + "grad_norm": 5.771205902099609, + "learning_rate": 4.30194672801662e-07, + "loss": 0.2014, + "num_input_tokens_seen": 1829680, + "step": 4555 + }, + { + "epoch": 4.74012474012474, + "grad_norm": 23.836517333984375, + "learning_rate": 4.136003383475251e-07, + "loss": 0.2992, + "num_input_tokens_seen": 1831728, + "step": 4560 + }, + { + "epoch": 4.745322245322245, + "grad_norm": 12.346782684326172, + "learning_rate": 3.9732971607519265e-07, + "loss": 0.2033, + "num_input_tokens_seen": 1833648, + "step": 4565 + }, + { + "epoch": 4.75051975051975, + "grad_norm": 5.421136856079102, + "learning_rate": 3.8138302020873373e-07, + "loss": 0.2388, + "num_input_tokens_seen": 1835696, + "step": 4570 + }, + { + "epoch": 4.755717255717256, + "grad_norm": 12.613269805908203, + "learning_rate": 3.6576046070730675e-07, + "loss": 0.2582, + "num_input_tokens_seen": 1837808, + "step": 4575 + }, + { + "epoch": 4.75987525987526, + "eval_loss": 0.2604904770851135, + "eval_runtime": 1.0828, + "eval_samples_per_second": 790.52, + "eval_steps_per_second": 98.815, + "num_input_tokens_seen": 1839344, + "step": 4579 + }, + { + "epoch": 4.760914760914761, + "grad_norm": 10.182611465454102, + "learning_rate": 3.5046224326238107e-07, + "loss": 0.2365, + "num_input_tokens_seen": 1839728, + "step": 4580 + }, + { + "epoch": 4.766112266112266, + "grad_norm": 5.537731647491455, + "learning_rate": 3.3548856929505047e-07, + "loss": 0.2569, + "num_input_tokens_seen": 1841776, + "step": 4585 + }, + { + "epoch": 4.771309771309771, + "grad_norm": 4.337884902954102, + "learning_rate": 3.208396359533572e-07, + "loss": 0.2548, + "num_input_tokens_seen": 1843696, + "step": 4590 + }, + { + "epoch": 4.776507276507276, + "grad_norm": 15.579423904418945, + "learning_rate": 3.065156361097138e-07, + "loss": 0.2391, + "num_input_tokens_seen": 1845744, + "step": 4595 + }, + { + "epoch": 4.781704781704782, + "grad_norm": 3.1390204429626465, + "learning_rate": 2.925167583583577e-07, + "loss": 0.2364, + "num_input_tokens_seen": 1847792, + "step": 4600 + }, + { + "epoch": 4.786902286902287, + "grad_norm": 12.236397743225098, + "learning_rate": 2.7884318701285885e-07, + "loss": 0.2843, + "num_input_tokens_seen": 1849776, + "step": 4605 + }, + { + "epoch": 4.792099792099792, + "grad_norm": 6.024417877197266, + "learning_rate": 2.6549510210371607e-07, + "loss": 0.2187, + "num_input_tokens_seen": 1852016, + "step": 4610 + }, + { + "epoch": 4.797297297297297, + "grad_norm": 13.414298057556152, + "learning_rate": 2.524726793759591e-07, + "loss": 0.246, + "num_input_tokens_seen": 1854064, + "step": 4615 + }, + { + "epoch": 4.802494802494802, + "grad_norm": 2.9425196647644043, + "learning_rate": 2.397760902868612e-07, + "loss": 0.2382, + "num_input_tokens_seen": 1856112, + "step": 4620 + }, + { + "epoch": 4.8076923076923075, + "grad_norm": 18.276071548461914, + "learning_rate": 2.274055020036553e-07, + "loss": 0.2361, + "num_input_tokens_seen": 1858096, + "step": 4625 + }, + { + "epoch": 4.8128898128898125, + "grad_norm": 3.6439883708953857, + "learning_rate": 2.1536107740135482e-07, + "loss": 0.2671, + "num_input_tokens_seen": 1860272, + "step": 4630 + }, + { + "epoch": 4.8180873180873185, + "grad_norm": 10.452295303344727, + "learning_rate": 2.0364297506060003e-07, + "loss": 0.2501, + "num_input_tokens_seen": 1862256, + "step": 4635 + }, + { + "epoch": 4.8232848232848236, + "grad_norm": 7.328881740570068, + "learning_rate": 1.922513492655653e-07, + "loss": 0.1984, + "num_input_tokens_seen": 1864304, + "step": 4640 + }, + { + "epoch": 4.828482328482329, + "grad_norm": 4.626097202301025, + "learning_rate": 1.8118635000194396e-07, + "loss": 0.2677, + "num_input_tokens_seen": 1866224, + "step": 4645 + }, + { + "epoch": 4.833679833679834, + "grad_norm": 6.644436836242676, + "learning_rate": 1.704481229549526e-07, + "loss": 0.2349, + "num_input_tokens_seen": 1868336, + "step": 4650 + }, + { + "epoch": 4.838877338877339, + "grad_norm": 6.079159259796143, + "learning_rate": 1.6003680950742728e-07, + "loss": 0.2927, + "num_input_tokens_seen": 1870448, + "step": 4655 + }, + { + "epoch": 4.844074844074844, + "grad_norm": 11.934816360473633, + "learning_rate": 1.4995254673795812e-07, + "loss": 0.2206, + "num_input_tokens_seen": 1872368, + "step": 4660 + }, + { + "epoch": 4.849272349272349, + "grad_norm": 2.1284427642822266, + "learning_rate": 1.4019546741908251e-07, + "loss": 0.2374, + "num_input_tokens_seen": 1874480, + "step": 4665 + }, + { + "epoch": 4.854469854469855, + "grad_norm": 7.95443868637085, + "learning_rate": 1.3076570001553934e-07, + "loss": 0.2712, + "num_input_tokens_seen": 1876464, + "step": 4670 + }, + { + "epoch": 4.85966735966736, + "grad_norm": 10.991232872009277, + "learning_rate": 1.216633686825841e-07, + "loss": 0.2406, + "num_input_tokens_seen": 1878448, + "step": 4675 + }, + { + "epoch": 4.864864864864865, + "grad_norm": 16.078187942504883, + "learning_rate": 1.1288859326433477e-07, + "loss": 0.2743, + "num_input_tokens_seen": 1880432, + "step": 4680 + }, + { + "epoch": 4.87006237006237, + "grad_norm": 19.031558990478516, + "learning_rate": 1.0444148929221464e-07, + "loss": 0.2828, + "num_input_tokens_seen": 1882544, + "step": 4685 + }, + { + "epoch": 4.875259875259875, + "grad_norm": 16.82112693786621, + "learning_rate": 9.63221679834203e-08, + "loss": 0.274, + "num_input_tokens_seen": 1884528, + "step": 4690 + }, + { + "epoch": 4.88045738045738, + "grad_norm": 6.512580394744873, + "learning_rate": 8.853073623946162e-08, + "loss": 0.2457, + "num_input_tokens_seen": 1886640, + "step": 4695 + }, + { + "epoch": 4.885654885654886, + "grad_norm": 9.699633598327637, + "learning_rate": 8.106729664475176e-08, + "loss": 0.2663, + "num_input_tokens_seen": 1888688, + "step": 4700 + }, + { + "epoch": 4.890852390852391, + "grad_norm": 14.048091888427734, + "learning_rate": 7.393194746525279e-08, + "loss": 0.2572, + "num_input_tokens_seen": 1890736, + "step": 4705 + }, + { + "epoch": 4.896049896049896, + "grad_norm": 7.062888145446777, + "learning_rate": 6.712478264719601e-08, + "loss": 0.2399, + "num_input_tokens_seen": 1892720, + "step": 4710 + }, + { + "epoch": 4.901247401247401, + "grad_norm": 11.242563247680664, + "learning_rate": 6.064589181582481e-08, + "loss": 0.2267, + "num_input_tokens_seen": 1894704, + "step": 4715 + }, + { + "epoch": 4.906444906444906, + "grad_norm": 1.6842583417892456, + "learning_rate": 5.4495360274231524e-08, + "loss": 0.2652, + "num_input_tokens_seen": 1896624, + "step": 4720 + }, + { + "epoch": 4.911642411642411, + "grad_norm": 4.220650672912598, + "learning_rate": 4.867326900223068e-08, + "loss": 0.2254, + "num_input_tokens_seen": 1898544, + "step": 4725 + }, + { + "epoch": 4.916839916839917, + "grad_norm": 3.8804283142089844, + "learning_rate": 4.317969465527927e-08, + "loss": 0.2342, + "num_input_tokens_seen": 1900592, + "step": 4730 + }, + { + "epoch": 4.922037422037422, + "grad_norm": 6.306464195251465, + "learning_rate": 3.8014709563488625e-08, + "loss": 0.2151, + "num_input_tokens_seen": 1902576, + "step": 4735 + }, + { + "epoch": 4.927234927234927, + "grad_norm": 5.872474193572998, + "learning_rate": 3.317838173066135e-08, + "loss": 0.2368, + "num_input_tokens_seen": 1904624, + "step": 4740 + }, + { + "epoch": 4.9324324324324325, + "grad_norm": 23.829078674316406, + "learning_rate": 2.8670774833386426e-08, + "loss": 0.2662, + "num_input_tokens_seen": 1906736, + "step": 4745 + }, + { + "epoch": 4.9376299376299375, + "grad_norm": 2.1569466590881348, + "learning_rate": 2.449194822022327e-08, + "loss": 0.221, + "num_input_tokens_seen": 1908592, + "step": 4750 + }, + { + "epoch": 4.942827442827443, + "grad_norm": 5.917527675628662, + "learning_rate": 2.064195691089954e-08, + "loss": 0.2286, + "num_input_tokens_seen": 1910576, + "step": 4755 + }, + { + "epoch": 4.948024948024948, + "grad_norm": 8.833841323852539, + "learning_rate": 1.712085159559784e-08, + "loss": 0.2104, + "num_input_tokens_seen": 1912624, + "step": 4760 + }, + { + "epoch": 4.953222453222454, + "grad_norm": 17.08448600769043, + "learning_rate": 1.3928678634289593e-08, + "loss": 0.2802, + "num_input_tokens_seen": 1914608, + "step": 4765 + }, + { + "epoch": 4.958419958419959, + "grad_norm": 2.2440571784973145, + "learning_rate": 1.1065480056110522e-08, + "loss": 0.2125, + "num_input_tokens_seen": 1916592, + "step": 4770 + }, + { + "epoch": 4.963617463617464, + "grad_norm": 6.129010200500488, + "learning_rate": 8.531293558824982e-09, + "loss": 0.2162, + "num_input_tokens_seen": 1918704, + "step": 4775 + }, + { + "epoch": 4.968814968814969, + "grad_norm": 2.9528563022613525, + "learning_rate": 6.326152508320804e-09, + "loss": 0.2508, + "num_input_tokens_seen": 1920624, + "step": 4780 + }, + { + "epoch": 4.974012474012474, + "grad_norm": 7.140697479248047, + "learning_rate": 4.450085938170756e-09, + "loss": 0.2453, + "num_input_tokens_seen": 1922480, + "step": 4785 + }, + { + "epoch": 4.979209979209979, + "grad_norm": 13.262871742248535, + "learning_rate": 2.9031185492522926e-09, + "loss": 0.2758, + "num_input_tokens_seen": 1924464, + "step": 4790 + }, + { + "epoch": 4.984407484407484, + "grad_norm": 8.832655906677246, + "learning_rate": 1.6852707094172636e-09, + "loss": 0.2275, + "num_input_tokens_seen": 1926448, + "step": 4795 + }, + { + "epoch": 4.98960498960499, + "grad_norm": 11.241654396057129, + "learning_rate": 7.965584532282355e-10, + "loss": 0.2635, + "num_input_tokens_seen": 1928560, + "step": 4800 + }, + { + "epoch": 4.994802494802495, + "grad_norm": 5.555950164794922, + "learning_rate": 2.3699348174754945e-10, + "loss": 0.2384, + "num_input_tokens_seen": 1930544, + "step": 4805 + }, + { + "epoch": 5.0, + "grad_norm": 12.928886413574219, + "learning_rate": 6.583162381890162e-12, + "loss": 0.2943, + "num_input_tokens_seen": 1932608, + "step": 4810 + }, + { + "epoch": 5.0, + "num_input_tokens_seen": 1932608, + "step": 4810, + "total_flos": 1.1284259767320576e+16, + "train_loss": 0.28020706261022177, + "train_runtime": 1219.1473, + "train_samples_per_second": 31.559, + "train_steps_per_second": 3.945 + } + ], + "logging_steps": 5, + "max_steps": 4810, + "num_input_tokens_seen": 1932608, + "num_train_epochs": 5, + "save_steps": 241, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.1284259767320576e+16, + "train_batch_size": 8, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..9374b67 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6775128737cb76a145e8e18bc6f48142ecc6436b02b0011794059b1800e3d087 +size 6289 diff --git a/training_eval_loss.png b/training_eval_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..4fb548816027d35816d2e9afa8ee03b7b6c59404 GIT binary patch literal 40596 zcmeFZ^;=e56fOEvf+Arch=iyhA|>5epokzK4bmmu4Wfu52&i-;2-4k+h)Op|H%K=~ zpSkcm_uTv3^W5kB0rv-=&re?VyZ2gi%{k^6WA1k{(hrDEQJ%tJFhmj$@5^B@*d7=R z)+oUV_!sW>!Aba!fUTIa?NbW_TL*1xeT0Rj*on;*r>uCJiNf!lTE3bBkH-)*X7Z=CaF_}*#p!IJp!)ySbpv-*I<5DY%SeGJ4L@(6k(Ek7%ap z_mDN(Y;2Fb=yiB%d_PfcbuKMS^+o0%2NvUzw5&>>M~PQhSQc{|i~l-YUuawtG&#Mn zx-+Q!kVK2cWj>=wIalvwfbbSYV<_89<=#@-G6T0GJ_*faw~}TsTL**baJiGCqoa(R zoZN_1O5wrYc7j~W?;PC+ZoG*-)O?m6WlN>LJsD~f3k&bFve+$a=r(0uNpNJlOAFgmYdHQs@-lYqy>c29dmHp|*2B(JRO?dj=OxpemI z*)VRC3u9wr_r=8e68-y)?)CNBI6DjE88l;OOO77E?XG_#Wb1M+@#{-fNc&xCXX3T( zc66}a6eAo7Pr>QF@AybkQl-%Jq9;DdbmtRM{co>Na;KVXE%Z%JPj{p#WicHw24b>9 z62E*Qy?9Y&q?xqfOL8(nhN6pDO^9MzM%{(*S=&-owmgATr%qYg+h?wFR~;P+5|Xp# zKTTWEUF}gf+UiT=nGW@W5=CoOj6f z91cFQ-r@dE`Rb2Lp{BKKQ;jEyiN!M%J4oLNYEO7TQu%k>SF(_fp56Dq?t~g!SXtfTG-!%**flgoKz}3{$jEagf>P{si5n8$J zH%H55L>evVV9=ZSY-4etSG6Tx%-6IfZ=V>hDXHPUqyNg&)5_kS0q(?OaiGYiQ;HWt z^krTiC)(Wg>E`a#ss+uy5a-I>xtj*f5n`5>?B?d?@2U7dEi9OxK7j-A&vkfsSX^4l zq5bW(byckI3`TW2!ECrZJmu-v@tK*ozP^N4#ou4%=I);EpR0V)C}IKWq`I#!oLtlO z+F@8iOY5?8Ma+i}q!2#$?ClGioo*_oqb29#=O0^KY!17n%V#tFxa8-@ z;NZFt7BvbUQ{|GqRJqO>`;khw(^PzN=l1qPmjg<#`7Z@atk zoIxt$KHQX*we`23Ki|U9pZ7_UHR7U#SgLPmD4i^UM`7H4(C&eSv$D0tz{;Aby6N@i zP0t^awETQ7aX(70vNAyt5fP!yuBYe8$Q0)LkC!KzTG0MIoF&>PPo4+~35Bt1-z{0L zP8A`9Skhahi(%J(wYhFm|B3$g)beMaem&Xt{o(X<=A_5rcO4!11fu=XBl}%?psLzW zKcH1Iyyh%oH+SCM-5moNu+h0Pkp<4HD4Z55QTM1wi^_|#Gc=gP{q-mFZShlk zx(z`$&R@9DpI;Qu?-BC3b-8lSza?5Qp>q~R{(MhH+BmP$t-$*45b(D{S)aAdZ~ooc zv4ZgEYr4tG!ZNklt9kv(73^r~2XIGhm49_gT049dW?YJrhMi`pA2S3tJ6Nei3)tnJ zJgnY-aEKC0U!Ec4*bG@WZEfxDQybK|xw$JF8+sdm+L@KJJ-AJJl&e0}?9&}g1c+Kg z-b-jV!mNk-rKR0``c=BFyE}Nqea{cl!H2-W+Op+JwS+esKJko$_5)_7gT)`w!AwqO z?8(w>&41p>=deU|wA1;)1*5}SyKKq5RX7Y{kI$x)?`s)|@t-oy6 z>OwG>j#Ng&Rm(bfU|Bef+AjN33;uvJ{Tz;x=8FSvw4f>~Drh5Z7k+=7Y7FJnZ#aMV z?p?>}a6?SGMZT}X*9v}qepk5aduqXux3unIgM;da+f_%m^nQ`rFZ{kEFMraNaPYaodpn5kT8&80+@qnZrPWC+o;H z(M2%mc7uY>o0qSO@9*zBj(L&8s!w*MJmtaCv(q;)uwHNG zThoCW9wlJs1BHXbX-!WtQ~kN{SBB-0jSbs3#MBLNjEf;>pClltuB-FXZw$$CKX8r| z6OoXR*xwqkm`V~&e^wToW z-_kM-ku*9J`@#Uu3Ac081t%w`$*HN}y(?)f3F3ZNgoL8P!YBZc{D99rG%#Rj3}GpY z=TIv!7K5!Qb6B1Zd?JF74xB!m&_m{h-#J&aDz+%0HffE2f2Z!USb#aM3=hPXKS%s( zY@C2|LeI+Tk5A+10YEbX@|gSIG5nSoVYLjNAU9z_KE7XI=N8WO?*k-odV-0HGiVdy682KD#+`SUBkbpysGCTih8h4EU@7`Dbt&1Y3rPU`N! zf0PT1$pRUqzBM=dk%;bp5L_+~{QK7t@_p(-l+fQ%PiB?e*AQ}RZTCoIRaF~eUmVuM zv;JvMz{enTEg8y+7FB4yi4z@QSc&oRapekUyF`5@$VCj}6BAB*i$yydolhW#r?wYB z$nXgY4rKlO3tKIJUQ8A;)mbX4^g*YY=tnA=Zkxf_j4$?A-)<`3x%1LG=K+n=eJGEL zK0ZF_KjFM(z4r177A#^S*IbAFyy3A1i1K$7ul3|Zu|&BWKmDnn!X*#aV~-d;K1D>R zKJNnB>3ZoYRYol_4qv#^>fzCnqPB1KxUh-Kc#-RHhf+ z{oLaD^Asq7rv7j`nXs_18gNL2w1f*G=<#IS_g5c8+E`TX7$n-w_w>YuvT0@}cNO?W$3k?cN&-8`2Aa~#N$hDdfkDP}? zn}KP7%%7D^4HaJ=qu&z6-=llN^UgaTAG!U5gW&OT9Wl7|i64Ha;_}Uh`lq?gIl_Zr z6PWJ3IgOTY(-D@cBURz1{>o@gk8Z5nRya1}^(Qg;DKAE=U-rbZY}zgj_Nf-dGd4hn zK^FWd5nyIl(t+FV#*J+e2=b?}u$q~}fBqOn@<@ksh_xGWJyKK*kt$V+}i^wU_j{5Vc6*bR?u?Q zQKh)qP@Z7`HX|f(yAm4~>1csODBg8zPKG%zj@;{NYCaFH?k$zIPCFzq`e4idzw~)s)-&bmvhRq14ENz89`PbC|p?FM> z^8T-*mL0_w^m~7CQtKy7+6MACP)>VpaW?HPPXnh-o?~xVMkB@I}y}!tL{x$$V1$c<% z&D8!l#wpF#l$4a<9#QBD@MJU~t6Og?Y?S)GdnYT;6l@L9W&T#l-{;$ZLha4_H*G1U%c{Q6E|! znxlj&*->PnIp6BB_IDycbFCD1fyuc-qXepwvAUrOD=RBc*4Nyw5OXPL=ukcCFEFWZ zY|K01eN!p(8XsTS;lZ9-K(L>Vjg5_jq$J8QiO>w*drSPxolEs)fk|(CyOAT5PBVW| zILnMa-yoh(YaPrV0809)$DyDc^7ZR=NFDk!Ez#WO_W<}oX)Bi29O1uy{ff)a526uv&UV>0pLgojd?8#}S;M#QGQpe|e_#GV`=|zx{XsY|`o<$cbD9Ol>0&dMdG`%=CkY`8&nL|OtAMr4X>@QmyEr+ z1j{GNI`2fuYaZ1c?+uM(0^_3+ntJ$)&2-a6=X4>enZ+g*0jP zdrDtBgCjNK6w^v(VqE@?y`?pM!yt0BZ?n6#D4C|1k^b}WU|SQ?-A$@T(R^0%%@Z#c za(-G`T53UC$8DUJ_|^gn7n!s+);g{!z`A7F1XGPYASd$826_w}VTp6hhe|0)jueY3 zE&y=s8Fup6S{#^|ot1#BHVYm6X7SX~b?K<&?3hoV&USQmKJQE-iiwHgi6shMgY=rG zU3(&g^;tvP=X=nKohK((I>L(GhVGf&q=y-Ru>OHiidlf@VR3Wo6QNaHkLLNrBm`n2 zW6^`c^)fm|j3@H4i6>PTYUIRgp8Lfwy}dEZEO;yV@0H7WIovasr|+wZ?vOx zN!XbSmVV;%Tbe7EFMHh5{jmZhOkeqPsAW#-&z{Y8r;!6HngTqS)ssC9Md3LloRS?T z@}kcSsht`giISlm1tv<+azcWDugWoKri`5FtEqX3swJekVSy^`?o+X!{778th+r)D$<%(E@YRLTk|=jWmNB=S0IFb(Y)%wUIbE`WXo9c zLm3&F5{ahZf&^0x&h!jX)622C)}iaMuCHpeiqm`DAnlpC7vge!{``5$Kk{*sakrIK zxQ2!XhR0^!c{kl#^$Wd27nk8w{&o!Q$}zpr-be5)!L-Pn>+5se>cyb zIrCCAqp(tg^=qbNg(eEp+-(^9gWXiYHHo7vw4wbz5mzh)vH&~EM{&*b$)%4pqK^+$**~}y85<|urS+B z^t0&YA;}xiVIdrks5@B(tc3PosFihGxjf>!P6Px;cV%G`mB`^=-FcE;bsHjR**8av!G(5;{j*TKO-!)1{h_z>vf7KSS#0ZShGxV&c#g-#cs4nCX&z2*q+ zbhRS?;G0U;0NU0Y*{b5&js5^sd`m(*{WaEI2iOjDDqT0)A2fyCsx7@%Nmt-d=R-F5 z;^^QstwYp+exYl zDt2(oQE^nE{FacSeYt>ULuhGX((*{dboza9anzkCrYqM#5Gv>B;6d9Wn;_m7Rb;=Y zYF;{<)TrvD99Y;A&iNK9ODvq87)|#bFNp9C0VU>Z*Kh;t5t##Pl)1vsw6~{LX3qkv z%dOF@**UZI$o&WVt9K3;W#0>KB^ zu%u3ijNfMZH1DwERT>%^XjTdbY3CdUt=={h)c;+bFuQPF{hhDo)6l2Ai81s2f0@%~ z%d`459y{@88AeMhW!Bajad9}VXmN0GI0AH-ZTpM^6*o%I!5^NXN_FHwX|2zmpLNFO zE5k^c0%8c!wxLSXTmK<4vJvp-%Jw!JZ`Cr?4YZx((3}*hS(JL!a`&q1+Gs($HZm$yV_l7>alP{wGk+1|%9Mbge$Vz9kd>f{xH}hKsm4C#GP3 z`}Xa3kp(S7VEwd|tn4M@ak<5V=|~Hsp;B(BYPn8yN?n`6TGbfH6*UdPH)ltxM5_+A zF0oZ?d}`)DbLPxGJjtMCEm5eeuKY|%x<8F7SIGkN+B$X;yx0A!7eAC1dB`N-uFtBD`C?B?Xpo;$ZQ z?#l+mQCI;!9&5T#Ip1tb9Xw76a6##!GgDI^!@`WDp2&3;+Rt`)u|6wZ0U|d~zwyHE z=KN0}+Z-qSc)h*7Z_A#Co>zZyCj+vsNkihp6#vqF(|veU3Q>0wDJMzY-(;>-N};pyq=OjUU% zYZYq2(4{?k^yp7-mS)Kw0Pr8V`i;obNeHe;Q#* z&zkCvL`jt*^JgVhe^}1A_IXzn7l#Fi?EYdUD&Luo1mMsVD>^d$_r>8lEx=gr0yxj& zB_=Et+#z(ezO-qIY4jW%XT@Ywqjc>dh600v^f-TJ0?0!=!`z(lB6ilhIiR#=oPo3> zV+fQ_>qbl^?TdXx*gRELRW;`x0qBG1AzyMfRtKP>=yrB?y3N(>=&xP-onG8fU$5Pl zs}CH#N?@Jpt6X2v)0~`~jR*RUC5wzKEQzKT4nXX}1#bb{2E=$pg9-H5()aJ<0sx3< z-dFbZ?M&y=E7&;%ijNsm+SeFoAE0xT-wLoWpUl3gCb2hibl5xXRs=mXz`cy+*||dQ z>({>y?*D?|0eqK{6)3n=jN>O>3v_ZrMbde(9CsdIit~V+Y@|HQXlxbt6Mwp7)fCCw znza2etM?o=wV6#G?jQZPX$}&r<*gd_HWt#c~Oy7K8$Gm(XkJ84j;(0F;k-u^M`dx1Tkem~fWuhv`%Wporq9L^1 z!m+E+y;p|P5>)2Xpi!_opX|>_LQA0O$IKhLS^RnSsIxf>@60j&+&c*s$|_hPuO$UHL|bBw|qj z#jZm6S^++M9bl=Niy^9hhkqwX;8cl2`nqxB2C8DvODdCR55n;T8mJ>nQxwpNx38}* z=ozOk@uUy7iK)Q0O+pf#hGx?c7>?I(-$KldWIL@JOt(aFkl?qLh8oevN-jx% zR!l>%3)pr>AZv9%QNqQ?w*gj+$9&Km(qTbSTdD;_bHU{BE)adI8yn2qpGyJE0nK9( zU2C5M^niKs*a<-Rbs$ph{7DG-134OqOf|p$T>#j(fX{y|gm(T)2bUcpY`v}x#2x<&_=gpiM($ZK(FQLT_Vbk;n z)cx_}N7JFwU})?M`ct@217>Y)O~I~(si~>CMo+&A4YtjnHab8Lx}4WU+;(kIZ&Dw4 zJ)^>Gd(ehN(0*a`B|gn%R@N4V?bx)mG^s3ceH0`nn4pM=NAB*G+%GqP)HijOtr-k- z9xy9H)OU{Eydr`YK>fJYYc$_P#|2g!aGOfL(HW3Mii?ZeARSoOE|a_b`TW)qcBEvz zMergpvv7Jy=6kc)LdB8b;0lp6XxIA;X{ktFd;k74BH19d-!C#BVlu0R>dWLRtoCXj zAX!J|Gr{tTirK*un_wFvLEAsKA>Fi!>@h%hd$ycUY62-nruOF%rzp=+9?zRFDzGQLXmKA!QBxp^iB z@ago7j1R4BZRO$n(#iqn@yxOUlM)PZ^bGx4zG}wV^XI<+zplt{J?Xs}1r4S0MRqL@ zXnYeu^n<*0H=M^T;!||ATfIH~_3Jm!F+7%Wb#o)jP)xH0weB1JcDEGH)99^;#|%>$ zMZe^s~ZR%if7CqKJx4D420TidD5X=UhQZ{``cDhk-meSxdjH8x7l4p)?M zKu0^jE(09F+o=+$mKCTy6Z_hEgBmm|_GdpqTL=d2{3Z|)y8`_cE=3$5Q6>Uy?IZp5 zDWcRskr3Mfq-4_N{}KnE2@akdFj^LgPhv%UG_sW7o`QDPX9l7SC0gZF1U?G8Y%wCR zxVd@m!iA*wl-vyri(*n8)#~a2Q~kc3!^(0@K~iF}DwJWqSp{7RTW%^t+gVdiX+HE) zU5HD7Mvb9vWJD8MK8J>9y3gkU^=85elU-d~lYb8-3NsVGt#FY;&)XWp%R0-qVSnW4AoeUZbp|djE+a89u}^4d zDEzNk;H#hCK3({-Fp>YoG4+q)P^)X>d}+Lz*bOxx#*?9%%URjjJOz(H5S-?lUS3|^ zscE?!Y|_ittIPSNv0jJm^AeW!wtw>oVOgW83w_EVH@&b&!7>zFJxnaKx6Ss_Cm?DJHczV;mOy6{d{o08O1*pYncV2=aB0t2P;gd8wXpaR2438+5OY zD1poW3p`({&{rVP(F*vh%9rf^U8-+tVlFb9t%K7puPxHj@aqaGvPF3th+lY#JW+SK zIEgohJbpCkaeVyn!6PzqK;HuY8u~1#Jg{9{@&U7Q>e{tyq?DAZ;K2Yt z)pvbRp^?n9IrQF{4r`Pw+Z4+I=)S?Bq4^SSWVlN9kBXuKQJKx;W^dA6?CP6Z7q{#j z96~WN@IxcLi1m$(Y5ok7u9XJ!RDBF#-NZ8#gf(%BOxwIAY+J|o&84= zj~!g`DmPhK8E)PB2<*eIxlghfxEu0~+Oabf)kdVAf4GJ@j|^bpj~T#Q@ebN}Mn*7> z+^i7yi;8E2lO7lmfyyVMrt+k=)X7d_ykJ4p>gwvC>wp^vktB0@+FNyea`JUT0%9$b zii;^KG&Dz~j4iKSy8stokRXxmyjs>yMM#Cx4xTn17U z;zjC7EjjfWxpTK4U+D9q-yAv*%M)6o#l8YqXB>D6jjXRPjt&|yt6o<8`P|dYLn^uMS)suVRVY(>r;e%&<*pa64 z6)cDXE}owOv|qn`dF_6%s}jI3AOLPBHpnLFSXy8OVPd%|C>S|8spq^or!SlY#1(8L z!_#izPx>zB6qv|><^J;Ji*i7QddVjwGC~g#7#fPuC<4gtQQzFJVN4CsI)sN<9F$}i z=hLV`gcA9BiZ>_I&}}L@nAuoarEGG%v`%}a0Bxz!V5!|r1S7$_r2}jw7<^XX0XSd> z%JRk3X~J=SHz_+GVGr72D5R$G=-`AmQE|;VmvjSBjSGxab0jaQAwfaeHZ#&-=}A+7 zWxxlV-{W-^1O32InL}?f3;95@3iqp`0y;st3@`5I5Gq>@4!IMPBkSR=j5}l8g1cAkRjqDO3`zu#NAhfS>U4ki{?_Kia*flMX= zBofe`n?q5~pa>yC6EyR2fHGOj)9N2n-HZHY_Xae+;Ae;PS+ZX0+!+=X_}X*E}MdQw6u<^yI}y88$}(_%6x; zf@;{eCGa48nm?=VRmW1%k)!WIdR?gyJn0)Pcaq|Vth2zxZ&7OQxHk@la)WZ!m% zd>XHEiioH{MS?kk1on3v?eD3==ow3G0%dEgQz*f|!}X9Fgbecd6t4516^FcN-1&5F z2TUVrHp-OcT&Wn#npb$xs3!EzgJ#1EZBBBJ9T1#gob&;pFhHer-U}M>wscvn{TV+DLAJP(nQi1ZqX*W;U_$ zj7`ykp%9kg&<{jIHq15c;{eq57wi=a`$h}PauqMMhRb9xyh7!=`AGr+#@E-kufT*H zB%&T&Tqx@LJMGN6SrmXo}Vjn2P| zb8~Y8@f?_f0jej`(hThE*@HWfIcGpz83dlBN0%Y+BnBTJpO{v}w1O1~J!m+82VDeX znzmrllh_vcT!!e(f+?%WYRIlP$6;9m&;c@0K^ErGp9Y56ZEx#TBW~NQ zZE;!Iz#wJB+{PitNaX=kzb*`${8wUsG zRiOC6vj$cy@VMm-kAQ6flUX{)1PkeTf++XKQN{Lf0yrg5%?BmrshpfnMJwP22yw89 zyaz8MXypc-Nm4w$Y+y|R=5u^up$XU@;L5WS4Rf80&kK8C;7}kdG0NH+70$ODmefK1 zMd6JB8^u+S!@;NmdLGD4g(brrPvRCnj!?F@*zx8Nl}tUu)Wcky91 zrH3GfqJ@Db0dZF}t}Ay6P5ZuiVB!3(bQ1)99#je%ZSZcuhduyP2nMM?onJ`=9hQJd z@p?<+>A<*gSMSg$npkjkn6T*k8Tu< zMbFv{)uya0|KC*uwyG1`9rzmSI#}}#aQ1;!K2U43Nwvg&>++@CW zmS5McqRVZifUbu+f|VWsGqiF`#S_HPm17_leK*}LEG$I!SMGHgbAwS73hVG^kdML4 zdWQYUb7$l>g6;zOx-?x^@x;W$nAHkTLn1szL=dfMiK<740n7upp!GXj8&2KYN-fDbsL#NUiMzTAff|TG z5En>zV|C*PmprRQi_ruo>(S zCNYD6Ws+6#1O6xyW~6E2)sZ_NF*WWLEsfltHs!;vp05?;WZPmq*(Y|*fc&$A?dR`C z-())(4e%f><^j{eix@zlIKM&Y6oVNYT$R_5C=5|hpY-(F<;&FuxQ`RsM<*t9haS@b zl7*&A#Z%M+$|BMiT>rAe0f&yM4QSX%`;GbD0N|BoJ}oYS6%~;vHog~FepkH^)uM6c zq4a~GThDfMGIeL5E4mh?XIDVKO{uko9&C@a(z-dwViGwkPX|S-nLqyWjBnQM*%I>SC5)Mz! z$tWzxe(w5pwebk8Nlztf6Rit3@r=vP70;%$uyeVrxTx$=R>IS-_o!K{f_Q|Y4n`9m zN=YSx&K9aLEWADFsgY#}scs+WEM&vI9^?25IjRJD-GSyrag8)(uwjBl2@mnkPoD_m zc~n)2!j7Ye1=J2KcAA0%5Z=WQt`xlHRDju#n;x+lkSBZ6RdA|7l&=Sit0RakaQGS5 zXIewYMs8li(z>c7qu#LE<>PX6UTiF}`zTjXgwUY^C-(jF%eU)ZG?mhKrq^5b$#l4G zUW@>rS}QUO zBLvhcw0`HITi30a~J7h;2US6lbuG3MZ>EGq~|dNJwB|=2@C17te|LXX`OZ#ll`+h$2Lj%$Z33+=d|(igKhTZQqxM( zyIpDj3kFk~ogk3S0mw@vYo`-8jHjB@2LzPDRfbDRuazYa z=Z+kI0gRmeeyGs3r=-KR`g^9#yOr_s_r`Z(+x8FUWj3>l1MLWkKVaXx!9frB{10K-8S zA#f6N>9glMehR74`P4+Ox92d8MKL;cg^uz}f3=zv@=0vd6jfC5xy|;QXBZ5~Bv@}l zj=PpXD;2OWoyGtGr@M5}h{rm4FyPAUr}RRIpxWl10I8d-K$v6>D{ejOm)p~T)g#U{ zUeL$G!`mD@D?7kk)#+RG`J92DZq+4iJFDf9`g~Ugx5`Ti658JtYJ>!`?fe=S&QG=! zm9?_rehjV#%IQ92OR!!&dUQ%l+FQN*8-M%C4WGMr?qGp>1>WY60ZrvFv>)n&d!f&i zzj;bJe0rvQS3ddrEeG3@bdt=Q5JpCkA3p}CmTSq#q=D~ai0 zQCcMy_e=pAKF?H5lqNWomseTC=3}=oG1Ac&5v(NdV#8|R1$+cH%xdrv z|D)oP@qoDOSa&!Hmpdy)FYZqtsdQ*hw0e1Z=H9;5HL{9?h`I^q(PjG`H3}y_{r~zf}~8XhmZ+#1W>K3WaF8-8U>6C^43}yoIx3YpeFg&P?{E-Tgv#e2=dk`t(t# z6Y7GsA%G72{CSPTCCx|gPw_gOoUET8=uxG9_DUFwFH*(3{aQ&N;_i|jV^^PO>DV)5 zC$V1&k1*KbZWVR-=CvQJ8Khx*MaZ(kv8uMqhsNRW(a8QLepX;Gzf4$&vyMIJ1zXh#^L^i@#GHibU5ZT}{E1yFDP!G@sQk z+J(9mHZRqXqecy%d!76OR$m5IUuQy2xnPeO6F~fa)IaUsf~w)A7fP6UA6;0pyIfM} zQ;`9QIkxjR9!Z^Qr#=Yh`BE`7pT9t0&A~zvn2rnd99;x6d~00OzK+46rN>~r9DEhK zLz9A$u~nUge*aDxLQKj!9~ zCl1!&hU23dQZ5Df{@c3FZ^jqnrxpcE+d6)hw9MIc7#odQiC`Y1A`I)AI+tW3(e>+t z^vlzxGrq$)<}ZY${mHSbU$pA?J|8-MTEPyS-?zK%R`5sTWX~Bl<1q>!H)c=ivEs7N zj2TMf1%5KQEZi#7nsEkwUKl7sQ^zu+RjYPv(ojahSMYD7QnCprF`#+hhN%@89RjvI z4@%ji)@R^D2g0HnM!^89#mC1hSGtxo^8@}uvKfrqpmzEFd(_x&xl<6u4CgG|CH?RD z#Qd&c)Jv@C5$Xq&iab_GX9F)hs=Y!Z0|Su=Mr5cJ<$_Me@Hnjc^~rNcH`XHKs9 zkN}8^cfj9MhqFB5{w^EiyXrvE7_SOCIR z$9AB3(fRIu2F-eaA_;2xjZ*u?29QVfg$)7DfUXe(gOO)ox)gx%EMT@^Vc+JLd5ZTw zyq&~8PK>!HXfYSa$@4&=h)+n!_zCb9+GY@0H$U~>^to$l$_#X(LA3`~&jb{-DY(Z` z5G28=3lJZ~I0EQi5}wgK(AB2F=Gn&3JZVly{;u500+b@%eKV64CroEY2Ro%7$UVQQ zNC5wW${4H>8XYYK6J;knvB2-}fY$9h3~^>`w*v5bckVj0_As4>1ATj)FZlrOJ918n z(-f!46@N@ma#hf9z&Ycsz{wQAhnfNfGEptr(2Z9TZE`_!4ZcTcBg_;)v-Sz7KDc?< z9Aub3P02+7nF46+33vj8ufXTv2@OqDT-@cz;UBrsalo9WBDIK5=}fxa?L@gVe?HGB zKcayQb}flx|~yJUF+Zx3sddLb3}?bAY|w z3AA|?WQ}=4gcE1dn+fBvp)k#o)q$}DI`46`K=-bVv@|hTDwTFgFP*PQpbS2x8byL3 zx%TUk7CcRS%JUT)Oo1v3(1O=_czT>cfH-sMl4PuiTk13adc9oYk&vJu80CGXYPPq+ zO-aNMn9{*vD?p9RutiDYiE^JEi<)5J03qJt3;b7BOCU^<8ec+jt47u}fa_629i zCuo`=E-?s!frt+GkD3155AJDF@ITgQAs;cbW@QvisbG&TEwzBh6gAxd<6tCW70_QE zkTJvH26T3bBJv7M@Z=^R{rpA!Jp-PfszPhVzc6@y9%~c`CkZJjeVBNH_VNrF85&(m zC%gy!o0;=EYLkJy2J{6=@jDgW6uJf~v%u^ZDNn2-;j8=;?*HM1|0Suy#+=!o1`v0O3C5Z5sg@S9^Cxt`? zTt6k;aB8~bLRMr?n7V8LJSJ&De2V*v-us@hIE-^Kfe9x(LWWx~RF8w4{-qmWq#1vz zm=I$;h4tyYQHDPcicEu*0E9(Z?8sSZ#O2-fW)Q=^E$g3`;AHk8H18@C*_Ua`hxII} zGm7Xd;tL@;HRNnyQstRccZx9_r?<(s<0@@AM$zzag^nCzC8VauN8x%Y|Pbdm}Qg|NIGQaW?5>)V~Z&$$5M~HW)&mW~?}Ry8JJ%(1D`lMgJU?A0l>{0c-`|9%&t` zW8UIY=tiSGDGM6*kG`Ev;J&yqyMYZl!(5I&{Mzf{v#>3XQskLT*tE3Yov|QiVG-KE ze5ar8G3-3PJv_Jxh1`Xc>dK~Nq?1~&{uOGP;y`m@b>Z1*;$*KY61Rr0$d?LV&Xtqb>3Q#aCI#g2G5i3ELJ`<_DhbN zFZF4TWj;o3AB^QxLonpS;BZdETo~Da#P9jYgRhGSiE3HkJKu*~lx{tP_KcaEl zL4nehL<`)5(CS_R71Q}~h9Y?PnxPo8IaS0n0=0u0Wf(TZgyH;xao9G{5rIB`1>G{# zv1yo2&Fif->SEO(=-{a)!!PiOf~eOg`=8NrkD$m+0JteX*cw2z8=^aqcMP0|p2$Jb!9jEa2cDIuXnJ(q>#_ho zkr~b)=Hdwi6e+L1-8J{9C@v{M>@K+Iz5V?3=eklrN{;}H0gTQ}?hs5-JPzl;^8mIF zk&R%41^GnFOaBLyMR@gsfXitjFMjg4ng~MDCc-;_r-2i#^^3-y&$2>CBRL0Z)Svlz zUr?g?`TM3Ft*tp;z6{2v0WiR0)=vs$gR@nr7ChF#d*+19j*i~e)BDoQ4Kzu*HQCC> zY$r@k77l|+)&?&ieKq?u7I|=x%1Kvux?fncSP1V>Mnf4lE>JB6_ok_7`eslhu4D9KzYqYXMU}W+MqRMSrK3;u5KuDODe>z(FZCP1aa|XXalp7Li$)OssI;)Pb=Q;A%Lvzu{s4A3dUCj{ncP$Ltc*3aeK{Ka3@E`xnEZcMRM|8(TZ3u1512ZG z0Zw0V{39L_eEYz}_B*!#Z>YtuapSNE84!2~2uYBO>xI!2@7K}iFdtbp%%^SoCB zEAGj)wu!OHhba3|G6*NV-yorS&@YrmA0r(7hXm z9E5WT&yNF_4&9FO8xNvHhWGl;yHwo9{dlF=|0T~0=zBq@ZHszQ5Y&uE(3VoS^SbT7 zr#z3I(x4vCarN$phbjce@)#5Pg)~!|IC_i_d@($5J0sNQ)Qot&HVifP5awaSjVsXd z%q$)QtmfmN<*Iv_J3sj58inO8*_5$ve+)Pb(A5?DNZErV2%^KDeKq^{3xHfwGjjFX zJQhwKBakcT3-jQ(1j&{smkQ z@pBZ9%sk664%8y7s*g`mNq_RXjMnQO1FRPhz8__V=MKHis?cqCK?WTiw4TS$X9T}Z zX_a}6?6kTvf%WA({|Y)$I23eo=GtoV>z*h6iw|bFf9`R4KY8}IpR8|11PPdhqU}#b zVBo3(5mwQbjo5N>Qrz!fvm5)R<`Ks~L{$v^(4>p0AODfaasK}dm9gs=Jk44O=5v$( z}7n%T7?Jfi%iO8?q1*xWQFrlD3ONh^kP=fG&tC9X|;$CVKC?yIDVy! zj2NM0la^;v2qwG}RY07-W{0ImaV)nbFHmCK!72)ZE0G7v2+$pZfsPL8Je!OG;j4XD9Ul=d3lnAfz2?2r{W`EstnUtbw@jf719mCC-TM z{z-r_cVu*)u;=Ctp{Z`T@XGeo8s@*Vf$r=CF0SRu=p7J5kv;5L>)2Eu8q-U;5G&EM;wOGnrZbo^(0O_YlnbUISB|A z#geC9FUArq%3y)?K`*P2O92J@gci6-Y{6A1u3z!Ln&X$hemw+n^EJH4B-VZRxz`K{ zB^P8n@iutJ5qdSuT*}u!FfRz!>Ck2;@X=17(hsvFKik_^*JzA5pAOND9%E>x7IH*l zc<<`M4#JjA0Tqq>3*f!E7%h$OA)Wv)RM1Ga=Laj)LVrOct^uq*bNVy&Ln$fxP@e~9~)&2ht%rD@(D6zxnP-JXgZZ3?7 zxcW6bl$3-yptI-|2SPAN2+m6d=V$izJkYGc8zexwpmp2$Xh%V*1r8x_KO(D>Vj4BH z)}A$52mIH+IuTo`e!8Q?gL`^fqk6>VDSuely>0faQsaMTr6yC@1I(@lfWdlVAHbVS z0s=_DvbHc#)Ec9JGYT#uAWM)R9fq_R;N}aGVv)3tJVlZr%y$yy6w=Cpu7_#7^rE&l z8NtHJvC^*Nbi+b;2d&_VpP5*r00h$Sbbx&bv@9GLN#;cF5dzuDw4f0TnqmpQE~9UsU)jJ~5Xg$c`Ehn~vH}+%=;JUFLv2yMdO}Mh zNSjMh#8vqt5JMc`Hv>c0oh*%tFhK`aaAEamnZYY?z@V?@@)vjt^cDng>B8psWIk(z z*DtBSt0$0f2;%kcE_m<8Ll~0=`KGGl?eHY1T)((O6F3T{}1UE#$;e@SYZC! z2N(zHnj@@u40riBg6kaw5;y_xgPR=9-~qJBtib>M9{8-u3&Dy4Br+L_(Bui0NgGd+41*VIU&J5747G^kFL1)IRM!qqy**SuzenG)5`d58D_#!;vr3T1B zS;lW?+_=gmok&JXHupSw*&#=%axZjhKzjX`N6+J`5?$&dl!KF%Z4M6$vrS0i5)yR1 ze1##0>a-e*Q5Vaz-u7UvnPwTYk7`H`X4D*)$^;iR~j4+ADGCz!ziOJ6}n z+69o}pfy%sWzzD%THMF{c46@CQpa&O&-FkowGqKWDVGg&CNKq(tNW7}h`2{EKGFwb zJDOU6!SfgeLcy|ZTFWV6kC!ygrEeVL7)dXMs?RzdBM3G7MJ!iHDq$S@rvQ%GmrOvw zmp5lp#ap$jz4b`bXcjKk#ef%J-9(*3*SR3wHwoSI_}PVi913#spPnQl%1eLYl@Zk- zuP>?;WOL4Nl)aQM@Heu&zRt8L8jz&Wr*@pvN+GAUwYH-1{}91S0P|o@KmLWrE2M$g zZ#o)gunI{muYPYlc`xN%m48yV!uoOW;*}9&i6RmbrZm7`(FU&u!0=cMH-WMZ8d<6^ ztWc6-TAN_%4W?VN%BK0mCp8}@%H87Q@Mz_U)v2w~GhdM3>2W)L+DrCC7)@|H!1ji5 z8WMw(1phLqn$Uj*qoK?g1z&;D^llk>o%p!#-b!RML`z1*m=}UUuiC%F$)?Sv`=P5a zwq|0*JxbI8_cC-HUhv)>%;2Ej1Mj47gY!yqv*wpC2&*|wWI9|Ht_l-g4c{Qx&Wt>P z998jm?W1v&Ln0$1abHL^d8vCS;CuK}a`!s0x9$vD%5>Dg#Ys0adR#DB$Rv_FN3^;K z699#2UGc*=jq7o&Xwu!O)yE0br?2A!cY9t}4mX@F>6*rUg zmnj>7O$4G!F1*JGIyf0V2q}uYa{B0S`KWlYaKI8whKth#f=rQwD{_My{_36mZ(+A` z#hL+Si7yUaS`xEL@_tSpEJ9I#s22R= zt1YZ<*qa{%Y$o8EimyobM-btVEEx@-)VmjT`dAU%1cJ*-44$z~XJtow6z)`Uj}n&a zZWrrGOdXk3>K!Hu4}X?Hf-T$l5!n%(zeB(Ug-ja)tOHFY1VZJIzUNJ@`s3R``KJVeP!+6I z=eDXqWGZ)~v5t?Na4sFT#0cmh^S->L5W`ST4hISsI33$3H!KVgZy!iQjk-U|(*G15 z^t#3^QJhWo?&kO{_6ygW8j!(BDzQQhgLfg2FV9QB{(k^AOen|h)a>l+zxM(_O1^b?j(V7-WCVCR@^WeI-?7b&&ZEu*-n%@; z_<*GLmR*GwhR7Cv;^XAR1NSk8EfyiO0xfW~%u+3AC#HlpST_5z>kE+`<|kAohgvlJ zi3ZfjsRQq*#EN7ZKqhN%Vgdq)c59U@({}$CadKxIY`PHlKhSrbP*AAM|IBL^Q^r^va5uA*6X%`LU+~@*A}S#Xi5X}zfFKy# z(a~|8!|MM7=gJib2(GB$2XXU7U_6=vkOgHPKNy>0PzIvF?Qpo(lOLg!14$9#!qb7h z0!Xe_Lq|vGqLi_~O5{yZJvRwAc0}&N&|hTmsrrw3FB8o^Accd4A=d%GJOIAWXC>Iq zg7R`6cpacy8pz3q)UFS}4j^rl_yQ2Z!xM=RIjHpA(zH!=pYIMJv|R8{sck$$3>Y9I z5qSQG=cdl*FHhY66A_!pcjdhmN3L=D97ooVR1;gLA}FtL_5s<1!IVT{TI4{)pJ$Km zDP9C=NTc_!qp>bgUrjw{3UH9&+}zwe2Hre)R@`!!l>s598;J8h>Z$y{U}dUH?js{3 za8!AmrYmh(j$fN`n5o{U>x+UU3~THNqj)CupY3YzDFi#I%m;sIiEf+52pJb7*)5<* z&U^k`Tbl-m*S@GRY)oKxLVEd6ZVkL1Q13vx`VEY85R!WUnv#NI6HxLjx(C8@$-aWsPPU1EQj-$jJPIf`WD_X=p542l+WQ-$O)E_4J|Z z=LpOC<-l>Xo-g4q5cCSB8Djl#2}sJo83)eUYnZx@;5LC+{(;d-uVoAvE&j#RMn1c; z0r#_^q2X@P!@L1x)c{O~SY*nD(J3k^z3vo@o?ZtG4RV#VA5|!b$*ka+p}SD+1>*24`@UPRQskYyr8E$}O&;>Ps>HT*A-Q~_g1yw#lNePpD}g9jI3lP}*Pg47qqwfY4M{c%Uab|>3Mi;2 zMk?zeCLJJ-(cEZDNVyI{4sX{bOFESnu#m%5ReV<$lH7uYznLpx%>u@k-yidk>=6h^ zO;7{{GF=dW%#f2a0M}o89)I$i#1@|3TRqjr_>&NG`u^8nUNo$p7!YsI*tJrR3cd~4 zcPVP2MDnAjTPHT?E7L!=*1#_KZB&#gvh$bipeSSF;Y7t*llb-Bf~;sgqhjp}MGG<& za^hh(2QL#S3TUhyK>b-3umQ*^b4-v!ktKz_DS@OAZVlODVKzWDgL6ye10rxAsYoL@ zUL)=lx!K9aaG-|;jWD}mp}B+5#U1Q_R^TGIf3&sm(vf5T4z8j92Y;mcveH=iN&;b* zDY208kK1Db>jn%fP!J`-oUonjz6cVnMD1Pr-)gFR$P!34h!B1;))A>^P+E91CY&KQ zRrWU*9)$-`1)Jrc_qcA^jPk(q%K^g=5_XXJjh1Pv-OtZ8EVN&n-pcT- z%DOthV^C@t2`NTutU6yU%C+I3P%zdIlBH-skZXu?BBsIlyp8q54haQ~48H+m>Xf!& z_WxYmh4l~bA;%doChfTu^JF#qOz8&HQ2D-mhK7THV9deJi|d?!Q$;F3^(^1$TX_po zkjLmdJWlS?_6YFADy2a%q8yvQ7s%(`M-6IVq8Amm`Fv=J`PS%7;IV=Op&X=Ul}Oj= zh)~%A_kN@U*#k}rBhI9g0JgNnY9w-!QWpsOB(!SsteFxV?6mnfnB^akXCt}Nfj_or7 zD+lU>Kg6d{E+oD-|BNLgb?^rTJX-u!WULm7xub|L1?U+U6((y%btzdaKQV8A#C7P|v86S=q0? zJdcEXglv~SIAVoIovIVe3V0GQBdmqr>HqhilH&Pl7cf<4h+keZMCM34@Mm(Iqj|Ui zu()WlO46qt2svcz>-7Ff+pB-S)D`3x;8+w!v+Z(uZxMTicIH(?M&Qd8CSvAa{T_$N zFFl0MSxmsXoZL{(i26;>OK6TJP)+w zvG<%WgaQ z2W1a>B%tM4|Jd2sNJZc)j)&@CdDs)CWmFM?&9NRkFT1r+qGg50-(k&CJLd~JYA|MeA7K;p z=Y2#3a2E4-gvzy{{$&HDWW*%g2wXl9N{Uudo?_g8BqYM%n-e9H&(c}d;oY#OG)Onm zI}ZNrQ!+IJ@O)A{yg3su@v zk@#;zHC06QanGh%&Rj_2GBnw07`Y`le;V@3Z_RI%~0MJWOE zwbu}u)DV^NM87Pgfy=@NeOG$kKmcj~oLuUOKu0nrP+2Obb*;UM3Kr~;?jYO2Ry^=wuV8}jnnOy6U)fiAK_jE=#_6de}!T{oNXLJ z_NIgnyYi$r9Q)qI>NUH1c8%1EAs0kSio@V_nr;s@)|rzc(VToSt#F-Sk77< z;D%|>BN*=G|6Fsi`Zpc*6hEDBI3KS_%+w=&KQ)Lr0`sVAw4TadYRW#5 zj+aiMZD#*!u1nGVe)yN3VMyGx=_J#gQ$&KBxBD+QdcV zx)oM>>9*Gv$lt|2YR=ukyuJMj09T|83E}DY>!Q4{3tX(^*n3Is@Ks3k#_;9egwnI# zIXF@egb{PTDpuR@=dAA%_M=3|3Xo9_6*7$@aAV1MyCdSSw`@5x)10Ikg!)M^tPV5V z><-tt=bK1KZZ>@ffsUQTOdfcsDCav=8}Ix`a~^GsrI8b}42zSb6&HO-WCG%ahdh#2 zy31xh`5SNhV<7}~IiKHzf^_o=(|gCz6>ZJy22_DA78nhUQ<+r7C1r$XfrkQQzm}ee zvD89cNzDX#D)dLk)Hn6lQJ&pTMr!L6{h3f&Wn6v_Ee>J8hUG_Qrr--{dkACweYklf zM|q_p$smyP=mVN!tYfKEQ_p|&$mqfJocIU0M=9Z%kj213)o;A5{&s}KrON`jL#;iK zUa1ywV$qnR!jHG-hRQLf$Mnz&KR&M)mlcQiEiFur0oM$2UpgMkW$xm6WF`$DTrYll zok}3Hzk8(GnCo=3hq*_%pJi4_)gniha_rt%=o~U?#>1Z2e&bw6Q$3}T*xxNb1|fvm zK?=&`KaMf%%103Ky{^_bqH7=1yX30=MLho7ux|L^_iu`HG&LOJWK8topNBw>P`NZ$ zvBm+v{mxGh35RE<-z&60+e0ML4c%4|VEkUs#({axpr8R&jL_c|)U1r_O_x)^Jm8w?&7Z*dV{Yzh%;o zfJ3US15HT}UhUhpg$KHp_4*QTv|BQ;AXj~LCgPXYZ;srxnAwN8)*S9EnZY9S9;j0? zZy=SRd8tvy=_Viuf5ybwTc`8+O{Gw*gsbRxK^%=$F?jdps9W*mT~FhJd~`IpkF7|x zpHdG`vIqQYZ{fiMX>H*ZD5*6mRzYYiGE+gP&ZJrCU=%Oz&$)o?x==|<<4Ptv$mh9U zc~mmhuO;=T)LI&D1Xr37X9k+r|841)7nam&&(5zv6&rK#G~o%{e!lF+N)8N|REEZP zWGeOh!YE5FQO=%k00!gMO6A=lS#-n6b9h-s8xa;@Eve@Asu#={yo&y3A`HOtHdn*W&oJ?? z$PBH( z2wkoIeLz)4pvaqv<^;G6ByE&jTu4h9NTE1gz2Qg)C3F@LfkGsNvl{p|y{lym%whSv z(ZqW?o(d+w^k%r!19U`h@%KOK(JR91s_OT>;%27edvYGVbc-u0VSWodC^daZs5A?8 zzXRwH2c0_r_{aj(4s`7=BO^mu*X%|=g_M}IA~xGVS_6+4HpKoB-KD4SM;MX@2+^$& zh5>|_175&W@T`Y|3W@V>aq~5&zq{85Ypm~rvMzb79jyU6HP{%%sva22dbzz%CXOmt zV6X=V8sh%0^C%<@Lwpw@h3J4fWWJ~~czYn0VHC+{08}F6A0V_tg&ZrzYwJ8qL^dHUi-m5Tb*@%mT>(Abb9}@|fJY{SjIM(GTn;e=oJt3n#j5M^dpjB?CbA2uzf6 z*jDc<^D>^6o2$7{3up%VftZ7dNDOs@lM`t(0y(NqIB=o=DS=y+{{Y{C)DIud0fBG1 z1gLvk@R$I@3j)Li_yp40fY$Cy$snVDrB~7m5qs4n~i?#Qck)c6Pg zajb$jwk-eQQNSDk^D&h70L6XtCJ}hMN=W#2ZbC%8L{<(~F z{y^-{VQvGjT-18)Iy-wBeERayy%{SW8YPy8nWn#;grH(#W1DXKiNs!dJ%?q=@K+^0 zl?5V@?E1P!9!>qY^zZ{bz2uzRENdE%!1vk#U1 zGP>y}KR3o1D3sm?B}2J=YK3E}hS^fnInW24FD~U>@-9d9zU?w4*!LQLyZMeV96!DP z!v+WmkzBNsH`>ThI`?ldD}~VX2KuK#X70{8J@Y{q|J56pT>0hHr?b9;D6ivIhnh}7 z@~1I0r=oA)c52pi}{TBhPKW&=!$cs)dB$Mz8#`{~54^VHzQoqS9S~ zmWC`{4ziKn#g`t!b8{av`#;!UzA|RJ`+9BUA|usJh-!xx2D6!57h+nT?iPjLt2&~P zoq3Zot4dy3u5)3c>5KK6Yk$t+Vsc(pbtbEzZ074Dr<%^fThXao)=$&^KK(ZG^bbJk zhiZMW)pjRxG?N&%vGXU57+RG}mFGxYj3G@L5T0I5zv+4w=>OeX^j#Q??KXdTQ8A%e z0anW7RD=sgAv2n~a@}W4QMi6BnvbiJ7RuoN02fU^88vu7w)4}kW|7j#p^kPO4zt3q!LA^_6>!K zISCmTGeVkgI2P&3VoaA7WD7*;gUL%*wWi}E$YE~y6jK4i5P+wRjnaA`7-+YPT}4Wd z7)Ua8%RrOr6brQC6OE{T|Cs<0Ev#XR=EoyYmcQx}O&52gqaM6@L8PkRk8qv7C?+ z?ajGzt0uTo=7>3H?^*9wXU6kI%2~;$lIKmR?5^^09{!{Xz4y^_cYWL-{Ov>ayH5yQ z2N@L>=GRZlSpuSKA%Y@<-UdR+pQ0VKzR%6d6v`hK@-u4E z8;E$l;hkt}p07EuL|>}uAJC1Ae0<{RfO5NWErtT^YUF+x9cIpX)z5JX&p?chHb5KO zU`?cH^kgAwyp$gz7mP~0FW+h5%R>Q^2Zq3tANnGy~8SF96ljAG0E$9!~3?~%tYgHyNp?Js(tbO(NZx!1hb7x&~B)mVAm=JTe< z_WJ|K2clOn9zSy#zDckA(2=uGFPlI%1pqZ`5= zUK-!sq`X*0u&QnLP_=i%PDSnf*@*o)-)uYcS3zYa1%nnN{FR=utk>iM%RfdPXjPPHbO;#Kom(6ay7%!&MFZPIrxzT0a)!q$64kXnX*stJr0U;Fvp8 zBBL>RIv(#Is{g1>u{Jxwh%<93fgQ%gJ1hgVDFA)x4oyxK?&hg;2%W3GlV*4QSl2mG ztlrLEu08;oE?`8LQZDV}>V%3Hw(UW$P_aV$=VbCdgMKPu_ zRy+AEy>h2U1MsOvb2u|`5aHw4*oAHm(P=*s~jml6bSPf_sy;@rZpNX_sa<{`8A9qNc6sbD{ zes!;@5W5LkL2Z0eiww6RR{y32W1^cZ2rLXeExjWJ3S~W6`wr8xqmv9EOaO> z2~;2CFs;}pY?&{tNO!*zt*-5z)V~af)L<~Dh_k<7)c2qg`M5eupE43oPKHyxax~ph zx9MD#qv7vq7w17@Fp^k2+ysWoGJMjmGk-v#@3eTzcqT+ zWH_n9;{pZ`1a-0`r= zxF9v`4|jQde#nlE zmi66iCIi(!>?NJ8Ke-2Hyd-=n8C1MZ6bzuA7-7X`3gH@1uM(9p)u9{G`DywpUpD(B zQELE*6kbW*9p<=mk865qhd{Iujsj*upU~kJLk?5CMgo@V)`H1hNdy(QPy6VP9a-{{ zwXXwz2mq+w6@ak+lyA1EWiW{r#rkwT9dM@=Nu+oXrjK=&R3;4?bVDF+=L_ZYL`Wq#u`3lE6?U&OxLp-rK0j!jO3>Kt-FUnSt% z?)h0S7~3NfxIy~@#2Duv2RNVNCR|WPYK4!V4G7vRTWxzaR5t5&C6TE9em|+!^un`n zq0XvNmE3K&)nDnvk_+Veh1;Kp`$jr2mGA|uc)bqB)KIX0#Y>Pp7p>^%$nM~_m(oxR zK)-Yo+}=ylJ6w(P8+UN#wxl?wiRtKMJpKNm+tqiu6@cWsjje^I5gKVUCyUM-#f^=o=&MiQvopwQi&pmVt7lGHVA|A0XVmsh&x+-$yc z&Nd$it6#inbz6_QI%uMnmW(7w6;3vOlO^67ZG+LuK@Sz$IA&EJ5Cb00(xcaH*G-%s zgRZ^}@TCLyl^{S7ckGruzi)$9W>a!S&3iP)H{JIxHYD(~xwNA{N4v|3wZ}z(ja$4b zg9AQaC?3mVr=P#+2fzR$qoAHv8+WPw0`JwSDX`Tcb;scKmWyZ%^jCcHD`py^*2Qm=`M|kzO3=AU`{8+p=`-y0SN6L?2wG#7_QY1 zw;g3vJG2gf4Jr>U(9H6W_|JoijZ_nNE+HhlT_+XrYR%1jn)+&7^RCjd6;2(T0AQDZLhU(Y?Kt}Uk1m2Fa$mLZO@wks~)Y5w3~&YUB~ zPPo%9=s~fP`<7$ht!jBT6BzGGKU}H=;_TvOCl-L@nm#lPh3}=ARk}Xs&y$KanpU-A zEwov7eQdfC(*5g%Nd92koCXErB`|JrKd$CG;P)L;mv)7ma$@r_Y}vpsO4s)IIXG4R zQ(ZDN-JY-PEqJDUK*zZbspVeo7>fg5=jOBCLDOy7t4vd%t|o1JflYu%LLy%@)K}wb z2jnQVr7Fa06gqu@Z#DsdZ~zEh7ZC?u4p7#JpfU(L(M4#K478s;FY0tZ{C#JT;Epes z&AZXaUfZoVD3U9f1$L&_?K)N;F&|MFSsYMFz+7Fh6ZuwN<}>&8n(&AlTc)H+Fn=VC zVh6{Q)l(TIe8T0Q>0fbt3~OjAf29vJ3^+f!#}zF;oKVED)CA-WcD{J6>Rq0py0Ult z-a-o6$!UBE<4-^<4VMal$^|1%u#p56dO5${v}kT1qH5N`Ow}>(|CZ1HKD%bc7Ai6c_0V1ukAlm$Mc?DBvgd zoxDTpT2EzvaRq0AlEC=H?@1}aJ@c6~GgZ%e59J5C@8H-(1pXpkM;3gHHE$(^K)8pb z)*t2ByltyJtY@%cVjoyFJftOW0a<6JC1dGB{OaD@*;;lYQylZTqgkrT_(% zGFXhpiTjA50G9;WNV41Pd8C`&J$*YK8Zd4)hJFmMY59qfzFFYG)dpNIt{S~9OiPba zg1cHimqUPaTcJuKgzet%8o}WV6zj7whHfZRYNI6uE!B}kK(w~0GOOIR)_df{gFA#u zW0m!0QLH?!+(u(h;JbZjnw|K4Rzivxj*W!ouI?Z@dq^GtCCshUz^g05Rw|owA04N^ zo))-mjA~T!_Z?b-R{nE}67;#v%eq22r6K0aDV{_|ml z2|qM%Ep7jq3v++_C0AB?5cYpbDu*in`F-a!*XvwR+2U(+&zZ%{P`n~KC2=>*4|a|( zR_+1@b@jB8NbUbM$d{0gPk+0rFhZjk=;?&GWyajN%Fj>bbq}5jt0b!E4dI|di{Ocem0f`vjwW{?RrJ?etX!&%d3aw z)X2Tx+?#>zB;Qk_W|^LP;!Y$2+aAvA*5Q#l&NVsga{TIZo~p(?B_7>^ z-s3R}05a~5?_t=EkBG*OWxP0VKLoswTz8z=J_3Ox{f4F2n6rJ`-Df%y9&uLJ;ix#X z{PF5|YXEFJ=JU%^_ZX=F7lNG0l7}EaJ{}6O@TU(PJ1d~5=sf8dV@Oi{vVVijoQ}h4O z;)1u|JH(#Pe!2m_9ZYJ$gk)g@XrJKlJ(_PIp*#?6VgYDJgKV~uLUw~(#H)1)DZUiD zaCD6*I=_|~N|Y5YM6;7tjf<4OAG59wlcjv0cvbOG%lKCTsa|D`Yr9Zx1>f<(eatG^ zOgM908Q=dAcR}#vhENDcqqW|ezx3{)gyJ| zC#~NJ69!g89tY%~@V}eOJsdQtD-?nQ>8;t{hDs| zcy#;ok_*0o)e=iZP9#vGsI~4j`Rxs|xA|AdIT`)wA@-`^_v@}mT7dGD!Mad8Ea#us zhW)L^{(yy0%h02sidU47$BJ<-oDFG6O+b}8ySQ1QGW<@4XW-!7IOl5}t#Llx^A}Ro z48cLYK*PZ?h7#Ecy3bfjS7n4+A8rZ0iP*VNJ@Na5E3F@S^>tTwx3P$v&+2qH$Y^C7|Pl@q_IS#{)

&zpLpR9-%yP)^4Hd62r<+%AUyDzPe z_ccXy<0*nc(J!=2W#1m5O@aF8w~6nhtnx%EVexXe=m1+adOIEar4te>m()DS#i6@g(FOfQ3K`wrnKElgR*w>c(IXH~*?B6cxT$o_byU=<7% z+e%@`ROL%)kEBr*-v*gDP*|gBKXUQLgDILh8F{?jApl{HoOy2@9|sH``%{9y z60++6KhZZK4CN|%x+Ziyv2(66!N;X{1Z@R<&G;DZ8Z8a>tq3J4P99Fe~Y$|8c9I!@*%6wfYSX|0}5OqhJ9QCB$rlNXOwo;MDiG6yGXD8Y5YQ(4`g z2|r`jYPX(WHeS0%$hUvdh1kW8vQ`T~Jy=bHleM45jqh^NSPkWTZJqa8Pp%jyJ}uc?!2CMWe^9#pGgb8KL zd=hcwj!iZz#tDo*%hp+I=f@3u)S3ApZ#o0cq*+}zf3HdQrvm_du&+yuu_om4(sM4| zrn0{E^|7&v`UUE5X5{ME#XsbA&3LJr6XRix?;g}FZMY7NoqIDt|5T-meKtYQ?C_bq zh}n;h-EAkACvNK8R}1m8tb*lh_mwo5L6z<$hml()3t)-;W<>^g@zf^>+ADV6v1j5< zIWg<3{f#dD;UkCoBsTSMc=x!+Av-mTl>8}Gq`k<^a45UPQFt-Hc^@70th3g0l2aQf ztFW4_x+jwlZoqo{5w!|L8l4WOFNB8a*S}tA7^Ic5^jvoqKJJHY+<=Q_SHN-*} z>|=-;QYHQ2;9v&srYI=QIf8KDnJIX3BJJV_{%oIBxUNg8CAl&-)SJ1E(6)2BUXW=p zzrqxs$6Z|dF>lh5tu`Y!Nrry)Yd}rvbJGzfB&>(<(=%sa=e=2scynD`>s1dj(dXkbw|Qz z5j1q&Yk)Sm4x6*G>gwv#NH;Q&b=$fnRbpiZO0d0%UNh3YbiRR#u!)M$=jlNln{u8K zUXW%z|59tCNxaLTNRQY>Qn%wPJ7JHK{^*J6K9d#SC2>2pKa^qvKhMwQQDu9x?r8H1 z>z{U8lq0!XDuf_hN{?j@$Qnf0GsM zrp-rH%ipPM#O@J=ka2`i1<92hWiT91v10w63ew0hbavNzZv z^|+?_gdOQ{$!xVL+$0Uj{V27>-_E&=mstn`LNUjq&Ay(z+E#V+6kFqHPv-SGlGy2u zTct``q6lQNV~Ybd-86_$+8&S zmmF~KDl=jFuwfc-6WYPQ%YS|o1kMo2r1!lrI>4NUG^8>31bdn|uaRtnT>t zq6LXuIoleOuJsmIr#?NNT5^_ zPT*#d1r4>cHuX1slQajf01omn!)C_7F~;U#al&wMyl`>lpSR^apw&cGFskD>XM8O&r>lxX9}B{wbZCrshL3zor3 z8^diKo+uzYlFwFqn~xfhjpNZW>;l(p`4xol$?9r@1-IRuSl%Z8hpPb{yhKB_LRsU&7!`B)V|BqVGUGYPRndNJ#2Iv?(v%s zghsO~Cy<{tNB9Ld2p1ZE3~Vk*6&SIndYH!6`!Ia&dQ0z*&6gHJZ?x40*(5I0Npj!7 zd&z_scopw8cKh(YpZ&S7s^?BihRlx^ztBGCDQ(GVnjk2P_#Dcc#6(u<$}@DH z9LBR7IOJMHT5oLv2Vw(1GqBQh3H1!msHTvUMOfXM_6rpeQI88hqC|HsmitdiP-h<{ z3iK^YrSygCXHzw0U=X@t9yHIyed0(=F=`0K)@;&uE+Jxh{wyr*#~eS_bfi6Qy3F~P zOdA2|Q7s|aCthFk9(@>Ie&RE4p)Fe=*YarNb?@(fYudVNj{~mWraWho{jS6Y?VV+uzJ99I_bfmn@VI;5SeE5EUI?(kqRna`L4GeCWC(5Oe3L3+; zyDWC$X?&k*youan6(N`^0=i;6&bo3Ko1&@5f>(jx+^FXon$|XKkj$37O#ZdE zYcY5BTN!a;0yob?i?GL{kG^;q?J1v$8n_%ed>jgSSj!2s>7#$jeU^4QTHUeGYqA>Z z6eFt131WHT%v=9jV8OwQ^)n;^z0X@-5%^!N{8jxYSnUmFM>|iN2rIp8oLqVOs37-? zz%pWFjf^nC8kD$OsSFCrplr!|XVoj?4$b5udtGYYj#Ei~- z(LQx|c7u25_;)#tS7FbKkM4ZxUG2V|kvKlwgpxd}+R8%eRAa@Lg$37olFt9fmttay z=OnHmp~8{x4#z0}&F z+{xF*x8(c{N(nn}N4On7MI~NbgHDD#6HKI%DeXaBexy5u?sMP9+DjJIq9ek7(rtgh z3X^Ag;fQrrU|?DOdgv0)&5xnhTCoYq8xA;R0j+k19?6){dR3<4rCdg;K;O$*C9)SY zc$~!Uz3{obV@Ujy7agm`f73{%4Fs2tJ9Tv5hQJ5o5elnO1iTO8cWB@N?R6%1#4X>v zXT-V;U*^WUtbtS!e){>Ur48(+N^XJBF8D?sn2U~odeA$$;Zd(29TN%>eGDzoifnbD zS>nKvU}8#t+!mW9D{F+qfq!Ru58J`Wo*a!UH@z2dVJj$Y$in{U3!zuxWh@IqZyt<) z?h<39)b!JsHkxvbdvO!uol$Zp4?4MBxq|rb&*|Qq+-fGGkmkAM&2t(2YVO`5^o19d zVGqQ33*Cg-TDVcrmYg(`8o4`DI(ZXH0e%{3OpOYGA3q>OE<&mnYJ_6`fB55!dpr0Y zPnj@L_Eoy)^~vBbs?|#7Tvh~`P- z17X>B3g>ETYunn|eAC%N^y#H`9_lG7p0BQ{F)G(4s}qW zr=XC`Q0&Z`(ZWc?d?V)%_Is=zyyh1*@}kZzM^OLQZz~M^Fi^7mrvLW^zy0S6TBra5 z;|89pM%>gFYdLt%@7;f9a>mTRM>28u%lVgoN2eI`e;JNQC+H>^%;mlLij9NgMLOFs zVAkVaq+bcRzW74R)~`=)r+xlR2~u|l-2~{6VF;w!V(o&qj*jNO`{G35tz<)4<>eHJ zl@GWd!QdcGpYQKyb)Fxquxr(God|%2o}lwb^dQpm^76X0DcwO})PEI>-6>yT8=P*% zI6ybbNDjRCj*nr}d z^=aATx}%BpAAnoTgWD4H?Ys_L$H~{W>(<-hKF87s#qe;y{_G|_J^fY_21(f#ffZp-1+UaN76}-BXQS~49k%D;=9I1sl$0LpIjAM1_nz1 zub1JBo)sLNDE3?%)dob#0Y1>87qW#iiHeFcF>OJMRQ=M@(&qL3JR784X>LwV?841> zPdeft)LX#ggB3oB!_9xK`<&H`f|17^Oo=c$K_;f&w?)0?AL{E3Y__5H5i(%;=;#+* zt4{sVqn4AxqUWnt4>UFTClYwjPfSg}gKoL2PVu5`1;SvwvAeswb=d8rPvpD87_TUT ztyJ~{mPhZ@RQTwqwsU;v)2818c@6*~pc;T8_%<#s1S|@2Z7i*<(t6E%#>ewNSAhjq z+R*X+qgnAnup+O^1bXCXt z2L`^*KbrwMvt`0&dvJNkP5(kJI${&x^ip5C7`@b z8PBU#?Zoc8c$7V~{4Or;(vXWWqw-)-iF?YxxA|vZmv^V^ch~x^d`L ztaW3!%#0-Z#^V<--S(7UfFm&hcwUi0YjKZGk<-;4C1VtG`q?Om*m@@?!vHjA^>}2S z7#fQI>C>l%C8t^FzS0QxT_N!Gm_5oL=)1b|BdYiQA+XitVexQgYuO~{?&N@`qA2@L zJ%<=hy$5ItO3KC=`{quVxRua4SvTQ(^sQ6Z9y6pl+bMjj^pX-%IM`}tQ&CbfUBEL0 zU-80|X0htYqcaPee2weZsfXZul)yU9*R8sUY!6Vv*i4u@4tySA2)&ttnr09=R%+i8 z`~!d)<9M&4K0qZ~8qEG-HN#Hc$uU1a&vxTRGc2Y73(gpV&dyF45frLsB5Y>Hh)&#F z*QT$h$5(;*1@sEZvq5$?L++fgw4)IRynbIdg_!AS}y`;UxZ_Gr(4t`J&&{I(&L9Wo4q#(b1ltKhwPnw9E0K zQHpB4*;&tP#T`918M3MgTR~_Yn<(HQg=)KA^o5C4CGjoLS%VdvsKNC@3Bido%gY}D zH<*8kn;ZHRW%Ka!w?k7hQ)oo$(9{4X8TTY5{k%?=4Py58T)iO?U$AXN z0P$Zjs1*E2^1umH&U?RR%7N__ZL!T5pP>D;Z=$%5zP65zDY${BvxRaw|AElt4EVlPo?5jf8wVR2%Gc1ANe2x9()s z?w*E5G`y($@n&mgQ4yD|U{X?2smrSNtvIFk2?^Jyjwbh+VZoMLSX)PeQ;9SX&%p(T zd(E}ySKVQ!-CYZdTqs<8Z*PYdoix11A;os@JDX8$r)hEN!NJT~dq^ad32CtU|C1T~ zTUx=E3EpF*&{a|^UDH32aCLtMikR-)A%o393tZ2HgoOv@TR4Ic&l9kcH7wUIvFKwthw0aBeVMdZ zxd+)`g0plC3>ZPV8xCCPOJHat067SFgTJ)%nxkF({rg4xd?SqL-wh5A$3G`8&ws+U z6#^NosEx9e6T)zjEj;+nunsX$NBiqRz2-6xACkeXH{oMJyI5TDv%_w(swx?op%%z9 z9QEOLQfU{ES|s#S#YDlYVL*NIymvh#>U z+E*Zb99M4h-xU5ja_EHR9&boD8m!MW5 z{Nu-up3%|JurOjmLc+_`gvO9rwRLtPCh+!PYzZrpL0MV(pv$$+AJ_vQ+lkI$x&de3 z;m?i*sJKbE>JFF?KjG!GV78?a$nqSM2P|8_=WG++iw5?_%*@P#fg}*es8RAX3d&E=8u`P)>(%GPwZ#!JFe@xul8t+oEFx5s&?@!=T@0fX4&(eo}N2*-0xJZ_$Ew91#*R*41s@Azi8yU z;h~=bRCr_T7Hm1jpQBhI33X)-=@OMdi!T|WQA`2OwJp4K7=tCTK z__HR_7wj>5p&*n0FFn1P2fK3VQcZf{VDA;R;>D{8(xHt4mCV)E)s*-+Lq02N)?y!T zyh}+@pu{iRU2aStcuqRqsb{aGrS;VG6+5xV^v4gc=R}xy+_sj-n+lppr_dke<>jr# zk~Ir#dTA91reUxDh37309DThgabN2J_l ztHz?_B0X3B z4O{oe$NNZ(z7q*r#;+;e+dF-Q_6@((9;7pMq<9T?f3$!rL~!FwDZA5l2u$8_N#S@lBY z!C)$xho7Hpg6AIwm+5vASn+4EmA#>Z{VwyK1R3wedM5kfmF)>6~x*O%2KQ}csas2%cR(c;+8{d83*-aAobGC2wVUtBr zkB!}`^#Lq_i-+e+p5-syRP(0HoSb8oyUV15z8eFbc9+6+^6oxq%#m6sJ5EAE;;}K{ zzBK5);OUcb^~09}+dhY-I=ah^^CdI<|C~CdsxbUc^%b3+QjZNW=;G--xr3)3|O5wD{dvkm` zSy-a~ez9p~(`ymZy`7B)Qh~Anb-BIvnXa&i2qkT8T2oWgtUE2NN)CT!GyV6{8qYR7 z4rQ`0)6^9;uENOZ1?961Ei5=8rGjAP*IMm5+EOmJrd+0@k5GO@FN9mUzdhp_L2^-5 zwHlHqDl1EHb8BlPDV)FNwTQKTr}s>H;m<;QBlzWsbLXfb%Dzk_`t!>eYHL5N+?%t% zcb|(=#hu@3lsW@kp7YK7#4Pq(#YEr(U+p zlos~gCGQKJk;H6AetD|_uigx5hmF*(ObMN9jT$*u_J)vH&A2@t~WAo=Vv=?q(Rv*mQG( zOn6#m1tSg)PROH2wO=UY$kIAKdF(^>K7zEM9~l`DWQ?GfbVnd8nbouZ^AA3}=VVXr>HV!1|1+IJude8nc?gxb&JdOxM%C6TN^egl3%GM3uk%+L>o_o%vi&a^#M6V(@NcyD7!rOZf%Xqb? zby?f|v0NA|FWMXphuwV=7pHIk_{@YI*&8$cktZA~4pS*HH7zX^OG`^0@S}c$(NOjx z)Xy4@C}~{m;?=9skw%d%jRW>~2TEL78%}vK4tdXZ3;l?bIR50x6WB)dX<7Yu9W#3| zuF96i7=Z=|cnYj&we51s8jGzebifxk4MW#vy3D$>OyCI~2YVYh7@PmD5a*Sb0ja56 zlWSh9Q@I)6bbTD7=5D$+y9eqoW_9z|?u4IZ6t190Z48M`4Z8BKqIr-}Y#gQXN z7W?cgMCfH{X%J1^86$R#}YKn(MYLzc}q*~{q@31 z&jC^Uy$QJkg?}1)Eewb8WK?Aslf7oMFj|$#QW+kiK?qbm8=y_OMeT0w=EwH<8f$J zq8mwxF|2|5kOfety}f<-)tv;(>v|MyvX6K&%Z}j@l2r+}NaI2Axc1>HcYR8?jp&b; zLU@&X>rC?%J9g;95>c?$T4$C&gd$mVrBk=mjql-6maxgmNw1CK-1^x*R5ONrH(21T zNHM@NBpGGPmrxz@n22|GfUQYRO(hm6Up;15x#xyZNt-jOMF_pP5BU;PP&B|{ECTc# z`SD6vr`Rc_YmSef|6!e}f}5MDq5q!i^XO>P(b~`mua={LgRlSq@|-f2vPw!yFC|^i zAixGYNQJ@-0#J6+MY7*-XHISK56w;ed$4d?;XBQ>kS~kfW>Ihb5B9Z&hkj-+_F8Aw z0nl5lJlLbiEMI@UIylatHZi0D1vt5$bRV*aUdoL(PnQpE1FG6kK{jEZmmv5&I}kp4 zdYQi(qG}0_Z8Y&<_q5l>JUQ0pk24HNxd;N*5o*kEM(O338>L1Wv|9dK0r|-A;G|NGouzlH*9ot)T@OJ)he^` z?=QM5e5E2;WqMQDwWyVT|Ni~PeyAeCt9&IJqK2A|t`y&O-e-m=KF8O3EzoaT|gM(B(?+z^dkDjix;5~mZm@}pnxc8QrD$r zlw1N#VPD>N^ypFAiRSn|W2QI*-?fgUs~?W5C(82iNx9F*(bLm&89IGC)t1xVew`{{ zbHV?hwA$9|*C2#Oj5)w*N}P}bXmjt(N$L2h^L5j8bac4*gkN1Ty?8Oi1GWNSThZ82 zAyHB7A1y66ZC0QZQ3eGCrF5;lw=lbOq;1PdNhe$H zo;%}rJkob(sez5hkS<{Jhj0s*q4(l&^(cT6n#Q=wn-;mZX1g*I#i5SGxTRe`v$Qz! zC2YJQij58@1cE2SbPIq??YnpXv|8k5!fFO0pA%O@x~0eeV8=)^MT6%-RK zB|0bpl@&t6|!8MP1#!khFig zC-=kZ4lyw?WunI@$<)hUooAeC$ASU_Ym<_alw|}21X{+$PKw#}i^J}J=gGX-c!l$s z_}!oELTAogIv3ltW(QnyqWk@>xYgNLwJ%@NFO|$>Jd5^p=0)^zZh1@GW1GC#`WaWr zfvph)im9>jo5qPV2k{+UgqkjUvYGnDZF4i>Nqfv>^7@5#@r`El74FboXiHtDl5|Aj zee1Rcm;Agp=J{S<;k4X>GI0Wzl7dxwvS47IS2yn>KD*yq$4&kyiS=(#artp6<@Q#u zO$p`p@J2F^5;t}Z|YLg=<;du_&`?*b_ zl<4+>2T?LJf8N}a{CfJ5L{6JUE(4R8oy~PUmYy#A$~{`q*rst;Z0CjtfY;Wvn*w!r zQ0`$GJ`aJ*omW;?epb&bYB6**PF%BQyRK)>oI&&u!TlsI z(}Vpz!@>66ozjK>%>lLlZmOHk$WzS7@~P)?@T1@7$t4T2rO zCB&y~n&^i#dJavlT)TvYCb{hqKcGp~7B}){`Wh!v0raRJv0JVPHP;bsw z@60d=hfJ#z7fsg=-&&bK-37>Uc*C5x_uyJR&{QnEZuBg3%87XoDzxj@9W7Qb2T%qtkV=ap8|`B>Vyb6m@lVn;@1@ zGBAAHES)RpgABUj(I;x}x-d9kek+PqrtH##A^(FtfWAaPiURN7$44+hr_jzIw;(wu zN9%Rj*yFgk&zl?Ho}E4sb`oIWe9i)N%QJI@^-i*Hh=_>37z-A;yd@wa0zi{mJ;y*s z7*o9pNS(iB4;nWDTh+#b?7X~Wz*~^aFu+^kH1s4~WXP3l9EQU&Uc5&E+gj(mEwkBRad2$a4Ie<#rJX#5yG1HaV@FCGJ42rwxv`i-KrMmPIK5D3S8h99g=1{v(n4_a3 z|Fi74N`VO9bl9*M_U~I8ZOjel)hkcfi#MxJTqDZn9=fA$J6K@L#Hscg-{0T={{8#x zXU}RKu`46N;wx7oYafd>hz0-ppe|M<*Y@jID}+Pp_3xitnjM3rpsq4K1;zs%Y6$6g zj5jvUNl7vNdariD!9h?vU6&wVcW%wOr2!&X)4*WBcq5Z5Y!eV92$6Czp(mg@rC%e; zf=m7 z;d?}jfagqro@{~`wFDx82}mV?N!`D>`~c-9R?J=*R4gFU6+81%`tAd+ZJ}M+`$h-b zH*LDJs^^9voXYL`9#GQIJOGJn7!;r{u!bzp6^kpc&Zg95hQ!?|?XeLh4h(Re=`0?w zkHl$<7@rTGn`+>fREu16^KSOrTf2!MHwYLDWh+Nfev&hZ4!@7JbJ}4{u-G4P_(J~E zD!=W;Fgh(*9ykBB`AedWCj%P+%Mz`3i?yOY$Ef!3 z#x_0N-`nxtoky|XwvJw%C!?rlhU~Ig-^}pTiq)i)alWo2JlF)3Dv#OhhQ%haA*4#S z)#5bR`__fgghWK#*zGtC#O*le6^+|&OgScB2!ABVpmTDT;{LL=Hct1kDLp%LyvaUY zBJ#n!--UzaCyZaT({LrHta>b|(K z(EvLn2xRVMlZ8I$k0|)E97fJt_WIh`@Xl8r`1QkfeQj#0dwk*oiV)AZIXVUg5;-}! zC|iw>*ZFVG4qBy_r)j6x#7Q_)=gOz0r41ZqPY|)DP4L^c{A^gx*xK64#m84iF4q6X zgAKYymTtP?i@S>!MqXn;2KgJIt-Sq8+~scEHs$hC)>rbqdg4(yEZ_xfpq|Pm_$;dy zx`s0L9hH--B)qJF*dj<$Q1!n{=G}l02PL!$+AMI|lyQ(c9Fq%-|V>i|iLT z!$(M)1*PQX=arQfIqx`C>)f8lPoE}rCq^cHh+I%M>;0tl5s4p&H)mFCpGolF_mtk> z9P2Lg6ozEJ53Fny@}#OZ^!UtP1q~gY+0Oc$+NZG|{hfjnh!i6F^zC$_@%n5}o72SG zV}Kj%Ru@A->(0z&27rGkjX=PTfGp;sH`BJY7AyH?4_XTUsaH@_n$~oi86{~&*U#gm zHu^}gHO32Hi{$mZKu{u+U;S&NnA>(A_*TmAK4l z378)xyb~d@(0Q7J0}tAx)6^8kZs0&mL!&y7-qF#4HWoJeUIdevsAsqQwcF9Iy0CXQEiBMhot`;vzQ|dNX6Uid=&K!^q>Mf6- zKmTX$9e}F36&Fbsz#n*;)F#*7r%^XHMQPx=Y>dR~LrZP)Ezy9nW=cw-N!;C+eufTdD`L9^~bnv+2$I zmXfvzyjt9MJI}NS_^l8y7{s+fFkXDg?dG@lFz0ass1{sj=K#H-ya2r@CA%C#$7zt6 zREDK;`d6{@ozxDi7_IA2JtIelp!Xu#WwBL-?F0wMg{7CfD;w>E>O&Ln^Lhq0GTyy= z*CXJ-=rrKkHG+a02<+VQ%Vb+98%l0&1t&@MuU!j5!zqwi+Z;&T8J!2yTOgytGb{IX zmo`8oCdC$E5;F>XAzGFwts@L@wF%S}5H3zBM=*Azc1ao;`79CGi0TCmRMLhMASw>+ zNWWwS$9R8t>*wrXITIApDiAxKK<^uGj7hfc%1|qr-fWQDzjv^=;E!tEpO!?V>H92y zJAF}2tqvMs%H%#omCBVXWXe&j5uk#B`brHrR`k7E?8B-mc_8qY3#Ayv9oRv<&vG17 zhBxX3j*P@Aj&KiOC5Vx&=duT{^9W7=ztF zi3v2cA|S2CXJ0MCY=%QxnmI~#J2fwI43h=D@=AjAts{pL8#OJhY0Z6-ix)4-dwEF? zdd={WF`m1qnN!8Ix4rfS3MGxXF*ZE)A<=HJ*r3#{4xI!5mP_UlxOjL^UcU~5V_^g( zM2yvMb3{4+L;jUmQF2twGKxlz^t=30Lp2-?PSW+nkTM!EsO{k)t_|`N_qF%zz(SWc zd-JVRmQtF@2=QQc5G>*R$N2ZxC!4_2vn`q!cUKY*o}bMbELa2GtQsDGA{0~*hT`I4 zByT+ip06fbJRYsLI38m(3Uj48;L}20t9NzMwV9>d$Uv1!xxQipy_H_r;?cSJjO?A{ z;&oeJueIq1sK7#~*MrbZMNNIbBkiWx^vP0Cs9uUYo+Kn^M8k_XY0qP9ew!zFX-N$| zMhNOkA_Mvzar9w|127c{Yf;k6A(z#lua|nc;_d*x2?q&dYMvND0@y9ms(sIIx#s}L zdBB_t1sto4moap8afe|{7OEO;`L%GdhVu<*M~AI zd`Bjq6vMDX0|tBmT~5HT^46_e5xtocV^36At3jW0*jwuwgM!lliioC;4iY_%0)=EH zJjxsbxQYp-zg_v7_Uu3@ovNy;PQKL(@D>bte$JjSQ14gsalXCtkb*4|2&=B{K7=$2 z5+$LnM%L7vhY7^|5z(%Rxxyi3AQIl2)N15NA7d17t z2N`uR83S(F)}L5Y=r~H{h60iFLg$fiBJMJ&u>>0OT?fV-X9jwZy8zvW`)@TG)dEpR z>Jf+XBTE0x5u!RtSaXHPw^K18FcC^J%%p>saz=LfD~BoYYp$?$?tOH8a1`=Ff`S^W z8yj>)N13@QfESY&s8TCA4psP$LK4)0IMCYCqFx3gk2=uYc{(kxFuZ)&%M-SKjJI5M^ehAV&qFAK6>wNziiFd-ChRxv#d z&8cY@$!w^bqcR))92Vy0o&!fU^VC-orQ9<%A!EY^O5N$!yvkwHWE^vhIC7ac;d>}_ zHC<*%gvo^kf$g20@N%!UW3atEta5((x*vqhjpK~&z{oSHva+&qCXz|)s%BWtH3oY3 z7T2=qe&`BZbHRq?UZDVZvisJUchY4+sj3A11vmjsBa1n%+g$JXGP8;v(ijb4gprh( zm`KmU!p9HtTnc`unC(EGoBW7|7bQ+fFS zbQpuKT?V7D$`RLZ!FAzu;ee-)U$}5VDFQ~Eb#;$CUaUwE$c1AKnA#QHf!@Yq*{xtyzxpm=sWlR7ytbgHt0Q~TiOnazr8=Dr7c0kj)H9G{4p}|`SbfQ^-6ET_dg0` zN?JX--EMK`3f*f#P%f9CovA^1-(Rry}OF5X}{rZ}xrv#kg zjKS%%XO{yz$XD+|Q#N&R$wNsCJ%0(5o#W0TkdUZ9*0nJ)r5!-`w2@xkN)CN^ zs1Y5dS7Z1M`a5NO1xyCaiQP9&xa%oV1e3*uXoP3B)%}%Ka#?A6q-ZQ((hVITd#D`}gmZ zbaWF=91kM{afUr%j;H@@f$s{Kw$gcE;tm##^npj()!3r6xSi&+SFd{Bd6ONdqH29` z69lN*+FIqIv-vV6m_$Ycx*nfJV!;9FPYo(=<{b@kgy8euB9?;f#CuaS;_c}{MgZFy=s__ zrslnSctl9SYsl|1>>J*O;Up4;mS6;B0>>-vz0NxiQfWWbjLqq^On&+B(2&%8*t~b| z-=9y{Mn(Y1_{dwyqF1SvfUv??@`Q*84V2e~th$7mUv{`v0A`H8Kj${gtOO1K0NMnA zCKmAf_iZ#OMU7wYQ>dciZ?hj3!ZxBz$VN3W(be1Z*2450TT!V!$}a-lWFdJY02|raa(xAD#M7Hr$y6i z0?;m@uiz6AnSt$zHPP(sD-B)UPn#SlAgsa9;{iod8XyPwaj4ek2f{%S0e(-uG3cGy zFaeVVd;lG7Yzuf03%1{`smnY7AR#g>G1d^(Fa(2PZF?e-OgCY|tn6ssTYZPVH_LAW{}Q=)>32vh*X%)9N*UutS}Q*X4t z?p336fJ8mYEFJ)$2g9_kU2`0+!nu9>HkNf~!J;LBFI~=e+ryoOS?_388+-UV1V@BxJz>6JjaBzseQrmii zyz>(jb1((Hy&S{u0ptSstFDu~21kA@<^YX>UfM&Dkb;#AgWbb{A0B}ugM;PdjEMIgbNbuq?=DT~o3JW_@2I8nrg-`Ky zJa-_qFyX+H-Cevu#wN>*EyC1pIH!?+r6?XzM3_nUa@2C~&%S zePOE1C~80W2n_m)K6>=fhybpq6s6wtYQOC2ktuOv*dd2ank{5Mhoq$LYjIo*VTtuQ>+5=PwnG&xfMDv8I}(J2w=nRysID%TX{)tj zMugf3(nmLto+TVOze z?B|MYp&F`yh=Vj>bX1^^R|B;l_&ulDXpAhs?S$pPU9);@ih!$W0DXdWm;lElCMRF> zVv3Skr_agF74lxUfkumX4TNdVb-F@siytrVA*B*jqo8lMYXBB4{(h!D3jQUlWzmmY zB&NRC?tC-^AsRLehGwe4%>CP2SG{k=Z)$MVuZ7r*cT!S`7`nQOK#c%v)M1TnvUC-V zB}d2sQg#WM|MFv<4X1Z(q_(%1j1M>D%O!R72Cxg>2L-?S_Sq4{TfmYCrk?kmc8vLg zS8>4$GX3WI8JcJTBV?E~Tb*o0o-P=Ah5#NZbo-V1KnM?gaD`KxoM$YKU2CW&`+s1C zZZ}0)kA{s+6$6lI9RK|DuBWh1^U!{sv=SX1O{hTWFkE%7)9#4pz5i;qP9@jPx1!nJ zSfKc854`gF90>?%S}`*qM@9jbfk^>!qbR7Uk+XXKrn>*&0Sqc}5VSY-M)Kl)lH>2@ z2H-5X1O#GO3wvxl{=B*agc}313Ume&2!pmU@Eu?Q)j>oTDDfY$$r)zvArTmqCS)rC zr4h>8y9Ow%AP<<-HZ*)08e-#6iL8z0)1z)Ns_>BjpBp}iy86ydB3xWtci+qO2rU65 zR8-7Y)Kq*?*Lx<@w*Auy;=r3TKyVKIPnQMC?^|aS6PlZwZ-TlClOk*wki0TjpbG2; z!jR~SA{OwWBk(?BAU8VMrUalbv+BF`m?NP>Nr?c>U^J7JO*ZBSkU$adK8Wl+$mWa% zhz)w+WtJ@;8T3E!C1aJQXY*a9LQx3QpJYg!?tE)HFn}USGYRY)Kc`%@yv3l(ba(5( zRFwfl&>Ey|15`zL0t*eZ{Bp;H4|)XHIrfTKB-h=UWx@y)*&H`nc!sv z-vD^|K$VtHDJJx#O}Bqh!0c&pcGqQa+#G>rC|D<<*+Uu7mUaVkswv2=U|zj<$$VjQ zrX!6G90OUdGul`{hZWMI_7@KJDS#&7!BIVIVD%;gw;+@nq!=PgiTp5LOz1 zfJGcYJ7i8mzSNA$eJ@_U0x}p?w~ax&dl4vyg+xXw!)!RkAMnNf;9w4*0hq(;q$U}& zxWziW>V7m@3?k-1>|R59Fg%}R|J0{z@97^ zgFXUM?*;S1KICP`9@p>QN{?W=AORu)C}z;aOu-4s+BZRL$KnTyrE>XE?rhSRs73UE zsSzCwAZH>tIfRrS!*CpmotULJG(BNZ@L-M?1da=&@q55*&jIFP?2?j<*y2}?sA15f zYQt!F9AFZ(JH~cU1t+%%um~4}&@(>Ah(=4u6ZP(0ZCcknOo@?=0FAkfeAj58dS_dA z@gw^SV@P`g z_!CuBB(Cq;al^23A7J4lkPpW|_mcuAb|`Xd0Blr-GJs)p1};=6eNaUKoLY{`- zB-Mo%v*M(i(k`pF6ypf4DB2qM3M+lI9pfF|K5QBPo7**WoLGN}D-TlB;LTy0XZ72}H0^^0%U#c=%q;v~PHBaIF*Rf;5t`+1gJ^8U@ z#%3w+-VMW=f?$dUI3WUNlW5`xJ)jDot{;*!J&d)lU_gZ({@ZhA?lh3b z5)J$(51d|q&dZ~QorH1>Hxo3h#U=uGd_Ks$iKGxQ)sOnBZAVT;^~7BgpwnFy26XA` z{U%ze)U`?mQ#WFeJroKKZ z9%j(K_}b5+of}HBoFhCJ^RJu`;Wvo<m)#qI08Lu>6kWyJa{Y>duVEC7 z4mIfd5zHk#_R3(mll1PL;&$VYA2!w6hgIPb;`~A&8=>nm=#C0hcRUO%Wg$t#5z0Y{ ze%mB4Pjm20Fw6`F1>|SbDOiV|gdl%dZ~-bInn?gDna`*)VDU;Nb@;Mn)La=!8D!`g?e? z_xfx#h{0#}yg|Ff0?_aXFx=Pg-;sUHS|kcS=hr*LV7p8o2r2mVe>aXN-{c}}5h8i^ z|Lx0++o_CctkJM9QjJ-$GO`TjIZ+gB`X@UI=J+|A98J&&@R5>KA(-LG!B=t~yp z)@3SzAhxRDCnwR(|kaj}sFPGuTQ3{)h4qV5OcCg4cF^CjXgIDf@-q1@!jh@bqNr$S#vRN5Yffg1T8fk0hwan7 z7`%YH53Irg#-OHPhK1R_R{6~Ip?pT##_xs$TCC>fshfKhk}j2g!{z}V1`$z2Un=5-J9zL@eUef*hQX{6F7iF@JOIR} z0V95(4=2GlzU>XSMD$YjF5&)-5z}5ZLI8+MluE5*V{p~z=B_vJ6u!PUEAK!JBt}W` z$n6=9jk<@x;fbq4ls!)-?XLa1f5L zUrPeg)B71w(A%RB&%aLGyRsL7D#+_V^a%XudniYuzhFOAEdSjqVpv(qpMNOPvreE7 z@zC`!mC?EsmW2X7Bke%3DFWwBloly39?Cnupu-o#VRW7QhcXfeu3slv)Wb{Wr+DL# zrVn7~rKn*8F6kYnCM{bFZq9WPSaM$tBqs@$H(e6-{(Ft%;pg%>+>Wf6dyX#Y+OdCk zVZ{VK8oolnRkH(+Pka>vhk6HNoYYQ2)i$G8s6Y*>sFfC;XQ7?09ewebR6>Z z`hB?@%zxJ$0>5*$!tC`w8svxCqI z@WXOZLa)H48mwP$;G!Zp2Y8Jt%If;2Ui1<_{#&0&{%4}A15g5O2;FrXh3wz#8`^(} zE}VkN(tae`OZ^Pq7gcstgdY8mL?7~Akoo8I=`py$hJ&HoHt6P!q4%5!cqEEbUiWa# z;&P(1`#H@}h3M|iPR3fDiADKA$tO3xb#X~xRKHZYa4zW%xab0)zsXq z3)gCbxOn@j1UBs9<_RDj zE$~x^Z~#c|fWoOC7xQ&;2A4<%?Nu{51_Il!pS*`6uK{z0SA%N1|yQw$(7~uMl zVym;|F?aVZbd?B%_MvxfM#Pc)#+`?0^rwB=pbD84u3sI8i{zUy0*m~3?ZZhCksIGf zUC%`d1+@J`8NTrRu+kJ{!V!WXgsvQ7#%t3ZMZkZT0DqaGvFH8Ak(auZ>#-x`nFvkD zzJmu##vg@SL|6c*TBFc+h%itC^F7|08;z&prCM^}urH9nW7`Yzya*j&=!m8h$OQ$K zAQSMiU;%Kl>~OR4g~vi zMIKcy64>}zke$ItL=-a)+PyAMUVWiB=e_oBMV-&0A9=}OD_ghju3?neXKfw;2299+ zg`rE<$i52*`GsERrMP+wcU?=cf)R55iNlf>lgY?V-#hI6=oQJJ zCcTJ$t!+nwa+?m;5NAf~kWb-$2)GV=Eq4RfD|gbUf`<9Zd5n6Mv`MY;~UD`aPv(YGcCu<=kJYTsK#e}h2`0xc5mU+_e$z$FYY zr`RPr|56h>At%RXR{!W8eD%Y}kJUhp_3Y`gzTFP|cKhkRfv#?^wEY_#!gNMjYw|O` zC-8{7g#51@0rmsie-f{o8bJy)`9O6a=3-wUSRbI;4R;A*{&W0|2y%Fy8mmSq<;X-4 zOB@A$z`Vo1m4yFn0310;vtPe`)8uXW_D$i+l}CLO=*lvhY9Szwi^0Gp3N$w~!}8c& zYIv(vTwniRb)y0uO0J1ig0FuW%TZWb>aQt5u(W|4S5?;{wAETez$4~~9>K8&!Cj`KE*^Gvsc37XirKqfI3Xy~i z{kk)J7x6#n^578iVQ)V7wlOwYQvOFiaANpqGJ@{K+p+cKn1_!JL7NDt6R3yq6_9Ui zRu5@q#iFloSzur9qseJs8-G1ka3_fve@6r35*$*2ZuAGJsphibFr}O~rla4pjq^r| zj085MmlkTl)%#rLShz3yVb!o@1K4@0<jn{m!;Wl5j?92=H2)xgW)vv1l^Yb?gHMgiwyd<%)t?MkJSQn>$0#F5YUs z@IAfaLrC5$OBi5#p9Al!=}&l3mkLB-xDRgjRZepeT(h(r_#3D@@N4mGQQXzEIb6Fr zvNxrwRdM)-kN^>>=6lhV9C(vK2LJg>8;)HTbK}26X(AN1#pyN%zhGvldf$$d*P|Hs zmHUEfN=i?!68b1~@KGiv4cEFve2;zo*6%c{%2V??=vGrVlEtjj=&=H-NHXJVocCbE zUzbY2Q`#S*(+~XBuY0h}T15Bm*m?MG#tjVEeq`8 z$)Cm)SmP%qxhFvi;4q>31~1|m+1#Na$AY~nVz5|FplHTLJpn#%0hP(VE+%jCpt!Zg z{HHR!v=bs~8cg{Te{SAyx4`GRNVg=wlM_^^U_wJ<{t${>6j&`0C-yxRjJ0v+drgcXU2S*-WWEcmXodw!O z{nA(i(iL(lpkkZH7(4{S3$ho%B~vg3s9e1G^?`j^OwI1>7{=5`&>u%q72V8&=8(P)0mu`{3JepZe0Qf7)W)5-=n)%=$mEG za2Gk1qB3(~>I#O5%l^=Po3>^9sm!^nG(M6Rt(^_93sP-HGk&XUy-HX&HTVUfm?9Ss zD%I#_8lYHlu$#+7wcILlI02VH-&Owj@q^YnvGlE5+dq$$TX5|nX+;hS(BfS4!iD~~ ztplB9S_gQ{E;pjd-R!Il_{+f85i{}E2KC3*2T$>q7vJa5!5Fx4rrVL;y#gm5%+^uUeUcekoR zb*%?Vm$J41U*-TF%~A9vD{$2)3+(vlAmCi=tjh@spPONNa(I(=PDdb*AZU|F=`nDj zJ%H<^aJ8El9HI2*?oxtf|Fjy}x36CVF5RG8;N;{q1=9yYI)Y$1f|fLfUfnE8rc>8m zp?W~4w1nT7$0mvRMGW4uxE<1Oe}jdO7z4@qOPS|Nzia_~AzF+%K-n6AzJoRCl5)!= z1;CQ10=}6BX?}3qiHoi^27McvBIs^&QP%HLx>84sm{xDREL$M7n|i5sn}r@KwJ568 z$Cb<-XqZg#G3pzy^pYi*agbl*C@N?PCAv}%ws5eD9)H@D4qAc2x~vFT%ryMX@hXWt zH^%!ZZ+Io1L9Kgm%eCulG@x2kGPb$Y9ius*w>_%)u57;{J%%KCD%jE!bh&{G~i-Rj0`^Fbhgdh>2?KfuIKu$j*nf@ zq!DHQW_hS8h#W!7q%XWvpu048FSq-JZmNg$SL4d?L@}H=C$cxoLOeu^BDXyAH{8u2 zTb55jh19=fNO0zgcHDQqo4gd~x)(^}yb~CtW7DTv(zAQJ_f%nz2~q8i{2c#bH;x1E zrGf6i@DIbSFU@J4aVq$mbN8G*Y{y9Ae%N|2pM==jItmTyIR~DOZT8zdDuXA@W|(cn zEN*nBp@vB%o1?DZ7^zkvQ5g@!Vg3z}&avW&m&G&OvcD{^3*NnvTG0JiPdCCixpS=G zw?ZOVZYfBrd>ND$yDZ;m_msXBn4%&H(oWZDppvHTAPj_~X%~f4_Dm3VQ6S{|#K-yj z`RkuDl3A*Hxg}G${GSEKbfRN*!J&_YhyI=Sm9HUk|D4MIoaV&81>)wR(@MU>?nizdoL2_cv@uq;r z;9P7+h+_!atrGM=OR_h-X718@w_ew&e~9kn`TT)4adPBWUxMcr=y~@bG1=mXoE?BRn<>(l&igk4_PP{r6GajkRo)l}2J-$(c zv|UX-;DQY=v^)G`3+012u+OLQxE9t4G)z7zJorfXhcVVv0()ttA9NnGyR+rCDijbX zmhaUoZXZlb`4?}gc zP0;%Jo$myY)_N=}BAhrcCQwyiHG}p|oi1J8H{pN)8Pe{bKa97=mKob5%-x6lyD`))Lc z${E<>;3^rC@6k1ljum9qBMuAz5?Er+)Qx)*j~ok#(>nfX;JGW#^W###2P!zztm(1} zdssb5=v64a-VZv4*cy2$5OlKsIB%JsGPw3#O+>s==m~`17bw$3{{jvKW zQPEYcHCX}h1A$*(us)K-`=0JJi+ykm!E^`l=X8R}CL1;9at8U<9ZaL(wb;PVx$1&z z1Y8+;#&<56l+XCO4>S8oBy=U^Qz>cAI+*dpc5MMGSws{DzR=?VA~hnr8!! z4tCZz^4S&(J+Y>+FzXn+(w=pd4WPFIG|MInVPuyEgreFAvq*F|7q01f_zc1~Hw6KD z>UV5lF)WY#cKf`g<;T&?I*(Vl*VFLz2gShnGBosSAcG^Zn5PBP?f-#W;K`u=wKQPt z{39$t#&YdWeJ`o~gks)pzl?X^ansWG_0TxNvyC6O>c5j<4k@X=IcM}0BZs`cz~)ug ze?u=59rN$C(taNZ48NxW=Lyl-@F&+k@qYCIOE7##+3#C&6E=y3230+$I=((>+MHu! zBTLt<0-WtLeS&zcK6zqb*4!QH!E;uXK17I2)(j4R~-C+TRW0e(Ql4RCCt zd#dP;uA<`ot`@!j271hVAH0dTpQEL@T{V351QtN9;`FY;>2jJQdoDc<=dHp_-kAxm z`8WgJ2&?dpL4tl@tCl&VO^NEJJ(=7X_5$0S5!swkipS}0sO-?O-5hCg<|nvs{aN(? zAndJ!>S}^-(Srt;;BE=-1b26LcleOt?gV!T5Fog_hhV`S5+Jw}EVw4PgH z)xGzxR6#g=1X1ee-&la#y)Sg@xhLZ{xNc8 z(8&N=7plNrf>`nYOU@@Aph{fO9|!I3PLP2E?GA8g1wa3DdH8GBT3`JCB-WkN zSK~^t$b^aU>(+rM%Tp{P$DIGs^7eiDhV>4T!&KLwoqYn6i)6i6Cn%jh&MK?@zKd8E z|LWKBYb#uxqAyj548G&rbJe%GeN|nyYl&QGw(|kPPWEFr+L`tj&lLME)a5mKi?^3# zy8}W$(&(s<{sYMJf0O%LKZ7o-Es&rCB}m9$USO|kbrUIrcw|0TrEc9w4T8v? zuTD0S?74gU827;9CktX(%?QL;Zk|1s=M??;rXymId0l;5=lN0}knlv~a9|O&Qr3^c z6(sU$;IdH)efopg|$p5(ZiHMLZeqs&Ql_@Qu-P+J>!t*cy0!pT7dG@4X~m-0-ho zKYj1@#Yw%p*|>avRfwmf9zK5jL2*vUQRrhBadvdV9)Bi(%{ANam;h~1bF%$E0o8f0 z*LmpHbnon8xOLRW5v382unQIo*0jP{=&sl+z1PDD-4oDFPeoB7a!A($(#HLzBUcmY zr3yE;xW%#_1tW{Vw^_%~5lh;iG7HNF6Ov?;ZsB+6*3F7z#}5_HRMHEsw~=JlWBMYW~9g#rk!7uDG}8UO2s@bWt9=up=Ar zAuNsl-?@2k`Hazg`~~~J#@_PL7A4jgBZQpBlsioqt+=uzjuG&vOSKHe0=Q}Jqe1`V z&>RxiEf}8`@Tm8VQ-9&i!-U^t)8lphd!f)T9~87c*Q%ky%6PZfB7oFe zs`|S#E!{OwYTFEl3a>=4jrmq*wC#y~_JwFa()?SHN?lzIlO;gi`b=XTlEF}fa-OB}q ztkRd@I6Y67^>ITjm#yh5n+m?H#5%khQ9KTM@E1_1V!o5~ib}SRLyy3-Nz>9V(O_+) zLVOc>-&derIO908olv-XYQCXFErM#?v|2O4QG_GJWh?^fY%zV~+o&Q8C{ z`1JK=iupu=#p50$4|C7h)rSC&`lt=StBOb`-ru8;*rJM2qU%KT{*n!K$VuN~+;QTT zR^4%pQTw2pXazh>poQ_o%9C#y;lGD1BoL#4eYXZ8`*cCyQ_Q;SUI^dN12RCTJvnOl z9!^TXOG`Pq9=T#+dP_yjE!$B$))FQhRtUw|I74FZ-?3y2X|%XO=;te$E9<zkvj=*2IJiviL^MiBuFO4$$^l-2Vh*i2AJ>1!d9(a$MzX{~AZxMKG1*<@udJWLQ?nrV~`oNDPH9vFU~i6H_X8g`bg z0V>m%UTodIo^=0RzEeBex?MM>>`P#x4BIZojni_}G5qECASw2^zurW;mj14ICCxMO3~@f^UXbSdR(6{L^&11_NA$dS{ZBK-8n+zhLH0 zC1O;1Ov)hPtaHw6y*dVQWgGLi|AQC%6;71dBqGLQ16znhZLbmZElxAXhwbZ>a=xK1 zty>ZIUaPSGkk1>N8|&7sT{ix#Ytw(!WxHstliK-OiSi3-Y@JS+~Z^iokdV zx*#m>$;mWWN73BPl^+H8y#R@FFCj3Kz#SxlQ?tfA=57S9tHj!%CFD5rjhX#Fy*ILV zJHJzMT{he5G!WHmUtjc=u3sGNnna^=6!~j~SY-dZHAJzufAz=ih^WTvxdHz0A6FbB zOqoMc;Pg+DXYCAYrs ziGqCPR`~5R-fJv3>HP_YcrsHU_9KDr3LD>Apvp0ZHTRuA%~3S74vEUXHYH2XYwh0) zqKImL0J&LAEKpzVFcn}u&rROh11~O?tj_c-I9i}Bw86`&_qqMJK)t#ogng;PDEPF` zF{e%#xpP8508IsL=-0}J8472`fig>e)^k}CwUzrf8%CB8;rC_TnN+pCH9wyf7hFq zPu9ma$@!va_CGr>xVld;*9@LBMCiFsx5$*Q-OS#z&o4DFwKQy8e+HH(f0EVpVkB*a zP5E-`g%2b6G_@k22yvr(3g7X+Yz2xfa#pE)0(oI|)5f2$_ z>?*s#uU!>P^Uv-+wY7e$>RN=gHe2gaS|9$Qvw8Aj_n$XECf$XH1P;7Ewg-eSS$_?U z#eryJWAkfE$Cqlu1Bt?h{u+Aqxfz9O7CnD<64S*E@ygN~!L$T$D}0)QT4gK@l}%~;iIAMU8ekHQ z7Kkmv`tpmZR;8thA{+kzB7!pZ!?zs)@_5w_)Sd0_=EfIq80aP)0tuB>rtnL zh^AJIsmkuW;8;mxL;>3zUPpVGuSt1DfBf3apKRaGdmq-X`BzSA9e;+x%g^l{(!W7h zXDa_0T|-;(O_M;Y(97eY%hw4OiepQ*+qo}db?vvsL-vwRcH9eO<4!(%Hd<jIQ_;_EI4xaOsq0 za^)Q%T6wP3Y)CQaJk%nCdaYex2^^5XK|quxiR%%J#|%~+`YbxNl}dI9UIJ=dH~-1& zH@V|1Bj8|j6nFw_uBT9FN(;%1eAgu;`+7X=o^>P6=hjr!}nP!LVi`4rYB35>aS)4DWrB9 z(wfgc^duxnzj@jnYD>mH)NI?A;A#2Iub+`Z{Km(>>WmGTg3EXtq)fcO6S}bjHEiv>p7Oho|Uta&2)R zSKX;fJbl@|r_KG3u>HQb_}|X~i+ty0S3K+{pN;?x7v+mG9`Z+Ux=Q=Q1fhuYS31ny zFHP4ZM@?OU9-L>S+3`JS%DwN4Q`tHB(Xe6s4lmQ5P#gt~b+>o^^CGI#??8W?IW=wq z8I2wD?1sl`~u&~KbL zL8`7~nmXV+$%tEr8E;&j%S#JC7ML_;G%Pu?+8#Z*rBbi%aUu^6*cd*BpC3{WW<7Zu zn7W)lC3jMx<8^y+>; zE5`kHT_oKw@f;&(VDWLv0=)88@6YYi1n@sn#_Bl@U70)QtR4T{H!vh}Z#;jhI5mSD z3>*m}=6XXa>;oW#w8ylcY#}59UPPYu9x+J0$tr~xvvyb@!(O{Ic3oUzjdlItCfhvW zGW+jT3Q9{n9s2hA+nvVDwiABM0nZIa0K+M7SbMCq58%26kXHg|@$F(qJ;41Jvx1c+ z!GtomUOTTQcCR&_?oO0wlMyGw^(kA%@{ChQWLk5Gu=B}nnnX19MRvw|DQo@Cp1hs6 zJynokdXn&=G=23~pMbo8V4g2_s;kN8ru$>6+&Uyd0y$v-Cdu`sw5Ey~(7@3^# zXMkwGY;k*Q>y=kAmkh{9xe0HU(j9pKnxBb=ma1@hZcEg=cPv(taz}`5$*?(W%#RnI8H=iD%&PxqPPk>zzCR6&sq*}%;Toln8W$16H zE8z?Syt~ZXtt_HI*FU2w)0I%#w87CKc7kWO`8R1q<*`F3($7;e3VTPOI`PPg0KNQ< zMHTdc8s=4fzX5xYWe`0Baz_Q0w5B8uaYRV3yF;SFdgYZ^aa+|E^YGy}x7{`(lG|DA z#YWZGYB%0h&UwAlR-~GJ8kX9xX2&r?j>3iClXE7kFMM9%sglwyr}FRJy(BR+C>|@3 zhx?-pV&t;)y~I-|ZC1wjcQ}^0t2w72gy(e=@L*m>l!ts-vG6>6d9`M{>Bxf(VoyDs z?L9o6s(v;gA}%H_g$}t=ME5gr5=i_#nXA!ORsDlWq8Qo5tAs|-{Fh$8uY8xG zu6EdndLQuYH{+Sl7py}SG`W+z?g2Bg5gm}9p{4Iq*G6o2zkx2EJi*56OPX|Or#X+$ z6nk8mNvW&zzK2ry*j!Flb2PX-*b2XR#Uj0X^J>K4=u@n6mYnQ{d+vk0NO3nZ45D)2 z4&3o(9gs#>>lBZ#wK3g7x)3D=BKj>_`b>GK23OBeyJR97*J+H;aD=K9`9fR{Hv@M* zn3JG9IqM>dY^I0$;&jjmOmA2-BYi0P60x(Zxf$9|EAi9Vx^X4h)airxagu$UG77%N z)kNc^T%s0ggRB;$3^P7VygE|7`XlTR;FDt+Su~P41If-BKBmQh{Le7Lar2FId)Nlbc`MMb|3MKhtuaKd+UKTT%` z)VL3DNZ>_tiScL`nbpC$(xu;b{%^EDdKV}UF09Cd__LC>Yhh_W1`9NI1&;joXW#v!wa* zj1xm+`VL44PHsF&SJzWCLMp_`z@03if-5knsg0!g6;azfs`(?7CmY&HKyYH#CVn`-5s zmOq!?l+H_*EjYIH6TK%DU_IbT^a!kmt(RPiyzZ;#e0ME3B)4Z_!ZyZ=Z4~ z)ub_${b1Az=8l9VVdf-GuFNgZTD!f;>_H1;71 zdFW$4SzhP!(UP!T-`Al*ZXRhwh1$!%tXbftfO3pj7=BOQcio)7SL17{h;n00vLJun z)I`NI&S&t&;GV9P?^*$@lpV&X7jeS zaO)w2Cu!l!d*35=N7G!g0lCogBH~1?#BxVB<;&L zDVFdF!AJ@9dlUXZHC+%Y?l5H`B-BoaALKc`*X1Z`973|O8Ol#UN5kJA1W{tEk&0G7 zc9ZZ<%ja{e!!7@Fs@u(9I?oF86X1@bg0*l%8P7)HFa?s5-ZZTB3#`!lIV{mXoJsNFV5hp9h z7HvWAeapI`r+BM7{-ixlBX1W{VUU4GQr$#+9!njpl&o%-u;MiTnre!AHM_p?8QICf z$`pM?Z{A;OqZK9;3P)ve`E&$0oDZ(g4N^nQhTc0@ZWC2_;z|k1gAW7Cnf%N@J%pjYAh*B+mx{C?a2_n2%O) znCFw0et|aX#q9jEN-o{bDCWPtGGZuwa=s)sz?NB!Z9uc>|`hpXZea8eDCby}TL51n12RSH<_ zU;W{4Z1Ia#9g`>4A#1rbInFry2@m6QZ99CfM^@_`G@aoLDC`sH3TWc4>0Q;@_3B&Y zH2gD`;Hy8W3Gz!pum~)qBr324HBmW0Ols_t3Ai2MhxFbC=SeQg1=~3)RpjFjr1mEp z+VqEhw>T_W0Fkq}Bb;VVH4aOZ?6t&m!=4l?VClDwOskYP-H6lI!^FCDS>T*N+mLoEL0lFinkMiSmJu9!@amf ziFET?!1Pow>^WJT4O z8IG^{ti9S{+b)j>R^boF$>(XxO?uLH->d*RQl!AOZPol8=26&hPrS{fSi>W|3f?-B zday#;H64LUhUFvm(@z#o$Yr5S03cRB(mZk02BSg4a~lgDes#2PQ)6s!4ug1udK3(D zA9$I+JWSd>wgq&JBEU!gCFXt@MrhB8x394X<6=`}1bIF^Y7tWSz5h$?7+3FA*8Wvv zQb^aaQT5mJq^?70Ikt+yixM^If|Hm48$XbrF#ga1z+lNuh=9No`Swmo9Lvlz^_r!& zsbJVfGGdG|aAXo+mx|*%CRlri)O4ML@V(DVJt(R3d(?%6m$6r99zpHMR4w(!c2#{~ z)1s-O0C|awmpnH(%MbAJ3PuS9adq@u-c{pvS-_T}8r;83GH@5pD37K77;(q8n3E@n zN_~)$7hl-;OATOEh|F6viF5ka(~My6z0-#m%*S&_tBekFTDr5z>qY+t4L>t)CR!`KG^D0+xw}FzY>6du(1C}C_UWX&4@YY0azcsz!)Ly-slo` zOc=@%wEWJi*JmB9MPYxD{wxAsC0^Zlz`SLd_&f2uuKyI-h<2_CJ|E&Jr%IP4oa?)Z zAZ=&Su`1kkpMj744Wh+J2zxdsAJOFq%tg2OV1@i?E9*`HKsp>0=y2dGL$BzpmT#4N zlm}~z{Y^Ndvo|k02RvNv*(hhDciJ4;!DMMyk(ym&k**S@-w-@Z!y;7xs9e$4H7(A- zourbL-NZ$JJf&p_C07OkNCjwPS-H^uO#IOBZgR)+plsF?_~pc(_evdC{m8~~>E*kH zN6bZ(GOp|Mv{b<3h<=U>PKW?3|9xBeC`9;S5W!q4!{y0VRv>Xd%{(eQwK=3?>n~A6 zy3g^x=2CzVrgx(JN7&RE#<;*Dcqt?-7okox=!W6cME{UrV8r_d1{g-^y)UA^gEKmp zJ$d40t$VH`(ACF%L};)bW%b*#^+>q5<+CzB9usn`&6S!4i(gy@9b}#}YOf%pO!dRH z1a!sYjzes8Zmx{2q#S)RVBgcwE`=y)qQA3Gr;dYx^yGX`g)Qul9VU3jlg7@9NLQQ3WV9Aok(f!L&LZ2<|&i4u#{zDw}k@o`Y_)y_csw!NKBmms5f zL&k=yMOEY0aiDFZXfxr9AG*bdztHR#x{Lv?6YD};E}aLb=>aj(ug2D`PPl#IHOzMF zd8FG`Q=hS(V!+O7tOg0?B!I1@=gmiAFCLY=orWd|Sd8w*GA`cs*k$O^=__zcNiCveldir_GU9+YSQN#U2{LyC zEZLc+v6i`vcm$Djx=qGrC`G>T6z1gVm(k6dlW(eODa`4aDY zuA@)5TD^yPyg&`peBH+pzg<4SAKO@((EbO{HwlVX4nB`)dM63FADoSkt^aZb<~aKK z|3N#I4fbvnmb1F^T%*tUI76=X$Ie-)MLEJB4vmHf5DvHrSB1gMxgtX?2sPaG#cXAx z+Z0ibn`QyuchjheM=6@t@8Kw#=pYKlS}Z`=OWf%r-?2LwOjc+Xn+7CXaDK=EEiUt6 z+jtWa&mL_yEc5_ft4VG5FZV0}?G+uxMTFY}M{`W3i3WZ-)lWA852@KyFc(J-u00O)iv>wsl3M=e(0_wz(U z+NKGtTdMNMCyYbf51`!et5bB+yqsC{?CcR9;_&jl|8NZ@XObyHB+mWq{8EOxcN4e$ zyc`;rMbXLj&}=xU`r~c>bH#Y%iYwGc^)Zw1mQMH%R{hsp*51n;jiFo*(jX8atcQ0b z;}7s~!td1lX|-{sfjiqU;IK-rp#{{vJT5tu+mVG-Ul6{;^?}ALw)*>0%EzR$l+aO@ zY8e@Gyca&r_>YXJ{m-76yoF4NZ{VT%N;jJS<I zMas?+;$`%;^bt*n-pOx?KK@@g=2KUKv3_uBN(vK9Tnv#^W1X=~x#Raa&c0M`Nib%D zZ>C5)I^9D8yb5!kWpxBq>O(1VD3P4bdkiT?3Z-5wKP6eGysATdADC(cKjc%W=qIH> zcM{W8RMHrPseDxEQ%hNlD8KbGqommm36pXC_{sJ`;_1tb9(S=$0t_-0plMzB<>qbW z%GD~gVf&x1p<9*W<-0`bvS-fcfj06K4a$qrU6Y0tsgmCrfW~~SF7D?joRXyIFJ0&m zE;?rqgLT@vDhRmjGj$lkSz%ZJO2ytT!R3=NAgEQtOaEvN0*Oz^!IAhSVT$9qmjcqY zAKlw3IfKyuN@(0z> zqq~(HJOn`Dq8X#GA1%iEiFL;55K!QVTQZ{ovESUvEpy^-fxq~p8J=`2(Fd?kq5De; z{($3lrf$i#Lk#5;SV~COv*vD_gg_@%`E2Q0*M^cMt=(4SjOIa%w?Hu&**+Y}^lH$; zOae*gWNZ*9YAO?r+IldC((wsB?4`ZRK=Kfne>QMx`Ei<;6{)yGhJFQjaAM>$MIf1} z8c?Y$OtQA>Njm~g5qu0_tEqxi8C)2|&ZghaP-NW117E-96#d66kW=)xWwe?pwIcnE zL+$r>QlN*q;c&fzNaZ1a^%m_|SZA(a-#I)_vY5CGfWpbPsMW@ zt5dzLhXphjMjngn{rWHh2^MyREI7tvtC{%#wad$!I|yDm5~n>@!6NiQU+0VemVTNuLhbF)ZaHM&0|_ak zIKOX&dm9Df+sIxJUsR2fi%90E1mu!{I1h+YkPBsu)>vTe5N_)1J>QpEnpq%ya#l@O zI6mNJG~%Ww7ib9q_uXc%CUiCN11NT*!TmSVltRKBI@djk@jxAH`#+s5YRz9*zw4#V zBM^u&E#CsLy))T32C`epdUeZyDSEICpvfeTpEQ*k&lzx?-s-+w$DN|c!;Mq`quDlo z&74v$PEj7ynP_g9m=9MeejoI~oIt&|+ZxOa$1lB~mv)|#r_x7Xm zD#!QB5%1t?nSSezU$FSAp1@PWqJrY(dDa!c92bDw0KwAs__1!3z9w7&qH``7_T<*A z7((DUx4q$NjBPdj>-gEWv@t12z+XPwOq9h>3ZV!*scvDHNlSHmF@1k_MztiMh9KqB zL<8s5S^cYAlc`Aq z9DHr=j+~JmC_^Bh^GIs)PB7)C#Gr5#Mz5x~_}u^=3pc1ifNg~Z3Y)|KysYJLJ};1Y z32&TC&=21R+fdPth5+J*FUznFNo*Z2-JAE&R@c68V#zVe8Dq&G<%>NGVuHbnY3{(2 z%kjaRq*5J_v9%0EiiMT^Tt$*K+930p@D z>9Pz1tPmy=>1KwS==)Rgb(M1Utqv;WJ1be@FZOtOnG1#;VdHOwsj;@pQxX4>c-mKz zEQ^zupsS)llTAAJ@t@#u1+-)9Z44g#uNA6Gy{=p44k>tga(DPKbfOf}NT?=ianVj| z=1t6~nDDmb(=S2?VjQbpQ??_t-j~kj09%1Xn~cJO{&?F((n{X8LmZNDXxVN;lq@4i zkg<qYN@hOnA_b!XS|eFK?wLqhul*JcoP^FBd`JL&0(EGkXfYui zjzo!*OK#a&=jo`L;H!s_XKLp9?;_n?T?Me`g4U|JBO5ju3!eEXujW$QavlLAk z_FSEZWitr&JYd?f;Kh%wzEt}w-*Eg4UZA@U4OpiExDh7br83{>-*p z{S=6}7soo`esfLSGT~gtvCH+1EK4Q|;8%bWJOsbNHUyhGkuD==C;qko=M6O+E?LP4 zD40fLa#Pbzhs@sNfeH;$i$X-_h*w`yR1+1_&6re-O6tdV_IU9E{v5_F3cb<0Y8jy~ z;7AzWVt#x!6O6jwnrt-2-82=)n&##dBfg>x#?0-1Qd4sp&b91l`$iY0lK^Pn0|J70 zz*5I6VaT5IJzAmcqZa;L??2UdU%nlOnky9d#ubA1G8 zEU2l)FazJK1p%EfAlC+ObSK|ux4*cp3 ziljxb=oOrX=6I*;KY-qVvbu!0Fh~IH4EMu+uJI~6$O(1dNkBzch`dj zA-GeCS*f07d5(q_V*XM$w0HOfMKnM%@HY;#stYaz{SYCYaDgA~#m}>A=X_UG-?!Do z@^$Q`%3FTcqu0N^)}l>{(ICM0)xsu2hDGkx;6Xu0YSmM$YIWVQ!80Jf0g4r!#APy( z#exribxvolz*#$4L{ts?kjA^t0$bGigRLo*f8!4WiuI;6#f1e4}FD|J@k9$F` zlB@$%ANji76WX{_)ypH*%Rgnjdx=6wLrV*-^_0@RIwo=oxJd z|1jxoJhGHW1NlhPIPrJNG5$z|3hf(?zB5{p(bcW;Su?Q@Fsmx_37yAhPrm~Qc_7h{Bu%AU%Z1AO2Twh z%4niQ0_na2f@LbrlQ3dP;?}P#r&+38NtZiE1{vC@KGpKj%HgU5l|LojycSNOy0BPnWQ{w^(9FEP zecL%B1WsqH$2jO+GTQzPHM86^Ess*Aui0yZnE~F7#YqZNsdZbe<)mKDD^jycpfr=H zuUP5$;2HLBFSMK2TNiQ?IcJ^==>ab8UPJ?na9FUySk-4u~A4B$xeIbuQ z$Y|3R550PT-KB3@F-Q-I>x`r+Zg|~g0f%?Hx=@9nbbwc@r#tETBo}*;YM(bgp)mwc zRFEDhnrh#109mfph`?%`K1kwNiOkX zBt8_>%~JskDVhi;Q{7=v=H{u4wDZ#EE?e~CUX{YmKUdI2gIi|GzTOZXH(4p~*Mb9V zifvrAnvU_#*Ip3_Kr1xpvqT_wV7s+aAg}>tBZ!lN(mId8*p5h1nI&Wi!?#1($kJW_ zW-^QWmhSE%q$71PEy#0c7tq4;o)vnJS^5r*v*L3beM$IpnrC5`5Er^YX*RI9BvEgs8Jxuj^n=$#A?`!kfE5SQZ%dbQEK&i( z4}G~3xb=bR8SE$WY#?*VFDgk^cuPO*C*XsDadaM=h{@4mRZX@lZj{-BA?<{C;2rZ< z)+tLq1w9UxgPv0dzyNHl39j-)jwGnun7kmY!^`VQ0JB+-?0h8eu*I~-BMv2G**Rlk#jw{i;pH9ICz8Y(f0&Z7?9cnJ zzZlD6G3Qflu#9sfWhkQk8E9nQbHGqU(GCb6@k&bjuskZ(^$1~?B7z8rWP=hs+-r#f z9ppQjS#q`i<{95e6PEl^B9}5G0F2iC7>v2L-H>3a>up?S-@#B{3FYa z{VMI}^bwO>%_;dnzahkJJsl#j$rYEytChnkmy!-Y5&QF#j!2K^#HFeMof#-}D)Qzx zIn&T$0lFQ?8*-5@XNy!Fu}~P5$W@~g&>^|1ZC5ZaiIz7Z;aHjWj(}IZ&D3{@CI1N% z+h5|QE{>>lL>3XU5+5O?mTnvPt(`?DFvkJW@3rHcf+h00HQAnGhtvb8Jey)e1UQMW zkh!mt#`z`7bSlkiPwf@#%`}o!iu-}agHKl@q6j6f=va&6A0m~xb-ky z28E!~Dx#m zbra*T!dyvp^D6atI)sz;&D??K62m=y+k@2p=Tb;R_j$-4Zy`V{gIc;?S8JU~xsX{J zCYvjJd)5|eo5|lXFwMHs<;O4h8qu6nFFDkL9FG}p&fd2!UI7GJA0P?YNt|N!;y^3{ z#wer!Aw=2>2Yq!_Xq8vM;ms@p5|4f95o8flaWLOj0SJ1`bnU4?wWkoUaK}xL4RAN^ zy`{p%$@*FmK)z&gMFtsazzJIj+Na*PoB%Xd>`nxrWawB4yDY+70FTaz$^^Qmk^+?g z1vy1HH8cPPWR7(3ps!rH?q_OjZjd`Dx*4Nn+Rrl@1>|u}uKldgj?Jo?Bn?Z4v7X+u z>mQ2PW`(4k-vF$sczX>W0+Mbl97i!wncadBsHr)1!#U34tx`vJ30?u#-=bdX|FV(WyQ_b!pcU}1E&ty>q8iI;)} z2cBrdJif%MlNKzpWz+kwyD$X`Z^i1})`MUCxKSK%@_{!FSYl$h>5uaq8#p1`Fa7GF zbwnCs?fJR3Lm;X4NI-KTfe7T$<_{g!YbtW(zIsDXXENG@3I5QsL)PrHk68-wfPSvN)>Nub_cLF?b*9^3jFJVy(%mK5hedVj8RTp8drA$*EK96WTW@-ak0}) zj1)?t`bROoQXN4BLS`|EXvN|A)k4)dA2i5n%!3ojzKe))??$(bL&bSWaAEtZYzmBD z_`O5vBa7fGU63Dh^dSx@jXj7|<#B{A<*Tn9_$8hVhxi?R)#P<4a*SUxD_(_pm;}iL zhswD;e@vz8<|g^io7JZw_*FQ@u3-}!nNnCD^2U6=JK38^7VbXnq; zdI=f}N4#TaGVG2MM%cWXs^^eoBzn4y!!4ex^ztK45Z3{cHn(TWZv!a z(l)XMQ-|af6oAKAFBo_LwQEm027}GeEJqT7$sN6fq$DthD)C#q_1qxMA@RTSGBFK; z{Pmjt7eOid%f~<2p5aUcFp~=G`)BPyxi9P}n zC|qtKl9{)hVjP<5?TS61A<*N=?MX+{A-Fox966+`uEJ6f?)6E;CLPfES*hg0Y5M*u zy>2Qq0f*Y-i1*NUbL6(UN)bAU5&!h_xqkOl4!T0k<1-N2xei=NB^{g0y)_cB(U|xT z_;&$2{RUuI&usFI5Nc@!oG&?iudH@|cc`W~gH}OcJWm6ifCIXf!F+OTFq(sZGEex} zE6`MTbITV%n(#ZjpMqaq;p}odby)whqdCLkK^jJFmVDhmI?8WYO?*TCdvpwo5C2#* zHoOsAuh~YydQMWCId%}kOQ+zB{2_$=XDHIm)t|p5jYML-BK}R?jRn`%Op{SNiAczW z8wf~Ow0`3dFO)x$7Ma+R$L-!NJA>!-^{6Mi`kc8k^EG`&nt&qdQ)8R(Bm82oM1pm! z4ddMV5||A##f-nv9=_kJH_IK#g7p&=e23LokoJXtw|AT4o4*KrC&Z=0D_9&yF_=hl zO?-&og7F*jrl-=n7yenfm!)*RN(g$93kKC%2^K=hH-hu^{9QyVlQ{qTR%9Bl=v@au z+j!WRue+<*e);;z7Stmi%oZnb>OAFv^nyx1(Bdm}oC|#kXnw9+5`zhLu4?+pY1=O9TG~m*VCc^1SJA zy%8pCC!1d##T8*ooXVGox7Vdc5VeOQcREy!5A$ z+-}!CcKdlG%<1Bql@AKdEq!PEiGu~&0D4eROC@z7TumwEQE96f@%{S>^l3l?|JFis z4O2Mzm00Yr*@3u;Rf3~(&48p`qTb&EGJYM&pyKZo=I|WUuHDU6@0&xOuY1T z`C}#?G5>?StSfr)9@;dwpV8W}nk5SszIm;yFh8acONRQs7A>{$iYweGHQX%gpc?jKB_itr`_|L{_k;l%K zPwsyxrZg-K+By9aU&vy^4lcp?N{!(<`00;ccF z@Y}XsFUPNud*&1MJ{|Tx3O{S+iBUKmbyBn>9PZR0O3o;Y4wuuEB2n{0vY-BstYBJ=ov34Rl|97|9ju3Ur#Kdt4Sd4n zmpoibGGX>5s-Cxh-ULo5$7rV05OZjd|HrBM+{ATrt2C-Y{^EA4@6MRh_=!PPxgaYh z7XAWE6(%Gm{xDJ6{bkRs{Q}HP4g9dF0Y*}S>4TiVuKnm7HGzX$d7huWOknQ&%1fR3 zChcaszw)eiuJA_E8t{v=9a%*a%?yY56KOI*wACz#;ZE=_RdW#qE!OXd%}DlDR+q7= zuzL?VD_?pY$Xto#b1x#0B02KO%Qi1c8^h-18#GS4e^QZ0l`n!o=7X=RT7 z{`eOy5Nj~)M+}$X>~Y%Rf)b>v#GOUl^*QP4TVIH$qH){yxunTwvM|Y_H-UYBJi;<~ zNds@4u2=@bFeW&0l5fVn}JhG8aDGIknxO#PpVvh)XmM!b?IEk zd0J?ocs`J=sHqvufB8#S1B?-8zJf_EIu8HItWy6xz!s}zt5>nIi-bFaCwaZY%ua+( zKPsPdh5jZ*;W(6`*`8&0^eH$W`F#7`oimz>9v1)Fhku=P9fPtfD3hK2fvoS8%rSob zhm-J-P*X0_=1P}g2O&a0aIzI(Y+F)eJJ1`&;jN>Ittea#gp5jXR3?W7v zp!<@Nx+dZMRKmUf8@85BDKWl8=GZK4*(yGB7gKF>>pOPuC~m+Ds&`^t2fWY_0cQ83 z@P^H>L@U|7zU6+b;SXA7g`|-trB{v|w7YLMKeV7~n8$HYvHeK=3!i<2%DtKYlZH_S z*hGP_veaaa3bpj|yS5j4JZWwVdhT%3y@10M3IU_ewY0P#kf6H(3X8=$`gOb3Rr6NW?y^#o`1a$B{KtkYmB0?QXbvJ*Q*oO?+UK7(P3pL@XwCYhfwc93 z&3|&}m^!(BHf7LMhkY@9+>BLHf)vZny$Q+YdEcMTq}u@SgolTR8E`tUsH@X)LbG#l z2;(@&o&`=L)0>+~Y(bZCRnKV|8J1wE)7FXK;J9LQapf~{(@PH;s_1PYfiu@YuqFGO zx2k0hf88u`1-=sEoS9_xk%&=ee%g%Ca=$CPB#+@BVrPG&$@=eIiX9t`g1ZE`J_I_g z3{2p2ZM_c=ncrDhSeW+yFEOqq(5v3Ox?P!>rSoMiNVbn;ol#e1vSt0#h| znc2gU;Z;r!zBgQ~)vpKGXw_qENk6CA-}C0dNlZF&Qk(2t$H)A~tX-MMo{`-&lzGuO zX9(utl(k@Z#E(TU)8}XXCN%NpdtJpmePRwPr#Xx*Mm@t+{4->VRbfa?>|GYQ`n%vO z*o8tKPKxBBS2$2>9R{;Pi&)xk3sRc+La>C>9cpC26l47zZOA)o8*OgCZckuh^_$TI zwv2&`I4T3{b>A0SYN+$36}Z4G=d7OwaP%n=#@GQ4Q`m=S(2u01&IP}N{+LS%>QEl- z5s3`^c(79@*`d~|)H6i1P^UX7fdP1^<+_}0Ce*^@|N6(7EoZ$(wA7H0voogze_$ji zrOAEe?Z128M$Q3~1JkpK2?1jqX4>e$Z{8UP^-zGhqz2xSIEX*p9|R>s#UTHHuPGJ< z1!hwn(s1#EdU10R{~BwV9<54eP^^8*jZ3#K1WC9ZzgOTfw#um*_a}C5MT)I z!bj>Nkn01iUVqNc7TeEGPlvQPEcV+pQ-P_m0HGjX7fROvYYred&KC;^5Sp2pflj7> z$IDy2vexDb2ZlUKy18+lcnJbW6cGV6@r4gfsv^K@V%n~ zH`wI+$Hw{*Jc_|RH+f*n^NxpS9M~~4gSkFe&H2yFMo~oSz_QN@%z>C$TB5g|%1Z}B z4*q=1&1Df57FNgxmp&3uiom>3x2z))xK_*&tAm3Hsp zQ0IFbz<;7;&$dNdRmTcX@u zTwMAPfx5lpJyj2!=^6Gy^9>vBqLC8sS??GY7UrJHaFGMI%|J7mI-VLMx5>)R?ngxZ zEu^VCuvmGCW-=+!6djS|i@nL3aD4qo>o}9?85#Fm^S{X#2z+KL4)-UOU8Lu1F^tvN zhfMD>U|#)W&CO@Qo;ujt#>ES=vh7yK9=EdU3@YC|@!*SlAwE7n{x?1QVNYmkq+Pvg zsH7jGc;%OF0fep+#_0?ijq)o4l$j@9~L=`mVanZXMrw z|I}9~6wDCWf-2vVaR|<*p1cy@J->RxYmd9vmEO zE^upMt&Be}F3-zT4hRU~4ez_Y46$51i{4>_=?%XdtE;_0mZlh)nuJoNMD$X3Q><{_ zt-Rj39rTL@--U-WB99%j31(`HLMyu_8NTLO^c2bo@dOd>ZzfyugR5(tP%(U{prAnO zdP?b{6fT!WV)5JC+ev=8r>EyNu)=sB>g0z1x;a8=*roza%q=a|Ag0)3pO(14+zQs95XIVr_W+ ztW&H}qlVyUG-Kwnhxrd5I`g}NQX-drW#`ZIi0TSrtn;h>tz!$5nTTp;)xNJPT16PI zix_&`;h$E9y_$pq?Rxb2@R2;BP!DsNH~H69ND)b!hxI6&NDwx;WXY1tT<$!$&(lNO zV(w)oG~>M`bC=XBTwXjddJ!OIRT#?|_r*^Wjz1czt+$*D_U5yXk4|ORs+gT{H`OG6 z=+>Qz!)Hz1RD01S+XSQ(-yS|v*dyucN~x^exT;z=RTX2w{5;bt!+j1lm3d?) zcIa4gbd;5qowBpCmYaI>)e$MWdt+9^3Yw9Li3kW15$Yd6X}>ABe3_!t={!Dz!N@Br z`flkICQjkGQT!fLXCV>p0zRoqO|y{yB;Tg5Zsq5v$I`V1eaMWN+lVbC5s;S0$SVJR{G6$JgFTD<&AiAPtPbg|1K%X zc=s++N#Anj?zSt{)xL9R*-kgGmuaE=B6L5?+}ykY6hqxw_T&lxYo1QYUHR@TO#)A6`J(Ll-y(B!C{8T+S=5U$GC z*>vPvOx7#8xnJwX$b;!x3&xQ?o~Xvsb-o?0l#GS<<|!-nbko53pMTbznaKIW)VIWq zRAVe;+MUeq1*ntzN1qEwQP)hig%`0FD&PBU7EImzn#`QFUbhk(*lRLJqXsth9ImK6 zaMLL`xRh*;lVcEn?#mjp#X;rCBI#KOv<`BPkk<&drVo(#r-kjt@BmyqJeCzBlB!p% z9Sa!CFW`|xV$wZb$5=_H@4%($yL4*cj?kPd>20W zUVL>}dT0LLO{^`^5Tg#(>5>l3;iF&Pr(XY!j;(SMQMdlRbt#_VClif+`=6e!H4Y>( z385nW2nH&B8(E4bLEiJJuqLoX049XOBd1A~;)f0`uKqp$^V>tAG>F)QnhOjpEEA@s ziEyO-2Yd>&FQj(8o1MM+r4@}EU>4Y=MB{D`JaniY*S-|o81d85xiN!#RER!|<|G%V z%-N|?RU#7Z-nENDxkgPUKLA|4dP*=Vh4Z)7#zq;ZDvGRQMEByTT2xd-QfCR+f$2Hx zsk=_2#oix{?T!+G;Ioq_Px6s{pLYH{;w`G9zNGX)$VW#<}b2+)MO87 zk8r_6(1vT)G$u{ZbACF9eumGM&g<#z-A#^6lC%pKPH8iOULXmbr>GN)*Q9=>yC^a; zl8yVTXLT28w0s+k{*rqMd4r&PF*xCi6vlJnpp1b=<`x$Rbxxu#5KFOy^R|#K!923* z@}Y6hvhaE$+)FocuZo}_4hd;N zODdD?^AK z;@K;=q$Ne@D6Qlc46vC*4<)BiY|(ZYItSzd*@BErP4R}; zWWc!-H}pvR|KPz^tnUL`ukra>gi-h`yz_W<^%lbR!t8uJVs$$4YJ)zF8@3vUq%2jv zD0Nck(S$$t!K=0K{Z;?}&O6`K{CV!du?!!7@02uS`O)?7J>=YyjTAl{ZJoCkTkksY EUq0{m$p8QV literal 0 HcmV?d00001