From 45fcd09a4a45afde02f6744e4cefb41492e19d46 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 12 Jun 2026 17:02:21 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: shuoxing/llama3-8b-full-pretrain-wash-c4-0-9m-bs4 Source: Original Platform --- .gitattributes | 36 + README.md | 60 + all_results.json | 8 + chat_template.jinja | 5 + config.json | 32 + generation_config.json | 13 + model.safetensors | 3 + tokenizer.json | 3 + tokenizer_config.json | 16 + train_results.json | 8 + trainer_log.jsonl | 1429 ++++++ trainer_state.json | 10039 +++++++++++++++++++++++++++++++++++++++ training_args.bin | 3 + training_loss.png | Bin 0 -> 51056 bytes 14 files changed, 11655 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 all_results.json create mode 100644 chat_template.jinja create mode 100644 config.json create mode 100644 generation_config.json create mode 100644 model.safetensors create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_loss.png diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..fc3160d --- /dev/null +++ b/README.md @@ -0,0 +1,60 @@ +--- +library_name: transformers +license: llama3 +base_model: shuoxing/llama3-8b-full-pretrain-junk-tweet-1m-en-reproduce-bs8 +tags: +- llama-factory +- full +- generated_from_trainer +model-index: +- name: llama3-8b-full-pretrain-wash-c4-0-9m-bs4 + results: [] +--- + + + +# llama3-8b-full-pretrain-wash-c4-0-9m-bs4 + +This model is a fine-tuned version of [shuoxing/llama3-8b-full-pretrain-junk-tweet-1m-en-reproduce-bs8](https://huggingface.co/shuoxing/llama3-8b-full-pretrain-junk-tweet-1m-en-reproduce-bs8) on the c4_0_9m dataset. + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 1e-05 +- train_batch_size: 1 +- eval_batch_size: 8 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 4 +- total_train_batch_size: 4 +- total_eval_batch_size: 32 +- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_steps: 0.1 +- num_epochs: 3.0 + +### Training results + + + +### Framework versions + +- Transformers 5.2.0 +- Pytorch 2.6.0+cu124 +- Datasets 4.0.0 +- Tokenizers 0.22.2 diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..0c78575 --- /dev/null +++ b/all_results.json @@ -0,0 +1,8 @@ +{ + "epoch": 3.0, + "total_flos": 3902317486080.0, + "train_loss": 1.6620939874066776, + "train_runtime": 1853.0016, + "train_samples_per_second": 3.081, + "train_steps_per_second": 0.771 +} \ No newline at end of file diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..39bd0c9 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,5 @@ +{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|> + +'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|> + +' }}{% endif %} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..a5b8bc3 --- /dev/null +++ b/config.json @@ -0,0 +1,32 @@ +{ + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "dtype": "bfloat16", + "eos_token_id": 128009, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 8192, + "mlp_bias": false, + "model_type": "llama", + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pad_token_id": 128009, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_parameters": { + "rope_theta": 500000.0, + "rope_type": "default" + }, + "tie_word_embeddings": false, + "transformers_version": "5.2.0", + "use_cache": false, + "vocab_size": 128256 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..eb23973 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,13 @@ +{ + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": [ + 128001, + 128009 + ], + "max_length": 4096, + "pad_token_id": 128009, + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "5.2.0" +} diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..df0ae11 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1687ccb341b3bba244a225800046c1bee0bbd1e52f1aa25c12acd32d565c1d8 +size 16060556616 diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..86a3394 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5cf44023714fb39b05e71e425f8d7b92805ff73f7988b083b8c87f0bf87393 +size 17209961 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..75e0e01 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,16 @@ +{ + "backend": "tokenizers", + "bos_token": "<|begin_of_text|>", + "clean_up_tokenization_spaces": true, + "eos_token": "<|eot_id|>", + "is_local": false, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 1000000000000000019884624838656, + "pad_token": "<|eot_id|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "TokenizersBackend" +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..0c78575 --- /dev/null +++ b/train_results.json @@ -0,0 +1,8 @@ +{ + "epoch": 3.0, + "total_flos": 3902317486080.0, + "train_loss": 1.6620939874066776, + "train_runtime": 1853.0016, + "train_samples_per_second": 3.081, + "train_steps_per_second": 0.771 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..c4392ae --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,1429 @@ +{"current_steps": 1, "total_steps": 1428, "loss": 4.722589492797852, "lr": 0.0, "epoch": 0.0021008403361344537, "percentage": 0.07, "elapsed_time": "0:00:03", "remaining_time": "1:22:53"} +{"current_steps": 2, "total_steps": 1428, "loss": 3.9686050415039062, "lr": 6.993006993006993e-08, "epoch": 0.004201680672268907, "percentage": 0.14, "elapsed_time": "0:00:04", "remaining_time": "0:57:50"} +{"current_steps": 3, "total_steps": 1428, "loss": 4.086915969848633, "lr": 1.3986013986013987e-07, "epoch": 0.0063025210084033615, "percentage": 0.21, "elapsed_time": "0:00:05", "remaining_time": "0:47:02"} +{"current_steps": 4, "total_steps": 1428, "loss": 4.020754814147949, "lr": 2.097902097902098e-07, "epoch": 0.008403361344537815, "percentage": 0.28, "elapsed_time": "0:00:07", "remaining_time": "0:41:43"} +{"current_steps": 5, "total_steps": 1428, "loss": 4.11073112487793, "lr": 2.7972027972027973e-07, "epoch": 0.01050420168067227, "percentage": 0.35, "elapsed_time": "0:00:08", "remaining_time": "0:38:25"} +{"current_steps": 6, "total_steps": 1428, "loss": 4.068889141082764, "lr": 3.496503496503497e-07, "epoch": 0.012605042016806723, "percentage": 0.42, "elapsed_time": "0:00:09", "remaining_time": "0:36:15"} +{"current_steps": 7, "total_steps": 1428, "loss": 3.9590301513671875, "lr": 4.195804195804196e-07, "epoch": 0.014705882352941176, "percentage": 0.49, "elapsed_time": "0:00:10", "remaining_time": "0:34:41"} +{"current_steps": 8, "total_steps": 1428, "loss": 3.7929787635803223, "lr": 4.895104895104896e-07, "epoch": 0.01680672268907563, "percentage": 0.56, "elapsed_time": "0:00:11", "remaining_time": "0:33:30"} +{"current_steps": 9, "total_steps": 1428, "loss": 4.345971584320068, "lr": 5.594405594405595e-07, "epoch": 0.018907563025210083, "percentage": 0.63, "elapsed_time": "0:00:12", "remaining_time": "0:32:35"} +{"current_steps": 10, "total_steps": 1428, "loss": 4.204797744750977, "lr": 6.293706293706295e-07, "epoch": 0.02100840336134454, "percentage": 0.7, "elapsed_time": "0:00:13", "remaining_time": "0:31:52"} +{"current_steps": 11, "total_steps": 1428, "loss": 4.2924957275390625, "lr": 6.993006993006994e-07, "epoch": 0.023109243697478993, "percentage": 0.77, "elapsed_time": "0:00:14", "remaining_time": "0:31:16"} +{"current_steps": 12, "total_steps": 1428, "loss": 3.6519017219543457, "lr": 7.692307692307694e-07, "epoch": 0.025210084033613446, "percentage": 0.84, "elapsed_time": "0:00:15", "remaining_time": "0:30:46"} +{"current_steps": 13, "total_steps": 1428, "loss": 3.5902950763702393, "lr": 8.391608391608393e-07, "epoch": 0.0273109243697479, "percentage": 0.91, "elapsed_time": "0:00:16", "remaining_time": "0:30:22"} +{"current_steps": 14, "total_steps": 1428, "loss": 3.751192092895508, "lr": 9.090909090909091e-07, "epoch": 0.029411764705882353, "percentage": 0.98, "elapsed_time": "0:00:17", "remaining_time": "0:30:02"} +{"current_steps": 15, "total_steps": 1428, "loss": 4.330526351928711, "lr": 9.790209790209791e-07, "epoch": 0.031512605042016806, "percentage": 1.05, "elapsed_time": "0:00:18", "remaining_time": "0:29:42"} +{"current_steps": 16, "total_steps": 1428, "loss": 3.7747349739074707, "lr": 1.0489510489510491e-06, "epoch": 0.03361344537815126, "percentage": 1.12, "elapsed_time": "0:00:20", "remaining_time": "0:29:26"} +{"current_steps": 17, "total_steps": 1428, "loss": 3.6174468994140625, "lr": 1.118881118881119e-06, "epoch": 0.03571428571428571, "percentage": 1.19, "elapsed_time": "0:00:21", "remaining_time": "0:29:10"} +{"current_steps": 18, "total_steps": 1428, "loss": 3.4348971843719482, "lr": 1.188811188811189e-06, "epoch": 0.037815126050420166, "percentage": 1.26, "elapsed_time": "0:00:22", "remaining_time": "0:28:56"} +{"current_steps": 19, "total_steps": 1428, "loss": 3.4862470626831055, "lr": 1.258741258741259e-06, "epoch": 0.03991596638655462, "percentage": 1.33, "elapsed_time": "0:00:23", "remaining_time": "0:28:44"} +{"current_steps": 20, "total_steps": 1428, "loss": 3.7471625804901123, "lr": 1.3286713286713287e-06, "epoch": 0.04201680672268908, "percentage": 1.4, "elapsed_time": "0:00:24", "remaining_time": "0:28:33"} +{"current_steps": 21, "total_steps": 1428, "loss": 3.6562182903289795, "lr": 1.3986013986013987e-06, "epoch": 0.04411764705882353, "percentage": 1.47, "elapsed_time": "0:00:25", "remaining_time": "0:28:22"} +{"current_steps": 22, "total_steps": 1428, "loss": 2.944753408432007, "lr": 1.4685314685314685e-06, "epoch": 0.046218487394957986, "percentage": 1.54, "elapsed_time": "0:00:26", "remaining_time": "0:28:12"} +{"current_steps": 23, "total_steps": 1428, "loss": 4.277539253234863, "lr": 1.5384615384615387e-06, "epoch": 0.04831932773109244, "percentage": 1.61, "elapsed_time": "0:00:27", "remaining_time": "0:28:03"} +{"current_steps": 24, "total_steps": 1428, "loss": 4.103379726409912, "lr": 1.6083916083916085e-06, "epoch": 0.05042016806722689, "percentage": 1.68, "elapsed_time": "0:00:28", "remaining_time": "0:27:55"} +{"current_steps": 25, "total_steps": 1428, "loss": 3.516192674636841, "lr": 1.6783216783216785e-06, "epoch": 0.052521008403361345, "percentage": 1.75, "elapsed_time": "0:00:29", "remaining_time": "0:27:47"} +{"current_steps": 26, "total_steps": 1428, "loss": 3.054426908493042, "lr": 1.7482517482517483e-06, "epoch": 0.0546218487394958, "percentage": 1.82, "elapsed_time": "0:00:30", "remaining_time": "0:27:40"} +{"current_steps": 27, "total_steps": 1428, "loss": 3.598344564437866, "lr": 1.8181818181818183e-06, "epoch": 0.05672268907563025, "percentage": 1.89, "elapsed_time": "0:00:31", "remaining_time": "0:27:33"} +{"current_steps": 28, "total_steps": 1428, "loss": 2.1566905975341797, "lr": 1.888111888111888e-06, "epoch": 0.058823529411764705, "percentage": 1.96, "elapsed_time": "0:00:32", "remaining_time": "0:27:27"} +{"current_steps": 29, "total_steps": 1428, "loss": 2.7493889331817627, "lr": 1.9580419580419583e-06, "epoch": 0.06092436974789916, "percentage": 2.03, "elapsed_time": "0:00:34", "remaining_time": "0:27:22"} +{"current_steps": 30, "total_steps": 1428, "loss": 3.7484190464019775, "lr": 2.027972027972028e-06, "epoch": 0.06302521008403361, "percentage": 2.1, "elapsed_time": "0:00:35", "remaining_time": "0:27:17"} +{"current_steps": 31, "total_steps": 1428, "loss": 3.4763312339782715, "lr": 2.0979020979020983e-06, "epoch": 0.06512605042016807, "percentage": 2.17, "elapsed_time": "0:00:36", "remaining_time": "0:27:12"} +{"current_steps": 32, "total_steps": 1428, "loss": 4.1537184715271, "lr": 2.167832167832168e-06, "epoch": 0.06722689075630252, "percentage": 2.24, "elapsed_time": "0:00:37", "remaining_time": "0:27:07"} +{"current_steps": 33, "total_steps": 1428, "loss": 3.949978828430176, "lr": 2.237762237762238e-06, "epoch": 0.06932773109243698, "percentage": 2.31, "elapsed_time": "0:00:38", "remaining_time": "0:27:03"} +{"current_steps": 34, "total_steps": 1428, "loss": 3.095123291015625, "lr": 2.307692307692308e-06, "epoch": 0.07142857142857142, "percentage": 2.38, "elapsed_time": "0:00:39", "remaining_time": "0:26:58"} +{"current_steps": 35, "total_steps": 1428, "loss": 3.6232047080993652, "lr": 2.377622377622378e-06, "epoch": 0.07352941176470588, "percentage": 2.45, "elapsed_time": "0:00:40", "remaining_time": "0:26:53"} +{"current_steps": 36, "total_steps": 1428, "loss": 3.801804304122925, "lr": 2.4475524475524477e-06, "epoch": 0.07563025210084033, "percentage": 2.52, "elapsed_time": "0:00:41", "remaining_time": "0:26:49"} +{"current_steps": 37, "total_steps": 1428, "loss": 2.909287452697754, "lr": 2.517482517482518e-06, "epoch": 0.07773109243697479, "percentage": 2.59, "elapsed_time": "0:00:42", "remaining_time": "0:26:46"} +{"current_steps": 38, "total_steps": 1428, "loss": 3.283078670501709, "lr": 2.5874125874125877e-06, "epoch": 0.07983193277310924, "percentage": 2.66, "elapsed_time": "0:00:43", "remaining_time": "0:26:42"} +{"current_steps": 39, "total_steps": 1428, "loss": 2.9224965572357178, "lr": 2.6573426573426574e-06, "epoch": 0.0819327731092437, "percentage": 2.73, "elapsed_time": "0:00:44", "remaining_time": "0:26:38"} +{"current_steps": 40, "total_steps": 1428, "loss": 3.591977119445801, "lr": 2.7272727272727272e-06, "epoch": 0.08403361344537816, "percentage": 2.8, "elapsed_time": "0:00:45", "remaining_time": "0:26:35"} +{"current_steps": 41, "total_steps": 1428, "loss": 3.0213565826416016, "lr": 2.7972027972027974e-06, "epoch": 0.0861344537815126, "percentage": 2.87, "elapsed_time": "0:00:47", "remaining_time": "0:26:32"} +{"current_steps": 42, "total_steps": 1428, "loss": 2.9183509349823, "lr": 2.8671328671328672e-06, "epoch": 0.08823529411764706, "percentage": 2.94, "elapsed_time": "0:00:48", "remaining_time": "0:26:28"} +{"current_steps": 43, "total_steps": 1428, "loss": 3.4748919010162354, "lr": 2.937062937062937e-06, "epoch": 0.09033613445378151, "percentage": 3.01, "elapsed_time": "0:00:49", "remaining_time": "0:26:25"} +{"current_steps": 44, "total_steps": 1428, "loss": 3.53951096534729, "lr": 3.006993006993007e-06, "epoch": 0.09243697478991597, "percentage": 3.08, "elapsed_time": "0:00:50", "remaining_time": "0:26:22"} +{"current_steps": 45, "total_steps": 1428, "loss": 3.2075607776641846, "lr": 3.0769230769230774e-06, "epoch": 0.09453781512605042, "percentage": 3.15, "elapsed_time": "0:00:51", "remaining_time": "0:26:18"} +{"current_steps": 46, "total_steps": 1428, "loss": 3.2893571853637695, "lr": 3.1468531468531472e-06, "epoch": 0.09663865546218488, "percentage": 3.22, "elapsed_time": "0:00:52", "remaining_time": "0:26:15"} +{"current_steps": 47, "total_steps": 1428, "loss": 3.47295880317688, "lr": 3.216783216783217e-06, "epoch": 0.09873949579831932, "percentage": 3.29, "elapsed_time": "0:00:53", "remaining_time": "0:26:12"} +{"current_steps": 48, "total_steps": 1428, "loss": 3.5495269298553467, "lr": 3.286713286713287e-06, "epoch": 0.10084033613445378, "percentage": 3.36, "elapsed_time": "0:00:54", "remaining_time": "0:26:09"} +{"current_steps": 49, "total_steps": 1428, "loss": 3.218782901763916, "lr": 3.356643356643357e-06, "epoch": 0.10294117647058823, "percentage": 3.43, "elapsed_time": "0:00:55", "remaining_time": "0:26:06"} +{"current_steps": 50, "total_steps": 1428, "loss": 2.612854242324829, "lr": 3.426573426573427e-06, "epoch": 0.10504201680672269, "percentage": 3.5, "elapsed_time": "0:00:56", "remaining_time": "0:26:04"} +{"current_steps": 51, "total_steps": 1428, "loss": 3.0805444717407227, "lr": 3.4965034965034966e-06, "epoch": 0.10714285714285714, "percentage": 3.57, "elapsed_time": "0:00:57", "remaining_time": "0:26:01"} +{"current_steps": 52, "total_steps": 1428, "loss": 3.1539719104766846, "lr": 3.566433566433567e-06, "epoch": 0.1092436974789916, "percentage": 3.64, "elapsed_time": "0:00:58", "remaining_time": "0:25:58"} +{"current_steps": 53, "total_steps": 1428, "loss": 3.5745811462402344, "lr": 3.6363636363636366e-06, "epoch": 0.11134453781512606, "percentage": 3.71, "elapsed_time": "0:00:59", "remaining_time": "0:25:56"} +{"current_steps": 54, "total_steps": 1428, "loss": 3.033264398574829, "lr": 3.7062937062937064e-06, "epoch": 0.1134453781512605, "percentage": 3.78, "elapsed_time": "0:01:01", "remaining_time": "0:25:53"} +{"current_steps": 55, "total_steps": 1428, "loss": 2.5727319717407227, "lr": 3.776223776223776e-06, "epoch": 0.11554621848739496, "percentage": 3.85, "elapsed_time": "0:01:02", "remaining_time": "0:25:51"} +{"current_steps": 56, "total_steps": 1428, "loss": 3.4801394939422607, "lr": 3.846153846153847e-06, "epoch": 0.11764705882352941, "percentage": 3.92, "elapsed_time": "0:01:03", "remaining_time": "0:25:49"} +{"current_steps": 57, "total_steps": 1428, "loss": 3.253239631652832, "lr": 3.916083916083917e-06, "epoch": 0.11974789915966387, "percentage": 3.99, "elapsed_time": "0:01:04", "remaining_time": "0:25:46"} +{"current_steps": 58, "total_steps": 1428, "loss": 3.0049266815185547, "lr": 3.986013986013986e-06, "epoch": 0.12184873949579832, "percentage": 4.06, "elapsed_time": "0:01:05", "remaining_time": "0:25:44"} +{"current_steps": 59, "total_steps": 1428, "loss": 3.13586688041687, "lr": 4.055944055944056e-06, "epoch": 0.12394957983193278, "percentage": 4.13, "elapsed_time": "0:01:06", "remaining_time": "0:25:42"} +{"current_steps": 60, "total_steps": 1428, "loss": 3.5970468521118164, "lr": 4.125874125874127e-06, "epoch": 0.12605042016806722, "percentage": 4.2, "elapsed_time": "0:01:07", "remaining_time": "0:25:39"} +{"current_steps": 61, "total_steps": 1428, "loss": 3.0423130989074707, "lr": 4.195804195804197e-06, "epoch": 0.12815126050420167, "percentage": 4.27, "elapsed_time": "0:01:08", "remaining_time": "0:25:37"} +{"current_steps": 62, "total_steps": 1428, "loss": 3.270495891571045, "lr": 4.265734265734266e-06, "epoch": 0.13025210084033614, "percentage": 4.34, "elapsed_time": "0:01:09", "remaining_time": "0:25:34"} +{"current_steps": 63, "total_steps": 1428, "loss": 3.3109726905822754, "lr": 4.335664335664336e-06, "epoch": 0.1323529411764706, "percentage": 4.41, "elapsed_time": "0:01:10", "remaining_time": "0:25:32"} +{"current_steps": 64, "total_steps": 1428, "loss": 2.8192973136901855, "lr": 4.405594405594406e-06, "epoch": 0.13445378151260504, "percentage": 4.48, "elapsed_time": "0:01:11", "remaining_time": "0:25:30"} +{"current_steps": 65, "total_steps": 1428, "loss": 2.6368956565856934, "lr": 4.475524475524476e-06, "epoch": 0.13655462184873948, "percentage": 4.55, "elapsed_time": "0:01:12", "remaining_time": "0:25:28"} +{"current_steps": 66, "total_steps": 1428, "loss": 3.2420871257781982, "lr": 4.5454545454545455e-06, "epoch": 0.13865546218487396, "percentage": 4.62, "elapsed_time": "0:01:14", "remaining_time": "0:25:27"} +{"current_steps": 67, "total_steps": 1428, "loss": 3.4662106037139893, "lr": 4.615384615384616e-06, "epoch": 0.1407563025210084, "percentage": 4.69, "elapsed_time": "0:01:15", "remaining_time": "0:25:25"} +{"current_steps": 68, "total_steps": 1428, "loss": 2.52485728263855, "lr": 4.685314685314686e-06, "epoch": 0.14285714285714285, "percentage": 4.76, "elapsed_time": "0:01:16", "remaining_time": "0:25:23"} +{"current_steps": 69, "total_steps": 1428, "loss": 2.94364595413208, "lr": 4.755244755244756e-06, "epoch": 0.14495798319327732, "percentage": 4.83, "elapsed_time": "0:01:17", "remaining_time": "0:25:22"} +{"current_steps": 70, "total_steps": 1428, "loss": 3.080875873565674, "lr": 4.8251748251748255e-06, "epoch": 0.14705882352941177, "percentage": 4.9, "elapsed_time": "0:01:18", "remaining_time": "0:25:20"} +{"current_steps": 71, "total_steps": 1428, "loss": 2.779900550842285, "lr": 4.895104895104895e-06, "epoch": 0.14915966386554622, "percentage": 4.97, "elapsed_time": "0:01:19", "remaining_time": "0:25:18"} +{"current_steps": 72, "total_steps": 1428, "loss": 2.5541608333587646, "lr": 4.965034965034965e-06, "epoch": 0.15126050420168066, "percentage": 5.04, "elapsed_time": "0:01:20", "remaining_time": "0:25:16"} +{"current_steps": 73, "total_steps": 1428, "loss": 3.3032145500183105, "lr": 5.034965034965036e-06, "epoch": 0.15336134453781514, "percentage": 5.11, "elapsed_time": "0:01:21", "remaining_time": "0:25:14"} +{"current_steps": 74, "total_steps": 1428, "loss": 3.302570104598999, "lr": 5.1048951048951055e-06, "epoch": 0.15546218487394958, "percentage": 5.18, "elapsed_time": "0:01:22", "remaining_time": "0:25:12"} +{"current_steps": 75, "total_steps": 1428, "loss": 3.084743022918701, "lr": 5.174825174825175e-06, "epoch": 0.15756302521008403, "percentage": 5.25, "elapsed_time": "0:01:23", "remaining_time": "0:25:10"} +{"current_steps": 76, "total_steps": 1428, "loss": 2.839994430541992, "lr": 5.244755244755245e-06, "epoch": 0.15966386554621848, "percentage": 5.32, "elapsed_time": "0:01:24", "remaining_time": "0:25:08"} +{"current_steps": 77, "total_steps": 1428, "loss": 2.8261585235595703, "lr": 5.314685314685315e-06, "epoch": 0.16176470588235295, "percentage": 5.39, "elapsed_time": "0:01:25", "remaining_time": "0:25:06"} +{"current_steps": 78, "total_steps": 1428, "loss": 3.022369861602783, "lr": 5.384615384615385e-06, "epoch": 0.1638655462184874, "percentage": 5.46, "elapsed_time": "0:01:26", "remaining_time": "0:25:04"} +{"current_steps": 79, "total_steps": 1428, "loss": 3.11270809173584, "lr": 5.4545454545454545e-06, "epoch": 0.16596638655462184, "percentage": 5.53, "elapsed_time": "0:01:28", "remaining_time": "0:25:03"} +{"current_steps": 80, "total_steps": 1428, "loss": 2.8419973850250244, "lr": 5.524475524475524e-06, "epoch": 0.16806722689075632, "percentage": 5.6, "elapsed_time": "0:01:29", "remaining_time": "0:25:01"} +{"current_steps": 81, "total_steps": 1428, "loss": 3.14296555519104, "lr": 5.594405594405595e-06, "epoch": 0.17016806722689076, "percentage": 5.67, "elapsed_time": "0:01:30", "remaining_time": "0:25:00"} +{"current_steps": 82, "total_steps": 1428, "loss": 2.8033950328826904, "lr": 5.664335664335665e-06, "epoch": 0.1722689075630252, "percentage": 5.74, "elapsed_time": "0:01:31", "remaining_time": "0:24:58"} +{"current_steps": 83, "total_steps": 1428, "loss": 3.087614059448242, "lr": 5.7342657342657345e-06, "epoch": 0.17436974789915966, "percentage": 5.81, "elapsed_time": "0:01:32", "remaining_time": "0:24:56"} +{"current_steps": 84, "total_steps": 1428, "loss": 2.7504851818084717, "lr": 5.804195804195804e-06, "epoch": 0.17647058823529413, "percentage": 5.88, "elapsed_time": "0:01:33", "remaining_time": "0:24:55"} +{"current_steps": 85, "total_steps": 1428, "loss": 2.701443672180176, "lr": 5.874125874125874e-06, "epoch": 0.17857142857142858, "percentage": 5.95, "elapsed_time": "0:01:34", "remaining_time": "0:24:53"} +{"current_steps": 86, "total_steps": 1428, "loss": 2.8965351581573486, "lr": 5.944055944055944e-06, "epoch": 0.18067226890756302, "percentage": 6.02, "elapsed_time": "0:01:35", "remaining_time": "0:24:51"} +{"current_steps": 87, "total_steps": 1428, "loss": 2.9607667922973633, "lr": 6.013986013986014e-06, "epoch": 0.18277310924369747, "percentage": 6.09, "elapsed_time": "0:01:36", "remaining_time": "0:24:50"} +{"current_steps": 88, "total_steps": 1428, "loss": 3.2360849380493164, "lr": 6.083916083916085e-06, "epoch": 0.18487394957983194, "percentage": 6.16, "elapsed_time": "0:01:37", "remaining_time": "0:24:48"} +{"current_steps": 89, "total_steps": 1428, "loss": 3.146829605102539, "lr": 6.153846153846155e-06, "epoch": 0.1869747899159664, "percentage": 6.23, "elapsed_time": "0:01:38", "remaining_time": "0:24:46"} +{"current_steps": 90, "total_steps": 1428, "loss": 3.017669200897217, "lr": 6.223776223776225e-06, "epoch": 0.18907563025210083, "percentage": 6.3, "elapsed_time": "0:01:39", "remaining_time": "0:24:45"} +{"current_steps": 91, "total_steps": 1428, "loss": 3.4739527702331543, "lr": 6.2937062937062944e-06, "epoch": 0.19117647058823528, "percentage": 6.37, "elapsed_time": "0:01:40", "remaining_time": "0:24:43"} +{"current_steps": 92, "total_steps": 1428, "loss": 2.8482136726379395, "lr": 6.363636363636364e-06, "epoch": 0.19327731092436976, "percentage": 6.44, "elapsed_time": "0:01:42", "remaining_time": "0:24:41"} +{"current_steps": 93, "total_steps": 1428, "loss": 2.7700202465057373, "lr": 6.433566433566434e-06, "epoch": 0.1953781512605042, "percentage": 6.51, "elapsed_time": "0:01:43", "remaining_time": "0:24:40"} +{"current_steps": 94, "total_steps": 1428, "loss": 3.109806537628174, "lr": 6.503496503496504e-06, "epoch": 0.19747899159663865, "percentage": 6.58, "elapsed_time": "0:01:44", "remaining_time": "0:24:38"} +{"current_steps": 95, "total_steps": 1428, "loss": 2.9637131690979004, "lr": 6.573426573426574e-06, "epoch": 0.19957983193277312, "percentage": 6.65, "elapsed_time": "0:01:45", "remaining_time": "0:24:37"} +{"current_steps": 96, "total_steps": 1428, "loss": 2.846522808074951, "lr": 6.643356643356644e-06, "epoch": 0.20168067226890757, "percentage": 6.72, "elapsed_time": "0:01:46", "remaining_time": "0:24:35"} +{"current_steps": 97, "total_steps": 1428, "loss": 3.3485140800476074, "lr": 6.713286713286714e-06, "epoch": 0.20378151260504201, "percentage": 6.79, "elapsed_time": "0:01:47", "remaining_time": "0:24:33"} +{"current_steps": 98, "total_steps": 1428, "loss": 3.014303207397461, "lr": 6.783216783216784e-06, "epoch": 0.20588235294117646, "percentage": 6.86, "elapsed_time": "0:01:48", "remaining_time": "0:24:32"} +{"current_steps": 99, "total_steps": 1428, "loss": 2.6768596172332764, "lr": 6.853146853146854e-06, "epoch": 0.20798319327731093, "percentage": 6.93, "elapsed_time": "0:01:49", "remaining_time": "0:24:30"} +{"current_steps": 100, "total_steps": 1428, "loss": 2.9336276054382324, "lr": 6.923076923076923e-06, "epoch": 0.21008403361344538, "percentage": 7.0, "elapsed_time": "0:01:50", "remaining_time": "0:24:29"} +{"current_steps": 101, "total_steps": 1428, "loss": 3.103717803955078, "lr": 6.993006993006993e-06, "epoch": 0.21218487394957983, "percentage": 7.07, "elapsed_time": "0:01:51", "remaining_time": "0:24:27"} +{"current_steps": 102, "total_steps": 1428, "loss": 2.7759556770324707, "lr": 7.062937062937063e-06, "epoch": 0.21428571428571427, "percentage": 7.14, "elapsed_time": "0:01:52", "remaining_time": "0:24:26"} +{"current_steps": 103, "total_steps": 1428, "loss": 2.586292266845703, "lr": 7.132867132867134e-06, "epoch": 0.21638655462184875, "percentage": 7.21, "elapsed_time": "0:01:53", "remaining_time": "0:24:24"} +{"current_steps": 104, "total_steps": 1428, "loss": 3.109880208969116, "lr": 7.202797202797203e-06, "epoch": 0.2184873949579832, "percentage": 7.28, "elapsed_time": "0:01:54", "remaining_time": "0:24:23"} +{"current_steps": 105, "total_steps": 1428, "loss": 2.7075915336608887, "lr": 7.272727272727273e-06, "epoch": 0.22058823529411764, "percentage": 7.35, "elapsed_time": "0:01:56", "remaining_time": "0:24:21"} +{"current_steps": 106, "total_steps": 1428, "loss": 3.034566879272461, "lr": 7.342657342657343e-06, "epoch": 0.22268907563025211, "percentage": 7.42, "elapsed_time": "0:01:57", "remaining_time": "0:24:20"} +{"current_steps": 107, "total_steps": 1428, "loss": 2.3479254245758057, "lr": 7.412587412587413e-06, "epoch": 0.22478991596638656, "percentage": 7.49, "elapsed_time": "0:01:58", "remaining_time": "0:24:18"} +{"current_steps": 108, "total_steps": 1428, "loss": 2.9856462478637695, "lr": 7.4825174825174825e-06, "epoch": 0.226890756302521, "percentage": 7.56, "elapsed_time": "0:01:59", "remaining_time": "0:24:17"} +{"current_steps": 109, "total_steps": 1428, "loss": 3.462696075439453, "lr": 7.552447552447552e-06, "epoch": 0.22899159663865545, "percentage": 7.63, "elapsed_time": "0:02:00", "remaining_time": "0:24:16"} +{"current_steps": 110, "total_steps": 1428, "loss": 3.270888566970825, "lr": 7.622377622377622e-06, "epoch": 0.23109243697478993, "percentage": 7.7, "elapsed_time": "0:02:01", "remaining_time": "0:24:14"} +{"current_steps": 111, "total_steps": 1428, "loss": 3.048227310180664, "lr": 7.692307692307694e-06, "epoch": 0.23319327731092437, "percentage": 7.77, "elapsed_time": "0:02:02", "remaining_time": "0:24:13"} +{"current_steps": 112, "total_steps": 1428, "loss": 3.2194204330444336, "lr": 7.762237762237763e-06, "epoch": 0.23529411764705882, "percentage": 7.84, "elapsed_time": "0:02:03", "remaining_time": "0:24:11"} +{"current_steps": 113, "total_steps": 1428, "loss": 3.6809778213500977, "lr": 7.832167832167833e-06, "epoch": 0.23739495798319327, "percentage": 7.91, "elapsed_time": "0:02:04", "remaining_time": "0:24:10"} +{"current_steps": 114, "total_steps": 1428, "loss": 2.912044048309326, "lr": 7.902097902097902e-06, "epoch": 0.23949579831932774, "percentage": 7.98, "elapsed_time": "0:02:05", "remaining_time": "0:24:08"} +{"current_steps": 115, "total_steps": 1428, "loss": 3.1021275520324707, "lr": 7.972027972027973e-06, "epoch": 0.2415966386554622, "percentage": 8.05, "elapsed_time": "0:02:06", "remaining_time": "0:24:07"} +{"current_steps": 116, "total_steps": 1428, "loss": 3.089829683303833, "lr": 8.041958041958042e-06, "epoch": 0.24369747899159663, "percentage": 8.12, "elapsed_time": "0:02:07", "remaining_time": "0:24:06"} +{"current_steps": 117, "total_steps": 1428, "loss": 3.4016504287719727, "lr": 8.111888111888112e-06, "epoch": 0.24579831932773108, "percentage": 8.19, "elapsed_time": "0:02:08", "remaining_time": "0:24:04"} +{"current_steps": 118, "total_steps": 1428, "loss": 3.502598285675049, "lr": 8.181818181818183e-06, "epoch": 0.24789915966386555, "percentage": 8.26, "elapsed_time": "0:02:10", "remaining_time": "0:24:03"} +{"current_steps": 119, "total_steps": 1428, "loss": 3.0750184059143066, "lr": 8.251748251748254e-06, "epoch": 0.25, "percentage": 8.33, "elapsed_time": "0:02:11", "remaining_time": "0:24:02"} +{"current_steps": 120, "total_steps": 1428, "loss": 2.8168656826019287, "lr": 8.321678321678323e-06, "epoch": 0.25210084033613445, "percentage": 8.4, "elapsed_time": "0:02:12", "remaining_time": "0:24:00"} +{"current_steps": 121, "total_steps": 1428, "loss": 2.3565826416015625, "lr": 8.391608391608393e-06, "epoch": 0.2542016806722689, "percentage": 8.47, "elapsed_time": "0:02:13", "remaining_time": "0:23:59"} +{"current_steps": 122, "total_steps": 1428, "loss": 2.972810745239258, "lr": 8.461538461538462e-06, "epoch": 0.25630252100840334, "percentage": 8.54, "elapsed_time": "0:02:14", "remaining_time": "0:23:57"} +{"current_steps": 123, "total_steps": 1428, "loss": 2.9700140953063965, "lr": 8.531468531468533e-06, "epoch": 0.25840336134453784, "percentage": 8.61, "elapsed_time": "0:02:15", "remaining_time": "0:23:56"} +{"current_steps": 124, "total_steps": 1428, "loss": 3.0162484645843506, "lr": 8.601398601398602e-06, "epoch": 0.2605042016806723, "percentage": 8.68, "elapsed_time": "0:02:16", "remaining_time": "0:23:55"} +{"current_steps": 125, "total_steps": 1428, "loss": 3.109422445297241, "lr": 8.671328671328672e-06, "epoch": 0.26260504201680673, "percentage": 8.75, "elapsed_time": "0:02:17", "remaining_time": "0:23:54"} +{"current_steps": 126, "total_steps": 1428, "loss": 2.6802124977111816, "lr": 8.741258741258743e-06, "epoch": 0.2647058823529412, "percentage": 8.82, "elapsed_time": "0:02:18", "remaining_time": "0:23:52"} +{"current_steps": 127, "total_steps": 1428, "loss": 2.6609840393066406, "lr": 8.811188811188812e-06, "epoch": 0.2668067226890756, "percentage": 8.89, "elapsed_time": "0:02:19", "remaining_time": "0:23:51"} +{"current_steps": 128, "total_steps": 1428, "loss": 3.0896430015563965, "lr": 8.881118881118883e-06, "epoch": 0.2689075630252101, "percentage": 8.96, "elapsed_time": "0:02:20", "remaining_time": "0:23:49"} +{"current_steps": 129, "total_steps": 1428, "loss": 3.2370247840881348, "lr": 8.951048951048951e-06, "epoch": 0.2710084033613445, "percentage": 9.03, "elapsed_time": "0:02:21", "remaining_time": "0:23:48"} +{"current_steps": 130, "total_steps": 1428, "loss": 2.8461947441101074, "lr": 9.020979020979022e-06, "epoch": 0.27310924369747897, "percentage": 9.1, "elapsed_time": "0:02:22", "remaining_time": "0:23:47"} +{"current_steps": 131, "total_steps": 1428, "loss": 3.480252742767334, "lr": 9.090909090909091e-06, "epoch": 0.27521008403361347, "percentage": 9.17, "elapsed_time": "0:02:24", "remaining_time": "0:23:45"} +{"current_steps": 132, "total_steps": 1428, "loss": 2.8424923419952393, "lr": 9.160839160839162e-06, "epoch": 0.2773109243697479, "percentage": 9.24, "elapsed_time": "0:02:25", "remaining_time": "0:23:44"} +{"current_steps": 133, "total_steps": 1428, "loss": 3.4489340782165527, "lr": 9.230769230769232e-06, "epoch": 0.27941176470588236, "percentage": 9.31, "elapsed_time": "0:02:26", "remaining_time": "0:23:43"} +{"current_steps": 134, "total_steps": 1428, "loss": 2.48683500289917, "lr": 9.300699300699301e-06, "epoch": 0.2815126050420168, "percentage": 9.38, "elapsed_time": "0:02:27", "remaining_time": "0:23:42"} +{"current_steps": 135, "total_steps": 1428, "loss": 2.975668430328369, "lr": 9.370629370629372e-06, "epoch": 0.28361344537815125, "percentage": 9.45, "elapsed_time": "0:02:28", "remaining_time": "0:23:40"} +{"current_steps": 136, "total_steps": 1428, "loss": 3.163745403289795, "lr": 9.44055944055944e-06, "epoch": 0.2857142857142857, "percentage": 9.52, "elapsed_time": "0:02:29", "remaining_time": "0:23:39"} +{"current_steps": 137, "total_steps": 1428, "loss": 3.3047399520874023, "lr": 9.510489510489511e-06, "epoch": 0.28781512605042014, "percentage": 9.59, "elapsed_time": "0:02:30", "remaining_time": "0:23:38"} +{"current_steps": 138, "total_steps": 1428, "loss": 2.901014804840088, "lr": 9.58041958041958e-06, "epoch": 0.28991596638655465, "percentage": 9.66, "elapsed_time": "0:02:31", "remaining_time": "0:23:37"} +{"current_steps": 139, "total_steps": 1428, "loss": 2.4749934673309326, "lr": 9.650349650349651e-06, "epoch": 0.2920168067226891, "percentage": 9.73, "elapsed_time": "0:02:32", "remaining_time": "0:23:35"} +{"current_steps": 140, "total_steps": 1428, "loss": 2.735682964324951, "lr": 9.72027972027972e-06, "epoch": 0.29411764705882354, "percentage": 9.8, "elapsed_time": "0:02:33", "remaining_time": "0:23:34"} +{"current_steps": 141, "total_steps": 1428, "loss": 1.6851799488067627, "lr": 9.79020979020979e-06, "epoch": 0.296218487394958, "percentage": 9.87, "elapsed_time": "0:02:34", "remaining_time": "0:23:33"} +{"current_steps": 142, "total_steps": 1428, "loss": 2.4892358779907227, "lr": 9.860139860139861e-06, "epoch": 0.29831932773109243, "percentage": 9.94, "elapsed_time": "0:02:35", "remaining_time": "0:23:31"} +{"current_steps": 143, "total_steps": 1428, "loss": 3.152186870574951, "lr": 9.93006993006993e-06, "epoch": 0.3004201680672269, "percentage": 10.01, "elapsed_time": "0:02:36", "remaining_time": "0:23:30"} +{"current_steps": 144, "total_steps": 1428, "loss": 2.4623451232910156, "lr": 1e-05, "epoch": 0.3025210084033613, "percentage": 10.08, "elapsed_time": "0:02:38", "remaining_time": "0:23:29"} +{"current_steps": 145, "total_steps": 1428, "loss": 2.3573660850524902, "lr": 9.999985057155316e-06, "epoch": 0.30462184873949577, "percentage": 10.15, "elapsed_time": "0:02:39", "remaining_time": "0:23:28"} +{"current_steps": 146, "total_steps": 1428, "loss": 3.248166561126709, "lr": 9.999940228710581e-06, "epoch": 0.3067226890756303, "percentage": 10.22, "elapsed_time": "0:02:40", "remaining_time": "0:23:27"} +{"current_steps": 147, "total_steps": 1428, "loss": 3.073438882827759, "lr": 9.99986551493374e-06, "epoch": 0.3088235294117647, "percentage": 10.29, "elapsed_time": "0:02:41", "remaining_time": "0:23:25"} +{"current_steps": 148, "total_steps": 1428, "loss": 3.175532579421997, "lr": 9.999760916271368e-06, "epoch": 0.31092436974789917, "percentage": 10.36, "elapsed_time": "0:02:42", "remaining_time": "0:23:24"} +{"current_steps": 149, "total_steps": 1428, "loss": 2.2849655151367188, "lr": 9.999626433348664e-06, "epoch": 0.3130252100840336, "percentage": 10.43, "elapsed_time": "0:02:43", "remaining_time": "0:23:23"} +{"current_steps": 150, "total_steps": 1428, "loss": 2.7922751903533936, "lr": 9.999462066969451e-06, "epoch": 0.31512605042016806, "percentage": 10.5, "elapsed_time": "0:02:44", "remaining_time": "0:23:22"} +{"current_steps": 151, "total_steps": 1428, "loss": 3.03188419342041, "lr": 9.999267818116173e-06, "epoch": 0.3172268907563025, "percentage": 10.57, "elapsed_time": "0:02:45", "remaining_time": "0:23:20"} +{"current_steps": 152, "total_steps": 1428, "loss": 3.3826239109039307, "lr": 9.999043687949878e-06, "epoch": 0.31932773109243695, "percentage": 10.64, "elapsed_time": "0:02:46", "remaining_time": "0:23:19"} +{"current_steps": 153, "total_steps": 1428, "loss": 3.103822708129883, "lr": 9.998789677810226e-06, "epoch": 0.32142857142857145, "percentage": 10.71, "elapsed_time": "0:02:47", "remaining_time": "0:23:18"} +{"current_steps": 154, "total_steps": 1428, "loss": 2.633566379547119, "lr": 9.998505789215469e-06, "epoch": 0.3235294117647059, "percentage": 10.78, "elapsed_time": "0:02:48", "remaining_time": "0:23:16"} +{"current_steps": 155, "total_steps": 1428, "loss": 2.937821388244629, "lr": 9.998192023862448e-06, "epoch": 0.32563025210084034, "percentage": 10.85, "elapsed_time": "0:02:49", "remaining_time": "0:23:15"} +{"current_steps": 156, "total_steps": 1428, "loss": 3.0057592391967773, "lr": 9.997848383626583e-06, "epoch": 0.3277310924369748, "percentage": 10.92, "elapsed_time": "0:02:51", "remaining_time": "0:23:14"} +{"current_steps": 157, "total_steps": 1428, "loss": 3.4198083877563477, "lr": 9.997474870561858e-06, "epoch": 0.32983193277310924, "percentage": 10.99, "elapsed_time": "0:02:52", "remaining_time": "0:23:13"} +{"current_steps": 158, "total_steps": 1428, "loss": 2.748509407043457, "lr": 9.997071486900813e-06, "epoch": 0.3319327731092437, "percentage": 11.06, "elapsed_time": "0:02:53", "remaining_time": "0:23:11"} +{"current_steps": 159, "total_steps": 1428, "loss": 3.3422679901123047, "lr": 9.996638235054527e-06, "epoch": 0.33403361344537813, "percentage": 11.13, "elapsed_time": "0:02:54", "remaining_time": "0:23:10"} +{"current_steps": 160, "total_steps": 1428, "loss": 3.2214763164520264, "lr": 9.996175117612608e-06, "epoch": 0.33613445378151263, "percentage": 11.2, "elapsed_time": "0:02:55", "remaining_time": "0:23:09"} +{"current_steps": 161, "total_steps": 1428, "loss": 2.5538628101348877, "lr": 9.99568213734317e-06, "epoch": 0.3382352941176471, "percentage": 11.27, "elapsed_time": "0:02:56", "remaining_time": "0:23:08"} +{"current_steps": 162, "total_steps": 1428, "loss": 2.781787872314453, "lr": 9.995159297192824e-06, "epoch": 0.3403361344537815, "percentage": 11.34, "elapsed_time": "0:02:57", "remaining_time": "0:23:07"} +{"current_steps": 163, "total_steps": 1428, "loss": 3.3784282207489014, "lr": 9.99460660028666e-06, "epoch": 0.34243697478991597, "percentage": 11.41, "elapsed_time": "0:02:58", "remaining_time": "0:23:05"} +{"current_steps": 164, "total_steps": 1428, "loss": 3.2824249267578125, "lr": 9.994024049928222e-06, "epoch": 0.3445378151260504, "percentage": 11.48, "elapsed_time": "0:02:59", "remaining_time": "0:23:04"} +{"current_steps": 165, "total_steps": 1428, "loss": 2.589594841003418, "lr": 9.993411649599494e-06, "epoch": 0.34663865546218486, "percentage": 11.55, "elapsed_time": "0:03:00", "remaining_time": "0:23:03"} +{"current_steps": 166, "total_steps": 1428, "loss": 3.7193164825439453, "lr": 9.992769402960878e-06, "epoch": 0.3487394957983193, "percentage": 11.62, "elapsed_time": "0:03:01", "remaining_time": "0:23:02"} +{"current_steps": 167, "total_steps": 1428, "loss": 2.823063611984253, "lr": 9.99209731385117e-06, "epoch": 0.35084033613445376, "percentage": 11.69, "elapsed_time": "0:03:02", "remaining_time": "0:23:00"} +{"current_steps": 168, "total_steps": 1428, "loss": 3.1389951705932617, "lr": 9.99139538628754e-06, "epoch": 0.35294117647058826, "percentage": 11.76, "elapsed_time": "0:03:03", "remaining_time": "0:22:59"} +{"current_steps": 169, "total_steps": 1428, "loss": 2.9536495208740234, "lr": 9.990663624465504e-06, "epoch": 0.3550420168067227, "percentage": 11.83, "elapsed_time": "0:03:05", "remaining_time": "0:22:58"} +{"current_steps": 170, "total_steps": 1428, "loss": 2.6355466842651367, "lr": 9.989902032758904e-06, "epoch": 0.35714285714285715, "percentage": 11.9, "elapsed_time": "0:03:06", "remaining_time": "0:22:57"} +{"current_steps": 171, "total_steps": 1428, "loss": 1.1800763607025146, "lr": 9.989110615719882e-06, "epoch": 0.3592436974789916, "percentage": 11.97, "elapsed_time": "0:03:07", "remaining_time": "0:22:56"} +{"current_steps": 172, "total_steps": 1428, "loss": 2.679232358932495, "lr": 9.988289378078842e-06, "epoch": 0.36134453781512604, "percentage": 12.04, "elapsed_time": "0:03:08", "remaining_time": "0:22:54"} +{"current_steps": 173, "total_steps": 1428, "loss": 2.3583908081054688, "lr": 9.987438324744437e-06, "epoch": 0.3634453781512605, "percentage": 12.11, "elapsed_time": "0:03:09", "remaining_time": "0:22:53"} +{"current_steps": 174, "total_steps": 1428, "loss": 2.748077392578125, "lr": 9.986557460803527e-06, "epoch": 0.36554621848739494, "percentage": 12.18, "elapsed_time": "0:03:10", "remaining_time": "0:22:52"} +{"current_steps": 175, "total_steps": 1428, "loss": 3.2660067081451416, "lr": 9.985646791521165e-06, "epoch": 0.36764705882352944, "percentage": 12.25, "elapsed_time": "0:03:11", "remaining_time": "0:22:51"} +{"current_steps": 176, "total_steps": 1428, "loss": 2.9270148277282715, "lr": 9.984706322340539e-06, "epoch": 0.3697478991596639, "percentage": 12.32, "elapsed_time": "0:03:12", "remaining_time": "0:22:49"} +{"current_steps": 177, "total_steps": 1428, "loss": 2.455327033996582, "lr": 9.983736058882965e-06, "epoch": 0.37184873949579833, "percentage": 12.39, "elapsed_time": "0:03:13", "remaining_time": "0:22:48"} +{"current_steps": 178, "total_steps": 1428, "loss": 3.171403169631958, "lr": 9.982736006947842e-06, "epoch": 0.3739495798319328, "percentage": 12.46, "elapsed_time": "0:03:14", "remaining_time": "0:22:47"} +{"current_steps": 179, "total_steps": 1428, "loss": 2.6023473739624023, "lr": 9.98170617251262e-06, "epoch": 0.3760504201680672, "percentage": 12.54, "elapsed_time": "0:03:15", "remaining_time": "0:22:46"} +{"current_steps": 180, "total_steps": 1428, "loss": 2.7492432594299316, "lr": 9.98064656173276e-06, "epoch": 0.37815126050420167, "percentage": 12.61, "elapsed_time": "0:03:16", "remaining_time": "0:22:45"} +{"current_steps": 181, "total_steps": 1428, "loss": 3.520758628845215, "lr": 9.979557180941702e-06, "epoch": 0.3802521008403361, "percentage": 12.68, "elapsed_time": "0:03:18", "remaining_time": "0:22:44"} +{"current_steps": 182, "total_steps": 1428, "loss": 2.7245442867279053, "lr": 9.978438036650822e-06, "epoch": 0.38235294117647056, "percentage": 12.75, "elapsed_time": "0:03:19", "remaining_time": "0:22:42"} +{"current_steps": 183, "total_steps": 1428, "loss": 2.790768623352051, "lr": 9.977289135549404e-06, "epoch": 0.38445378151260506, "percentage": 12.82, "elapsed_time": "0:03:20", "remaining_time": "0:22:41"} +{"current_steps": 184, "total_steps": 1428, "loss": 2.5588126182556152, "lr": 9.976110484504587e-06, "epoch": 0.3865546218487395, "percentage": 12.89, "elapsed_time": "0:03:21", "remaining_time": "0:22:40"} +{"current_steps": 185, "total_steps": 1428, "loss": 3.0367865562438965, "lr": 9.974902090561331e-06, "epoch": 0.38865546218487396, "percentage": 12.96, "elapsed_time": "0:03:22", "remaining_time": "0:22:39"} +{"current_steps": 186, "total_steps": 1428, "loss": 3.1013669967651367, "lr": 9.973663960942373e-06, "epoch": 0.3907563025210084, "percentage": 13.03, "elapsed_time": "0:03:23", "remaining_time": "0:22:38"} +{"current_steps": 187, "total_steps": 1428, "loss": 2.678436279296875, "lr": 9.972396103048184e-06, "epoch": 0.39285714285714285, "percentage": 13.1, "elapsed_time": "0:03:24", "remaining_time": "0:22:36"} +{"current_steps": 188, "total_steps": 1428, "loss": 2.866910696029663, "lr": 9.971098524456925e-06, "epoch": 0.3949579831932773, "percentage": 13.17, "elapsed_time": "0:03:25", "remaining_time": "0:22:35"} +{"current_steps": 189, "total_steps": 1428, "loss": 2.6690807342529297, "lr": 9.969771232924404e-06, "epoch": 0.39705882352941174, "percentage": 13.24, "elapsed_time": "0:03:26", "remaining_time": "0:22:34"} +{"current_steps": 190, "total_steps": 1428, "loss": 2.615846633911133, "lr": 9.968414236384022e-06, "epoch": 0.39915966386554624, "percentage": 13.31, "elapsed_time": "0:03:27", "remaining_time": "0:22:33"} +{"current_steps": 191, "total_steps": 1428, "loss": 3.197604179382324, "lr": 9.967027542946739e-06, "epoch": 0.4012605042016807, "percentage": 13.38, "elapsed_time": "0:03:28", "remaining_time": "0:22:31"} +{"current_steps": 192, "total_steps": 1428, "loss": 1.584808349609375, "lr": 9.965611160901008e-06, "epoch": 0.40336134453781514, "percentage": 13.45, "elapsed_time": "0:03:29", "remaining_time": "0:22:30"} +{"current_steps": 193, "total_steps": 1428, "loss": 2.7913365364074707, "lr": 9.964165098712745e-06, "epoch": 0.4054621848739496, "percentage": 13.52, "elapsed_time": "0:03:30", "remaining_time": "0:22:29"} +{"current_steps": 194, "total_steps": 1428, "loss": 3.42575740814209, "lr": 9.962689365025259e-06, "epoch": 0.40756302521008403, "percentage": 13.59, "elapsed_time": "0:03:31", "remaining_time": "0:22:28"} +{"current_steps": 195, "total_steps": 1428, "loss": 2.6931188106536865, "lr": 9.961183968659217e-06, "epoch": 0.4096638655462185, "percentage": 13.66, "elapsed_time": "0:03:33", "remaining_time": "0:22:27"} +{"current_steps": 196, "total_steps": 1428, "loss": 2.4463605880737305, "lr": 9.959648918612576e-06, "epoch": 0.4117647058823529, "percentage": 13.73, "elapsed_time": "0:03:34", "remaining_time": "0:22:26"} +{"current_steps": 197, "total_steps": 1428, "loss": 2.647773265838623, "lr": 9.958084224060547e-06, "epoch": 0.41386554621848737, "percentage": 13.8, "elapsed_time": "0:03:35", "remaining_time": "0:22:24"} +{"current_steps": 198, "total_steps": 1428, "loss": 2.660770893096924, "lr": 9.956489894355521e-06, "epoch": 0.41596638655462187, "percentage": 13.87, "elapsed_time": "0:03:36", "remaining_time": "0:22:23"} +{"current_steps": 199, "total_steps": 1428, "loss": 3.627254009246826, "lr": 9.954865939027028e-06, "epoch": 0.4180672268907563, "percentage": 13.94, "elapsed_time": "0:03:37", "remaining_time": "0:22:22"} +{"current_steps": 200, "total_steps": 1428, "loss": 2.683685779571533, "lr": 9.953212367781675e-06, "epoch": 0.42016806722689076, "percentage": 14.01, "elapsed_time": "0:03:38", "remaining_time": "0:22:21"} +{"current_steps": 201, "total_steps": 1428, "loss": 2.7249388694763184, "lr": 9.95152919050308e-06, "epoch": 0.4222689075630252, "percentage": 14.08, "elapsed_time": "0:03:39", "remaining_time": "0:22:20"} +{"current_steps": 202, "total_steps": 1428, "loss": 2.933401107788086, "lr": 9.949816417251831e-06, "epoch": 0.42436974789915966, "percentage": 14.15, "elapsed_time": "0:03:40", "remaining_time": "0:22:19"} +{"current_steps": 203, "total_steps": 1428, "loss": 3.5457630157470703, "lr": 9.948074058265409e-06, "epoch": 0.4264705882352941, "percentage": 14.22, "elapsed_time": "0:03:41", "remaining_time": "0:22:17"} +{"current_steps": 204, "total_steps": 1428, "loss": 2.483736038208008, "lr": 9.94630212395813e-06, "epoch": 0.42857142857142855, "percentage": 14.29, "elapsed_time": "0:03:42", "remaining_time": "0:22:16"} +{"current_steps": 205, "total_steps": 1428, "loss": 2.470374584197998, "lr": 9.944500624921094e-06, "epoch": 0.43067226890756305, "percentage": 14.36, "elapsed_time": "0:03:43", "remaining_time": "0:22:15"} +{"current_steps": 206, "total_steps": 1428, "loss": 3.2255494594573975, "lr": 9.942669571922108e-06, "epoch": 0.4327731092436975, "percentage": 14.43, "elapsed_time": "0:03:44", "remaining_time": "0:22:14"} +{"current_steps": 207, "total_steps": 1428, "loss": 3.4820542335510254, "lr": 9.940808975905627e-06, "epoch": 0.43487394957983194, "percentage": 14.5, "elapsed_time": "0:03:46", "remaining_time": "0:22:13"} +{"current_steps": 208, "total_steps": 1428, "loss": 3.218539237976074, "lr": 9.93891884799269e-06, "epoch": 0.4369747899159664, "percentage": 14.57, "elapsed_time": "0:03:47", "remaining_time": "0:22:11"} +{"current_steps": 209, "total_steps": 1428, "loss": 2.8428990840911865, "lr": 9.936999199480854e-06, "epoch": 0.43907563025210083, "percentage": 14.64, "elapsed_time": "0:03:48", "remaining_time": "0:22:10"} +{"current_steps": 210, "total_steps": 1428, "loss": 3.661019802093506, "lr": 9.935050041844121e-06, "epoch": 0.4411764705882353, "percentage": 14.71, "elapsed_time": "0:03:49", "remaining_time": "0:22:09"} +{"current_steps": 211, "total_steps": 1428, "loss": 3.330902338027954, "lr": 9.933071386732874e-06, "epoch": 0.4432773109243697, "percentage": 14.78, "elapsed_time": "0:03:50", "remaining_time": "0:22:08"} +{"current_steps": 212, "total_steps": 1428, "loss": 2.7754883766174316, "lr": 9.931063245973812e-06, "epoch": 0.44537815126050423, "percentage": 14.85, "elapsed_time": "0:03:51", "remaining_time": "0:22:07"} +{"current_steps": 213, "total_steps": 1428, "loss": 2.3284661769866943, "lr": 9.929025631569864e-06, "epoch": 0.4474789915966387, "percentage": 14.92, "elapsed_time": "0:03:52", "remaining_time": "0:22:06"} +{"current_steps": 214, "total_steps": 1428, "loss": 2.599228858947754, "lr": 9.926958555700134e-06, "epoch": 0.4495798319327731, "percentage": 14.99, "elapsed_time": "0:03:53", "remaining_time": "0:22:04"} +{"current_steps": 215, "total_steps": 1428, "loss": 3.174004077911377, "lr": 9.924862030719821e-06, "epoch": 0.45168067226890757, "percentage": 15.06, "elapsed_time": "0:03:54", "remaining_time": "0:22:03"} +{"current_steps": 216, "total_steps": 1428, "loss": 2.7390694618225098, "lr": 9.922736069160141e-06, "epoch": 0.453781512605042, "percentage": 15.13, "elapsed_time": "0:03:55", "remaining_time": "0:22:02"} +{"current_steps": 217, "total_steps": 1428, "loss": 2.7388081550598145, "lr": 9.920580683728263e-06, "epoch": 0.45588235294117646, "percentage": 15.2, "elapsed_time": "0:03:56", "remaining_time": "0:22:01"} +{"current_steps": 218, "total_steps": 1428, "loss": 2.4359140396118164, "lr": 9.918395887307219e-06, "epoch": 0.4579831932773109, "percentage": 15.27, "elapsed_time": "0:03:57", "remaining_time": "0:22:00"} +{"current_steps": 219, "total_steps": 1428, "loss": 2.9688220024108887, "lr": 9.916181692955841e-06, "epoch": 0.46008403361344535, "percentage": 15.34, "elapsed_time": "0:03:58", "remaining_time": "0:21:59"} +{"current_steps": 220, "total_steps": 1428, "loss": 3.1534006595611572, "lr": 9.913938113908675e-06, "epoch": 0.46218487394957986, "percentage": 15.41, "elapsed_time": "0:04:00", "remaining_time": "0:21:58"} +{"current_steps": 221, "total_steps": 1428, "loss": 2.618938684463501, "lr": 9.9116651635759e-06, "epoch": 0.4642857142857143, "percentage": 15.48, "elapsed_time": "0:04:01", "remaining_time": "0:21:56"} +{"current_steps": 222, "total_steps": 1428, "loss": 2.844968318939209, "lr": 9.909362855543253e-06, "epoch": 0.46638655462184875, "percentage": 15.55, "elapsed_time": "0:04:02", "remaining_time": "0:21:55"} +{"current_steps": 223, "total_steps": 1428, "loss": 2.4792628288269043, "lr": 9.907031203571948e-06, "epoch": 0.4684873949579832, "percentage": 15.62, "elapsed_time": "0:04:03", "remaining_time": "0:21:54"} +{"current_steps": 224, "total_steps": 1428, "loss": 2.894502639770508, "lr": 9.90467022159859e-06, "epoch": 0.47058823529411764, "percentage": 15.69, "elapsed_time": "0:04:04", "remaining_time": "0:21:53"} +{"current_steps": 225, "total_steps": 1428, "loss": 2.792015552520752, "lr": 9.902279923735093e-06, "epoch": 0.4726890756302521, "percentage": 15.76, "elapsed_time": "0:04:05", "remaining_time": "0:21:52"} +{"current_steps": 226, "total_steps": 1428, "loss": 2.9171247482299805, "lr": 9.899860324268599e-06, "epoch": 0.47478991596638653, "percentage": 15.83, "elapsed_time": "0:04:06", "remaining_time": "0:21:50"} +{"current_steps": 227, "total_steps": 1428, "loss": 2.560214042663574, "lr": 9.897411437661386e-06, "epoch": 0.47689075630252103, "percentage": 15.9, "elapsed_time": "0:04:07", "remaining_time": "0:21:49"} +{"current_steps": 228, "total_steps": 1428, "loss": 3.2796883583068848, "lr": 9.894933278550785e-06, "epoch": 0.4789915966386555, "percentage": 15.97, "elapsed_time": "0:04:08", "remaining_time": "0:21:48"} +{"current_steps": 229, "total_steps": 1428, "loss": 3.0324971675872803, "lr": 9.8924258617491e-06, "epoch": 0.4810924369747899, "percentage": 16.04, "elapsed_time": "0:04:09", "remaining_time": "0:21:47"} +{"current_steps": 230, "total_steps": 1428, "loss": 3.3899683952331543, "lr": 9.8898892022435e-06, "epoch": 0.4831932773109244, "percentage": 16.11, "elapsed_time": "0:04:10", "remaining_time": "0:21:46"} +{"current_steps": 231, "total_steps": 1428, "loss": 2.742903709411621, "lr": 9.887323315195956e-06, "epoch": 0.4852941176470588, "percentage": 16.18, "elapsed_time": "0:04:11", "remaining_time": "0:21:45"} +{"current_steps": 232, "total_steps": 1428, "loss": 3.230966806411743, "lr": 9.884728215943122e-06, "epoch": 0.48739495798319327, "percentage": 16.25, "elapsed_time": "0:04:12", "remaining_time": "0:21:44"} +{"current_steps": 233, "total_steps": 1428, "loss": 2.8818302154541016, "lr": 9.882103919996268e-06, "epoch": 0.4894957983193277, "percentage": 16.32, "elapsed_time": "0:04:14", "remaining_time": "0:21:42"} +{"current_steps": 234, "total_steps": 1428, "loss": 2.358765125274658, "lr": 9.879450443041172e-06, "epoch": 0.49159663865546216, "percentage": 16.39, "elapsed_time": "0:04:15", "remaining_time": "0:21:41"} +{"current_steps": 235, "total_steps": 1428, "loss": 3.0420098304748535, "lr": 9.876767800938032e-06, "epoch": 0.49369747899159666, "percentage": 16.46, "elapsed_time": "0:04:16", "remaining_time": "0:21:40"} +{"current_steps": 236, "total_steps": 1428, "loss": 2.9595160484313965, "lr": 9.874056009721367e-06, "epoch": 0.4957983193277311, "percentage": 16.53, "elapsed_time": "0:04:17", "remaining_time": "0:21:39"} +{"current_steps": 237, "total_steps": 1428, "loss": 2.9571242332458496, "lr": 9.87131508559993e-06, "epoch": 0.49789915966386555, "percentage": 16.6, "elapsed_time": "0:04:18", "remaining_time": "0:21:38"} +{"current_steps": 238, "total_steps": 1428, "loss": 2.798694610595703, "lr": 9.868545044956603e-06, "epoch": 0.5, "percentage": 16.67, "elapsed_time": "0:04:19", "remaining_time": "0:21:37"} +{"current_steps": 239, "total_steps": 1428, "loss": 2.9430432319641113, "lr": 9.865745904348296e-06, "epoch": 0.5021008403361344, "percentage": 16.74, "elapsed_time": "0:04:20", "remaining_time": "0:21:36"} +{"current_steps": 240, "total_steps": 1428, "loss": 3.065462112426758, "lr": 9.862917680505863e-06, "epoch": 0.5042016806722689, "percentage": 16.81, "elapsed_time": "0:04:21", "remaining_time": "0:21:35"} +{"current_steps": 241, "total_steps": 1428, "loss": 3.8562116622924805, "lr": 9.860060390333988e-06, "epoch": 0.5063025210084033, "percentage": 16.88, "elapsed_time": "0:04:22", "remaining_time": "0:21:33"} +{"current_steps": 242, "total_steps": 1428, "loss": 2.645123243331909, "lr": 9.857174050911085e-06, "epoch": 0.5084033613445378, "percentage": 16.95, "elapsed_time": "0:04:23", "remaining_time": "0:21:32"} +{"current_steps": 243, "total_steps": 1428, "loss": 2.500267744064331, "lr": 9.854258679489203e-06, "epoch": 0.5105042016806722, "percentage": 17.02, "elapsed_time": "0:04:24", "remaining_time": "0:21:31"} +{"current_steps": 244, "total_steps": 1428, "loss": 2.553537368774414, "lr": 9.851314293493923e-06, "epoch": 0.5126050420168067, "percentage": 17.09, "elapsed_time": "0:04:25", "remaining_time": "0:21:30"} +{"current_steps": 245, "total_steps": 1428, "loss": 2.694528102874756, "lr": 9.848340910524243e-06, "epoch": 0.5147058823529411, "percentage": 17.16, "elapsed_time": "0:04:27", "remaining_time": "0:21:29"} +{"current_steps": 246, "total_steps": 1428, "loss": 3.2089271545410156, "lr": 9.845338548352482e-06, "epoch": 0.5168067226890757, "percentage": 17.23, "elapsed_time": "0:04:28", "remaining_time": "0:21:28"} +{"current_steps": 247, "total_steps": 1428, "loss": 2.443826198577881, "lr": 9.842307224924174e-06, "epoch": 0.5189075630252101, "percentage": 17.3, "elapsed_time": "0:04:29", "remaining_time": "0:21:27"} +{"current_steps": 248, "total_steps": 1428, "loss": 2.9329233169555664, "lr": 9.839246958357957e-06, "epoch": 0.5210084033613446, "percentage": 17.37, "elapsed_time": "0:04:30", "remaining_time": "0:21:26"} +{"current_steps": 249, "total_steps": 1428, "loss": 2.5171399116516113, "lr": 9.836157766945467e-06, "epoch": 0.523109243697479, "percentage": 17.44, "elapsed_time": "0:04:31", "remaining_time": "0:21:25"} +{"current_steps": 250, "total_steps": 1428, "loss": 3.0069408416748047, "lr": 9.833039669151225e-06, "epoch": 0.5252100840336135, "percentage": 17.51, "elapsed_time": "0:04:32", "remaining_time": "0:21:25"} +{"current_steps": 251, "total_steps": 1428, "loss": 2.5816359519958496, "lr": 9.829892683612535e-06, "epoch": 0.5273109243697479, "percentage": 17.58, "elapsed_time": "0:04:33", "remaining_time": "0:21:24"} +{"current_steps": 252, "total_steps": 1428, "loss": 2.3982670307159424, "lr": 9.826716829139358e-06, "epoch": 0.5294117647058824, "percentage": 17.65, "elapsed_time": "0:04:34", "remaining_time": "0:21:22"} +{"current_steps": 253, "total_steps": 1428, "loss": 2.975574016571045, "lr": 9.82351212471422e-06, "epoch": 0.5315126050420168, "percentage": 17.72, "elapsed_time": "0:04:35", "remaining_time": "0:21:21"} +{"current_steps": 254, "total_steps": 1428, "loss": 2.4827775955200195, "lr": 9.820278589492076e-06, "epoch": 0.5336134453781513, "percentage": 17.79, "elapsed_time": "0:04:37", "remaining_time": "0:21:20"} +{"current_steps": 255, "total_steps": 1428, "loss": 2.690033197402954, "lr": 9.817016242800215e-06, "epoch": 0.5357142857142857, "percentage": 17.86, "elapsed_time": "0:04:38", "remaining_time": "0:21:19"} +{"current_steps": 256, "total_steps": 1428, "loss": 3.346949338912964, "lr": 9.813725104138133e-06, "epoch": 0.5378151260504201, "percentage": 17.93, "elapsed_time": "0:04:39", "remaining_time": "0:21:18"} +{"current_steps": 257, "total_steps": 1428, "loss": 2.6791281700134277, "lr": 9.810405193177418e-06, "epoch": 0.5399159663865546, "percentage": 18.0, "elapsed_time": "0:04:40", "remaining_time": "0:21:16"} +{"current_steps": 258, "total_steps": 1428, "loss": 2.853158950805664, "lr": 9.807056529761637e-06, "epoch": 0.542016806722689, "percentage": 18.07, "elapsed_time": "0:04:41", "remaining_time": "0:21:15"} +{"current_steps": 259, "total_steps": 1428, "loss": 3.1636295318603516, "lr": 9.80367913390621e-06, "epoch": 0.5441176470588235, "percentage": 18.14, "elapsed_time": "0:04:42", "remaining_time": "0:21:14"} +{"current_steps": 260, "total_steps": 1428, "loss": 2.5055313110351562, "lr": 9.800273025798302e-06, "epoch": 0.5462184873949579, "percentage": 18.21, "elapsed_time": "0:04:43", "remaining_time": "0:21:13"} +{"current_steps": 261, "total_steps": 1428, "loss": 2.9986414909362793, "lr": 9.796838225796688e-06, "epoch": 0.5483193277310925, "percentage": 18.28, "elapsed_time": "0:04:44", "remaining_time": "0:21:12"} +{"current_steps": 262, "total_steps": 1428, "loss": 2.419975757598877, "lr": 9.793374754431642e-06, "epoch": 0.5504201680672269, "percentage": 18.35, "elapsed_time": "0:04:45", "remaining_time": "0:21:11"} +{"current_steps": 263, "total_steps": 1428, "loss": 3.0301923751831055, "lr": 9.789882632404809e-06, "epoch": 0.5525210084033614, "percentage": 18.42, "elapsed_time": "0:04:46", "remaining_time": "0:21:09"} +{"current_steps": 264, "total_steps": 1428, "loss": 2.846034526824951, "lr": 9.786361880589084e-06, "epoch": 0.5546218487394958, "percentage": 18.49, "elapsed_time": "0:04:47", "remaining_time": "0:21:08"} +{"current_steps": 265, "total_steps": 1428, "loss": 3.250943183898926, "lr": 9.782812520028487e-06, "epoch": 0.5567226890756303, "percentage": 18.56, "elapsed_time": "0:04:48", "remaining_time": "0:21:07"} +{"current_steps": 266, "total_steps": 1428, "loss": 2.5069515705108643, "lr": 9.779234571938034e-06, "epoch": 0.5588235294117647, "percentage": 18.63, "elapsed_time": "0:04:49", "remaining_time": "0:21:06"} +{"current_steps": 267, "total_steps": 1428, "loss": 2.2883377075195312, "lr": 9.775628057703616e-06, "epoch": 0.5609243697478992, "percentage": 18.7, "elapsed_time": "0:04:50", "remaining_time": "0:21:05"} +{"current_steps": 268, "total_steps": 1428, "loss": 1.8844149112701416, "lr": 9.771992998881865e-06, "epoch": 0.5630252100840336, "percentage": 18.77, "elapsed_time": "0:04:52", "remaining_time": "0:21:04"} +{"current_steps": 269, "total_steps": 1428, "loss": 2.608553409576416, "lr": 9.768329417200029e-06, "epoch": 0.5651260504201681, "percentage": 18.84, "elapsed_time": "0:04:53", "remaining_time": "0:21:03"} +{"current_steps": 270, "total_steps": 1428, "loss": 2.8849685192108154, "lr": 9.76463733455584e-06, "epoch": 0.5672268907563025, "percentage": 18.91, "elapsed_time": "0:04:54", "remaining_time": "0:21:01"} +{"current_steps": 271, "total_steps": 1428, "loss": 2.83829402923584, "lr": 9.760916773017386e-06, "epoch": 0.569327731092437, "percentage": 18.98, "elapsed_time": "0:04:55", "remaining_time": "0:21:00"} +{"current_steps": 272, "total_steps": 1428, "loss": 2.6053004264831543, "lr": 9.757167754822974e-06, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:04:56", "remaining_time": "0:20:59"} +{"current_steps": 273, "total_steps": 1428, "loss": 2.8338804244995117, "lr": 9.753390302381006e-06, "epoch": 0.5735294117647058, "percentage": 19.12, "elapsed_time": "0:04:57", "remaining_time": "0:20:58"} +{"current_steps": 274, "total_steps": 1428, "loss": 2.979978084564209, "lr": 9.749584438269833e-06, "epoch": 0.5756302521008403, "percentage": 19.19, "elapsed_time": "0:04:58", "remaining_time": "0:20:57"} +{"current_steps": 275, "total_steps": 1428, "loss": 1.8241777420043945, "lr": 9.74575018523763e-06, "epoch": 0.5777310924369747, "percentage": 19.26, "elapsed_time": "0:04:59", "remaining_time": "0:20:56"} +{"current_steps": 276, "total_steps": 1428, "loss": 3.2140274047851562, "lr": 9.741887566202259e-06, "epoch": 0.5798319327731093, "percentage": 19.33, "elapsed_time": "0:05:00", "remaining_time": "0:20:55"} +{"current_steps": 277, "total_steps": 1428, "loss": 3.074397325515747, "lr": 9.737996604251124e-06, "epoch": 0.5819327731092437, "percentage": 19.4, "elapsed_time": "0:05:01", "remaining_time": "0:20:53"} +{"current_steps": 278, "total_steps": 1428, "loss": 2.527010679244995, "lr": 9.73407732264104e-06, "epoch": 0.5840336134453782, "percentage": 19.47, "elapsed_time": "0:05:02", "remaining_time": "0:20:52"} +{"current_steps": 279, "total_steps": 1428, "loss": 2.6019768714904785, "lr": 9.730129744798096e-06, "epoch": 0.5861344537815126, "percentage": 19.54, "elapsed_time": "0:05:03", "remaining_time": "0:20:51"} +{"current_steps": 280, "total_steps": 1428, "loss": 2.848952293395996, "lr": 9.726153894317508e-06, "epoch": 0.5882352941176471, "percentage": 19.61, "elapsed_time": "0:05:05", "remaining_time": "0:20:50"} +{"current_steps": 281, "total_steps": 1428, "loss": 3.120556354522705, "lr": 9.722149794963483e-06, "epoch": 0.5903361344537815, "percentage": 19.68, "elapsed_time": "0:05:06", "remaining_time": "0:20:49"} +{"current_steps": 282, "total_steps": 1428, "loss": 2.8926405906677246, "lr": 9.718117470669072e-06, "epoch": 0.592436974789916, "percentage": 19.75, "elapsed_time": "0:05:07", "remaining_time": "0:20:48"} +{"current_steps": 283, "total_steps": 1428, "loss": 3.2854347229003906, "lr": 9.714056945536039e-06, "epoch": 0.5945378151260504, "percentage": 19.82, "elapsed_time": "0:05:08", "remaining_time": "0:20:47"} +{"current_steps": 284, "total_steps": 1428, "loss": 2.856870651245117, "lr": 9.709968243834698e-06, "epoch": 0.5966386554621849, "percentage": 19.89, "elapsed_time": "0:05:09", "remaining_time": "0:20:46"} +{"current_steps": 285, "total_steps": 1428, "loss": 3.3881802558898926, "lr": 9.705851390003783e-06, "epoch": 0.5987394957983193, "percentage": 19.96, "elapsed_time": "0:05:10", "remaining_time": "0:20:45"} +{"current_steps": 286, "total_steps": 1428, "loss": 2.6102542877197266, "lr": 9.7017064086503e-06, "epoch": 0.6008403361344538, "percentage": 20.03, "elapsed_time": "0:05:11", "remaining_time": "0:20:43"} +{"current_steps": 287, "total_steps": 1428, "loss": 2.7697243690490723, "lr": 9.697533324549371e-06, "epoch": 0.6029411764705882, "percentage": 20.1, "elapsed_time": "0:05:12", "remaining_time": "0:20:42"} +{"current_steps": 288, "total_steps": 1428, "loss": 2.568695545196533, "lr": 9.693332162644095e-06, "epoch": 0.6050420168067226, "percentage": 20.17, "elapsed_time": "0:05:13", "remaining_time": "0:20:41"} +{"current_steps": 289, "total_steps": 1428, "loss": 2.922543525695801, "lr": 9.689102948045398e-06, "epoch": 0.6071428571428571, "percentage": 20.24, "elapsed_time": "0:05:14", "remaining_time": "0:20:40"} +{"current_steps": 290, "total_steps": 1428, "loss": 3.1011314392089844, "lr": 9.684845706031878e-06, "epoch": 0.6092436974789915, "percentage": 20.31, "elapsed_time": "0:05:15", "remaining_time": "0:20:39"} +{"current_steps": 291, "total_steps": 1428, "loss": 2.627528429031372, "lr": 9.680560462049657e-06, "epoch": 0.6113445378151261, "percentage": 20.38, "elapsed_time": "0:05:16", "remaining_time": "0:20:38"} +{"current_steps": 292, "total_steps": 1428, "loss": 2.8417811393737793, "lr": 9.676247241712228e-06, "epoch": 0.6134453781512605, "percentage": 20.45, "elapsed_time": "0:05:17", "remaining_time": "0:20:37"} +{"current_steps": 293, "total_steps": 1428, "loss": 2.3787314891815186, "lr": 9.671906070800307e-06, "epoch": 0.615546218487395, "percentage": 20.52, "elapsed_time": "0:05:19", "remaining_time": "0:20:35"} +{"current_steps": 294, "total_steps": 1428, "loss": 2.751317024230957, "lr": 9.667536975261667e-06, "epoch": 0.6176470588235294, "percentage": 20.59, "elapsed_time": "0:05:20", "remaining_time": "0:20:34"} +{"current_steps": 295, "total_steps": 1428, "loss": 2.6910929679870605, "lr": 9.663139981210998e-06, "epoch": 0.6197478991596639, "percentage": 20.66, "elapsed_time": "0:05:21", "remaining_time": "0:20:33"} +{"current_steps": 296, "total_steps": 1428, "loss": 2.801499366760254, "lr": 9.658715114929737e-06, "epoch": 0.6218487394957983, "percentage": 20.73, "elapsed_time": "0:05:22", "remaining_time": "0:20:32"} +{"current_steps": 297, "total_steps": 1428, "loss": 2.885946273803711, "lr": 9.654262402865922e-06, "epoch": 0.6239495798319328, "percentage": 20.8, "elapsed_time": "0:05:23", "remaining_time": "0:20:31"} +{"current_steps": 298, "total_steps": 1428, "loss": 3.1485133171081543, "lr": 9.649781871634025e-06, "epoch": 0.6260504201680672, "percentage": 20.87, "elapsed_time": "0:05:24", "remaining_time": "0:20:30"} +{"current_steps": 299, "total_steps": 1428, "loss": 3.174015998840332, "lr": 9.6452735480148e-06, "epoch": 0.6281512605042017, "percentage": 20.94, "elapsed_time": "0:05:25", "remaining_time": "0:20:29"} +{"current_steps": 300, "total_steps": 1428, "loss": 3.339445114135742, "lr": 9.64073745895512e-06, "epoch": 0.6302521008403361, "percentage": 21.01, "elapsed_time": "0:05:26", "remaining_time": "0:20:28"} +{"current_steps": 301, "total_steps": 1428, "loss": 2.9448843002319336, "lr": 9.636173631567812e-06, "epoch": 0.6323529411764706, "percentage": 21.08, "elapsed_time": "0:05:27", "remaining_time": "0:20:27"} +{"current_steps": 302, "total_steps": 1428, "loss": 2.6363561153411865, "lr": 9.631582093131501e-06, "epoch": 0.634453781512605, "percentage": 21.15, "elapsed_time": "0:05:28", "remaining_time": "0:20:26"} +{"current_steps": 303, "total_steps": 1428, "loss": 2.4621901512145996, "lr": 9.62696287109045e-06, "epoch": 0.6365546218487395, "percentage": 21.22, "elapsed_time": "0:05:29", "remaining_time": "0:20:24"} +{"current_steps": 304, "total_steps": 1428, "loss": 2.8623251914978027, "lr": 9.622315993054384e-06, "epoch": 0.6386554621848739, "percentage": 21.29, "elapsed_time": "0:05:30", "remaining_time": "0:20:23"} +{"current_steps": 305, "total_steps": 1428, "loss": 2.191575765609741, "lr": 9.61764148679833e-06, "epoch": 0.6407563025210085, "percentage": 21.36, "elapsed_time": "0:05:32", "remaining_time": "0:20:22"} +{"current_steps": 306, "total_steps": 1428, "loss": 2.018388271331787, "lr": 9.61293938026246e-06, "epoch": 0.6428571428571429, "percentage": 21.43, "elapsed_time": "0:05:33", "remaining_time": "0:20:21"} +{"current_steps": 307, "total_steps": 1428, "loss": 2.756854772567749, "lr": 9.608209701551913e-06, "epoch": 0.6449579831932774, "percentage": 21.5, "elapsed_time": "0:05:34", "remaining_time": "0:20:20"} +{"current_steps": 308, "total_steps": 1428, "loss": 2.6668529510498047, "lr": 9.60345247893663e-06, "epoch": 0.6470588235294118, "percentage": 21.57, "elapsed_time": "0:05:35", "remaining_time": "0:20:19"} +{"current_steps": 309, "total_steps": 1428, "loss": 2.6617343425750732, "lr": 9.598667740851187e-06, "epoch": 0.6491596638655462, "percentage": 21.64, "elapsed_time": "0:05:36", "remaining_time": "0:20:18"} +{"current_steps": 310, "total_steps": 1428, "loss": 3.1460976600646973, "lr": 9.59385551589462e-06, "epoch": 0.6512605042016807, "percentage": 21.71, "elapsed_time": "0:05:37", "remaining_time": "0:20:16"} +{"current_steps": 311, "total_steps": 1428, "loss": 2.7566354274749756, "lr": 9.589015832830267e-06, "epoch": 0.6533613445378151, "percentage": 21.78, "elapsed_time": "0:05:38", "remaining_time": "0:20:15"} +{"current_steps": 312, "total_steps": 1428, "loss": 3.3112881183624268, "lr": 9.584148720585575e-06, "epoch": 0.6554621848739496, "percentage": 21.85, "elapsed_time": "0:05:39", "remaining_time": "0:20:14"} +{"current_steps": 313, "total_steps": 1428, "loss": 2.8563618659973145, "lr": 9.57925420825195e-06, "epoch": 0.657563025210084, "percentage": 21.92, "elapsed_time": "0:05:40", "remaining_time": "0:20:13"} +{"current_steps": 314, "total_steps": 1428, "loss": 3.5544567108154297, "lr": 9.574332325084564e-06, "epoch": 0.6596638655462185, "percentage": 21.99, "elapsed_time": "0:05:41", "remaining_time": "0:20:12"} +{"current_steps": 315, "total_steps": 1428, "loss": 2.924015998840332, "lr": 9.569383100502193e-06, "epoch": 0.6617647058823529, "percentage": 22.06, "elapsed_time": "0:05:42", "remaining_time": "0:20:11"} +{"current_steps": 316, "total_steps": 1428, "loss": 2.7250008583068848, "lr": 9.564406564087032e-06, "epoch": 0.6638655462184874, "percentage": 22.13, "elapsed_time": "0:05:43", "remaining_time": "0:20:10"} +{"current_steps": 317, "total_steps": 1428, "loss": 2.9229238033294678, "lr": 9.559402745584527e-06, "epoch": 0.6659663865546218, "percentage": 22.2, "elapsed_time": "0:05:44", "remaining_time": "0:20:09"} +{"current_steps": 318, "total_steps": 1428, "loss": 3.4867515563964844, "lr": 9.554371674903191e-06, "epoch": 0.6680672268907563, "percentage": 22.27, "elapsed_time": "0:05:46", "remaining_time": "0:20:07"} +{"current_steps": 319, "total_steps": 1428, "loss": 2.4049417972564697, "lr": 9.549313382114427e-06, "epoch": 0.6701680672268907, "percentage": 22.34, "elapsed_time": "0:05:47", "remaining_time": "0:20:06"} +{"current_steps": 320, "total_steps": 1428, "loss": 3.1008338928222656, "lr": 9.54422789745235e-06, "epoch": 0.6722689075630253, "percentage": 22.41, "elapsed_time": "0:05:48", "remaining_time": "0:20:05"} +{"current_steps": 321, "total_steps": 1428, "loss": 2.6114342212677, "lr": 9.5391152513136e-06, "epoch": 0.6743697478991597, "percentage": 22.48, "elapsed_time": "0:05:49", "remaining_time": "0:20:04"} +{"current_steps": 322, "total_steps": 1428, "loss": 2.7165164947509766, "lr": 9.533975474257171e-06, "epoch": 0.6764705882352942, "percentage": 22.55, "elapsed_time": "0:05:50", "remaining_time": "0:20:03"} +{"current_steps": 323, "total_steps": 1428, "loss": 2.8122520446777344, "lr": 9.528808597004216e-06, "epoch": 0.6785714285714286, "percentage": 22.62, "elapsed_time": "0:05:51", "remaining_time": "0:20:02"} +{"current_steps": 324, "total_steps": 1428, "loss": 2.862661838531494, "lr": 9.523614650437876e-06, "epoch": 0.680672268907563, "percentage": 22.69, "elapsed_time": "0:05:52", "remaining_time": "0:20:01"} +{"current_steps": 325, "total_steps": 1428, "loss": 2.9812843799591064, "lr": 9.518393665603084e-06, "epoch": 0.6827731092436975, "percentage": 22.76, "elapsed_time": "0:05:53", "remaining_time": "0:20:00"} +{"current_steps": 326, "total_steps": 1428, "loss": 2.9455337524414062, "lr": 9.513145673706383e-06, "epoch": 0.6848739495798319, "percentage": 22.83, "elapsed_time": "0:05:54", "remaining_time": "0:19:58"} +{"current_steps": 327, "total_steps": 1428, "loss": 3.1577422618865967, "lr": 9.507870706115749e-06, "epoch": 0.6869747899159664, "percentage": 22.9, "elapsed_time": "0:05:55", "remaining_time": "0:19:57"} +{"current_steps": 328, "total_steps": 1428, "loss": 2.545835018157959, "lr": 9.50256879436039e-06, "epoch": 0.6890756302521008, "percentage": 22.97, "elapsed_time": "0:05:56", "remaining_time": "0:19:56"} +{"current_steps": 329, "total_steps": 1428, "loss": 2.559062957763672, "lr": 9.497239970130561e-06, "epoch": 0.6911764705882353, "percentage": 23.04, "elapsed_time": "0:05:57", "remaining_time": "0:19:55"} +{"current_steps": 330, "total_steps": 1428, "loss": 2.932499647140503, "lr": 9.491884265277383e-06, "epoch": 0.6932773109243697, "percentage": 23.11, "elapsed_time": "0:05:58", "remaining_time": "0:19:54"} +{"current_steps": 331, "total_steps": 1428, "loss": 2.967616558074951, "lr": 9.486501711812637e-06, "epoch": 0.6953781512605042, "percentage": 23.18, "elapsed_time": "0:06:00", "remaining_time": "0:19:53"} +{"current_steps": 332, "total_steps": 1428, "loss": 2.4604697227478027, "lr": 9.481092341908591e-06, "epoch": 0.6974789915966386, "percentage": 23.25, "elapsed_time": "0:06:01", "remaining_time": "0:19:52"} +{"current_steps": 333, "total_steps": 1428, "loss": 3.146969795227051, "lr": 9.475656187897794e-06, "epoch": 0.6995798319327731, "percentage": 23.32, "elapsed_time": "0:06:02", "remaining_time": "0:19:51"} +{"current_steps": 334, "total_steps": 1428, "loss": 3.337083339691162, "lr": 9.470193282272886e-06, "epoch": 0.7016806722689075, "percentage": 23.39, "elapsed_time": "0:06:03", "remaining_time": "0:19:50"} +{"current_steps": 335, "total_steps": 1428, "loss": 2.7829766273498535, "lr": 9.464703657686412e-06, "epoch": 0.7037815126050421, "percentage": 23.46, "elapsed_time": "0:06:04", "remaining_time": "0:19:48"} +{"current_steps": 336, "total_steps": 1428, "loss": 3.095449447631836, "lr": 9.45918734695061e-06, "epoch": 0.7058823529411765, "percentage": 23.53, "elapsed_time": "0:06:05", "remaining_time": "0:19:47"} +{"current_steps": 337, "total_steps": 1428, "loss": 2.6790573596954346, "lr": 9.453644383037232e-06, "epoch": 0.707983193277311, "percentage": 23.6, "elapsed_time": "0:06:06", "remaining_time": "0:19:46"} +{"current_steps": 338, "total_steps": 1428, "loss": 2.9844274520874023, "lr": 9.448074799077337e-06, "epoch": 0.7100840336134454, "percentage": 23.67, "elapsed_time": "0:06:07", "remaining_time": "0:19:45"} +{"current_steps": 339, "total_steps": 1428, "loss": 2.256910562515259, "lr": 9.442478628361098e-06, "epoch": 0.7121848739495799, "percentage": 23.74, "elapsed_time": "0:06:08", "remaining_time": "0:19:44"} +{"current_steps": 340, "total_steps": 1428, "loss": 2.9464545249938965, "lr": 9.436855904337596e-06, "epoch": 0.7142857142857143, "percentage": 23.81, "elapsed_time": "0:06:09", "remaining_time": "0:19:43"} +{"current_steps": 341, "total_steps": 1428, "loss": 2.23644757270813, "lr": 9.43120666061463e-06, "epoch": 0.7163865546218487, "percentage": 23.88, "elapsed_time": "0:06:10", "remaining_time": "0:19:42"} +{"current_steps": 342, "total_steps": 1428, "loss": 2.85072660446167, "lr": 9.425530930958507e-06, "epoch": 0.7184873949579832, "percentage": 23.95, "elapsed_time": "0:06:11", "remaining_time": "0:19:41"} +{"current_steps": 343, "total_steps": 1428, "loss": 3.09238862991333, "lr": 9.419828749293845e-06, "epoch": 0.7205882352941176, "percentage": 24.02, "elapsed_time": "0:06:13", "remaining_time": "0:19:39"} +{"current_steps": 344, "total_steps": 1428, "loss": 2.7548587322235107, "lr": 9.414100149703373e-06, "epoch": 0.7226890756302521, "percentage": 24.09, "elapsed_time": "0:06:14", "remaining_time": "0:19:38"} +{"current_steps": 345, "total_steps": 1428, "loss": 2.487452507019043, "lr": 9.40834516642772e-06, "epoch": 0.7247899159663865, "percentage": 24.16, "elapsed_time": "0:06:15", "remaining_time": "0:19:37"} +{"current_steps": 346, "total_steps": 1428, "loss": 3.077296257019043, "lr": 9.402563833865213e-06, "epoch": 0.726890756302521, "percentage": 24.23, "elapsed_time": "0:06:16", "remaining_time": "0:19:36"} +{"current_steps": 347, "total_steps": 1428, "loss": 2.6188814640045166, "lr": 9.396756186571672e-06, "epoch": 0.7289915966386554, "percentage": 24.3, "elapsed_time": "0:06:17", "remaining_time": "0:19:35"} +{"current_steps": 348, "total_steps": 1428, "loss": 3.150355815887451, "lr": 9.39092225926021e-06, "epoch": 0.7310924369747899, "percentage": 24.37, "elapsed_time": "0:06:18", "remaining_time": "0:19:34"} +{"current_steps": 349, "total_steps": 1428, "loss": 2.6666879653930664, "lr": 9.385062086801013e-06, "epoch": 0.7331932773109243, "percentage": 24.44, "elapsed_time": "0:06:19", "remaining_time": "0:19:33"} +{"current_steps": 350, "total_steps": 1428, "loss": 2.885680675506592, "lr": 9.379175704221139e-06, "epoch": 0.7352941176470589, "percentage": 24.51, "elapsed_time": "0:06:20", "remaining_time": "0:19:32"} +{"current_steps": 351, "total_steps": 1428, "loss": 2.948115110397339, "lr": 9.37326314670431e-06, "epoch": 0.7373949579831933, "percentage": 24.58, "elapsed_time": "0:06:21", "remaining_time": "0:19:31"} +{"current_steps": 352, "total_steps": 1428, "loss": 2.743468761444092, "lr": 9.367324449590694e-06, "epoch": 0.7394957983193278, "percentage": 24.65, "elapsed_time": "0:06:22", "remaining_time": "0:19:29"} +{"current_steps": 353, "total_steps": 1428, "loss": 3.0895063877105713, "lr": 9.361359648376707e-06, "epoch": 0.7415966386554622, "percentage": 24.72, "elapsed_time": "0:06:23", "remaining_time": "0:19:28"} +{"current_steps": 354, "total_steps": 1428, "loss": 2.808818817138672, "lr": 9.355368778714784e-06, "epoch": 0.7436974789915967, "percentage": 24.79, "elapsed_time": "0:06:24", "remaining_time": "0:19:27"} +{"current_steps": 355, "total_steps": 1428, "loss": 2.889227867126465, "lr": 9.349351876413181e-06, "epoch": 0.7457983193277311, "percentage": 24.86, "elapsed_time": "0:06:25", "remaining_time": "0:19:26"} +{"current_steps": 356, "total_steps": 1428, "loss": 3.021900177001953, "lr": 9.343308977435754e-06, "epoch": 0.7478991596638656, "percentage": 24.93, "elapsed_time": "0:06:27", "remaining_time": "0:19:25"} +{"current_steps": 357, "total_steps": 1428, "loss": 2.4112629890441895, "lr": 9.337240117901742e-06, "epoch": 0.75, "percentage": 25.0, "elapsed_time": "0:06:28", "remaining_time": "0:19:24"} +{"current_steps": 358, "total_steps": 1428, "loss": 2.898515224456787, "lr": 9.331145334085554e-06, "epoch": 0.7521008403361344, "percentage": 25.07, "elapsed_time": "0:06:29", "remaining_time": "0:19:23"} +{"current_steps": 359, "total_steps": 1428, "loss": 2.683413028717041, "lr": 9.325024662416553e-06, "epoch": 0.7542016806722689, "percentage": 25.14, "elapsed_time": "0:06:30", "remaining_time": "0:19:22"} +{"current_steps": 360, "total_steps": 1428, "loss": 2.890808582305908, "lr": 9.318878139478842e-06, "epoch": 0.7563025210084033, "percentage": 25.21, "elapsed_time": "0:06:31", "remaining_time": "0:19:20"} +{"current_steps": 361, "total_steps": 1428, "loss": 2.9919955730438232, "lr": 9.312705802011029e-06, "epoch": 0.7584033613445378, "percentage": 25.28, "elapsed_time": "0:06:32", "remaining_time": "0:19:19"} +{"current_steps": 362, "total_steps": 1428, "loss": 2.7725915908813477, "lr": 9.306507686906033e-06, "epoch": 0.7605042016806722, "percentage": 25.35, "elapsed_time": "0:06:33", "remaining_time": "0:19:18"} +{"current_steps": 363, "total_steps": 1428, "loss": 2.9397757053375244, "lr": 9.300283831210838e-06, "epoch": 0.7626050420168067, "percentage": 25.42, "elapsed_time": "0:06:34", "remaining_time": "0:19:17"} +{"current_steps": 364, "total_steps": 1428, "loss": 2.770698070526123, "lr": 9.294034272126286e-06, "epoch": 0.7647058823529411, "percentage": 25.49, "elapsed_time": "0:06:35", "remaining_time": "0:19:16"} +{"current_steps": 365, "total_steps": 1428, "loss": 2.5156445503234863, "lr": 9.28775904700686e-06, "epoch": 0.7668067226890757, "percentage": 25.56, "elapsed_time": "0:06:36", "remaining_time": "0:19:15"} +{"current_steps": 366, "total_steps": 1428, "loss": 2.597851276397705, "lr": 9.281458193360442e-06, "epoch": 0.7689075630252101, "percentage": 25.63, "elapsed_time": "0:06:37", "remaining_time": "0:19:14"} +{"current_steps": 367, "total_steps": 1428, "loss": 2.4659290313720703, "lr": 9.2751317488481e-06, "epoch": 0.7710084033613446, "percentage": 25.7, "elapsed_time": "0:06:38", "remaining_time": "0:19:13"} +{"current_steps": 368, "total_steps": 1428, "loss": 3.0518131256103516, "lr": 9.26877975128387e-06, "epoch": 0.773109243697479, "percentage": 25.77, "elapsed_time": "0:06:39", "remaining_time": "0:19:12"} +{"current_steps": 369, "total_steps": 1428, "loss": 2.0272233486175537, "lr": 9.262402238634514e-06, "epoch": 0.7752100840336135, "percentage": 25.84, "elapsed_time": "0:06:41", "remaining_time": "0:19:10"} +{"current_steps": 370, "total_steps": 1428, "loss": 2.282167911529541, "lr": 9.255999249019307e-06, "epoch": 0.7773109243697479, "percentage": 25.91, "elapsed_time": "0:06:42", "remaining_time": "0:19:09"} +{"current_steps": 371, "total_steps": 1428, "loss": 2.447831869125366, "lr": 9.2495708207098e-06, "epoch": 0.7794117647058824, "percentage": 25.98, "elapsed_time": "0:06:43", "remaining_time": "0:19:08"} +{"current_steps": 372, "total_steps": 1428, "loss": 2.5548458099365234, "lr": 9.243116992129593e-06, "epoch": 0.7815126050420168, "percentage": 26.05, "elapsed_time": "0:06:44", "remaining_time": "0:19:07"} +{"current_steps": 373, "total_steps": 1428, "loss": 2.2244365215301514, "lr": 9.23663780185411e-06, "epoch": 0.7836134453781513, "percentage": 26.12, "elapsed_time": "0:06:45", "remaining_time": "0:19:06"} +{"current_steps": 374, "total_steps": 1428, "loss": 3.044992208480835, "lr": 9.230133288610366e-06, "epoch": 0.7857142857142857, "percentage": 26.19, "elapsed_time": "0:06:46", "remaining_time": "0:19:05"} +{"current_steps": 375, "total_steps": 1428, "loss": 2.545569896697998, "lr": 9.223603491276733e-06, "epoch": 0.7878151260504201, "percentage": 26.26, "elapsed_time": "0:06:47", "remaining_time": "0:19:04"} +{"current_steps": 376, "total_steps": 1428, "loss": 3.337583541870117, "lr": 9.217048448882711e-06, "epoch": 0.7899159663865546, "percentage": 26.33, "elapsed_time": "0:06:48", "remaining_time": "0:19:03"} +{"current_steps": 377, "total_steps": 1428, "loss": 3.1922380924224854, "lr": 9.210468200608691e-06, "epoch": 0.792016806722689, "percentage": 26.4, "elapsed_time": "0:06:49", "remaining_time": "0:19:02"} +{"current_steps": 378, "total_steps": 1428, "loss": 2.5922632217407227, "lr": 9.203862785785724e-06, "epoch": 0.7941176470588235, "percentage": 26.47, "elapsed_time": "0:06:50", "remaining_time": "0:19:00"} +{"current_steps": 379, "total_steps": 1428, "loss": 2.876894474029541, "lr": 9.197232243895285e-06, "epoch": 0.7962184873949579, "percentage": 26.54, "elapsed_time": "0:06:51", "remaining_time": "0:18:59"} +{"current_steps": 380, "total_steps": 1428, "loss": 2.7677531242370605, "lr": 9.190576614569035e-06, "epoch": 0.7983193277310925, "percentage": 26.61, "elapsed_time": "0:06:52", "remaining_time": "0:18:58"} +{"current_steps": 381, "total_steps": 1428, "loss": 1.9870229959487915, "lr": 9.183895937588594e-06, "epoch": 0.8004201680672269, "percentage": 26.68, "elapsed_time": "0:06:53", "remaining_time": "0:18:57"} +{"current_steps": 382, "total_steps": 1428, "loss": 2.784242868423462, "lr": 9.177190252885285e-06, "epoch": 0.8025210084033614, "percentage": 26.75, "elapsed_time": "0:06:55", "remaining_time": "0:18:56"} +{"current_steps": 383, "total_steps": 1428, "loss": 2.878697395324707, "lr": 9.17045960053991e-06, "epoch": 0.8046218487394958, "percentage": 26.82, "elapsed_time": "0:06:56", "remaining_time": "0:18:55"} +{"current_steps": 384, "total_steps": 1428, "loss": 2.7685139179229736, "lr": 9.163704020782507e-06, "epoch": 0.8067226890756303, "percentage": 26.89, "elapsed_time": "0:06:57", "remaining_time": "0:18:54"} +{"current_steps": 385, "total_steps": 1428, "loss": 2.8312299251556396, "lr": 9.156923553992107e-06, "epoch": 0.8088235294117647, "percentage": 26.96, "elapsed_time": "0:06:58", "remaining_time": "0:18:53"} +{"current_steps": 386, "total_steps": 1428, "loss": 1.7165706157684326, "lr": 9.150118240696497e-06, "epoch": 0.8109243697478992, "percentage": 27.03, "elapsed_time": "0:06:59", "remaining_time": "0:18:52"} +{"current_steps": 387, "total_steps": 1428, "loss": 3.451162815093994, "lr": 9.14328812157197e-06, "epoch": 0.8130252100840336, "percentage": 27.1, "elapsed_time": "0:07:00", "remaining_time": "0:18:50"} +{"current_steps": 388, "total_steps": 1428, "loss": 3.455259084701538, "lr": 9.136433237443093e-06, "epoch": 0.8151260504201681, "percentage": 27.17, "elapsed_time": "0:07:01", "remaining_time": "0:18:49"} +{"current_steps": 389, "total_steps": 1428, "loss": 3.3125205039978027, "lr": 9.129553629282448e-06, "epoch": 0.8172268907563025, "percentage": 27.24, "elapsed_time": "0:07:02", "remaining_time": "0:18:48"} +{"current_steps": 390, "total_steps": 1428, "loss": 3.175715923309326, "lr": 9.122649338210407e-06, "epoch": 0.819327731092437, "percentage": 27.31, "elapsed_time": "0:07:03", "remaining_time": "0:18:47"} +{"current_steps": 391, "total_steps": 1428, "loss": 3.426882743835449, "lr": 9.115720405494868e-06, "epoch": 0.8214285714285714, "percentage": 27.38, "elapsed_time": "0:07:04", "remaining_time": "0:18:46"} +{"current_steps": 392, "total_steps": 1428, "loss": 2.693225860595703, "lr": 9.108766872551016e-06, "epoch": 0.8235294117647058, "percentage": 27.45, "elapsed_time": "0:07:05", "remaining_time": "0:18:45"} +{"current_steps": 393, "total_steps": 1428, "loss": 2.8251726627349854, "lr": 9.101788780941076e-06, "epoch": 0.8256302521008403, "percentage": 27.52, "elapsed_time": "0:07:06", "remaining_time": "0:18:44"} +{"current_steps": 394, "total_steps": 1428, "loss": 2.845076560974121, "lr": 9.094786172374066e-06, "epoch": 0.8277310924369747, "percentage": 27.59, "elapsed_time": "0:07:07", "remaining_time": "0:18:43"} +{"current_steps": 395, "total_steps": 1428, "loss": 2.9212491512298584, "lr": 9.087759088705541e-06, "epoch": 0.8298319327731093, "percentage": 27.66, "elapsed_time": "0:07:09", "remaining_time": "0:18:42"} +{"current_steps": 396, "total_steps": 1428, "loss": 2.752890110015869, "lr": 9.08070757193735e-06, "epoch": 0.8319327731092437, "percentage": 27.73, "elapsed_time": "0:07:10", "remaining_time": "0:18:40"} +{"current_steps": 397, "total_steps": 1428, "loss": 3.1292171478271484, "lr": 9.07363166421738e-06, "epoch": 0.8340336134453782, "percentage": 27.8, "elapsed_time": "0:07:11", "remaining_time": "0:18:39"} +{"current_steps": 398, "total_steps": 1428, "loss": 2.2926840782165527, "lr": 9.066531407839307e-06, "epoch": 0.8361344537815126, "percentage": 27.87, "elapsed_time": "0:07:12", "remaining_time": "0:18:38"} +{"current_steps": 399, "total_steps": 1428, "loss": 2.7644119262695312, "lr": 9.059406845242343e-06, "epoch": 0.8382352941176471, "percentage": 27.94, "elapsed_time": "0:07:13", "remaining_time": "0:18:37"} +{"current_steps": 400, "total_steps": 1428, "loss": 2.9096150398254395, "lr": 9.05225801901098e-06, "epoch": 0.8403361344537815, "percentage": 28.01, "elapsed_time": "0:07:14", "remaining_time": "0:18:36"} +{"current_steps": 401, "total_steps": 1428, "loss": 4.536911964416504, "lr": 9.045084971874738e-06, "epoch": 0.842436974789916, "percentage": 28.08, "elapsed_time": "0:07:15", "remaining_time": "0:18:35"} +{"current_steps": 402, "total_steps": 1428, "loss": 3.3775062561035156, "lr": 9.03788774670791e-06, "epoch": 0.8445378151260504, "percentage": 28.15, "elapsed_time": "0:07:16", "remaining_time": "0:18:34"} +{"current_steps": 403, "total_steps": 1428, "loss": 2.755703926086426, "lr": 9.030666386529303e-06, "epoch": 0.8466386554621849, "percentage": 28.22, "elapsed_time": "0:07:17", "remaining_time": "0:18:33"} +{"current_steps": 404, "total_steps": 1428, "loss": 2.812281608581543, "lr": 9.023420934501981e-06, "epoch": 0.8487394957983193, "percentage": 28.29, "elapsed_time": "0:07:18", "remaining_time": "0:18:32"} +{"current_steps": 405, "total_steps": 1428, "loss": 2.9015493392944336, "lr": 9.01615143393301e-06, "epoch": 0.8508403361344538, "percentage": 28.36, "elapsed_time": "0:07:19", "remaining_time": "0:18:30"} +{"current_steps": 406, "total_steps": 1428, "loss": 2.8743391036987305, "lr": 9.008857928273199e-06, "epoch": 0.8529411764705882, "percentage": 28.43, "elapsed_time": "0:07:20", "remaining_time": "0:18:29"} +{"current_steps": 407, "total_steps": 1428, "loss": 2.7400550842285156, "lr": 9.001540461116835e-06, "epoch": 0.8550420168067226, "percentage": 28.5, "elapsed_time": "0:07:21", "remaining_time": "0:18:28"} +{"current_steps": 408, "total_steps": 1428, "loss": 3.788983106613159, "lr": 8.994199076201428e-06, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "0:07:23", "remaining_time": "0:18:27"} +{"current_steps": 409, "total_steps": 1428, "loss": 2.426604747772217, "lr": 8.98683381740745e-06, "epoch": 0.8592436974789915, "percentage": 28.64, "elapsed_time": "0:07:24", "remaining_time": "0:18:26"} +{"current_steps": 410, "total_steps": 1428, "loss": 2.467769145965576, "lr": 8.979444728758067e-06, "epoch": 0.8613445378151261, "percentage": 28.71, "elapsed_time": "0:07:25", "remaining_time": "0:18:25"} +{"current_steps": 411, "total_steps": 1428, "loss": 2.878884792327881, "lr": 8.97203185441888e-06, "epoch": 0.8634453781512605, "percentage": 28.78, "elapsed_time": "0:07:26", "remaining_time": "0:18:24"} +{"current_steps": 412, "total_steps": 1428, "loss": 3.323913812637329, "lr": 8.964595238697659e-06, "epoch": 0.865546218487395, "percentage": 28.85, "elapsed_time": "0:07:27", "remaining_time": "0:18:23"} +{"current_steps": 413, "total_steps": 1428, "loss": 2.2674732208251953, "lr": 8.957134926044088e-06, "epoch": 0.8676470588235294, "percentage": 28.92, "elapsed_time": "0:07:28", "remaining_time": "0:18:22"} +{"current_steps": 414, "total_steps": 1428, "loss": 2.6359667778015137, "lr": 8.949650961049479e-06, "epoch": 0.8697478991596639, "percentage": 28.99, "elapsed_time": "0:07:29", "remaining_time": "0:18:21"} +{"current_steps": 415, "total_steps": 1428, "loss": 4.3965678215026855, "lr": 8.942143388446522e-06, "epoch": 0.8718487394957983, "percentage": 29.06, "elapsed_time": "0:07:30", "remaining_time": "0:18:20"} +{"current_steps": 416, "total_steps": 1428, "loss": 3.584599733352661, "lr": 8.934612253109017e-06, "epoch": 0.8739495798319328, "percentage": 29.13, "elapsed_time": "0:07:31", "remaining_time": "0:18:19"} +{"current_steps": 417, "total_steps": 1428, "loss": 2.9781904220581055, "lr": 8.927057600051594e-06, "epoch": 0.8760504201680672, "percentage": 29.2, "elapsed_time": "0:07:32", "remaining_time": "0:18:17"} +{"current_steps": 418, "total_steps": 1428, "loss": 3.3312220573425293, "lr": 8.919479474429462e-06, "epoch": 0.8781512605042017, "percentage": 29.27, "elapsed_time": "0:07:33", "remaining_time": "0:18:16"} +{"current_steps": 419, "total_steps": 1428, "loss": 3.8054161071777344, "lr": 8.911877921538117e-06, "epoch": 0.8802521008403361, "percentage": 29.34, "elapsed_time": "0:07:35", "remaining_time": "0:18:15"} +{"current_steps": 420, "total_steps": 1428, "loss": 2.8041489124298096, "lr": 8.904252986813091e-06, "epoch": 0.8823529411764706, "percentage": 29.41, "elapsed_time": "0:07:36", "remaining_time": "0:18:14"} +{"current_steps": 421, "total_steps": 1428, "loss": 2.8391265869140625, "lr": 8.896604715829671e-06, "epoch": 0.884453781512605, "percentage": 29.48, "elapsed_time": "0:07:37", "remaining_time": "0:18:13"} +{"current_steps": 422, "total_steps": 1428, "loss": 2.6835553646087646, "lr": 8.888933154302626e-06, "epoch": 0.8865546218487395, "percentage": 29.55, "elapsed_time": "0:07:38", "remaining_time": "0:18:12"} +{"current_steps": 423, "total_steps": 1428, "loss": 2.6738481521606445, "lr": 8.881238348085936e-06, "epoch": 0.8886554621848739, "percentage": 29.62, "elapsed_time": "0:07:39", "remaining_time": "0:18:11"} +{"current_steps": 424, "total_steps": 1428, "loss": 2.619101047515869, "lr": 8.87352034317252e-06, "epoch": 0.8907563025210085, "percentage": 29.69, "elapsed_time": "0:07:40", "remaining_time": "0:18:10"} +{"current_steps": 425, "total_steps": 1428, "loss": 3.3444905281066895, "lr": 8.865779185693957e-06, "epoch": 0.8928571428571429, "percentage": 29.76, "elapsed_time": "0:07:41", "remaining_time": "0:18:09"} +{"current_steps": 426, "total_steps": 1428, "loss": 2.1527421474456787, "lr": 8.858014921920215e-06, "epoch": 0.8949579831932774, "percentage": 29.83, "elapsed_time": "0:07:42", "remaining_time": "0:18:07"} +{"current_steps": 427, "total_steps": 1428, "loss": 2.6689836978912354, "lr": 8.850227598259365e-06, "epoch": 0.8970588235294118, "percentage": 29.9, "elapsed_time": "0:07:43", "remaining_time": "0:18:06"} +{"current_steps": 428, "total_steps": 1428, "loss": 3.0119547843933105, "lr": 8.842417261257316e-06, "epoch": 0.8991596638655462, "percentage": 29.97, "elapsed_time": "0:07:44", "remaining_time": "0:18:05"} +{"current_steps": 429, "total_steps": 1428, "loss": 2.482861042022705, "lr": 8.83458395759753e-06, "epoch": 0.9012605042016807, "percentage": 30.04, "elapsed_time": "0:07:45", "remaining_time": "0:18:04"} +{"current_steps": 430, "total_steps": 1428, "loss": 2.8982067108154297, "lr": 8.826727734100742e-06, "epoch": 0.9033613445378151, "percentage": 30.11, "elapsed_time": "0:07:46", "remaining_time": "0:18:03"} +{"current_steps": 431, "total_steps": 1428, "loss": 2.5004382133483887, "lr": 8.818848637724681e-06, "epoch": 0.9054621848739496, "percentage": 30.18, "elapsed_time": "0:07:47", "remaining_time": "0:18:02"} +{"current_steps": 432, "total_steps": 1428, "loss": 2.612011194229126, "lr": 8.810946715563798e-06, "epoch": 0.907563025210084, "percentage": 30.25, "elapsed_time": "0:07:49", "remaining_time": "0:18:01"} +{"current_steps": 433, "total_steps": 1428, "loss": 2.9700820446014404, "lr": 8.803022014848966e-06, "epoch": 0.9096638655462185, "percentage": 30.32, "elapsed_time": "0:07:50", "remaining_time": "0:18:00"} +{"current_steps": 434, "total_steps": 1428, "loss": 3.248368263244629, "lr": 8.795074582947214e-06, "epoch": 0.9117647058823529, "percentage": 30.39, "elapsed_time": "0:07:51", "remaining_time": "0:17:59"} +{"current_steps": 435, "total_steps": 1428, "loss": 2.993704319000244, "lr": 8.787104467361442e-06, "epoch": 0.9138655462184874, "percentage": 30.46, "elapsed_time": "0:07:52", "remaining_time": "0:17:58"} +{"current_steps": 436, "total_steps": 1428, "loss": 2.6930155754089355, "lr": 8.779111715730127e-06, "epoch": 0.9159663865546218, "percentage": 30.53, "elapsed_time": "0:07:53", "remaining_time": "0:17:57"} +{"current_steps": 437, "total_steps": 1428, "loss": 3.069434404373169, "lr": 8.771096375827047e-06, "epoch": 0.9180672268907563, "percentage": 30.6, "elapsed_time": "0:07:54", "remaining_time": "0:17:55"} +{"current_steps": 438, "total_steps": 1428, "loss": 3.1358611583709717, "lr": 8.763058495560994e-06, "epoch": 0.9201680672268907, "percentage": 30.67, "elapsed_time": "0:07:55", "remaining_time": "0:17:54"} +{"current_steps": 439, "total_steps": 1428, "loss": 3.2987184524536133, "lr": 8.754998122975489e-06, "epoch": 0.9222689075630253, "percentage": 30.74, "elapsed_time": "0:07:56", "remaining_time": "0:17:53"} +{"current_steps": 440, "total_steps": 1428, "loss": 2.9279255867004395, "lr": 8.746915306248488e-06, "epoch": 0.9243697478991597, "percentage": 30.81, "elapsed_time": "0:07:57", "remaining_time": "0:17:52"} +{"current_steps": 441, "total_steps": 1428, "loss": 2.795942783355713, "lr": 8.7388100936921e-06, "epoch": 0.9264705882352942, "percentage": 30.88, "elapsed_time": "0:07:58", "remaining_time": "0:17:51"} +{"current_steps": 442, "total_steps": 1428, "loss": 2.7590699195861816, "lr": 8.730682533752301e-06, "epoch": 0.9285714285714286, "percentage": 30.95, "elapsed_time": "0:07:59", "remaining_time": "0:17:50"} +{"current_steps": 443, "total_steps": 1428, "loss": 2.6571459770202637, "lr": 8.722532675008635e-06, "epoch": 0.930672268907563, "percentage": 31.02, "elapsed_time": "0:08:00", "remaining_time": "0:17:49"} +{"current_steps": 444, "total_steps": 1428, "loss": 2.7342920303344727, "lr": 8.714360566173932e-06, "epoch": 0.9327731092436975, "percentage": 31.09, "elapsed_time": "0:08:01", "remaining_time": "0:17:48"} +{"current_steps": 445, "total_steps": 1428, "loss": 2.9492366313934326, "lr": 8.706166256094013e-06, "epoch": 0.9348739495798319, "percentage": 31.16, "elapsed_time": "0:08:03", "remaining_time": "0:17:47"} +{"current_steps": 446, "total_steps": 1428, "loss": 2.937699317932129, "lr": 8.6979497937474e-06, "epoch": 0.9369747899159664, "percentage": 31.23, "elapsed_time": "0:08:04", "remaining_time": "0:17:45"} +{"current_steps": 447, "total_steps": 1428, "loss": 3.23824405670166, "lr": 8.689711228245021e-06, "epoch": 0.9390756302521008, "percentage": 31.3, "elapsed_time": "0:08:05", "remaining_time": "0:17:44"} +{"current_steps": 448, "total_steps": 1428, "loss": 2.542668581008911, "lr": 8.681450608829916e-06, "epoch": 0.9411764705882353, "percentage": 31.37, "elapsed_time": "0:08:06", "remaining_time": "0:17:43"} +{"current_steps": 449, "total_steps": 1428, "loss": 3.257632255554199, "lr": 8.67316798487695e-06, "epoch": 0.9432773109243697, "percentage": 31.44, "elapsed_time": "0:08:07", "remaining_time": "0:17:42"} +{"current_steps": 450, "total_steps": 1428, "loss": 2.7072958946228027, "lr": 8.664863405892506e-06, "epoch": 0.9453781512605042, "percentage": 31.51, "elapsed_time": "0:08:08", "remaining_time": "0:17:41"} +{"current_steps": 451, "total_steps": 1428, "loss": 2.532301664352417, "lr": 8.656536921514195e-06, "epoch": 0.9474789915966386, "percentage": 31.58, "elapsed_time": "0:08:09", "remaining_time": "0:17:40"} +{"current_steps": 452, "total_steps": 1428, "loss": 2.726604461669922, "lr": 8.648188581510567e-06, "epoch": 0.9495798319327731, "percentage": 31.65, "elapsed_time": "0:08:10", "remaining_time": "0:17:39"} +{"current_steps": 453, "total_steps": 1428, "loss": 2.516594886779785, "lr": 8.639818435780797e-06, "epoch": 0.9516806722689075, "percentage": 31.72, "elapsed_time": "0:08:11", "remaining_time": "0:17:38"} +{"current_steps": 454, "total_steps": 1428, "loss": 2.7706644535064697, "lr": 8.631426534354404e-06, "epoch": 0.9537815126050421, "percentage": 31.79, "elapsed_time": "0:08:12", "remaining_time": "0:17:37"} +{"current_steps": 455, "total_steps": 1428, "loss": 3.2427144050598145, "lr": 8.623012927390936e-06, "epoch": 0.9558823529411765, "percentage": 31.86, "elapsed_time": "0:08:13", "remaining_time": "0:17:35"} +{"current_steps": 456, "total_steps": 1428, "loss": 3.1202523708343506, "lr": 8.614577665179684e-06, "epoch": 0.957983193277311, "percentage": 31.93, "elapsed_time": "0:08:14", "remaining_time": "0:17:34"} +{"current_steps": 457, "total_steps": 1428, "loss": 2.6210598945617676, "lr": 8.606120798139375e-06, "epoch": 0.9600840336134454, "percentage": 32.0, "elapsed_time": "0:08:15", "remaining_time": "0:17:33"} +{"current_steps": 458, "total_steps": 1428, "loss": 2.669271469116211, "lr": 8.597642376817865e-06, "epoch": 0.9621848739495799, "percentage": 32.07, "elapsed_time": "0:08:17", "remaining_time": "0:17:32"} +{"current_steps": 459, "total_steps": 1428, "loss": 2.6489734649658203, "lr": 8.589142451891849e-06, "epoch": 0.9642857142857143, "percentage": 32.14, "elapsed_time": "0:08:18", "remaining_time": "0:17:31"} +{"current_steps": 460, "total_steps": 1428, "loss": 3.10178804397583, "lr": 8.580621074166553e-06, "epoch": 0.9663865546218487, "percentage": 32.21, "elapsed_time": "0:08:19", "remaining_time": "0:17:30"} +{"current_steps": 461, "total_steps": 1428, "loss": 2.589158296585083, "lr": 8.572078294575423e-06, "epoch": 0.9684873949579832, "percentage": 32.28, "elapsed_time": "0:08:20", "remaining_time": "0:17:29"} +{"current_steps": 462, "total_steps": 1428, "loss": 2.5543792247772217, "lr": 8.56351416417983e-06, "epoch": 0.9705882352941176, "percentage": 32.35, "elapsed_time": "0:08:21", "remaining_time": "0:17:28"} +{"current_steps": 463, "total_steps": 1428, "loss": 2.65985369682312, "lr": 8.554928734168767e-06, "epoch": 0.9726890756302521, "percentage": 32.42, "elapsed_time": "0:08:22", "remaining_time": "0:17:27"} +{"current_steps": 464, "total_steps": 1428, "loss": 3.0177440643310547, "lr": 8.546322055858526e-06, "epoch": 0.9747899159663865, "percentage": 32.49, "elapsed_time": "0:08:23", "remaining_time": "0:17:25"} +{"current_steps": 465, "total_steps": 1428, "loss": 2.2767248153686523, "lr": 8.537694180692416e-06, "epoch": 0.976890756302521, "percentage": 32.56, "elapsed_time": "0:08:24", "remaining_time": "0:17:24"} +{"current_steps": 466, "total_steps": 1428, "loss": 2.7835707664489746, "lr": 8.529045160240433e-06, "epoch": 0.9789915966386554, "percentage": 32.63, "elapsed_time": "0:08:25", "remaining_time": "0:17:23"} +{"current_steps": 467, "total_steps": 1428, "loss": 2.4373722076416016, "lr": 8.520375046198965e-06, "epoch": 0.9810924369747899, "percentage": 32.7, "elapsed_time": "0:08:26", "remaining_time": "0:17:22"} +{"current_steps": 468, "total_steps": 1428, "loss": 2.464303731918335, "lr": 8.51168389039048e-06, "epoch": 0.9831932773109243, "percentage": 32.77, "elapsed_time": "0:08:27", "remaining_time": "0:17:21"} +{"current_steps": 469, "total_steps": 1428, "loss": 2.2609100341796875, "lr": 8.502971744763216e-06, "epoch": 0.9852941176470589, "percentage": 32.84, "elapsed_time": "0:08:28", "remaining_time": "0:17:20"} +{"current_steps": 470, "total_steps": 1428, "loss": 3.0135858058929443, "lr": 8.494238661390865e-06, "epoch": 0.9873949579831933, "percentage": 32.91, "elapsed_time": "0:08:29", "remaining_time": "0:17:19"} +{"current_steps": 471, "total_steps": 1428, "loss": 2.770965099334717, "lr": 8.485484692472272e-06, "epoch": 0.9894957983193278, "percentage": 32.98, "elapsed_time": "0:08:31", "remaining_time": "0:17:18"} +{"current_steps": 472, "total_steps": 1428, "loss": 2.6243722438812256, "lr": 8.476709890331116e-06, "epoch": 0.9915966386554622, "percentage": 33.05, "elapsed_time": "0:08:32", "remaining_time": "0:17:17"} +{"current_steps": 473, "total_steps": 1428, "loss": 2.9319207668304443, "lr": 8.467914307415601e-06, "epoch": 0.9936974789915967, "percentage": 33.12, "elapsed_time": "0:08:33", "remaining_time": "0:17:16"} +{"current_steps": 474, "total_steps": 1428, "loss": 3.0626072883605957, "lr": 8.459097996298137e-06, "epoch": 0.9957983193277311, "percentage": 33.19, "elapsed_time": "0:08:34", "remaining_time": "0:17:15"} +{"current_steps": 475, "total_steps": 1428, "loss": 3.000889778137207, "lr": 8.45026100967503e-06, "epoch": 0.9978991596638656, "percentage": 33.26, "elapsed_time": "0:08:35", "remaining_time": "0:17:13"} +{"current_steps": 476, "total_steps": 1428, "loss": 3.112825393676758, "lr": 8.441403400366169e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:08:36", "remaining_time": "0:17:12"} +{"current_steps": 477, "total_steps": 1428, "loss": 1.4137624502182007, "lr": 8.432525221314708e-06, "epoch": 1.0021008403361344, "percentage": 33.4, "elapsed_time": "0:10:15", "remaining_time": "0:20:27"} +{"current_steps": 478, "total_steps": 1428, "loss": 1.6808059215545654, "lr": 8.423626525586744e-06, "epoch": 1.004201680672269, "percentage": 33.47, "elapsed_time": "0:10:16", "remaining_time": "0:20:26"} +{"current_steps": 479, "total_steps": 1428, "loss": 1.8797330856323242, "lr": 8.414707366371006e-06, "epoch": 1.0063025210084033, "percentage": 33.54, "elapsed_time": "0:10:18", "remaining_time": "0:20:24"} +{"current_steps": 480, "total_steps": 1428, "loss": 1.9548699855804443, "lr": 8.405767796978546e-06, "epoch": 1.0084033613445378, "percentage": 33.61, "elapsed_time": "0:10:19", "remaining_time": "0:20:22"} +{"current_steps": 481, "total_steps": 1428, "loss": 1.5713114738464355, "lr": 8.396807870842396e-06, "epoch": 1.0105042016806722, "percentage": 33.68, "elapsed_time": "0:10:20", "remaining_time": "0:20:21"} +{"current_steps": 482, "total_steps": 1428, "loss": 1.69504976272583, "lr": 8.387827641517274e-06, "epoch": 1.0126050420168067, "percentage": 33.75, "elapsed_time": "0:10:21", "remaining_time": "0:20:19"} +{"current_steps": 483, "total_steps": 1428, "loss": 1.3813257217407227, "lr": 8.378827162679248e-06, "epoch": 1.0147058823529411, "percentage": 33.82, "elapsed_time": "0:10:22", "remaining_time": "0:20:17"} +{"current_steps": 484, "total_steps": 1428, "loss": 2.4568567276000977, "lr": 8.369806488125418e-06, "epoch": 1.0168067226890756, "percentage": 33.89, "elapsed_time": "0:10:23", "remaining_time": "0:20:16"} +{"current_steps": 485, "total_steps": 1428, "loss": 2.602184534072876, "lr": 8.360765671773603e-06, "epoch": 1.01890756302521, "percentage": 33.96, "elapsed_time": "0:10:24", "remaining_time": "0:20:14"} +{"current_steps": 486, "total_steps": 1428, "loss": 1.8193070888519287, "lr": 8.351704767662005e-06, "epoch": 1.0210084033613445, "percentage": 34.03, "elapsed_time": "0:10:25", "remaining_time": "0:20:12"} +{"current_steps": 487, "total_steps": 1428, "loss": 1.4549766778945923, "lr": 8.3426238299489e-06, "epoch": 1.023109243697479, "percentage": 34.1, "elapsed_time": "0:10:26", "remaining_time": "0:20:10"} +{"current_steps": 488, "total_steps": 1428, "loss": 1.4681106805801392, "lr": 8.333522912912308e-06, "epoch": 1.0252100840336134, "percentage": 34.17, "elapsed_time": "0:10:27", "remaining_time": "0:20:09"} +{"current_steps": 489, "total_steps": 1428, "loss": 1.4224164485931396, "lr": 8.324402070949658e-06, "epoch": 1.0273109243697478, "percentage": 34.24, "elapsed_time": "0:10:28", "remaining_time": "0:20:07"} +{"current_steps": 490, "total_steps": 1428, "loss": 2.200676441192627, "lr": 8.315261358577485e-06, "epoch": 1.0294117647058822, "percentage": 34.31, "elapsed_time": "0:10:29", "remaining_time": "0:20:05"} +{"current_steps": 491, "total_steps": 1428, "loss": 1.867397665977478, "lr": 8.306100830431085e-06, "epoch": 1.0315126050420167, "percentage": 34.38, "elapsed_time": "0:10:31", "remaining_time": "0:20:04"} +{"current_steps": 492, "total_steps": 1428, "loss": 1.4270985126495361, "lr": 8.296920541264197e-06, "epoch": 1.0336134453781514, "percentage": 34.45, "elapsed_time": "0:10:32", "remaining_time": "0:20:02"} +{"current_steps": 493, "total_steps": 1428, "loss": 1.464069128036499, "lr": 8.287720545948676e-06, "epoch": 1.0357142857142858, "percentage": 34.52, "elapsed_time": "0:10:33", "remaining_time": "0:20:00"} +{"current_steps": 494, "total_steps": 1428, "loss": 1.192551612854004, "lr": 8.278500899474162e-06, "epoch": 1.0378151260504203, "percentage": 34.59, "elapsed_time": "0:10:34", "remaining_time": "0:19:59"} +{"current_steps": 495, "total_steps": 1428, "loss": 2.367762327194214, "lr": 8.269261656947755e-06, "epoch": 1.0399159663865547, "percentage": 34.66, "elapsed_time": "0:10:35", "remaining_time": "0:19:57"} +{"current_steps": 496, "total_steps": 1428, "loss": 1.6752372980117798, "lr": 8.260002873593679e-06, "epoch": 1.0420168067226891, "percentage": 34.73, "elapsed_time": "0:10:36", "remaining_time": "0:19:55"} +{"current_steps": 497, "total_steps": 1428, "loss": 1.409712314605713, "lr": 8.25072460475296e-06, "epoch": 1.0441176470588236, "percentage": 34.8, "elapsed_time": "0:10:37", "remaining_time": "0:19:54"} +{"current_steps": 498, "total_steps": 1428, "loss": 1.6270588636398315, "lr": 8.24142690588309e-06, "epoch": 1.046218487394958, "percentage": 34.87, "elapsed_time": "0:10:38", "remaining_time": "0:19:52"} +{"current_steps": 499, "total_steps": 1428, "loss": 1.4294947385787964, "lr": 8.232109832557696e-06, "epoch": 1.0483193277310925, "percentage": 34.94, "elapsed_time": "0:10:39", "remaining_time": "0:19:50"} +{"current_steps": 500, "total_steps": 1428, "loss": 1.2340010404586792, "lr": 8.222773440466213e-06, "epoch": 1.050420168067227, "percentage": 35.01, "elapsed_time": "0:10:40", "remaining_time": "0:19:49"} +{"current_steps": 501, "total_steps": 1428, "loss": 1.451041340827942, "lr": 8.213417785413538e-06, "epoch": 1.0525210084033614, "percentage": 35.08, "elapsed_time": "0:10:41", "remaining_time": "0:19:47"} +{"current_steps": 502, "total_steps": 1428, "loss": 0.8124719858169556, "lr": 8.204042923319717e-06, "epoch": 1.0546218487394958, "percentage": 35.15, "elapsed_time": "0:10:42", "remaining_time": "0:19:46"} +{"current_steps": 503, "total_steps": 1428, "loss": 1.5310864448547363, "lr": 8.19464891021959e-06, "epoch": 1.0567226890756303, "percentage": 35.22, "elapsed_time": "0:10:44", "remaining_time": "0:19:44"} +{"current_steps": 504, "total_steps": 1428, "loss": 1.2139228582382202, "lr": 8.18523580226247e-06, "epoch": 1.0588235294117647, "percentage": 35.29, "elapsed_time": "0:10:45", "remaining_time": "0:19:42"} +{"current_steps": 505, "total_steps": 1428, "loss": 1.3573241233825684, "lr": 8.1758036557118e-06, "epoch": 1.0609243697478992, "percentage": 35.36, "elapsed_time": "0:10:46", "remaining_time": "0:19:41"} +{"current_steps": 506, "total_steps": 1428, "loss": 1.9899749755859375, "lr": 8.166352526944821e-06, "epoch": 1.0630252100840336, "percentage": 35.43, "elapsed_time": "0:10:47", "remaining_time": "0:19:39"} +{"current_steps": 507, "total_steps": 1428, "loss": 1.4103593826293945, "lr": 8.156882472452232e-06, "epoch": 1.065126050420168, "percentage": 35.5, "elapsed_time": "0:10:48", "remaining_time": "0:19:37"} +{"current_steps": 508, "total_steps": 1428, "loss": 1.227393627166748, "lr": 8.147393548837856e-06, "epoch": 1.0672268907563025, "percentage": 35.57, "elapsed_time": "0:10:49", "remaining_time": "0:19:36"} +{"current_steps": 509, "total_steps": 1428, "loss": 1.7060927152633667, "lr": 8.137885812818296e-06, "epoch": 1.069327731092437, "percentage": 35.64, "elapsed_time": "0:10:50", "remaining_time": "0:19:34"} +{"current_steps": 510, "total_steps": 1428, "loss": 1.890432357788086, "lr": 8.128359321222601e-06, "epoch": 1.0714285714285714, "percentage": 35.71, "elapsed_time": "0:10:51", "remaining_time": "0:19:32"} +{"current_steps": 511, "total_steps": 1428, "loss": 1.8258857727050781, "lr": 8.118814130991925e-06, "epoch": 1.0735294117647058, "percentage": 35.78, "elapsed_time": "0:10:52", "remaining_time": "0:19:31"} +{"current_steps": 512, "total_steps": 1428, "loss": 0.9584097862243652, "lr": 8.109250299179188e-06, "epoch": 1.0756302521008403, "percentage": 35.85, "elapsed_time": "0:10:53", "remaining_time": "0:19:29"} +{"current_steps": 513, "total_steps": 1428, "loss": 1.4017150402069092, "lr": 8.09966788294873e-06, "epoch": 1.0777310924369747, "percentage": 35.92, "elapsed_time": "0:10:54", "remaining_time": "0:19:28"} +{"current_steps": 514, "total_steps": 1428, "loss": 1.3034381866455078, "lr": 8.090066939575972e-06, "epoch": 1.0798319327731092, "percentage": 35.99, "elapsed_time": "0:10:55", "remaining_time": "0:19:26"} +{"current_steps": 515, "total_steps": 1428, "loss": 1.0734150409698486, "lr": 8.080447526447079e-06, "epoch": 1.0819327731092436, "percentage": 36.06, "elapsed_time": "0:10:57", "remaining_time": "0:19:24"} +{"current_steps": 516, "total_steps": 1428, "loss": 0.8819087743759155, "lr": 8.070809701058606e-06, "epoch": 1.084033613445378, "percentage": 36.13, "elapsed_time": "0:10:58", "remaining_time": "0:19:23"} +{"current_steps": 517, "total_steps": 1428, "loss": 1.3253920078277588, "lr": 8.061153521017169e-06, "epoch": 1.0861344537815125, "percentage": 36.2, "elapsed_time": "0:10:59", "remaining_time": "0:19:21"} +{"current_steps": 518, "total_steps": 1428, "loss": 1.0912744998931885, "lr": 8.051479044039086e-06, "epoch": 1.088235294117647, "percentage": 36.27, "elapsed_time": "0:11:00", "remaining_time": "0:19:20"} +{"current_steps": 519, "total_steps": 1428, "loss": 1.6941767930984497, "lr": 8.041786327950037e-06, "epoch": 1.0903361344537814, "percentage": 36.34, "elapsed_time": "0:11:01", "remaining_time": "0:19:18"} +{"current_steps": 520, "total_steps": 1428, "loss": 1.058671236038208, "lr": 8.032075430684724e-06, "epoch": 1.092436974789916, "percentage": 36.41, "elapsed_time": "0:11:02", "remaining_time": "0:19:16"} +{"current_steps": 521, "total_steps": 1428, "loss": 1.1603420972824097, "lr": 8.02234641028652e-06, "epoch": 1.0945378151260505, "percentage": 36.48, "elapsed_time": "0:11:03", "remaining_time": "0:19:15"} +{"current_steps": 522, "total_steps": 1428, "loss": 1.4285218715667725, "lr": 8.012599324907121e-06, "epoch": 1.096638655462185, "percentage": 36.55, "elapsed_time": "0:11:04", "remaining_time": "0:19:13"} +{"current_steps": 523, "total_steps": 1428, "loss": 1.3041057586669922, "lr": 8.0028342328062e-06, "epoch": 1.0987394957983194, "percentage": 36.62, "elapsed_time": "0:11:05", "remaining_time": "0:19:12"} +{"current_steps": 524, "total_steps": 1428, "loss": 2.329005718231201, "lr": 7.993051192351056e-06, "epoch": 1.1008403361344539, "percentage": 36.69, "elapsed_time": "0:11:06", "remaining_time": "0:19:10"} +{"current_steps": 525, "total_steps": 1428, "loss": 0.7331016063690186, "lr": 7.983250262016276e-06, "epoch": 1.1029411764705883, "percentage": 36.76, "elapsed_time": "0:11:07", "remaining_time": "0:19:08"} +{"current_steps": 526, "total_steps": 1428, "loss": 2.193528175354004, "lr": 7.973431500383366e-06, "epoch": 1.1050420168067228, "percentage": 36.83, "elapsed_time": "0:11:09", "remaining_time": "0:19:07"} +{"current_steps": 527, "total_steps": 1428, "loss": 1.3245251178741455, "lr": 7.963594966140423e-06, "epoch": 1.1071428571428572, "percentage": 36.9, "elapsed_time": "0:11:10", "remaining_time": "0:19:05"} +{"current_steps": 528, "total_steps": 1428, "loss": 1.1308670043945312, "lr": 7.953740718081765e-06, "epoch": 1.1092436974789917, "percentage": 36.97, "elapsed_time": "0:11:11", "remaining_time": "0:19:04"} +{"current_steps": 529, "total_steps": 1428, "loss": 1.3318034410476685, "lr": 7.943868815107594e-06, "epoch": 1.111344537815126, "percentage": 37.04, "elapsed_time": "0:11:12", "remaining_time": "0:19:02"} +{"current_steps": 530, "total_steps": 1428, "loss": 1.2564438581466675, "lr": 7.933979316223632e-06, "epoch": 1.1134453781512605, "percentage": 37.11, "elapsed_time": "0:11:13", "remaining_time": "0:19:00"} +{"current_steps": 531, "total_steps": 1428, "loss": 1.2420412302017212, "lr": 7.92407228054078e-06, "epoch": 1.115546218487395, "percentage": 37.18, "elapsed_time": "0:11:14", "remaining_time": "0:18:59"} +{"current_steps": 532, "total_steps": 1428, "loss": 1.9582582712173462, "lr": 7.914147767274756e-06, "epoch": 1.1176470588235294, "percentage": 37.25, "elapsed_time": "0:11:15", "remaining_time": "0:18:57"} +{"current_steps": 533, "total_steps": 1428, "loss": 1.7057411670684814, "lr": 7.904205835745744e-06, "epoch": 1.1197478991596639, "percentage": 37.32, "elapsed_time": "0:11:16", "remaining_time": "0:18:56"} +{"current_steps": 534, "total_steps": 1428, "loss": 1.810387134552002, "lr": 7.894246545378037e-06, "epoch": 1.1218487394957983, "percentage": 37.39, "elapsed_time": "0:11:17", "remaining_time": "0:18:54"} +{"current_steps": 535, "total_steps": 1428, "loss": 1.6038577556610107, "lr": 7.884269955699689e-06, "epoch": 1.1239495798319328, "percentage": 37.46, "elapsed_time": "0:11:18", "remaining_time": "0:18:53"} +{"current_steps": 536, "total_steps": 1428, "loss": 1.1410393714904785, "lr": 7.874276126342151e-06, "epoch": 1.1260504201680672, "percentage": 37.54, "elapsed_time": "0:11:19", "remaining_time": "0:18:51"} +{"current_steps": 537, "total_steps": 1428, "loss": 2.28239369392395, "lr": 7.86426511703992e-06, "epoch": 1.1281512605042017, "percentage": 37.61, "elapsed_time": "0:11:20", "remaining_time": "0:18:49"} +{"current_steps": 538, "total_steps": 1428, "loss": 2.1672444343566895, "lr": 7.854236987630178e-06, "epoch": 1.1302521008403361, "percentage": 37.68, "elapsed_time": "0:11:22", "remaining_time": "0:18:48"} +{"current_steps": 539, "total_steps": 1428, "loss": 1.7712535858154297, "lr": 7.844191798052438e-06, "epoch": 1.1323529411764706, "percentage": 37.75, "elapsed_time": "0:11:23", "remaining_time": "0:18:46"} +{"current_steps": 540, "total_steps": 1428, "loss": 1.4109793901443481, "lr": 7.834129608348183e-06, "epoch": 1.134453781512605, "percentage": 37.82, "elapsed_time": "0:11:24", "remaining_time": "0:18:45"} +{"current_steps": 541, "total_steps": 1428, "loss": 1.4405725002288818, "lr": 7.824050478660506e-06, "epoch": 1.1365546218487395, "percentage": 37.89, "elapsed_time": "0:11:25", "remaining_time": "0:18:43"} +{"current_steps": 542, "total_steps": 1428, "loss": 2.2450976371765137, "lr": 7.813954469233758e-06, "epoch": 1.138655462184874, "percentage": 37.96, "elapsed_time": "0:11:26", "remaining_time": "0:18:42"} +{"current_steps": 543, "total_steps": 1428, "loss": 2.16367244720459, "lr": 7.803841640413177e-06, "epoch": 1.1407563025210083, "percentage": 38.03, "elapsed_time": "0:11:27", "remaining_time": "0:18:40"} +{"current_steps": 544, "total_steps": 1428, "loss": 2.3919224739074707, "lr": 7.793712052644535e-06, "epoch": 1.1428571428571428, "percentage": 38.1, "elapsed_time": "0:11:28", "remaining_time": "0:18:39"} +{"current_steps": 545, "total_steps": 1428, "loss": 1.4211726188659668, "lr": 7.783565766473777e-06, "epoch": 1.1449579831932772, "percentage": 38.17, "elapsed_time": "0:11:29", "remaining_time": "0:18:37"} +{"current_steps": 546, "total_steps": 1428, "loss": 1.2502498626708984, "lr": 7.773402842546654e-06, "epoch": 1.1470588235294117, "percentage": 38.24, "elapsed_time": "0:11:30", "remaining_time": "0:18:35"} +{"current_steps": 547, "total_steps": 1428, "loss": 1.423762321472168, "lr": 7.76322334160836e-06, "epoch": 1.1491596638655461, "percentage": 38.31, "elapsed_time": "0:11:31", "remaining_time": "0:18:34"} +{"current_steps": 548, "total_steps": 1428, "loss": 1.1090279817581177, "lr": 7.75302732450318e-06, "epoch": 1.1512605042016806, "percentage": 38.38, "elapsed_time": "0:11:32", "remaining_time": "0:18:32"} +{"current_steps": 549, "total_steps": 1428, "loss": 1.0321426391601562, "lr": 7.742814852174112e-06, "epoch": 1.153361344537815, "percentage": 38.45, "elapsed_time": "0:11:34", "remaining_time": "0:18:31"} +{"current_steps": 550, "total_steps": 1428, "loss": 1.0928632020950317, "lr": 7.73258598566251e-06, "epoch": 1.1554621848739495, "percentage": 38.52, "elapsed_time": "0:11:35", "remaining_time": "0:18:29"} +{"current_steps": 551, "total_steps": 1428, "loss": 1.2369472980499268, "lr": 7.72234078610772e-06, "epoch": 1.157563025210084, "percentage": 38.59, "elapsed_time": "0:11:36", "remaining_time": "0:18:28"} +{"current_steps": 552, "total_steps": 1428, "loss": 1.2957392930984497, "lr": 7.712079314746716e-06, "epoch": 1.1596638655462184, "percentage": 38.66, "elapsed_time": "0:11:37", "remaining_time": "0:18:26"} +{"current_steps": 553, "total_steps": 1428, "loss": 1.6709070205688477, "lr": 7.701801632913722e-06, "epoch": 1.161764705882353, "percentage": 38.73, "elapsed_time": "0:11:38", "remaining_time": "0:18:25"} +{"current_steps": 554, "total_steps": 1428, "loss": 1.6091077327728271, "lr": 7.691507802039861e-06, "epoch": 1.1638655462184875, "percentage": 38.8, "elapsed_time": "0:11:39", "remaining_time": "0:18:23"} +{"current_steps": 555, "total_steps": 1428, "loss": 1.8003133535385132, "lr": 7.68119788365278e-06, "epoch": 1.165966386554622, "percentage": 38.87, "elapsed_time": "0:11:40", "remaining_time": "0:18:21"} +{"current_steps": 556, "total_steps": 1428, "loss": 1.0151593685150146, "lr": 7.670871939376281e-06, "epoch": 1.1680672268907564, "percentage": 38.94, "elapsed_time": "0:11:41", "remaining_time": "0:18:20"} +{"current_steps": 557, "total_steps": 1428, "loss": 1.3084783554077148, "lr": 7.660530030929961e-06, "epoch": 1.1701680672268908, "percentage": 39.01, "elapsed_time": "0:11:42", "remaining_time": "0:18:18"} +{"current_steps": 558, "total_steps": 1428, "loss": 1.3882572650909424, "lr": 7.650172220128828e-06, "epoch": 1.1722689075630253, "percentage": 39.08, "elapsed_time": "0:11:43", "remaining_time": "0:18:17"} +{"current_steps": 559, "total_steps": 1428, "loss": 1.3919298648834229, "lr": 7.639798568882947e-06, "epoch": 1.1743697478991597, "percentage": 39.15, "elapsed_time": "0:11:44", "remaining_time": "0:18:15"} +{"current_steps": 560, "total_steps": 1428, "loss": 1.3745830059051514, "lr": 7.629409139197063e-06, "epoch": 1.1764705882352942, "percentage": 39.22, "elapsed_time": "0:11:45", "remaining_time": "0:18:14"} +{"current_steps": 561, "total_steps": 1428, "loss": 1.2964568138122559, "lr": 7.619003993170226e-06, "epoch": 1.1785714285714286, "percentage": 39.29, "elapsed_time": "0:11:46", "remaining_time": "0:18:12"} +{"current_steps": 562, "total_steps": 1428, "loss": 1.75518798828125, "lr": 7.608583192995433e-06, "epoch": 1.180672268907563, "percentage": 39.36, "elapsed_time": "0:11:48", "remaining_time": "0:18:11"} +{"current_steps": 563, "total_steps": 1428, "loss": 2.156588554382324, "lr": 7.598146800959238e-06, "epoch": 1.1827731092436975, "percentage": 39.43, "elapsed_time": "0:11:49", "remaining_time": "0:18:09"} +{"current_steps": 564, "total_steps": 1428, "loss": 1.3602566719055176, "lr": 7.5876948794414015e-06, "epoch": 1.184873949579832, "percentage": 39.5, "elapsed_time": "0:11:50", "remaining_time": "0:18:08"} +{"current_steps": 565, "total_steps": 1428, "loss": 1.5620733499526978, "lr": 7.577227490914495e-06, "epoch": 1.1869747899159664, "percentage": 39.57, "elapsed_time": "0:11:51", "remaining_time": "0:18:06"} +{"current_steps": 566, "total_steps": 1428, "loss": 0.971282422542572, "lr": 7.5667446979435445e-06, "epoch": 1.1890756302521008, "percentage": 39.64, "elapsed_time": "0:11:52", "remaining_time": "0:18:04"} +{"current_steps": 567, "total_steps": 1428, "loss": 1.1717581748962402, "lr": 7.556246563185648e-06, "epoch": 1.1911764705882353, "percentage": 39.71, "elapsed_time": "0:11:53", "remaining_time": "0:18:03"} +{"current_steps": 568, "total_steps": 1428, "loss": 1.8813025951385498, "lr": 7.545733149389605e-06, "epoch": 1.1932773109243697, "percentage": 39.78, "elapsed_time": "0:11:54", "remaining_time": "0:18:01"} +{"current_steps": 569, "total_steps": 1428, "loss": 1.280207633972168, "lr": 7.535204519395538e-06, "epoch": 1.1953781512605042, "percentage": 39.85, "elapsed_time": "0:11:55", "remaining_time": "0:18:00"} +{"current_steps": 570, "total_steps": 1428, "loss": 1.5685778856277466, "lr": 7.5246607361345215e-06, "epoch": 1.1974789915966386, "percentage": 39.92, "elapsed_time": "0:11:56", "remaining_time": "0:17:58"} +{"current_steps": 571, "total_steps": 1428, "loss": 2.2011172771453857, "lr": 7.514101862628203e-06, "epoch": 1.199579831932773, "percentage": 39.99, "elapsed_time": "0:11:57", "remaining_time": "0:17:57"} +{"current_steps": 572, "total_steps": 1428, "loss": 2.0038180351257324, "lr": 7.503527961988422e-06, "epoch": 1.2016806722689075, "percentage": 40.06, "elapsed_time": "0:11:58", "remaining_time": "0:17:55"} +{"current_steps": 573, "total_steps": 1428, "loss": 1.1275922060012817, "lr": 7.492939097416842e-06, "epoch": 1.203781512605042, "percentage": 40.13, "elapsed_time": "0:11:59", "remaining_time": "0:17:54"} +{"current_steps": 574, "total_steps": 1428, "loss": 1.208678960800171, "lr": 7.482335332204568e-06, "epoch": 1.2058823529411764, "percentage": 40.2, "elapsed_time": "0:12:01", "remaining_time": "0:17:52"} +{"current_steps": 575, "total_steps": 1428, "loss": 1.7450125217437744, "lr": 7.471716729731764e-06, "epoch": 1.2079831932773109, "percentage": 40.27, "elapsed_time": "0:12:02", "remaining_time": "0:17:51"} +{"current_steps": 576, "total_steps": 1428, "loss": 1.5381510257720947, "lr": 7.461083353467283e-06, "epoch": 1.2100840336134453, "percentage": 40.34, "elapsed_time": "0:12:03", "remaining_time": "0:17:49"} +{"current_steps": 577, "total_steps": 1428, "loss": 1.6857651472091675, "lr": 7.450435266968279e-06, "epoch": 1.2121848739495797, "percentage": 40.41, "elapsed_time": "0:12:04", "remaining_time": "0:17:48"} +{"current_steps": 578, "total_steps": 1428, "loss": 1.9049471616744995, "lr": 7.4397725338798365e-06, "epoch": 1.2142857142857142, "percentage": 40.48, "elapsed_time": "0:12:05", "remaining_time": "0:17:46"} +{"current_steps": 579, "total_steps": 1428, "loss": 2.2398974895477295, "lr": 7.429095217934578e-06, "epoch": 1.2163865546218489, "percentage": 40.55, "elapsed_time": "0:12:06", "remaining_time": "0:17:45"} +{"current_steps": 580, "total_steps": 1428, "loss": 1.8767409324645996, "lr": 7.4184033829522935e-06, "epoch": 1.2184873949579833, "percentage": 40.62, "elapsed_time": "0:12:07", "remaining_time": "0:17:43"} +{"current_steps": 581, "total_steps": 1428, "loss": 1.4787061214447021, "lr": 7.4076970928395565e-06, "epoch": 1.2205882352941178, "percentage": 40.69, "elapsed_time": "0:12:08", "remaining_time": "0:17:42"} +{"current_steps": 582, "total_steps": 1428, "loss": 1.1055876016616821, "lr": 7.396976411589338e-06, "epoch": 1.2226890756302522, "percentage": 40.76, "elapsed_time": "0:12:09", "remaining_time": "0:17:40"} +{"current_steps": 583, "total_steps": 1428, "loss": 1.668757438659668, "lr": 7.386241403280629e-06, "epoch": 1.2247899159663866, "percentage": 40.83, "elapsed_time": "0:12:10", "remaining_time": "0:17:39"} +{"current_steps": 584, "total_steps": 1428, "loss": 1.2818783521652222, "lr": 7.375492132078051e-06, "epoch": 1.226890756302521, "percentage": 40.9, "elapsed_time": "0:12:11", "remaining_time": "0:17:37"} +{"current_steps": 585, "total_steps": 1428, "loss": 1.578829050064087, "lr": 7.364728662231484e-06, "epoch": 1.2289915966386555, "percentage": 40.97, "elapsed_time": "0:12:12", "remaining_time": "0:17:36"} +{"current_steps": 586, "total_steps": 1428, "loss": 1.572939157485962, "lr": 7.353951058075669e-06, "epoch": 1.23109243697479, "percentage": 41.04, "elapsed_time": "0:12:14", "remaining_time": "0:17:34"} +{"current_steps": 587, "total_steps": 1428, "loss": 3.977992057800293, "lr": 7.343159384029833e-06, "epoch": 1.2331932773109244, "percentage": 41.11, "elapsed_time": "0:12:15", "remaining_time": "0:17:33"} +{"current_steps": 588, "total_steps": 1428, "loss": 1.955003023147583, "lr": 7.332353704597299e-06, "epoch": 1.2352941176470589, "percentage": 41.18, "elapsed_time": "0:12:16", "remaining_time": "0:17:31"} +{"current_steps": 589, "total_steps": 1428, "loss": 1.5401737689971924, "lr": 7.321534084365101e-06, "epoch": 1.2373949579831933, "percentage": 41.25, "elapsed_time": "0:12:17", "remaining_time": "0:17:30"} +{"current_steps": 590, "total_steps": 1428, "loss": 1.895308017730713, "lr": 7.310700588003605e-06, "epoch": 1.2394957983193278, "percentage": 41.32, "elapsed_time": "0:12:18", "remaining_time": "0:17:28"} +{"current_steps": 591, "total_steps": 1428, "loss": 1.6920474767684937, "lr": 7.299853280266109e-06, "epoch": 1.2415966386554622, "percentage": 41.39, "elapsed_time": "0:12:19", "remaining_time": "0:17:27"} +{"current_steps": 592, "total_steps": 1428, "loss": 1.9865736961364746, "lr": 7.28899222598847e-06, "epoch": 1.2436974789915967, "percentage": 41.46, "elapsed_time": "0:12:20", "remaining_time": "0:17:25"} +{"current_steps": 593, "total_steps": 1428, "loss": 1.2350941896438599, "lr": 7.278117490088703e-06, "epoch": 1.245798319327731, "percentage": 41.53, "elapsed_time": "0:12:21", "remaining_time": "0:17:24"} +{"current_steps": 594, "total_steps": 1428, "loss": 1.800095558166504, "lr": 7.267229137566607e-06, "epoch": 1.2478991596638656, "percentage": 41.6, "elapsed_time": "0:12:22", "remaining_time": "0:17:22"} +{"current_steps": 595, "total_steps": 1428, "loss": 1.848137617111206, "lr": 7.256327233503365e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:12:23", "remaining_time": "0:17:21"} +{"current_steps": 596, "total_steps": 1428, "loss": 1.7656617164611816, "lr": 7.24541184306116e-06, "epoch": 1.2521008403361344, "percentage": 41.74, "elapsed_time": "0:12:24", "remaining_time": "0:17:19"} +{"current_steps": 597, "total_steps": 1428, "loss": 1.0096323490142822, "lr": 7.234483031482787e-06, "epoch": 1.254201680672269, "percentage": 41.81, "elapsed_time": "0:12:25", "remaining_time": "0:17:18"} +{"current_steps": 598, "total_steps": 1428, "loss": 1.428197979927063, "lr": 7.223540864091259e-06, "epoch": 1.2563025210084033, "percentage": 41.88, "elapsed_time": "0:12:27", "remaining_time": "0:17:16"} +{"current_steps": 599, "total_steps": 1428, "loss": 1.0703970193862915, "lr": 7.2125854062894184e-06, "epoch": 1.2584033613445378, "percentage": 41.95, "elapsed_time": "0:12:28", "remaining_time": "0:17:15"} +{"current_steps": 600, "total_steps": 1428, "loss": 1.7873646020889282, "lr": 7.201616723559548e-06, "epoch": 1.2605042016806722, "percentage": 42.02, "elapsed_time": "0:12:29", "remaining_time": "0:17:13"} +{"current_steps": 601, "total_steps": 1428, "loss": 1.3262135982513428, "lr": 7.190634881462976e-06, "epoch": 1.2626050420168067, "percentage": 42.09, "elapsed_time": "0:12:30", "remaining_time": "0:17:12"} +{"current_steps": 602, "total_steps": 1428, "loss": 1.6294150352478027, "lr": 7.179639945639688e-06, "epoch": 1.2647058823529411, "percentage": 42.16, "elapsed_time": "0:12:31", "remaining_time": "0:17:10"} +{"current_steps": 603, "total_steps": 1428, "loss": 2.6409220695495605, "lr": 7.168631981807931e-06, "epoch": 1.2668067226890756, "percentage": 42.23, "elapsed_time": "0:12:32", "remaining_time": "0:17:09"} +{"current_steps": 604, "total_steps": 1428, "loss": 1.3407433032989502, "lr": 7.15761105576382e-06, "epoch": 1.26890756302521, "percentage": 42.3, "elapsed_time": "0:12:33", "remaining_time": "0:17:07"} +{"current_steps": 605, "total_steps": 1428, "loss": 1.1475789546966553, "lr": 7.1465772333809524e-06, "epoch": 1.2710084033613445, "percentage": 42.37, "elapsed_time": "0:12:34", "remaining_time": "0:17:06"} +{"current_steps": 606, "total_steps": 1428, "loss": 1.8270117044448853, "lr": 7.1355305806100036e-06, "epoch": 1.273109243697479, "percentage": 42.44, "elapsed_time": "0:12:35", "remaining_time": "0:17:04"} +{"current_steps": 607, "total_steps": 1428, "loss": 2.168900489807129, "lr": 7.124471163478344e-06, "epoch": 1.2752100840336134, "percentage": 42.51, "elapsed_time": "0:12:36", "remaining_time": "0:17:03"} +{"current_steps": 608, "total_steps": 1428, "loss": 2.0142345428466797, "lr": 7.113399048089631e-06, "epoch": 1.2773109243697478, "percentage": 42.58, "elapsed_time": "0:12:37", "remaining_time": "0:17:02"} +{"current_steps": 609, "total_steps": 1428, "loss": 2.015444755554199, "lr": 7.102314300623425e-06, "epoch": 1.2794117647058822, "percentage": 42.65, "elapsed_time": "0:12:38", "remaining_time": "0:17:00"} +{"current_steps": 610, "total_steps": 1428, "loss": 1.5882906913757324, "lr": 7.091216987334792e-06, "epoch": 1.2815126050420167, "percentage": 42.72, "elapsed_time": "0:12:39", "remaining_time": "0:16:59"} +{"current_steps": 611, "total_steps": 1428, "loss": 1.4543545246124268, "lr": 7.080107174553903e-06, "epoch": 1.2836134453781511, "percentage": 42.79, "elapsed_time": "0:12:41", "remaining_time": "0:16:57"} +{"current_steps": 612, "total_steps": 1428, "loss": 1.3196444511413574, "lr": 7.068984928685638e-06, "epoch": 1.2857142857142856, "percentage": 42.86, "elapsed_time": "0:12:42", "remaining_time": "0:16:56"} +{"current_steps": 613, "total_steps": 1428, "loss": 0.8601089715957642, "lr": 7.057850316209198e-06, "epoch": 1.28781512605042, "percentage": 42.93, "elapsed_time": "0:12:43", "remaining_time": "0:16:54"} +{"current_steps": 614, "total_steps": 1428, "loss": 1.334380865097046, "lr": 7.0467034036776945e-06, "epoch": 1.2899159663865547, "percentage": 43.0, "elapsed_time": "0:12:44", "remaining_time": "0:16:53"} +{"current_steps": 615, "total_steps": 1428, "loss": 1.4980111122131348, "lr": 7.035544257717761e-06, "epoch": 1.2920168067226891, "percentage": 43.07, "elapsed_time": "0:12:45", "remaining_time": "0:16:51"} +{"current_steps": 616, "total_steps": 1428, "loss": 1.9393174648284912, "lr": 7.024372945029152e-06, "epoch": 1.2941176470588236, "percentage": 43.14, "elapsed_time": "0:12:46", "remaining_time": "0:16:50"} +{"current_steps": 617, "total_steps": 1428, "loss": 1.1070374250411987, "lr": 7.013189532384343e-06, "epoch": 1.296218487394958, "percentage": 43.21, "elapsed_time": "0:12:47", "remaining_time": "0:16:48"} +{"current_steps": 618, "total_steps": 1428, "loss": 2.146557331085205, "lr": 7.001994086628133e-06, "epoch": 1.2983193277310925, "percentage": 43.28, "elapsed_time": "0:12:48", "remaining_time": "0:16:47"} +{"current_steps": 619, "total_steps": 1428, "loss": 1.097703456878662, "lr": 6.990786674677246e-06, "epoch": 1.300420168067227, "percentage": 43.35, "elapsed_time": "0:12:49", "remaining_time": "0:16:45"} +{"current_steps": 620, "total_steps": 1428, "loss": 1.9619685411453247, "lr": 6.979567363519927e-06, "epoch": 1.3025210084033614, "percentage": 43.42, "elapsed_time": "0:12:50", "remaining_time": "0:16:44"} +{"current_steps": 621, "total_steps": 1428, "loss": 1.2424434423446655, "lr": 6.9683362202155465e-06, "epoch": 1.3046218487394958, "percentage": 43.49, "elapsed_time": "0:12:51", "remaining_time": "0:16:42"} +{"current_steps": 622, "total_steps": 1428, "loss": 1.8912100791931152, "lr": 6.957093311894199e-06, "epoch": 1.3067226890756303, "percentage": 43.56, "elapsed_time": "0:12:52", "remaining_time": "0:16:41"} +{"current_steps": 623, "total_steps": 1428, "loss": 1.4234580993652344, "lr": 6.945838705756293e-06, "epoch": 1.3088235294117647, "percentage": 43.63, "elapsed_time": "0:12:53", "remaining_time": "0:16:40"} +{"current_steps": 624, "total_steps": 1428, "loss": 1.7631306648254395, "lr": 6.934572469072163e-06, "epoch": 1.3109243697478992, "percentage": 43.7, "elapsed_time": "0:12:55", "remaining_time": "0:16:38"} +{"current_steps": 625, "total_steps": 1428, "loss": 1.275686264038086, "lr": 6.923294669181659e-06, "epoch": 1.3130252100840336, "percentage": 43.77, "elapsed_time": "0:12:56", "remaining_time": "0:16:37"} +{"current_steps": 626, "total_steps": 1428, "loss": 1.8493428230285645, "lr": 6.912005373493747e-06, "epoch": 1.315126050420168, "percentage": 43.84, "elapsed_time": "0:12:57", "remaining_time": "0:16:35"} +{"current_steps": 627, "total_steps": 1428, "loss": 1.0401699542999268, "lr": 6.900704649486103e-06, "epoch": 1.3172268907563025, "percentage": 43.91, "elapsed_time": "0:12:58", "remaining_time": "0:16:34"} +{"current_steps": 628, "total_steps": 1428, "loss": 1.932092547416687, "lr": 6.889392564704712e-06, "epoch": 1.319327731092437, "percentage": 43.98, "elapsed_time": "0:12:59", "remaining_time": "0:16:32"} +{"current_steps": 629, "total_steps": 1428, "loss": 2.0269484519958496, "lr": 6.878069186763466e-06, "epoch": 1.3214285714285714, "percentage": 44.05, "elapsed_time": "0:13:00", "remaining_time": "0:16:31"} +{"current_steps": 630, "total_steps": 1428, "loss": 1.6765419244766235, "lr": 6.866734583343753e-06, "epoch": 1.3235294117647058, "percentage": 44.12, "elapsed_time": "0:13:01", "remaining_time": "0:16:29"} +{"current_steps": 631, "total_steps": 1428, "loss": 1.7931967973709106, "lr": 6.855388822194061e-06, "epoch": 1.3256302521008403, "percentage": 44.19, "elapsed_time": "0:13:02", "remaining_time": "0:16:28"} +{"current_steps": 632, "total_steps": 1428, "loss": 0.9582860469818115, "lr": 6.844031971129571e-06, "epoch": 1.3277310924369747, "percentage": 44.26, "elapsed_time": "0:13:03", "remaining_time": "0:16:27"} +{"current_steps": 633, "total_steps": 1428, "loss": 1.7692348957061768, "lr": 6.8326640980317475e-06, "epoch": 1.3298319327731092, "percentage": 44.33, "elapsed_time": "0:13:04", "remaining_time": "0:16:25"} +{"current_steps": 634, "total_steps": 1428, "loss": 2.143463373184204, "lr": 6.821285270847934e-06, "epoch": 1.3319327731092436, "percentage": 44.4, "elapsed_time": "0:13:05", "remaining_time": "0:16:24"} +{"current_steps": 635, "total_steps": 1428, "loss": 2.290733814239502, "lr": 6.80989555759095e-06, "epoch": 1.334033613445378, "percentage": 44.47, "elapsed_time": "0:13:06", "remaining_time": "0:16:22"} +{"current_steps": 636, "total_steps": 1428, "loss": 1.4548063278198242, "lr": 6.79849502633868e-06, "epoch": 1.3361344537815127, "percentage": 44.54, "elapsed_time": "0:13:07", "remaining_time": "0:16:21"} +{"current_steps": 637, "total_steps": 1428, "loss": 1.6137502193450928, "lr": 6.787083745233674e-06, "epoch": 1.3382352941176472, "percentage": 44.61, "elapsed_time": "0:13:09", "remaining_time": "0:16:19"} +{"current_steps": 638, "total_steps": 1428, "loss": 1.277546763420105, "lr": 6.775661782482732e-06, "epoch": 1.3403361344537816, "percentage": 44.68, "elapsed_time": "0:13:10", "remaining_time": "0:16:18"} +{"current_steps": 639, "total_steps": 1428, "loss": 1.4183297157287598, "lr": 6.764229206356498e-06, "epoch": 1.342436974789916, "percentage": 44.75, "elapsed_time": "0:13:11", "remaining_time": "0:16:16"} +{"current_steps": 640, "total_steps": 1428, "loss": 2.352818012237549, "lr": 6.752786085189059e-06, "epoch": 1.3445378151260505, "percentage": 44.82, "elapsed_time": "0:13:12", "remaining_time": "0:16:15"} +{"current_steps": 641, "total_steps": 1428, "loss": 1.1966056823730469, "lr": 6.741332487377525e-06, "epoch": 1.346638655462185, "percentage": 44.89, "elapsed_time": "0:13:13", "remaining_time": "0:16:14"} +{"current_steps": 642, "total_steps": 1428, "loss": 2.1670610904693604, "lr": 6.729868481381632e-06, "epoch": 1.3487394957983194, "percentage": 44.96, "elapsed_time": "0:13:14", "remaining_time": "0:16:12"} +{"current_steps": 643, "total_steps": 1428, "loss": 1.4478580951690674, "lr": 6.718394135723321e-06, "epoch": 1.3508403361344539, "percentage": 45.03, "elapsed_time": "0:13:15", "remaining_time": "0:16:11"} +{"current_steps": 644, "total_steps": 1428, "loss": 1.1712067127227783, "lr": 6.706909518986341e-06, "epoch": 1.3529411764705883, "percentage": 45.1, "elapsed_time": "0:13:16", "remaining_time": "0:16:09"} +{"current_steps": 645, "total_steps": 1428, "loss": 1.241437315940857, "lr": 6.695414699815828e-06, "epoch": 1.3550420168067228, "percentage": 45.17, "elapsed_time": "0:13:17", "remaining_time": "0:16:08"} +{"current_steps": 646, "total_steps": 1428, "loss": 1.5295310020446777, "lr": 6.6839097469179e-06, "epoch": 1.3571428571428572, "percentage": 45.24, "elapsed_time": "0:13:18", "remaining_time": "0:16:06"} +{"current_steps": 647, "total_steps": 1428, "loss": 1.3555617332458496, "lr": 6.6723947290592505e-06, "epoch": 1.3592436974789917, "percentage": 45.31, "elapsed_time": "0:13:19", "remaining_time": "0:16:05"} +{"current_steps": 648, "total_steps": 1428, "loss": 1.3158948421478271, "lr": 6.660869715066725e-06, "epoch": 1.361344537815126, "percentage": 45.38, "elapsed_time": "0:13:20", "remaining_time": "0:16:04"} +{"current_steps": 649, "total_steps": 1428, "loss": 1.7540979385375977, "lr": 6.649334773826924e-06, "epoch": 1.3634453781512605, "percentage": 45.45, "elapsed_time": "0:13:21", "remaining_time": "0:16:02"} +{"current_steps": 650, "total_steps": 1428, "loss": 1.7170000076293945, "lr": 6.63778997428578e-06, "epoch": 1.365546218487395, "percentage": 45.52, "elapsed_time": "0:13:23", "remaining_time": "0:16:01"} +{"current_steps": 651, "total_steps": 1428, "loss": 1.2551283836364746, "lr": 6.626235385448152e-06, "epoch": 1.3676470588235294, "percentage": 45.59, "elapsed_time": "0:13:24", "remaining_time": "0:15:59"} +{"current_steps": 652, "total_steps": 1428, "loss": 1.468104362487793, "lr": 6.61467107637741e-06, "epoch": 1.3697478991596639, "percentage": 45.66, "elapsed_time": "0:13:25", "remaining_time": "0:15:58"} +{"current_steps": 653, "total_steps": 1428, "loss": 1.3832511901855469, "lr": 6.603097116195026e-06, "epoch": 1.3718487394957983, "percentage": 45.73, "elapsed_time": "0:13:26", "remaining_time": "0:15:56"} +{"current_steps": 654, "total_steps": 1428, "loss": 1.1895179748535156, "lr": 6.591513574080152e-06, "epoch": 1.3739495798319328, "percentage": 45.8, "elapsed_time": "0:13:27", "remaining_time": "0:15:55"} +{"current_steps": 655, "total_steps": 1428, "loss": 1.57008957862854, "lr": 6.579920519269218e-06, "epoch": 1.3760504201680672, "percentage": 45.87, "elapsed_time": "0:13:28", "remaining_time": "0:15:54"} +{"current_steps": 656, "total_steps": 1428, "loss": 1.1686642169952393, "lr": 6.568318021055512e-06, "epoch": 1.3781512605042017, "percentage": 45.94, "elapsed_time": "0:13:29", "remaining_time": "0:15:52"} +{"current_steps": 657, "total_steps": 1428, "loss": 1.831925392150879, "lr": 6.556706148788765e-06, "epoch": 1.3802521008403361, "percentage": 46.01, "elapsed_time": "0:13:30", "remaining_time": "0:15:51"} +{"current_steps": 658, "total_steps": 1428, "loss": 1.1927814483642578, "lr": 6.545084971874738e-06, "epoch": 1.3823529411764706, "percentage": 46.08, "elapsed_time": "0:13:31", "remaining_time": "0:15:49"} +{"current_steps": 659, "total_steps": 1428, "loss": 1.225053310394287, "lr": 6.5334545597748075e-06, "epoch": 1.384453781512605, "percentage": 46.15, "elapsed_time": "0:13:32", "remaining_time": "0:15:48"} +{"current_steps": 660, "total_steps": 1428, "loss": 1.489911437034607, "lr": 6.521814982005552e-06, "epoch": 1.3865546218487395, "percentage": 46.22, "elapsed_time": "0:13:33", "remaining_time": "0:15:46"} +{"current_steps": 661, "total_steps": 1428, "loss": 1.3653918504714966, "lr": 6.510166308138328e-06, "epoch": 1.388655462184874, "percentage": 46.29, "elapsed_time": "0:13:34", "remaining_time": "0:15:45"} +{"current_steps": 662, "total_steps": 1428, "loss": 1.7082477807998657, "lr": 6.498508607798872e-06, "epoch": 1.3907563025210083, "percentage": 46.36, "elapsed_time": "0:13:35", "remaining_time": "0:15:44"} +{"current_steps": 663, "total_steps": 1428, "loss": 1.1122634410858154, "lr": 6.48684195066686e-06, "epoch": 1.3928571428571428, "percentage": 46.43, "elapsed_time": "0:13:36", "remaining_time": "0:15:42"} +{"current_steps": 664, "total_steps": 1428, "loss": 0.9572471380233765, "lr": 6.475166406475515e-06, "epoch": 1.3949579831932772, "percentage": 46.5, "elapsed_time": "0:13:38", "remaining_time": "0:15:41"} +{"current_steps": 665, "total_steps": 1428, "loss": 1.8282674551010132, "lr": 6.4634820450111715e-06, "epoch": 1.3970588235294117, "percentage": 46.57, "elapsed_time": "0:13:39", "remaining_time": "0:15:39"} +{"current_steps": 666, "total_steps": 1428, "loss": 1.2026221752166748, "lr": 6.451788936112868e-06, "epoch": 1.3991596638655461, "percentage": 46.64, "elapsed_time": "0:13:40", "remaining_time": "0:15:38"} +{"current_steps": 667, "total_steps": 1428, "loss": 1.3183879852294922, "lr": 6.440087149671932e-06, "epoch": 1.4012605042016806, "percentage": 46.71, "elapsed_time": "0:13:41", "remaining_time": "0:15:37"} +{"current_steps": 668, "total_steps": 1428, "loss": 1.216771125793457, "lr": 6.428376755631553e-06, "epoch": 1.403361344537815, "percentage": 46.78, "elapsed_time": "0:13:42", "remaining_time": "0:15:35"} +{"current_steps": 669, "total_steps": 1428, "loss": 1.6759852170944214, "lr": 6.41665782398637e-06, "epoch": 1.4054621848739495, "percentage": 46.85, "elapsed_time": "0:13:43", "remaining_time": "0:15:34"} +{"current_steps": 670, "total_steps": 1428, "loss": 1.6593937873840332, "lr": 6.404930424782052e-06, "epoch": 1.407563025210084, "percentage": 46.92, "elapsed_time": "0:13:44", "remaining_time": "0:15:32"} +{"current_steps": 671, "total_steps": 1428, "loss": 1.672929286956787, "lr": 6.393194628114885e-06, "epoch": 1.4096638655462184, "percentage": 46.99, "elapsed_time": "0:13:45", "remaining_time": "0:15:31"} +{"current_steps": 672, "total_steps": 1428, "loss": 1.2778139114379883, "lr": 6.381450504131339e-06, "epoch": 1.4117647058823528, "percentage": 47.06, "elapsed_time": "0:13:46", "remaining_time": "0:15:29"} +{"current_steps": 673, "total_steps": 1428, "loss": 1.6472318172454834, "lr": 6.369698123027664e-06, "epoch": 1.4138655462184873, "percentage": 47.13, "elapsed_time": "0:13:47", "remaining_time": "0:15:28"} +{"current_steps": 674, "total_steps": 1428, "loss": 1.5301233530044556, "lr": 6.357937555049465e-06, "epoch": 1.415966386554622, "percentage": 47.2, "elapsed_time": "0:13:48", "remaining_time": "0:15:27"} +{"current_steps": 675, "total_steps": 1428, "loss": 1.5423755645751953, "lr": 6.3461688704912735e-06, "epoch": 1.4180672268907564, "percentage": 47.27, "elapsed_time": "0:13:49", "remaining_time": "0:15:25"} +{"current_steps": 676, "total_steps": 1428, "loss": 0.8435590863227844, "lr": 6.334392139696144e-06, "epoch": 1.4201680672268908, "percentage": 47.34, "elapsed_time": "0:13:51", "remaining_time": "0:15:24"} +{"current_steps": 677, "total_steps": 1428, "loss": 0.9243001937866211, "lr": 6.322607433055217e-06, "epoch": 1.4222689075630253, "percentage": 47.41, "elapsed_time": "0:13:52", "remaining_time": "0:15:23"} +{"current_steps": 678, "total_steps": 1428, "loss": 1.1370623111724854, "lr": 6.310814821007312e-06, "epoch": 1.4243697478991597, "percentage": 47.48, "elapsed_time": "0:13:53", "remaining_time": "0:15:21"} +{"current_steps": 679, "total_steps": 1428, "loss": 1.8121721744537354, "lr": 6.299014374038493e-06, "epoch": 1.4264705882352942, "percentage": 47.55, "elapsed_time": "0:13:54", "remaining_time": "0:15:20"} +{"current_steps": 680, "total_steps": 1428, "loss": 1.5701857805252075, "lr": 6.287206162681663e-06, "epoch": 1.4285714285714286, "percentage": 47.62, "elapsed_time": "0:13:55", "remaining_time": "0:15:18"} +{"current_steps": 681, "total_steps": 1428, "loss": 1.7376922369003296, "lr": 6.275390257516125e-06, "epoch": 1.430672268907563, "percentage": 47.69, "elapsed_time": "0:13:56", "remaining_time": "0:15:17"} +{"current_steps": 682, "total_steps": 1428, "loss": 1.722080111503601, "lr": 6.263566729167177e-06, "epoch": 1.4327731092436975, "percentage": 47.76, "elapsed_time": "0:13:57", "remaining_time": "0:15:16"} +{"current_steps": 683, "total_steps": 1428, "loss": 1.8646998405456543, "lr": 6.251735648305676e-06, "epoch": 1.434873949579832, "percentage": 47.83, "elapsed_time": "0:13:58", "remaining_time": "0:15:14"} +{"current_steps": 684, "total_steps": 1428, "loss": 1.6373791694641113, "lr": 6.239897085647624e-06, "epoch": 1.4369747899159664, "percentage": 47.9, "elapsed_time": "0:13:59", "remaining_time": "0:15:13"} +{"current_steps": 685, "total_steps": 1428, "loss": 1.5332825183868408, "lr": 6.228051111953742e-06, "epoch": 1.4390756302521008, "percentage": 47.97, "elapsed_time": "0:14:00", "remaining_time": "0:15:11"} +{"current_steps": 686, "total_steps": 1428, "loss": 1.7713117599487305, "lr": 6.216197798029049e-06, "epoch": 1.4411764705882353, "percentage": 48.04, "elapsed_time": "0:14:01", "remaining_time": "0:15:10"} +{"current_steps": 687, "total_steps": 1428, "loss": 1.3197343349456787, "lr": 6.204337214722435e-06, "epoch": 1.4432773109243697, "percentage": 48.11, "elapsed_time": "0:14:02", "remaining_time": "0:15:09"} +{"current_steps": 688, "total_steps": 1428, "loss": 1.3940856456756592, "lr": 6.192469432926241e-06, "epoch": 1.4453781512605042, "percentage": 48.18, "elapsed_time": "0:14:03", "remaining_time": "0:15:07"} +{"current_steps": 689, "total_steps": 1428, "loss": 2.0876762866973877, "lr": 6.180594523575838e-06, "epoch": 1.4474789915966386, "percentage": 48.25, "elapsed_time": "0:14:05", "remaining_time": "0:15:06"} +{"current_steps": 690, "total_steps": 1428, "loss": 2.5141618251800537, "lr": 6.1687125576491945e-06, "epoch": 1.449579831932773, "percentage": 48.32, "elapsed_time": "0:14:06", "remaining_time": "0:15:04"} +{"current_steps": 691, "total_steps": 1428, "loss": 0.9575009942054749, "lr": 6.156823606166461e-06, "epoch": 1.4516806722689075, "percentage": 48.39, "elapsed_time": "0:14:07", "remaining_time": "0:15:03"} +{"current_steps": 692, "total_steps": 1428, "loss": 1.2732771635055542, "lr": 6.144927740189537e-06, "epoch": 1.453781512605042, "percentage": 48.46, "elapsed_time": "0:14:08", "remaining_time": "0:15:02"} +{"current_steps": 693, "total_steps": 1428, "loss": 1.0447793006896973, "lr": 6.133025030821656e-06, "epoch": 1.4558823529411764, "percentage": 48.53, "elapsed_time": "0:14:09", "remaining_time": "0:15:00"} +{"current_steps": 694, "total_steps": 1428, "loss": 2.069892406463623, "lr": 6.12111554920695e-06, "epoch": 1.4579831932773109, "percentage": 48.6, "elapsed_time": "0:14:10", "remaining_time": "0:14:59"} +{"current_steps": 695, "total_steps": 1428, "loss": 1.4193060398101807, "lr": 6.1091993665300354e-06, "epoch": 1.4600840336134453, "percentage": 48.67, "elapsed_time": "0:14:11", "remaining_time": "0:14:58"} +{"current_steps": 696, "total_steps": 1428, "loss": 1.8489269018173218, "lr": 6.0972765540155764e-06, "epoch": 1.46218487394958, "percentage": 48.74, "elapsed_time": "0:14:12", "remaining_time": "0:14:56"} +{"current_steps": 697, "total_steps": 1428, "loss": 1.8245782852172852, "lr": 6.08534718292787e-06, "epoch": 1.4642857142857144, "percentage": 48.81, "elapsed_time": "0:14:13", "remaining_time": "0:14:55"} +{"current_steps": 698, "total_steps": 1428, "loss": 1.8135966062545776, "lr": 6.07341132457041e-06, "epoch": 1.4663865546218489, "percentage": 48.88, "elapsed_time": "0:14:14", "remaining_time": "0:14:53"} +{"current_steps": 699, "total_steps": 1428, "loss": 1.2886388301849365, "lr": 6.061469050285469e-06, "epoch": 1.4684873949579833, "percentage": 48.95, "elapsed_time": "0:14:15", "remaining_time": "0:14:52"} +{"current_steps": 700, "total_steps": 1428, "loss": 1.8994669914245605, "lr": 6.049520431453666e-06, "epoch": 1.4705882352941178, "percentage": 49.02, "elapsed_time": "0:14:16", "remaining_time": "0:14:51"} +{"current_steps": 701, "total_steps": 1428, "loss": 1.830640196800232, "lr": 6.037565539493542e-06, "epoch": 1.4726890756302522, "percentage": 49.09, "elapsed_time": "0:14:17", "remaining_time": "0:14:49"} +{"current_steps": 702, "total_steps": 1428, "loss": 1.253919005393982, "lr": 6.025604445861137e-06, "epoch": 1.4747899159663866, "percentage": 49.16, "elapsed_time": "0:14:19", "remaining_time": "0:14:48"} +{"current_steps": 703, "total_steps": 1428, "loss": 1.4687739610671997, "lr": 6.013637222049554e-06, "epoch": 1.476890756302521, "percentage": 49.23, "elapsed_time": "0:14:20", "remaining_time": "0:14:47"} +{"current_steps": 704, "total_steps": 1428, "loss": 0.8241528272628784, "lr": 6.0016639395885424e-06, "epoch": 1.4789915966386555, "percentage": 49.3, "elapsed_time": "0:14:21", "remaining_time": "0:14:45"} +{"current_steps": 705, "total_steps": 1428, "loss": 0.9833969473838806, "lr": 5.98968467004406e-06, "epoch": 1.48109243697479, "percentage": 49.37, "elapsed_time": "0:14:22", "remaining_time": "0:14:44"} +{"current_steps": 706, "total_steps": 1428, "loss": 1.4603691101074219, "lr": 5.977699485017855e-06, "epoch": 1.4831932773109244, "percentage": 49.44, "elapsed_time": "0:14:23", "remaining_time": "0:14:42"} +{"current_steps": 707, "total_steps": 1428, "loss": 1.2566254138946533, "lr": 5.965708456147028e-06, "epoch": 1.4852941176470589, "percentage": 49.51, "elapsed_time": "0:14:24", "remaining_time": "0:14:41"} +{"current_steps": 708, "total_steps": 1428, "loss": 1.1779121160507202, "lr": 5.953711655103615e-06, "epoch": 1.4873949579831933, "percentage": 49.58, "elapsed_time": "0:14:25", "remaining_time": "0:14:40"} +{"current_steps": 709, "total_steps": 1428, "loss": 2.1752524375915527, "lr": 5.941709153594146e-06, "epoch": 1.4894957983193278, "percentage": 49.65, "elapsed_time": "0:14:26", "remaining_time": "0:14:38"} +{"current_steps": 710, "total_steps": 1428, "loss": 1.368391752243042, "lr": 5.92970102335923e-06, "epoch": 1.4915966386554622, "percentage": 49.72, "elapsed_time": "0:14:27", "remaining_time": "0:14:37"} +{"current_steps": 711, "total_steps": 1428, "loss": 1.4870836734771729, "lr": 5.917687336173116e-06, "epoch": 1.4936974789915967, "percentage": 49.79, "elapsed_time": "0:14:28", "remaining_time": "0:14:36"} +{"current_steps": 712, "total_steps": 1428, "loss": 1.5822714567184448, "lr": 5.905668163843269e-06, "epoch": 1.495798319327731, "percentage": 49.86, "elapsed_time": "0:14:29", "remaining_time": "0:14:34"} +{"current_steps": 713, "total_steps": 1428, "loss": 1.5158865451812744, "lr": 5.893643578209939e-06, "epoch": 1.4978991596638656, "percentage": 49.93, "elapsed_time": "0:14:30", "remaining_time": "0:14:33"} +{"current_steps": 714, "total_steps": 1428, "loss": 1.0833930969238281, "lr": 5.881613651145732e-06, "epoch": 1.5, "percentage": 50.0, "elapsed_time": "0:14:32", "remaining_time": "0:14:32"} +{"current_steps": 715, "total_steps": 1428, "loss": 1.2957074642181396, "lr": 5.8695784545551815e-06, "epoch": 1.5021008403361344, "percentage": 50.07, "elapsed_time": "0:14:33", "remaining_time": "0:14:30"} +{"current_steps": 716, "total_steps": 1428, "loss": 1.541155457496643, "lr": 5.8575380603743155e-06, "epoch": 1.504201680672269, "percentage": 50.14, "elapsed_time": "0:14:34", "remaining_time": "0:14:29"} +{"current_steps": 717, "total_steps": 1428, "loss": 1.7509238719940186, "lr": 5.8454925405702326e-06, "epoch": 1.5063025210084033, "percentage": 50.21, "elapsed_time": "0:14:35", "remaining_time": "0:14:27"} +{"current_steps": 718, "total_steps": 1428, "loss": 1.8062071800231934, "lr": 5.833441967140662e-06, "epoch": 1.5084033613445378, "percentage": 50.28, "elapsed_time": "0:14:36", "remaining_time": "0:14:26"} +{"current_steps": 719, "total_steps": 1428, "loss": 1.4850780963897705, "lr": 5.821386412113546e-06, "epoch": 1.5105042016806722, "percentage": 50.35, "elapsed_time": "0:14:37", "remaining_time": "0:14:25"} +{"current_steps": 720, "total_steps": 1428, "loss": 1.1842257976531982, "lr": 5.809325947546596e-06, "epoch": 1.5126050420168067, "percentage": 50.42, "elapsed_time": "0:14:38", "remaining_time": "0:14:23"} +{"current_steps": 721, "total_steps": 1428, "loss": 1.396120548248291, "lr": 5.797260645526873e-06, "epoch": 1.5147058823529411, "percentage": 50.49, "elapsed_time": "0:14:39", "remaining_time": "0:14:22"} +{"current_steps": 722, "total_steps": 1428, "loss": 1.2990989685058594, "lr": 5.785190578170351e-06, "epoch": 1.5168067226890756, "percentage": 50.56, "elapsed_time": "0:14:40", "remaining_time": "0:14:21"} +{"current_steps": 723, "total_steps": 1428, "loss": 1.8467388153076172, "lr": 5.773115817621487e-06, "epoch": 1.51890756302521, "percentage": 50.63, "elapsed_time": "0:14:41", "remaining_time": "0:14:19"} +{"current_steps": 724, "total_steps": 1428, "loss": 1.6907732486724854, "lr": 5.761036436052788e-06, "epoch": 1.5210084033613445, "percentage": 50.7, "elapsed_time": "0:14:42", "remaining_time": "0:14:18"} +{"current_steps": 725, "total_steps": 1428, "loss": 1.265946388244629, "lr": 5.748952505664385e-06, "epoch": 1.523109243697479, "percentage": 50.77, "elapsed_time": "0:14:43", "remaining_time": "0:14:17"} +{"current_steps": 726, "total_steps": 1428, "loss": 1.2473053932189941, "lr": 5.736864098683595e-06, "epoch": 1.5252100840336134, "percentage": 50.84, "elapsed_time": "0:14:44", "remaining_time": "0:14:15"} +{"current_steps": 727, "total_steps": 1428, "loss": 0.8382349014282227, "lr": 5.724771287364492e-06, "epoch": 1.5273109243697478, "percentage": 50.91, "elapsed_time": "0:14:46", "remaining_time": "0:14:14"} +{"current_steps": 728, "total_steps": 1428, "loss": 0.6312862038612366, "lr": 5.712674143987478e-06, "epoch": 1.5294117647058822, "percentage": 50.98, "elapsed_time": "0:14:47", "remaining_time": "0:14:13"} +{"current_steps": 729, "total_steps": 1428, "loss": 2.154848575592041, "lr": 5.700572740858847e-06, "epoch": 1.5315126050420167, "percentage": 51.05, "elapsed_time": "0:14:48", "remaining_time": "0:14:11"} +{"current_steps": 730, "total_steps": 1428, "loss": 2.034533739089966, "lr": 5.688467150310353e-06, "epoch": 1.5336134453781511, "percentage": 51.12, "elapsed_time": "0:14:49", "remaining_time": "0:14:10"} +{"current_steps": 731, "total_steps": 1428, "loss": 1.1331748962402344, "lr": 5.67635744469878e-06, "epoch": 1.5357142857142856, "percentage": 51.19, "elapsed_time": "0:14:50", "remaining_time": "0:14:08"} +{"current_steps": 732, "total_steps": 1428, "loss": 2.139069080352783, "lr": 5.664243696405509e-06, "epoch": 1.53781512605042, "percentage": 51.26, "elapsed_time": "0:14:51", "remaining_time": "0:14:07"} +{"current_steps": 733, "total_steps": 1428, "loss": 1.5174198150634766, "lr": 5.652125977836083e-06, "epoch": 1.5399159663865545, "percentage": 51.33, "elapsed_time": "0:14:52", "remaining_time": "0:14:06"} +{"current_steps": 734, "total_steps": 1428, "loss": 1.4445990324020386, "lr": 5.640004361419776e-06, "epoch": 1.542016806722689, "percentage": 51.4, "elapsed_time": "0:14:53", "remaining_time": "0:14:04"} +{"current_steps": 735, "total_steps": 1428, "loss": 1.3474795818328857, "lr": 5.627878919609162e-06, "epoch": 1.5441176470588234, "percentage": 51.47, "elapsed_time": "0:14:54", "remaining_time": "0:14:03"} +{"current_steps": 736, "total_steps": 1428, "loss": 1.4871881008148193, "lr": 5.615749724879677e-06, "epoch": 1.5462184873949578, "percentage": 51.54, "elapsed_time": "0:14:55", "remaining_time": "0:14:02"} +{"current_steps": 737, "total_steps": 1428, "loss": 1.308741569519043, "lr": 5.603616849729191e-06, "epoch": 1.5483193277310925, "percentage": 51.61, "elapsed_time": "0:14:56", "remaining_time": "0:14:00"} +{"current_steps": 738, "total_steps": 1428, "loss": 1.712050199508667, "lr": 5.591480366677571e-06, "epoch": 1.550420168067227, "percentage": 51.68, "elapsed_time": "0:14:57", "remaining_time": "0:13:59"} +{"current_steps": 739, "total_steps": 1428, "loss": 1.5636662244796753, "lr": 5.579340348266251e-06, "epoch": 1.5525210084033614, "percentage": 51.75, "elapsed_time": "0:14:58", "remaining_time": "0:13:58"} +{"current_steps": 740, "total_steps": 1428, "loss": 2.132948160171509, "lr": 5.5671968670577935e-06, "epoch": 1.5546218487394958, "percentage": 51.82, "elapsed_time": "0:15:00", "remaining_time": "0:13:56"} +{"current_steps": 741, "total_steps": 1428, "loss": 1.3193635940551758, "lr": 5.55504999563546e-06, "epoch": 1.5567226890756303, "percentage": 51.89, "elapsed_time": "0:15:01", "remaining_time": "0:13:55"} +{"current_steps": 742, "total_steps": 1428, "loss": 2.288175582885742, "lr": 5.542899806602776e-06, "epoch": 1.5588235294117647, "percentage": 51.96, "elapsed_time": "0:15:02", "remaining_time": "0:13:54"} +{"current_steps": 743, "total_steps": 1428, "loss": 0.9925522804260254, "lr": 5.530746372583097e-06, "epoch": 1.5609243697478992, "percentage": 52.03, "elapsed_time": "0:15:03", "remaining_time": "0:13:52"} +{"current_steps": 744, "total_steps": 1428, "loss": 1.0975109338760376, "lr": 5.518589766219173e-06, "epoch": 1.5630252100840336, "percentage": 52.1, "elapsed_time": "0:15:04", "remaining_time": "0:13:51"} +{"current_steps": 745, "total_steps": 1428, "loss": 1.5021933317184448, "lr": 5.506430060172714e-06, "epoch": 1.565126050420168, "percentage": 52.17, "elapsed_time": "0:15:05", "remaining_time": "0:13:50"} +{"current_steps": 746, "total_steps": 1428, "loss": 1.3946982622146606, "lr": 5.494267327123965e-06, "epoch": 1.5672268907563025, "percentage": 52.24, "elapsed_time": "0:15:06", "remaining_time": "0:13:48"} +{"current_steps": 747, "total_steps": 1428, "loss": 1.1381559371948242, "lr": 5.482101639771255e-06, "epoch": 1.569327731092437, "percentage": 52.31, "elapsed_time": "0:15:07", "remaining_time": "0:13:47"} +{"current_steps": 748, "total_steps": 1428, "loss": 1.6340922117233276, "lr": 5.469933070830574e-06, "epoch": 1.5714285714285714, "percentage": 52.38, "elapsed_time": "0:15:08", "remaining_time": "0:13:46"} +{"current_steps": 749, "total_steps": 1428, "loss": 1.3076329231262207, "lr": 5.457761693035139e-06, "epoch": 1.5735294117647058, "percentage": 52.45, "elapsed_time": "0:15:09", "remaining_time": "0:13:44"} +{"current_steps": 750, "total_steps": 1428, "loss": 1.4544854164123535, "lr": 5.44558757913495e-06, "epoch": 1.5756302521008403, "percentage": 52.52, "elapsed_time": "0:15:10", "remaining_time": "0:13:43"} +{"current_steps": 751, "total_steps": 1428, "loss": 1.254534363746643, "lr": 5.433410801896366e-06, "epoch": 1.5777310924369747, "percentage": 52.59, "elapsed_time": "0:15:11", "remaining_time": "0:13:42"} +{"current_steps": 752, "total_steps": 1428, "loss": 1.6915278434753418, "lr": 5.4212314341016645e-06, "epoch": 1.5798319327731094, "percentage": 52.66, "elapsed_time": "0:15:13", "remaining_time": "0:13:40"} +{"current_steps": 753, "total_steps": 1428, "loss": 1.9941121339797974, "lr": 5.409049548548604e-06, "epoch": 1.5819327731092439, "percentage": 52.73, "elapsed_time": "0:15:14", "remaining_time": "0:13:39"} +{"current_steps": 754, "total_steps": 1428, "loss": 1.8611130714416504, "lr": 5.396865218049995e-06, "epoch": 1.5840336134453783, "percentage": 52.8, "elapsed_time": "0:15:15", "remaining_time": "0:13:38"} +{"current_steps": 755, "total_steps": 1428, "loss": 1.5740795135498047, "lr": 5.38467851543326e-06, "epoch": 1.5861344537815127, "percentage": 52.87, "elapsed_time": "0:15:16", "remaining_time": "0:13:36"} +{"current_steps": 756, "total_steps": 1428, "loss": 2.713351249694824, "lr": 5.3724895135400015e-06, "epoch": 1.5882352941176472, "percentage": 52.94, "elapsed_time": "0:15:17", "remaining_time": "0:13:35"} +{"current_steps": 757, "total_steps": 1428, "loss": 1.3163414001464844, "lr": 5.360298285225564e-06, "epoch": 1.5903361344537816, "percentage": 53.01, "elapsed_time": "0:15:18", "remaining_time": "0:13:34"} +{"current_steps": 758, "total_steps": 1428, "loss": 1.2127149105072021, "lr": 5.3481049033586e-06, "epoch": 1.592436974789916, "percentage": 53.08, "elapsed_time": "0:15:19", "remaining_time": "0:13:32"} +{"current_steps": 759, "total_steps": 1428, "loss": 1.7897974252700806, "lr": 5.335909440820635e-06, "epoch": 1.5945378151260505, "percentage": 53.15, "elapsed_time": "0:15:20", "remaining_time": "0:13:31"} +{"current_steps": 760, "total_steps": 1428, "loss": 1.1387288570404053, "lr": 5.323711970505627e-06, "epoch": 1.596638655462185, "percentage": 53.22, "elapsed_time": "0:15:21", "remaining_time": "0:13:30"} +{"current_steps": 761, "total_steps": 1428, "loss": 1.3364837169647217, "lr": 5.311512565319542e-06, "epoch": 1.5987394957983194, "percentage": 53.29, "elapsed_time": "0:15:22", "remaining_time": "0:13:28"} +{"current_steps": 762, "total_steps": 1428, "loss": 1.5517654418945312, "lr": 5.299311298179904e-06, "epoch": 1.6008403361344539, "percentage": 53.36, "elapsed_time": "0:15:23", "remaining_time": "0:13:27"} +{"current_steps": 763, "total_steps": 1428, "loss": 1.3167724609375, "lr": 5.287108242015371e-06, "epoch": 1.6029411764705883, "percentage": 53.43, "elapsed_time": "0:15:24", "remaining_time": "0:13:26"} +{"current_steps": 764, "total_steps": 1428, "loss": 0.9891781210899353, "lr": 5.27490346976529e-06, "epoch": 1.6050420168067228, "percentage": 53.5, "elapsed_time": "0:15:25", "remaining_time": "0:13:24"} +{"current_steps": 765, "total_steps": 1428, "loss": 1.4272327423095703, "lr": 5.2626970543792685e-06, "epoch": 1.6071428571428572, "percentage": 53.57, "elapsed_time": "0:15:27", "remaining_time": "0:13:23"} +{"current_steps": 766, "total_steps": 1428, "loss": 1.5374692678451538, "lr": 5.250489068816734e-06, "epoch": 1.6092436974789917, "percentage": 53.64, "elapsed_time": "0:15:28", "remaining_time": "0:13:22"} +{"current_steps": 767, "total_steps": 1428, "loss": 2.130378484725952, "lr": 5.238279586046499e-06, "epoch": 1.611344537815126, "percentage": 53.71, "elapsed_time": "0:15:29", "remaining_time": "0:13:20"} +{"current_steps": 768, "total_steps": 1428, "loss": 1.0989816188812256, "lr": 5.226068679046327e-06, "epoch": 1.6134453781512605, "percentage": 53.78, "elapsed_time": "0:15:30", "remaining_time": "0:13:19"} +{"current_steps": 769, "total_steps": 1428, "loss": 1.4945666790008545, "lr": 5.21385642080249e-06, "epoch": 1.615546218487395, "percentage": 53.85, "elapsed_time": "0:15:31", "remaining_time": "0:13:18"} +{"current_steps": 770, "total_steps": 1428, "loss": 2.0057296752929688, "lr": 5.201642884309341e-06, "epoch": 1.6176470588235294, "percentage": 53.92, "elapsed_time": "0:15:32", "remaining_time": "0:13:16"} +{"current_steps": 771, "total_steps": 1428, "loss": 1.1791839599609375, "lr": 5.189428142568872e-06, "epoch": 1.6197478991596639, "percentage": 53.99, "elapsed_time": "0:15:33", "remaining_time": "0:13:15"} +{"current_steps": 772, "total_steps": 1428, "loss": 1.836449384689331, "lr": 5.177212268590277e-06, "epoch": 1.6218487394957983, "percentage": 54.06, "elapsed_time": "0:15:34", "remaining_time": "0:13:14"} +{"current_steps": 773, "total_steps": 1428, "loss": 1.711057424545288, "lr": 5.16499533538952e-06, "epoch": 1.6239495798319328, "percentage": 54.13, "elapsed_time": "0:15:35", "remaining_time": "0:13:12"} +{"current_steps": 774, "total_steps": 1428, "loss": 1.5274529457092285, "lr": 5.152777415988894e-06, "epoch": 1.6260504201680672, "percentage": 54.2, "elapsed_time": "0:15:36", "remaining_time": "0:13:11"} +{"current_steps": 775, "total_steps": 1428, "loss": 1.687756061553955, "lr": 5.140558583416591e-06, "epoch": 1.6281512605042017, "percentage": 54.27, "elapsed_time": "0:15:37", "remaining_time": "0:13:10"} +{"current_steps": 776, "total_steps": 1428, "loss": 1.857285976409912, "lr": 5.128338910706254e-06, "epoch": 1.6302521008403361, "percentage": 54.34, "elapsed_time": "0:15:38", "remaining_time": "0:13:08"} +{"current_steps": 777, "total_steps": 1428, "loss": 2.2893779277801514, "lr": 5.1161184708965525e-06, "epoch": 1.6323529411764706, "percentage": 54.41, "elapsed_time": "0:15:40", "remaining_time": "0:13:07"} +{"current_steps": 778, "total_steps": 1428, "loss": 1.299177646636963, "lr": 5.103897337030742e-06, "epoch": 1.634453781512605, "percentage": 54.48, "elapsed_time": "0:15:41", "remaining_time": "0:13:06"} +{"current_steps": 779, "total_steps": 1428, "loss": 1.156067132949829, "lr": 5.091675582156224e-06, "epoch": 1.6365546218487395, "percentage": 54.55, "elapsed_time": "0:15:42", "remaining_time": "0:13:04"} +{"current_steps": 780, "total_steps": 1428, "loss": 1.6888867616653442, "lr": 5.07945327932411e-06, "epoch": 1.638655462184874, "percentage": 54.62, "elapsed_time": "0:15:43", "remaining_time": "0:13:03"} +{"current_steps": 781, "total_steps": 1428, "loss": 2.480485677719116, "lr": 5.067230501588792e-06, "epoch": 1.6407563025210083, "percentage": 54.69, "elapsed_time": "0:15:44", "remaining_time": "0:13:02"} +{"current_steps": 782, "total_steps": 1428, "loss": 1.1827846765518188, "lr": 5.055007322007497e-06, "epoch": 1.6428571428571428, "percentage": 54.76, "elapsed_time": "0:15:45", "remaining_time": "0:13:00"} +{"current_steps": 783, "total_steps": 1428, "loss": 0.9974920749664307, "lr": 5.0427838136398545e-06, "epoch": 1.6449579831932772, "percentage": 54.83, "elapsed_time": "0:15:46", "remaining_time": "0:12:59"} +{"current_steps": 784, "total_steps": 1428, "loss": 1.3341560363769531, "lr": 5.0305600495474586e-06, "epoch": 1.6470588235294117, "percentage": 54.9, "elapsed_time": "0:15:47", "remaining_time": "0:12:58"} +{"current_steps": 785, "total_steps": 1428, "loss": 1.7801398038864136, "lr": 5.018336102793433e-06, "epoch": 1.6491596638655461, "percentage": 54.97, "elapsed_time": "0:15:48", "remaining_time": "0:12:57"} +{"current_steps": 786, "total_steps": 1428, "loss": 1.5409959554672241, "lr": 5.006112046441993e-06, "epoch": 1.6512605042016806, "percentage": 55.04, "elapsed_time": "0:15:49", "remaining_time": "0:12:55"} +{"current_steps": 787, "total_steps": 1428, "loss": 1.7089118957519531, "lr": 4.993887953558008e-06, "epoch": 1.653361344537815, "percentage": 55.11, "elapsed_time": "0:15:50", "remaining_time": "0:12:54"} +{"current_steps": 788, "total_steps": 1428, "loss": 1.5989807844161987, "lr": 4.981663897206568e-06, "epoch": 1.6554621848739495, "percentage": 55.18, "elapsed_time": "0:15:51", "remaining_time": "0:12:53"} +{"current_steps": 789, "total_steps": 1428, "loss": 1.4693567752838135, "lr": 4.969439950452543e-06, "epoch": 1.657563025210084, "percentage": 55.25, "elapsed_time": "0:15:52", "remaining_time": "0:12:51"} +{"current_steps": 790, "total_steps": 1428, "loss": 1.7319889068603516, "lr": 4.957216186360147e-06, "epoch": 1.6596638655462184, "percentage": 55.32, "elapsed_time": "0:15:54", "remaining_time": "0:12:50"} +{"current_steps": 791, "total_steps": 1428, "loss": 1.38368558883667, "lr": 4.944992677992505e-06, "epoch": 1.6617647058823528, "percentage": 55.39, "elapsed_time": "0:15:55", "remaining_time": "0:12:49"} +{"current_steps": 792, "total_steps": 1428, "loss": 1.9276368618011475, "lr": 4.932769498411209e-06, "epoch": 1.6638655462184873, "percentage": 55.46, "elapsed_time": "0:15:56", "remaining_time": "0:12:47"} +{"current_steps": 793, "total_steps": 1428, "loss": 1.5189965963363647, "lr": 4.9205467206758914e-06, "epoch": 1.6659663865546217, "percentage": 55.53, "elapsed_time": "0:15:57", "remaining_time": "0:12:46"} +{"current_steps": 794, "total_steps": 1428, "loss": 1.8080897331237793, "lr": 4.908324417843779e-06, "epoch": 1.6680672268907561, "percentage": 55.6, "elapsed_time": "0:15:58", "remaining_time": "0:12:45"} +{"current_steps": 795, "total_steps": 1428, "loss": 1.3283686637878418, "lr": 4.896102662969259e-06, "epoch": 1.6701680672268906, "percentage": 55.67, "elapsed_time": "0:15:59", "remaining_time": "0:12:43"} +{"current_steps": 796, "total_steps": 1428, "loss": 1.7254778146743774, "lr": 4.883881529103448e-06, "epoch": 1.6722689075630253, "percentage": 55.74, "elapsed_time": "0:16:00", "remaining_time": "0:12:42"} +{"current_steps": 797, "total_steps": 1428, "loss": 1.882294774055481, "lr": 4.8716610892937486e-06, "epoch": 1.6743697478991597, "percentage": 55.81, "elapsed_time": "0:16:01", "remaining_time": "0:12:41"} +{"current_steps": 798, "total_steps": 1428, "loss": 1.955444574356079, "lr": 4.859441416583412e-06, "epoch": 1.6764705882352942, "percentage": 55.88, "elapsed_time": "0:16:02", "remaining_time": "0:12:39"} +{"current_steps": 799, "total_steps": 1428, "loss": 1.3442355394363403, "lr": 4.847222584011107e-06, "epoch": 1.6785714285714286, "percentage": 55.95, "elapsed_time": "0:16:03", "remaining_time": "0:12:38"} +{"current_steps": 800, "total_steps": 1428, "loss": 1.3532618284225464, "lr": 4.8350046646104815e-06, "epoch": 1.680672268907563, "percentage": 56.02, "elapsed_time": "0:16:04", "remaining_time": "0:12:37"} +{"current_steps": 801, "total_steps": 1428, "loss": 1.8527226448059082, "lr": 4.8227877314097245e-06, "epoch": 1.6827731092436975, "percentage": 56.09, "elapsed_time": "0:16:05", "remaining_time": "0:12:36"} +{"current_steps": 802, "total_steps": 1428, "loss": 2.1312098503112793, "lr": 4.81057185743113e-06, "epoch": 1.684873949579832, "percentage": 56.16, "elapsed_time": "0:16:07", "remaining_time": "0:12:34"} +{"current_steps": 803, "total_steps": 1428, "loss": 1.3131635189056396, "lr": 4.798357115690661e-06, "epoch": 1.6869747899159664, "percentage": 56.23, "elapsed_time": "0:16:08", "remaining_time": "0:12:33"} +{"current_steps": 804, "total_steps": 1428, "loss": 1.057523488998413, "lr": 4.7861435791975124e-06, "epoch": 1.6890756302521008, "percentage": 56.3, "elapsed_time": "0:16:09", "remaining_time": "0:12:32"} +{"current_steps": 805, "total_steps": 1428, "loss": 1.510682225227356, "lr": 4.7739313209536755e-06, "epoch": 1.6911764705882353, "percentage": 56.37, "elapsed_time": "0:16:10", "remaining_time": "0:12:30"} +{"current_steps": 806, "total_steps": 1428, "loss": 2.0877933502197266, "lr": 4.761720413953503e-06, "epoch": 1.6932773109243697, "percentage": 56.44, "elapsed_time": "0:16:11", "remaining_time": "0:12:29"} +{"current_steps": 807, "total_steps": 1428, "loss": 0.9936963319778442, "lr": 4.7495109311832665e-06, "epoch": 1.6953781512605042, "percentage": 56.51, "elapsed_time": "0:16:12", "remaining_time": "0:12:28"} +{"current_steps": 808, "total_steps": 1428, "loss": 1.4148988723754883, "lr": 4.737302945620732e-06, "epoch": 1.6974789915966386, "percentage": 56.58, "elapsed_time": "0:16:13", "remaining_time": "0:12:26"} +{"current_steps": 809, "total_steps": 1428, "loss": 1.5457355976104736, "lr": 4.72509653023471e-06, "epoch": 1.699579831932773, "percentage": 56.65, "elapsed_time": "0:16:14", "remaining_time": "0:12:25"} +{"current_steps": 810, "total_steps": 1428, "loss": 1.1069682836532593, "lr": 4.712891757984629e-06, "epoch": 1.7016806722689075, "percentage": 56.72, "elapsed_time": "0:16:15", "remaining_time": "0:12:24"} +{"current_steps": 811, "total_steps": 1428, "loss": 2.270923376083374, "lr": 4.700688701820096e-06, "epoch": 1.7037815126050422, "percentage": 56.79, "elapsed_time": "0:16:16", "remaining_time": "0:12:23"} +{"current_steps": 812, "total_steps": 1428, "loss": 2.1212430000305176, "lr": 4.688487434680459e-06, "epoch": 1.7058823529411766, "percentage": 56.86, "elapsed_time": "0:16:17", "remaining_time": "0:12:21"} +{"current_steps": 813, "total_steps": 1428, "loss": 1.340724229812622, "lr": 4.6762880294943734e-06, "epoch": 1.707983193277311, "percentage": 56.93, "elapsed_time": "0:16:18", "remaining_time": "0:12:20"} +{"current_steps": 814, "total_steps": 1428, "loss": 1.1250860691070557, "lr": 4.664090559179367e-06, "epoch": 1.7100840336134455, "percentage": 57.0, "elapsed_time": "0:16:19", "remaining_time": "0:12:19"} +{"current_steps": 815, "total_steps": 1428, "loss": 1.3906278610229492, "lr": 4.651895096641402e-06, "epoch": 1.71218487394958, "percentage": 57.07, "elapsed_time": "0:16:21", "remaining_time": "0:12:17"} +{"current_steps": 816, "total_steps": 1428, "loss": 1.5373984575271606, "lr": 4.639701714774439e-06, "epoch": 1.7142857142857144, "percentage": 57.14, "elapsed_time": "0:16:22", "remaining_time": "0:12:16"} +{"current_steps": 817, "total_steps": 1428, "loss": 1.1511554718017578, "lr": 4.627510486459999e-06, "epoch": 1.7163865546218489, "percentage": 57.21, "elapsed_time": "0:16:23", "remaining_time": "0:12:15"} +{"current_steps": 818, "total_steps": 1428, "loss": 1.0511482954025269, "lr": 4.615321484566741e-06, "epoch": 1.7184873949579833, "percentage": 57.28, "elapsed_time": "0:16:24", "remaining_time": "0:12:13"} +{"current_steps": 819, "total_steps": 1428, "loss": 1.6539651155471802, "lr": 4.603134781950007e-06, "epoch": 1.7205882352941178, "percentage": 57.35, "elapsed_time": "0:16:25", "remaining_time": "0:12:12"} +{"current_steps": 820, "total_steps": 1428, "loss": 1.7340842485427856, "lr": 4.590950451451397e-06, "epoch": 1.7226890756302522, "percentage": 57.42, "elapsed_time": "0:16:26", "remaining_time": "0:12:11"} +{"current_steps": 821, "total_steps": 1428, "loss": 1.9771497249603271, "lr": 4.578768565898337e-06, "epoch": 1.7247899159663866, "percentage": 57.49, "elapsed_time": "0:16:27", "remaining_time": "0:12:10"} +{"current_steps": 822, "total_steps": 1428, "loss": 1.6702903509140015, "lr": 4.566589198103635e-06, "epoch": 1.726890756302521, "percentage": 57.56, "elapsed_time": "0:16:28", "remaining_time": "0:12:08"} +{"current_steps": 823, "total_steps": 1428, "loss": 1.2594914436340332, "lr": 4.554412420865052e-06, "epoch": 1.7289915966386555, "percentage": 57.63, "elapsed_time": "0:16:29", "remaining_time": "0:12:07"} +{"current_steps": 824, "total_steps": 1428, "loss": 1.2319787740707397, "lr": 4.542238306964863e-06, "epoch": 1.73109243697479, "percentage": 57.7, "elapsed_time": "0:16:30", "remaining_time": "0:12:06"} +{"current_steps": 825, "total_steps": 1428, "loss": 1.631975769996643, "lr": 4.530066929169427e-06, "epoch": 1.7331932773109244, "percentage": 57.77, "elapsed_time": "0:16:31", "remaining_time": "0:12:04"} +{"current_steps": 826, "total_steps": 1428, "loss": 1.4831879138946533, "lr": 4.5178983602287476e-06, "epoch": 1.7352941176470589, "percentage": 57.84, "elapsed_time": "0:16:32", "remaining_time": "0:12:03"} +{"current_steps": 827, "total_steps": 1428, "loss": 1.225109338760376, "lr": 4.505732672876037e-06, "epoch": 1.7373949579831933, "percentage": 57.91, "elapsed_time": "0:16:33", "remaining_time": "0:12:02"} +{"current_steps": 828, "total_steps": 1428, "loss": 1.6191500425338745, "lr": 4.493569939827288e-06, "epoch": 1.7394957983193278, "percentage": 57.98, "elapsed_time": "0:16:35", "remaining_time": "0:12:01"} +{"current_steps": 829, "total_steps": 1428, "loss": 1.562519907951355, "lr": 4.48141023378083e-06, "epoch": 1.7415966386554622, "percentage": 58.05, "elapsed_time": "0:16:36", "remaining_time": "0:11:59"} +{"current_steps": 830, "total_steps": 1428, "loss": 1.5889461040496826, "lr": 4.4692536274169055e-06, "epoch": 1.7436974789915967, "percentage": 58.12, "elapsed_time": "0:16:37", "remaining_time": "0:11:58"} +{"current_steps": 831, "total_steps": 1428, "loss": 0.8582566976547241, "lr": 4.457100193397226e-06, "epoch": 1.745798319327731, "percentage": 58.19, "elapsed_time": "0:16:38", "remaining_time": "0:11:57"} +{"current_steps": 832, "total_steps": 1428, "loss": 1.2409437894821167, "lr": 4.444950004364542e-06, "epoch": 1.7478991596638656, "percentage": 58.26, "elapsed_time": "0:16:39", "remaining_time": "0:11:55"} +{"current_steps": 833, "total_steps": 1428, "loss": 1.2449380159378052, "lr": 4.432803132942208e-06, "epoch": 1.75, "percentage": 58.33, "elapsed_time": "0:16:40", "remaining_time": "0:11:54"} +{"current_steps": 834, "total_steps": 1428, "loss": 1.2676522731781006, "lr": 4.420659651733751e-06, "epoch": 1.7521008403361344, "percentage": 58.4, "elapsed_time": "0:16:41", "remaining_time": "0:11:53"} +{"current_steps": 835, "total_steps": 1428, "loss": 1.5941420793533325, "lr": 4.40851963332243e-06, "epoch": 1.754201680672269, "percentage": 58.47, "elapsed_time": "0:16:42", "remaining_time": "0:11:52"} +{"current_steps": 836, "total_steps": 1428, "loss": 1.1451562643051147, "lr": 4.396383150270811e-06, "epoch": 1.7563025210084033, "percentage": 58.54, "elapsed_time": "0:16:43", "remaining_time": "0:11:50"} +{"current_steps": 837, "total_steps": 1428, "loss": 1.4305951595306396, "lr": 4.384250275120325e-06, "epoch": 1.7584033613445378, "percentage": 58.61, "elapsed_time": "0:16:44", "remaining_time": "0:11:49"} +{"current_steps": 838, "total_steps": 1428, "loss": 1.9824583530426025, "lr": 4.372121080390841e-06, "epoch": 1.7605042016806722, "percentage": 58.68, "elapsed_time": "0:16:45", "remaining_time": "0:11:48"} +{"current_steps": 839, "total_steps": 1428, "loss": 1.2548645734786987, "lr": 4.359995638580226e-06, "epoch": 1.7626050420168067, "percentage": 58.75, "elapsed_time": "0:16:46", "remaining_time": "0:11:46"} +{"current_steps": 840, "total_steps": 1428, "loss": 1.8208611011505127, "lr": 4.34787402216392e-06, "epoch": 1.7647058823529411, "percentage": 58.82, "elapsed_time": "0:16:47", "remaining_time": "0:11:45"} +{"current_steps": 841, "total_steps": 1428, "loss": 1.3555166721343994, "lr": 4.335756303594493e-06, "epoch": 1.7668067226890756, "percentage": 58.89, "elapsed_time": "0:16:49", "remaining_time": "0:11:44"} +{"current_steps": 842, "total_steps": 1428, "loss": 0.9843342900276184, "lr": 4.323642555301222e-06, "epoch": 1.76890756302521, "percentage": 58.96, "elapsed_time": "0:16:50", "remaining_time": "0:11:43"} +{"current_steps": 843, "total_steps": 1428, "loss": 1.5203514099121094, "lr": 4.311532849689649e-06, "epoch": 1.7710084033613445, "percentage": 59.03, "elapsed_time": "0:16:51", "remaining_time": "0:11:41"} +{"current_steps": 844, "total_steps": 1428, "loss": 2.226682662963867, "lr": 4.299427259141155e-06, "epoch": 1.773109243697479, "percentage": 59.1, "elapsed_time": "0:16:52", "remaining_time": "0:11:40"} +{"current_steps": 845, "total_steps": 1428, "loss": 1.4532074928283691, "lr": 4.2873258560125244e-06, "epoch": 1.7752100840336134, "percentage": 59.17, "elapsed_time": "0:16:53", "remaining_time": "0:11:39"} +{"current_steps": 846, "total_steps": 1428, "loss": 0.939800500869751, "lr": 4.275228712635511e-06, "epoch": 1.7773109243697478, "percentage": 59.24, "elapsed_time": "0:16:54", "remaining_time": "0:11:37"} +{"current_steps": 847, "total_steps": 1428, "loss": 0.9362924098968506, "lr": 4.263135901316406e-06, "epoch": 1.7794117647058822, "percentage": 59.31, "elapsed_time": "0:16:55", "remaining_time": "0:11:36"} +{"current_steps": 848, "total_steps": 1428, "loss": 1.4257563352584839, "lr": 4.251047494335616e-06, "epoch": 1.7815126050420167, "percentage": 59.38, "elapsed_time": "0:16:56", "remaining_time": "0:11:35"} +{"current_steps": 849, "total_steps": 1428, "loss": 1.393942952156067, "lr": 4.238963563947212e-06, "epoch": 1.7836134453781511, "percentage": 59.45, "elapsed_time": "0:16:57", "remaining_time": "0:11:34"} +{"current_steps": 850, "total_steps": 1428, "loss": 1.588603138923645, "lr": 4.226884182378513e-06, "epoch": 1.7857142857142856, "percentage": 59.52, "elapsed_time": "0:16:58", "remaining_time": "0:11:32"} +{"current_steps": 851, "total_steps": 1428, "loss": 1.198427677154541, "lr": 4.2148094218296485e-06, "epoch": 1.78781512605042, "percentage": 59.59, "elapsed_time": "0:16:59", "remaining_time": "0:11:31"} +{"current_steps": 852, "total_steps": 1428, "loss": 1.0912418365478516, "lr": 4.202739354473127e-06, "epoch": 1.7899159663865545, "percentage": 59.66, "elapsed_time": "0:17:00", "remaining_time": "0:11:30"} +{"current_steps": 853, "total_steps": 1428, "loss": 1.8104877471923828, "lr": 4.190674052453405e-06, "epoch": 1.792016806722689, "percentage": 59.73, "elapsed_time": "0:17:01", "remaining_time": "0:11:28"} +{"current_steps": 854, "total_steps": 1428, "loss": 1.337807297706604, "lr": 4.178613587886455e-06, "epoch": 1.7941176470588234, "percentage": 59.8, "elapsed_time": "0:17:03", "remaining_time": "0:11:27"} +{"current_steps": 855, "total_steps": 1428, "loss": 1.0441133975982666, "lr": 4.166558032859339e-06, "epoch": 1.7962184873949578, "percentage": 59.87, "elapsed_time": "0:17:04", "remaining_time": "0:11:26"} +{"current_steps": 856, "total_steps": 1428, "loss": 1.8002381324768066, "lr": 4.154507459429769e-06, "epoch": 1.7983193277310925, "percentage": 59.94, "elapsed_time": "0:17:05", "remaining_time": "0:11:25"} +{"current_steps": 857, "total_steps": 1428, "loss": 1.7534747123718262, "lr": 4.142461939625685e-06, "epoch": 1.800420168067227, "percentage": 60.01, "elapsed_time": "0:17:06", "remaining_time": "0:11:23"} +{"current_steps": 858, "total_steps": 1428, "loss": 2.5967888832092285, "lr": 4.13042154544482e-06, "epoch": 1.8025210084033614, "percentage": 60.08, "elapsed_time": "0:17:07", "remaining_time": "0:11:22"} +{"current_steps": 859, "total_steps": 1428, "loss": 0.9714012145996094, "lr": 4.1183863488542686e-06, "epoch": 1.8046218487394958, "percentage": 60.15, "elapsed_time": "0:17:08", "remaining_time": "0:11:21"} +{"current_steps": 860, "total_steps": 1428, "loss": 2.0358502864837646, "lr": 4.106356421790062e-06, "epoch": 1.8067226890756303, "percentage": 60.22, "elapsed_time": "0:17:09", "remaining_time": "0:11:19"} +{"current_steps": 861, "total_steps": 1428, "loss": 1.2078362703323364, "lr": 4.094331836156732e-06, "epoch": 1.8088235294117647, "percentage": 60.29, "elapsed_time": "0:17:10", "remaining_time": "0:11:18"} +{"current_steps": 862, "total_steps": 1428, "loss": 1.3551952838897705, "lr": 4.082312663826886e-06, "epoch": 1.8109243697478992, "percentage": 60.36, "elapsed_time": "0:17:11", "remaining_time": "0:11:17"} +{"current_steps": 863, "total_steps": 1428, "loss": 1.7473708391189575, "lr": 4.070298976640772e-06, "epoch": 1.8130252100840336, "percentage": 60.43, "elapsed_time": "0:17:12", "remaining_time": "0:11:16"} +{"current_steps": 864, "total_steps": 1428, "loss": 1.1888244152069092, "lr": 4.058290846405856e-06, "epoch": 1.815126050420168, "percentage": 60.5, "elapsed_time": "0:17:13", "remaining_time": "0:11:14"} +{"current_steps": 865, "total_steps": 1428, "loss": 1.7867594957351685, "lr": 4.046288344896388e-06, "epoch": 1.8172268907563025, "percentage": 60.57, "elapsed_time": "0:17:14", "remaining_time": "0:11:13"} +{"current_steps": 866, "total_steps": 1428, "loss": 1.2903845310211182, "lr": 4.034291543852973e-06, "epoch": 1.819327731092437, "percentage": 60.64, "elapsed_time": "0:17:15", "remaining_time": "0:11:12"} +{"current_steps": 867, "total_steps": 1428, "loss": 1.4051203727722168, "lr": 4.022300514982146e-06, "epoch": 1.8214285714285714, "percentage": 60.71, "elapsed_time": "0:17:17", "remaining_time": "0:11:11"} +{"current_steps": 868, "total_steps": 1428, "loss": 1.7378381490707397, "lr": 4.010315329955941e-06, "epoch": 1.8235294117647058, "percentage": 60.78, "elapsed_time": "0:17:18", "remaining_time": "0:11:09"} +{"current_steps": 869, "total_steps": 1428, "loss": 1.1623207330703735, "lr": 3.998336060411459e-06, "epoch": 1.8256302521008403, "percentage": 60.85, "elapsed_time": "0:17:19", "remaining_time": "0:11:08"} +{"current_steps": 870, "total_steps": 1428, "loss": 1.9922326803207397, "lr": 3.986362777950448e-06, "epoch": 1.8277310924369747, "percentage": 60.92, "elapsed_time": "0:17:20", "remaining_time": "0:11:07"} +{"current_steps": 871, "total_steps": 1428, "loss": 1.8183355331420898, "lr": 3.9743955541388645e-06, "epoch": 1.8298319327731094, "percentage": 60.99, "elapsed_time": "0:17:21", "remaining_time": "0:11:05"} +{"current_steps": 872, "total_steps": 1428, "loss": 1.20865797996521, "lr": 3.962434460506459e-06, "epoch": 1.8319327731092439, "percentage": 61.06, "elapsed_time": "0:17:22", "remaining_time": "0:11:04"} +{"current_steps": 873, "total_steps": 1428, "loss": 1.2787063121795654, "lr": 3.950479568546336e-06, "epoch": 1.8340336134453783, "percentage": 61.13, "elapsed_time": "0:17:23", "remaining_time": "0:11:03"} +{"current_steps": 874, "total_steps": 1428, "loss": 2.1469886302948, "lr": 3.938530949714533e-06, "epoch": 1.8361344537815127, "percentage": 61.2, "elapsed_time": "0:17:24", "remaining_time": "0:11:02"} +{"current_steps": 875, "total_steps": 1428, "loss": 2.5014071464538574, "lr": 3.926588675429591e-06, "epoch": 1.8382352941176472, "percentage": 61.27, "elapsed_time": "0:17:25", "remaining_time": "0:11:00"} +{"current_steps": 876, "total_steps": 1428, "loss": 1.2857444286346436, "lr": 3.914652817072132e-06, "epoch": 1.8403361344537816, "percentage": 61.34, "elapsed_time": "0:17:26", "remaining_time": "0:10:59"} +{"current_steps": 877, "total_steps": 1428, "loss": 0.8846265077590942, "lr": 3.902723445984425e-06, "epoch": 1.842436974789916, "percentage": 61.41, "elapsed_time": "0:17:27", "remaining_time": "0:10:58"} +{"current_steps": 878, "total_steps": 1428, "loss": 3.6164169311523438, "lr": 3.890800633469968e-06, "epoch": 1.8445378151260505, "percentage": 61.48, "elapsed_time": "0:17:28", "remaining_time": "0:10:57"} +{"current_steps": 879, "total_steps": 1428, "loss": 1.778512954711914, "lr": 3.878884450793053e-06, "epoch": 1.846638655462185, "percentage": 61.55, "elapsed_time": "0:17:30", "remaining_time": "0:10:55"} +{"current_steps": 880, "total_steps": 1428, "loss": 1.2984943389892578, "lr": 3.866974969178348e-06, "epoch": 1.8487394957983194, "percentage": 61.62, "elapsed_time": "0:17:31", "remaining_time": "0:10:54"} +{"current_steps": 881, "total_steps": 1428, "loss": 1.233088493347168, "lr": 3.855072259810465e-06, "epoch": 1.8508403361344539, "percentage": 61.69, "elapsed_time": "0:17:32", "remaining_time": "0:10:53"} +{"current_steps": 882, "total_steps": 1428, "loss": 1.0973716974258423, "lr": 3.8431763938335415e-06, "epoch": 1.8529411764705883, "percentage": 61.76, "elapsed_time": "0:17:33", "remaining_time": "0:10:52"} +{"current_steps": 883, "total_steps": 1428, "loss": 1.9479036331176758, "lr": 3.831287442350806e-06, "epoch": 1.8550420168067228, "percentage": 61.83, "elapsed_time": "0:17:34", "remaining_time": "0:10:50"} +{"current_steps": 884, "total_steps": 1428, "loss": 2.3243212699890137, "lr": 3.819405476424164e-06, "epoch": 1.8571428571428572, "percentage": 61.9, "elapsed_time": "0:17:35", "remaining_time": "0:10:49"} +{"current_steps": 885, "total_steps": 1428, "loss": 2.167454242706299, "lr": 3.8075305670737605e-06, "epoch": 1.8592436974789917, "percentage": 61.97, "elapsed_time": "0:17:36", "remaining_time": "0:10:48"} +{"current_steps": 886, "total_steps": 1428, "loss": 1.3896931409835815, "lr": 3.795662785277568e-06, "epoch": 1.861344537815126, "percentage": 62.04, "elapsed_time": "0:17:37", "remaining_time": "0:10:46"} +{"current_steps": 887, "total_steps": 1428, "loss": 1.7062684297561646, "lr": 3.783802201970953e-06, "epoch": 1.8634453781512605, "percentage": 62.11, "elapsed_time": "0:17:38", "remaining_time": "0:10:45"} +{"current_steps": 888, "total_steps": 1428, "loss": 1.996096134185791, "lr": 3.7719488880462596e-06, "epoch": 1.865546218487395, "percentage": 62.18, "elapsed_time": "0:17:39", "remaining_time": "0:10:44"} +{"current_steps": 889, "total_steps": 1428, "loss": 0.9396399259567261, "lr": 3.7601029143523767e-06, "epoch": 1.8676470588235294, "percentage": 62.25, "elapsed_time": "0:17:40", "remaining_time": "0:10:43"} +{"current_steps": 890, "total_steps": 1428, "loss": 1.384545922279358, "lr": 3.748264351694324e-06, "epoch": 1.8697478991596639, "percentage": 62.32, "elapsed_time": "0:17:41", "remaining_time": "0:10:41"} +{"current_steps": 891, "total_steps": 1428, "loss": 1.298504114151001, "lr": 3.7364332708328232e-06, "epoch": 1.8718487394957983, "percentage": 62.39, "elapsed_time": "0:17:42", "remaining_time": "0:10:40"} +{"current_steps": 892, "total_steps": 1428, "loss": 1.395151138305664, "lr": 3.7246097424838746e-06, "epoch": 1.8739495798319328, "percentage": 62.46, "elapsed_time": "0:17:44", "remaining_time": "0:10:39"} +{"current_steps": 893, "total_steps": 1428, "loss": 0.9280238747596741, "lr": 3.712793837318338e-06, "epoch": 1.8760504201680672, "percentage": 62.54, "elapsed_time": "0:17:45", "remaining_time": "0:10:38"} +{"current_steps": 894, "total_steps": 1428, "loss": 1.3795464038848877, "lr": 3.7009856259615074e-06, "epoch": 1.8781512605042017, "percentage": 62.61, "elapsed_time": "0:17:46", "remaining_time": "0:10:36"} +{"current_steps": 895, "total_steps": 1428, "loss": 1.3113572597503662, "lr": 3.689185178992689e-06, "epoch": 1.8802521008403361, "percentage": 62.68, "elapsed_time": "0:17:47", "remaining_time": "0:10:35"} +{"current_steps": 896, "total_steps": 1428, "loss": 1.580859661102295, "lr": 3.677392566944783e-06, "epoch": 1.8823529411764706, "percentage": 62.75, "elapsed_time": "0:17:48", "remaining_time": "0:10:34"} +{"current_steps": 897, "total_steps": 1428, "loss": 1.5074641704559326, "lr": 3.665607860303857e-06, "epoch": 1.884453781512605, "percentage": 62.82, "elapsed_time": "0:17:49", "remaining_time": "0:10:33"} +{"current_steps": 898, "total_steps": 1428, "loss": 1.438436508178711, "lr": 3.653831129508727e-06, "epoch": 1.8865546218487395, "percentage": 62.89, "elapsed_time": "0:17:50", "remaining_time": "0:10:31"} +{"current_steps": 899, "total_steps": 1428, "loss": 2.4116339683532715, "lr": 3.642062444950537e-06, "epoch": 1.888655462184874, "percentage": 62.96, "elapsed_time": "0:17:51", "remaining_time": "0:10:30"} +{"current_steps": 900, "total_steps": 1428, "loss": 1.5296099185943604, "lr": 3.630301876972337e-06, "epoch": 1.8907563025210083, "percentage": 63.03, "elapsed_time": "0:17:52", "remaining_time": "0:10:29"} +{"current_steps": 901, "total_steps": 1428, "loss": 1.7645788192749023, "lr": 3.618549495868662e-06, "epoch": 1.8928571428571428, "percentage": 63.1, "elapsed_time": "0:17:53", "remaining_time": "0:10:28"} +{"current_steps": 902, "total_steps": 1428, "loss": 1.528565526008606, "lr": 3.606805371885117e-06, "epoch": 1.8949579831932772, "percentage": 63.17, "elapsed_time": "0:17:54", "remaining_time": "0:10:26"} +{"current_steps": 903, "total_steps": 1428, "loss": 1.5352060794830322, "lr": 3.5950695752179487e-06, "epoch": 1.8970588235294117, "percentage": 63.24, "elapsed_time": "0:17:55", "remaining_time": "0:10:25"} +{"current_steps": 904, "total_steps": 1428, "loss": 1.2181806564331055, "lr": 3.5833421760136323e-06, "epoch": 1.8991596638655461, "percentage": 63.31, "elapsed_time": "0:17:56", "remaining_time": "0:10:24"} +{"current_steps": 905, "total_steps": 1428, "loss": 1.2715753316879272, "lr": 3.5716232443684486e-06, "epoch": 1.9012605042016806, "percentage": 63.38, "elapsed_time": "0:17:58", "remaining_time": "0:10:23"} +{"current_steps": 906, "total_steps": 1428, "loss": 1.4792617559432983, "lr": 3.559912850328069e-06, "epoch": 1.903361344537815, "percentage": 63.45, "elapsed_time": "0:17:59", "remaining_time": "0:10:21"} +{"current_steps": 907, "total_steps": 1428, "loss": 1.072256326675415, "lr": 3.5482110638871325e-06, "epoch": 1.9054621848739495, "percentage": 63.52, "elapsed_time": "0:18:00", "remaining_time": "0:10:20"} +{"current_steps": 908, "total_steps": 1428, "loss": 1.5988600254058838, "lr": 3.5365179549888306e-06, "epoch": 1.907563025210084, "percentage": 63.59, "elapsed_time": "0:18:01", "remaining_time": "0:10:19"} +{"current_steps": 909, "total_steps": 1428, "loss": 2.473078489303589, "lr": 3.524833593524487e-06, "epoch": 1.9096638655462184, "percentage": 63.66, "elapsed_time": "0:18:02", "remaining_time": "0:10:17"} +{"current_steps": 910, "total_steps": 1428, "loss": 1.8987966775894165, "lr": 3.513158049333141e-06, "epoch": 1.9117647058823528, "percentage": 63.73, "elapsed_time": "0:18:03", "remaining_time": "0:10:16"} +{"current_steps": 911, "total_steps": 1428, "loss": 1.6164718866348267, "lr": 3.50149139220113e-06, "epoch": 1.9138655462184873, "percentage": 63.8, "elapsed_time": "0:18:04", "remaining_time": "0:10:15"} +{"current_steps": 912, "total_steps": 1428, "loss": 1.3376764059066772, "lr": 3.4898336918616726e-06, "epoch": 1.9159663865546217, "percentage": 63.87, "elapsed_time": "0:18:05", "remaining_time": "0:10:14"} +{"current_steps": 913, "total_steps": 1428, "loss": 1.7546143531799316, "lr": 3.47818501799445e-06, "epoch": 1.9180672268907561, "percentage": 63.94, "elapsed_time": "0:18:06", "remaining_time": "0:10:12"} +{"current_steps": 914, "total_steps": 1428, "loss": 1.4916424751281738, "lr": 3.4665454402251937e-06, "epoch": 1.9201680672268906, "percentage": 64.01, "elapsed_time": "0:18:07", "remaining_time": "0:10:11"} +{"current_steps": 915, "total_steps": 1428, "loss": 1.6852712631225586, "lr": 3.4549150281252635e-06, "epoch": 1.9222689075630253, "percentage": 64.08, "elapsed_time": "0:18:08", "remaining_time": "0:10:10"} +{"current_steps": 916, "total_steps": 1428, "loss": 1.7150108814239502, "lr": 3.443293851211237e-06, "epoch": 1.9243697478991597, "percentage": 64.15, "elapsed_time": "0:18:09", "remaining_time": "0:10:09"} +{"current_steps": 917, "total_steps": 1428, "loss": 1.7211201190948486, "lr": 3.4316819789444893e-06, "epoch": 1.9264705882352942, "percentage": 64.22, "elapsed_time": "0:18:10", "remaining_time": "0:10:07"} +{"current_steps": 918, "total_steps": 1428, "loss": 0.7268713712692261, "lr": 3.4200794807307834e-06, "epoch": 1.9285714285714286, "percentage": 64.29, "elapsed_time": "0:18:12", "remaining_time": "0:10:06"} +{"current_steps": 919, "total_steps": 1428, "loss": 1.4612197875976562, "lr": 3.40848642591985e-06, "epoch": 1.930672268907563, "percentage": 64.36, "elapsed_time": "0:18:13", "remaining_time": "0:10:05"} +{"current_steps": 920, "total_steps": 1428, "loss": 2.3325533866882324, "lr": 3.3969028838049765e-06, "epoch": 1.9327731092436975, "percentage": 64.43, "elapsed_time": "0:18:14", "remaining_time": "0:10:04"} +{"current_steps": 921, "total_steps": 1428, "loss": 1.3644397258758545, "lr": 3.3853289236225917e-06, "epoch": 1.934873949579832, "percentage": 64.5, "elapsed_time": "0:18:15", "remaining_time": "0:10:02"} +{"current_steps": 922, "total_steps": 1428, "loss": 1.405503273010254, "lr": 3.37376461455185e-06, "epoch": 1.9369747899159664, "percentage": 64.57, "elapsed_time": "0:18:16", "remaining_time": "0:10:01"} +{"current_steps": 923, "total_steps": 1428, "loss": 1.1844987869262695, "lr": 3.362210025714222e-06, "epoch": 1.9390756302521008, "percentage": 64.64, "elapsed_time": "0:18:17", "remaining_time": "0:10:00"} +{"current_steps": 924, "total_steps": 1428, "loss": 2.294912815093994, "lr": 3.350665226173078e-06, "epoch": 1.9411764705882353, "percentage": 64.71, "elapsed_time": "0:18:18", "remaining_time": "0:09:59"} +{"current_steps": 925, "total_steps": 1428, "loss": 1.3060452938079834, "lr": 3.339130284933276e-06, "epoch": 1.9432773109243697, "percentage": 64.78, "elapsed_time": "0:18:19", "remaining_time": "0:09:57"} +{"current_steps": 926, "total_steps": 1428, "loss": 1.5017865896224976, "lr": 3.327605270940751e-06, "epoch": 1.9453781512605042, "percentage": 64.85, "elapsed_time": "0:18:20", "remaining_time": "0:09:56"} +{"current_steps": 927, "total_steps": 1428, "loss": 1.9816479682922363, "lr": 3.316090253082101e-06, "epoch": 1.9474789915966386, "percentage": 64.92, "elapsed_time": "0:18:21", "remaining_time": "0:09:55"} +{"current_steps": 928, "total_steps": 1428, "loss": 1.4715440273284912, "lr": 3.304585300184173e-06, "epoch": 1.949579831932773, "percentage": 64.99, "elapsed_time": "0:18:22", "remaining_time": "0:09:54"} +{"current_steps": 929, "total_steps": 1428, "loss": 1.321998953819275, "lr": 3.293090481013661e-06, "epoch": 1.9516806722689075, "percentage": 65.06, "elapsed_time": "0:18:23", "remaining_time": "0:09:52"} +{"current_steps": 930, "total_steps": 1428, "loss": 1.1600078344345093, "lr": 3.28160586427668e-06, "epoch": 1.9537815126050422, "percentage": 65.13, "elapsed_time": "0:18:24", "remaining_time": "0:09:51"} +{"current_steps": 931, "total_steps": 1428, "loss": 1.5981496572494507, "lr": 3.2701315186183692e-06, "epoch": 1.9558823529411766, "percentage": 65.2, "elapsed_time": "0:18:26", "remaining_time": "0:09:50"} +{"current_steps": 932, "total_steps": 1428, "loss": 1.9018357992172241, "lr": 3.258667512622475e-06, "epoch": 1.957983193277311, "percentage": 65.27, "elapsed_time": "0:18:27", "remaining_time": "0:09:49"} +{"current_steps": 933, "total_steps": 1428, "loss": 1.175397515296936, "lr": 3.2472139148109416e-06, "epoch": 1.9600840336134455, "percentage": 65.34, "elapsed_time": "0:18:28", "remaining_time": "0:09:47"} +{"current_steps": 934, "total_steps": 1428, "loss": 0.5444597005844116, "lr": 3.2357707936435013e-06, "epoch": 1.96218487394958, "percentage": 65.41, "elapsed_time": "0:18:29", "remaining_time": "0:09:46"} +{"current_steps": 935, "total_steps": 1428, "loss": 1.3773345947265625, "lr": 3.224338217517269e-06, "epoch": 1.9642857142857144, "percentage": 65.48, "elapsed_time": "0:18:30", "remaining_time": "0:09:45"} +{"current_steps": 936, "total_steps": 1428, "loss": 2.028517007827759, "lr": 3.212916254766326e-06, "epoch": 1.9663865546218489, "percentage": 65.55, "elapsed_time": "0:18:31", "remaining_time": "0:09:44"} +{"current_steps": 937, "total_steps": 1428, "loss": 0.9947667121887207, "lr": 3.20150497366132e-06, "epoch": 1.9684873949579833, "percentage": 65.62, "elapsed_time": "0:18:32", "remaining_time": "0:09:42"} +{"current_steps": 938, "total_steps": 1428, "loss": 1.7532271146774292, "lr": 3.190104442409052e-06, "epoch": 1.9705882352941178, "percentage": 65.69, "elapsed_time": "0:18:33", "remaining_time": "0:09:41"} +{"current_steps": 939, "total_steps": 1428, "loss": 2.114809036254883, "lr": 3.1787147291520675e-06, "epoch": 1.9726890756302522, "percentage": 65.76, "elapsed_time": "0:18:34", "remaining_time": "0:09:40"} +{"current_steps": 940, "total_steps": 1428, "loss": 2.2796754837036133, "lr": 3.1673359019682538e-06, "epoch": 1.9747899159663866, "percentage": 65.83, "elapsed_time": "0:18:35", "remaining_time": "0:09:39"} +{"current_steps": 941, "total_steps": 1428, "loss": 1.172208547592163, "lr": 3.1559680288704297e-06, "epoch": 1.976890756302521, "percentage": 65.9, "elapsed_time": "0:18:36", "remaining_time": "0:09:38"} +{"current_steps": 942, "total_steps": 1428, "loss": 1.1454124450683594, "lr": 3.1446111778059405e-06, "epoch": 1.9789915966386555, "percentage": 65.97, "elapsed_time": "0:18:37", "remaining_time": "0:09:36"} +{"current_steps": 943, "total_steps": 1428, "loss": 1.6078896522521973, "lr": 3.1332654166562494e-06, "epoch": 1.98109243697479, "percentage": 66.04, "elapsed_time": "0:18:39", "remaining_time": "0:09:35"} +{"current_steps": 944, "total_steps": 1428, "loss": 1.2369673252105713, "lr": 3.1219308132365365e-06, "epoch": 1.9831932773109244, "percentage": 66.11, "elapsed_time": "0:18:40", "remaining_time": "0:09:34"} +{"current_steps": 945, "total_steps": 1428, "loss": 1.075582504272461, "lr": 3.110607435295289e-06, "epoch": 1.9852941176470589, "percentage": 66.18, "elapsed_time": "0:18:41", "remaining_time": "0:09:33"} +{"current_steps": 946, "total_steps": 1428, "loss": 0.9495413899421692, "lr": 3.099295350513898e-06, "epoch": 1.9873949579831933, "percentage": 66.25, "elapsed_time": "0:18:42", "remaining_time": "0:09:31"} +{"current_steps": 947, "total_steps": 1428, "loss": 1.3577098846435547, "lr": 3.087994626506254e-06, "epoch": 1.9894957983193278, "percentage": 66.32, "elapsed_time": "0:18:43", "remaining_time": "0:09:30"} +{"current_steps": 948, "total_steps": 1428, "loss": 1.229673981666565, "lr": 3.0767053308183416e-06, "epoch": 1.9915966386554622, "percentage": 66.39, "elapsed_time": "0:18:44", "remaining_time": "0:09:29"} +{"current_steps": 949, "total_steps": 1428, "loss": 1.3727761507034302, "lr": 3.0654275309278382e-06, "epoch": 1.9936974789915967, "percentage": 66.46, "elapsed_time": "0:18:45", "remaining_time": "0:09:28"} +{"current_steps": 950, "total_steps": 1428, "loss": 1.2849650382995605, "lr": 3.0541612942437095e-06, "epoch": 1.995798319327731, "percentage": 66.53, "elapsed_time": "0:18:46", "remaining_time": "0:09:26"} +{"current_steps": 951, "total_steps": 1428, "loss": 1.644538164138794, "lr": 3.0429066881058036e-06, "epoch": 1.9978991596638656, "percentage": 66.6, "elapsed_time": "0:18:47", "remaining_time": "0:09:25"} +{"current_steps": 952, "total_steps": 1428, "loss": 1.627841591835022, "lr": 3.031663779784454e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:18:48", "remaining_time": "0:09:24"} +{"current_steps": 953, "total_steps": 1428, "loss": 0.2781870365142822, "lr": 3.020432636480074e-06, "epoch": 2.0021008403361344, "percentage": 66.74, "elapsed_time": "0:20:34", "remaining_time": "0:10:15"} +{"current_steps": 954, "total_steps": 1428, "loss": 0.4595562815666199, "lr": 3.0092133253227563e-06, "epoch": 2.004201680672269, "percentage": 66.81, "elapsed_time": "0:20:35", "remaining_time": "0:10:13"} +{"current_steps": 955, "total_steps": 1428, "loss": 0.5985803604125977, "lr": 2.9980059133718687e-06, "epoch": 2.0063025210084033, "percentage": 66.88, "elapsed_time": "0:20:36", "remaining_time": "0:10:12"} +{"current_steps": 956, "total_steps": 1428, "loss": 0.41152679920196533, "lr": 2.986810467615659e-06, "epoch": 2.008403361344538, "percentage": 66.95, "elapsed_time": "0:20:37", "remaining_time": "0:10:11"} +{"current_steps": 957, "total_steps": 1428, "loss": 0.2737478017807007, "lr": 2.9756270549708497e-06, "epoch": 2.0105042016806722, "percentage": 67.02, "elapsed_time": "0:20:38", "remaining_time": "0:10:09"} +{"current_steps": 958, "total_steps": 1428, "loss": 0.3578256368637085, "lr": 2.9644557422822406e-06, "epoch": 2.0126050420168067, "percentage": 67.09, "elapsed_time": "0:20:39", "remaining_time": "0:10:08"} +{"current_steps": 959, "total_steps": 1428, "loss": 0.3519413471221924, "lr": 2.9532965963223076e-06, "epoch": 2.014705882352941, "percentage": 67.16, "elapsed_time": "0:20:40", "remaining_time": "0:10:06"} +{"current_steps": 960, "total_steps": 1428, "loss": 0.5450835227966309, "lr": 2.9421496837908036e-06, "epoch": 2.0168067226890756, "percentage": 67.23, "elapsed_time": "0:20:41", "remaining_time": "0:10:05"} +{"current_steps": 961, "total_steps": 1428, "loss": 0.7118933796882629, "lr": 2.9310150713143637e-06, "epoch": 2.01890756302521, "percentage": 67.3, "elapsed_time": "0:20:42", "remaining_time": "0:10:04"} +{"current_steps": 962, "total_steps": 1428, "loss": 0.6735545992851257, "lr": 2.9198928254461e-06, "epoch": 2.0210084033613445, "percentage": 67.37, "elapsed_time": "0:20:44", "remaining_time": "0:10:02"} +{"current_steps": 963, "total_steps": 1428, "loss": 0.6521182060241699, "lr": 2.908783012665209e-06, "epoch": 2.023109243697479, "percentage": 67.44, "elapsed_time": "0:20:45", "remaining_time": "0:10:01"} +{"current_steps": 964, "total_steps": 1428, "loss": 0.476604163646698, "lr": 2.8976856993765766e-06, "epoch": 2.0252100840336134, "percentage": 67.51, "elapsed_time": "0:20:46", "remaining_time": "0:09:59"} +{"current_steps": 965, "total_steps": 1428, "loss": 0.46952176094055176, "lr": 2.8866009519103705e-06, "epoch": 2.027310924369748, "percentage": 67.58, "elapsed_time": "0:20:47", "remaining_time": "0:09:58"} +{"current_steps": 966, "total_steps": 1428, "loss": 0.4453829526901245, "lr": 2.875528836521658e-06, "epoch": 2.0294117647058822, "percentage": 67.65, "elapsed_time": "0:20:48", "remaining_time": "0:09:57"} +{"current_steps": 967, "total_steps": 1428, "loss": 0.2944750189781189, "lr": 2.864469419389997e-06, "epoch": 2.0315126050420167, "percentage": 67.72, "elapsed_time": "0:20:49", "remaining_time": "0:09:55"} +{"current_steps": 968, "total_steps": 1428, "loss": 0.8550271391868591, "lr": 2.8534227666190484e-06, "epoch": 2.033613445378151, "percentage": 67.79, "elapsed_time": "0:20:50", "remaining_time": "0:09:54"} +{"current_steps": 969, "total_steps": 1428, "loss": 0.38192200660705566, "lr": 2.8423889442361797e-06, "epoch": 2.0357142857142856, "percentage": 67.86, "elapsed_time": "0:20:51", "remaining_time": "0:09:52"} +{"current_steps": 970, "total_steps": 1428, "loss": 0.7316254377365112, "lr": 2.831368018192071e-06, "epoch": 2.03781512605042, "percentage": 67.93, "elapsed_time": "0:20:52", "remaining_time": "0:09:51"} +{"current_steps": 971, "total_steps": 1428, "loss": 0.7615312337875366, "lr": 2.8203600543603116e-06, "epoch": 2.0399159663865545, "percentage": 68.0, "elapsed_time": "0:20:53", "remaining_time": "0:09:50"} +{"current_steps": 972, "total_steps": 1428, "loss": 0.8274880647659302, "lr": 2.809365118537024e-06, "epoch": 2.042016806722689, "percentage": 68.07, "elapsed_time": "0:20:54", "remaining_time": "0:09:48"} +{"current_steps": 973, "total_steps": 1428, "loss": 0.31469643115997314, "lr": 2.7983832764404517e-06, "epoch": 2.0441176470588234, "percentage": 68.14, "elapsed_time": "0:20:56", "remaining_time": "0:09:47"} +{"current_steps": 974, "total_steps": 1428, "loss": 0.20855772495269775, "lr": 2.787414593710583e-06, "epoch": 2.046218487394958, "percentage": 68.21, "elapsed_time": "0:20:57", "remaining_time": "0:09:45"} +{"current_steps": 975, "total_steps": 1428, "loss": 0.6759412884712219, "lr": 2.7764591359087415e-06, "epoch": 2.0483193277310923, "percentage": 68.28, "elapsed_time": "0:20:58", "remaining_time": "0:09:44"} +{"current_steps": 976, "total_steps": 1428, "loss": 0.4555593430995941, "lr": 2.7655169685172146e-06, "epoch": 2.0504201680672267, "percentage": 68.35, "elapsed_time": "0:20:59", "remaining_time": "0:09:43"} +{"current_steps": 977, "total_steps": 1428, "loss": 0.22477459907531738, "lr": 2.7545881569388404e-06, "epoch": 2.052521008403361, "percentage": 68.42, "elapsed_time": "0:21:00", "remaining_time": "0:09:41"} +{"current_steps": 978, "total_steps": 1428, "loss": 0.47387319803237915, "lr": 2.7436727664966368e-06, "epoch": 2.0546218487394956, "percentage": 68.49, "elapsed_time": "0:21:01", "remaining_time": "0:09:40"} +{"current_steps": 979, "total_steps": 1428, "loss": 0.46857523918151855, "lr": 2.7327708624333936e-06, "epoch": 2.05672268907563, "percentage": 68.56, "elapsed_time": "0:21:02", "remaining_time": "0:09:39"} +{"current_steps": 980, "total_steps": 1428, "loss": 0.4427967071533203, "lr": 2.7218825099112966e-06, "epoch": 2.0588235294117645, "percentage": 68.63, "elapsed_time": "0:21:03", "remaining_time": "0:09:37"} +{"current_steps": 981, "total_steps": 1428, "loss": 1.3617768287658691, "lr": 2.7110077740115315e-06, "epoch": 2.060924369747899, "percentage": 68.7, "elapsed_time": "0:21:04", "remaining_time": "0:09:36"} +{"current_steps": 982, "total_steps": 1428, "loss": 0.8060270547866821, "lr": 2.7001467197338905e-06, "epoch": 2.0630252100840334, "percentage": 68.77, "elapsed_time": "0:21:05", "remaining_time": "0:09:34"} +{"current_steps": 983, "total_steps": 1428, "loss": 0.29366880655288696, "lr": 2.6892994119963965e-06, "epoch": 2.0651260504201683, "percentage": 68.84, "elapsed_time": "0:21:06", "remaining_time": "0:09:33"} +{"current_steps": 984, "total_steps": 1428, "loss": 0.40074852108955383, "lr": 2.678465915634899e-06, "epoch": 2.0672268907563027, "percentage": 68.91, "elapsed_time": "0:21:08", "remaining_time": "0:09:32"} +{"current_steps": 985, "total_steps": 1428, "loss": 0.4710817337036133, "lr": 2.667646295402704e-06, "epoch": 2.069327731092437, "percentage": 68.98, "elapsed_time": "0:21:09", "remaining_time": "0:09:30"} +{"current_steps": 986, "total_steps": 1428, "loss": 0.37437137961387634, "lr": 2.656840615970169e-06, "epoch": 2.0714285714285716, "percentage": 69.05, "elapsed_time": "0:21:10", "remaining_time": "0:09:29"} +{"current_steps": 987, "total_steps": 1428, "loss": 0.9739346504211426, "lr": 2.646048941924333e-06, "epoch": 2.073529411764706, "percentage": 69.12, "elapsed_time": "0:21:11", "remaining_time": "0:09:28"} +{"current_steps": 988, "total_steps": 1428, "loss": 0.6326197981834412, "lr": 2.635271337768517e-06, "epoch": 2.0756302521008405, "percentage": 69.19, "elapsed_time": "0:21:12", "remaining_time": "0:09:26"} +{"current_steps": 989, "total_steps": 1428, "loss": 0.15397483110427856, "lr": 2.6245078679219503e-06, "epoch": 2.077731092436975, "percentage": 69.26, "elapsed_time": "0:21:13", "remaining_time": "0:09:25"} +{"current_steps": 990, "total_steps": 1428, "loss": 0.5905511379241943, "lr": 2.613758596719373e-06, "epoch": 2.0798319327731094, "percentage": 69.33, "elapsed_time": "0:21:14", "remaining_time": "0:09:23"} +{"current_steps": 991, "total_steps": 1428, "loss": 0.588984489440918, "lr": 2.603023588410662e-06, "epoch": 2.081932773109244, "percentage": 69.4, "elapsed_time": "0:21:15", "remaining_time": "0:09:22"} +{"current_steps": 992, "total_steps": 1428, "loss": 0.33690521121025085, "lr": 2.5923029071604443e-06, "epoch": 2.0840336134453783, "percentage": 69.47, "elapsed_time": "0:21:16", "remaining_time": "0:09:21"} +{"current_steps": 993, "total_steps": 1428, "loss": 0.23294681310653687, "lr": 2.5815966170477065e-06, "epoch": 2.0861344537815127, "percentage": 69.54, "elapsed_time": "0:21:17", "remaining_time": "0:09:19"} +{"current_steps": 994, "total_steps": 1428, "loss": 0.4404110908508301, "lr": 2.5709047820654236e-06, "epoch": 2.088235294117647, "percentage": 69.61, "elapsed_time": "0:21:18", "remaining_time": "0:09:18"} +{"current_steps": 995, "total_steps": 1428, "loss": 0.37340593338012695, "lr": 2.5602274661201643e-06, "epoch": 2.0903361344537816, "percentage": 69.68, "elapsed_time": "0:21:19", "remaining_time": "0:09:17"} +{"current_steps": 996, "total_steps": 1428, "loss": 0.3671455979347229, "lr": 2.549564733031722e-06, "epoch": 2.092436974789916, "percentage": 69.75, "elapsed_time": "0:21:21", "remaining_time": "0:09:15"} +{"current_steps": 997, "total_steps": 1428, "loss": 0.6218878030776978, "lr": 2.538916646532718e-06, "epoch": 2.0945378151260505, "percentage": 69.82, "elapsed_time": "0:21:22", "remaining_time": "0:09:14"} +{"current_steps": 998, "total_steps": 1428, "loss": 1.2778301239013672, "lr": 2.528283270268238e-06, "epoch": 2.096638655462185, "percentage": 69.89, "elapsed_time": "0:21:23", "remaining_time": "0:09:12"} +{"current_steps": 999, "total_steps": 1428, "loss": 0.6543454527854919, "lr": 2.517664667795434e-06, "epoch": 2.0987394957983194, "percentage": 69.96, "elapsed_time": "0:21:24", "remaining_time": "0:09:11"} +{"current_steps": 1000, "total_steps": 1428, "loss": 0.42762574553489685, "lr": 2.5070609025831605e-06, "epoch": 2.100840336134454, "percentage": 70.03, "elapsed_time": "0:21:25", "remaining_time": "0:09:10"} +{"current_steps": 1001, "total_steps": 1428, "loss": 0.40861833095550537, "lr": 2.49647203801158e-06, "epoch": 2.1029411764705883, "percentage": 70.1, "elapsed_time": "0:21:26", "remaining_time": "0:09:08"} +{"current_steps": 1002, "total_steps": 1428, "loss": 0.6941218376159668, "lr": 2.4858981373718006e-06, "epoch": 2.1050420168067228, "percentage": 70.17, "elapsed_time": "0:21:27", "remaining_time": "0:09:07"} +{"current_steps": 1003, "total_steps": 1428, "loss": 0.1615523397922516, "lr": 2.47533926386548e-06, "epoch": 2.107142857142857, "percentage": 70.24, "elapsed_time": "0:21:28", "remaining_time": "0:09:06"} +{"current_steps": 1004, "total_steps": 1428, "loss": 0.30699750781059265, "lr": 2.4647954806044633e-06, "epoch": 2.1092436974789917, "percentage": 70.31, "elapsed_time": "0:21:29", "remaining_time": "0:09:04"} +{"current_steps": 1005, "total_steps": 1428, "loss": 0.27435654401779175, "lr": 2.454266850610398e-06, "epoch": 2.111344537815126, "percentage": 70.38, "elapsed_time": "0:21:30", "remaining_time": "0:09:03"} +{"current_steps": 1006, "total_steps": 1428, "loss": 0.6352673172950745, "lr": 2.443753436814354e-06, "epoch": 2.1134453781512605, "percentage": 70.45, "elapsed_time": "0:21:31", "remaining_time": "0:09:01"} +{"current_steps": 1007, "total_steps": 1428, "loss": 0.3478729724884033, "lr": 2.433255302056458e-06, "epoch": 2.115546218487395, "percentage": 70.52, "elapsed_time": "0:21:33", "remaining_time": "0:09:00"} +{"current_steps": 1008, "total_steps": 1428, "loss": 0.3971726894378662, "lr": 2.4227725090855063e-06, "epoch": 2.1176470588235294, "percentage": 70.59, "elapsed_time": "0:21:34", "remaining_time": "0:08:59"} +{"current_steps": 1009, "total_steps": 1428, "loss": 0.9241357445716858, "lr": 2.412305120558599e-06, "epoch": 2.119747899159664, "percentage": 70.66, "elapsed_time": "0:21:35", "remaining_time": "0:08:57"} +{"current_steps": 1010, "total_steps": 1428, "loss": 0.2883678674697876, "lr": 2.40185319904076e-06, "epoch": 2.1218487394957983, "percentage": 70.73, "elapsed_time": "0:21:36", "remaining_time": "0:08:56"} +{"current_steps": 1011, "total_steps": 1428, "loss": 0.39812758564949036, "lr": 2.391416807004568e-06, "epoch": 2.1239495798319328, "percentage": 70.8, "elapsed_time": "0:21:37", "remaining_time": "0:08:55"} +{"current_steps": 1012, "total_steps": 1428, "loss": 0.6487483978271484, "lr": 2.3809960068297732e-06, "epoch": 2.1260504201680672, "percentage": 70.87, "elapsed_time": "0:21:38", "remaining_time": "0:08:53"} +{"current_steps": 1013, "total_steps": 1428, "loss": 0.44781216979026794, "lr": 2.370590860802938e-06, "epoch": 2.1281512605042017, "percentage": 70.94, "elapsed_time": "0:21:39", "remaining_time": "0:08:52"} +{"current_steps": 1014, "total_steps": 1428, "loss": 0.3241298496723175, "lr": 2.3602014311170524e-06, "epoch": 2.130252100840336, "percentage": 71.01, "elapsed_time": "0:21:40", "remaining_time": "0:08:51"} +{"current_steps": 1015, "total_steps": 1428, "loss": 0.4608106315135956, "lr": 2.3498277798711725e-06, "epoch": 2.1323529411764706, "percentage": 71.08, "elapsed_time": "0:21:41", "remaining_time": "0:08:49"} +{"current_steps": 1016, "total_steps": 1428, "loss": 0.5967488884925842, "lr": 2.3394699690700395e-06, "epoch": 2.134453781512605, "percentage": 71.15, "elapsed_time": "0:21:42", "remaining_time": "0:08:48"} +{"current_steps": 1017, "total_steps": 1428, "loss": 0.4074782729148865, "lr": 2.3291280606237186e-06, "epoch": 2.1365546218487395, "percentage": 71.22, "elapsed_time": "0:21:43", "remaining_time": "0:08:46"} +{"current_steps": 1018, "total_steps": 1428, "loss": 0.354820191860199, "lr": 2.3188021163472206e-06, "epoch": 2.138655462184874, "percentage": 71.29, "elapsed_time": "0:21:44", "remaining_time": "0:08:45"} +{"current_steps": 1019, "total_steps": 1428, "loss": 0.23287059366703033, "lr": 2.308492197960141e-06, "epoch": 2.1407563025210083, "percentage": 71.36, "elapsed_time": "0:21:46", "remaining_time": "0:08:44"} +{"current_steps": 1020, "total_steps": 1428, "loss": 1.0973201990127563, "lr": 2.2981983670862796e-06, "epoch": 2.142857142857143, "percentage": 71.43, "elapsed_time": "0:21:47", "remaining_time": "0:08:42"} +{"current_steps": 1021, "total_steps": 1428, "loss": 0.4452645778656006, "lr": 2.2879206852532854e-06, "epoch": 2.1449579831932772, "percentage": 71.5, "elapsed_time": "0:21:48", "remaining_time": "0:08:41"} +{"current_steps": 1022, "total_steps": 1428, "loss": 0.273881733417511, "lr": 2.2776592138922806e-06, "epoch": 2.1470588235294117, "percentage": 71.57, "elapsed_time": "0:21:49", "remaining_time": "0:08:40"} +{"current_steps": 1023, "total_steps": 1428, "loss": 0.20633578300476074, "lr": 2.2674140143374904e-06, "epoch": 2.149159663865546, "percentage": 71.64, "elapsed_time": "0:21:50", "remaining_time": "0:08:38"} +{"current_steps": 1024, "total_steps": 1428, "loss": 0.38969674706459045, "lr": 2.2571851478258903e-06, "epoch": 2.1512605042016806, "percentage": 71.71, "elapsed_time": "0:21:51", "remaining_time": "0:08:37"} +{"current_steps": 1025, "total_steps": 1428, "loss": 0.26989856362342834, "lr": 2.2469726754968207e-06, "epoch": 2.153361344537815, "percentage": 71.78, "elapsed_time": "0:21:52", "remaining_time": "0:08:36"} +{"current_steps": 1026, "total_steps": 1428, "loss": 0.5260115265846252, "lr": 2.236776658391641e-06, "epoch": 2.1554621848739495, "percentage": 71.85, "elapsed_time": "0:21:53", "remaining_time": "0:08:34"} +{"current_steps": 1027, "total_steps": 1428, "loss": 0.2469472587108612, "lr": 2.2265971574533474e-06, "epoch": 2.157563025210084, "percentage": 71.92, "elapsed_time": "0:21:54", "remaining_time": "0:08:33"} +{"current_steps": 1028, "total_steps": 1428, "loss": 0.201723113656044, "lr": 2.2164342335262244e-06, "epoch": 2.1596638655462184, "percentage": 71.99, "elapsed_time": "0:21:55", "remaining_time": "0:08:31"} +{"current_steps": 1029, "total_steps": 1428, "loss": 0.6355183124542236, "lr": 2.2062879473554654e-06, "epoch": 2.161764705882353, "percentage": 72.06, "elapsed_time": "0:21:56", "remaining_time": "0:08:30"} +{"current_steps": 1030, "total_steps": 1428, "loss": 0.32272863388061523, "lr": 2.1961583595868253e-06, "epoch": 2.1638655462184873, "percentage": 72.13, "elapsed_time": "0:21:57", "remaining_time": "0:08:29"} +{"current_steps": 1031, "total_steps": 1428, "loss": 0.24386917054653168, "lr": 2.186045530766244e-06, "epoch": 2.1659663865546217, "percentage": 72.2, "elapsed_time": "0:21:59", "remaining_time": "0:08:27"} +{"current_steps": 1032, "total_steps": 1428, "loss": 0.482686847448349, "lr": 2.1759495213394965e-06, "epoch": 2.168067226890756, "percentage": 72.27, "elapsed_time": "0:22:00", "remaining_time": "0:08:26"} +{"current_steps": 1033, "total_steps": 1428, "loss": 0.5142661333084106, "lr": 2.165870391651819e-06, "epoch": 2.1701680672268906, "percentage": 72.34, "elapsed_time": "0:22:01", "remaining_time": "0:08:25"} +{"current_steps": 1034, "total_steps": 1428, "loss": 0.21703539788722992, "lr": 2.155808201947563e-06, "epoch": 2.172268907563025, "percentage": 72.41, "elapsed_time": "0:22:02", "remaining_time": "0:08:23"} +{"current_steps": 1035, "total_steps": 1428, "loss": 0.4068147540092468, "lr": 2.145763012369824e-06, "epoch": 2.1743697478991595, "percentage": 72.48, "elapsed_time": "0:22:03", "remaining_time": "0:08:22"} +{"current_steps": 1036, "total_steps": 1428, "loss": 0.5949288606643677, "lr": 2.1357348829600816e-06, "epoch": 2.176470588235294, "percentage": 72.55, "elapsed_time": "0:22:04", "remaining_time": "0:08:21"} +{"current_steps": 1037, "total_steps": 1428, "loss": 0.44353166222572327, "lr": 2.125723873657852e-06, "epoch": 2.1785714285714284, "percentage": 72.62, "elapsed_time": "0:22:05", "remaining_time": "0:08:19"} +{"current_steps": 1038, "total_steps": 1428, "loss": 0.4212431013584137, "lr": 2.115730044300313e-06, "epoch": 2.180672268907563, "percentage": 72.69, "elapsed_time": "0:22:06", "remaining_time": "0:08:18"} +{"current_steps": 1039, "total_steps": 1428, "loss": 0.37279778718948364, "lr": 2.105753454621966e-06, "epoch": 2.1827731092436973, "percentage": 72.76, "elapsed_time": "0:22:07", "remaining_time": "0:08:17"} +{"current_steps": 1040, "total_steps": 1428, "loss": 0.6137001514434814, "lr": 2.095794164254259e-06, "epoch": 2.184873949579832, "percentage": 72.83, "elapsed_time": "0:22:08", "remaining_time": "0:08:15"} +{"current_steps": 1041, "total_steps": 1428, "loss": 0.20706136524677277, "lr": 2.0858522327252467e-06, "epoch": 2.1869747899159666, "percentage": 72.9, "elapsed_time": "0:22:09", "remaining_time": "0:08:14"} +{"current_steps": 1042, "total_steps": 1428, "loss": 0.3732944130897522, "lr": 2.0759277194592208e-06, "epoch": 2.189075630252101, "percentage": 72.97, "elapsed_time": "0:22:10", "remaining_time": "0:08:13"} +{"current_steps": 1043, "total_steps": 1428, "loss": 0.11849310249090195, "lr": 2.06602068377637e-06, "epoch": 2.1911764705882355, "percentage": 73.04, "elapsed_time": "0:22:12", "remaining_time": "0:08:11"} +{"current_steps": 1044, "total_steps": 1428, "loss": 0.35089147090911865, "lr": 2.0561311848924082e-06, "epoch": 2.19327731092437, "percentage": 73.11, "elapsed_time": "0:22:13", "remaining_time": "0:08:10"} +{"current_steps": 1045, "total_steps": 1428, "loss": 0.3482816219329834, "lr": 2.0462592819182377e-06, "epoch": 2.1953781512605044, "percentage": 73.18, "elapsed_time": "0:22:14", "remaining_time": "0:08:08"} +{"current_steps": 1046, "total_steps": 1428, "loss": 0.9048193097114563, "lr": 2.0364050338595792e-06, "epoch": 2.197478991596639, "percentage": 73.25, "elapsed_time": "0:22:15", "remaining_time": "0:08:07"} +{"current_steps": 1047, "total_steps": 1428, "loss": 0.34331268072128296, "lr": 2.0265684996166345e-06, "epoch": 2.1995798319327733, "percentage": 73.32, "elapsed_time": "0:22:16", "remaining_time": "0:08:06"} +{"current_steps": 1048, "total_steps": 1428, "loss": 0.35536718368530273, "lr": 2.0167497379837254e-06, "epoch": 2.2016806722689077, "percentage": 73.39, "elapsed_time": "0:22:17", "remaining_time": "0:08:04"} +{"current_steps": 1049, "total_steps": 1428, "loss": 0.20954403281211853, "lr": 2.0069488076489445e-06, "epoch": 2.203781512605042, "percentage": 73.46, "elapsed_time": "0:22:18", "remaining_time": "0:08:03"} +{"current_steps": 1050, "total_steps": 1428, "loss": 0.5290908813476562, "lr": 1.997165767193801e-06, "epoch": 2.2058823529411766, "percentage": 73.53, "elapsed_time": "0:22:19", "remaining_time": "0:08:02"} +{"current_steps": 1051, "total_steps": 1428, "loss": 0.44289880990982056, "lr": 1.9874006750928783e-06, "epoch": 2.207983193277311, "percentage": 73.6, "elapsed_time": "0:22:20", "remaining_time": "0:08:00"} +{"current_steps": 1052, "total_steps": 1428, "loss": 0.48035284876823425, "lr": 1.97765358971348e-06, "epoch": 2.2100840336134455, "percentage": 73.67, "elapsed_time": "0:22:21", "remaining_time": "0:07:59"} +{"current_steps": 1053, "total_steps": 1428, "loss": 0.2514810562133789, "lr": 1.967924569315275e-06, "epoch": 2.21218487394958, "percentage": 73.74, "elapsed_time": "0:22:22", "remaining_time": "0:07:58"} +{"current_steps": 1054, "total_steps": 1428, "loss": 0.9599279165267944, "lr": 1.958213672049964e-06, "epoch": 2.2142857142857144, "percentage": 73.81, "elapsed_time": "0:22:23", "remaining_time": "0:07:56"} +{"current_steps": 1055, "total_steps": 1428, "loss": 0.30860060453414917, "lr": 1.9485209559609148e-06, "epoch": 2.216386554621849, "percentage": 73.88, "elapsed_time": "0:22:25", "remaining_time": "0:07:55"} +{"current_steps": 1056, "total_steps": 1428, "loss": 0.7747633457183838, "lr": 1.9388464789828316e-06, "epoch": 2.2184873949579833, "percentage": 73.95, "elapsed_time": "0:22:26", "remaining_time": "0:07:54"} +{"current_steps": 1057, "total_steps": 1428, "loss": 0.3529064655303955, "lr": 1.9291902989413935e-06, "epoch": 2.2205882352941178, "percentage": 74.02, "elapsed_time": "0:22:27", "remaining_time": "0:07:52"} +{"current_steps": 1058, "total_steps": 1428, "loss": 1.0967960357666016, "lr": 1.9195524735529237e-06, "epoch": 2.222689075630252, "percentage": 74.09, "elapsed_time": "0:22:28", "remaining_time": "0:07:51"} +{"current_steps": 1059, "total_steps": 1428, "loss": 0.700248122215271, "lr": 1.909933060424029e-06, "epoch": 2.2247899159663866, "percentage": 74.16, "elapsed_time": "0:22:29", "remaining_time": "0:07:50"} +{"current_steps": 1060, "total_steps": 1428, "loss": 0.9177491068840027, "lr": 1.9003321170512728e-06, "epoch": 2.226890756302521, "percentage": 74.23, "elapsed_time": "0:22:30", "remaining_time": "0:07:48"} +{"current_steps": 1061, "total_steps": 1428, "loss": 0.543596625328064, "lr": 1.890749700820813e-06, "epoch": 2.2289915966386555, "percentage": 74.3, "elapsed_time": "0:22:31", "remaining_time": "0:07:47"} +{"current_steps": 1062, "total_steps": 1428, "loss": 0.7324357032775879, "lr": 1.8811858690080764e-06, "epoch": 2.23109243697479, "percentage": 74.37, "elapsed_time": "0:22:32", "remaining_time": "0:07:46"} +{"current_steps": 1063, "total_steps": 1428, "loss": 0.4075426459312439, "lr": 1.8716406787774e-06, "epoch": 2.2331932773109244, "percentage": 74.44, "elapsed_time": "0:22:33", "remaining_time": "0:07:44"} +{"current_steps": 1064, "total_steps": 1428, "loss": 0.39563894271850586, "lr": 1.862114187181705e-06, "epoch": 2.235294117647059, "percentage": 74.51, "elapsed_time": "0:22:34", "remaining_time": "0:07:43"} +{"current_steps": 1065, "total_steps": 1428, "loss": 0.37604600191116333, "lr": 1.8526064511621455e-06, "epoch": 2.2373949579831933, "percentage": 74.58, "elapsed_time": "0:22:35", "remaining_time": "0:07:42"} +{"current_steps": 1066, "total_steps": 1428, "loss": 0.6682062745094299, "lr": 1.843117527547768e-06, "epoch": 2.2394957983193278, "percentage": 74.65, "elapsed_time": "0:22:36", "remaining_time": "0:07:40"} +{"current_steps": 1067, "total_steps": 1428, "loss": 0.19220635294914246, "lr": 1.8336474730551807e-06, "epoch": 2.241596638655462, "percentage": 74.72, "elapsed_time": "0:22:37", "remaining_time": "0:07:39"} +{"current_steps": 1068, "total_steps": 1428, "loss": 0.27735865116119385, "lr": 1.8241963442882005e-06, "epoch": 2.2436974789915967, "percentage": 74.79, "elapsed_time": "0:22:39", "remaining_time": "0:07:38"} +{"current_steps": 1069, "total_steps": 1428, "loss": 0.41572022438049316, "lr": 1.8147641977375313e-06, "epoch": 2.245798319327731, "percentage": 74.86, "elapsed_time": "0:22:40", "remaining_time": "0:07:36"} +{"current_steps": 1070, "total_steps": 1428, "loss": 0.25049227476119995, "lr": 1.8053510897804105e-06, "epoch": 2.2478991596638656, "percentage": 74.93, "elapsed_time": "0:22:41", "remaining_time": "0:07:35"} +{"current_steps": 1071, "total_steps": 1428, "loss": 0.17869159579277039, "lr": 1.7959570766802847e-06, "epoch": 2.25, "percentage": 75.0, "elapsed_time": "0:22:42", "remaining_time": "0:07:34"} +{"current_steps": 1072, "total_steps": 1428, "loss": 0.2621746361255646, "lr": 1.786582214586462e-06, "epoch": 2.2521008403361344, "percentage": 75.07, "elapsed_time": "0:22:43", "remaining_time": "0:07:32"} +{"current_steps": 1073, "total_steps": 1428, "loss": 0.33446362614631653, "lr": 1.77722655953379e-06, "epoch": 2.254201680672269, "percentage": 75.14, "elapsed_time": "0:22:44", "remaining_time": "0:07:31"} +{"current_steps": 1074, "total_steps": 1428, "loss": 0.17267954349517822, "lr": 1.7678901674423044e-06, "epoch": 2.2563025210084033, "percentage": 75.21, "elapsed_time": "0:22:45", "remaining_time": "0:07:30"} +{"current_steps": 1075, "total_steps": 1428, "loss": 0.5281901955604553, "lr": 1.7585730941169105e-06, "epoch": 2.258403361344538, "percentage": 75.28, "elapsed_time": "0:22:46", "remaining_time": "0:07:28"} +{"current_steps": 1076, "total_steps": 1428, "loss": 0.2754780352115631, "lr": 1.7492753952470415e-06, "epoch": 2.2605042016806722, "percentage": 75.35, "elapsed_time": "0:22:47", "remaining_time": "0:07:27"} +{"current_steps": 1077, "total_steps": 1428, "loss": 0.3246016502380371, "lr": 1.739997126406322e-06, "epoch": 2.2626050420168067, "percentage": 75.42, "elapsed_time": "0:22:48", "remaining_time": "0:07:26"} +{"current_steps": 1078, "total_steps": 1428, "loss": 0.6660511493682861, "lr": 1.7307383430522474e-06, "epoch": 2.264705882352941, "percentage": 75.49, "elapsed_time": "0:22:49", "remaining_time": "0:07:24"} +{"current_steps": 1079, "total_steps": 1428, "loss": 1.2165361642837524, "lr": 1.7214991005258386e-06, "epoch": 2.2668067226890756, "percentage": 75.56, "elapsed_time": "0:22:50", "remaining_time": "0:07:23"} +{"current_steps": 1080, "total_steps": 1428, "loss": 0.18396508693695068, "lr": 1.7122794540513265e-06, "epoch": 2.26890756302521, "percentage": 75.63, "elapsed_time": "0:22:51", "remaining_time": "0:07:22"} +{"current_steps": 1081, "total_steps": 1428, "loss": 0.42018991708755493, "lr": 1.703079458735805e-06, "epoch": 2.2710084033613445, "percentage": 75.7, "elapsed_time": "0:22:53", "remaining_time": "0:07:20"} +{"current_steps": 1082, "total_steps": 1428, "loss": 0.38192903995513916, "lr": 1.6938991695689184e-06, "epoch": 2.273109243697479, "percentage": 75.77, "elapsed_time": "0:22:54", "remaining_time": "0:07:19"} +{"current_steps": 1083, "total_steps": 1428, "loss": 0.4953494966030121, "lr": 1.684738641422517e-06, "epoch": 2.2752100840336134, "percentage": 75.84, "elapsed_time": "0:22:55", "remaining_time": "0:07:18"} +{"current_steps": 1084, "total_steps": 1428, "loss": 0.5324037075042725, "lr": 1.6755979290503437e-06, "epoch": 2.277310924369748, "percentage": 75.91, "elapsed_time": "0:22:56", "remaining_time": "0:07:16"} +{"current_steps": 1085, "total_steps": 1428, "loss": 0.6618460416793823, "lr": 1.666477087087694e-06, "epoch": 2.2794117647058822, "percentage": 75.98, "elapsed_time": "0:22:57", "remaining_time": "0:07:15"} +{"current_steps": 1086, "total_steps": 1428, "loss": 0.29154300689697266, "lr": 1.6573761700511004e-06, "epoch": 2.2815126050420167, "percentage": 76.05, "elapsed_time": "0:22:58", "remaining_time": "0:07:14"} +{"current_steps": 1087, "total_steps": 1428, "loss": 0.39994263648986816, "lr": 1.6482952323379958e-06, "epoch": 2.283613445378151, "percentage": 76.12, "elapsed_time": "0:22:59", "remaining_time": "0:07:12"} +{"current_steps": 1088, "total_steps": 1428, "loss": 0.2049681693315506, "lr": 1.639234328226399e-06, "epoch": 2.2857142857142856, "percentage": 76.19, "elapsed_time": "0:23:00", "remaining_time": "0:07:11"} +{"current_steps": 1089, "total_steps": 1428, "loss": 0.35848674178123474, "lr": 1.6301935118745826e-06, "epoch": 2.28781512605042, "percentage": 76.26, "elapsed_time": "0:23:01", "remaining_time": "0:07:10"} +{"current_steps": 1090, "total_steps": 1428, "loss": 0.4794918894767761, "lr": 1.621172837320754e-06, "epoch": 2.2899159663865545, "percentage": 76.33, "elapsed_time": "0:23:02", "remaining_time": "0:07:08"} +{"current_steps": 1091, "total_steps": 1428, "loss": 0.3671627342700958, "lr": 1.6121723584827259e-06, "epoch": 2.292016806722689, "percentage": 76.4, "elapsed_time": "0:23:03", "remaining_time": "0:07:07"} +{"current_steps": 1092, "total_steps": 1428, "loss": 0.25063830614089966, "lr": 1.6031921291576048e-06, "epoch": 2.2941176470588234, "percentage": 76.47, "elapsed_time": "0:23:04", "remaining_time": "0:07:06"} +{"current_steps": 1093, "total_steps": 1428, "loss": 0.7581193447113037, "lr": 1.5942322030214547e-06, "epoch": 2.296218487394958, "percentage": 76.54, "elapsed_time": "0:23:06", "remaining_time": "0:07:04"} +{"current_steps": 1094, "total_steps": 1428, "loss": 0.4217086434364319, "lr": 1.5852926336289926e-06, "epoch": 2.2983193277310923, "percentage": 76.61, "elapsed_time": "0:23:07", "remaining_time": "0:07:03"} +{"current_steps": 1095, "total_steps": 1428, "loss": 0.5018645524978638, "lr": 1.5763734744132587e-06, "epoch": 2.3004201680672267, "percentage": 76.68, "elapsed_time": "0:23:08", "remaining_time": "0:07:02"} +{"current_steps": 1096, "total_steps": 1428, "loss": 0.5745636224746704, "lr": 1.5674747786852935e-06, "epoch": 2.302521008403361, "percentage": 76.75, "elapsed_time": "0:23:09", "remaining_time": "0:07:00"} +{"current_steps": 1097, "total_steps": 1428, "loss": 0.9145222902297974, "lr": 1.5585965996338314e-06, "epoch": 2.3046218487394956, "percentage": 76.82, "elapsed_time": "0:23:10", "remaining_time": "0:06:59"} +{"current_steps": 1098, "total_steps": 1428, "loss": 0.4312666058540344, "lr": 1.5497389903249705e-06, "epoch": 2.30672268907563, "percentage": 76.89, "elapsed_time": "0:23:11", "remaining_time": "0:06:58"} +{"current_steps": 1099, "total_steps": 1428, "loss": 0.4121660590171814, "lr": 1.5409020037018652e-06, "epoch": 2.3088235294117645, "percentage": 76.96, "elapsed_time": "0:23:12", "remaining_time": "0:06:56"} +{"current_steps": 1100, "total_steps": 1428, "loss": 0.8646482825279236, "lr": 1.5320856925843997e-06, "epoch": 2.310924369747899, "percentage": 77.03, "elapsed_time": "0:23:13", "remaining_time": "0:06:55"} +{"current_steps": 1101, "total_steps": 1428, "loss": 0.784586489200592, "lr": 1.5232901096688847e-06, "epoch": 2.3130252100840334, "percentage": 77.1, "elapsed_time": "0:23:14", "remaining_time": "0:06:54"} +{"current_steps": 1102, "total_steps": 1428, "loss": 0.9424635171890259, "lr": 1.5145153075277286e-06, "epoch": 2.315126050420168, "percentage": 77.17, "elapsed_time": "0:23:15", "remaining_time": "0:06:52"} +{"current_steps": 1103, "total_steps": 1428, "loss": 0.28385645151138306, "lr": 1.505761338609137e-06, "epoch": 2.3172268907563023, "percentage": 77.24, "elapsed_time": "0:23:16", "remaining_time": "0:06:51"} +{"current_steps": 1104, "total_steps": 1428, "loss": 0.6689031720161438, "lr": 1.4970282552367854e-06, "epoch": 2.3193277310924367, "percentage": 77.31, "elapsed_time": "0:23:17", "remaining_time": "0:06:50"} +{"current_steps": 1105, "total_steps": 1428, "loss": 0.691364586353302, "lr": 1.4883161096095189e-06, "epoch": 2.3214285714285716, "percentage": 77.38, "elapsed_time": "0:23:19", "remaining_time": "0:06:48"} +{"current_steps": 1106, "total_steps": 1428, "loss": 0.23520073294639587, "lr": 1.4796249538010354e-06, "epoch": 2.323529411764706, "percentage": 77.45, "elapsed_time": "0:23:20", "remaining_time": "0:06:47"} +{"current_steps": 1107, "total_steps": 1428, "loss": 0.4271107316017151, "lr": 1.4709548397595674e-06, "epoch": 2.3256302521008405, "percentage": 77.52, "elapsed_time": "0:23:21", "remaining_time": "0:06:46"} +{"current_steps": 1108, "total_steps": 1428, "loss": 0.9280604720115662, "lr": 1.4623058193075852e-06, "epoch": 2.327731092436975, "percentage": 77.59, "elapsed_time": "0:23:22", "remaining_time": "0:06:44"} +{"current_steps": 1109, "total_steps": 1428, "loss": 0.33376407623291016, "lr": 1.453677944141474e-06, "epoch": 2.3298319327731094, "percentage": 77.66, "elapsed_time": "0:23:23", "remaining_time": "0:06:43"} +{"current_steps": 1110, "total_steps": 1428, "loss": 0.7442219853401184, "lr": 1.4450712658312356e-06, "epoch": 2.331932773109244, "percentage": 77.73, "elapsed_time": "0:23:24", "remaining_time": "0:06:42"} +{"current_steps": 1111, "total_steps": 1428, "loss": 1.27920663356781, "lr": 1.43648583582017e-06, "epoch": 2.3340336134453783, "percentage": 77.8, "elapsed_time": "0:23:25", "remaining_time": "0:06:41"} +{"current_steps": 1112, "total_steps": 1428, "loss": 0.6456579566001892, "lr": 1.4279217054245793e-06, "epoch": 2.3361344537815127, "percentage": 77.87, "elapsed_time": "0:23:26", "remaining_time": "0:06:39"} +{"current_steps": 1113, "total_steps": 1428, "loss": 1.1350394487380981, "lr": 1.4193789258334485e-06, "epoch": 2.338235294117647, "percentage": 77.94, "elapsed_time": "0:23:27", "remaining_time": "0:06:38"} +{"current_steps": 1114, "total_steps": 1428, "loss": 0.5290108919143677, "lr": 1.4108575481081522e-06, "epoch": 2.3403361344537816, "percentage": 78.01, "elapsed_time": "0:23:28", "remaining_time": "0:06:37"} +{"current_steps": 1115, "total_steps": 1428, "loss": 0.2833002209663391, "lr": 1.4023576231821362e-06, "epoch": 2.342436974789916, "percentage": 78.08, "elapsed_time": "0:23:29", "remaining_time": "0:06:35"} +{"current_steps": 1116, "total_steps": 1428, "loss": 0.37826409935951233, "lr": 1.3938792018606278e-06, "epoch": 2.3445378151260505, "percentage": 78.15, "elapsed_time": "0:23:30", "remaining_time": "0:06:34"} +{"current_steps": 1117, "total_steps": 1428, "loss": 0.3945717215538025, "lr": 1.3854223348203171e-06, "epoch": 2.346638655462185, "percentage": 78.22, "elapsed_time": "0:23:31", "remaining_time": "0:06:33"} +{"current_steps": 1118, "total_steps": 1428, "loss": 0.31352269649505615, "lr": 1.376987072609065e-06, "epoch": 2.3487394957983194, "percentage": 78.29, "elapsed_time": "0:23:33", "remaining_time": "0:06:31"} +{"current_steps": 1119, "total_steps": 1428, "loss": 0.8024647235870361, "lr": 1.368573465645599e-06, "epoch": 2.350840336134454, "percentage": 78.36, "elapsed_time": "0:23:34", "remaining_time": "0:06:30"} +{"current_steps": 1120, "total_steps": 1428, "loss": 0.7791054248809814, "lr": 1.360181564219204e-06, "epoch": 2.3529411764705883, "percentage": 78.43, "elapsed_time": "0:23:35", "remaining_time": "0:06:29"} +{"current_steps": 1121, "total_steps": 1428, "loss": 0.37381619215011597, "lr": 1.351811418489436e-06, "epoch": 2.3550420168067228, "percentage": 78.5, "elapsed_time": "0:23:36", "remaining_time": "0:06:27"} +{"current_steps": 1122, "total_steps": 1428, "loss": 0.3184419870376587, "lr": 1.3434630784858067e-06, "epoch": 2.357142857142857, "percentage": 78.57, "elapsed_time": "0:23:37", "remaining_time": "0:06:26"} +{"current_steps": 1123, "total_steps": 1428, "loss": 0.3431350886821747, "lr": 1.335136594107498e-06, "epoch": 2.3592436974789917, "percentage": 78.64, "elapsed_time": "0:23:38", "remaining_time": "0:06:25"} +{"current_steps": 1124, "total_steps": 1428, "loss": 0.4296434819698334, "lr": 1.3268320151230518e-06, "epoch": 2.361344537815126, "percentage": 78.71, "elapsed_time": "0:23:39", "remaining_time": "0:06:23"} +{"current_steps": 1125, "total_steps": 1428, "loss": 0.48791950941085815, "lr": 1.3185493911700854e-06, "epoch": 2.3634453781512605, "percentage": 78.78, "elapsed_time": "0:23:40", "remaining_time": "0:06:22"} +{"current_steps": 1126, "total_steps": 1428, "loss": 0.29711413383483887, "lr": 1.3102887717549812e-06, "epoch": 2.365546218487395, "percentage": 78.85, "elapsed_time": "0:23:41", "remaining_time": "0:06:21"} +{"current_steps": 1127, "total_steps": 1428, "loss": 0.39902636408805847, "lr": 1.302050206252602e-06, "epoch": 2.3676470588235294, "percentage": 78.92, "elapsed_time": "0:23:42", "remaining_time": "0:06:19"} +{"current_steps": 1128, "total_steps": 1428, "loss": 0.2864948511123657, "lr": 1.2938337439059868e-06, "epoch": 2.369747899159664, "percentage": 78.99, "elapsed_time": "0:23:43", "remaining_time": "0:06:18"} +{"current_steps": 1129, "total_steps": 1428, "loss": 0.42151930928230286, "lr": 1.2856394338260691e-06, "epoch": 2.3718487394957983, "percentage": 79.06, "elapsed_time": "0:23:44", "remaining_time": "0:06:17"} +{"current_steps": 1130, "total_steps": 1428, "loss": 0.330949604511261, "lr": 1.2774673249913656e-06, "epoch": 2.3739495798319328, "percentage": 79.13, "elapsed_time": "0:23:45", "remaining_time": "0:06:16"} +{"current_steps": 1131, "total_steps": 1428, "loss": 0.832221508026123, "lr": 1.2693174662477003e-06, "epoch": 2.3760504201680672, "percentage": 79.2, "elapsed_time": "0:23:47", "remaining_time": "0:06:14"} +{"current_steps": 1132, "total_steps": 1428, "loss": 0.3243201971054077, "lr": 1.2611899063079002e-06, "epoch": 2.3781512605042017, "percentage": 79.27, "elapsed_time": "0:23:48", "remaining_time": "0:06:13"} +{"current_steps": 1133, "total_steps": 1428, "loss": 0.4209938049316406, "lr": 1.253084693751514e-06, "epoch": 2.380252100840336, "percentage": 79.34, "elapsed_time": "0:23:49", "remaining_time": "0:06:12"} +{"current_steps": 1134, "total_steps": 1428, "loss": 0.1905173659324646, "lr": 1.245001877024512e-06, "epoch": 2.3823529411764706, "percentage": 79.41, "elapsed_time": "0:23:50", "remaining_time": "0:06:10"} +{"current_steps": 1135, "total_steps": 1428, "loss": 0.31655293703079224, "lr": 1.2369415044390055e-06, "epoch": 2.384453781512605, "percentage": 79.48, "elapsed_time": "0:23:51", "remaining_time": "0:06:09"} +{"current_steps": 1136, "total_steps": 1428, "loss": 0.2780379354953766, "lr": 1.228903624172954e-06, "epoch": 2.3865546218487395, "percentage": 79.55, "elapsed_time": "0:23:52", "remaining_time": "0:06:08"} +{"current_steps": 1137, "total_steps": 1428, "loss": 0.5738459825515747, "lr": 1.220888284269874e-06, "epoch": 2.388655462184874, "percentage": 79.62, "elapsed_time": "0:23:53", "remaining_time": "0:06:06"} +{"current_steps": 1138, "total_steps": 1428, "loss": 0.4594503343105316, "lr": 1.2128955326385595e-06, "epoch": 2.3907563025210083, "percentage": 79.69, "elapsed_time": "0:23:54", "remaining_time": "0:06:05"} +{"current_steps": 1139, "total_steps": 1428, "loss": 1.6502771377563477, "lr": 1.2049254170527857e-06, "epoch": 2.392857142857143, "percentage": 79.76, "elapsed_time": "0:23:55", "remaining_time": "0:06:04"} +{"current_steps": 1140, "total_steps": 1428, "loss": 0.7063793540000916, "lr": 1.196977985151036e-06, "epoch": 2.3949579831932772, "percentage": 79.83, "elapsed_time": "0:23:56", "remaining_time": "0:06:02"} +{"current_steps": 1141, "total_steps": 1428, "loss": 0.4885460138320923, "lr": 1.1890532844362035e-06, "epoch": 2.3970588235294117, "percentage": 79.9, "elapsed_time": "0:23:57", "remaining_time": "0:06:01"} +{"current_steps": 1142, "total_steps": 1428, "loss": 0.29537534713745117, "lr": 1.1811513622753196e-06, "epoch": 2.399159663865546, "percentage": 79.97, "elapsed_time": "0:23:58", "remaining_time": "0:06:00"} +{"current_steps": 1143, "total_steps": 1428, "loss": 0.6734664440155029, "lr": 1.1732722658992597e-06, "epoch": 2.4012605042016806, "percentage": 80.04, "elapsed_time": "0:24:00", "remaining_time": "0:05:59"} +{"current_steps": 1144, "total_steps": 1428, "loss": 0.39790263772010803, "lr": 1.1654160424024718e-06, "epoch": 2.403361344537815, "percentage": 80.11, "elapsed_time": "0:24:01", "remaining_time": "0:05:57"} +{"current_steps": 1145, "total_steps": 1428, "loss": 0.2750331163406372, "lr": 1.1575827387426846e-06, "epoch": 2.4054621848739495, "percentage": 80.18, "elapsed_time": "0:24:02", "remaining_time": "0:05:56"} +{"current_steps": 1146, "total_steps": 1428, "loss": 0.44170406460762024, "lr": 1.149772401740637e-06, "epoch": 2.407563025210084, "percentage": 80.25, "elapsed_time": "0:24:03", "remaining_time": "0:05:55"} +{"current_steps": 1147, "total_steps": 1428, "loss": 0.19013899564743042, "lr": 1.1419850780797864e-06, "epoch": 2.4096638655462184, "percentage": 80.32, "elapsed_time": "0:24:04", "remaining_time": "0:05:53"} +{"current_steps": 1148, "total_steps": 1428, "loss": 0.4140137732028961, "lr": 1.1342208143060423e-06, "epoch": 2.411764705882353, "percentage": 80.39, "elapsed_time": "0:24:05", "remaining_time": "0:05:52"} +{"current_steps": 1149, "total_steps": 1428, "loss": 0.4861386716365814, "lr": 1.1264796568274811e-06, "epoch": 2.4138655462184873, "percentage": 80.46, "elapsed_time": "0:24:06", "remaining_time": "0:05:51"} +{"current_steps": 1150, "total_steps": 1428, "loss": 0.3487178683280945, "lr": 1.118761651914065e-06, "epoch": 2.4159663865546217, "percentage": 80.53, "elapsed_time": "0:24:07", "remaining_time": "0:05:49"} +{"current_steps": 1151, "total_steps": 1428, "loss": 0.6119335889816284, "lr": 1.1110668456973761e-06, "epoch": 2.418067226890756, "percentage": 80.6, "elapsed_time": "0:24:08", "remaining_time": "0:05:48"} +{"current_steps": 1152, "total_steps": 1428, "loss": 0.24830467998981476, "lr": 1.10339528417033e-06, "epoch": 2.4201680672268906, "percentage": 80.67, "elapsed_time": "0:24:09", "remaining_time": "0:05:47"} +{"current_steps": 1153, "total_steps": 1428, "loss": 0.20413950085639954, "lr": 1.0957470131869102e-06, "epoch": 2.422268907563025, "percentage": 80.74, "elapsed_time": "0:24:10", "remaining_time": "0:05:46"} +{"current_steps": 1154, "total_steps": 1428, "loss": 0.7759865522384644, "lr": 1.088122078461884e-06, "epoch": 2.4243697478991595, "percentage": 80.81, "elapsed_time": "0:24:11", "remaining_time": "0:05:44"} +{"current_steps": 1155, "total_steps": 1428, "loss": 0.9713194370269775, "lr": 1.0805205255705403e-06, "epoch": 2.426470588235294, "percentage": 80.88, "elapsed_time": "0:24:12", "remaining_time": "0:05:43"} +{"current_steps": 1156, "total_steps": 1428, "loss": 0.3234805464744568, "lr": 1.0729423999484062e-06, "epoch": 2.4285714285714284, "percentage": 80.95, "elapsed_time": "0:24:14", "remaining_time": "0:05:42"} +{"current_steps": 1157, "total_steps": 1428, "loss": 0.2364063262939453, "lr": 1.0653877468909857e-06, "epoch": 2.4306722689075633, "percentage": 81.02, "elapsed_time": "0:24:15", "remaining_time": "0:05:40"} +{"current_steps": 1158, "total_steps": 1428, "loss": 0.4705219268798828, "lr": 1.0578566115534794e-06, "epoch": 2.4327731092436977, "percentage": 81.09, "elapsed_time": "0:24:16", "remaining_time": "0:05:39"} +{"current_steps": 1159, "total_steps": 1428, "loss": 0.26277682185173035, "lr": 1.0503490389505244e-06, "epoch": 2.434873949579832, "percentage": 81.16, "elapsed_time": "0:24:17", "remaining_time": "0:05:38"} +{"current_steps": 1160, "total_steps": 1428, "loss": 0.13882672786712646, "lr": 1.0428650739559138e-06, "epoch": 2.4369747899159666, "percentage": 81.23, "elapsed_time": "0:24:18", "remaining_time": "0:05:36"} +{"current_steps": 1161, "total_steps": 1428, "loss": 0.5188834071159363, "lr": 1.0354047613023404e-06, "epoch": 2.439075630252101, "percentage": 81.3, "elapsed_time": "0:24:19", "remaining_time": "0:05:35"} +{"current_steps": 1162, "total_steps": 1428, "loss": 0.24887529015541077, "lr": 1.0279681455811219e-06, "epoch": 2.4411764705882355, "percentage": 81.37, "elapsed_time": "0:24:20", "remaining_time": "0:05:34"} +{"current_steps": 1163, "total_steps": 1428, "loss": 0.28220975399017334, "lr": 1.0205552712419343e-06, "epoch": 2.44327731092437, "percentage": 81.44, "elapsed_time": "0:24:21", "remaining_time": "0:05:33"} +{"current_steps": 1164, "total_steps": 1428, "loss": 0.24789491295814514, "lr": 1.013166182592551e-06, "epoch": 2.4453781512605044, "percentage": 81.51, "elapsed_time": "0:24:22", "remaining_time": "0:05:31"} +{"current_steps": 1165, "total_steps": 1428, "loss": 0.7892224788665771, "lr": 1.0058009237985721e-06, "epoch": 2.447478991596639, "percentage": 81.58, "elapsed_time": "0:24:23", "remaining_time": "0:05:30"} +{"current_steps": 1166, "total_steps": 1428, "loss": 0.26245754957199097, "lr": 9.98459538883167e-07, "epoch": 2.4495798319327733, "percentage": 81.65, "elapsed_time": "0:24:24", "remaining_time": "0:05:29"} +{"current_steps": 1167, "total_steps": 1428, "loss": 0.27979156374931335, "lr": 9.911420717268023e-07, "epoch": 2.4516806722689077, "percentage": 81.72, "elapsed_time": "0:24:25", "remaining_time": "0:05:27"} +{"current_steps": 1168, "total_steps": 1428, "loss": 0.7934341430664062, "lr": 9.838485660669906e-07, "epoch": 2.453781512605042, "percentage": 81.79, "elapsed_time": "0:24:26", "remaining_time": "0:05:26"} +{"current_steps": 1169, "total_steps": 1428, "loss": 0.45289355516433716, "lr": 9.765790654980195e-07, "epoch": 2.4558823529411766, "percentage": 81.86, "elapsed_time": "0:24:28", "remaining_time": "0:05:25"} +{"current_steps": 1170, "total_steps": 1428, "loss": 0.992337703704834, "lr": 9.693336134706988e-07, "epoch": 2.457983193277311, "percentage": 81.93, "elapsed_time": "0:24:29", "remaining_time": "0:05:23"} +{"current_steps": 1171, "total_steps": 1428, "loss": 0.29417842626571655, "lr": 9.621122532920908e-07, "epoch": 2.4600840336134455, "percentage": 82.0, "elapsed_time": "0:24:30", "remaining_time": "0:05:22"} +{"current_steps": 1172, "total_steps": 1428, "loss": 0.5845852494239807, "lr": 9.549150281252633e-07, "epoch": 2.46218487394958, "percentage": 82.07, "elapsed_time": "0:24:31", "remaining_time": "0:05:21"} +{"current_steps": 1173, "total_steps": 1428, "loss": 0.22582799196243286, "lr": 9.477419809890215e-07, "epoch": 2.4642857142857144, "percentage": 82.14, "elapsed_time": "0:24:32", "remaining_time": "0:05:20"} +{"current_steps": 1174, "total_steps": 1428, "loss": 0.26232588291168213, "lr": 9.405931547576591e-07, "epoch": 2.466386554621849, "percentage": 82.21, "elapsed_time": "0:24:33", "remaining_time": "0:05:18"} +{"current_steps": 1175, "total_steps": 1428, "loss": 0.9084593057632446, "lr": 9.334685921606946e-07, "epoch": 2.4684873949579833, "percentage": 82.28, "elapsed_time": "0:24:34", "remaining_time": "0:05:17"} +{"current_steps": 1176, "total_steps": 1428, "loss": 0.8386296629905701, "lr": 9.26368335782622e-07, "epoch": 2.4705882352941178, "percentage": 82.35, "elapsed_time": "0:24:35", "remaining_time": "0:05:16"} +{"current_steps": 1177, "total_steps": 1428, "loss": 1.0152020454406738, "lr": 9.192924280626514e-07, "epoch": 2.472689075630252, "percentage": 82.42, "elapsed_time": "0:24:36", "remaining_time": "0:05:14"} +{"current_steps": 1178, "total_steps": 1428, "loss": 0.42396751046180725, "lr": 9.122409112944591e-07, "epoch": 2.4747899159663866, "percentage": 82.49, "elapsed_time": "0:24:37", "remaining_time": "0:05:13"} +{"current_steps": 1179, "total_steps": 1428, "loss": 0.3439130485057831, "lr": 9.052138276259348e-07, "epoch": 2.476890756302521, "percentage": 82.56, "elapsed_time": "0:24:38", "remaining_time": "0:05:12"} +{"current_steps": 1180, "total_steps": 1428, "loss": 0.21849340200424194, "lr": 8.982112190589237e-07, "epoch": 2.4789915966386555, "percentage": 82.63, "elapsed_time": "0:24:39", "remaining_time": "0:05:11"} +{"current_steps": 1181, "total_steps": 1428, "loss": 1.047693133354187, "lr": 8.912331274489855e-07, "epoch": 2.48109243697479, "percentage": 82.7, "elapsed_time": "0:24:40", "remaining_time": "0:05:09"} +{"current_steps": 1182, "total_steps": 1428, "loss": 0.4458342492580414, "lr": 8.842795945051335e-07, "epoch": 2.4831932773109244, "percentage": 82.77, "elapsed_time": "0:24:42", "remaining_time": "0:05:08"} +{"current_steps": 1183, "total_steps": 1428, "loss": 0.26556795835494995, "lr": 8.773506617895944e-07, "epoch": 2.485294117647059, "percentage": 82.84, "elapsed_time": "0:24:43", "remaining_time": "0:05:07"} +{"current_steps": 1184, "total_steps": 1428, "loss": 0.8663069605827332, "lr": 8.704463707175526e-07, "epoch": 2.4873949579831933, "percentage": 82.91, "elapsed_time": "0:24:44", "remaining_time": "0:05:05"} +{"current_steps": 1185, "total_steps": 1428, "loss": 0.7863715291023254, "lr": 8.6356676255691e-07, "epoch": 2.4894957983193278, "percentage": 82.98, "elapsed_time": "0:24:45", "remaining_time": "0:05:04"} +{"current_steps": 1186, "total_steps": 1428, "loss": 0.2747763395309448, "lr": 8.567118784280309e-07, "epoch": 2.491596638655462, "percentage": 83.05, "elapsed_time": "0:24:46", "remaining_time": "0:05:03"} +{"current_steps": 1187, "total_steps": 1428, "loss": 0.22008158266544342, "lr": 8.498817593035053e-07, "epoch": 2.4936974789915967, "percentage": 83.12, "elapsed_time": "0:24:47", "remaining_time": "0:05:02"} +{"current_steps": 1188, "total_steps": 1428, "loss": 0.7790160179138184, "lr": 8.430764460078938e-07, "epoch": 2.495798319327731, "percentage": 83.19, "elapsed_time": "0:24:48", "remaining_time": "0:05:00"} +{"current_steps": 1189, "total_steps": 1428, "loss": 0.3692745864391327, "lr": 8.362959792174941e-07, "epoch": 2.4978991596638656, "percentage": 83.26, "elapsed_time": "0:24:49", "remaining_time": "0:04:59"} +{"current_steps": 1190, "total_steps": 1428, "loss": 0.5012900829315186, "lr": 8.295403994600921e-07, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "0:24:50", "remaining_time": "0:04:58"} +{"current_steps": 1191, "total_steps": 1428, "loss": 0.4049416780471802, "lr": 8.228097471147167e-07, "epoch": 2.5021008403361344, "percentage": 83.4, "elapsed_time": "0:24:51", "remaining_time": "0:04:56"} +{"current_steps": 1192, "total_steps": 1428, "loss": 0.14171475172042847, "lr": 8.161040624114075e-07, "epoch": 2.504201680672269, "percentage": 83.47, "elapsed_time": "0:24:52", "remaining_time": "0:04:55"} +{"current_steps": 1193, "total_steps": 1428, "loss": 0.32759952545166016, "lr": 8.094233854309647e-07, "epoch": 2.5063025210084033, "percentage": 83.54, "elapsed_time": "0:24:53", "remaining_time": "0:04:54"} +{"current_steps": 1194, "total_steps": 1428, "loss": 0.5382500886917114, "lr": 8.027677561047176e-07, "epoch": 2.508403361344538, "percentage": 83.61, "elapsed_time": "0:24:54", "remaining_time": "0:04:52"} +{"current_steps": 1195, "total_steps": 1428, "loss": 0.4815264940261841, "lr": 7.961372142142776e-07, "epoch": 2.5105042016806722, "percentage": 83.68, "elapsed_time": "0:24:56", "remaining_time": "0:04:51"} +{"current_steps": 1196, "total_steps": 1428, "loss": 0.28123000264167786, "lr": 7.89531799391311e-07, "epoch": 2.5126050420168067, "percentage": 83.75, "elapsed_time": "0:24:57", "remaining_time": "0:04:50"} +{"current_steps": 1197, "total_steps": 1428, "loss": 0.5116557478904724, "lr": 7.829515511172897e-07, "epoch": 2.514705882352941, "percentage": 83.82, "elapsed_time": "0:24:58", "remaining_time": "0:04:49"} +{"current_steps": 1198, "total_steps": 1428, "loss": 0.4502016603946686, "lr": 7.763965087232678e-07, "epoch": 2.5168067226890756, "percentage": 83.89, "elapsed_time": "0:24:59", "remaining_time": "0:04:47"} +{"current_steps": 1199, "total_steps": 1428, "loss": 0.34997278451919556, "lr": 7.698667113896346e-07, "epoch": 2.51890756302521, "percentage": 83.96, "elapsed_time": "0:25:00", "remaining_time": "0:04:46"} +{"current_steps": 1200, "total_steps": 1428, "loss": 0.15743517875671387, "lr": 7.633621981458916e-07, "epoch": 2.5210084033613445, "percentage": 84.03, "elapsed_time": "0:25:01", "remaining_time": "0:04:45"} +{"current_steps": 1201, "total_steps": 1428, "loss": 0.4513791799545288, "lr": 7.568830078704092e-07, "epoch": 2.523109243697479, "percentage": 84.1, "elapsed_time": "0:25:02", "remaining_time": "0:04:43"} +{"current_steps": 1202, "total_steps": 1428, "loss": 0.5203551054000854, "lr": 7.504291792902024e-07, "epoch": 2.5252100840336134, "percentage": 84.17, "elapsed_time": "0:25:03", "remaining_time": "0:04:42"} +{"current_steps": 1203, "total_steps": 1428, "loss": 0.5805743932723999, "lr": 7.440007509806946e-07, "epoch": 2.527310924369748, "percentage": 84.24, "elapsed_time": "0:25:04", "remaining_time": "0:04:41"} +{"current_steps": 1204, "total_steps": 1428, "loss": 0.21151217818260193, "lr": 7.375977613654861e-07, "epoch": 2.5294117647058822, "percentage": 84.31, "elapsed_time": "0:25:05", "remaining_time": "0:04:40"} +{"current_steps": 1205, "total_steps": 1428, "loss": 0.4486454725265503, "lr": 7.312202487161318e-07, "epoch": 2.5315126050420167, "percentage": 84.38, "elapsed_time": "0:25:06", "remaining_time": "0:04:38"} +{"current_steps": 1206, "total_steps": 1428, "loss": 0.8350504040718079, "lr": 7.248682511519006e-07, "epoch": 2.533613445378151, "percentage": 84.45, "elapsed_time": "0:25:07", "remaining_time": "0:04:37"} +{"current_steps": 1207, "total_steps": 1428, "loss": 0.37657079100608826, "lr": 7.18541806639561e-07, "epoch": 2.5357142857142856, "percentage": 84.52, "elapsed_time": "0:25:09", "remaining_time": "0:04:36"} +{"current_steps": 1208, "total_steps": 1428, "loss": 0.5544061660766602, "lr": 7.122409529931412e-07, "epoch": 2.53781512605042, "percentage": 84.59, "elapsed_time": "0:25:10", "remaining_time": "0:04:35"} +{"current_steps": 1209, "total_steps": 1428, "loss": 0.8755850791931152, "lr": 7.059657278737136e-07, "epoch": 2.5399159663865545, "percentage": 84.66, "elapsed_time": "0:25:11", "remaining_time": "0:04:33"} +{"current_steps": 1210, "total_steps": 1428, "loss": 0.6084367036819458, "lr": 6.997161687891635e-07, "epoch": 2.542016806722689, "percentage": 84.73, "elapsed_time": "0:25:12", "remaining_time": "0:04:32"} +{"current_steps": 1211, "total_steps": 1428, "loss": 0.3528558015823364, "lr": 6.934923130939692e-07, "epoch": 2.5441176470588234, "percentage": 84.8, "elapsed_time": "0:25:13", "remaining_time": "0:04:31"} +{"current_steps": 1212, "total_steps": 1428, "loss": 0.3760122060775757, "lr": 6.872941979889708e-07, "epoch": 2.546218487394958, "percentage": 84.87, "elapsed_time": "0:25:14", "remaining_time": "0:04:29"} +{"current_steps": 1213, "total_steps": 1428, "loss": 0.3798169195652008, "lr": 6.811218605211606e-07, "epoch": 2.5483193277310923, "percentage": 84.94, "elapsed_time": "0:25:15", "remaining_time": "0:04:28"} +{"current_steps": 1214, "total_steps": 1428, "loss": 0.20516347885131836, "lr": 6.749753375834467e-07, "epoch": 2.5504201680672267, "percentage": 85.01, "elapsed_time": "0:25:16", "remaining_time": "0:04:27"} +{"current_steps": 1215, "total_steps": 1428, "loss": 0.39129936695098877, "lr": 6.688546659144479e-07, "epoch": 2.552521008403361, "percentage": 85.08, "elapsed_time": "0:25:17", "remaining_time": "0:04:26"} +{"current_steps": 1216, "total_steps": 1428, "loss": 0.5815962553024292, "lr": 6.627598820982595e-07, "epoch": 2.5546218487394956, "percentage": 85.15, "elapsed_time": "0:25:18", "remaining_time": "0:04:24"} +{"current_steps": 1217, "total_steps": 1428, "loss": 0.2462518960237503, "lr": 6.566910225642475e-07, "epoch": 2.55672268907563, "percentage": 85.22, "elapsed_time": "0:25:19", "remaining_time": "0:04:23"} +{"current_steps": 1218, "total_steps": 1428, "loss": 0.7295534610748291, "lr": 6.50648123586819e-07, "epoch": 2.5588235294117645, "percentage": 85.29, "elapsed_time": "0:25:20", "remaining_time": "0:04:22"} +{"current_steps": 1219, "total_steps": 1428, "loss": 0.4088057577610016, "lr": 6.446312212852162e-07, "epoch": 2.560924369747899, "percentage": 85.36, "elapsed_time": "0:25:21", "remaining_time": "0:04:20"} +{"current_steps": 1220, "total_steps": 1428, "loss": 0.6498621106147766, "lr": 6.386403516232948e-07, "epoch": 2.5630252100840334, "percentage": 85.43, "elapsed_time": "0:25:23", "remaining_time": "0:04:19"} +{"current_steps": 1221, "total_steps": 1428, "loss": 0.3554389476776123, "lr": 6.326755504093063e-07, "epoch": 2.565126050420168, "percentage": 85.5, "elapsed_time": "0:25:24", "remaining_time": "0:04:18"} +{"current_steps": 1222, "total_steps": 1428, "loss": 1.3259708881378174, "lr": 6.267368532956919e-07, "epoch": 2.5672268907563023, "percentage": 85.57, "elapsed_time": "0:25:25", "remaining_time": "0:04:17"} +{"current_steps": 1223, "total_steps": 1428, "loss": 0.4336357116699219, "lr": 6.208242957788613e-07, "epoch": 2.5693277310924367, "percentage": 85.64, "elapsed_time": "0:25:26", "remaining_time": "0:04:15"} +{"current_steps": 1224, "total_steps": 1428, "loss": 0.6199144124984741, "lr": 6.14937913198988e-07, "epoch": 2.571428571428571, "percentage": 85.71, "elapsed_time": "0:25:27", "remaining_time": "0:04:14"} +{"current_steps": 1225, "total_steps": 1428, "loss": 1.075969934463501, "lr": 6.090777407397902e-07, "epoch": 2.5735294117647056, "percentage": 85.78, "elapsed_time": "0:25:28", "remaining_time": "0:04:13"} +{"current_steps": 1226, "total_steps": 1428, "loss": 0.5996450185775757, "lr": 6.032438134283286e-07, "epoch": 2.57563025210084, "percentage": 85.85, "elapsed_time": "0:25:29", "remaining_time": "0:04:12"} +{"current_steps": 1227, "total_steps": 1428, "loss": 0.37859058380126953, "lr": 5.974361661347889e-07, "epoch": 2.5777310924369745, "percentage": 85.92, "elapsed_time": "0:25:30", "remaining_time": "0:04:10"} +{"current_steps": 1228, "total_steps": 1428, "loss": 0.3595309853553772, "lr": 5.916548335722822e-07, "epoch": 2.5798319327731094, "percentage": 85.99, "elapsed_time": "0:25:31", "remaining_time": "0:04:09"} +{"current_steps": 1229, "total_steps": 1428, "loss": 0.31986016035079956, "lr": 5.858998502966273e-07, "epoch": 2.581932773109244, "percentage": 86.06, "elapsed_time": "0:25:32", "remaining_time": "0:04:08"} +{"current_steps": 1230, "total_steps": 1428, "loss": 0.3975721597671509, "lr": 5.801712507061563e-07, "epoch": 2.5840336134453783, "percentage": 86.13, "elapsed_time": "0:25:33", "remaining_time": "0:04:06"} +{"current_steps": 1231, "total_steps": 1428, "loss": 0.6717185974121094, "lr": 5.74469069041495e-07, "epoch": 2.5861344537815127, "percentage": 86.2, "elapsed_time": "0:25:34", "remaining_time": "0:04:05"} +{"current_steps": 1232, "total_steps": 1428, "loss": 0.6171470880508423, "lr": 5.687933393853718e-07, "epoch": 2.588235294117647, "percentage": 86.27, "elapsed_time": "0:25:35", "remaining_time": "0:04:04"} +{"current_steps": 1233, "total_steps": 1428, "loss": 0.47931092977523804, "lr": 5.631440956624057e-07, "epoch": 2.5903361344537816, "percentage": 86.34, "elapsed_time": "0:25:37", "remaining_time": "0:04:03"} +{"current_steps": 1234, "total_steps": 1428, "loss": 0.44013679027557373, "lr": 5.575213716389039e-07, "epoch": 2.592436974789916, "percentage": 86.41, "elapsed_time": "0:25:38", "remaining_time": "0:04:01"} +{"current_steps": 1235, "total_steps": 1428, "loss": 0.515785276889801, "lr": 5.519252009226639e-07, "epoch": 2.5945378151260505, "percentage": 86.48, "elapsed_time": "0:25:39", "remaining_time": "0:04:00"} +{"current_steps": 1236, "total_steps": 1428, "loss": 0.3664918541908264, "lr": 5.463556169627687e-07, "epoch": 2.596638655462185, "percentage": 86.55, "elapsed_time": "0:25:40", "remaining_time": "0:03:59"} +{"current_steps": 1237, "total_steps": 1428, "loss": 0.3711666762828827, "lr": 5.408126530493918e-07, "epoch": 2.5987394957983194, "percentage": 86.62, "elapsed_time": "0:25:41", "remaining_time": "0:03:57"} +{"current_steps": 1238, "total_steps": 1428, "loss": 0.12698325514793396, "lr": 5.352963423135893e-07, "epoch": 2.600840336134454, "percentage": 86.69, "elapsed_time": "0:25:42", "remaining_time": "0:03:56"} +{"current_steps": 1239, "total_steps": 1428, "loss": 0.3730424642562866, "lr": 5.298067177271144e-07, "epoch": 2.6029411764705883, "percentage": 86.76, "elapsed_time": "0:25:43", "remaining_time": "0:03:55"} +{"current_steps": 1240, "total_steps": 1428, "loss": 0.6243601441383362, "lr": 5.243438121022077e-07, "epoch": 2.6050420168067228, "percentage": 86.83, "elapsed_time": "0:25:44", "remaining_time": "0:03:54"} +{"current_steps": 1241, "total_steps": 1428, "loss": 0.18001016974449158, "lr": 5.18907658091411e-07, "epoch": 2.607142857142857, "percentage": 86.9, "elapsed_time": "0:25:45", "remaining_time": "0:03:52"} +{"current_steps": 1242, "total_steps": 1428, "loss": 0.6635949611663818, "lr": 5.134982881873646e-07, "epoch": 2.6092436974789917, "percentage": 86.97, "elapsed_time": "0:25:46", "remaining_time": "0:03:51"} +{"current_steps": 1243, "total_steps": 1428, "loss": 0.4666215777397156, "lr": 5.081157347226201e-07, "epoch": 2.611344537815126, "percentage": 87.04, "elapsed_time": "0:25:47", "remaining_time": "0:03:50"} +{"current_steps": 1244, "total_steps": 1428, "loss": 0.1682681143283844, "lr": 5.027600298694397e-07, "epoch": 2.6134453781512605, "percentage": 87.11, "elapsed_time": "0:25:48", "remaining_time": "0:03:49"} +{"current_steps": 1245, "total_steps": 1428, "loss": 0.5077744722366333, "lr": 4.974312056396113e-07, "epoch": 2.615546218487395, "percentage": 87.18, "elapsed_time": "0:25:49", "remaining_time": "0:03:47"} +{"current_steps": 1246, "total_steps": 1428, "loss": 0.44359397888183594, "lr": 4.92129293884252e-07, "epoch": 2.6176470588235294, "percentage": 87.25, "elapsed_time": "0:25:51", "remaining_time": "0:03:46"} +{"current_steps": 1247, "total_steps": 1428, "loss": 1.2246967554092407, "lr": 4.868543262936176e-07, "epoch": 2.619747899159664, "percentage": 87.32, "elapsed_time": "0:25:52", "remaining_time": "0:03:45"} +{"current_steps": 1248, "total_steps": 1428, "loss": 0.32194000482559204, "lr": 4.816063343969196e-07, "epoch": 2.6218487394957983, "percentage": 87.39, "elapsed_time": "0:25:53", "remaining_time": "0:03:44"} +{"current_steps": 1249, "total_steps": 1428, "loss": 0.5496278405189514, "lr": 4.763853495621251e-07, "epoch": 2.6239495798319328, "percentage": 87.46, "elapsed_time": "0:25:54", "remaining_time": "0:03:42"} +{"current_steps": 1250, "total_steps": 1428, "loss": 0.21257492899894714, "lr": 4.7119140299578424e-07, "epoch": 2.6260504201680672, "percentage": 87.54, "elapsed_time": "0:25:55", "remaining_time": "0:03:41"} +{"current_steps": 1251, "total_steps": 1428, "loss": 0.3104386329650879, "lr": 4.660245257428297e-07, "epoch": 2.6281512605042017, "percentage": 87.61, "elapsed_time": "0:25:56", "remaining_time": "0:03:40"} +{"current_steps": 1252, "total_steps": 1428, "loss": 0.8334522843360901, "lr": 4.6088474868640045e-07, "epoch": 2.630252100840336, "percentage": 87.68, "elapsed_time": "0:25:57", "remaining_time": "0:03:38"} +{"current_steps": 1253, "total_steps": 1428, "loss": 0.29882583022117615, "lr": 4.557721025476508e-07, "epoch": 2.6323529411764706, "percentage": 87.75, "elapsed_time": "0:25:58", "remaining_time": "0:03:37"} +{"current_steps": 1254, "total_steps": 1428, "loss": 0.3209346830844879, "lr": 4.5068661788557345e-07, "epoch": 2.634453781512605, "percentage": 87.82, "elapsed_time": "0:25:59", "remaining_time": "0:03:36"} +{"current_steps": 1255, "total_steps": 1428, "loss": 0.15333116054534912, "lr": 4.4562832509680963e-07, "epoch": 2.6365546218487395, "percentage": 87.89, "elapsed_time": "0:26:00", "remaining_time": "0:03:35"} +{"current_steps": 1256, "total_steps": 1428, "loss": 0.48582714796066284, "lr": 4.4059725441547464e-07, "epoch": 2.638655462184874, "percentage": 87.96, "elapsed_time": "0:26:01", "remaining_time": "0:03:33"} +{"current_steps": 1257, "total_steps": 1428, "loss": 0.4873425364494324, "lr": 4.355934359129699e-07, "epoch": 2.6407563025210083, "percentage": 88.03, "elapsed_time": "0:26:02", "remaining_time": "0:03:32"} +{"current_steps": 1258, "total_steps": 1428, "loss": 0.2611161768436432, "lr": 4.3061689949780995e-07, "epoch": 2.642857142857143, "percentage": 88.1, "elapsed_time": "0:26:03", "remaining_time": "0:03:31"} +{"current_steps": 1259, "total_steps": 1428, "loss": 0.27621158957481384, "lr": 4.2566767491543706e-07, "epoch": 2.6449579831932772, "percentage": 88.17, "elapsed_time": "0:26:05", "remaining_time": "0:03:30"} +{"current_steps": 1260, "total_steps": 1428, "loss": 0.849486231803894, "lr": 4.2074579174805173e-07, "epoch": 2.6470588235294117, "percentage": 88.24, "elapsed_time": "0:26:06", "remaining_time": "0:03:28"} +{"current_steps": 1261, "total_steps": 1428, "loss": 0.7652707099914551, "lr": 4.1585127941442536e-07, "epoch": 2.649159663865546, "percentage": 88.31, "elapsed_time": "0:26:07", "remaining_time": "0:03:27"} +{"current_steps": 1262, "total_steps": 1428, "loss": 0.27856025099754333, "lr": 4.1098416716973457e-07, "epoch": 2.6512605042016806, "percentage": 88.38, "elapsed_time": "0:26:08", "remaining_time": "0:03:26"} +{"current_steps": 1263, "total_steps": 1428, "loss": 0.3749684691429138, "lr": 4.0614448410538077e-07, "epoch": 2.653361344537815, "percentage": 88.45, "elapsed_time": "0:26:09", "remaining_time": "0:03:25"} +{"current_steps": 1264, "total_steps": 1428, "loss": 0.6064971685409546, "lr": 4.01332259148815e-07, "epoch": 2.6554621848739495, "percentage": 88.52, "elapsed_time": "0:26:10", "remaining_time": "0:03:23"} +{"current_steps": 1265, "total_steps": 1428, "loss": 0.31089282035827637, "lr": 3.965475210633718e-07, "epoch": 2.657563025210084, "percentage": 88.59, "elapsed_time": "0:26:11", "remaining_time": "0:03:22"} +{"current_steps": 1266, "total_steps": 1428, "loss": 0.3686492443084717, "lr": 3.917902984480881e-07, "epoch": 2.6596638655462184, "percentage": 88.66, "elapsed_time": "0:26:12", "remaining_time": "0:03:21"} +{"current_steps": 1267, "total_steps": 1428, "loss": 0.5900052785873413, "lr": 3.870606197375415e-07, "epoch": 2.661764705882353, "percentage": 88.73, "elapsed_time": "0:26:13", "remaining_time": "0:03:19"} +{"current_steps": 1268, "total_steps": 1428, "loss": 0.23156413435935974, "lr": 3.823585132016711e-07, "epoch": 2.6638655462184873, "percentage": 88.8, "elapsed_time": "0:26:14", "remaining_time": "0:03:18"} +{"current_steps": 1269, "total_steps": 1428, "loss": 1.1965575218200684, "lr": 3.776840069456189e-07, "epoch": 2.6659663865546217, "percentage": 88.87, "elapsed_time": "0:26:15", "remaining_time": "0:03:17"} +{"current_steps": 1270, "total_steps": 1428, "loss": 0.5137308835983276, "lr": 3.730371289095508e-07, "epoch": 2.668067226890756, "percentage": 88.94, "elapsed_time": "0:26:16", "remaining_time": "0:03:16"} +{"current_steps": 1271, "total_steps": 1428, "loss": 0.2563337981700897, "lr": 3.6841790686849897e-07, "epoch": 2.6701680672268906, "percentage": 89.01, "elapsed_time": "0:26:17", "remaining_time": "0:03:14"} +{"current_steps": 1272, "total_steps": 1428, "loss": 0.5659809708595276, "lr": 3.6382636843218967e-07, "epoch": 2.6722689075630255, "percentage": 89.08, "elapsed_time": "0:26:19", "remaining_time": "0:03:13"} +{"current_steps": 1273, "total_steps": 1428, "loss": 0.4689119756221771, "lr": 3.592625410448813e-07, "epoch": 2.67436974789916, "percentage": 89.15, "elapsed_time": "0:26:20", "remaining_time": "0:03:12"} +{"current_steps": 1274, "total_steps": 1428, "loss": 0.623033881187439, "lr": 3.5472645198520064e-07, "epoch": 2.6764705882352944, "percentage": 89.22, "elapsed_time": "0:26:21", "remaining_time": "0:03:11"} +{"current_steps": 1275, "total_steps": 1428, "loss": 0.5805165767669678, "lr": 3.502181283659756e-07, "epoch": 2.678571428571429, "percentage": 89.29, "elapsed_time": "0:26:22", "remaining_time": "0:03:09"} +{"current_steps": 1276, "total_steps": 1428, "loss": 0.5375624299049377, "lr": 3.4573759713407927e-07, "epoch": 2.6806722689075633, "percentage": 89.36, "elapsed_time": "0:26:23", "remaining_time": "0:03:08"} +{"current_steps": 1277, "total_steps": 1428, "loss": 0.3185434341430664, "lr": 3.4128488507026327e-07, "epoch": 2.6827731092436977, "percentage": 89.43, "elapsed_time": "0:26:24", "remaining_time": "0:03:07"} +{"current_steps": 1278, "total_steps": 1428, "loss": 2.561387538909912, "lr": 3.3686001878900365e-07, "epoch": 2.684873949579832, "percentage": 89.5, "elapsed_time": "0:26:25", "remaining_time": "0:03:06"} +{"current_steps": 1279, "total_steps": 1428, "loss": 0.5536858439445496, "lr": 3.324630247383337e-07, "epoch": 2.6869747899159666, "percentage": 89.57, "elapsed_time": "0:26:26", "remaining_time": "0:03:04"} +{"current_steps": 1280, "total_steps": 1428, "loss": 0.18657177686691284, "lr": 3.2809392919969483e-07, "epoch": 2.689075630252101, "percentage": 89.64, "elapsed_time": "0:26:27", "remaining_time": "0:03:03"} +{"current_steps": 1281, "total_steps": 1428, "loss": 0.9441865086555481, "lr": 3.2375275828777253e-07, "epoch": 2.6911764705882355, "percentage": 89.71, "elapsed_time": "0:26:28", "remaining_time": "0:03:02"} +{"current_steps": 1282, "total_steps": 1428, "loss": 0.5320143103599548, "lr": 3.194395379503451e-07, "epoch": 2.69327731092437, "percentage": 89.78, "elapsed_time": "0:26:29", "remaining_time": "0:03:01"} +{"current_steps": 1283, "total_steps": 1428, "loss": 0.5943700075149536, "lr": 3.151542939681235e-07, "epoch": 2.6953781512605044, "percentage": 89.85, "elapsed_time": "0:26:30", "remaining_time": "0:02:59"} +{"current_steps": 1284, "total_steps": 1428, "loss": 1.0508530139923096, "lr": 3.108970519546034e-07, "epoch": 2.697478991596639, "percentage": 89.92, "elapsed_time": "0:26:32", "remaining_time": "0:02:58"} +{"current_steps": 1285, "total_steps": 1428, "loss": 0.3096291124820709, "lr": 3.066678373559062e-07, "epoch": 2.6995798319327733, "percentage": 89.99, "elapsed_time": "0:26:33", "remaining_time": "0:02:57"} +{"current_steps": 1286, "total_steps": 1428, "loss": 1.133009910583496, "lr": 3.0246667545063057e-07, "epoch": 2.7016806722689077, "percentage": 90.06, "elapsed_time": "0:26:34", "remaining_time": "0:02:56"} +{"current_steps": 1287, "total_steps": 1428, "loss": 0.3362637162208557, "lr": 2.9829359134970206e-07, "epoch": 2.703781512605042, "percentage": 90.13, "elapsed_time": "0:26:35", "remaining_time": "0:02:54"} +{"current_steps": 1288, "total_steps": 1428, "loss": 0.9418044090270996, "lr": 2.9414860999621764e-07, "epoch": 2.7058823529411766, "percentage": 90.2, "elapsed_time": "0:26:36", "remaining_time": "0:02:53"} +{"current_steps": 1289, "total_steps": 1428, "loss": 0.2674849033355713, "lr": 2.9003175616530264e-07, "epoch": 2.707983193277311, "percentage": 90.27, "elapsed_time": "0:26:37", "remaining_time": "0:02:52"} +{"current_steps": 1290, "total_steps": 1428, "loss": 0.39476725459098816, "lr": 2.8594305446396245e-07, "epoch": 2.7100840336134455, "percentage": 90.34, "elapsed_time": "0:26:38", "remaining_time": "0:02:51"} +{"current_steps": 1291, "total_steps": 1428, "loss": 0.5461002588272095, "lr": 2.818825293309274e-07, "epoch": 2.71218487394958, "percentage": 90.41, "elapsed_time": "0:26:39", "remaining_time": "0:02:49"} +{"current_steps": 1292, "total_steps": 1428, "loss": 0.36206185817718506, "lr": 2.7785020503651783e-07, "epoch": 2.7142857142857144, "percentage": 90.48, "elapsed_time": "0:26:40", "remaining_time": "0:02:48"} +{"current_steps": 1293, "total_steps": 1428, "loss": 0.33151179552078247, "lr": 2.7384610568249313e-07, "epoch": 2.716386554621849, "percentage": 90.55, "elapsed_time": "0:26:41", "remaining_time": "0:02:47"} +{"current_steps": 1294, "total_steps": 1428, "loss": 0.3465487062931061, "lr": 2.698702552019045e-07, "epoch": 2.7184873949579833, "percentage": 90.62, "elapsed_time": "0:26:42", "remaining_time": "0:02:45"} +{"current_steps": 1295, "total_steps": 1428, "loss": 0.22317005693912506, "lr": 2.659226773589607e-07, "epoch": 2.7205882352941178, "percentage": 90.69, "elapsed_time": "0:26:43", "remaining_time": "0:02:44"} +{"current_steps": 1296, "total_steps": 1428, "loss": 0.34791454672813416, "lr": 2.620033957488777e-07, "epoch": 2.722689075630252, "percentage": 90.76, "elapsed_time": "0:26:44", "remaining_time": "0:02:43"} +{"current_steps": 1297, "total_steps": 1428, "loss": 0.4211697578430176, "lr": 2.581124337977425e-07, "epoch": 2.7247899159663866, "percentage": 90.83, "elapsed_time": "0:26:46", "remaining_time": "0:02:42"} +{"current_steps": 1298, "total_steps": 1428, "loss": 0.4095291495323181, "lr": 2.542498147623701e-07, "epoch": 2.726890756302521, "percentage": 90.9, "elapsed_time": "0:26:47", "remaining_time": "0:02:40"} +{"current_steps": 1299, "total_steps": 1428, "loss": 0.2518484592437744, "lr": 2.50415561730169e-07, "epoch": 2.7289915966386555, "percentage": 90.97, "elapsed_time": "0:26:48", "remaining_time": "0:02:39"} +{"current_steps": 1300, "total_steps": 1428, "loss": 0.21484610438346863, "lr": 2.4660969761899576e-07, "epoch": 2.73109243697479, "percentage": 91.04, "elapsed_time": "0:26:49", "remaining_time": "0:02:38"} +{"current_steps": 1301, "total_steps": 1428, "loss": 0.39412614703178406, "lr": 2.428322451770276e-07, "epoch": 2.7331932773109244, "percentage": 91.11, "elapsed_time": "0:26:50", "remaining_time": "0:02:37"} +{"current_steps": 1302, "total_steps": 1428, "loss": 0.34464430809020996, "lr": 2.3908322698261597e-07, "epoch": 2.735294117647059, "percentage": 91.18, "elapsed_time": "0:26:51", "remaining_time": "0:02:35"} +{"current_steps": 1303, "total_steps": 1428, "loss": 0.5757449865341187, "lr": 2.3536266544416043e-07, "epoch": 2.7373949579831933, "percentage": 91.25, "elapsed_time": "0:26:52", "remaining_time": "0:02:34"} +{"current_steps": 1304, "total_steps": 1428, "loss": 0.7968210577964783, "lr": 2.3167058279997156e-07, "epoch": 2.7394957983193278, "percentage": 91.32, "elapsed_time": "0:26:53", "remaining_time": "0:02:33"} +{"current_steps": 1305, "total_steps": 1428, "loss": 0.40927547216415405, "lr": 2.2800700111813456e-07, "epoch": 2.741596638655462, "percentage": 91.39, "elapsed_time": "0:26:54", "remaining_time": "0:02:32"} +{"current_steps": 1306, "total_steps": 1428, "loss": 0.23368996381759644, "lr": 2.2437194229638415e-07, "epoch": 2.7436974789915967, "percentage": 91.46, "elapsed_time": "0:26:55", "remaining_time": "0:02:30"} +{"current_steps": 1307, "total_steps": 1428, "loss": 0.7368482351303101, "lr": 2.2076542806196588e-07, "epoch": 2.745798319327731, "percentage": 91.53, "elapsed_time": "0:26:56", "remaining_time": "0:02:29"} +{"current_steps": 1308, "total_steps": 1428, "loss": 0.29558128118515015, "lr": 2.17187479971514e-07, "epoch": 2.7478991596638656, "percentage": 91.6, "elapsed_time": "0:26:57", "remaining_time": "0:02:28"} +{"current_steps": 1309, "total_steps": 1428, "loss": 0.2764503061771393, "lr": 2.136381194109166e-07, "epoch": 2.75, "percentage": 91.67, "elapsed_time": "0:26:58", "remaining_time": "0:02:27"} +{"current_steps": 1310, "total_steps": 1428, "loss": 0.3793492615222931, "lr": 2.1011736759519286e-07, "epoch": 2.7521008403361344, "percentage": 91.74, "elapsed_time": "0:27:00", "remaining_time": "0:02:25"} +{"current_steps": 1311, "total_steps": 1428, "loss": 0.5927262902259827, "lr": 2.0662524556835982e-07, "epoch": 2.754201680672269, "percentage": 91.81, "elapsed_time": "0:27:01", "remaining_time": "0:02:24"} +{"current_steps": 1312, "total_steps": 1428, "loss": 0.4284164607524872, "lr": 2.0316177420331375e-07, "epoch": 2.7563025210084033, "percentage": 91.88, "elapsed_time": "0:27:02", "remaining_time": "0:02:23"} +{"current_steps": 1313, "total_steps": 1428, "loss": 0.4722291827201843, "lr": 1.997269742016994e-07, "epoch": 2.758403361344538, "percentage": 91.95, "elapsed_time": "0:27:03", "remaining_time": "0:02:22"} +{"current_steps": 1314, "total_steps": 1428, "loss": 0.6627257466316223, "lr": 1.9632086609379041e-07, "epoch": 2.7605042016806722, "percentage": 92.02, "elapsed_time": "0:27:04", "remaining_time": "0:02:20"} +{"current_steps": 1315, "total_steps": 1428, "loss": 0.42083340883255005, "lr": 1.929434702383648e-07, "epoch": 2.7626050420168067, "percentage": 92.09, "elapsed_time": "0:27:05", "remaining_time": "0:02:19"} +{"current_steps": 1316, "total_steps": 1428, "loss": 0.39910781383514404, "lr": 1.895948068225828e-07, "epoch": 2.764705882352941, "percentage": 92.16, "elapsed_time": "0:27:06", "remaining_time": "0:02:18"} +{"current_steps": 1317, "total_steps": 1428, "loss": 0.2765321731567383, "lr": 1.862748958618682e-07, "epoch": 2.7668067226890756, "percentage": 92.23, "elapsed_time": "0:27:07", "remaining_time": "0:02:17"} +{"current_steps": 1318, "total_steps": 1428, "loss": 0.08827929198741913, "lr": 1.8298375719978501e-07, "epoch": 2.76890756302521, "percentage": 92.3, "elapsed_time": "0:27:08", "remaining_time": "0:02:15"} +{"current_steps": 1319, "total_steps": 1428, "loss": 0.5753570795059204, "lr": 1.797214105079248e-07, "epoch": 2.7710084033613445, "percentage": 92.37, "elapsed_time": "0:27:09", "remaining_time": "0:02:14"} +{"current_steps": 1320, "total_steps": 1428, "loss": 0.7518602013587952, "lr": 1.7648787528578127e-07, "epoch": 2.773109243697479, "percentage": 92.44, "elapsed_time": "0:27:10", "remaining_time": "0:02:13"} +{"current_steps": 1321, "total_steps": 1428, "loss": 0.6446128487586975, "lr": 1.732831708606425e-07, "epoch": 2.7752100840336134, "percentage": 92.51, "elapsed_time": "0:27:11", "remaining_time": "0:02:12"} +{"current_steps": 1322, "total_steps": 1428, "loss": 0.4714201092720032, "lr": 1.7010731638746668e-07, "epoch": 2.777310924369748, "percentage": 92.58, "elapsed_time": "0:27:13", "remaining_time": "0:02:10"} +{"current_steps": 1323, "total_steps": 1428, "loss": 0.23203890025615692, "lr": 1.669603308487755e-07, "epoch": 2.7794117647058822, "percentage": 92.65, "elapsed_time": "0:27:14", "remaining_time": "0:02:09"} +{"current_steps": 1324, "total_steps": 1428, "loss": 0.5102007389068604, "lr": 1.6384223305453417e-07, "epoch": 2.7815126050420167, "percentage": 92.72, "elapsed_time": "0:27:15", "remaining_time": "0:02:08"} +{"current_steps": 1325, "total_steps": 1428, "loss": 0.45608770847320557, "lr": 1.6075304164204385e-07, "epoch": 2.783613445378151, "percentage": 92.79, "elapsed_time": "0:27:16", "remaining_time": "0:02:07"} +{"current_steps": 1326, "total_steps": 1428, "loss": 0.5190253257751465, "lr": 1.5769277507582725e-07, "epoch": 2.7857142857142856, "percentage": 92.86, "elapsed_time": "0:27:17", "remaining_time": "0:02:05"} +{"current_steps": 1327, "total_steps": 1428, "loss": 0.5670579075813293, "lr": 1.5466145164751977e-07, "epoch": 2.78781512605042, "percentage": 92.93, "elapsed_time": "0:27:18", "remaining_time": "0:02:04"} +{"current_steps": 1328, "total_steps": 1428, "loss": 0.4676046073436737, "lr": 1.5165908947575914e-07, "epoch": 2.7899159663865545, "percentage": 93.0, "elapsed_time": "0:27:19", "remaining_time": "0:02:03"} +{"current_steps": 1329, "total_steps": 1428, "loss": 0.2914016544818878, "lr": 1.4868570650607816e-07, "epoch": 2.792016806722689, "percentage": 93.07, "elapsed_time": "0:27:20", "remaining_time": "0:02:02"} +{"current_steps": 1330, "total_steps": 1428, "loss": 1.312021017074585, "lr": 1.4574132051079658e-07, "epoch": 2.7941176470588234, "percentage": 93.14, "elapsed_time": "0:27:21", "remaining_time": "0:02:00"} +{"current_steps": 1331, "total_steps": 1428, "loss": 0.3117330074310303, "lr": 1.4282594908891666e-07, "epoch": 2.796218487394958, "percentage": 93.21, "elapsed_time": "0:27:22", "remaining_time": "0:01:59"} +{"current_steps": 1332, "total_steps": 1428, "loss": 0.2705899775028229, "lr": 1.3993960966601328e-07, "epoch": 2.7983193277310923, "percentage": 93.28, "elapsed_time": "0:27:23", "remaining_time": "0:01:58"} +{"current_steps": 1333, "total_steps": 1428, "loss": 0.2621600031852722, "lr": 1.3708231949413676e-07, "epoch": 2.8004201680672267, "percentage": 93.35, "elapsed_time": "0:27:24", "remaining_time": "0:01:57"} +{"current_steps": 1334, "total_steps": 1428, "loss": 0.40849626064300537, "lr": 1.342540956517041e-07, "epoch": 2.802521008403361, "percentage": 93.42, "elapsed_time": "0:27:25", "remaining_time": "0:01:55"} +{"current_steps": 1335, "total_steps": 1428, "loss": 0.2958400845527649, "lr": 1.3145495504339856e-07, "epoch": 2.8046218487394956, "percentage": 93.49, "elapsed_time": "0:27:27", "remaining_time": "0:01:54"} +{"current_steps": 1336, "total_steps": 1428, "loss": 0.7148715257644653, "lr": 1.2868491440007015e-07, "epoch": 2.80672268907563, "percentage": 93.56, "elapsed_time": "0:27:28", "remaining_time": "0:01:53"} +{"current_steps": 1337, "total_steps": 1428, "loss": 0.5344212055206299, "lr": 1.2594399027863302e-07, "epoch": 2.8088235294117645, "percentage": 93.63, "elapsed_time": "0:27:29", "remaining_time": "0:01:52"} +{"current_steps": 1338, "total_steps": 1428, "loss": 0.3390062749385834, "lr": 1.232321990619695e-07, "epoch": 2.810924369747899, "percentage": 93.7, "elapsed_time": "0:27:30", "remaining_time": "0:01:51"} +{"current_steps": 1339, "total_steps": 1428, "loss": 0.6602462530136108, "lr": 1.205495569588283e-07, "epoch": 2.8130252100840334, "percentage": 93.77, "elapsed_time": "0:27:31", "remaining_time": "0:01:49"} +{"current_steps": 1340, "total_steps": 1428, "loss": 0.2165951430797577, "lr": 1.1789608000373209e-07, "epoch": 2.815126050420168, "percentage": 93.84, "elapsed_time": "0:27:32", "remaining_time": "0:01:48"} +{"current_steps": 1341, "total_steps": 1428, "loss": 0.33785703778266907, "lr": 1.1527178405687845e-07, "epoch": 2.8172268907563023, "percentage": 93.91, "elapsed_time": "0:27:33", "remaining_time": "0:01:47"} +{"current_steps": 1342, "total_steps": 1428, "loss": 0.49403730034828186, "lr": 1.1267668480404559e-07, "epoch": 2.8193277310924367, "percentage": 93.98, "elapsed_time": "0:27:34", "remaining_time": "0:01:46"} +{"current_steps": 1343, "total_steps": 1428, "loss": 0.5875406265258789, "lr": 1.1011079775649969e-07, "epoch": 2.821428571428571, "percentage": 94.05, "elapsed_time": "0:27:35", "remaining_time": "0:01:44"} +{"current_steps": 1344, "total_steps": 1428, "loss": 0.4375740885734558, "lr": 1.0757413825090212e-07, "epoch": 2.8235294117647056, "percentage": 94.12, "elapsed_time": "0:27:36", "remaining_time": "0:01:43"} +{"current_steps": 1345, "total_steps": 1428, "loss": 0.6797425746917725, "lr": 1.0506672144921515e-07, "epoch": 2.82563025210084, "percentage": 94.19, "elapsed_time": "0:27:37", "remaining_time": "0:01:42"} +{"current_steps": 1346, "total_steps": 1428, "loss": 0.36085596680641174, "lr": 1.0258856233861524e-07, "epoch": 2.8277310924369745, "percentage": 94.26, "elapsed_time": "0:27:38", "remaining_time": "0:01:41"} +{"current_steps": 1347, "total_steps": 1428, "loss": 0.43387356400489807, "lr": 1.0013967573140216e-07, "epoch": 2.8298319327731094, "percentage": 94.33, "elapsed_time": "0:27:39", "remaining_time": "0:01:39"} +{"current_steps": 1348, "total_steps": 1428, "loss": 0.44897180795669556, "lr": 9.77200762649072e-08, "epoch": 2.831932773109244, "percentage": 94.4, "elapsed_time": "0:27:41", "remaining_time": "0:01:38"} +{"current_steps": 1349, "total_steps": 1428, "loss": 0.22422294318675995, "lr": 9.532977840141123e-08, "epoch": 2.8340336134453783, "percentage": 94.47, "elapsed_time": "0:27:42", "remaining_time": "0:01:37"} +{"current_steps": 1350, "total_steps": 1428, "loss": 0.642038106918335, "lr": 9.29687964280529e-08, "epoch": 2.8361344537815127, "percentage": 94.54, "elapsed_time": "0:27:43", "remaining_time": "0:01:36"} +{"current_steps": 1351, "total_steps": 1428, "loss": 0.8069763779640198, "lr": 9.063714445674776e-08, "epoch": 2.838235294117647, "percentage": 94.61, "elapsed_time": "0:27:44", "remaining_time": "0:01:34"} +{"current_steps": 1352, "total_steps": 1428, "loss": 0.36828362941741943, "lr": 8.833483642410101e-08, "epoch": 2.8403361344537816, "percentage": 94.68, "elapsed_time": "0:27:45", "remaining_time": "0:01:33"} +{"current_steps": 1353, "total_steps": 1428, "loss": 0.3019287586212158, "lr": 8.606188609132593e-08, "epoch": 2.842436974789916, "percentage": 94.75, "elapsed_time": "0:27:46", "remaining_time": "0:01:32"} +{"current_steps": 1354, "total_steps": 1428, "loss": 0.8440870046615601, "lr": 8.381830704415839e-08, "epoch": 2.8445378151260505, "percentage": 94.82, "elapsed_time": "0:27:47", "remaining_time": "0:01:31"} +{"current_steps": 1355, "total_steps": 1428, "loss": 2.0406436920166016, "lr": 8.160411269278079e-08, "epoch": 2.846638655462185, "percentage": 94.89, "elapsed_time": "0:27:48", "remaining_time": "0:01:29"} +{"current_steps": 1356, "total_steps": 1428, "loss": 0.23328936100006104, "lr": 7.941931627173827e-08, "epoch": 2.8487394957983194, "percentage": 94.96, "elapsed_time": "0:27:49", "remaining_time": "0:01:28"} +{"current_steps": 1357, "total_steps": 1428, "loss": 0.552147626876831, "lr": 7.726393083985929e-08, "epoch": 2.850840336134454, "percentage": 95.03, "elapsed_time": "0:27:50", "remaining_time": "0:01:27"} +{"current_steps": 1358, "total_steps": 1428, "loss": 0.38458627462387085, "lr": 7.513796928018069e-08, "epoch": 2.8529411764705883, "percentage": 95.1, "elapsed_time": "0:27:51", "remaining_time": "0:01:26"} +{"current_steps": 1359, "total_steps": 1428, "loss": 0.3594217300415039, "lr": 7.30414442998667e-08, "epoch": 2.8550420168067228, "percentage": 95.17, "elapsed_time": "0:27:52", "remaining_time": "0:01:24"} +{"current_steps": 1360, "total_steps": 1428, "loss": 0.5628789067268372, "lr": 7.097436843013783e-08, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "0:27:53", "remaining_time": "0:01:23"} +{"current_steps": 1361, "total_steps": 1428, "loss": 0.7206631898880005, "lr": 6.893675402618982e-08, "epoch": 2.8592436974789917, "percentage": 95.31, "elapsed_time": "0:27:55", "remaining_time": "0:01:22"} +{"current_steps": 1362, "total_steps": 1428, "loss": 0.8038681745529175, "lr": 6.692861326712652e-08, "epoch": 2.861344537815126, "percentage": 95.38, "elapsed_time": "0:27:56", "remaining_time": "0:01:21"} +{"current_steps": 1363, "total_steps": 1428, "loss": 0.7214268445968628, "lr": 6.494995815588101e-08, "epoch": 2.8634453781512605, "percentage": 95.45, "elapsed_time": "0:27:57", "remaining_time": "0:01:19"} +{"current_steps": 1364, "total_steps": 1428, "loss": 0.3757812976837158, "lr": 6.300080051914792e-08, "epoch": 2.865546218487395, "percentage": 95.52, "elapsed_time": "0:27:58", "remaining_time": "0:01:18"} +{"current_steps": 1365, "total_steps": 1428, "loss": 0.7154731154441833, "lr": 6.108115200731069e-08, "epoch": 2.8676470588235294, "percentage": 95.59, "elapsed_time": "0:27:59", "remaining_time": "0:01:17"} +{"current_steps": 1366, "total_steps": 1428, "loss": 0.6805951595306396, "lr": 5.9191024094374384e-08, "epoch": 2.869747899159664, "percentage": 95.66, "elapsed_time": "0:28:00", "remaining_time": "0:01:16"} +{"current_steps": 1367, "total_steps": 1428, "loss": 0.41078895330429077, "lr": 5.7330428077893575e-08, "epoch": 2.8718487394957983, "percentage": 95.73, "elapsed_time": "0:28:01", "remaining_time": "0:01:15"} +{"current_steps": 1368, "total_steps": 1428, "loss": 0.35648801922798157, "lr": 5.5499375078906793e-08, "epoch": 2.8739495798319328, "percentage": 95.8, "elapsed_time": "0:28:02", "remaining_time": "0:01:13"} +{"current_steps": 1369, "total_steps": 1428, "loss": 0.3897348642349243, "lr": 5.369787604186993e-08, "epoch": 2.8760504201680672, "percentage": 95.87, "elapsed_time": "0:28:03", "remaining_time": "0:01:12"} +{"current_steps": 1370, "total_steps": 1428, "loss": 0.613540530204773, "lr": 5.192594173459242e-08, "epoch": 2.8781512605042017, "percentage": 95.94, "elapsed_time": "0:28:04", "remaining_time": "0:01:11"} +{"current_steps": 1371, "total_steps": 1428, "loss": 0.4445531964302063, "lr": 5.018358274816892e-08, "epoch": 2.880252100840336, "percentage": 96.01, "elapsed_time": "0:28:05", "remaining_time": "0:01:10"} +{"current_steps": 1372, "total_steps": 1428, "loss": 0.5488522052764893, "lr": 4.847080949691996e-08, "epoch": 2.8823529411764706, "percentage": 96.08, "elapsed_time": "0:28:06", "remaining_time": "0:01:08"} +{"current_steps": 1373, "total_steps": 1428, "loss": 0.5596367716789246, "lr": 4.6787632218326385e-08, "epoch": 2.884453781512605, "percentage": 96.15, "elapsed_time": "0:28:08", "remaining_time": "0:01:07"} +{"current_steps": 1374, "total_steps": 1428, "loss": 0.38018864393234253, "lr": 4.513406097297224e-08, "epoch": 2.8865546218487395, "percentage": 96.22, "elapsed_time": "0:28:09", "remaining_time": "0:01:06"} +{"current_steps": 1375, "total_steps": 1428, "loss": 0.661139726638794, "lr": 4.351010564447977e-08, "epoch": 2.888655462184874, "percentage": 96.29, "elapsed_time": "0:28:10", "remaining_time": "0:01:05"} +{"current_steps": 1376, "total_steps": 1428, "loss": 0.2944487929344177, "lr": 4.1915775939454506e-08, "epoch": 2.8907563025210083, "percentage": 96.36, "elapsed_time": "0:28:11", "remaining_time": "0:01:03"} +{"current_steps": 1377, "total_steps": 1428, "loss": 0.23486556112766266, "lr": 4.035108138742416e-08, "epoch": 2.892857142857143, "percentage": 96.43, "elapsed_time": "0:28:12", "remaining_time": "0:01:02"} +{"current_steps": 1378, "total_steps": 1428, "loss": 0.3030620813369751, "lr": 3.881603134078482e-08, "epoch": 2.8949579831932772, "percentage": 96.5, "elapsed_time": "0:28:13", "remaining_time": "0:01:01"} +{"current_steps": 1379, "total_steps": 1428, "loss": 0.3213701546192169, "lr": 3.731063497474152e-08, "epoch": 2.8970588235294117, "percentage": 96.57, "elapsed_time": "0:28:14", "remaining_time": "0:01:00"} +{"current_steps": 1380, "total_steps": 1428, "loss": 0.22970488667488098, "lr": 3.583490128725553e-08, "epoch": 2.899159663865546, "percentage": 96.64, "elapsed_time": "0:28:15", "remaining_time": "0:00:58"} +{"current_steps": 1381, "total_steps": 1428, "loss": 0.32231050729751587, "lr": 3.4388839098992154e-08, "epoch": 2.9012605042016806, "percentage": 96.71, "elapsed_time": "0:28:16", "remaining_time": "0:00:57"} +{"current_steps": 1382, "total_steps": 1428, "loss": 0.9544304609298706, "lr": 3.2972457053262466e-08, "epoch": 2.903361344537815, "percentage": 96.78, "elapsed_time": "0:28:17", "remaining_time": "0:00:56"} +{"current_steps": 1383, "total_steps": 1428, "loss": 0.7788558006286621, "lr": 3.158576361597887e-08, "epoch": 2.9054621848739495, "percentage": 96.85, "elapsed_time": "0:28:18", "remaining_time": "0:00:55"} +{"current_steps": 1384, "total_steps": 1428, "loss": 0.2601931393146515, "lr": 3.022876707559796e-08, "epoch": 2.907563025210084, "percentage": 96.92, "elapsed_time": "0:28:19", "remaining_time": "0:00:54"} +{"current_steps": 1385, "total_steps": 1428, "loss": 0.5957424640655518, "lr": 2.890147554307665e-08, "epoch": 2.9096638655462184, "percentage": 96.99, "elapsed_time": "0:28:20", "remaining_time": "0:00:52"} +{"current_steps": 1386, "total_steps": 1428, "loss": 0.2927376925945282, "lr": 2.7603896951817755e-08, "epoch": 2.911764705882353, "percentage": 97.06, "elapsed_time": "0:28:21", "remaining_time": "0:00:51"} +{"current_steps": 1387, "total_steps": 1428, "loss": 0.5990405082702637, "lr": 2.633603905762838e-08, "epoch": 2.9138655462184873, "percentage": 97.13, "elapsed_time": "0:28:23", "remaining_time": "0:00:50"} +{"current_steps": 1388, "total_steps": 1428, "loss": 0.4513130784034729, "lr": 2.5097909438669964e-08, "epoch": 2.9159663865546217, "percentage": 97.2, "elapsed_time": "0:28:24", "remaining_time": "0:00:49"} +{"current_steps": 1389, "total_steps": 1428, "loss": 0.6215352416038513, "lr": 2.3889515495413297e-08, "epoch": 2.918067226890756, "percentage": 97.27, "elapsed_time": "0:28:25", "remaining_time": "0:00:47"} +{"current_steps": 1390, "total_steps": 1428, "loss": 0.33804643154144287, "lr": 2.2710864450596336e-08, "epoch": 2.9201680672268906, "percentage": 97.34, "elapsed_time": "0:28:26", "remaining_time": "0:00:46"} +{"current_steps": 1391, "total_steps": 1428, "loss": 0.4266011416912079, "lr": 2.1561963349178704e-08, "epoch": 2.9222689075630255, "percentage": 97.41, "elapsed_time": "0:28:27", "remaining_time": "0:00:45"} +{"current_steps": 1392, "total_steps": 1428, "loss": 0.3738781809806824, "lr": 2.0442819058300588e-08, "epoch": 2.92436974789916, "percentage": 97.48, "elapsed_time": "0:28:28", "remaining_time": "0:00:44"} +{"current_steps": 1393, "total_steps": 1428, "loss": 0.26019287109375, "lr": 1.935343826724112e-08, "epoch": 2.9264705882352944, "percentage": 97.55, "elapsed_time": "0:28:29", "remaining_time": "0:00:42"} +{"current_steps": 1394, "total_steps": 1428, "loss": 0.3799281120300293, "lr": 1.8293827487380623e-08, "epoch": 2.928571428571429, "percentage": 97.62, "elapsed_time": "0:28:30", "remaining_time": "0:00:41"} +{"current_steps": 1395, "total_steps": 1428, "loss": 0.25459083914756775, "lr": 1.726399305215787e-08, "epoch": 2.9306722689075633, "percentage": 97.69, "elapsed_time": "0:28:31", "remaining_time": "0:00:40"} +{"current_steps": 1396, "total_steps": 1428, "loss": 0.4746205806732178, "lr": 1.626394111703622e-08, "epoch": 2.9327731092436977, "percentage": 97.76, "elapsed_time": "0:28:32", "remaining_time": "0:00:39"} +{"current_steps": 1397, "total_steps": 1428, "loss": 0.4622001647949219, "lr": 1.5293677659463104e-08, "epoch": 2.934873949579832, "percentage": 97.83, "elapsed_time": "0:28:33", "remaining_time": "0:00:38"} +{"current_steps": 1398, "total_steps": 1428, "loss": 0.18047931790351868, "lr": 1.4353208478837256e-08, "epoch": 2.9369747899159666, "percentage": 97.9, "elapsed_time": "0:28:34", "remaining_time": "0:00:36"} +{"current_steps": 1399, "total_steps": 1428, "loss": 0.37007540464401245, "lr": 1.3442539196472647e-08, "epoch": 2.939075630252101, "percentage": 97.97, "elapsed_time": "0:28:36", "remaining_time": "0:00:35"} +{"current_steps": 1400, "total_steps": 1428, "loss": 0.7158060073852539, "lr": 1.2561675255564621e-08, "epoch": 2.9411764705882355, "percentage": 98.04, "elapsed_time": "0:28:37", "remaining_time": "0:00:34"} +{"current_steps": 1401, "total_steps": 1428, "loss": 0.9123420119285583, "lr": 1.1710621921159904e-08, "epoch": 2.94327731092437, "percentage": 98.11, "elapsed_time": "0:28:38", "remaining_time": "0:00:33"} +{"current_steps": 1402, "total_steps": 1428, "loss": 1.1057486534118652, "lr": 1.0889384280119985e-08, "epoch": 2.9453781512605044, "percentage": 98.18, "elapsed_time": "0:28:39", "remaining_time": "0:00:31"} +{"current_steps": 1403, "total_steps": 1428, "loss": 0.36926376819610596, "lr": 1.009796724109613e-08, "epoch": 2.947478991596639, "percentage": 98.25, "elapsed_time": "0:28:40", "remaining_time": "0:00:30"} +{"current_steps": 1404, "total_steps": 1428, "loss": 0.5240511298179626, "lr": 9.336375534497732e-09, "epoch": 2.9495798319327733, "percentage": 98.32, "elapsed_time": "0:28:41", "remaining_time": "0:00:29"} +{"current_steps": 1405, "total_steps": 1428, "loss": 1.0361064672470093, "lr": 8.60461371246235e-09, "epoch": 2.9516806722689077, "percentage": 98.39, "elapsed_time": "0:28:42", "remaining_time": "0:00:28"} +{"current_steps": 1406, "total_steps": 1428, "loss": 0.7314852476119995, "lr": 7.902686148831273e-09, "epoch": 2.953781512605042, "percentage": 98.46, "elapsed_time": "0:28:43", "remaining_time": "0:00:26"} +{"current_steps": 1407, "total_steps": 1428, "loss": 0.5929103493690491, "lr": 7.230597039123433e-09, "epoch": 2.9558823529411766, "percentage": 98.53, "elapsed_time": "0:28:44", "remaining_time": "0:00:25"} +{"current_steps": 1408, "total_steps": 1428, "loss": 0.24979953467845917, "lr": 6.588350400507093e-09, "epoch": 2.957983193277311, "percentage": 98.6, "elapsed_time": "0:28:45", "remaining_time": "0:00:24"} +{"current_steps": 1409, "total_steps": 1428, "loss": 0.810958206653595, "lr": 5.975950071779313e-09, "epoch": 2.9600840336134455, "percentage": 98.67, "elapsed_time": "0:28:46", "remaining_time": "0:00:23"} +{"current_steps": 1410, "total_steps": 1428, "loss": 0.4567590355873108, "lr": 5.393399713341518e-09, "epoch": 2.96218487394958, "percentage": 98.74, "elapsed_time": "0:28:47", "remaining_time": "0:00:22"} +{"current_steps": 1411, "total_steps": 1428, "loss": 0.34989726543426514, "lr": 4.8407028071773e-09, "epoch": 2.9642857142857144, "percentage": 98.81, "elapsed_time": "0:28:49", "remaining_time": "0:00:20"} +{"current_steps": 1412, "total_steps": 1428, "loss": 0.3826170563697815, "lr": 4.317862656831873e-09, "epoch": 2.966386554621849, "percentage": 98.88, "elapsed_time": "0:28:50", "remaining_time": "0:00:19"} +{"current_steps": 1413, "total_steps": 1428, "loss": 0.25103145837783813, "lr": 3.8248823873932026e-09, "epoch": 2.9684873949579833, "percentage": 98.95, "elapsed_time": "0:28:51", "remaining_time": "0:00:18"} +{"current_steps": 1414, "total_steps": 1428, "loss": 0.33963871002197266, "lr": 3.361764945473134e-09, "epoch": 2.9705882352941178, "percentage": 99.02, "elapsed_time": "0:28:52", "remaining_time": "0:00:17"} +{"current_steps": 1415, "total_steps": 1428, "loss": 0.5596168637275696, "lr": 2.928513099187402e-09, "epoch": 2.972689075630252, "percentage": 99.09, "elapsed_time": "0:28:53", "remaining_time": "0:00:15"} +{"current_steps": 1416, "total_steps": 1428, "loss": 0.3114224374294281, "lr": 2.52512943814176e-09, "epoch": 2.9747899159663866, "percentage": 99.16, "elapsed_time": "0:28:54", "remaining_time": "0:00:14"} +{"current_steps": 1417, "total_steps": 1428, "loss": 0.5350728631019592, "lr": 2.151616373417542e-09, "epoch": 2.976890756302521, "percentage": 99.23, "elapsed_time": "0:28:55", "remaining_time": "0:00:13"} +{"current_steps": 1418, "total_steps": 1428, "loss": 0.6644730567932129, "lr": 1.8079761375522365e-09, "epoch": 2.9789915966386555, "percentage": 99.3, "elapsed_time": "0:28:56", "remaining_time": "0:00:12"} +{"current_steps": 1419, "total_steps": 1428, "loss": 0.2426847219467163, "lr": 1.4942107845317132e-09, "epoch": 2.98109243697479, "percentage": 99.37, "elapsed_time": "0:28:57", "remaining_time": "0:00:11"} +{"current_steps": 1420, "total_steps": 1428, "loss": 0.2127893567085266, "lr": 1.210322189774682e-09, "epoch": 2.9831932773109244, "percentage": 99.44, "elapsed_time": "0:28:58", "remaining_time": "0:00:09"} +{"current_steps": 1421, "total_steps": 1428, "loss": 0.31507742404937744, "lr": 9.563120501221434e-10, "epoch": 2.985294117647059, "percentage": 99.51, "elapsed_time": "0:28:59", "remaining_time": "0:00:08"} +{"current_steps": 1422, "total_steps": 1428, "loss": 0.49292629957199097, "lr": 7.321818838279537e-10, "epoch": 2.9873949579831933, "percentage": 99.58, "elapsed_time": "0:29:00", "remaining_time": "0:00:07"} +{"current_steps": 1423, "total_steps": 1428, "loss": 0.25357064604759216, "lr": 5.379330305488317e-10, "epoch": 2.9894957983193278, "percentage": 99.65, "elapsed_time": "0:29:01", "remaining_time": "0:00:06"} +{"current_steps": 1424, "total_steps": 1428, "loss": 0.4229947328567505, "lr": 3.735666513371428e-10, "epoch": 2.991596638655462, "percentage": 99.72, "elapsed_time": "0:29:03", "remaining_time": "0:00:04"} +{"current_steps": 1425, "total_steps": 1428, "loss": 0.5679960250854492, "lr": 2.3908372863368223e-10, "epoch": 2.9936974789915967, "percentage": 99.79, "elapsed_time": "0:29:04", "remaining_time": "0:00:03"} +{"current_steps": 1426, "total_steps": 1428, "loss": 0.3406621515750885, "lr": 1.344850662604591e-10, "epoch": 2.995798319327731, "percentage": 99.86, "elapsed_time": "0:29:05", "remaining_time": "0:00:02"} +{"current_steps": 1427, "total_steps": 1428, "loss": 0.3986052870750427, "lr": 5.977128941903055e-11, "epoch": 2.9978991596638656, "percentage": 99.93, "elapsed_time": "0:29:06", "remaining_time": "0:00:01"} +{"current_steps": 1428, "total_steps": 1428, "loss": 0.49183082580566406, "lr": 1.494284468384066e-11, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:29:07", "remaining_time": "0:00:00"} +{"current_steps": 1428, "total_steps": 1428, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:30:51", "remaining_time": "0:00:00"} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..2a95de4 --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,10039 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 3.0, + "eval_steps": 500, + "global_step": 1428, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0021008403361344537, + "grad_norm": 46.99030458326992, + "learning_rate": 0.0, + "loss": 4.722589492797852, + "step": 1 + }, + { + "epoch": 0.004201680672268907, + "grad_norm": 36.88474864262765, + "learning_rate": 6.993006993006993e-08, + "loss": 3.9686050415039062, + "step": 2 + }, + { + "epoch": 0.0063025210084033615, + "grad_norm": 33.07457670969746, + "learning_rate": 1.3986013986013987e-07, + "loss": 4.086915969848633, + "step": 3 + }, + { + "epoch": 0.008403361344537815, + "grad_norm": 31.625791708920385, + "learning_rate": 2.097902097902098e-07, + "loss": 4.020754814147949, + "step": 4 + }, + { + "epoch": 0.01050420168067227, + "grad_norm": 43.0872077594366, + "learning_rate": 2.7972027972027973e-07, + "loss": 4.11073112487793, + "step": 5 + }, + { + "epoch": 0.012605042016806723, + "grad_norm": 41.05815920768766, + "learning_rate": 3.496503496503497e-07, + "loss": 4.068889141082764, + "step": 6 + }, + { + "epoch": 0.014705882352941176, + "grad_norm": 38.60187500165403, + "learning_rate": 4.195804195804196e-07, + "loss": 3.9590301513671875, + "step": 7 + }, + { + "epoch": 0.01680672268907563, + "grad_norm": 39.6727205000689, + "learning_rate": 4.895104895104896e-07, + "loss": 3.7929787635803223, + "step": 8 + }, + { + "epoch": 0.018907563025210083, + "grad_norm": 35.21152216885091, + "learning_rate": 5.594405594405595e-07, + "loss": 4.345971584320068, + "step": 9 + }, + { + "epoch": 0.02100840336134454, + "grad_norm": 32.94311862999745, + "learning_rate": 6.293706293706295e-07, + "loss": 4.204797744750977, + "step": 10 + }, + { + "epoch": 0.023109243697478993, + "grad_norm": 35.708967266069514, + "learning_rate": 6.993006993006994e-07, + "loss": 4.2924957275390625, + "step": 11 + }, + { + "epoch": 0.025210084033613446, + "grad_norm": 35.068164747297715, + "learning_rate": 7.692307692307694e-07, + "loss": 3.6519017219543457, + "step": 12 + }, + { + "epoch": 0.0273109243697479, + "grad_norm": 36.012069511225576, + "learning_rate": 8.391608391608393e-07, + "loss": 3.5902950763702393, + "step": 13 + }, + { + "epoch": 0.029411764705882353, + "grad_norm": 31.883494522724174, + "learning_rate": 9.090909090909091e-07, + "loss": 3.751192092895508, + "step": 14 + }, + { + "epoch": 0.031512605042016806, + "grad_norm": 28.67530148457089, + "learning_rate": 9.790209790209791e-07, + "loss": 4.330526351928711, + "step": 15 + }, + { + "epoch": 0.03361344537815126, + "grad_norm": 36.87930031460684, + "learning_rate": 1.0489510489510491e-06, + "loss": 3.7747349739074707, + "step": 16 + }, + { + "epoch": 0.03571428571428571, + "grad_norm": 34.94283148044396, + "learning_rate": 1.118881118881119e-06, + "loss": 3.6174468994140625, + "step": 17 + }, + { + "epoch": 0.037815126050420166, + "grad_norm": 26.489554272646977, + "learning_rate": 1.188811188811189e-06, + "loss": 3.4348971843719482, + "step": 18 + }, + { + "epoch": 0.03991596638655462, + "grad_norm": 25.603886661513403, + "learning_rate": 1.258741258741259e-06, + "loss": 3.4862470626831055, + "step": 19 + }, + { + "epoch": 0.04201680672268908, + "grad_norm": 22.404814809342252, + "learning_rate": 1.3286713286713287e-06, + "loss": 3.7471625804901123, + "step": 20 + }, + { + "epoch": 0.04411764705882353, + "grad_norm": 21.15277638751192, + "learning_rate": 1.3986013986013987e-06, + "loss": 3.6562182903289795, + "step": 21 + }, + { + "epoch": 0.046218487394957986, + "grad_norm": 20.270881263670095, + "learning_rate": 1.4685314685314685e-06, + "loss": 2.944753408432007, + "step": 22 + }, + { + "epoch": 0.04831932773109244, + "grad_norm": 22.812966816264836, + "learning_rate": 1.5384615384615387e-06, + "loss": 4.277539253234863, + "step": 23 + }, + { + "epoch": 0.05042016806722689, + "grad_norm": 21.380979723581284, + "learning_rate": 1.6083916083916085e-06, + "loss": 4.103379726409912, + "step": 24 + }, + { + "epoch": 0.052521008403361345, + "grad_norm": 13.548338819677783, + "learning_rate": 1.6783216783216785e-06, + "loss": 3.516192674636841, + "step": 25 + }, + { + "epoch": 0.0546218487394958, + "grad_norm": 16.574184790133323, + "learning_rate": 1.7482517482517483e-06, + "loss": 3.054426908493042, + "step": 26 + }, + { + "epoch": 0.05672268907563025, + "grad_norm": 14.817846975349166, + "learning_rate": 1.8181818181818183e-06, + "loss": 3.598344564437866, + "step": 27 + }, + { + "epoch": 0.058823529411764705, + "grad_norm": 13.230202987729585, + "learning_rate": 1.888111888111888e-06, + "loss": 2.1566905975341797, + "step": 28 + }, + { + "epoch": 0.06092436974789916, + "grad_norm": 19.612310968262104, + "learning_rate": 1.9580419580419583e-06, + "loss": 2.7493889331817627, + "step": 29 + }, + { + "epoch": 0.06302521008403361, + "grad_norm": 18.334666543367657, + "learning_rate": 2.027972027972028e-06, + "loss": 3.7484190464019775, + "step": 30 + }, + { + "epoch": 0.06512605042016807, + "grad_norm": 15.812972082251932, + "learning_rate": 2.0979020979020983e-06, + "loss": 3.4763312339782715, + "step": 31 + }, + { + "epoch": 0.06722689075630252, + "grad_norm": 18.340243585590446, + "learning_rate": 2.167832167832168e-06, + "loss": 4.1537184715271, + "step": 32 + }, + { + "epoch": 0.06932773109243698, + "grad_norm": 9.470566142580898, + "learning_rate": 2.237762237762238e-06, + "loss": 3.949978828430176, + "step": 33 + }, + { + "epoch": 0.07142857142857142, + "grad_norm": 15.047162012043515, + "learning_rate": 2.307692307692308e-06, + "loss": 3.095123291015625, + "step": 34 + }, + { + "epoch": 0.07352941176470588, + "grad_norm": 15.619490386855553, + "learning_rate": 2.377622377622378e-06, + "loss": 3.6232047080993652, + "step": 35 + }, + { + "epoch": 0.07563025210084033, + "grad_norm": 12.996399577415676, + "learning_rate": 2.4475524475524477e-06, + "loss": 3.801804304122925, + "step": 36 + }, + { + "epoch": 0.07773109243697479, + "grad_norm": 7.924270548246447, + "learning_rate": 2.517482517482518e-06, + "loss": 2.909287452697754, + "step": 37 + }, + { + "epoch": 0.07983193277310924, + "grad_norm": 10.838167134028488, + "learning_rate": 2.5874125874125877e-06, + "loss": 3.283078670501709, + "step": 38 + }, + { + "epoch": 0.0819327731092437, + "grad_norm": 12.236334826312302, + "learning_rate": 2.6573426573426574e-06, + "loss": 2.9224965572357178, + "step": 39 + }, + { + "epoch": 0.08403361344537816, + "grad_norm": 10.59808836361908, + "learning_rate": 2.7272727272727272e-06, + "loss": 3.591977119445801, + "step": 40 + }, + { + "epoch": 0.0861344537815126, + "grad_norm": 9.295669805450128, + "learning_rate": 2.7972027972027974e-06, + "loss": 3.0213565826416016, + "step": 41 + }, + { + "epoch": 0.08823529411764706, + "grad_norm": 12.563423620415891, + "learning_rate": 2.8671328671328672e-06, + "loss": 2.9183509349823, + "step": 42 + }, + { + "epoch": 0.09033613445378151, + "grad_norm": 13.858660538396043, + "learning_rate": 2.937062937062937e-06, + "loss": 3.4748919010162354, + "step": 43 + }, + { + "epoch": 0.09243697478991597, + "grad_norm": 11.043040598415395, + "learning_rate": 3.006993006993007e-06, + "loss": 3.53951096534729, + "step": 44 + }, + { + "epoch": 0.09453781512605042, + "grad_norm": 12.201335477546305, + "learning_rate": 3.0769230769230774e-06, + "loss": 3.2075607776641846, + "step": 45 + }, + { + "epoch": 0.09663865546218488, + "grad_norm": 20.281483402633803, + "learning_rate": 3.1468531468531472e-06, + "loss": 3.2893571853637695, + "step": 46 + }, + { + "epoch": 0.09873949579831932, + "grad_norm": 10.008468666819498, + "learning_rate": 3.216783216783217e-06, + "loss": 3.47295880317688, + "step": 47 + }, + { + "epoch": 0.10084033613445378, + "grad_norm": 11.407538553004894, + "learning_rate": 3.286713286713287e-06, + "loss": 3.5495269298553467, + "step": 48 + }, + { + "epoch": 0.10294117647058823, + "grad_norm": 16.252417297798132, + "learning_rate": 3.356643356643357e-06, + "loss": 3.218782901763916, + "step": 49 + }, + { + "epoch": 0.10504201680672269, + "grad_norm": 8.752146553121406, + "learning_rate": 3.426573426573427e-06, + "loss": 2.612854242324829, + "step": 50 + }, + { + "epoch": 0.10714285714285714, + "grad_norm": 14.782692853689836, + "learning_rate": 3.4965034965034966e-06, + "loss": 3.0805444717407227, + "step": 51 + }, + { + "epoch": 0.1092436974789916, + "grad_norm": 14.664178996815842, + "learning_rate": 3.566433566433567e-06, + "loss": 3.1539719104766846, + "step": 52 + }, + { + "epoch": 0.11134453781512606, + "grad_norm": 13.158498079025986, + "learning_rate": 3.6363636363636366e-06, + "loss": 3.5745811462402344, + "step": 53 + }, + { + "epoch": 0.1134453781512605, + "grad_norm": 9.661944205457672, + "learning_rate": 3.7062937062937064e-06, + "loss": 3.033264398574829, + "step": 54 + }, + { + "epoch": 0.11554621848739496, + "grad_norm": 8.534767379388418, + "learning_rate": 3.776223776223776e-06, + "loss": 2.5727319717407227, + "step": 55 + }, + { + "epoch": 0.11764705882352941, + "grad_norm": 10.446726865588245, + "learning_rate": 3.846153846153847e-06, + "loss": 3.4801394939422607, + "step": 56 + }, + { + "epoch": 0.11974789915966387, + "grad_norm": 11.510497882977212, + "learning_rate": 3.916083916083917e-06, + "loss": 3.253239631652832, + "step": 57 + }, + { + "epoch": 0.12184873949579832, + "grad_norm": 12.480969279334285, + "learning_rate": 3.986013986013986e-06, + "loss": 3.0049266815185547, + "step": 58 + }, + { + "epoch": 0.12394957983193278, + "grad_norm": 10.926998541566615, + "learning_rate": 4.055944055944056e-06, + "loss": 3.13586688041687, + "step": 59 + }, + { + "epoch": 0.12605042016806722, + "grad_norm": 15.080151132986066, + "learning_rate": 4.125874125874127e-06, + "loss": 3.5970468521118164, + "step": 60 + }, + { + "epoch": 0.12815126050420167, + "grad_norm": 11.40302094802426, + "learning_rate": 4.195804195804197e-06, + "loss": 3.0423130989074707, + "step": 61 + }, + { + "epoch": 0.13025210084033614, + "grad_norm": 27.877774734458356, + "learning_rate": 4.265734265734266e-06, + "loss": 3.270495891571045, + "step": 62 + }, + { + "epoch": 0.1323529411764706, + "grad_norm": 14.517043785366944, + "learning_rate": 4.335664335664336e-06, + "loss": 3.3109726905822754, + "step": 63 + }, + { + "epoch": 0.13445378151260504, + "grad_norm": 9.703645186786849, + "learning_rate": 4.405594405594406e-06, + "loss": 2.8192973136901855, + "step": 64 + }, + { + "epoch": 0.13655462184873948, + "grad_norm": 7.165620671720677, + "learning_rate": 4.475524475524476e-06, + "loss": 2.6368956565856934, + "step": 65 + }, + { + "epoch": 0.13865546218487396, + "grad_norm": 8.390508554521247, + "learning_rate": 4.5454545454545455e-06, + "loss": 3.2420871257781982, + "step": 66 + }, + { + "epoch": 0.1407563025210084, + "grad_norm": 13.495244668273582, + "learning_rate": 4.615384615384616e-06, + "loss": 3.4662106037139893, + "step": 67 + }, + { + "epoch": 0.14285714285714285, + "grad_norm": 8.727556576037161, + "learning_rate": 4.685314685314686e-06, + "loss": 2.52485728263855, + "step": 68 + }, + { + "epoch": 0.14495798319327732, + "grad_norm": 7.972842185352863, + "learning_rate": 4.755244755244756e-06, + "loss": 2.94364595413208, + "step": 69 + }, + { + "epoch": 0.14705882352941177, + "grad_norm": 9.543376366698592, + "learning_rate": 4.8251748251748255e-06, + "loss": 3.080875873565674, + "step": 70 + }, + { + "epoch": 0.14915966386554622, + "grad_norm": 9.776294776088129, + "learning_rate": 4.895104895104895e-06, + "loss": 2.779900550842285, + "step": 71 + }, + { + "epoch": 0.15126050420168066, + "grad_norm": 13.30903798143632, + "learning_rate": 4.965034965034965e-06, + "loss": 2.5541608333587646, + "step": 72 + }, + { + "epoch": 0.15336134453781514, + "grad_norm": 15.821626595005261, + "learning_rate": 5.034965034965036e-06, + "loss": 3.3032145500183105, + "step": 73 + }, + { + "epoch": 0.15546218487394958, + "grad_norm": 16.2233191932233, + "learning_rate": 5.1048951048951055e-06, + "loss": 3.302570104598999, + "step": 74 + }, + { + "epoch": 0.15756302521008403, + "grad_norm": 12.108052548372182, + "learning_rate": 5.174825174825175e-06, + "loss": 3.084743022918701, + "step": 75 + }, + { + "epoch": 0.15966386554621848, + "grad_norm": 12.123207907469205, + "learning_rate": 5.244755244755245e-06, + "loss": 2.839994430541992, + "step": 76 + }, + { + "epoch": 0.16176470588235295, + "grad_norm": 27.162201978657112, + "learning_rate": 5.314685314685315e-06, + "loss": 2.8261585235595703, + "step": 77 + }, + { + "epoch": 0.1638655462184874, + "grad_norm": 9.26220027446702, + "learning_rate": 5.384615384615385e-06, + "loss": 3.022369861602783, + "step": 78 + }, + { + "epoch": 0.16596638655462184, + "grad_norm": 34.01052504369158, + "learning_rate": 5.4545454545454545e-06, + "loss": 3.11270809173584, + "step": 79 + }, + { + "epoch": 0.16806722689075632, + "grad_norm": 10.318191696420305, + "learning_rate": 5.524475524475524e-06, + "loss": 2.8419973850250244, + "step": 80 + }, + { + "epoch": 0.17016806722689076, + "grad_norm": 8.227880656419073, + "learning_rate": 5.594405594405595e-06, + "loss": 3.14296555519104, + "step": 81 + }, + { + "epoch": 0.1722689075630252, + "grad_norm": 9.40271889928186, + "learning_rate": 5.664335664335665e-06, + "loss": 2.8033950328826904, + "step": 82 + }, + { + "epoch": 0.17436974789915966, + "grad_norm": 9.95443701525972, + "learning_rate": 5.7342657342657345e-06, + "loss": 3.087614059448242, + "step": 83 + }, + { + "epoch": 0.17647058823529413, + "grad_norm": 9.899264562788812, + "learning_rate": 5.804195804195804e-06, + "loss": 2.7504851818084717, + "step": 84 + }, + { + "epoch": 0.17857142857142858, + "grad_norm": 14.065492890913543, + "learning_rate": 5.874125874125874e-06, + "loss": 2.701443672180176, + "step": 85 + }, + { + "epoch": 0.18067226890756302, + "grad_norm": 12.602747808400954, + "learning_rate": 5.944055944055944e-06, + "loss": 2.8965351581573486, + "step": 86 + }, + { + "epoch": 0.18277310924369747, + "grad_norm": 10.478287423381614, + "learning_rate": 6.013986013986014e-06, + "loss": 2.9607667922973633, + "step": 87 + }, + { + "epoch": 0.18487394957983194, + "grad_norm": 25.168903954415445, + "learning_rate": 6.083916083916085e-06, + "loss": 3.2360849380493164, + "step": 88 + }, + { + "epoch": 0.1869747899159664, + "grad_norm": 9.706474901305377, + "learning_rate": 6.153846153846155e-06, + "loss": 3.146829605102539, + "step": 89 + }, + { + "epoch": 0.18907563025210083, + "grad_norm": 16.976357238619705, + "learning_rate": 6.223776223776225e-06, + "loss": 3.017669200897217, + "step": 90 + }, + { + "epoch": 0.19117647058823528, + "grad_norm": 22.76924701111939, + "learning_rate": 6.2937062937062944e-06, + "loss": 3.4739527702331543, + "step": 91 + }, + { + "epoch": 0.19327731092436976, + "grad_norm": 10.061400086768733, + "learning_rate": 6.363636363636364e-06, + "loss": 2.8482136726379395, + "step": 92 + }, + { + "epoch": 0.1953781512605042, + "grad_norm": 12.711145684012218, + "learning_rate": 6.433566433566434e-06, + "loss": 2.7700202465057373, + "step": 93 + }, + { + "epoch": 0.19747899159663865, + "grad_norm": 19.156479556141598, + "learning_rate": 6.503496503496504e-06, + "loss": 3.109806537628174, + "step": 94 + }, + { + "epoch": 0.19957983193277312, + "grad_norm": 7.981944912040402, + "learning_rate": 6.573426573426574e-06, + "loss": 2.9637131690979004, + "step": 95 + }, + { + "epoch": 0.20168067226890757, + "grad_norm": 12.84352715723152, + "learning_rate": 6.643356643356644e-06, + "loss": 2.846522808074951, + "step": 96 + }, + { + "epoch": 0.20378151260504201, + "grad_norm": 17.72741270084134, + "learning_rate": 6.713286713286714e-06, + "loss": 3.3485140800476074, + "step": 97 + }, + { + "epoch": 0.20588235294117646, + "grad_norm": 13.533003488049717, + "learning_rate": 6.783216783216784e-06, + "loss": 3.014303207397461, + "step": 98 + }, + { + "epoch": 0.20798319327731093, + "grad_norm": 8.522856642426069, + "learning_rate": 6.853146853146854e-06, + "loss": 2.6768596172332764, + "step": 99 + }, + { + "epoch": 0.21008403361344538, + "grad_norm": 28.089483697370316, + "learning_rate": 6.923076923076923e-06, + "loss": 2.9336276054382324, + "step": 100 + }, + { + "epoch": 0.21218487394957983, + "grad_norm": 10.595985912398088, + "learning_rate": 6.993006993006993e-06, + "loss": 3.103717803955078, + "step": 101 + }, + { + "epoch": 0.21428571428571427, + "grad_norm": 9.980132596619391, + "learning_rate": 7.062937062937063e-06, + "loss": 2.7759556770324707, + "step": 102 + }, + { + "epoch": 0.21638655462184875, + "grad_norm": 9.86026405652693, + "learning_rate": 7.132867132867134e-06, + "loss": 2.586292266845703, + "step": 103 + }, + { + "epoch": 0.2184873949579832, + "grad_norm": 15.473317115776915, + "learning_rate": 7.202797202797203e-06, + "loss": 3.109880208969116, + "step": 104 + }, + { + "epoch": 0.22058823529411764, + "grad_norm": 12.647734541011893, + "learning_rate": 7.272727272727273e-06, + "loss": 2.7075915336608887, + "step": 105 + }, + { + "epoch": 0.22268907563025211, + "grad_norm": 13.506863668083897, + "learning_rate": 7.342657342657343e-06, + "loss": 3.034566879272461, + "step": 106 + }, + { + "epoch": 0.22478991596638656, + "grad_norm": 10.413965863492892, + "learning_rate": 7.412587412587413e-06, + "loss": 2.3479254245758057, + "step": 107 + }, + { + "epoch": 0.226890756302521, + "grad_norm": 11.563038534176888, + "learning_rate": 7.4825174825174825e-06, + "loss": 2.9856462478637695, + "step": 108 + }, + { + "epoch": 0.22899159663865545, + "grad_norm": 12.710111708974129, + "learning_rate": 7.552447552447552e-06, + "loss": 3.462696075439453, + "step": 109 + }, + { + "epoch": 0.23109243697478993, + "grad_norm": 11.076816381042432, + "learning_rate": 7.622377622377622e-06, + "loss": 3.270888566970825, + "step": 110 + }, + { + "epoch": 0.23319327731092437, + "grad_norm": 11.212503376143607, + "learning_rate": 7.692307692307694e-06, + "loss": 3.048227310180664, + "step": 111 + }, + { + "epoch": 0.23529411764705882, + "grad_norm": 12.400573941878047, + "learning_rate": 7.762237762237763e-06, + "loss": 3.2194204330444336, + "step": 112 + }, + { + "epoch": 0.23739495798319327, + "grad_norm": 15.219804312233611, + "learning_rate": 7.832167832167833e-06, + "loss": 3.6809778213500977, + "step": 113 + }, + { + "epoch": 0.23949579831932774, + "grad_norm": 14.217254787332546, + "learning_rate": 7.902097902097902e-06, + "loss": 2.912044048309326, + "step": 114 + }, + { + "epoch": 0.2415966386554622, + "grad_norm": 16.623326169718574, + "learning_rate": 7.972027972027973e-06, + "loss": 3.1021275520324707, + "step": 115 + }, + { + "epoch": 0.24369747899159663, + "grad_norm": 9.18687643151976, + "learning_rate": 8.041958041958042e-06, + "loss": 3.089829683303833, + "step": 116 + }, + { + "epoch": 0.24579831932773108, + "grad_norm": 16.772079088582387, + "learning_rate": 8.111888111888112e-06, + "loss": 3.4016504287719727, + "step": 117 + }, + { + "epoch": 0.24789915966386555, + "grad_norm": 68.62004336442155, + "learning_rate": 8.181818181818183e-06, + "loss": 3.502598285675049, + "step": 118 + }, + { + "epoch": 0.25, + "grad_norm": 9.091493777708147, + "learning_rate": 8.251748251748254e-06, + "loss": 3.0750184059143066, + "step": 119 + }, + { + "epoch": 0.25210084033613445, + "grad_norm": 13.607326745790957, + "learning_rate": 8.321678321678323e-06, + "loss": 2.8168656826019287, + "step": 120 + }, + { + "epoch": 0.2542016806722689, + "grad_norm": 8.683002515816812, + "learning_rate": 8.391608391608393e-06, + "loss": 2.3565826416015625, + "step": 121 + }, + { + "epoch": 0.25630252100840334, + "grad_norm": 23.36617403509855, + "learning_rate": 8.461538461538462e-06, + "loss": 2.972810745239258, + "step": 122 + }, + { + "epoch": 0.25840336134453784, + "grad_norm": 8.174637732136828, + "learning_rate": 8.531468531468533e-06, + "loss": 2.9700140953063965, + "step": 123 + }, + { + "epoch": 0.2605042016806723, + "grad_norm": 10.47900789596826, + "learning_rate": 8.601398601398602e-06, + "loss": 3.0162484645843506, + "step": 124 + }, + { + "epoch": 0.26260504201680673, + "grad_norm": 16.076782876444586, + "learning_rate": 8.671328671328672e-06, + "loss": 3.109422445297241, + "step": 125 + }, + { + "epoch": 0.2647058823529412, + "grad_norm": 33.666522199585756, + "learning_rate": 8.741258741258743e-06, + "loss": 2.6802124977111816, + "step": 126 + }, + { + "epoch": 0.2668067226890756, + "grad_norm": 12.537622047835336, + "learning_rate": 8.811188811188812e-06, + "loss": 2.6609840393066406, + "step": 127 + }, + { + "epoch": 0.2689075630252101, + "grad_norm": 11.767487098574284, + "learning_rate": 8.881118881118883e-06, + "loss": 3.0896430015563965, + "step": 128 + }, + { + "epoch": 0.2710084033613445, + "grad_norm": 7.737680571917604, + "learning_rate": 8.951048951048951e-06, + "loss": 3.2370247840881348, + "step": 129 + }, + { + "epoch": 0.27310924369747897, + "grad_norm": 13.8395022595692, + "learning_rate": 9.020979020979022e-06, + "loss": 2.8461947441101074, + "step": 130 + }, + { + "epoch": 0.27521008403361347, + "grad_norm": 27.87627626250655, + "learning_rate": 9.090909090909091e-06, + "loss": 3.480252742767334, + "step": 131 + }, + { + "epoch": 0.2773109243697479, + "grad_norm": 8.067136701179228, + "learning_rate": 9.160839160839162e-06, + "loss": 2.8424923419952393, + "step": 132 + }, + { + "epoch": 0.27941176470588236, + "grad_norm": 12.474203656062087, + "learning_rate": 9.230769230769232e-06, + "loss": 3.4489340782165527, + "step": 133 + }, + { + "epoch": 0.2815126050420168, + "grad_norm": 9.56092760411321, + "learning_rate": 9.300699300699301e-06, + "loss": 2.48683500289917, + "step": 134 + }, + { + "epoch": 0.28361344537815125, + "grad_norm": 10.45857911102664, + "learning_rate": 9.370629370629372e-06, + "loss": 2.975668430328369, + "step": 135 + }, + { + "epoch": 0.2857142857142857, + "grad_norm": 9.79706691198192, + "learning_rate": 9.44055944055944e-06, + "loss": 3.163745403289795, + "step": 136 + }, + { + "epoch": 0.28781512605042014, + "grad_norm": 16.663615728677826, + "learning_rate": 9.510489510489511e-06, + "loss": 3.3047399520874023, + "step": 137 + }, + { + "epoch": 0.28991596638655465, + "grad_norm": 10.093105336690149, + "learning_rate": 9.58041958041958e-06, + "loss": 2.901014804840088, + "step": 138 + }, + { + "epoch": 0.2920168067226891, + "grad_norm": 10.712099293339499, + "learning_rate": 9.650349650349651e-06, + "loss": 2.4749934673309326, + "step": 139 + }, + { + "epoch": 0.29411764705882354, + "grad_norm": 12.306067699743261, + "learning_rate": 9.72027972027972e-06, + "loss": 2.735682964324951, + "step": 140 + }, + { + "epoch": 0.296218487394958, + "grad_norm": 8.899689488937057, + "learning_rate": 9.79020979020979e-06, + "loss": 1.6851799488067627, + "step": 141 + }, + { + "epoch": 0.29831932773109243, + "grad_norm": 15.412895468970188, + "learning_rate": 9.860139860139861e-06, + "loss": 2.4892358779907227, + "step": 142 + }, + { + "epoch": 0.3004201680672269, + "grad_norm": 13.718632928552148, + "learning_rate": 9.93006993006993e-06, + "loss": 3.152186870574951, + "step": 143 + }, + { + "epoch": 0.3025210084033613, + "grad_norm": 9.63303607414013, + "learning_rate": 1e-05, + "loss": 2.4623451232910156, + "step": 144 + }, + { + "epoch": 0.30462184873949577, + "grad_norm": 9.020782417307544, + "learning_rate": 9.999985057155316e-06, + "loss": 2.3573660850524902, + "step": 145 + }, + { + "epoch": 0.3067226890756303, + "grad_norm": 15.431206065267094, + "learning_rate": 9.999940228710581e-06, + "loss": 3.248166561126709, + "step": 146 + }, + { + "epoch": 0.3088235294117647, + "grad_norm": 9.624481227031932, + "learning_rate": 9.99986551493374e-06, + "loss": 3.073438882827759, + "step": 147 + }, + { + "epoch": 0.31092436974789917, + "grad_norm": 12.24535420873494, + "learning_rate": 9.999760916271368e-06, + "loss": 3.175532579421997, + "step": 148 + }, + { + "epoch": 0.3130252100840336, + "grad_norm": 8.43469444061833, + "learning_rate": 9.999626433348664e-06, + "loss": 2.2849655151367188, + "step": 149 + }, + { + "epoch": 0.31512605042016806, + "grad_norm": 13.307775899632185, + "learning_rate": 9.999462066969451e-06, + "loss": 2.7922751903533936, + "step": 150 + }, + { + "epoch": 0.3172268907563025, + "grad_norm": 11.454291564861384, + "learning_rate": 9.999267818116173e-06, + "loss": 3.03188419342041, + "step": 151 + }, + { + "epoch": 0.31932773109243695, + "grad_norm": 16.712527557096042, + "learning_rate": 9.999043687949878e-06, + "loss": 3.3826239109039307, + "step": 152 + }, + { + "epoch": 0.32142857142857145, + "grad_norm": 22.000641429064785, + "learning_rate": 9.998789677810226e-06, + "loss": 3.103822708129883, + "step": 153 + }, + { + "epoch": 0.3235294117647059, + "grad_norm": 11.206024089957094, + "learning_rate": 9.998505789215469e-06, + "loss": 2.633566379547119, + "step": 154 + }, + { + "epoch": 0.32563025210084034, + "grad_norm": 17.0566593574694, + "learning_rate": 9.998192023862448e-06, + "loss": 2.937821388244629, + "step": 155 + }, + { + "epoch": 0.3277310924369748, + "grad_norm": 10.638495096316019, + "learning_rate": 9.997848383626583e-06, + "loss": 3.0057592391967773, + "step": 156 + }, + { + "epoch": 0.32983193277310924, + "grad_norm": 13.891998906384215, + "learning_rate": 9.997474870561858e-06, + "loss": 3.4198083877563477, + "step": 157 + }, + { + "epoch": 0.3319327731092437, + "grad_norm": 7.77313705300237, + "learning_rate": 9.997071486900813e-06, + "loss": 2.748509407043457, + "step": 158 + }, + { + "epoch": 0.33403361344537813, + "grad_norm": 11.432910137348301, + "learning_rate": 9.996638235054527e-06, + "loss": 3.3422679901123047, + "step": 159 + }, + { + "epoch": 0.33613445378151263, + "grad_norm": 9.407520098068266, + "learning_rate": 9.996175117612608e-06, + "loss": 3.2214763164520264, + "step": 160 + }, + { + "epoch": 0.3382352941176471, + "grad_norm": 9.207535688673886, + "learning_rate": 9.99568213734317e-06, + "loss": 2.5538628101348877, + "step": 161 + }, + { + "epoch": 0.3403361344537815, + "grad_norm": 10.755277234400435, + "learning_rate": 9.995159297192824e-06, + "loss": 2.781787872314453, + "step": 162 + }, + { + "epoch": 0.34243697478991597, + "grad_norm": 13.097444619561006, + "learning_rate": 9.99460660028666e-06, + "loss": 3.3784282207489014, + "step": 163 + }, + { + "epoch": 0.3445378151260504, + "grad_norm": 9.022751200279867, + "learning_rate": 9.994024049928222e-06, + "loss": 3.2824249267578125, + "step": 164 + }, + { + "epoch": 0.34663865546218486, + "grad_norm": 7.521996605994801, + "learning_rate": 9.993411649599494e-06, + "loss": 2.589594841003418, + "step": 165 + }, + { + "epoch": 0.3487394957983193, + "grad_norm": 19.97411284039417, + "learning_rate": 9.992769402960878e-06, + "loss": 3.7193164825439453, + "step": 166 + }, + { + "epoch": 0.35084033613445376, + "grad_norm": 8.085906363590569, + "learning_rate": 9.99209731385117e-06, + "loss": 2.823063611984253, + "step": 167 + }, + { + "epoch": 0.35294117647058826, + "grad_norm": 11.903719879092119, + "learning_rate": 9.99139538628754e-06, + "loss": 3.1389951705932617, + "step": 168 + }, + { + "epoch": 0.3550420168067227, + "grad_norm": 21.923086009804106, + "learning_rate": 9.990663624465504e-06, + "loss": 2.9536495208740234, + "step": 169 + }, + { + "epoch": 0.35714285714285715, + "grad_norm": 13.50586631618126, + "learning_rate": 9.989902032758904e-06, + "loss": 2.6355466842651367, + "step": 170 + }, + { + "epoch": 0.3592436974789916, + "grad_norm": 5.578596081707914, + "learning_rate": 9.989110615719882e-06, + "loss": 1.1800763607025146, + "step": 171 + }, + { + "epoch": 0.36134453781512604, + "grad_norm": 16.042050675579503, + "learning_rate": 9.988289378078842e-06, + "loss": 2.679232358932495, + "step": 172 + }, + { + "epoch": 0.3634453781512605, + "grad_norm": 13.382798743317503, + "learning_rate": 9.987438324744437e-06, + "loss": 2.3583908081054688, + "step": 173 + }, + { + "epoch": 0.36554621848739494, + "grad_norm": 9.108315025108485, + "learning_rate": 9.986557460803527e-06, + "loss": 2.748077392578125, + "step": 174 + }, + { + "epoch": 0.36764705882352944, + "grad_norm": 9.67015040715346, + "learning_rate": 9.985646791521165e-06, + "loss": 3.2660067081451416, + "step": 175 + }, + { + "epoch": 0.3697478991596639, + "grad_norm": 11.678263700428246, + "learning_rate": 9.984706322340539e-06, + "loss": 2.9270148277282715, + "step": 176 + }, + { + "epoch": 0.37184873949579833, + "grad_norm": 9.845183071879623, + "learning_rate": 9.983736058882965e-06, + "loss": 2.455327033996582, + "step": 177 + }, + { + "epoch": 0.3739495798319328, + "grad_norm": 9.630887189931224, + "learning_rate": 9.982736006947842e-06, + "loss": 3.171403169631958, + "step": 178 + }, + { + "epoch": 0.3760504201680672, + "grad_norm": 7.217019473795253, + "learning_rate": 9.98170617251262e-06, + "loss": 2.6023473739624023, + "step": 179 + }, + { + "epoch": 0.37815126050420167, + "grad_norm": 7.438957257707156, + "learning_rate": 9.98064656173276e-06, + "loss": 2.7492432594299316, + "step": 180 + }, + { + "epoch": 0.3802521008403361, + "grad_norm": 12.314225953456766, + "learning_rate": 9.979557180941702e-06, + "loss": 3.520758628845215, + "step": 181 + }, + { + "epoch": 0.38235294117647056, + "grad_norm": 7.754983445761027, + "learning_rate": 9.978438036650822e-06, + "loss": 2.7245442867279053, + "step": 182 + }, + { + "epoch": 0.38445378151260506, + "grad_norm": 15.124443991385633, + "learning_rate": 9.977289135549404e-06, + "loss": 2.790768623352051, + "step": 183 + }, + { + "epoch": 0.3865546218487395, + "grad_norm": 15.169071975047261, + "learning_rate": 9.976110484504587e-06, + "loss": 2.5588126182556152, + "step": 184 + }, + { + "epoch": 0.38865546218487396, + "grad_norm": 18.50299410182784, + "learning_rate": 9.974902090561331e-06, + "loss": 3.0367865562438965, + "step": 185 + }, + { + "epoch": 0.3907563025210084, + "grad_norm": 12.853534690634186, + "learning_rate": 9.973663960942373e-06, + "loss": 3.1013669967651367, + "step": 186 + }, + { + "epoch": 0.39285714285714285, + "grad_norm": 11.962180171730763, + "learning_rate": 9.972396103048184e-06, + "loss": 2.678436279296875, + "step": 187 + }, + { + "epoch": 0.3949579831932773, + "grad_norm": 14.345031935763927, + "learning_rate": 9.971098524456925e-06, + "loss": 2.866910696029663, + "step": 188 + }, + { + "epoch": 0.39705882352941174, + "grad_norm": 24.927874908872194, + "learning_rate": 9.969771232924404e-06, + "loss": 2.6690807342529297, + "step": 189 + }, + { + "epoch": 0.39915966386554624, + "grad_norm": 13.232716463146705, + "learning_rate": 9.968414236384022e-06, + "loss": 2.615846633911133, + "step": 190 + }, + { + "epoch": 0.4012605042016807, + "grad_norm": 19.24597028348177, + "learning_rate": 9.967027542946739e-06, + "loss": 3.197604179382324, + "step": 191 + }, + { + "epoch": 0.40336134453781514, + "grad_norm": 19.57923793430777, + "learning_rate": 9.965611160901008e-06, + "loss": 1.584808349609375, + "step": 192 + }, + { + "epoch": 0.4054621848739496, + "grad_norm": 9.313854254132917, + "learning_rate": 9.964165098712745e-06, + "loss": 2.7913365364074707, + "step": 193 + }, + { + "epoch": 0.40756302521008403, + "grad_norm": 15.764914604292455, + "learning_rate": 9.962689365025259e-06, + "loss": 3.42575740814209, + "step": 194 + }, + { + "epoch": 0.4096638655462185, + "grad_norm": 9.662424511151881, + "learning_rate": 9.961183968659217e-06, + "loss": 2.6931188106536865, + "step": 195 + }, + { + "epoch": 0.4117647058823529, + "grad_norm": 13.117904635638109, + "learning_rate": 9.959648918612576e-06, + "loss": 2.4463605880737305, + "step": 196 + }, + { + "epoch": 0.41386554621848737, + "grad_norm": 8.434614198562612, + "learning_rate": 9.958084224060547e-06, + "loss": 2.647773265838623, + "step": 197 + }, + { + "epoch": 0.41596638655462187, + "grad_norm": 26.520590112059157, + "learning_rate": 9.956489894355521e-06, + "loss": 2.660770893096924, + "step": 198 + }, + { + "epoch": 0.4180672268907563, + "grad_norm": 28.510323184410662, + "learning_rate": 9.954865939027028e-06, + "loss": 3.627254009246826, + "step": 199 + }, + { + "epoch": 0.42016806722689076, + "grad_norm": 7.679364921262506, + "learning_rate": 9.953212367781675e-06, + "loss": 2.683685779571533, + "step": 200 + }, + { + "epoch": 0.4222689075630252, + "grad_norm": 13.123862369544378, + "learning_rate": 9.95152919050308e-06, + "loss": 2.7249388694763184, + "step": 201 + }, + { + "epoch": 0.42436974789915966, + "grad_norm": 6.985824973864478, + "learning_rate": 9.949816417251831e-06, + "loss": 2.933401107788086, + "step": 202 + }, + { + "epoch": 0.4264705882352941, + "grad_norm": 13.569070375050062, + "learning_rate": 9.948074058265409e-06, + "loss": 3.5457630157470703, + "step": 203 + }, + { + "epoch": 0.42857142857142855, + "grad_norm": 7.335673995298351, + "learning_rate": 9.94630212395813e-06, + "loss": 2.483736038208008, + "step": 204 + }, + { + "epoch": 0.43067226890756305, + "grad_norm": 73.9554577496319, + "learning_rate": 9.944500624921094e-06, + "loss": 2.470374584197998, + "step": 205 + }, + { + "epoch": 0.4327731092436975, + "grad_norm": 11.27254717083641, + "learning_rate": 9.942669571922108e-06, + "loss": 3.2255494594573975, + "step": 206 + }, + { + "epoch": 0.43487394957983194, + "grad_norm": 11.257221010364708, + "learning_rate": 9.940808975905627e-06, + "loss": 3.4820542335510254, + "step": 207 + }, + { + "epoch": 0.4369747899159664, + "grad_norm": 16.32933603207297, + "learning_rate": 9.93891884799269e-06, + "loss": 3.218539237976074, + "step": 208 + }, + { + "epoch": 0.43907563025210083, + "grad_norm": 27.30232213883322, + "learning_rate": 9.936999199480854e-06, + "loss": 2.8428990840911865, + "step": 209 + }, + { + "epoch": 0.4411764705882353, + "grad_norm": 8.340720464987514, + "learning_rate": 9.935050041844121e-06, + "loss": 3.661019802093506, + "step": 210 + }, + { + "epoch": 0.4432773109243697, + "grad_norm": 18.410105558121085, + "learning_rate": 9.933071386732874e-06, + "loss": 3.330902338027954, + "step": 211 + }, + { + "epoch": 0.44537815126050423, + "grad_norm": 10.649860943280096, + "learning_rate": 9.931063245973812e-06, + "loss": 2.7754883766174316, + "step": 212 + }, + { + "epoch": 0.4474789915966387, + "grad_norm": 13.898816541841864, + "learning_rate": 9.929025631569864e-06, + "loss": 2.3284661769866943, + "step": 213 + }, + { + "epoch": 0.4495798319327731, + "grad_norm": 11.170546252681195, + "learning_rate": 9.926958555700134e-06, + "loss": 2.599228858947754, + "step": 214 + }, + { + "epoch": 0.45168067226890757, + "grad_norm": 11.76779841923458, + "learning_rate": 9.924862030719821e-06, + "loss": 3.174004077911377, + "step": 215 + }, + { + "epoch": 0.453781512605042, + "grad_norm": 12.943887425672324, + "learning_rate": 9.922736069160141e-06, + "loss": 2.7390694618225098, + "step": 216 + }, + { + "epoch": 0.45588235294117646, + "grad_norm": 11.55413590289726, + "learning_rate": 9.920580683728263e-06, + "loss": 2.7388081550598145, + "step": 217 + }, + { + "epoch": 0.4579831932773109, + "grad_norm": 22.67934856569803, + "learning_rate": 9.918395887307219e-06, + "loss": 2.4359140396118164, + "step": 218 + }, + { + "epoch": 0.46008403361344535, + "grad_norm": 16.89880489289811, + "learning_rate": 9.916181692955841e-06, + "loss": 2.9688220024108887, + "step": 219 + }, + { + "epoch": 0.46218487394957986, + "grad_norm": 19.071787734842648, + "learning_rate": 9.913938113908675e-06, + "loss": 3.1534006595611572, + "step": 220 + }, + { + "epoch": 0.4642857142857143, + "grad_norm": 15.85242809267351, + "learning_rate": 9.9116651635759e-06, + "loss": 2.618938684463501, + "step": 221 + }, + { + "epoch": 0.46638655462184875, + "grad_norm": 16.618677645763935, + "learning_rate": 9.909362855543253e-06, + "loss": 2.844968318939209, + "step": 222 + }, + { + "epoch": 0.4684873949579832, + "grad_norm": 10.671971882677827, + "learning_rate": 9.907031203571948e-06, + "loss": 2.4792628288269043, + "step": 223 + }, + { + "epoch": 0.47058823529411764, + "grad_norm": 19.241816484552377, + "learning_rate": 9.90467022159859e-06, + "loss": 2.894502639770508, + "step": 224 + }, + { + "epoch": 0.4726890756302521, + "grad_norm": 23.569212607106817, + "learning_rate": 9.902279923735093e-06, + "loss": 2.792015552520752, + "step": 225 + }, + { + "epoch": 0.47478991596638653, + "grad_norm": 9.680153288005078, + "learning_rate": 9.899860324268599e-06, + "loss": 2.9171247482299805, + "step": 226 + }, + { + "epoch": 0.47689075630252103, + "grad_norm": 12.955899131578942, + "learning_rate": 9.897411437661386e-06, + "loss": 2.560214042663574, + "step": 227 + }, + { + "epoch": 0.4789915966386555, + "grad_norm": 8.404115741492017, + "learning_rate": 9.894933278550785e-06, + "loss": 3.2796883583068848, + "step": 228 + }, + { + "epoch": 0.4810924369747899, + "grad_norm": 8.318847487560761, + "learning_rate": 9.8924258617491e-06, + "loss": 3.0324971675872803, + "step": 229 + }, + { + "epoch": 0.4831932773109244, + "grad_norm": 18.51611171900766, + "learning_rate": 9.8898892022435e-06, + "loss": 3.3899683952331543, + "step": 230 + }, + { + "epoch": 0.4852941176470588, + "grad_norm": 11.1091069250737, + "learning_rate": 9.887323315195956e-06, + "loss": 2.742903709411621, + "step": 231 + }, + { + "epoch": 0.48739495798319327, + "grad_norm": 7.80795476246885, + "learning_rate": 9.884728215943122e-06, + "loss": 3.230966806411743, + "step": 232 + }, + { + "epoch": 0.4894957983193277, + "grad_norm": 13.293388527053166, + "learning_rate": 9.882103919996268e-06, + "loss": 2.8818302154541016, + "step": 233 + }, + { + "epoch": 0.49159663865546216, + "grad_norm": 6.043647907341577, + "learning_rate": 9.879450443041172e-06, + "loss": 2.358765125274658, + "step": 234 + }, + { + "epoch": 0.49369747899159666, + "grad_norm": 8.169920329828493, + "learning_rate": 9.876767800938032e-06, + "loss": 3.0420098304748535, + "step": 235 + }, + { + "epoch": 0.4957983193277311, + "grad_norm": 18.681067639331463, + "learning_rate": 9.874056009721367e-06, + "loss": 2.9595160484313965, + "step": 236 + }, + { + "epoch": 0.49789915966386555, + "grad_norm": 7.792831708992119, + "learning_rate": 9.87131508559993e-06, + "loss": 2.9571242332458496, + "step": 237 + }, + { + "epoch": 0.5, + "grad_norm": 13.533405695746444, + "learning_rate": 9.868545044956603e-06, + "loss": 2.798694610595703, + "step": 238 + }, + { + "epoch": 0.5021008403361344, + "grad_norm": 7.855798585235136, + "learning_rate": 9.865745904348296e-06, + "loss": 2.9430432319641113, + "step": 239 + }, + { + "epoch": 0.5042016806722689, + "grad_norm": 12.596029584158895, + "learning_rate": 9.862917680505863e-06, + "loss": 3.065462112426758, + "step": 240 + }, + { + "epoch": 0.5063025210084033, + "grad_norm": 11.793626015707394, + "learning_rate": 9.860060390333988e-06, + "loss": 3.8562116622924805, + "step": 241 + }, + { + "epoch": 0.5084033613445378, + "grad_norm": 8.660405200484282, + "learning_rate": 9.857174050911085e-06, + "loss": 2.645123243331909, + "step": 242 + }, + { + "epoch": 0.5105042016806722, + "grad_norm": 11.950071539791612, + "learning_rate": 9.854258679489203e-06, + "loss": 2.500267744064331, + "step": 243 + }, + { + "epoch": 0.5126050420168067, + "grad_norm": 14.029861713702717, + "learning_rate": 9.851314293493923e-06, + "loss": 2.553537368774414, + "step": 244 + }, + { + "epoch": 0.5147058823529411, + "grad_norm": 21.40352382596275, + "learning_rate": 9.848340910524243e-06, + "loss": 2.694528102874756, + "step": 245 + }, + { + "epoch": 0.5168067226890757, + "grad_norm": 11.756867034830558, + "learning_rate": 9.845338548352482e-06, + "loss": 3.2089271545410156, + "step": 246 + }, + { + "epoch": 0.5189075630252101, + "grad_norm": 13.513723971793041, + "learning_rate": 9.842307224924174e-06, + "loss": 2.443826198577881, + "step": 247 + }, + { + "epoch": 0.5210084033613446, + "grad_norm": 8.839705225157738, + "learning_rate": 9.839246958357957e-06, + "loss": 2.9329233169555664, + "step": 248 + }, + { + "epoch": 0.523109243697479, + "grad_norm": 14.107087922274081, + "learning_rate": 9.836157766945467e-06, + "loss": 2.5171399116516113, + "step": 249 + }, + { + "epoch": 0.5252100840336135, + "grad_norm": 8.285926532283062, + "learning_rate": 9.833039669151225e-06, + "loss": 3.0069408416748047, + "step": 250 + }, + { + "epoch": 0.5273109243697479, + "grad_norm": 9.58371718621674, + "learning_rate": 9.829892683612535e-06, + "loss": 2.5816359519958496, + "step": 251 + }, + { + "epoch": 0.5294117647058824, + "grad_norm": 20.00310864922347, + "learning_rate": 9.826716829139358e-06, + "loss": 2.3982670307159424, + "step": 252 + }, + { + "epoch": 0.5315126050420168, + "grad_norm": 10.648220658525108, + "learning_rate": 9.82351212471422e-06, + "loss": 2.975574016571045, + "step": 253 + }, + { + "epoch": 0.5336134453781513, + "grad_norm": 17.551242772865887, + "learning_rate": 9.820278589492076e-06, + "loss": 2.4827775955200195, + "step": 254 + }, + { + "epoch": 0.5357142857142857, + "grad_norm": 17.09184171751482, + "learning_rate": 9.817016242800215e-06, + "loss": 2.690033197402954, + "step": 255 + }, + { + "epoch": 0.5378151260504201, + "grad_norm": 14.722560106056354, + "learning_rate": 9.813725104138133e-06, + "loss": 3.346949338912964, + "step": 256 + }, + { + "epoch": 0.5399159663865546, + "grad_norm": 17.505076110573757, + "learning_rate": 9.810405193177418e-06, + "loss": 2.6791281700134277, + "step": 257 + }, + { + "epoch": 0.542016806722689, + "grad_norm": 17.808558357662132, + "learning_rate": 9.807056529761637e-06, + "loss": 2.853158950805664, + "step": 258 + }, + { + "epoch": 0.5441176470588235, + "grad_norm": 20.31515982195739, + "learning_rate": 9.80367913390621e-06, + "loss": 3.1636295318603516, + "step": 259 + }, + { + "epoch": 0.5462184873949579, + "grad_norm": 12.64467693447632, + "learning_rate": 9.800273025798302e-06, + "loss": 2.5055313110351562, + "step": 260 + }, + { + "epoch": 0.5483193277310925, + "grad_norm": 9.570949964132296, + "learning_rate": 9.796838225796688e-06, + "loss": 2.9986414909362793, + "step": 261 + }, + { + "epoch": 0.5504201680672269, + "grad_norm": 14.832124263006255, + "learning_rate": 9.793374754431642e-06, + "loss": 2.419975757598877, + "step": 262 + }, + { + "epoch": 0.5525210084033614, + "grad_norm": 22.395098332172758, + "learning_rate": 9.789882632404809e-06, + "loss": 3.0301923751831055, + "step": 263 + }, + { + "epoch": 0.5546218487394958, + "grad_norm": 8.680917615796206, + "learning_rate": 9.786361880589084e-06, + "loss": 2.846034526824951, + "step": 264 + }, + { + "epoch": 0.5567226890756303, + "grad_norm": 16.17159732015871, + "learning_rate": 9.782812520028487e-06, + "loss": 3.250943183898926, + "step": 265 + }, + { + "epoch": 0.5588235294117647, + "grad_norm": 12.800181347711561, + "learning_rate": 9.779234571938034e-06, + "loss": 2.5069515705108643, + "step": 266 + }, + { + "epoch": 0.5609243697478992, + "grad_norm": 20.58760178113823, + "learning_rate": 9.775628057703616e-06, + "loss": 2.2883377075195312, + "step": 267 + }, + { + "epoch": 0.5630252100840336, + "grad_norm": 19.3122933281468, + "learning_rate": 9.771992998881865e-06, + "loss": 1.8844149112701416, + "step": 268 + }, + { + "epoch": 0.5651260504201681, + "grad_norm": 11.766785955468544, + "learning_rate": 9.768329417200029e-06, + "loss": 2.608553409576416, + "step": 269 + }, + { + "epoch": 0.5672268907563025, + "grad_norm": 9.015634942296078, + "learning_rate": 9.76463733455584e-06, + "loss": 2.8849685192108154, + "step": 270 + }, + { + "epoch": 0.569327731092437, + "grad_norm": 10.71605416834433, + "learning_rate": 9.760916773017386e-06, + "loss": 2.83829402923584, + "step": 271 + }, + { + "epoch": 0.5714285714285714, + "grad_norm": 8.102503833940233, + "learning_rate": 9.757167754822974e-06, + "loss": 2.6053004264831543, + "step": 272 + }, + { + "epoch": 0.5735294117647058, + "grad_norm": 18.62135736056985, + "learning_rate": 9.753390302381006e-06, + "loss": 2.8338804244995117, + "step": 273 + }, + { + "epoch": 0.5756302521008403, + "grad_norm": 34.82348840659483, + "learning_rate": 9.749584438269833e-06, + "loss": 2.979978084564209, + "step": 274 + }, + { + "epoch": 0.5777310924369747, + "grad_norm": 6.726547081859168, + "learning_rate": 9.74575018523763e-06, + "loss": 1.8241777420043945, + "step": 275 + }, + { + "epoch": 0.5798319327731093, + "grad_norm": 12.206262847267514, + "learning_rate": 9.741887566202259e-06, + "loss": 3.2140274047851562, + "step": 276 + }, + { + "epoch": 0.5819327731092437, + "grad_norm": 43.432328207654045, + "learning_rate": 9.737996604251124e-06, + "loss": 3.074397325515747, + "step": 277 + }, + { + "epoch": 0.5840336134453782, + "grad_norm": 19.844157721727896, + "learning_rate": 9.73407732264104e-06, + "loss": 2.527010679244995, + "step": 278 + }, + { + "epoch": 0.5861344537815126, + "grad_norm": 10.112570131000647, + "learning_rate": 9.730129744798096e-06, + "loss": 2.6019768714904785, + "step": 279 + }, + { + "epoch": 0.5882352941176471, + "grad_norm": 216.6539557731807, + "learning_rate": 9.726153894317508e-06, + "loss": 2.848952293395996, + "step": 280 + }, + { + "epoch": 0.5903361344537815, + "grad_norm": 18.730728554973695, + "learning_rate": 9.722149794963483e-06, + "loss": 3.120556354522705, + "step": 281 + }, + { + "epoch": 0.592436974789916, + "grad_norm": 7.236837867364418, + "learning_rate": 9.718117470669072e-06, + "loss": 2.8926405906677246, + "step": 282 + }, + { + "epoch": 0.5945378151260504, + "grad_norm": 8.247663007399707, + "learning_rate": 9.714056945536039e-06, + "loss": 3.2854347229003906, + "step": 283 + }, + { + "epoch": 0.5966386554621849, + "grad_norm": 7.729125572796969, + "learning_rate": 9.709968243834698e-06, + "loss": 2.856870651245117, + "step": 284 + }, + { + "epoch": 0.5987394957983193, + "grad_norm": 20.951434970442865, + "learning_rate": 9.705851390003783e-06, + "loss": 3.3881802558898926, + "step": 285 + }, + { + "epoch": 0.6008403361344538, + "grad_norm": 8.671814837426174, + "learning_rate": 9.7017064086503e-06, + "loss": 2.6102542877197266, + "step": 286 + }, + { + "epoch": 0.6029411764705882, + "grad_norm": 8.644019718162792, + "learning_rate": 9.697533324549371e-06, + "loss": 2.7697243690490723, + "step": 287 + }, + { + "epoch": 0.6050420168067226, + "grad_norm": 12.279613000984195, + "learning_rate": 9.693332162644095e-06, + "loss": 2.568695545196533, + "step": 288 + }, + { + "epoch": 0.6071428571428571, + "grad_norm": 13.384358670021655, + "learning_rate": 9.689102948045398e-06, + "loss": 2.922543525695801, + "step": 289 + }, + { + "epoch": 0.6092436974789915, + "grad_norm": 15.250277694133263, + "learning_rate": 9.684845706031878e-06, + "loss": 3.1011314392089844, + "step": 290 + }, + { + "epoch": 0.6113445378151261, + "grad_norm": 9.840291260984259, + "learning_rate": 9.680560462049657e-06, + "loss": 2.627528429031372, + "step": 291 + }, + { + "epoch": 0.6134453781512605, + "grad_norm": 13.648735567431437, + "learning_rate": 9.676247241712228e-06, + "loss": 2.8417811393737793, + "step": 292 + }, + { + "epoch": 0.615546218487395, + "grad_norm": 8.931356705581003, + "learning_rate": 9.671906070800307e-06, + "loss": 2.3787314891815186, + "step": 293 + }, + { + "epoch": 0.6176470588235294, + "grad_norm": 7.6270227976464895, + "learning_rate": 9.667536975261667e-06, + "loss": 2.751317024230957, + "step": 294 + }, + { + "epoch": 0.6197478991596639, + "grad_norm": 7.016417787785432, + "learning_rate": 9.663139981210998e-06, + "loss": 2.6910929679870605, + "step": 295 + }, + { + "epoch": 0.6218487394957983, + "grad_norm": 11.206285204533946, + "learning_rate": 9.658715114929737e-06, + "loss": 2.801499366760254, + "step": 296 + }, + { + "epoch": 0.6239495798319328, + "grad_norm": 18.427453742915965, + "learning_rate": 9.654262402865922e-06, + "loss": 2.885946273803711, + "step": 297 + }, + { + "epoch": 0.6260504201680672, + "grad_norm": 13.114557836832477, + "learning_rate": 9.649781871634025e-06, + "loss": 3.1485133171081543, + "step": 298 + }, + { + "epoch": 0.6281512605042017, + "grad_norm": 8.349893932720915, + "learning_rate": 9.6452735480148e-06, + "loss": 3.174015998840332, + "step": 299 + }, + { + "epoch": 0.6302521008403361, + "grad_norm": 11.762326882141835, + "learning_rate": 9.64073745895512e-06, + "loss": 3.339445114135742, + "step": 300 + }, + { + "epoch": 0.6323529411764706, + "grad_norm": 7.555546243601591, + "learning_rate": 9.636173631567812e-06, + "loss": 2.9448843002319336, + "step": 301 + }, + { + "epoch": 0.634453781512605, + "grad_norm": 5.95180683932207, + "learning_rate": 9.631582093131501e-06, + "loss": 2.6363561153411865, + "step": 302 + }, + { + "epoch": 0.6365546218487395, + "grad_norm": 11.371944122058592, + "learning_rate": 9.62696287109045e-06, + "loss": 2.4621901512145996, + "step": 303 + }, + { + "epoch": 0.6386554621848739, + "grad_norm": 11.742524524874973, + "learning_rate": 9.622315993054384e-06, + "loss": 2.8623251914978027, + "step": 304 + }, + { + "epoch": 0.6407563025210085, + "grad_norm": 12.39315277601619, + "learning_rate": 9.61764148679833e-06, + "loss": 2.191575765609741, + "step": 305 + }, + { + "epoch": 0.6428571428571429, + "grad_norm": 6.720496031064891, + "learning_rate": 9.61293938026246e-06, + "loss": 2.018388271331787, + "step": 306 + }, + { + "epoch": 0.6449579831932774, + "grad_norm": 9.624398589362118, + "learning_rate": 9.608209701551913e-06, + "loss": 2.756854772567749, + "step": 307 + }, + { + "epoch": 0.6470588235294118, + "grad_norm": 21.622075822614562, + "learning_rate": 9.60345247893663e-06, + "loss": 2.6668529510498047, + "step": 308 + }, + { + "epoch": 0.6491596638655462, + "grad_norm": 14.926878160653533, + "learning_rate": 9.598667740851187e-06, + "loss": 2.6617343425750732, + "step": 309 + }, + { + "epoch": 0.6512605042016807, + "grad_norm": 9.499741494871419, + "learning_rate": 9.59385551589462e-06, + "loss": 3.1460976600646973, + "step": 310 + }, + { + "epoch": 0.6533613445378151, + "grad_norm": 17.910724072364676, + "learning_rate": 9.589015832830267e-06, + "loss": 2.7566354274749756, + "step": 311 + }, + { + "epoch": 0.6554621848739496, + "grad_norm": 15.059990921253526, + "learning_rate": 9.584148720585575e-06, + "loss": 3.3112881183624268, + "step": 312 + }, + { + "epoch": 0.657563025210084, + "grad_norm": 12.27519040871759, + "learning_rate": 9.57925420825195e-06, + "loss": 2.8563618659973145, + "step": 313 + }, + { + "epoch": 0.6596638655462185, + "grad_norm": 14.53433732237354, + "learning_rate": 9.574332325084564e-06, + "loss": 3.5544567108154297, + "step": 314 + }, + { + "epoch": 0.6617647058823529, + "grad_norm": 9.662661721128384, + "learning_rate": 9.569383100502193e-06, + "loss": 2.924015998840332, + "step": 315 + }, + { + "epoch": 0.6638655462184874, + "grad_norm": 11.360356839234715, + "learning_rate": 9.564406564087032e-06, + "loss": 2.7250008583068848, + "step": 316 + }, + { + "epoch": 0.6659663865546218, + "grad_norm": 6.265433825569306, + "learning_rate": 9.559402745584527e-06, + "loss": 2.9229238033294678, + "step": 317 + }, + { + "epoch": 0.6680672268907563, + "grad_norm": 10.23047238705242, + "learning_rate": 9.554371674903191e-06, + "loss": 3.4867515563964844, + "step": 318 + }, + { + "epoch": 0.6701680672268907, + "grad_norm": 13.446172115002414, + "learning_rate": 9.549313382114427e-06, + "loss": 2.4049417972564697, + "step": 319 + }, + { + "epoch": 0.6722689075630253, + "grad_norm": 14.135159230227343, + "learning_rate": 9.54422789745235e-06, + "loss": 3.1008338928222656, + "step": 320 + }, + { + "epoch": 0.6743697478991597, + "grad_norm": 9.140604791680513, + "learning_rate": 9.5391152513136e-06, + "loss": 2.6114342212677, + "step": 321 + }, + { + "epoch": 0.6764705882352942, + "grad_norm": 9.779919855511938, + "learning_rate": 9.533975474257171e-06, + "loss": 2.7165164947509766, + "step": 322 + }, + { + "epoch": 0.6785714285714286, + "grad_norm": 9.275622947642706, + "learning_rate": 9.528808597004216e-06, + "loss": 2.8122520446777344, + "step": 323 + }, + { + "epoch": 0.680672268907563, + "grad_norm": 14.779154717919877, + "learning_rate": 9.523614650437876e-06, + "loss": 2.862661838531494, + "step": 324 + }, + { + "epoch": 0.6827731092436975, + "grad_norm": 12.377273208842894, + "learning_rate": 9.518393665603084e-06, + "loss": 2.9812843799591064, + "step": 325 + }, + { + "epoch": 0.6848739495798319, + "grad_norm": 11.010658732376989, + "learning_rate": 9.513145673706383e-06, + "loss": 2.9455337524414062, + "step": 326 + }, + { + "epoch": 0.6869747899159664, + "grad_norm": 14.806340169845868, + "learning_rate": 9.507870706115749e-06, + "loss": 3.1577422618865967, + "step": 327 + }, + { + "epoch": 0.6890756302521008, + "grad_norm": 13.616368197529665, + "learning_rate": 9.50256879436039e-06, + "loss": 2.545835018157959, + "step": 328 + }, + { + "epoch": 0.6911764705882353, + "grad_norm": 8.987871015734585, + "learning_rate": 9.497239970130561e-06, + "loss": 2.559062957763672, + "step": 329 + }, + { + "epoch": 0.6932773109243697, + "grad_norm": 8.587992072590101, + "learning_rate": 9.491884265277383e-06, + "loss": 2.932499647140503, + "step": 330 + }, + { + "epoch": 0.6953781512605042, + "grad_norm": 7.463276523398998, + "learning_rate": 9.486501711812637e-06, + "loss": 2.967616558074951, + "step": 331 + }, + { + "epoch": 0.6974789915966386, + "grad_norm": 14.475511521289118, + "learning_rate": 9.481092341908591e-06, + "loss": 2.4604697227478027, + "step": 332 + }, + { + "epoch": 0.6995798319327731, + "grad_norm": 9.02600045542574, + "learning_rate": 9.475656187897794e-06, + "loss": 3.146969795227051, + "step": 333 + }, + { + "epoch": 0.7016806722689075, + "grad_norm": 7.639638057540197, + "learning_rate": 9.470193282272886e-06, + "loss": 3.337083339691162, + "step": 334 + }, + { + "epoch": 0.7037815126050421, + "grad_norm": 16.397307515268395, + "learning_rate": 9.464703657686412e-06, + "loss": 2.7829766273498535, + "step": 335 + }, + { + "epoch": 0.7058823529411765, + "grad_norm": 11.048022152868258, + "learning_rate": 9.45918734695061e-06, + "loss": 3.095449447631836, + "step": 336 + }, + { + "epoch": 0.707983193277311, + "grad_norm": 10.20138527201031, + "learning_rate": 9.453644383037232e-06, + "loss": 2.6790573596954346, + "step": 337 + }, + { + "epoch": 0.7100840336134454, + "grad_norm": 9.93895349514755, + "learning_rate": 9.448074799077337e-06, + "loss": 2.9844274520874023, + "step": 338 + }, + { + "epoch": 0.7121848739495799, + "grad_norm": 171.53953866617377, + "learning_rate": 9.442478628361098e-06, + "loss": 2.256910562515259, + "step": 339 + }, + { + "epoch": 0.7142857142857143, + "grad_norm": 12.351676724137773, + "learning_rate": 9.436855904337596e-06, + "loss": 2.9464545249938965, + "step": 340 + }, + { + "epoch": 0.7163865546218487, + "grad_norm": 19.404123629754835, + "learning_rate": 9.43120666061463e-06, + "loss": 2.23644757270813, + "step": 341 + }, + { + "epoch": 0.7184873949579832, + "grad_norm": 11.246236929808724, + "learning_rate": 9.425530930958507e-06, + "loss": 2.85072660446167, + "step": 342 + }, + { + "epoch": 0.7205882352941176, + "grad_norm": 17.642986778414265, + "learning_rate": 9.419828749293845e-06, + "loss": 3.09238862991333, + "step": 343 + }, + { + "epoch": 0.7226890756302521, + "grad_norm": 8.1418179714146, + "learning_rate": 9.414100149703373e-06, + "loss": 2.7548587322235107, + "step": 344 + }, + { + "epoch": 0.7247899159663865, + "grad_norm": 11.258932741699391, + "learning_rate": 9.40834516642772e-06, + "loss": 2.487452507019043, + "step": 345 + }, + { + "epoch": 0.726890756302521, + "grad_norm": 10.082639156310133, + "learning_rate": 9.402563833865213e-06, + "loss": 3.077296257019043, + "step": 346 + }, + { + "epoch": 0.7289915966386554, + "grad_norm": 11.506257708160296, + "learning_rate": 9.396756186571672e-06, + "loss": 2.6188814640045166, + "step": 347 + }, + { + "epoch": 0.7310924369747899, + "grad_norm": 11.743812268831451, + "learning_rate": 9.39092225926021e-06, + "loss": 3.150355815887451, + "step": 348 + }, + { + "epoch": 0.7331932773109243, + "grad_norm": 10.613109994526992, + "learning_rate": 9.385062086801013e-06, + "loss": 2.6666879653930664, + "step": 349 + }, + { + "epoch": 0.7352941176470589, + "grad_norm": 11.1137083326389, + "learning_rate": 9.379175704221139e-06, + "loss": 2.885680675506592, + "step": 350 + }, + { + "epoch": 0.7373949579831933, + "grad_norm": 10.845634322034954, + "learning_rate": 9.37326314670431e-06, + "loss": 2.948115110397339, + "step": 351 + }, + { + "epoch": 0.7394957983193278, + "grad_norm": 20.12834911912162, + "learning_rate": 9.367324449590694e-06, + "loss": 2.743468761444092, + "step": 352 + }, + { + "epoch": 0.7415966386554622, + "grad_norm": 10.20324180750042, + "learning_rate": 9.361359648376707e-06, + "loss": 3.0895063877105713, + "step": 353 + }, + { + "epoch": 0.7436974789915967, + "grad_norm": 16.159497011872574, + "learning_rate": 9.355368778714784e-06, + "loss": 2.808818817138672, + "step": 354 + }, + { + "epoch": 0.7457983193277311, + "grad_norm": 14.111122417184372, + "learning_rate": 9.349351876413181e-06, + "loss": 2.889227867126465, + "step": 355 + }, + { + "epoch": 0.7478991596638656, + "grad_norm": 10.685634708452614, + "learning_rate": 9.343308977435754e-06, + "loss": 3.021900177001953, + "step": 356 + }, + { + "epoch": 0.75, + "grad_norm": 29.116347517828004, + "learning_rate": 9.337240117901742e-06, + "loss": 2.4112629890441895, + "step": 357 + }, + { + "epoch": 0.7521008403361344, + "grad_norm": 8.824096565810732, + "learning_rate": 9.331145334085554e-06, + "loss": 2.898515224456787, + "step": 358 + }, + { + "epoch": 0.7542016806722689, + "grad_norm": 21.430509149211513, + "learning_rate": 9.325024662416553e-06, + "loss": 2.683413028717041, + "step": 359 + }, + { + "epoch": 0.7563025210084033, + "grad_norm": 10.321295794427858, + "learning_rate": 9.318878139478842e-06, + "loss": 2.890808582305908, + "step": 360 + }, + { + "epoch": 0.7584033613445378, + "grad_norm": 20.795050786572304, + "learning_rate": 9.312705802011029e-06, + "loss": 2.9919955730438232, + "step": 361 + }, + { + "epoch": 0.7605042016806722, + "grad_norm": 9.83932446467153, + "learning_rate": 9.306507686906033e-06, + "loss": 2.7725915908813477, + "step": 362 + }, + { + "epoch": 0.7626050420168067, + "grad_norm": 9.916160263978837, + "learning_rate": 9.300283831210838e-06, + "loss": 2.9397757053375244, + "step": 363 + }, + { + "epoch": 0.7647058823529411, + "grad_norm": 9.312450032530169, + "learning_rate": 9.294034272126286e-06, + "loss": 2.770698070526123, + "step": 364 + }, + { + "epoch": 0.7668067226890757, + "grad_norm": 13.885653883484695, + "learning_rate": 9.28775904700686e-06, + "loss": 2.5156445503234863, + "step": 365 + }, + { + "epoch": 0.7689075630252101, + "grad_norm": 13.084004538001976, + "learning_rate": 9.281458193360442e-06, + "loss": 2.597851276397705, + "step": 366 + }, + { + "epoch": 0.7710084033613446, + "grad_norm": 17.679727525867335, + "learning_rate": 9.2751317488481e-06, + "loss": 2.4659290313720703, + "step": 367 + }, + { + "epoch": 0.773109243697479, + "grad_norm": 9.199345804679885, + "learning_rate": 9.26877975128387e-06, + "loss": 3.0518131256103516, + "step": 368 + }, + { + "epoch": 0.7752100840336135, + "grad_norm": 15.824344742656248, + "learning_rate": 9.262402238634514e-06, + "loss": 2.0272233486175537, + "step": 369 + }, + { + "epoch": 0.7773109243697479, + "grad_norm": 9.874132429438818, + "learning_rate": 9.255999249019307e-06, + "loss": 2.282167911529541, + "step": 370 + }, + { + "epoch": 0.7794117647058824, + "grad_norm": 8.044430179764902, + "learning_rate": 9.2495708207098e-06, + "loss": 2.447831869125366, + "step": 371 + }, + { + "epoch": 0.7815126050420168, + "grad_norm": 15.289268393319317, + "learning_rate": 9.243116992129593e-06, + "loss": 2.5548458099365234, + "step": 372 + }, + { + "epoch": 0.7836134453781513, + "grad_norm": 18.576142639391133, + "learning_rate": 9.23663780185411e-06, + "loss": 2.2244365215301514, + "step": 373 + }, + { + "epoch": 0.7857142857142857, + "grad_norm": 8.55234069521718, + "learning_rate": 9.230133288610366e-06, + "loss": 3.044992208480835, + "step": 374 + }, + { + "epoch": 0.7878151260504201, + "grad_norm": 11.142079035862414, + "learning_rate": 9.223603491276733e-06, + "loss": 2.545569896697998, + "step": 375 + }, + { + "epoch": 0.7899159663865546, + "grad_norm": 14.123674718701432, + "learning_rate": 9.217048448882711e-06, + "loss": 3.337583541870117, + "step": 376 + }, + { + "epoch": 0.792016806722689, + "grad_norm": 16.146080651689587, + "learning_rate": 9.210468200608691e-06, + "loss": 3.1922380924224854, + "step": 377 + }, + { + "epoch": 0.7941176470588235, + "grad_norm": 12.28600079308305, + "learning_rate": 9.203862785785724e-06, + "loss": 2.5922632217407227, + "step": 378 + }, + { + "epoch": 0.7962184873949579, + "grad_norm": 18.04398024676097, + "learning_rate": 9.197232243895285e-06, + "loss": 2.876894474029541, + "step": 379 + }, + { + "epoch": 0.7983193277310925, + "grad_norm": 13.494043036714963, + "learning_rate": 9.190576614569035e-06, + "loss": 2.7677531242370605, + "step": 380 + }, + { + "epoch": 0.8004201680672269, + "grad_norm": 23.463052019031387, + "learning_rate": 9.183895937588594e-06, + "loss": 1.9870229959487915, + "step": 381 + }, + { + "epoch": 0.8025210084033614, + "grad_norm": 7.7476580634838665, + "learning_rate": 9.177190252885285e-06, + "loss": 2.784242868423462, + "step": 382 + }, + { + "epoch": 0.8046218487394958, + "grad_norm": 6.086395137680743, + "learning_rate": 9.17045960053991e-06, + "loss": 2.878697395324707, + "step": 383 + }, + { + "epoch": 0.8067226890756303, + "grad_norm": 16.59316957110638, + "learning_rate": 9.163704020782507e-06, + "loss": 2.7685139179229736, + "step": 384 + }, + { + "epoch": 0.8088235294117647, + "grad_norm": 15.470438153645851, + "learning_rate": 9.156923553992107e-06, + "loss": 2.8312299251556396, + "step": 385 + }, + { + "epoch": 0.8109243697478992, + "grad_norm": 8.00902098985157, + "learning_rate": 9.150118240696497e-06, + "loss": 1.7165706157684326, + "step": 386 + }, + { + "epoch": 0.8130252100840336, + "grad_norm": 14.0610194690077, + "learning_rate": 9.14328812157197e-06, + "loss": 3.451162815093994, + "step": 387 + }, + { + "epoch": 0.8151260504201681, + "grad_norm": 10.174053809556211, + "learning_rate": 9.136433237443093e-06, + "loss": 3.455259084701538, + "step": 388 + }, + { + "epoch": 0.8172268907563025, + "grad_norm": 14.076181600112081, + "learning_rate": 9.129553629282448e-06, + "loss": 3.3125205039978027, + "step": 389 + }, + { + "epoch": 0.819327731092437, + "grad_norm": 11.760967038966463, + "learning_rate": 9.122649338210407e-06, + "loss": 3.175715923309326, + "step": 390 + }, + { + "epoch": 0.8214285714285714, + "grad_norm": 12.215337173611072, + "learning_rate": 9.115720405494868e-06, + "loss": 3.426882743835449, + "step": 391 + }, + { + "epoch": 0.8235294117647058, + "grad_norm": 16.884819154921146, + "learning_rate": 9.108766872551016e-06, + "loss": 2.693225860595703, + "step": 392 + }, + { + "epoch": 0.8256302521008403, + "grad_norm": 11.991779005638564, + "learning_rate": 9.101788780941076e-06, + "loss": 2.8251726627349854, + "step": 393 + }, + { + "epoch": 0.8277310924369747, + "grad_norm": 8.901523397999386, + "learning_rate": 9.094786172374066e-06, + "loss": 2.845076560974121, + "step": 394 + }, + { + "epoch": 0.8298319327731093, + "grad_norm": 15.559813600064993, + "learning_rate": 9.087759088705541e-06, + "loss": 2.9212491512298584, + "step": 395 + }, + { + "epoch": 0.8319327731092437, + "grad_norm": 12.334218057409931, + "learning_rate": 9.08070757193735e-06, + "loss": 2.752890110015869, + "step": 396 + }, + { + "epoch": 0.8340336134453782, + "grad_norm": 20.040022595533, + "learning_rate": 9.07363166421738e-06, + "loss": 3.1292171478271484, + "step": 397 + }, + { + "epoch": 0.8361344537815126, + "grad_norm": 9.339997691276547, + "learning_rate": 9.066531407839307e-06, + "loss": 2.2926840782165527, + "step": 398 + }, + { + "epoch": 0.8382352941176471, + "grad_norm": 9.210411213235453, + "learning_rate": 9.059406845242343e-06, + "loss": 2.7644119262695312, + "step": 399 + }, + { + "epoch": 0.8403361344537815, + "grad_norm": 13.484928949211756, + "learning_rate": 9.05225801901098e-06, + "loss": 2.9096150398254395, + "step": 400 + }, + { + "epoch": 0.842436974789916, + "grad_norm": 21.901892899759964, + "learning_rate": 9.045084971874738e-06, + "loss": 4.536911964416504, + "step": 401 + }, + { + "epoch": 0.8445378151260504, + "grad_norm": 8.027798710835631, + "learning_rate": 9.03788774670791e-06, + "loss": 3.3775062561035156, + "step": 402 + }, + { + "epoch": 0.8466386554621849, + "grad_norm": 11.22841391004864, + "learning_rate": 9.030666386529303e-06, + "loss": 2.755703926086426, + "step": 403 + }, + { + "epoch": 0.8487394957983193, + "grad_norm": 9.698938581529527, + "learning_rate": 9.023420934501981e-06, + "loss": 2.812281608581543, + "step": 404 + }, + { + "epoch": 0.8508403361344538, + "grad_norm": 9.495702557416454, + "learning_rate": 9.01615143393301e-06, + "loss": 2.9015493392944336, + "step": 405 + }, + { + "epoch": 0.8529411764705882, + "grad_norm": 8.59480884978166, + "learning_rate": 9.008857928273199e-06, + "loss": 2.8743391036987305, + "step": 406 + }, + { + "epoch": 0.8550420168067226, + "grad_norm": 14.060855102265236, + "learning_rate": 9.001540461116835e-06, + "loss": 2.7400550842285156, + "step": 407 + }, + { + "epoch": 0.8571428571428571, + "grad_norm": 9.670354596798553, + "learning_rate": 8.994199076201428e-06, + "loss": 3.788983106613159, + "step": 408 + }, + { + "epoch": 0.8592436974789915, + "grad_norm": 10.094582977623446, + "learning_rate": 8.98683381740745e-06, + "loss": 2.426604747772217, + "step": 409 + }, + { + "epoch": 0.8613445378151261, + "grad_norm": 6.42119276092813, + "learning_rate": 8.979444728758067e-06, + "loss": 2.467769145965576, + "step": 410 + }, + { + "epoch": 0.8634453781512605, + "grad_norm": 101.25120998420752, + "learning_rate": 8.97203185441888e-06, + "loss": 2.878884792327881, + "step": 411 + }, + { + "epoch": 0.865546218487395, + "grad_norm": 10.063927366400284, + "learning_rate": 8.964595238697659e-06, + "loss": 3.323913812637329, + "step": 412 + }, + { + "epoch": 0.8676470588235294, + "grad_norm": 8.176196947638319, + "learning_rate": 8.957134926044088e-06, + "loss": 2.2674732208251953, + "step": 413 + }, + { + "epoch": 0.8697478991596639, + "grad_norm": 7.688045397272728, + "learning_rate": 8.949650961049479e-06, + "loss": 2.6359667778015137, + "step": 414 + }, + { + "epoch": 0.8718487394957983, + "grad_norm": 12.061723837223782, + "learning_rate": 8.942143388446522e-06, + "loss": 4.3965678215026855, + "step": 415 + }, + { + "epoch": 0.8739495798319328, + "grad_norm": 13.801014710596668, + "learning_rate": 8.934612253109017e-06, + "loss": 3.584599733352661, + "step": 416 + }, + { + "epoch": 0.8760504201680672, + "grad_norm": 11.465324791085347, + "learning_rate": 8.927057600051594e-06, + "loss": 2.9781904220581055, + "step": 417 + }, + { + "epoch": 0.8781512605042017, + "grad_norm": 32.19803137859573, + "learning_rate": 8.919479474429462e-06, + "loss": 3.3312220573425293, + "step": 418 + }, + { + "epoch": 0.8802521008403361, + "grad_norm": 23.418640662777587, + "learning_rate": 8.911877921538117e-06, + "loss": 3.8054161071777344, + "step": 419 + }, + { + "epoch": 0.8823529411764706, + "grad_norm": 7.760210305795623, + "learning_rate": 8.904252986813091e-06, + "loss": 2.8041489124298096, + "step": 420 + }, + { + "epoch": 0.884453781512605, + "grad_norm": 13.790720201964906, + "learning_rate": 8.896604715829671e-06, + "loss": 2.8391265869140625, + "step": 421 + }, + { + "epoch": 0.8865546218487395, + "grad_norm": 8.558877313925247, + "learning_rate": 8.888933154302626e-06, + "loss": 2.6835553646087646, + "step": 422 + }, + { + "epoch": 0.8886554621848739, + "grad_norm": 21.689551042379083, + "learning_rate": 8.881238348085936e-06, + "loss": 2.6738481521606445, + "step": 423 + }, + { + "epoch": 0.8907563025210085, + "grad_norm": 7.686758427886692, + "learning_rate": 8.87352034317252e-06, + "loss": 2.619101047515869, + "step": 424 + }, + { + "epoch": 0.8928571428571429, + "grad_norm": 20.40695143594997, + "learning_rate": 8.865779185693957e-06, + "loss": 3.3444905281066895, + "step": 425 + }, + { + "epoch": 0.8949579831932774, + "grad_norm": 27.431337065110313, + "learning_rate": 8.858014921920215e-06, + "loss": 2.1527421474456787, + "step": 426 + }, + { + "epoch": 0.8970588235294118, + "grad_norm": 20.606507987678672, + "learning_rate": 8.850227598259365e-06, + "loss": 2.6689836978912354, + "step": 427 + }, + { + "epoch": 0.8991596638655462, + "grad_norm": 8.968995022440353, + "learning_rate": 8.842417261257316e-06, + "loss": 3.0119547843933105, + "step": 428 + }, + { + "epoch": 0.9012605042016807, + "grad_norm": 28.528232969469133, + "learning_rate": 8.83458395759753e-06, + "loss": 2.482861042022705, + "step": 429 + }, + { + "epoch": 0.9033613445378151, + "grad_norm": 10.074031458183692, + "learning_rate": 8.826727734100742e-06, + "loss": 2.8982067108154297, + "step": 430 + }, + { + "epoch": 0.9054621848739496, + "grad_norm": 8.399253353390154, + "learning_rate": 8.818848637724681e-06, + "loss": 2.5004382133483887, + "step": 431 + }, + { + "epoch": 0.907563025210084, + "grad_norm": 8.747805949968082, + "learning_rate": 8.810946715563798e-06, + "loss": 2.612011194229126, + "step": 432 + }, + { + "epoch": 0.9096638655462185, + "grad_norm": 10.425702565789909, + "learning_rate": 8.803022014848966e-06, + "loss": 2.9700820446014404, + "step": 433 + }, + { + "epoch": 0.9117647058823529, + "grad_norm": 11.029401754074971, + "learning_rate": 8.795074582947214e-06, + "loss": 3.248368263244629, + "step": 434 + }, + { + "epoch": 0.9138655462184874, + "grad_norm": 9.336382488449228, + "learning_rate": 8.787104467361442e-06, + "loss": 2.993704319000244, + "step": 435 + }, + { + "epoch": 0.9159663865546218, + "grad_norm": 13.327453834983904, + "learning_rate": 8.779111715730127e-06, + "loss": 2.6930155754089355, + "step": 436 + }, + { + "epoch": 0.9180672268907563, + "grad_norm": 10.570908488031245, + "learning_rate": 8.771096375827047e-06, + "loss": 3.069434404373169, + "step": 437 + }, + { + "epoch": 0.9201680672268907, + "grad_norm": 19.381962817436207, + "learning_rate": 8.763058495560994e-06, + "loss": 3.1358611583709717, + "step": 438 + }, + { + "epoch": 0.9222689075630253, + "grad_norm": 18.418237048785702, + "learning_rate": 8.754998122975489e-06, + "loss": 3.2987184524536133, + "step": 439 + }, + { + "epoch": 0.9243697478991597, + "grad_norm": 8.737803987239646, + "learning_rate": 8.746915306248488e-06, + "loss": 2.9279255867004395, + "step": 440 + }, + { + "epoch": 0.9264705882352942, + "grad_norm": 13.117095498271222, + "learning_rate": 8.7388100936921e-06, + "loss": 2.795942783355713, + "step": 441 + }, + { + "epoch": 0.9285714285714286, + "grad_norm": 25.973728201733575, + "learning_rate": 8.730682533752301e-06, + "loss": 2.7590699195861816, + "step": 442 + }, + { + "epoch": 0.930672268907563, + "grad_norm": 9.543199289400748, + "learning_rate": 8.722532675008635e-06, + "loss": 2.6571459770202637, + "step": 443 + }, + { + "epoch": 0.9327731092436975, + "grad_norm": 10.69198569405724, + "learning_rate": 8.714360566173932e-06, + "loss": 2.7342920303344727, + "step": 444 + }, + { + "epoch": 0.9348739495798319, + "grad_norm": 13.298135717649288, + "learning_rate": 8.706166256094013e-06, + "loss": 2.9492366313934326, + "step": 445 + }, + { + "epoch": 0.9369747899159664, + "grad_norm": 18.5856782117513, + "learning_rate": 8.6979497937474e-06, + "loss": 2.937699317932129, + "step": 446 + }, + { + "epoch": 0.9390756302521008, + "grad_norm": 10.292297569389804, + "learning_rate": 8.689711228245021e-06, + "loss": 3.23824405670166, + "step": 447 + }, + { + "epoch": 0.9411764705882353, + "grad_norm": 19.90454431534383, + "learning_rate": 8.681450608829916e-06, + "loss": 2.542668581008911, + "step": 448 + }, + { + "epoch": 0.9432773109243697, + "grad_norm": 14.413143934794212, + "learning_rate": 8.67316798487695e-06, + "loss": 3.257632255554199, + "step": 449 + }, + { + "epoch": 0.9453781512605042, + "grad_norm": 10.80231465762936, + "learning_rate": 8.664863405892506e-06, + "loss": 2.7072958946228027, + "step": 450 + }, + { + "epoch": 0.9474789915966386, + "grad_norm": 18.020582485094227, + "learning_rate": 8.656536921514195e-06, + "loss": 2.532301664352417, + "step": 451 + }, + { + "epoch": 0.9495798319327731, + "grad_norm": 12.503896279810512, + "learning_rate": 8.648188581510567e-06, + "loss": 2.726604461669922, + "step": 452 + }, + { + "epoch": 0.9516806722689075, + "grad_norm": 18.785189447389097, + "learning_rate": 8.639818435780797e-06, + "loss": 2.516594886779785, + "step": 453 + }, + { + "epoch": 0.9537815126050421, + "grad_norm": 12.0120687102085, + "learning_rate": 8.631426534354404e-06, + "loss": 2.7706644535064697, + "step": 454 + }, + { + "epoch": 0.9558823529411765, + "grad_norm": 11.506720081337315, + "learning_rate": 8.623012927390936e-06, + "loss": 3.2427144050598145, + "step": 455 + }, + { + "epoch": 0.957983193277311, + "grad_norm": 10.11083550503784, + "learning_rate": 8.614577665179684e-06, + "loss": 3.1202523708343506, + "step": 456 + }, + { + "epoch": 0.9600840336134454, + "grad_norm": 15.945109216294865, + "learning_rate": 8.606120798139375e-06, + "loss": 2.6210598945617676, + "step": 457 + }, + { + "epoch": 0.9621848739495799, + "grad_norm": 9.09618149788864, + "learning_rate": 8.597642376817865e-06, + "loss": 2.669271469116211, + "step": 458 + }, + { + "epoch": 0.9642857142857143, + "grad_norm": 8.714640631605363, + "learning_rate": 8.589142451891849e-06, + "loss": 2.6489734649658203, + "step": 459 + }, + { + "epoch": 0.9663865546218487, + "grad_norm": 7.855597298788909, + "learning_rate": 8.580621074166553e-06, + "loss": 3.10178804397583, + "step": 460 + }, + { + "epoch": 0.9684873949579832, + "grad_norm": 10.502691052340555, + "learning_rate": 8.572078294575423e-06, + "loss": 2.589158296585083, + "step": 461 + }, + { + "epoch": 0.9705882352941176, + "grad_norm": 10.459968052493494, + "learning_rate": 8.56351416417983e-06, + "loss": 2.5543792247772217, + "step": 462 + }, + { + "epoch": 0.9726890756302521, + "grad_norm": 12.885512846289808, + "learning_rate": 8.554928734168767e-06, + "loss": 2.65985369682312, + "step": 463 + }, + { + "epoch": 0.9747899159663865, + "grad_norm": 9.639047199230617, + "learning_rate": 8.546322055858526e-06, + "loss": 3.0177440643310547, + "step": 464 + }, + { + "epoch": 0.976890756302521, + "grad_norm": 9.494268049756599, + "learning_rate": 8.537694180692416e-06, + "loss": 2.2767248153686523, + "step": 465 + }, + { + "epoch": 0.9789915966386554, + "grad_norm": 12.56887928459161, + "learning_rate": 8.529045160240433e-06, + "loss": 2.7835707664489746, + "step": 466 + }, + { + "epoch": 0.9810924369747899, + "grad_norm": 10.580355179128095, + "learning_rate": 8.520375046198965e-06, + "loss": 2.4373722076416016, + "step": 467 + }, + { + "epoch": 0.9831932773109243, + "grad_norm": 10.13582135951574, + "learning_rate": 8.51168389039048e-06, + "loss": 2.464303731918335, + "step": 468 + }, + { + "epoch": 0.9852941176470589, + "grad_norm": 12.209700818401375, + "learning_rate": 8.502971744763216e-06, + "loss": 2.2609100341796875, + "step": 469 + }, + { + "epoch": 0.9873949579831933, + "grad_norm": 21.359445929891656, + "learning_rate": 8.494238661390865e-06, + "loss": 3.0135858058929443, + "step": 470 + }, + { + "epoch": 0.9894957983193278, + "grad_norm": 15.087072293517004, + "learning_rate": 8.485484692472272e-06, + "loss": 2.770965099334717, + "step": 471 + }, + { + "epoch": 0.9915966386554622, + "grad_norm": 8.181199645745421, + "learning_rate": 8.476709890331116e-06, + "loss": 2.6243722438812256, + "step": 472 + }, + { + "epoch": 0.9936974789915967, + "grad_norm": 7.527423998031555, + "learning_rate": 8.467914307415601e-06, + "loss": 2.9319207668304443, + "step": 473 + }, + { + "epoch": 0.9957983193277311, + "grad_norm": 9.424234237676545, + "learning_rate": 8.459097996298137e-06, + "loss": 3.0626072883605957, + "step": 474 + }, + { + "epoch": 0.9978991596638656, + "grad_norm": 14.444274317338678, + "learning_rate": 8.45026100967503e-06, + "loss": 3.000889778137207, + "step": 475 + }, + { + "epoch": 1.0, + "grad_norm": 8.45019782867115, + "learning_rate": 8.441403400366169e-06, + "loss": 3.112825393676758, + "step": 476 + }, + { + "epoch": 1.0021008403361344, + "grad_norm": 19.596775314152666, + "learning_rate": 8.432525221314708e-06, + "loss": 1.4137624502182007, + "step": 477 + }, + { + "epoch": 1.004201680672269, + "grad_norm": 9.233023882113994, + "learning_rate": 8.423626525586744e-06, + "loss": 1.6808059215545654, + "step": 478 + }, + { + "epoch": 1.0063025210084033, + "grad_norm": 9.789186389046735, + "learning_rate": 8.414707366371006e-06, + "loss": 1.8797330856323242, + "step": 479 + }, + { + "epoch": 1.0084033613445378, + "grad_norm": 7.894274079237724, + "learning_rate": 8.405767796978546e-06, + "loss": 1.9548699855804443, + "step": 480 + }, + { + "epoch": 1.0105042016806722, + "grad_norm": 11.882995555931503, + "learning_rate": 8.396807870842396e-06, + "loss": 1.5713114738464355, + "step": 481 + }, + { + "epoch": 1.0126050420168067, + "grad_norm": 14.948396348319923, + "learning_rate": 8.387827641517274e-06, + "loss": 1.69504976272583, + "step": 482 + }, + { + "epoch": 1.0147058823529411, + "grad_norm": 6.935744624929541, + "learning_rate": 8.378827162679248e-06, + "loss": 1.3813257217407227, + "step": 483 + }, + { + "epoch": 1.0168067226890756, + "grad_norm": 9.50729885231966, + "learning_rate": 8.369806488125418e-06, + "loss": 2.4568567276000977, + "step": 484 + }, + { + "epoch": 1.01890756302521, + "grad_norm": 11.62592077082348, + "learning_rate": 8.360765671773603e-06, + "loss": 2.602184534072876, + "step": 485 + }, + { + "epoch": 1.0210084033613445, + "grad_norm": 15.469624436922395, + "learning_rate": 8.351704767662005e-06, + "loss": 1.8193070888519287, + "step": 486 + }, + { + "epoch": 1.023109243697479, + "grad_norm": 12.389371131721145, + "learning_rate": 8.3426238299489e-06, + "loss": 1.4549766778945923, + "step": 487 + }, + { + "epoch": 1.0252100840336134, + "grad_norm": 7.898711913261212, + "learning_rate": 8.333522912912308e-06, + "loss": 1.4681106805801392, + "step": 488 + }, + { + "epoch": 1.0273109243697478, + "grad_norm": 14.553557605821632, + "learning_rate": 8.324402070949658e-06, + "loss": 1.4224164485931396, + "step": 489 + }, + { + "epoch": 1.0294117647058822, + "grad_norm": 21.0322684953627, + "learning_rate": 8.315261358577485e-06, + "loss": 2.200676441192627, + "step": 490 + }, + { + "epoch": 1.0315126050420167, + "grad_norm": 14.230965851092702, + "learning_rate": 8.306100830431085e-06, + "loss": 1.867397665977478, + "step": 491 + }, + { + "epoch": 1.0336134453781514, + "grad_norm": 11.330315084805383, + "learning_rate": 8.296920541264197e-06, + "loss": 1.4270985126495361, + "step": 492 + }, + { + "epoch": 1.0357142857142858, + "grad_norm": 11.452248734086307, + "learning_rate": 8.287720545948676e-06, + "loss": 1.464069128036499, + "step": 493 + }, + { + "epoch": 1.0378151260504203, + "grad_norm": 18.476525141242952, + "learning_rate": 8.278500899474162e-06, + "loss": 1.192551612854004, + "step": 494 + }, + { + "epoch": 1.0399159663865547, + "grad_norm": 13.695173322132312, + "learning_rate": 8.269261656947755e-06, + "loss": 2.367762327194214, + "step": 495 + }, + { + "epoch": 1.0420168067226891, + "grad_norm": 12.101022572223535, + "learning_rate": 8.260002873593679e-06, + "loss": 1.6752372980117798, + "step": 496 + }, + { + "epoch": 1.0441176470588236, + "grad_norm": 14.763270168918805, + "learning_rate": 8.25072460475296e-06, + "loss": 1.409712314605713, + "step": 497 + }, + { + "epoch": 1.046218487394958, + "grad_norm": 12.622229054224464, + "learning_rate": 8.24142690588309e-06, + "loss": 1.6270588636398315, + "step": 498 + }, + { + "epoch": 1.0483193277310925, + "grad_norm": 7.889964988601032, + "learning_rate": 8.232109832557696e-06, + "loss": 1.4294947385787964, + "step": 499 + }, + { + "epoch": 1.050420168067227, + "grad_norm": 9.640341277497848, + "learning_rate": 8.222773440466213e-06, + "loss": 1.2340010404586792, + "step": 500 + }, + { + "epoch": 1.0525210084033614, + "grad_norm": 9.361065825268032, + "learning_rate": 8.213417785413538e-06, + "loss": 1.451041340827942, + "step": 501 + }, + { + "epoch": 1.0546218487394958, + "grad_norm": 10.851800895184763, + "learning_rate": 8.204042923319717e-06, + "loss": 0.8124719858169556, + "step": 502 + }, + { + "epoch": 1.0567226890756303, + "grad_norm": 13.939415896202156, + "learning_rate": 8.19464891021959e-06, + "loss": 1.5310864448547363, + "step": 503 + }, + { + "epoch": 1.0588235294117647, + "grad_norm": 12.545903899817956, + "learning_rate": 8.18523580226247e-06, + "loss": 1.2139228582382202, + "step": 504 + }, + { + "epoch": 1.0609243697478992, + "grad_norm": 7.8688457688530455, + "learning_rate": 8.1758036557118e-06, + "loss": 1.3573241233825684, + "step": 505 + }, + { + "epoch": 1.0630252100840336, + "grad_norm": 29.274148786110516, + "learning_rate": 8.166352526944821e-06, + "loss": 1.9899749755859375, + "step": 506 + }, + { + "epoch": 1.065126050420168, + "grad_norm": 12.789841758713314, + "learning_rate": 8.156882472452232e-06, + "loss": 1.4103593826293945, + "step": 507 + }, + { + "epoch": 1.0672268907563025, + "grad_norm": 11.46688535188232, + "learning_rate": 8.147393548837856e-06, + "loss": 1.227393627166748, + "step": 508 + }, + { + "epoch": 1.069327731092437, + "grad_norm": 11.67493017233716, + "learning_rate": 8.137885812818296e-06, + "loss": 1.7060927152633667, + "step": 509 + }, + { + "epoch": 1.0714285714285714, + "grad_norm": 13.183390423963338, + "learning_rate": 8.128359321222601e-06, + "loss": 1.890432357788086, + "step": 510 + }, + { + "epoch": 1.0735294117647058, + "grad_norm": 8.769195455641308, + "learning_rate": 8.118814130991925e-06, + "loss": 1.8258857727050781, + "step": 511 + }, + { + "epoch": 1.0756302521008403, + "grad_norm": 9.016866647141889, + "learning_rate": 8.109250299179188e-06, + "loss": 0.9584097862243652, + "step": 512 + }, + { + "epoch": 1.0777310924369747, + "grad_norm": 8.866656672277916, + "learning_rate": 8.09966788294873e-06, + "loss": 1.4017150402069092, + "step": 513 + }, + { + "epoch": 1.0798319327731092, + "grad_norm": 12.12920225890514, + "learning_rate": 8.090066939575972e-06, + "loss": 1.3034381866455078, + "step": 514 + }, + { + "epoch": 1.0819327731092436, + "grad_norm": 11.169332765461306, + "learning_rate": 8.080447526447079e-06, + "loss": 1.0734150409698486, + "step": 515 + }, + { + "epoch": 1.084033613445378, + "grad_norm": 15.988980575396647, + "learning_rate": 8.070809701058606e-06, + "loss": 0.8819087743759155, + "step": 516 + }, + { + "epoch": 1.0861344537815125, + "grad_norm": 10.445041930863859, + "learning_rate": 8.061153521017169e-06, + "loss": 1.3253920078277588, + "step": 517 + }, + { + "epoch": 1.088235294117647, + "grad_norm": 7.477532974278996, + "learning_rate": 8.051479044039086e-06, + "loss": 1.0912744998931885, + "step": 518 + }, + { + "epoch": 1.0903361344537814, + "grad_norm": 15.386742532344485, + "learning_rate": 8.041786327950037e-06, + "loss": 1.6941767930984497, + "step": 519 + }, + { + "epoch": 1.092436974789916, + "grad_norm": 13.631587045212196, + "learning_rate": 8.032075430684724e-06, + "loss": 1.058671236038208, + "step": 520 + }, + { + "epoch": 1.0945378151260505, + "grad_norm": 9.174394889796707, + "learning_rate": 8.02234641028652e-06, + "loss": 1.1603420972824097, + "step": 521 + }, + { + "epoch": 1.096638655462185, + "grad_norm": 18.009634618634845, + "learning_rate": 8.012599324907121e-06, + "loss": 1.4285218715667725, + "step": 522 + }, + { + "epoch": 1.0987394957983194, + "grad_norm": 18.317588738929096, + "learning_rate": 8.0028342328062e-06, + "loss": 1.3041057586669922, + "step": 523 + }, + { + "epoch": 1.1008403361344539, + "grad_norm": 17.245361771703262, + "learning_rate": 7.993051192351056e-06, + "loss": 2.329005718231201, + "step": 524 + }, + { + "epoch": 1.1029411764705883, + "grad_norm": 5.466501144551759, + "learning_rate": 7.983250262016276e-06, + "loss": 0.7331016063690186, + "step": 525 + }, + { + "epoch": 1.1050420168067228, + "grad_norm": 19.76792957260025, + "learning_rate": 7.973431500383366e-06, + "loss": 2.193528175354004, + "step": 526 + }, + { + "epoch": 1.1071428571428572, + "grad_norm": 11.04973790435175, + "learning_rate": 7.963594966140423e-06, + "loss": 1.3245251178741455, + "step": 527 + }, + { + "epoch": 1.1092436974789917, + "grad_norm": 14.50002827076454, + "learning_rate": 7.953740718081765e-06, + "loss": 1.1308670043945312, + "step": 528 + }, + { + "epoch": 1.111344537815126, + "grad_norm": 8.457254255014693, + "learning_rate": 7.943868815107594e-06, + "loss": 1.3318034410476685, + "step": 529 + }, + { + "epoch": 1.1134453781512605, + "grad_norm": 12.48006901565296, + "learning_rate": 7.933979316223632e-06, + "loss": 1.2564438581466675, + "step": 530 + }, + { + "epoch": 1.115546218487395, + "grad_norm": 13.952521489657013, + "learning_rate": 7.92407228054078e-06, + "loss": 1.2420412302017212, + "step": 531 + }, + { + "epoch": 1.1176470588235294, + "grad_norm": 11.927118732913993, + "learning_rate": 7.914147767274756e-06, + "loss": 1.9582582712173462, + "step": 532 + }, + { + "epoch": 1.1197478991596639, + "grad_norm": 29.1836862977554, + "learning_rate": 7.904205835745744e-06, + "loss": 1.7057411670684814, + "step": 533 + }, + { + "epoch": 1.1218487394957983, + "grad_norm": 8.77699695792644, + "learning_rate": 7.894246545378037e-06, + "loss": 1.810387134552002, + "step": 534 + }, + { + "epoch": 1.1239495798319328, + "grad_norm": 11.812154757139437, + "learning_rate": 7.884269955699689e-06, + "loss": 1.6038577556610107, + "step": 535 + }, + { + "epoch": 1.1260504201680672, + "grad_norm": 11.347334970124107, + "learning_rate": 7.874276126342151e-06, + "loss": 1.1410393714904785, + "step": 536 + }, + { + "epoch": 1.1281512605042017, + "grad_norm": 23.969457981422316, + "learning_rate": 7.86426511703992e-06, + "loss": 2.28239369392395, + "step": 537 + }, + { + "epoch": 1.1302521008403361, + "grad_norm": 11.3793937172999, + "learning_rate": 7.854236987630178e-06, + "loss": 2.1672444343566895, + "step": 538 + }, + { + "epoch": 1.1323529411764706, + "grad_norm": 8.571185039369908, + "learning_rate": 7.844191798052438e-06, + "loss": 1.7712535858154297, + "step": 539 + }, + { + "epoch": 1.134453781512605, + "grad_norm": 8.155743104110897, + "learning_rate": 7.834129608348183e-06, + "loss": 1.4109793901443481, + "step": 540 + }, + { + "epoch": 1.1365546218487395, + "grad_norm": 12.006945471100122, + "learning_rate": 7.824050478660506e-06, + "loss": 1.4405725002288818, + "step": 541 + }, + { + "epoch": 1.138655462184874, + "grad_norm": 16.24385934265993, + "learning_rate": 7.813954469233758e-06, + "loss": 2.2450976371765137, + "step": 542 + }, + { + "epoch": 1.1407563025210083, + "grad_norm": 63.00358955157523, + "learning_rate": 7.803841640413177e-06, + "loss": 2.16367244720459, + "step": 543 + }, + { + "epoch": 1.1428571428571428, + "grad_norm": 10.995277933527825, + "learning_rate": 7.793712052644535e-06, + "loss": 2.3919224739074707, + "step": 544 + }, + { + "epoch": 1.1449579831932772, + "grad_norm": 9.931645247221951, + "learning_rate": 7.783565766473777e-06, + "loss": 1.4211726188659668, + "step": 545 + }, + { + "epoch": 1.1470588235294117, + "grad_norm": 12.106564772704573, + "learning_rate": 7.773402842546654e-06, + "loss": 1.2502498626708984, + "step": 546 + }, + { + "epoch": 1.1491596638655461, + "grad_norm": 8.144149987908426, + "learning_rate": 7.76322334160836e-06, + "loss": 1.423762321472168, + "step": 547 + }, + { + "epoch": 1.1512605042016806, + "grad_norm": 10.152738619426868, + "learning_rate": 7.75302732450318e-06, + "loss": 1.1090279817581177, + "step": 548 + }, + { + "epoch": 1.153361344537815, + "grad_norm": 11.024880610484013, + "learning_rate": 7.742814852174112e-06, + "loss": 1.0321426391601562, + "step": 549 + }, + { + "epoch": 1.1554621848739495, + "grad_norm": 10.4112886492949, + "learning_rate": 7.73258598566251e-06, + "loss": 1.0928632020950317, + "step": 550 + }, + { + "epoch": 1.157563025210084, + "grad_norm": 17.17079853756711, + "learning_rate": 7.72234078610772e-06, + "loss": 1.2369472980499268, + "step": 551 + }, + { + "epoch": 1.1596638655462184, + "grad_norm": 12.662228894532866, + "learning_rate": 7.712079314746716e-06, + "loss": 1.2957392930984497, + "step": 552 + }, + { + "epoch": 1.161764705882353, + "grad_norm": 8.967923305212855, + "learning_rate": 7.701801632913722e-06, + "loss": 1.6709070205688477, + "step": 553 + }, + { + "epoch": 1.1638655462184875, + "grad_norm": 9.520057506790387, + "learning_rate": 7.691507802039861e-06, + "loss": 1.6091077327728271, + "step": 554 + }, + { + "epoch": 1.165966386554622, + "grad_norm": 12.924582534581134, + "learning_rate": 7.68119788365278e-06, + "loss": 1.8003133535385132, + "step": 555 + }, + { + "epoch": 1.1680672268907564, + "grad_norm": 8.027840739484652, + "learning_rate": 7.670871939376281e-06, + "loss": 1.0151593685150146, + "step": 556 + }, + { + "epoch": 1.1701680672268908, + "grad_norm": 10.792867985796137, + "learning_rate": 7.660530030929961e-06, + "loss": 1.3084783554077148, + "step": 557 + }, + { + "epoch": 1.1722689075630253, + "grad_norm": 10.336895443268714, + "learning_rate": 7.650172220128828e-06, + "loss": 1.3882572650909424, + "step": 558 + }, + { + "epoch": 1.1743697478991597, + "grad_norm": 11.46121788240209, + "learning_rate": 7.639798568882947e-06, + "loss": 1.3919298648834229, + "step": 559 + }, + { + "epoch": 1.1764705882352942, + "grad_norm": 11.442052901701038, + "learning_rate": 7.629409139197063e-06, + "loss": 1.3745830059051514, + "step": 560 + }, + { + "epoch": 1.1785714285714286, + "grad_norm": 22.18812336562329, + "learning_rate": 7.619003993170226e-06, + "loss": 1.2964568138122559, + "step": 561 + }, + { + "epoch": 1.180672268907563, + "grad_norm": 14.305068677598294, + "learning_rate": 7.608583192995433e-06, + "loss": 1.75518798828125, + "step": 562 + }, + { + "epoch": 1.1827731092436975, + "grad_norm": 38.68186634407232, + "learning_rate": 7.598146800959238e-06, + "loss": 2.156588554382324, + "step": 563 + }, + { + "epoch": 1.184873949579832, + "grad_norm": 15.824079652626462, + "learning_rate": 7.5876948794414015e-06, + "loss": 1.3602566719055176, + "step": 564 + }, + { + "epoch": 1.1869747899159664, + "grad_norm": 13.134376075413467, + "learning_rate": 7.577227490914495e-06, + "loss": 1.5620733499526978, + "step": 565 + }, + { + "epoch": 1.1890756302521008, + "grad_norm": 9.860309886809128, + "learning_rate": 7.5667446979435445e-06, + "loss": 0.971282422542572, + "step": 566 + }, + { + "epoch": 1.1911764705882353, + "grad_norm": 11.617960075857892, + "learning_rate": 7.556246563185648e-06, + "loss": 1.1717581748962402, + "step": 567 + }, + { + "epoch": 1.1932773109243697, + "grad_norm": 14.78629106010037, + "learning_rate": 7.545733149389605e-06, + "loss": 1.8813025951385498, + "step": 568 + }, + { + "epoch": 1.1953781512605042, + "grad_norm": 11.92994585452875, + "learning_rate": 7.535204519395538e-06, + "loss": 1.280207633972168, + "step": 569 + }, + { + "epoch": 1.1974789915966386, + "grad_norm": 14.537731397359755, + "learning_rate": 7.5246607361345215e-06, + "loss": 1.5685778856277466, + "step": 570 + }, + { + "epoch": 1.199579831932773, + "grad_norm": 9.978722079402786, + "learning_rate": 7.514101862628203e-06, + "loss": 2.2011172771453857, + "step": 571 + }, + { + "epoch": 1.2016806722689075, + "grad_norm": 14.328584272935853, + "learning_rate": 7.503527961988422e-06, + "loss": 2.0038180351257324, + "step": 572 + }, + { + "epoch": 1.203781512605042, + "grad_norm": 11.49676437218398, + "learning_rate": 7.492939097416842e-06, + "loss": 1.1275922060012817, + "step": 573 + }, + { + "epoch": 1.2058823529411764, + "grad_norm": 13.603928637496292, + "learning_rate": 7.482335332204568e-06, + "loss": 1.208678960800171, + "step": 574 + }, + { + "epoch": 1.2079831932773109, + "grad_norm": 10.710849924738463, + "learning_rate": 7.471716729731764e-06, + "loss": 1.7450125217437744, + "step": 575 + }, + { + "epoch": 1.2100840336134453, + "grad_norm": 10.8408813790809, + "learning_rate": 7.461083353467283e-06, + "loss": 1.5381510257720947, + "step": 576 + }, + { + "epoch": 1.2121848739495797, + "grad_norm": 10.502717838660322, + "learning_rate": 7.450435266968279e-06, + "loss": 1.6857651472091675, + "step": 577 + }, + { + "epoch": 1.2142857142857142, + "grad_norm": 10.194196645130454, + "learning_rate": 7.4397725338798365e-06, + "loss": 1.9049471616744995, + "step": 578 + }, + { + "epoch": 1.2163865546218489, + "grad_norm": 8.336901180250376, + "learning_rate": 7.429095217934578e-06, + "loss": 2.2398974895477295, + "step": 579 + }, + { + "epoch": 1.2184873949579833, + "grad_norm": 8.289301563947674, + "learning_rate": 7.4184033829522935e-06, + "loss": 1.8767409324645996, + "step": 580 + }, + { + "epoch": 1.2205882352941178, + "grad_norm": 7.83258681688038, + "learning_rate": 7.4076970928395565e-06, + "loss": 1.4787061214447021, + "step": 581 + }, + { + "epoch": 1.2226890756302522, + "grad_norm": 11.288493150816146, + "learning_rate": 7.396976411589338e-06, + "loss": 1.1055876016616821, + "step": 582 + }, + { + "epoch": 1.2247899159663866, + "grad_norm": 8.627197279612671, + "learning_rate": 7.386241403280629e-06, + "loss": 1.668757438659668, + "step": 583 + }, + { + "epoch": 1.226890756302521, + "grad_norm": 7.9829732080808276, + "learning_rate": 7.375492132078051e-06, + "loss": 1.2818783521652222, + "step": 584 + }, + { + "epoch": 1.2289915966386555, + "grad_norm": 9.132163063845432, + "learning_rate": 7.364728662231484e-06, + "loss": 1.578829050064087, + "step": 585 + }, + { + "epoch": 1.23109243697479, + "grad_norm": 9.541187433357738, + "learning_rate": 7.353951058075669e-06, + "loss": 1.572939157485962, + "step": 586 + }, + { + "epoch": 1.2331932773109244, + "grad_norm": 29.472008336805924, + "learning_rate": 7.343159384029833e-06, + "loss": 3.977992057800293, + "step": 587 + }, + { + "epoch": 1.2352941176470589, + "grad_norm": 12.577355177733914, + "learning_rate": 7.332353704597299e-06, + "loss": 1.955003023147583, + "step": 588 + }, + { + "epoch": 1.2373949579831933, + "grad_norm": 10.61755598072498, + "learning_rate": 7.321534084365101e-06, + "loss": 1.5401737689971924, + "step": 589 + }, + { + "epoch": 1.2394957983193278, + "grad_norm": 17.052134953118316, + "learning_rate": 7.310700588003605e-06, + "loss": 1.895308017730713, + "step": 590 + }, + { + "epoch": 1.2415966386554622, + "grad_norm": 13.914617942504853, + "learning_rate": 7.299853280266109e-06, + "loss": 1.6920474767684937, + "step": 591 + }, + { + "epoch": 1.2436974789915967, + "grad_norm": 18.300626922757814, + "learning_rate": 7.28899222598847e-06, + "loss": 1.9865736961364746, + "step": 592 + }, + { + "epoch": 1.245798319327731, + "grad_norm": 8.604822405832417, + "learning_rate": 7.278117490088703e-06, + "loss": 1.2350941896438599, + "step": 593 + }, + { + "epoch": 1.2478991596638656, + "grad_norm": 15.714181520858954, + "learning_rate": 7.267229137566607e-06, + "loss": 1.800095558166504, + "step": 594 + }, + { + "epoch": 1.25, + "grad_norm": 7.625924941471246, + "learning_rate": 7.256327233503365e-06, + "loss": 1.848137617111206, + "step": 595 + }, + { + "epoch": 1.2521008403361344, + "grad_norm": 8.480492494477819, + "learning_rate": 7.24541184306116e-06, + "loss": 1.7656617164611816, + "step": 596 + }, + { + "epoch": 1.254201680672269, + "grad_norm": 11.960261973795399, + "learning_rate": 7.234483031482787e-06, + "loss": 1.0096323490142822, + "step": 597 + }, + { + "epoch": 1.2563025210084033, + "grad_norm": 9.709001923888373, + "learning_rate": 7.223540864091259e-06, + "loss": 1.428197979927063, + "step": 598 + }, + { + "epoch": 1.2584033613445378, + "grad_norm": 11.628908186348927, + "learning_rate": 7.2125854062894184e-06, + "loss": 1.0703970193862915, + "step": 599 + }, + { + "epoch": 1.2605042016806722, + "grad_norm": 14.20204722362147, + "learning_rate": 7.201616723559548e-06, + "loss": 1.7873646020889282, + "step": 600 + }, + { + "epoch": 1.2626050420168067, + "grad_norm": 12.326258967391198, + "learning_rate": 7.190634881462976e-06, + "loss": 1.3262135982513428, + "step": 601 + }, + { + "epoch": 1.2647058823529411, + "grad_norm": 13.762619560991299, + "learning_rate": 7.179639945639688e-06, + "loss": 1.6294150352478027, + "step": 602 + }, + { + "epoch": 1.2668067226890756, + "grad_norm": 12.793929462404881, + "learning_rate": 7.168631981807931e-06, + "loss": 2.6409220695495605, + "step": 603 + }, + { + "epoch": 1.26890756302521, + "grad_norm": 12.75285051440542, + "learning_rate": 7.15761105576382e-06, + "loss": 1.3407433032989502, + "step": 604 + }, + { + "epoch": 1.2710084033613445, + "grad_norm": 11.811026706721915, + "learning_rate": 7.1465772333809524e-06, + "loss": 1.1475789546966553, + "step": 605 + }, + { + "epoch": 1.273109243697479, + "grad_norm": 16.182274466548407, + "learning_rate": 7.1355305806100036e-06, + "loss": 1.8270117044448853, + "step": 606 + }, + { + "epoch": 1.2752100840336134, + "grad_norm": 9.390889705782493, + "learning_rate": 7.124471163478344e-06, + "loss": 2.168900489807129, + "step": 607 + }, + { + "epoch": 1.2773109243697478, + "grad_norm": 14.960557905830523, + "learning_rate": 7.113399048089631e-06, + "loss": 2.0142345428466797, + "step": 608 + }, + { + "epoch": 1.2794117647058822, + "grad_norm": 14.63642311907181, + "learning_rate": 7.102314300623425e-06, + "loss": 2.015444755554199, + "step": 609 + }, + { + "epoch": 1.2815126050420167, + "grad_norm": 13.291155405094099, + "learning_rate": 7.091216987334792e-06, + "loss": 1.5882906913757324, + "step": 610 + }, + { + "epoch": 1.2836134453781511, + "grad_norm": 17.727064634923273, + "learning_rate": 7.080107174553903e-06, + "loss": 1.4543545246124268, + "step": 611 + }, + { + "epoch": 1.2857142857142856, + "grad_norm": 13.123573018342379, + "learning_rate": 7.068984928685638e-06, + "loss": 1.3196444511413574, + "step": 612 + }, + { + "epoch": 1.28781512605042, + "grad_norm": 11.204963124082711, + "learning_rate": 7.057850316209198e-06, + "loss": 0.8601089715957642, + "step": 613 + }, + { + "epoch": 1.2899159663865547, + "grad_norm": 11.507041064870066, + "learning_rate": 7.0467034036776945e-06, + "loss": 1.334380865097046, + "step": 614 + }, + { + "epoch": 1.2920168067226891, + "grad_norm": 9.153184893600336, + "learning_rate": 7.035544257717761e-06, + "loss": 1.4980111122131348, + "step": 615 + }, + { + "epoch": 1.2941176470588236, + "grad_norm": 11.208470095807519, + "learning_rate": 7.024372945029152e-06, + "loss": 1.9393174648284912, + "step": 616 + }, + { + "epoch": 1.296218487394958, + "grad_norm": 9.33539024674701, + "learning_rate": 7.013189532384343e-06, + "loss": 1.1070374250411987, + "step": 617 + }, + { + "epoch": 1.2983193277310925, + "grad_norm": 22.088040059228636, + "learning_rate": 7.001994086628133e-06, + "loss": 2.146557331085205, + "step": 618 + }, + { + "epoch": 1.300420168067227, + "grad_norm": 12.461539796415895, + "learning_rate": 6.990786674677246e-06, + "loss": 1.097703456878662, + "step": 619 + }, + { + "epoch": 1.3025210084033614, + "grad_norm": 10.337144677645794, + "learning_rate": 6.979567363519927e-06, + "loss": 1.9619685411453247, + "step": 620 + }, + { + "epoch": 1.3046218487394958, + "grad_norm": 8.583774398203186, + "learning_rate": 6.9683362202155465e-06, + "loss": 1.2424434423446655, + "step": 621 + }, + { + "epoch": 1.3067226890756303, + "grad_norm": 10.235846664061171, + "learning_rate": 6.957093311894199e-06, + "loss": 1.8912100791931152, + "step": 622 + }, + { + "epoch": 1.3088235294117647, + "grad_norm": 12.7496233438477, + "learning_rate": 6.945838705756293e-06, + "loss": 1.4234580993652344, + "step": 623 + }, + { + "epoch": 1.3109243697478992, + "grad_norm": 12.664108172155123, + "learning_rate": 6.934572469072163e-06, + "loss": 1.7631306648254395, + "step": 624 + }, + { + "epoch": 1.3130252100840336, + "grad_norm": 9.043940926283064, + "learning_rate": 6.923294669181659e-06, + "loss": 1.275686264038086, + "step": 625 + }, + { + "epoch": 1.315126050420168, + "grad_norm": 7.7562010562396155, + "learning_rate": 6.912005373493747e-06, + "loss": 1.8493428230285645, + "step": 626 + }, + { + "epoch": 1.3172268907563025, + "grad_norm": 10.778946101337466, + "learning_rate": 6.900704649486103e-06, + "loss": 1.0401699542999268, + "step": 627 + }, + { + "epoch": 1.319327731092437, + "grad_norm": 9.474741424665671, + "learning_rate": 6.889392564704712e-06, + "loss": 1.932092547416687, + "step": 628 + }, + { + "epoch": 1.3214285714285714, + "grad_norm": 18.187204049633937, + "learning_rate": 6.878069186763466e-06, + "loss": 2.0269484519958496, + "step": 629 + }, + { + "epoch": 1.3235294117647058, + "grad_norm": 12.371698082139902, + "learning_rate": 6.866734583343753e-06, + "loss": 1.6765419244766235, + "step": 630 + }, + { + "epoch": 1.3256302521008403, + "grad_norm": 20.859173211033255, + "learning_rate": 6.855388822194061e-06, + "loss": 1.7931967973709106, + "step": 631 + }, + { + "epoch": 1.3277310924369747, + "grad_norm": 10.82122547870125, + "learning_rate": 6.844031971129571e-06, + "loss": 0.9582860469818115, + "step": 632 + }, + { + "epoch": 1.3298319327731092, + "grad_norm": 13.255068667352083, + "learning_rate": 6.8326640980317475e-06, + "loss": 1.7692348957061768, + "step": 633 + }, + { + "epoch": 1.3319327731092436, + "grad_norm": 12.632729369596628, + "learning_rate": 6.821285270847934e-06, + "loss": 2.143463373184204, + "step": 634 + }, + { + "epoch": 1.334033613445378, + "grad_norm": 31.76404047719635, + "learning_rate": 6.80989555759095e-06, + "loss": 2.290733814239502, + "step": 635 + }, + { + "epoch": 1.3361344537815127, + "grad_norm": 18.9996916353526, + "learning_rate": 6.79849502633868e-06, + "loss": 1.4548063278198242, + "step": 636 + }, + { + "epoch": 1.3382352941176472, + "grad_norm": 10.423656653462372, + "learning_rate": 6.787083745233674e-06, + "loss": 1.6137502193450928, + "step": 637 + }, + { + "epoch": 1.3403361344537816, + "grad_norm": 9.260024233354208, + "learning_rate": 6.775661782482732e-06, + "loss": 1.277546763420105, + "step": 638 + }, + { + "epoch": 1.342436974789916, + "grad_norm": 17.22623817552147, + "learning_rate": 6.764229206356498e-06, + "loss": 1.4183297157287598, + "step": 639 + }, + { + "epoch": 1.3445378151260505, + "grad_norm": 13.655193467078059, + "learning_rate": 6.752786085189059e-06, + "loss": 2.352818012237549, + "step": 640 + }, + { + "epoch": 1.346638655462185, + "grad_norm": 10.832229231352626, + "learning_rate": 6.741332487377525e-06, + "loss": 1.1966056823730469, + "step": 641 + }, + { + "epoch": 1.3487394957983194, + "grad_norm": 16.450581846244585, + "learning_rate": 6.729868481381632e-06, + "loss": 2.1670610904693604, + "step": 642 + }, + { + "epoch": 1.3508403361344539, + "grad_norm": 14.092922253172704, + "learning_rate": 6.718394135723321e-06, + "loss": 1.4478580951690674, + "step": 643 + }, + { + "epoch": 1.3529411764705883, + "grad_norm": 9.381957347730207, + "learning_rate": 6.706909518986341e-06, + "loss": 1.1712067127227783, + "step": 644 + }, + { + "epoch": 1.3550420168067228, + "grad_norm": 10.457393453015948, + "learning_rate": 6.695414699815828e-06, + "loss": 1.241437315940857, + "step": 645 + }, + { + "epoch": 1.3571428571428572, + "grad_norm": 26.13803770478073, + "learning_rate": 6.6839097469179e-06, + "loss": 1.5295310020446777, + "step": 646 + }, + { + "epoch": 1.3592436974789917, + "grad_norm": 7.790998799935961, + "learning_rate": 6.6723947290592505e-06, + "loss": 1.3555617332458496, + "step": 647 + }, + { + "epoch": 1.361344537815126, + "grad_norm": 14.276342203489932, + "learning_rate": 6.660869715066725e-06, + "loss": 1.3158948421478271, + "step": 648 + }, + { + "epoch": 1.3634453781512605, + "grad_norm": 7.962812237225353, + "learning_rate": 6.649334773826924e-06, + "loss": 1.7540979385375977, + "step": 649 + }, + { + "epoch": 1.365546218487395, + "grad_norm": 12.139617079516373, + "learning_rate": 6.63778997428578e-06, + "loss": 1.7170000076293945, + "step": 650 + }, + { + "epoch": 1.3676470588235294, + "grad_norm": 9.424987040512477, + "learning_rate": 6.626235385448152e-06, + "loss": 1.2551283836364746, + "step": 651 + }, + { + "epoch": 1.3697478991596639, + "grad_norm": 11.731648378217931, + "learning_rate": 6.61467107637741e-06, + "loss": 1.468104362487793, + "step": 652 + }, + { + "epoch": 1.3718487394957983, + "grad_norm": 22.089135904446437, + "learning_rate": 6.603097116195026e-06, + "loss": 1.3832511901855469, + "step": 653 + }, + { + "epoch": 1.3739495798319328, + "grad_norm": 13.408397747285187, + "learning_rate": 6.591513574080152e-06, + "loss": 1.1895179748535156, + "step": 654 + }, + { + "epoch": 1.3760504201680672, + "grad_norm": 10.506415017764112, + "learning_rate": 6.579920519269218e-06, + "loss": 1.57008957862854, + "step": 655 + }, + { + "epoch": 1.3781512605042017, + "grad_norm": 7.3609644144158315, + "learning_rate": 6.568318021055512e-06, + "loss": 1.1686642169952393, + "step": 656 + }, + { + "epoch": 1.3802521008403361, + "grad_norm": 19.968281534972263, + "learning_rate": 6.556706148788765e-06, + "loss": 1.831925392150879, + "step": 657 + }, + { + "epoch": 1.3823529411764706, + "grad_norm": 14.858290457520233, + "learning_rate": 6.545084971874738e-06, + "loss": 1.1927814483642578, + "step": 658 + }, + { + "epoch": 1.384453781512605, + "grad_norm": 13.471589913344788, + "learning_rate": 6.5334545597748075e-06, + "loss": 1.225053310394287, + "step": 659 + }, + { + "epoch": 1.3865546218487395, + "grad_norm": 10.64391058893006, + "learning_rate": 6.521814982005552e-06, + "loss": 1.489911437034607, + "step": 660 + }, + { + "epoch": 1.388655462184874, + "grad_norm": 14.084203318094486, + "learning_rate": 6.510166308138328e-06, + "loss": 1.3653918504714966, + "step": 661 + }, + { + "epoch": 1.3907563025210083, + "grad_norm": 10.331380068295612, + "learning_rate": 6.498508607798872e-06, + "loss": 1.7082477807998657, + "step": 662 + }, + { + "epoch": 1.3928571428571428, + "grad_norm": 10.828390377137284, + "learning_rate": 6.48684195066686e-06, + "loss": 1.1122634410858154, + "step": 663 + }, + { + "epoch": 1.3949579831932772, + "grad_norm": 14.858926439296923, + "learning_rate": 6.475166406475515e-06, + "loss": 0.9572471380233765, + "step": 664 + }, + { + "epoch": 1.3970588235294117, + "grad_norm": 17.02414371173566, + "learning_rate": 6.4634820450111715e-06, + "loss": 1.8282674551010132, + "step": 665 + }, + { + "epoch": 1.3991596638655461, + "grad_norm": 12.803154660225488, + "learning_rate": 6.451788936112868e-06, + "loss": 1.2026221752166748, + "step": 666 + }, + { + "epoch": 1.4012605042016806, + "grad_norm": 10.424391789653072, + "learning_rate": 6.440087149671932e-06, + "loss": 1.3183879852294922, + "step": 667 + }, + { + "epoch": 1.403361344537815, + "grad_norm": 8.925077970843816, + "learning_rate": 6.428376755631553e-06, + "loss": 1.216771125793457, + "step": 668 + }, + { + "epoch": 1.4054621848739495, + "grad_norm": 12.5613140309092, + "learning_rate": 6.41665782398637e-06, + "loss": 1.6759852170944214, + "step": 669 + }, + { + "epoch": 1.407563025210084, + "grad_norm": 13.278399152081807, + "learning_rate": 6.404930424782052e-06, + "loss": 1.6593937873840332, + "step": 670 + }, + { + "epoch": 1.4096638655462184, + "grad_norm": 11.405836988138063, + "learning_rate": 6.393194628114885e-06, + "loss": 1.672929286956787, + "step": 671 + }, + { + "epoch": 1.4117647058823528, + "grad_norm": 13.1586681372233, + "learning_rate": 6.381450504131339e-06, + "loss": 1.2778139114379883, + "step": 672 + }, + { + "epoch": 1.4138655462184873, + "grad_norm": 9.462564203496632, + "learning_rate": 6.369698123027664e-06, + "loss": 1.6472318172454834, + "step": 673 + }, + { + "epoch": 1.415966386554622, + "grad_norm": 12.367075684146661, + "learning_rate": 6.357937555049465e-06, + "loss": 1.5301233530044556, + "step": 674 + }, + { + "epoch": 1.4180672268907564, + "grad_norm": 9.502388277835697, + "learning_rate": 6.3461688704912735e-06, + "loss": 1.5423755645751953, + "step": 675 + }, + { + "epoch": 1.4201680672268908, + "grad_norm": 13.340625777023925, + "learning_rate": 6.334392139696144e-06, + "loss": 0.8435590863227844, + "step": 676 + }, + { + "epoch": 1.4222689075630253, + "grad_norm": 9.498703079540906, + "learning_rate": 6.322607433055217e-06, + "loss": 0.9243001937866211, + "step": 677 + }, + { + "epoch": 1.4243697478991597, + "grad_norm": 16.692002135074148, + "learning_rate": 6.310814821007312e-06, + "loss": 1.1370623111724854, + "step": 678 + }, + { + "epoch": 1.4264705882352942, + "grad_norm": 14.252581322539957, + "learning_rate": 6.299014374038493e-06, + "loss": 1.8121721744537354, + "step": 679 + }, + { + "epoch": 1.4285714285714286, + "grad_norm": 12.146719665307664, + "learning_rate": 6.287206162681663e-06, + "loss": 1.5701857805252075, + "step": 680 + }, + { + "epoch": 1.430672268907563, + "grad_norm": 11.383072024184132, + "learning_rate": 6.275390257516125e-06, + "loss": 1.7376922369003296, + "step": 681 + }, + { + "epoch": 1.4327731092436975, + "grad_norm": 7.389859803918485, + "learning_rate": 6.263566729167177e-06, + "loss": 1.722080111503601, + "step": 682 + }, + { + "epoch": 1.434873949579832, + "grad_norm": 11.051749495669629, + "learning_rate": 6.251735648305676e-06, + "loss": 1.8646998405456543, + "step": 683 + }, + { + "epoch": 1.4369747899159664, + "grad_norm": 8.056416794494698, + "learning_rate": 6.239897085647624e-06, + "loss": 1.6373791694641113, + "step": 684 + }, + { + "epoch": 1.4390756302521008, + "grad_norm": 14.269272004271027, + "learning_rate": 6.228051111953742e-06, + "loss": 1.5332825183868408, + "step": 685 + }, + { + "epoch": 1.4411764705882353, + "grad_norm": 11.569261548147155, + "learning_rate": 6.216197798029049e-06, + "loss": 1.7713117599487305, + "step": 686 + }, + { + "epoch": 1.4432773109243697, + "grad_norm": 8.013171505509781, + "learning_rate": 6.204337214722435e-06, + "loss": 1.3197343349456787, + "step": 687 + }, + { + "epoch": 1.4453781512605042, + "grad_norm": 7.988425778687254, + "learning_rate": 6.192469432926241e-06, + "loss": 1.3940856456756592, + "step": 688 + }, + { + "epoch": 1.4474789915966386, + "grad_norm": 14.591944041736712, + "learning_rate": 6.180594523575838e-06, + "loss": 2.0876762866973877, + "step": 689 + }, + { + "epoch": 1.449579831932773, + "grad_norm": 13.421486753054541, + "learning_rate": 6.1687125576491945e-06, + "loss": 2.5141618251800537, + "step": 690 + }, + { + "epoch": 1.4516806722689075, + "grad_norm": 11.284766831118931, + "learning_rate": 6.156823606166461e-06, + "loss": 0.9575009942054749, + "step": 691 + }, + { + "epoch": 1.453781512605042, + "grad_norm": 10.180747973970707, + "learning_rate": 6.144927740189537e-06, + "loss": 1.2732771635055542, + "step": 692 + }, + { + "epoch": 1.4558823529411764, + "grad_norm": 18.346962905469923, + "learning_rate": 6.133025030821656e-06, + "loss": 1.0447793006896973, + "step": 693 + }, + { + "epoch": 1.4579831932773109, + "grad_norm": 9.72623535803224, + "learning_rate": 6.12111554920695e-06, + "loss": 2.069892406463623, + "step": 694 + }, + { + "epoch": 1.4600840336134453, + "grad_norm": 12.298140767363686, + "learning_rate": 6.1091993665300354e-06, + "loss": 1.4193060398101807, + "step": 695 + }, + { + "epoch": 1.46218487394958, + "grad_norm": 13.962463696814781, + "learning_rate": 6.0972765540155764e-06, + "loss": 1.8489269018173218, + "step": 696 + }, + { + "epoch": 1.4642857142857144, + "grad_norm": 28.27872673921732, + "learning_rate": 6.08534718292787e-06, + "loss": 1.8245782852172852, + "step": 697 + }, + { + "epoch": 1.4663865546218489, + "grad_norm": 11.704836274205533, + "learning_rate": 6.07341132457041e-06, + "loss": 1.8135966062545776, + "step": 698 + }, + { + "epoch": 1.4684873949579833, + "grad_norm": 10.329932140617693, + "learning_rate": 6.061469050285469e-06, + "loss": 1.2886388301849365, + "step": 699 + }, + { + "epoch": 1.4705882352941178, + "grad_norm": 7.515435335019253, + "learning_rate": 6.049520431453666e-06, + "loss": 1.8994669914245605, + "step": 700 + }, + { + "epoch": 1.4726890756302522, + "grad_norm": 8.559344765158919, + "learning_rate": 6.037565539493542e-06, + "loss": 1.830640196800232, + "step": 701 + }, + { + "epoch": 1.4747899159663866, + "grad_norm": 11.041841545301232, + "learning_rate": 6.025604445861137e-06, + "loss": 1.253919005393982, + "step": 702 + }, + { + "epoch": 1.476890756302521, + "grad_norm": 8.205733723815058, + "learning_rate": 6.013637222049554e-06, + "loss": 1.4687739610671997, + "step": 703 + }, + { + "epoch": 1.4789915966386555, + "grad_norm": 11.178455036225843, + "learning_rate": 6.0016639395885424e-06, + "loss": 0.8241528272628784, + "step": 704 + }, + { + "epoch": 1.48109243697479, + "grad_norm": 9.38917529173767, + "learning_rate": 5.98968467004406e-06, + "loss": 0.9833969473838806, + "step": 705 + }, + { + "epoch": 1.4831932773109244, + "grad_norm": 12.194704863353925, + "learning_rate": 5.977699485017855e-06, + "loss": 1.4603691101074219, + "step": 706 + }, + { + "epoch": 1.4852941176470589, + "grad_norm": 15.962403885996371, + "learning_rate": 5.965708456147028e-06, + "loss": 1.2566254138946533, + "step": 707 + }, + { + "epoch": 1.4873949579831933, + "grad_norm": 12.538339280369007, + "learning_rate": 5.953711655103615e-06, + "loss": 1.1779121160507202, + "step": 708 + }, + { + "epoch": 1.4894957983193278, + "grad_norm": 13.11480387819097, + "learning_rate": 5.941709153594146e-06, + "loss": 2.1752524375915527, + "step": 709 + }, + { + "epoch": 1.4915966386554622, + "grad_norm": 13.674164350381794, + "learning_rate": 5.92970102335923e-06, + "loss": 1.368391752243042, + "step": 710 + }, + { + "epoch": 1.4936974789915967, + "grad_norm": 14.25334329729132, + "learning_rate": 5.917687336173116e-06, + "loss": 1.4870836734771729, + "step": 711 + }, + { + "epoch": 1.495798319327731, + "grad_norm": 6.953756120767862, + "learning_rate": 5.905668163843269e-06, + "loss": 1.5822714567184448, + "step": 712 + }, + { + "epoch": 1.4978991596638656, + "grad_norm": 11.644576591550592, + "learning_rate": 5.893643578209939e-06, + "loss": 1.5158865451812744, + "step": 713 + }, + { + "epoch": 1.5, + "grad_norm": 7.891690515863711, + "learning_rate": 5.881613651145732e-06, + "loss": 1.0833930969238281, + "step": 714 + }, + { + "epoch": 1.5021008403361344, + "grad_norm": 10.374951659973064, + "learning_rate": 5.8695784545551815e-06, + "loss": 1.2957074642181396, + "step": 715 + }, + { + "epoch": 1.504201680672269, + "grad_norm": 11.404797448034625, + "learning_rate": 5.8575380603743155e-06, + "loss": 1.541155457496643, + "step": 716 + }, + { + "epoch": 1.5063025210084033, + "grad_norm": 9.289021596431404, + "learning_rate": 5.8454925405702326e-06, + "loss": 1.7509238719940186, + "step": 717 + }, + { + "epoch": 1.5084033613445378, + "grad_norm": 15.014764167830913, + "learning_rate": 5.833441967140662e-06, + "loss": 1.8062071800231934, + "step": 718 + }, + { + "epoch": 1.5105042016806722, + "grad_norm": 11.714801378063543, + "learning_rate": 5.821386412113546e-06, + "loss": 1.4850780963897705, + "step": 719 + }, + { + "epoch": 1.5126050420168067, + "grad_norm": 12.362413690497235, + "learning_rate": 5.809325947546596e-06, + "loss": 1.1842257976531982, + "step": 720 + }, + { + "epoch": 1.5147058823529411, + "grad_norm": 18.21069319599996, + "learning_rate": 5.797260645526873e-06, + "loss": 1.396120548248291, + "step": 721 + }, + { + "epoch": 1.5168067226890756, + "grad_norm": 9.57576869626496, + "learning_rate": 5.785190578170351e-06, + "loss": 1.2990989685058594, + "step": 722 + }, + { + "epoch": 1.51890756302521, + "grad_norm": 9.618803676236782, + "learning_rate": 5.773115817621487e-06, + "loss": 1.8467388153076172, + "step": 723 + }, + { + "epoch": 1.5210084033613445, + "grad_norm": 11.794758813101549, + "learning_rate": 5.761036436052788e-06, + "loss": 1.6907732486724854, + "step": 724 + }, + { + "epoch": 1.523109243697479, + "grad_norm": 10.45395101852907, + "learning_rate": 5.748952505664385e-06, + "loss": 1.265946388244629, + "step": 725 + }, + { + "epoch": 1.5252100840336134, + "grad_norm": 39.03800117968252, + "learning_rate": 5.736864098683595e-06, + "loss": 1.2473053932189941, + "step": 726 + }, + { + "epoch": 1.5273109243697478, + "grad_norm": 12.736788173749753, + "learning_rate": 5.724771287364492e-06, + "loss": 0.8382349014282227, + "step": 727 + }, + { + "epoch": 1.5294117647058822, + "grad_norm": 9.695123568985625, + "learning_rate": 5.712674143987478e-06, + "loss": 0.6312862038612366, + "step": 728 + }, + { + "epoch": 1.5315126050420167, + "grad_norm": 19.807295601128907, + "learning_rate": 5.700572740858847e-06, + "loss": 2.154848575592041, + "step": 729 + }, + { + "epoch": 1.5336134453781511, + "grad_norm": 8.348583198098744, + "learning_rate": 5.688467150310353e-06, + "loss": 2.034533739089966, + "step": 730 + }, + { + "epoch": 1.5357142857142856, + "grad_norm": 17.36525324904992, + "learning_rate": 5.67635744469878e-06, + "loss": 1.1331748962402344, + "step": 731 + }, + { + "epoch": 1.53781512605042, + "grad_norm": 16.447167153207392, + "learning_rate": 5.664243696405509e-06, + "loss": 2.139069080352783, + "step": 732 + }, + { + "epoch": 1.5399159663865545, + "grad_norm": 8.422362967066016, + "learning_rate": 5.652125977836083e-06, + "loss": 1.5174198150634766, + "step": 733 + }, + { + "epoch": 1.542016806722689, + "grad_norm": 11.885541322376927, + "learning_rate": 5.640004361419776e-06, + "loss": 1.4445990324020386, + "step": 734 + }, + { + "epoch": 1.5441176470588234, + "grad_norm": 13.004468722411309, + "learning_rate": 5.627878919609162e-06, + "loss": 1.3474795818328857, + "step": 735 + }, + { + "epoch": 1.5462184873949578, + "grad_norm": 8.116038341885554, + "learning_rate": 5.615749724879677e-06, + "loss": 1.4871881008148193, + "step": 736 + }, + { + "epoch": 1.5483193277310925, + "grad_norm": 9.971232266174457, + "learning_rate": 5.603616849729191e-06, + "loss": 1.308741569519043, + "step": 737 + }, + { + "epoch": 1.550420168067227, + "grad_norm": 9.853281920667216, + "learning_rate": 5.591480366677571e-06, + "loss": 1.712050199508667, + "step": 738 + }, + { + "epoch": 1.5525210084033614, + "grad_norm": 10.993711611399497, + "learning_rate": 5.579340348266251e-06, + "loss": 1.5636662244796753, + "step": 739 + }, + { + "epoch": 1.5546218487394958, + "grad_norm": 9.673522828347147, + "learning_rate": 5.5671968670577935e-06, + "loss": 2.132948160171509, + "step": 740 + }, + { + "epoch": 1.5567226890756303, + "grad_norm": 8.375544989800046, + "learning_rate": 5.55504999563546e-06, + "loss": 1.3193635940551758, + "step": 741 + }, + { + "epoch": 1.5588235294117647, + "grad_norm": 17.452697703036844, + "learning_rate": 5.542899806602776e-06, + "loss": 2.288175582885742, + "step": 742 + }, + { + "epoch": 1.5609243697478992, + "grad_norm": 9.46737262414516, + "learning_rate": 5.530746372583097e-06, + "loss": 0.9925522804260254, + "step": 743 + }, + { + "epoch": 1.5630252100840336, + "grad_norm": 11.56785515084437, + "learning_rate": 5.518589766219173e-06, + "loss": 1.0975109338760376, + "step": 744 + }, + { + "epoch": 1.565126050420168, + "grad_norm": 7.691252772883318, + "learning_rate": 5.506430060172714e-06, + "loss": 1.5021933317184448, + "step": 745 + }, + { + "epoch": 1.5672268907563025, + "grad_norm": 18.209072269714934, + "learning_rate": 5.494267327123965e-06, + "loss": 1.3946982622146606, + "step": 746 + }, + { + "epoch": 1.569327731092437, + "grad_norm": 8.665816006385743, + "learning_rate": 5.482101639771255e-06, + "loss": 1.1381559371948242, + "step": 747 + }, + { + "epoch": 1.5714285714285714, + "grad_norm": 8.44106615949262, + "learning_rate": 5.469933070830574e-06, + "loss": 1.6340922117233276, + "step": 748 + }, + { + "epoch": 1.5735294117647058, + "grad_norm": 15.525808686682517, + "learning_rate": 5.457761693035139e-06, + "loss": 1.3076329231262207, + "step": 749 + }, + { + "epoch": 1.5756302521008403, + "grad_norm": 17.23937998928761, + "learning_rate": 5.44558757913495e-06, + "loss": 1.4544854164123535, + "step": 750 + }, + { + "epoch": 1.5777310924369747, + "grad_norm": 12.32276892072033, + "learning_rate": 5.433410801896366e-06, + "loss": 1.254534363746643, + "step": 751 + }, + { + "epoch": 1.5798319327731094, + "grad_norm": 15.375685102500293, + "learning_rate": 5.4212314341016645e-06, + "loss": 1.6915278434753418, + "step": 752 + }, + { + "epoch": 1.5819327731092439, + "grad_norm": 11.585921032972996, + "learning_rate": 5.409049548548604e-06, + "loss": 1.9941121339797974, + "step": 753 + }, + { + "epoch": 1.5840336134453783, + "grad_norm": 20.541716513837855, + "learning_rate": 5.396865218049995e-06, + "loss": 1.8611130714416504, + "step": 754 + }, + { + "epoch": 1.5861344537815127, + "grad_norm": 8.615776619323707, + "learning_rate": 5.38467851543326e-06, + "loss": 1.5740795135498047, + "step": 755 + }, + { + "epoch": 1.5882352941176472, + "grad_norm": 11.309502746225869, + "learning_rate": 5.3724895135400015e-06, + "loss": 2.713351249694824, + "step": 756 + }, + { + "epoch": 1.5903361344537816, + "grad_norm": 10.253542895381939, + "learning_rate": 5.360298285225564e-06, + "loss": 1.3163414001464844, + "step": 757 + }, + { + "epoch": 1.592436974789916, + "grad_norm": 9.938347580214066, + "learning_rate": 5.3481049033586e-06, + "loss": 1.2127149105072021, + "step": 758 + }, + { + "epoch": 1.5945378151260505, + "grad_norm": 8.342953472089572, + "learning_rate": 5.335909440820635e-06, + "loss": 1.7897974252700806, + "step": 759 + }, + { + "epoch": 1.596638655462185, + "grad_norm": 15.069858504573101, + "learning_rate": 5.323711970505627e-06, + "loss": 1.1387288570404053, + "step": 760 + }, + { + "epoch": 1.5987394957983194, + "grad_norm": 11.085133444710992, + "learning_rate": 5.311512565319542e-06, + "loss": 1.3364837169647217, + "step": 761 + }, + { + "epoch": 1.6008403361344539, + "grad_norm": 32.930598343392575, + "learning_rate": 5.299311298179904e-06, + "loss": 1.5517654418945312, + "step": 762 + }, + { + "epoch": 1.6029411764705883, + "grad_norm": 8.444149682468657, + "learning_rate": 5.287108242015371e-06, + "loss": 1.3167724609375, + "step": 763 + }, + { + "epoch": 1.6050420168067228, + "grad_norm": 11.755149351980176, + "learning_rate": 5.27490346976529e-06, + "loss": 0.9891781210899353, + "step": 764 + }, + { + "epoch": 1.6071428571428572, + "grad_norm": 7.559294905407309, + "learning_rate": 5.2626970543792685e-06, + "loss": 1.4272327423095703, + "step": 765 + }, + { + "epoch": 1.6092436974789917, + "grad_norm": 15.95519407006552, + "learning_rate": 5.250489068816734e-06, + "loss": 1.5374692678451538, + "step": 766 + }, + { + "epoch": 1.611344537815126, + "grad_norm": 11.13469591726469, + "learning_rate": 5.238279586046499e-06, + "loss": 2.130378484725952, + "step": 767 + }, + { + "epoch": 1.6134453781512605, + "grad_norm": 7.655252597687492, + "learning_rate": 5.226068679046327e-06, + "loss": 1.0989816188812256, + "step": 768 + }, + { + "epoch": 1.615546218487395, + "grad_norm": 13.788475789937872, + "learning_rate": 5.21385642080249e-06, + "loss": 1.4945666790008545, + "step": 769 + }, + { + "epoch": 1.6176470588235294, + "grad_norm": 10.474320077857882, + "learning_rate": 5.201642884309341e-06, + "loss": 2.0057296752929688, + "step": 770 + }, + { + "epoch": 1.6197478991596639, + "grad_norm": 15.324254986466453, + "learning_rate": 5.189428142568872e-06, + "loss": 1.1791839599609375, + "step": 771 + }, + { + "epoch": 1.6218487394957983, + "grad_norm": 9.947837053439045, + "learning_rate": 5.177212268590277e-06, + "loss": 1.836449384689331, + "step": 772 + }, + { + "epoch": 1.6239495798319328, + "grad_norm": 13.279110268267903, + "learning_rate": 5.16499533538952e-06, + "loss": 1.711057424545288, + "step": 773 + }, + { + "epoch": 1.6260504201680672, + "grad_norm": 8.331904700424623, + "learning_rate": 5.152777415988894e-06, + "loss": 1.5274529457092285, + "step": 774 + }, + { + "epoch": 1.6281512605042017, + "grad_norm": 8.55624828912363, + "learning_rate": 5.140558583416591e-06, + "loss": 1.687756061553955, + "step": 775 + }, + { + "epoch": 1.6302521008403361, + "grad_norm": 13.622302699665928, + "learning_rate": 5.128338910706254e-06, + "loss": 1.857285976409912, + "step": 776 + }, + { + "epoch": 1.6323529411764706, + "grad_norm": 10.381639920961357, + "learning_rate": 5.1161184708965525e-06, + "loss": 2.2893779277801514, + "step": 777 + }, + { + "epoch": 1.634453781512605, + "grad_norm": 13.136015822018155, + "learning_rate": 5.103897337030742e-06, + "loss": 1.299177646636963, + "step": 778 + }, + { + "epoch": 1.6365546218487395, + "grad_norm": 12.717300364122215, + "learning_rate": 5.091675582156224e-06, + "loss": 1.156067132949829, + "step": 779 + }, + { + "epoch": 1.638655462184874, + "grad_norm": 12.064277910399447, + "learning_rate": 5.07945327932411e-06, + "loss": 1.6888867616653442, + "step": 780 + }, + { + "epoch": 1.6407563025210083, + "grad_norm": 18.58505757321674, + "learning_rate": 5.067230501588792e-06, + "loss": 2.480485677719116, + "step": 781 + }, + { + "epoch": 1.6428571428571428, + "grad_norm": 10.797297449293279, + "learning_rate": 5.055007322007497e-06, + "loss": 1.1827846765518188, + "step": 782 + }, + { + "epoch": 1.6449579831932772, + "grad_norm": 8.451797960661173, + "learning_rate": 5.0427838136398545e-06, + "loss": 0.9974920749664307, + "step": 783 + }, + { + "epoch": 1.6470588235294117, + "grad_norm": 9.35430238275204, + "learning_rate": 5.0305600495474586e-06, + "loss": 1.3341560363769531, + "step": 784 + }, + { + "epoch": 1.6491596638655461, + "grad_norm": 12.853381185509344, + "learning_rate": 5.018336102793433e-06, + "loss": 1.7801398038864136, + "step": 785 + }, + { + "epoch": 1.6512605042016806, + "grad_norm": 9.421435792652487, + "learning_rate": 5.006112046441993e-06, + "loss": 1.5409959554672241, + "step": 786 + }, + { + "epoch": 1.653361344537815, + "grad_norm": 17.569411033601973, + "learning_rate": 4.993887953558008e-06, + "loss": 1.7089118957519531, + "step": 787 + }, + { + "epoch": 1.6554621848739495, + "grad_norm": 7.577368880962854, + "learning_rate": 4.981663897206568e-06, + "loss": 1.5989807844161987, + "step": 788 + }, + { + "epoch": 1.657563025210084, + "grad_norm": 8.077886545894733, + "learning_rate": 4.969439950452543e-06, + "loss": 1.4693567752838135, + "step": 789 + }, + { + "epoch": 1.6596638655462184, + "grad_norm": 9.785283960809164, + "learning_rate": 4.957216186360147e-06, + "loss": 1.7319889068603516, + "step": 790 + }, + { + "epoch": 1.6617647058823528, + "grad_norm": 9.333867287657988, + "learning_rate": 4.944992677992505e-06, + "loss": 1.38368558883667, + "step": 791 + }, + { + "epoch": 1.6638655462184873, + "grad_norm": 12.124257442308217, + "learning_rate": 4.932769498411209e-06, + "loss": 1.9276368618011475, + "step": 792 + }, + { + "epoch": 1.6659663865546217, + "grad_norm": 11.917503250417354, + "learning_rate": 4.9205467206758914e-06, + "loss": 1.5189965963363647, + "step": 793 + }, + { + "epoch": 1.6680672268907561, + "grad_norm": 10.697092148525952, + "learning_rate": 4.908324417843779e-06, + "loss": 1.8080897331237793, + "step": 794 + }, + { + "epoch": 1.6701680672268906, + "grad_norm": 13.667659355410398, + "learning_rate": 4.896102662969259e-06, + "loss": 1.3283686637878418, + "step": 795 + }, + { + "epoch": 1.6722689075630253, + "grad_norm": 10.250252779637346, + "learning_rate": 4.883881529103448e-06, + "loss": 1.7254778146743774, + "step": 796 + }, + { + "epoch": 1.6743697478991597, + "grad_norm": 23.09605024251299, + "learning_rate": 4.8716610892937486e-06, + "loss": 1.882294774055481, + "step": 797 + }, + { + "epoch": 1.6764705882352942, + "grad_norm": 9.75260822435192, + "learning_rate": 4.859441416583412e-06, + "loss": 1.955444574356079, + "step": 798 + }, + { + "epoch": 1.6785714285714286, + "grad_norm": 9.214097989478232, + "learning_rate": 4.847222584011107e-06, + "loss": 1.3442355394363403, + "step": 799 + }, + { + "epoch": 1.680672268907563, + "grad_norm": 7.0621430973608295, + "learning_rate": 4.8350046646104815e-06, + "loss": 1.3532618284225464, + "step": 800 + }, + { + "epoch": 1.6827731092436975, + "grad_norm": 9.43032823639271, + "learning_rate": 4.8227877314097245e-06, + "loss": 1.8527226448059082, + "step": 801 + }, + { + "epoch": 1.684873949579832, + "grad_norm": 42.238546118436666, + "learning_rate": 4.81057185743113e-06, + "loss": 2.1312098503112793, + "step": 802 + }, + { + "epoch": 1.6869747899159664, + "grad_norm": 19.238236915867475, + "learning_rate": 4.798357115690661e-06, + "loss": 1.3131635189056396, + "step": 803 + }, + { + "epoch": 1.6890756302521008, + "grad_norm": 11.839412971623531, + "learning_rate": 4.7861435791975124e-06, + "loss": 1.057523488998413, + "step": 804 + }, + { + "epoch": 1.6911764705882353, + "grad_norm": 16.330203992434377, + "learning_rate": 4.7739313209536755e-06, + "loss": 1.510682225227356, + "step": 805 + }, + { + "epoch": 1.6932773109243697, + "grad_norm": 9.476255130895225, + "learning_rate": 4.761720413953503e-06, + "loss": 2.0877933502197266, + "step": 806 + }, + { + "epoch": 1.6953781512605042, + "grad_norm": 18.00296013944893, + "learning_rate": 4.7495109311832665e-06, + "loss": 0.9936963319778442, + "step": 807 + }, + { + "epoch": 1.6974789915966386, + "grad_norm": 12.213588808955969, + "learning_rate": 4.737302945620732e-06, + "loss": 1.4148988723754883, + "step": 808 + }, + { + "epoch": 1.699579831932773, + "grad_norm": 16.652878791868638, + "learning_rate": 4.72509653023471e-06, + "loss": 1.5457355976104736, + "step": 809 + }, + { + "epoch": 1.7016806722689075, + "grad_norm": 12.137844142300786, + "learning_rate": 4.712891757984629e-06, + "loss": 1.1069682836532593, + "step": 810 + }, + { + "epoch": 1.7037815126050422, + "grad_norm": 10.383790506526612, + "learning_rate": 4.700688701820096e-06, + "loss": 2.270923376083374, + "step": 811 + }, + { + "epoch": 1.7058823529411766, + "grad_norm": 9.870143573450948, + "learning_rate": 4.688487434680459e-06, + "loss": 2.1212430000305176, + "step": 812 + }, + { + "epoch": 1.707983193277311, + "grad_norm": 7.378583815892385, + "learning_rate": 4.6762880294943734e-06, + "loss": 1.340724229812622, + "step": 813 + }, + { + "epoch": 1.7100840336134455, + "grad_norm": 10.60633944294548, + "learning_rate": 4.664090559179367e-06, + "loss": 1.1250860691070557, + "step": 814 + }, + { + "epoch": 1.71218487394958, + "grad_norm": 10.395256226604776, + "learning_rate": 4.651895096641402e-06, + "loss": 1.3906278610229492, + "step": 815 + }, + { + "epoch": 1.7142857142857144, + "grad_norm": 14.563103162972197, + "learning_rate": 4.639701714774439e-06, + "loss": 1.5373984575271606, + "step": 816 + }, + { + "epoch": 1.7163865546218489, + "grad_norm": 11.845585553697056, + "learning_rate": 4.627510486459999e-06, + "loss": 1.1511554718017578, + "step": 817 + }, + { + "epoch": 1.7184873949579833, + "grad_norm": 12.016172591706953, + "learning_rate": 4.615321484566741e-06, + "loss": 1.0511482954025269, + "step": 818 + }, + { + "epoch": 1.7205882352941178, + "grad_norm": 24.328922920047308, + "learning_rate": 4.603134781950007e-06, + "loss": 1.6539651155471802, + "step": 819 + }, + { + "epoch": 1.7226890756302522, + "grad_norm": 10.354684370723726, + "learning_rate": 4.590950451451397e-06, + "loss": 1.7340842485427856, + "step": 820 + }, + { + "epoch": 1.7247899159663866, + "grad_norm": 9.128876197606015, + "learning_rate": 4.578768565898337e-06, + "loss": 1.9771497249603271, + "step": 821 + }, + { + "epoch": 1.726890756302521, + "grad_norm": 13.12308018791223, + "learning_rate": 4.566589198103635e-06, + "loss": 1.6702903509140015, + "step": 822 + }, + { + "epoch": 1.7289915966386555, + "grad_norm": 14.032448855066312, + "learning_rate": 4.554412420865052e-06, + "loss": 1.2594914436340332, + "step": 823 + }, + { + "epoch": 1.73109243697479, + "grad_norm": 11.631886990165667, + "learning_rate": 4.542238306964863e-06, + "loss": 1.2319787740707397, + "step": 824 + }, + { + "epoch": 1.7331932773109244, + "grad_norm": 12.012430999144566, + "learning_rate": 4.530066929169427e-06, + "loss": 1.631975769996643, + "step": 825 + }, + { + "epoch": 1.7352941176470589, + "grad_norm": 14.157695450219515, + "learning_rate": 4.5178983602287476e-06, + "loss": 1.4831879138946533, + "step": 826 + }, + { + "epoch": 1.7373949579831933, + "grad_norm": 12.493623072525319, + "learning_rate": 4.505732672876037e-06, + "loss": 1.225109338760376, + "step": 827 + }, + { + "epoch": 1.7394957983193278, + "grad_norm": 30.459517703838213, + "learning_rate": 4.493569939827288e-06, + "loss": 1.6191500425338745, + "step": 828 + }, + { + "epoch": 1.7415966386554622, + "grad_norm": 10.531191971687601, + "learning_rate": 4.48141023378083e-06, + "loss": 1.562519907951355, + "step": 829 + }, + { + "epoch": 1.7436974789915967, + "grad_norm": 20.955204277046732, + "learning_rate": 4.4692536274169055e-06, + "loss": 1.5889461040496826, + "step": 830 + }, + { + "epoch": 1.745798319327731, + "grad_norm": 16.275459231962, + "learning_rate": 4.457100193397226e-06, + "loss": 0.8582566976547241, + "step": 831 + }, + { + "epoch": 1.7478991596638656, + "grad_norm": 8.59181477774897, + "learning_rate": 4.444950004364542e-06, + "loss": 1.2409437894821167, + "step": 832 + }, + { + "epoch": 1.75, + "grad_norm": 11.280859647806443, + "learning_rate": 4.432803132942208e-06, + "loss": 1.2449380159378052, + "step": 833 + }, + { + "epoch": 1.7521008403361344, + "grad_norm": 13.088404793322951, + "learning_rate": 4.420659651733751e-06, + "loss": 1.2676522731781006, + "step": 834 + }, + { + "epoch": 1.754201680672269, + "grad_norm": 10.60776961423833, + "learning_rate": 4.40851963332243e-06, + "loss": 1.5941420793533325, + "step": 835 + }, + { + "epoch": 1.7563025210084033, + "grad_norm": 17.131655688023486, + "learning_rate": 4.396383150270811e-06, + "loss": 1.1451562643051147, + "step": 836 + }, + { + "epoch": 1.7584033613445378, + "grad_norm": 16.683478300158875, + "learning_rate": 4.384250275120325e-06, + "loss": 1.4305951595306396, + "step": 837 + }, + { + "epoch": 1.7605042016806722, + "grad_norm": 23.521629142849456, + "learning_rate": 4.372121080390841e-06, + "loss": 1.9824583530426025, + "step": 838 + }, + { + "epoch": 1.7626050420168067, + "grad_norm": 12.354999677804352, + "learning_rate": 4.359995638580226e-06, + "loss": 1.2548645734786987, + "step": 839 + }, + { + "epoch": 1.7647058823529411, + "grad_norm": 11.031648245105625, + "learning_rate": 4.34787402216392e-06, + "loss": 1.8208611011505127, + "step": 840 + }, + { + "epoch": 1.7668067226890756, + "grad_norm": 12.87350659067892, + "learning_rate": 4.335756303594493e-06, + "loss": 1.3555166721343994, + "step": 841 + }, + { + "epoch": 1.76890756302521, + "grad_norm": 11.399790863860508, + "learning_rate": 4.323642555301222e-06, + "loss": 0.9843342900276184, + "step": 842 + }, + { + "epoch": 1.7710084033613445, + "grad_norm": 9.734229808167726, + "learning_rate": 4.311532849689649e-06, + "loss": 1.5203514099121094, + "step": 843 + }, + { + "epoch": 1.773109243697479, + "grad_norm": 12.62619531995832, + "learning_rate": 4.299427259141155e-06, + "loss": 2.226682662963867, + "step": 844 + }, + { + "epoch": 1.7752100840336134, + "grad_norm": 9.352423304681453, + "learning_rate": 4.2873258560125244e-06, + "loss": 1.4532074928283691, + "step": 845 + }, + { + "epoch": 1.7773109243697478, + "grad_norm": 13.614475982132188, + "learning_rate": 4.275228712635511e-06, + "loss": 0.939800500869751, + "step": 846 + }, + { + "epoch": 1.7794117647058822, + "grad_norm": 7.898241318034454, + "learning_rate": 4.263135901316406e-06, + "loss": 0.9362924098968506, + "step": 847 + }, + { + "epoch": 1.7815126050420167, + "grad_norm": 12.878302238594825, + "learning_rate": 4.251047494335616e-06, + "loss": 1.4257563352584839, + "step": 848 + }, + { + "epoch": 1.7836134453781511, + "grad_norm": 11.607398907584903, + "learning_rate": 4.238963563947212e-06, + "loss": 1.393942952156067, + "step": 849 + }, + { + "epoch": 1.7857142857142856, + "grad_norm": 9.414377919796664, + "learning_rate": 4.226884182378513e-06, + "loss": 1.588603138923645, + "step": 850 + }, + { + "epoch": 1.78781512605042, + "grad_norm": 9.24807113557597, + "learning_rate": 4.2148094218296485e-06, + "loss": 1.198427677154541, + "step": 851 + }, + { + "epoch": 1.7899159663865545, + "grad_norm": 9.93269092312877, + "learning_rate": 4.202739354473127e-06, + "loss": 1.0912418365478516, + "step": 852 + }, + { + "epoch": 1.792016806722689, + "grad_norm": 9.934910320433355, + "learning_rate": 4.190674052453405e-06, + "loss": 1.8104877471923828, + "step": 853 + }, + { + "epoch": 1.7941176470588234, + "grad_norm": 9.124793784485341, + "learning_rate": 4.178613587886455e-06, + "loss": 1.337807297706604, + "step": 854 + }, + { + "epoch": 1.7962184873949578, + "grad_norm": 12.887138564407095, + "learning_rate": 4.166558032859339e-06, + "loss": 1.0441133975982666, + "step": 855 + }, + { + "epoch": 1.7983193277310925, + "grad_norm": 13.183784075535518, + "learning_rate": 4.154507459429769e-06, + "loss": 1.8002381324768066, + "step": 856 + }, + { + "epoch": 1.800420168067227, + "grad_norm": 17.636030537350624, + "learning_rate": 4.142461939625685e-06, + "loss": 1.7534747123718262, + "step": 857 + }, + { + "epoch": 1.8025210084033614, + "grad_norm": 13.439089280649503, + "learning_rate": 4.13042154544482e-06, + "loss": 2.5967888832092285, + "step": 858 + }, + { + "epoch": 1.8046218487394958, + "grad_norm": 11.531721271683752, + "learning_rate": 4.1183863488542686e-06, + "loss": 0.9714012145996094, + "step": 859 + }, + { + "epoch": 1.8067226890756303, + "grad_norm": 39.93239963926744, + "learning_rate": 4.106356421790062e-06, + "loss": 2.0358502864837646, + "step": 860 + }, + { + "epoch": 1.8088235294117647, + "grad_norm": 13.143824988546921, + "learning_rate": 4.094331836156732e-06, + "loss": 1.2078362703323364, + "step": 861 + }, + { + "epoch": 1.8109243697478992, + "grad_norm": 17.216726387192157, + "learning_rate": 4.082312663826886e-06, + "loss": 1.3551952838897705, + "step": 862 + }, + { + "epoch": 1.8130252100840336, + "grad_norm": 9.960021372460178, + "learning_rate": 4.070298976640772e-06, + "loss": 1.7473708391189575, + "step": 863 + }, + { + "epoch": 1.815126050420168, + "grad_norm": 8.856051876807816, + "learning_rate": 4.058290846405856e-06, + "loss": 1.1888244152069092, + "step": 864 + }, + { + "epoch": 1.8172268907563025, + "grad_norm": 16.353016649836196, + "learning_rate": 4.046288344896388e-06, + "loss": 1.7867594957351685, + "step": 865 + }, + { + "epoch": 1.819327731092437, + "grad_norm": 12.062167246659023, + "learning_rate": 4.034291543852973e-06, + "loss": 1.2903845310211182, + "step": 866 + }, + { + "epoch": 1.8214285714285714, + "grad_norm": 12.560697459985716, + "learning_rate": 4.022300514982146e-06, + "loss": 1.4051203727722168, + "step": 867 + }, + { + "epoch": 1.8235294117647058, + "grad_norm": 7.497031379547495, + "learning_rate": 4.010315329955941e-06, + "loss": 1.7378381490707397, + "step": 868 + }, + { + "epoch": 1.8256302521008403, + "grad_norm": 13.858534174862163, + "learning_rate": 3.998336060411459e-06, + "loss": 1.1623207330703735, + "step": 869 + }, + { + "epoch": 1.8277310924369747, + "grad_norm": 16.260048868681064, + "learning_rate": 3.986362777950448e-06, + "loss": 1.9922326803207397, + "step": 870 + }, + { + "epoch": 1.8298319327731094, + "grad_norm": 10.526911105706054, + "learning_rate": 3.9743955541388645e-06, + "loss": 1.8183355331420898, + "step": 871 + }, + { + "epoch": 1.8319327731092439, + "grad_norm": 30.127353686918507, + "learning_rate": 3.962434460506459e-06, + "loss": 1.20865797996521, + "step": 872 + }, + { + "epoch": 1.8340336134453783, + "grad_norm": 9.693811930511602, + "learning_rate": 3.950479568546336e-06, + "loss": 1.2787063121795654, + "step": 873 + }, + { + "epoch": 1.8361344537815127, + "grad_norm": 18.05960154864148, + "learning_rate": 3.938530949714533e-06, + "loss": 2.1469886302948, + "step": 874 + }, + { + "epoch": 1.8382352941176472, + "grad_norm": 18.30460348258425, + "learning_rate": 3.926588675429591e-06, + "loss": 2.5014071464538574, + "step": 875 + }, + { + "epoch": 1.8403361344537816, + "grad_norm": 9.407437407393076, + "learning_rate": 3.914652817072132e-06, + "loss": 1.2857444286346436, + "step": 876 + }, + { + "epoch": 1.842436974789916, + "grad_norm": 16.37890925961833, + "learning_rate": 3.902723445984425e-06, + "loss": 0.8846265077590942, + "step": 877 + }, + { + "epoch": 1.8445378151260505, + "grad_norm": 23.642202819656244, + "learning_rate": 3.890800633469968e-06, + "loss": 3.6164169311523438, + "step": 878 + }, + { + "epoch": 1.846638655462185, + "grad_norm": 13.713411145435602, + "learning_rate": 3.878884450793053e-06, + "loss": 1.778512954711914, + "step": 879 + }, + { + "epoch": 1.8487394957983194, + "grad_norm": 14.191930149580415, + "learning_rate": 3.866974969178348e-06, + "loss": 1.2984943389892578, + "step": 880 + }, + { + "epoch": 1.8508403361344539, + "grad_norm": 11.358190736464952, + "learning_rate": 3.855072259810465e-06, + "loss": 1.233088493347168, + "step": 881 + }, + { + "epoch": 1.8529411764705883, + "grad_norm": 12.19590848916144, + "learning_rate": 3.8431763938335415e-06, + "loss": 1.0973716974258423, + "step": 882 + }, + { + "epoch": 1.8550420168067228, + "grad_norm": 8.299847504153597, + "learning_rate": 3.831287442350806e-06, + "loss": 1.9479036331176758, + "step": 883 + }, + { + "epoch": 1.8571428571428572, + "grad_norm": 25.32246065502413, + "learning_rate": 3.819405476424164e-06, + "loss": 2.3243212699890137, + "step": 884 + }, + { + "epoch": 1.8592436974789917, + "grad_norm": 16.82297657925073, + "learning_rate": 3.8075305670737605e-06, + "loss": 2.167454242706299, + "step": 885 + }, + { + "epoch": 1.861344537815126, + "grad_norm": 21.753642919267325, + "learning_rate": 3.795662785277568e-06, + "loss": 1.3896931409835815, + "step": 886 + }, + { + "epoch": 1.8634453781512605, + "grad_norm": 11.74483761622084, + "learning_rate": 3.783802201970953e-06, + "loss": 1.7062684297561646, + "step": 887 + }, + { + "epoch": 1.865546218487395, + "grad_norm": 10.437798829559927, + "learning_rate": 3.7719488880462596e-06, + "loss": 1.996096134185791, + "step": 888 + }, + { + "epoch": 1.8676470588235294, + "grad_norm": 12.757708819402238, + "learning_rate": 3.7601029143523767e-06, + "loss": 0.9396399259567261, + "step": 889 + }, + { + "epoch": 1.8697478991596639, + "grad_norm": 9.851656503119592, + "learning_rate": 3.748264351694324e-06, + "loss": 1.384545922279358, + "step": 890 + }, + { + "epoch": 1.8718487394957983, + "grad_norm": 9.806551408884758, + "learning_rate": 3.7364332708328232e-06, + "loss": 1.298504114151001, + "step": 891 + }, + { + "epoch": 1.8739495798319328, + "grad_norm": 10.623737292924032, + "learning_rate": 3.7246097424838746e-06, + "loss": 1.395151138305664, + "step": 892 + }, + { + "epoch": 1.8760504201680672, + "grad_norm": 10.061693679195699, + "learning_rate": 3.712793837318338e-06, + "loss": 0.9280238747596741, + "step": 893 + }, + { + "epoch": 1.8781512605042017, + "grad_norm": 15.132177107654861, + "learning_rate": 3.7009856259615074e-06, + "loss": 1.3795464038848877, + "step": 894 + }, + { + "epoch": 1.8802521008403361, + "grad_norm": 6.163863926370169, + "learning_rate": 3.689185178992689e-06, + "loss": 1.3113572597503662, + "step": 895 + }, + { + "epoch": 1.8823529411764706, + "grad_norm": 9.130793358710777, + "learning_rate": 3.677392566944783e-06, + "loss": 1.580859661102295, + "step": 896 + }, + { + "epoch": 1.884453781512605, + "grad_norm": 9.259911678328434, + "learning_rate": 3.665607860303857e-06, + "loss": 1.5074641704559326, + "step": 897 + }, + { + "epoch": 1.8865546218487395, + "grad_norm": 11.62240320198324, + "learning_rate": 3.653831129508727e-06, + "loss": 1.438436508178711, + "step": 898 + }, + { + "epoch": 1.888655462184874, + "grad_norm": 21.40632893627489, + "learning_rate": 3.642062444950537e-06, + "loss": 2.4116339683532715, + "step": 899 + }, + { + "epoch": 1.8907563025210083, + "grad_norm": 11.75786970161833, + "learning_rate": 3.630301876972337e-06, + "loss": 1.5296099185943604, + "step": 900 + }, + { + "epoch": 1.8928571428571428, + "grad_norm": 13.176259265738059, + "learning_rate": 3.618549495868662e-06, + "loss": 1.7645788192749023, + "step": 901 + }, + { + "epoch": 1.8949579831932772, + "grad_norm": 8.946035833702966, + "learning_rate": 3.606805371885117e-06, + "loss": 1.528565526008606, + "step": 902 + }, + { + "epoch": 1.8970588235294117, + "grad_norm": 9.910748332846175, + "learning_rate": 3.5950695752179487e-06, + "loss": 1.5352060794830322, + "step": 903 + }, + { + "epoch": 1.8991596638655461, + "grad_norm": 8.872120526454859, + "learning_rate": 3.5833421760136323e-06, + "loss": 1.2181806564331055, + "step": 904 + }, + { + "epoch": 1.9012605042016806, + "grad_norm": 8.52566041071061, + "learning_rate": 3.5716232443684486e-06, + "loss": 1.2715753316879272, + "step": 905 + }, + { + "epoch": 1.903361344537815, + "grad_norm": 21.774545687178733, + "learning_rate": 3.559912850328069e-06, + "loss": 1.4792617559432983, + "step": 906 + }, + { + "epoch": 1.9054621848739495, + "grad_norm": 19.592792336690916, + "learning_rate": 3.5482110638871325e-06, + "loss": 1.072256326675415, + "step": 907 + }, + { + "epoch": 1.907563025210084, + "grad_norm": 13.065810555435853, + "learning_rate": 3.5365179549888306e-06, + "loss": 1.5988600254058838, + "step": 908 + }, + { + "epoch": 1.9096638655462184, + "grad_norm": 21.891373834171244, + "learning_rate": 3.524833593524487e-06, + "loss": 2.473078489303589, + "step": 909 + }, + { + "epoch": 1.9117647058823528, + "grad_norm": 10.756654205561983, + "learning_rate": 3.513158049333141e-06, + "loss": 1.8987966775894165, + "step": 910 + }, + { + "epoch": 1.9138655462184873, + "grad_norm": 11.56568429501611, + "learning_rate": 3.50149139220113e-06, + "loss": 1.6164718866348267, + "step": 911 + }, + { + "epoch": 1.9159663865546217, + "grad_norm": 11.650144499924947, + "learning_rate": 3.4898336918616726e-06, + "loss": 1.3376764059066772, + "step": 912 + }, + { + "epoch": 1.9180672268907561, + "grad_norm": 10.167435576576402, + "learning_rate": 3.47818501799445e-06, + "loss": 1.7546143531799316, + "step": 913 + }, + { + "epoch": 1.9201680672268906, + "grad_norm": 16.044159587879186, + "learning_rate": 3.4665454402251937e-06, + "loss": 1.4916424751281738, + "step": 914 + }, + { + "epoch": 1.9222689075630253, + "grad_norm": 9.485222637010883, + "learning_rate": 3.4549150281252635e-06, + "loss": 1.6852712631225586, + "step": 915 + }, + { + "epoch": 1.9243697478991597, + "grad_norm": 17.238783509738973, + "learning_rate": 3.443293851211237e-06, + "loss": 1.7150108814239502, + "step": 916 + }, + { + "epoch": 1.9264705882352942, + "grad_norm": 13.404050851317407, + "learning_rate": 3.4316819789444893e-06, + "loss": 1.7211201190948486, + "step": 917 + }, + { + "epoch": 1.9285714285714286, + "grad_norm": 12.556393984422412, + "learning_rate": 3.4200794807307834e-06, + "loss": 0.7268713712692261, + "step": 918 + }, + { + "epoch": 1.930672268907563, + "grad_norm": 18.049874392140797, + "learning_rate": 3.40848642591985e-06, + "loss": 1.4612197875976562, + "step": 919 + }, + { + "epoch": 1.9327731092436975, + "grad_norm": 15.899805779516837, + "learning_rate": 3.3969028838049765e-06, + "loss": 2.3325533866882324, + "step": 920 + }, + { + "epoch": 1.934873949579832, + "grad_norm": 12.244325200092801, + "learning_rate": 3.3853289236225917e-06, + "loss": 1.3644397258758545, + "step": 921 + }, + { + "epoch": 1.9369747899159664, + "grad_norm": 12.06507650622523, + "learning_rate": 3.37376461455185e-06, + "loss": 1.405503273010254, + "step": 922 + }, + { + "epoch": 1.9390756302521008, + "grad_norm": 16.537370916012062, + "learning_rate": 3.362210025714222e-06, + "loss": 1.1844987869262695, + "step": 923 + }, + { + "epoch": 1.9411764705882353, + "grad_norm": 10.411642432611085, + "learning_rate": 3.350665226173078e-06, + "loss": 2.294912815093994, + "step": 924 + }, + { + "epoch": 1.9432773109243697, + "grad_norm": 7.385187019711569, + "learning_rate": 3.339130284933276e-06, + "loss": 1.3060452938079834, + "step": 925 + }, + { + "epoch": 1.9453781512605042, + "grad_norm": 11.928015027901997, + "learning_rate": 3.327605270940751e-06, + "loss": 1.5017865896224976, + "step": 926 + }, + { + "epoch": 1.9474789915966386, + "grad_norm": 23.754968850349012, + "learning_rate": 3.316090253082101e-06, + "loss": 1.9816479682922363, + "step": 927 + }, + { + "epoch": 1.949579831932773, + "grad_norm": 15.3357371335637, + "learning_rate": 3.304585300184173e-06, + "loss": 1.4715440273284912, + "step": 928 + }, + { + "epoch": 1.9516806722689075, + "grad_norm": 12.706896195884193, + "learning_rate": 3.293090481013661e-06, + "loss": 1.321998953819275, + "step": 929 + }, + { + "epoch": 1.9537815126050422, + "grad_norm": 8.254920710769508, + "learning_rate": 3.28160586427668e-06, + "loss": 1.1600078344345093, + "step": 930 + }, + { + "epoch": 1.9558823529411766, + "grad_norm": 12.971411985932859, + "learning_rate": 3.2701315186183692e-06, + "loss": 1.5981496572494507, + "step": 931 + }, + { + "epoch": 1.957983193277311, + "grad_norm": 9.707338087138305, + "learning_rate": 3.258667512622475e-06, + "loss": 1.9018357992172241, + "step": 932 + }, + { + "epoch": 1.9600840336134455, + "grad_norm": 19.34885988489593, + "learning_rate": 3.2472139148109416e-06, + "loss": 1.175397515296936, + "step": 933 + }, + { + "epoch": 1.96218487394958, + "grad_norm": 14.470424387669999, + "learning_rate": 3.2357707936435013e-06, + "loss": 0.5444597005844116, + "step": 934 + }, + { + "epoch": 1.9642857142857144, + "grad_norm": 5.567855687640852, + "learning_rate": 3.224338217517269e-06, + "loss": 1.3773345947265625, + "step": 935 + }, + { + "epoch": 1.9663865546218489, + "grad_norm": 14.622402074305704, + "learning_rate": 3.212916254766326e-06, + "loss": 2.028517007827759, + "step": 936 + }, + { + "epoch": 1.9684873949579833, + "grad_norm": 9.79269410710096, + "learning_rate": 3.20150497366132e-06, + "loss": 0.9947667121887207, + "step": 937 + }, + { + "epoch": 1.9705882352941178, + "grad_norm": 27.334085978635635, + "learning_rate": 3.190104442409052e-06, + "loss": 1.7532271146774292, + "step": 938 + }, + { + "epoch": 1.9726890756302522, + "grad_norm": 12.841320289359894, + "learning_rate": 3.1787147291520675e-06, + "loss": 2.114809036254883, + "step": 939 + }, + { + "epoch": 1.9747899159663866, + "grad_norm": 11.483734843753465, + "learning_rate": 3.1673359019682538e-06, + "loss": 2.2796754837036133, + "step": 940 + }, + { + "epoch": 1.976890756302521, + "grad_norm": 11.440585157823008, + "learning_rate": 3.1559680288704297e-06, + "loss": 1.172208547592163, + "step": 941 + }, + { + "epoch": 1.9789915966386555, + "grad_norm": 17.223673892561905, + "learning_rate": 3.1446111778059405e-06, + "loss": 1.1454124450683594, + "step": 942 + }, + { + "epoch": 1.98109243697479, + "grad_norm": 9.23862037561014, + "learning_rate": 3.1332654166562494e-06, + "loss": 1.6078896522521973, + "step": 943 + }, + { + "epoch": 1.9831932773109244, + "grad_norm": 8.824526781008897, + "learning_rate": 3.1219308132365365e-06, + "loss": 1.2369673252105713, + "step": 944 + }, + { + "epoch": 1.9852941176470589, + "grad_norm": 10.697868664174909, + "learning_rate": 3.110607435295289e-06, + "loss": 1.075582504272461, + "step": 945 + }, + { + "epoch": 1.9873949579831933, + "grad_norm": 10.407621014847015, + "learning_rate": 3.099295350513898e-06, + "loss": 0.9495413899421692, + "step": 946 + }, + { + "epoch": 1.9894957983193278, + "grad_norm": 12.92768742395414, + "learning_rate": 3.087994626506254e-06, + "loss": 1.3577098846435547, + "step": 947 + }, + { + "epoch": 1.9915966386554622, + "grad_norm": 15.824553960297969, + "learning_rate": 3.0767053308183416e-06, + "loss": 1.229673981666565, + "step": 948 + }, + { + "epoch": 1.9936974789915967, + "grad_norm": 10.163559398603317, + "learning_rate": 3.0654275309278382e-06, + "loss": 1.3727761507034302, + "step": 949 + }, + { + "epoch": 1.995798319327731, + "grad_norm": 24.18617513536731, + "learning_rate": 3.0541612942437095e-06, + "loss": 1.2849650382995605, + "step": 950 + }, + { + "epoch": 1.9978991596638656, + "grad_norm": 11.306358671227525, + "learning_rate": 3.0429066881058036e-06, + "loss": 1.644538164138794, + "step": 951 + }, + { + "epoch": 2.0, + "grad_norm": 8.518728725517601, + "learning_rate": 3.031663779784454e-06, + "loss": 1.627841591835022, + "step": 952 + }, + { + "epoch": 2.0021008403361344, + "grad_norm": 7.931423247551538, + "learning_rate": 3.020432636480074e-06, + "loss": 0.2781870365142822, + "step": 953 + }, + { + "epoch": 2.004201680672269, + "grad_norm": 10.005905501706337, + "learning_rate": 3.0092133253227563e-06, + "loss": 0.4595562815666199, + "step": 954 + }, + { + "epoch": 2.0063025210084033, + "grad_norm": 11.609856477894333, + "learning_rate": 2.9980059133718687e-06, + "loss": 0.5985803604125977, + "step": 955 + }, + { + "epoch": 2.008403361344538, + "grad_norm": 9.586217141888886, + "learning_rate": 2.986810467615659e-06, + "loss": 0.41152679920196533, + "step": 956 + }, + { + "epoch": 2.0105042016806722, + "grad_norm": 7.487148279080336, + "learning_rate": 2.9756270549708497e-06, + "loss": 0.2737478017807007, + "step": 957 + }, + { + "epoch": 2.0126050420168067, + "grad_norm": 7.91452475392683, + "learning_rate": 2.9644557422822406e-06, + "loss": 0.3578256368637085, + "step": 958 + }, + { + "epoch": 2.014705882352941, + "grad_norm": 8.457279529419324, + "learning_rate": 2.9532965963223076e-06, + "loss": 0.3519413471221924, + "step": 959 + }, + { + "epoch": 2.0168067226890756, + "grad_norm": 12.98619129259147, + "learning_rate": 2.9421496837908036e-06, + "loss": 0.5450835227966309, + "step": 960 + }, + { + "epoch": 2.01890756302521, + "grad_norm": 10.10649833997759, + "learning_rate": 2.9310150713143637e-06, + "loss": 0.7118933796882629, + "step": 961 + }, + { + "epoch": 2.0210084033613445, + "grad_norm": 14.582945225729798, + "learning_rate": 2.9198928254461e-06, + "loss": 0.6735545992851257, + "step": 962 + }, + { + "epoch": 2.023109243697479, + "grad_norm": 13.612285721248329, + "learning_rate": 2.908783012665209e-06, + "loss": 0.6521182060241699, + "step": 963 + }, + { + "epoch": 2.0252100840336134, + "grad_norm": 9.78372244316324, + "learning_rate": 2.8976856993765766e-06, + "loss": 0.476604163646698, + "step": 964 + }, + { + "epoch": 2.027310924369748, + "grad_norm": 12.44882078007661, + "learning_rate": 2.8866009519103705e-06, + "loss": 0.46952176094055176, + "step": 965 + }, + { + "epoch": 2.0294117647058822, + "grad_norm": 9.57528793268096, + "learning_rate": 2.875528836521658e-06, + "loss": 0.4453829526901245, + "step": 966 + }, + { + "epoch": 2.0315126050420167, + "grad_norm": 10.439598731466846, + "learning_rate": 2.864469419389997e-06, + "loss": 0.2944750189781189, + "step": 967 + }, + { + "epoch": 2.033613445378151, + "grad_norm": 11.844927445149192, + "learning_rate": 2.8534227666190484e-06, + "loss": 0.8550271391868591, + "step": 968 + }, + { + "epoch": 2.0357142857142856, + "grad_norm": 13.15280870383674, + "learning_rate": 2.8423889442361797e-06, + "loss": 0.38192200660705566, + "step": 969 + }, + { + "epoch": 2.03781512605042, + "grad_norm": 8.57118977839964, + "learning_rate": 2.831368018192071e-06, + "loss": 0.7316254377365112, + "step": 970 + }, + { + "epoch": 2.0399159663865545, + "grad_norm": 11.697813667138346, + "learning_rate": 2.8203600543603116e-06, + "loss": 0.7615312337875366, + "step": 971 + }, + { + "epoch": 2.042016806722689, + "grad_norm": 15.849948895683397, + "learning_rate": 2.809365118537024e-06, + "loss": 0.8274880647659302, + "step": 972 + }, + { + "epoch": 2.0441176470588234, + "grad_norm": 10.693659421700279, + "learning_rate": 2.7983832764404517e-06, + "loss": 0.31469643115997314, + "step": 973 + }, + { + "epoch": 2.046218487394958, + "grad_norm": 11.44650988759124, + "learning_rate": 2.787414593710583e-06, + "loss": 0.20855772495269775, + "step": 974 + }, + { + "epoch": 2.0483193277310923, + "grad_norm": 15.81504400596588, + "learning_rate": 2.7764591359087415e-06, + "loss": 0.6759412884712219, + "step": 975 + }, + { + "epoch": 2.0504201680672267, + "grad_norm": 10.204964393759596, + "learning_rate": 2.7655169685172146e-06, + "loss": 0.4555593430995941, + "step": 976 + }, + { + "epoch": 2.052521008403361, + "grad_norm": 11.261244778956014, + "learning_rate": 2.7545881569388404e-06, + "loss": 0.22477459907531738, + "step": 977 + }, + { + "epoch": 2.0546218487394956, + "grad_norm": 12.246362257874592, + "learning_rate": 2.7436727664966368e-06, + "loss": 0.47387319803237915, + "step": 978 + }, + { + "epoch": 2.05672268907563, + "grad_norm": 8.866095217298547, + "learning_rate": 2.7327708624333936e-06, + "loss": 0.46857523918151855, + "step": 979 + }, + { + "epoch": 2.0588235294117645, + "grad_norm": 13.695082205363835, + "learning_rate": 2.7218825099112966e-06, + "loss": 0.4427967071533203, + "step": 980 + }, + { + "epoch": 2.060924369747899, + "grad_norm": 14.011986042608353, + "learning_rate": 2.7110077740115315e-06, + "loss": 1.3617768287658691, + "step": 981 + }, + { + "epoch": 2.0630252100840334, + "grad_norm": 11.10530101134504, + "learning_rate": 2.7001467197338905e-06, + "loss": 0.8060270547866821, + "step": 982 + }, + { + "epoch": 2.0651260504201683, + "grad_norm": 11.494347595831918, + "learning_rate": 2.6892994119963965e-06, + "loss": 0.29366880655288696, + "step": 983 + }, + { + "epoch": 2.0672268907563027, + "grad_norm": 11.085826364505666, + "learning_rate": 2.678465915634899e-06, + "loss": 0.40074852108955383, + "step": 984 + }, + { + "epoch": 2.069327731092437, + "grad_norm": 12.536178143522665, + "learning_rate": 2.667646295402704e-06, + "loss": 0.4710817337036133, + "step": 985 + }, + { + "epoch": 2.0714285714285716, + "grad_norm": 10.305745046176337, + "learning_rate": 2.656840615970169e-06, + "loss": 0.37437137961387634, + "step": 986 + }, + { + "epoch": 2.073529411764706, + "grad_norm": 19.03565667772653, + "learning_rate": 2.646048941924333e-06, + "loss": 0.9739346504211426, + "step": 987 + }, + { + "epoch": 2.0756302521008405, + "grad_norm": 14.96080509908609, + "learning_rate": 2.635271337768517e-06, + "loss": 0.6326197981834412, + "step": 988 + }, + { + "epoch": 2.077731092436975, + "grad_norm": 7.840013094660732, + "learning_rate": 2.6245078679219503e-06, + "loss": 0.15397483110427856, + "step": 989 + }, + { + "epoch": 2.0798319327731094, + "grad_norm": 14.418579873307118, + "learning_rate": 2.613758596719373e-06, + "loss": 0.5905511379241943, + "step": 990 + }, + { + "epoch": 2.081932773109244, + "grad_norm": 11.365880088991135, + "learning_rate": 2.603023588410662e-06, + "loss": 0.588984489440918, + "step": 991 + }, + { + "epoch": 2.0840336134453783, + "grad_norm": 8.467121557746795, + "learning_rate": 2.5923029071604443e-06, + "loss": 0.33690521121025085, + "step": 992 + }, + { + "epoch": 2.0861344537815127, + "grad_norm": 12.160131630042047, + "learning_rate": 2.5815966170477065e-06, + "loss": 0.23294681310653687, + "step": 993 + }, + { + "epoch": 2.088235294117647, + "grad_norm": 10.365330226343618, + "learning_rate": 2.5709047820654236e-06, + "loss": 0.4404110908508301, + "step": 994 + }, + { + "epoch": 2.0903361344537816, + "grad_norm": 11.818988939924239, + "learning_rate": 2.5602274661201643e-06, + "loss": 0.37340593338012695, + "step": 995 + }, + { + "epoch": 2.092436974789916, + "grad_norm": 8.208877260345274, + "learning_rate": 2.549564733031722e-06, + "loss": 0.3671455979347229, + "step": 996 + }, + { + "epoch": 2.0945378151260505, + "grad_norm": 7.093067310603152, + "learning_rate": 2.538916646532718e-06, + "loss": 0.6218878030776978, + "step": 997 + }, + { + "epoch": 2.096638655462185, + "grad_norm": 18.77124675473162, + "learning_rate": 2.528283270268238e-06, + "loss": 1.2778301239013672, + "step": 998 + }, + { + "epoch": 2.0987394957983194, + "grad_norm": 11.063294944827689, + "learning_rate": 2.517664667795434e-06, + "loss": 0.6543454527854919, + "step": 999 + }, + { + "epoch": 2.100840336134454, + "grad_norm": 14.644880561077354, + "learning_rate": 2.5070609025831605e-06, + "loss": 0.42762574553489685, + "step": 1000 + }, + { + "epoch": 2.1029411764705883, + "grad_norm": 9.207415458189004, + "learning_rate": 2.49647203801158e-06, + "loss": 0.40861833095550537, + "step": 1001 + }, + { + "epoch": 2.1050420168067228, + "grad_norm": 13.2306061568643, + "learning_rate": 2.4858981373718006e-06, + "loss": 0.6941218376159668, + "step": 1002 + }, + { + "epoch": 2.107142857142857, + "grad_norm": 7.498871262137285, + "learning_rate": 2.47533926386548e-06, + "loss": 0.1615523397922516, + "step": 1003 + }, + { + "epoch": 2.1092436974789917, + "grad_norm": 10.133323758514624, + "learning_rate": 2.4647954806044633e-06, + "loss": 0.30699750781059265, + "step": 1004 + }, + { + "epoch": 2.111344537815126, + "grad_norm": 7.757159399213717, + "learning_rate": 2.454266850610398e-06, + "loss": 0.27435654401779175, + "step": 1005 + }, + { + "epoch": 2.1134453781512605, + "grad_norm": 12.86368889886839, + "learning_rate": 2.443753436814354e-06, + "loss": 0.6352673172950745, + "step": 1006 + }, + { + "epoch": 2.115546218487395, + "grad_norm": 10.035026243076201, + "learning_rate": 2.433255302056458e-06, + "loss": 0.3478729724884033, + "step": 1007 + }, + { + "epoch": 2.1176470588235294, + "grad_norm": 24.70500681984219, + "learning_rate": 2.4227725090855063e-06, + "loss": 0.3971726894378662, + "step": 1008 + }, + { + "epoch": 2.119747899159664, + "grad_norm": 10.231694956778009, + "learning_rate": 2.412305120558599e-06, + "loss": 0.9241357445716858, + "step": 1009 + }, + { + "epoch": 2.1218487394957983, + "grad_norm": 10.754074840458836, + "learning_rate": 2.40185319904076e-06, + "loss": 0.2883678674697876, + "step": 1010 + }, + { + "epoch": 2.1239495798319328, + "grad_norm": 11.61442466478921, + "learning_rate": 2.391416807004568e-06, + "loss": 0.39812758564949036, + "step": 1011 + }, + { + "epoch": 2.1260504201680672, + "grad_norm": 12.063207487307261, + "learning_rate": 2.3809960068297732e-06, + "loss": 0.6487483978271484, + "step": 1012 + }, + { + "epoch": 2.1281512605042017, + "grad_norm": 10.36458033229305, + "learning_rate": 2.370590860802938e-06, + "loss": 0.44781216979026794, + "step": 1013 + }, + { + "epoch": 2.130252100840336, + "grad_norm": 12.86609548868944, + "learning_rate": 2.3602014311170524e-06, + "loss": 0.3241298496723175, + "step": 1014 + }, + { + "epoch": 2.1323529411764706, + "grad_norm": 15.003708633549396, + "learning_rate": 2.3498277798711725e-06, + "loss": 0.4608106315135956, + "step": 1015 + }, + { + "epoch": 2.134453781512605, + "grad_norm": 12.622777494736392, + "learning_rate": 2.3394699690700395e-06, + "loss": 0.5967488884925842, + "step": 1016 + }, + { + "epoch": 2.1365546218487395, + "grad_norm": 12.188684362144896, + "learning_rate": 2.3291280606237186e-06, + "loss": 0.4074782729148865, + "step": 1017 + }, + { + "epoch": 2.138655462184874, + "grad_norm": 8.220918786617895, + "learning_rate": 2.3188021163472206e-06, + "loss": 0.354820191860199, + "step": 1018 + }, + { + "epoch": 2.1407563025210083, + "grad_norm": 11.553371341140592, + "learning_rate": 2.308492197960141e-06, + "loss": 0.23287059366703033, + "step": 1019 + }, + { + "epoch": 2.142857142857143, + "grad_norm": 14.317771847578689, + "learning_rate": 2.2981983670862796e-06, + "loss": 1.0973201990127563, + "step": 1020 + }, + { + "epoch": 2.1449579831932772, + "grad_norm": 15.607772284187238, + "learning_rate": 2.2879206852532854e-06, + "loss": 0.4452645778656006, + "step": 1021 + }, + { + "epoch": 2.1470588235294117, + "grad_norm": 7.00439488336282, + "learning_rate": 2.2776592138922806e-06, + "loss": 0.273881733417511, + "step": 1022 + }, + { + "epoch": 2.149159663865546, + "grad_norm": 7.187420218160357, + "learning_rate": 2.2674140143374904e-06, + "loss": 0.20633578300476074, + "step": 1023 + }, + { + "epoch": 2.1512605042016806, + "grad_norm": 13.420920542298727, + "learning_rate": 2.2571851478258903e-06, + "loss": 0.38969674706459045, + "step": 1024 + }, + { + "epoch": 2.153361344537815, + "grad_norm": 10.472493973829605, + "learning_rate": 2.2469726754968207e-06, + "loss": 0.26989856362342834, + "step": 1025 + }, + { + "epoch": 2.1554621848739495, + "grad_norm": 7.949292792396312, + "learning_rate": 2.236776658391641e-06, + "loss": 0.5260115265846252, + "step": 1026 + }, + { + "epoch": 2.157563025210084, + "grad_norm": 10.053195823647455, + "learning_rate": 2.2265971574533474e-06, + "loss": 0.2469472587108612, + "step": 1027 + }, + { + "epoch": 2.1596638655462184, + "grad_norm": 10.2298360545254, + "learning_rate": 2.2164342335262244e-06, + "loss": 0.201723113656044, + "step": 1028 + }, + { + "epoch": 2.161764705882353, + "grad_norm": 8.12616695246335, + "learning_rate": 2.2062879473554654e-06, + "loss": 0.6355183124542236, + "step": 1029 + }, + { + "epoch": 2.1638655462184873, + "grad_norm": 8.264174037140188, + "learning_rate": 2.1961583595868253e-06, + "loss": 0.32272863388061523, + "step": 1030 + }, + { + "epoch": 2.1659663865546217, + "grad_norm": 7.57735519623744, + "learning_rate": 2.186045530766244e-06, + "loss": 0.24386917054653168, + "step": 1031 + }, + { + "epoch": 2.168067226890756, + "grad_norm": 14.627933253501514, + "learning_rate": 2.1759495213394965e-06, + "loss": 0.482686847448349, + "step": 1032 + }, + { + "epoch": 2.1701680672268906, + "grad_norm": 11.019581985915595, + "learning_rate": 2.165870391651819e-06, + "loss": 0.5142661333084106, + "step": 1033 + }, + { + "epoch": 2.172268907563025, + "grad_norm": 5.2143700025854605, + "learning_rate": 2.155808201947563e-06, + "loss": 0.21703539788722992, + "step": 1034 + }, + { + "epoch": 2.1743697478991595, + "grad_norm": 8.891172137251035, + "learning_rate": 2.145763012369824e-06, + "loss": 0.4068147540092468, + "step": 1035 + }, + { + "epoch": 2.176470588235294, + "grad_norm": 8.535335024751161, + "learning_rate": 2.1357348829600816e-06, + "loss": 0.5949288606643677, + "step": 1036 + }, + { + "epoch": 2.1785714285714284, + "grad_norm": 9.215827064680754, + "learning_rate": 2.125723873657852e-06, + "loss": 0.44353166222572327, + "step": 1037 + }, + { + "epoch": 2.180672268907563, + "grad_norm": 10.942670044267897, + "learning_rate": 2.115730044300313e-06, + "loss": 0.4212431013584137, + "step": 1038 + }, + { + "epoch": 2.1827731092436973, + "grad_norm": 9.670977047855832, + "learning_rate": 2.105753454621966e-06, + "loss": 0.37279778718948364, + "step": 1039 + }, + { + "epoch": 2.184873949579832, + "grad_norm": 15.451697195363522, + "learning_rate": 2.095794164254259e-06, + "loss": 0.6137001514434814, + "step": 1040 + }, + { + "epoch": 2.1869747899159666, + "grad_norm": 9.221135375907481, + "learning_rate": 2.0858522327252467e-06, + "loss": 0.20706136524677277, + "step": 1041 + }, + { + "epoch": 2.189075630252101, + "grad_norm": 7.176753088694497, + "learning_rate": 2.0759277194592208e-06, + "loss": 0.3732944130897522, + "step": 1042 + }, + { + "epoch": 2.1911764705882355, + "grad_norm": 6.567221722351546, + "learning_rate": 2.06602068377637e-06, + "loss": 0.11849310249090195, + "step": 1043 + }, + { + "epoch": 2.19327731092437, + "grad_norm": 8.709699534320997, + "learning_rate": 2.0561311848924082e-06, + "loss": 0.35089147090911865, + "step": 1044 + }, + { + "epoch": 2.1953781512605044, + "grad_norm": 6.892712538403868, + "learning_rate": 2.0462592819182377e-06, + "loss": 0.3482816219329834, + "step": 1045 + }, + { + "epoch": 2.197478991596639, + "grad_norm": 11.886398314518281, + "learning_rate": 2.0364050338595792e-06, + "loss": 0.9048193097114563, + "step": 1046 + }, + { + "epoch": 2.1995798319327733, + "grad_norm": 9.38373013746351, + "learning_rate": 2.0265684996166345e-06, + "loss": 0.34331268072128296, + "step": 1047 + }, + { + "epoch": 2.2016806722689077, + "grad_norm": 13.372941805785942, + "learning_rate": 2.0167497379837254e-06, + "loss": 0.35536718368530273, + "step": 1048 + }, + { + "epoch": 2.203781512605042, + "grad_norm": 7.556671458015662, + "learning_rate": 2.0069488076489445e-06, + "loss": 0.20954403281211853, + "step": 1049 + }, + { + "epoch": 2.2058823529411766, + "grad_norm": 8.35211924521852, + "learning_rate": 1.997165767193801e-06, + "loss": 0.5290908813476562, + "step": 1050 + }, + { + "epoch": 2.207983193277311, + "grad_norm": 10.477600594311985, + "learning_rate": 1.9874006750928783e-06, + "loss": 0.44289880990982056, + "step": 1051 + }, + { + "epoch": 2.2100840336134455, + "grad_norm": 8.191084415042441, + "learning_rate": 1.97765358971348e-06, + "loss": 0.48035284876823425, + "step": 1052 + }, + { + "epoch": 2.21218487394958, + "grad_norm": 14.892166225942573, + "learning_rate": 1.967924569315275e-06, + "loss": 0.2514810562133789, + "step": 1053 + }, + { + "epoch": 2.2142857142857144, + "grad_norm": 9.73259092640212, + "learning_rate": 1.958213672049964e-06, + "loss": 0.9599279165267944, + "step": 1054 + }, + { + "epoch": 2.216386554621849, + "grad_norm": 10.01655023470503, + "learning_rate": 1.9485209559609148e-06, + "loss": 0.30860060453414917, + "step": 1055 + }, + { + "epoch": 2.2184873949579833, + "grad_norm": 21.410996670654146, + "learning_rate": 1.9388464789828316e-06, + "loss": 0.7747633457183838, + "step": 1056 + }, + { + "epoch": 2.2205882352941178, + "grad_norm": 14.431755517939498, + "learning_rate": 1.9291902989413935e-06, + "loss": 0.3529064655303955, + "step": 1057 + }, + { + "epoch": 2.222689075630252, + "grad_norm": 19.684041196466477, + "learning_rate": 1.9195524735529237e-06, + "loss": 1.0967960357666016, + "step": 1058 + }, + { + "epoch": 2.2247899159663866, + "grad_norm": 9.812143417300405, + "learning_rate": 1.909933060424029e-06, + "loss": 0.700248122215271, + "step": 1059 + }, + { + "epoch": 2.226890756302521, + "grad_norm": 10.765309787627796, + "learning_rate": 1.9003321170512728e-06, + "loss": 0.9177491068840027, + "step": 1060 + }, + { + "epoch": 2.2289915966386555, + "grad_norm": 12.811209076397098, + "learning_rate": 1.890749700820813e-06, + "loss": 0.543596625328064, + "step": 1061 + }, + { + "epoch": 2.23109243697479, + "grad_norm": 17.31969106411562, + "learning_rate": 1.8811858690080764e-06, + "loss": 0.7324357032775879, + "step": 1062 + }, + { + "epoch": 2.2331932773109244, + "grad_norm": 9.418477503451474, + "learning_rate": 1.8716406787774e-06, + "loss": 0.4075426459312439, + "step": 1063 + }, + { + "epoch": 2.235294117647059, + "grad_norm": 7.9458980097838605, + "learning_rate": 1.862114187181705e-06, + "loss": 0.39563894271850586, + "step": 1064 + }, + { + "epoch": 2.2373949579831933, + "grad_norm": 8.299260491259234, + "learning_rate": 1.8526064511621455e-06, + "loss": 0.37604600191116333, + "step": 1065 + }, + { + "epoch": 2.2394957983193278, + "grad_norm": 10.435458479716717, + "learning_rate": 1.843117527547768e-06, + "loss": 0.6682062745094299, + "step": 1066 + }, + { + "epoch": 2.241596638655462, + "grad_norm": 8.776734857977067, + "learning_rate": 1.8336474730551807e-06, + "loss": 0.19220635294914246, + "step": 1067 + }, + { + "epoch": 2.2436974789915967, + "grad_norm": 14.521651377727974, + "learning_rate": 1.8241963442882005e-06, + "loss": 0.27735865116119385, + "step": 1068 + }, + { + "epoch": 2.245798319327731, + "grad_norm": 8.651493755796526, + "learning_rate": 1.8147641977375313e-06, + "loss": 0.41572022438049316, + "step": 1069 + }, + { + "epoch": 2.2478991596638656, + "grad_norm": 7.20135853576087, + "learning_rate": 1.8053510897804105e-06, + "loss": 0.25049227476119995, + "step": 1070 + }, + { + "epoch": 2.25, + "grad_norm": 8.485627286621954, + "learning_rate": 1.7959570766802847e-06, + "loss": 0.17869159579277039, + "step": 1071 + }, + { + "epoch": 2.2521008403361344, + "grad_norm": 8.831664553556859, + "learning_rate": 1.786582214586462e-06, + "loss": 0.2621746361255646, + "step": 1072 + }, + { + "epoch": 2.254201680672269, + "grad_norm": 13.640791806331189, + "learning_rate": 1.77722655953379e-06, + "loss": 0.33446362614631653, + "step": 1073 + }, + { + "epoch": 2.2563025210084033, + "grad_norm": 5.657158630793571, + "learning_rate": 1.7678901674423044e-06, + "loss": 0.17267954349517822, + "step": 1074 + }, + { + "epoch": 2.258403361344538, + "grad_norm": 11.516922535812704, + "learning_rate": 1.7585730941169105e-06, + "loss": 0.5281901955604553, + "step": 1075 + }, + { + "epoch": 2.2605042016806722, + "grad_norm": 11.298403957574713, + "learning_rate": 1.7492753952470415e-06, + "loss": 0.2754780352115631, + "step": 1076 + }, + { + "epoch": 2.2626050420168067, + "grad_norm": 10.413722402153681, + "learning_rate": 1.739997126406322e-06, + "loss": 0.3246016502380371, + "step": 1077 + }, + { + "epoch": 2.264705882352941, + "grad_norm": 14.097971965363062, + "learning_rate": 1.7307383430522474e-06, + "loss": 0.6660511493682861, + "step": 1078 + }, + { + "epoch": 2.2668067226890756, + "grad_norm": 22.503701517732946, + "learning_rate": 1.7214991005258386e-06, + "loss": 1.2165361642837524, + "step": 1079 + }, + { + "epoch": 2.26890756302521, + "grad_norm": 8.328219817576464, + "learning_rate": 1.7122794540513265e-06, + "loss": 0.18396508693695068, + "step": 1080 + }, + { + "epoch": 2.2710084033613445, + "grad_norm": 7.768308930354123, + "learning_rate": 1.703079458735805e-06, + "loss": 0.42018991708755493, + "step": 1081 + }, + { + "epoch": 2.273109243697479, + "grad_norm": 9.610477928803583, + "learning_rate": 1.6938991695689184e-06, + "loss": 0.38192903995513916, + "step": 1082 + }, + { + "epoch": 2.2752100840336134, + "grad_norm": 9.57071965935329, + "learning_rate": 1.684738641422517e-06, + "loss": 0.4953494966030121, + "step": 1083 + }, + { + "epoch": 2.277310924369748, + "grad_norm": 11.62580762547179, + "learning_rate": 1.6755979290503437e-06, + "loss": 0.5324037075042725, + "step": 1084 + }, + { + "epoch": 2.2794117647058822, + "grad_norm": 9.119930665905265, + "learning_rate": 1.666477087087694e-06, + "loss": 0.6618460416793823, + "step": 1085 + }, + { + "epoch": 2.2815126050420167, + "grad_norm": 12.668770516893803, + "learning_rate": 1.6573761700511004e-06, + "loss": 0.29154300689697266, + "step": 1086 + }, + { + "epoch": 2.283613445378151, + "grad_norm": 10.126878534173718, + "learning_rate": 1.6482952323379958e-06, + "loss": 0.39994263648986816, + "step": 1087 + }, + { + "epoch": 2.2857142857142856, + "grad_norm": 8.084921146733947, + "learning_rate": 1.639234328226399e-06, + "loss": 0.2049681693315506, + "step": 1088 + }, + { + "epoch": 2.28781512605042, + "grad_norm": 9.167757841002748, + "learning_rate": 1.6301935118745826e-06, + "loss": 0.35848674178123474, + "step": 1089 + }, + { + "epoch": 2.2899159663865545, + "grad_norm": 12.543365522318467, + "learning_rate": 1.621172837320754e-06, + "loss": 0.4794918894767761, + "step": 1090 + }, + { + "epoch": 2.292016806722689, + "grad_norm": 6.873717233986044, + "learning_rate": 1.6121723584827259e-06, + "loss": 0.3671627342700958, + "step": 1091 + }, + { + "epoch": 2.2941176470588234, + "grad_norm": 9.315544619619539, + "learning_rate": 1.6031921291576048e-06, + "loss": 0.25063830614089966, + "step": 1092 + }, + { + "epoch": 2.296218487394958, + "grad_norm": 11.618408926786485, + "learning_rate": 1.5942322030214547e-06, + "loss": 0.7581193447113037, + "step": 1093 + }, + { + "epoch": 2.2983193277310923, + "grad_norm": 7.9613247000723595, + "learning_rate": 1.5852926336289926e-06, + "loss": 0.4217086434364319, + "step": 1094 + }, + { + "epoch": 2.3004201680672267, + "grad_norm": 10.341036096752598, + "learning_rate": 1.5763734744132587e-06, + "loss": 0.5018645524978638, + "step": 1095 + }, + { + "epoch": 2.302521008403361, + "grad_norm": 14.166467122386207, + "learning_rate": 1.5674747786852935e-06, + "loss": 0.5745636224746704, + "step": 1096 + }, + { + "epoch": 2.3046218487394956, + "grad_norm": 9.77165887856765, + "learning_rate": 1.5585965996338314e-06, + "loss": 0.9145222902297974, + "step": 1097 + }, + { + "epoch": 2.30672268907563, + "grad_norm": 15.937224453039251, + "learning_rate": 1.5497389903249705e-06, + "loss": 0.4312666058540344, + "step": 1098 + }, + { + "epoch": 2.3088235294117645, + "grad_norm": 8.945920679970577, + "learning_rate": 1.5409020037018652e-06, + "loss": 0.4121660590171814, + "step": 1099 + }, + { + "epoch": 2.310924369747899, + "grad_norm": 10.839281933281265, + "learning_rate": 1.5320856925843997e-06, + "loss": 0.8646482825279236, + "step": 1100 + }, + { + "epoch": 2.3130252100840334, + "grad_norm": 12.806561724880765, + "learning_rate": 1.5232901096688847e-06, + "loss": 0.784586489200592, + "step": 1101 + }, + { + "epoch": 2.315126050420168, + "grad_norm": 10.817682905964707, + "learning_rate": 1.5145153075277286e-06, + "loss": 0.9424635171890259, + "step": 1102 + }, + { + "epoch": 2.3172268907563023, + "grad_norm": 8.922023653272449, + "learning_rate": 1.505761338609137e-06, + "loss": 0.28385645151138306, + "step": 1103 + }, + { + "epoch": 2.3193277310924367, + "grad_norm": 15.30593506620364, + "learning_rate": 1.4970282552367854e-06, + "loss": 0.6689031720161438, + "step": 1104 + }, + { + "epoch": 2.3214285714285716, + "grad_norm": 10.05546946420467, + "learning_rate": 1.4883161096095189e-06, + "loss": 0.691364586353302, + "step": 1105 + }, + { + "epoch": 2.323529411764706, + "grad_norm": 13.976863852979069, + "learning_rate": 1.4796249538010354e-06, + "loss": 0.23520073294639587, + "step": 1106 + }, + { + "epoch": 2.3256302521008405, + "grad_norm": 9.578643377397341, + "learning_rate": 1.4709548397595674e-06, + "loss": 0.4271107316017151, + "step": 1107 + }, + { + "epoch": 2.327731092436975, + "grad_norm": 16.17388877757899, + "learning_rate": 1.4623058193075852e-06, + "loss": 0.9280604720115662, + "step": 1108 + }, + { + "epoch": 2.3298319327731094, + "grad_norm": 13.041308775276805, + "learning_rate": 1.453677944141474e-06, + "loss": 0.33376407623291016, + "step": 1109 + }, + { + "epoch": 2.331932773109244, + "grad_norm": 13.186142451412863, + "learning_rate": 1.4450712658312356e-06, + "loss": 0.7442219853401184, + "step": 1110 + }, + { + "epoch": 2.3340336134453783, + "grad_norm": 10.969810510823187, + "learning_rate": 1.43648583582017e-06, + "loss": 1.27920663356781, + "step": 1111 + }, + { + "epoch": 2.3361344537815127, + "grad_norm": 22.653518753891586, + "learning_rate": 1.4279217054245793e-06, + "loss": 0.6456579566001892, + "step": 1112 + }, + { + "epoch": 2.338235294117647, + "grad_norm": 13.638307761366974, + "learning_rate": 1.4193789258334485e-06, + "loss": 1.1350394487380981, + "step": 1113 + }, + { + "epoch": 2.3403361344537816, + "grad_norm": 10.59397199917471, + "learning_rate": 1.4108575481081522e-06, + "loss": 0.5290108919143677, + "step": 1114 + }, + { + "epoch": 2.342436974789916, + "grad_norm": 9.100247445169298, + "learning_rate": 1.4023576231821362e-06, + "loss": 0.2833002209663391, + "step": 1115 + }, + { + "epoch": 2.3445378151260505, + "grad_norm": 18.49442431345445, + "learning_rate": 1.3938792018606278e-06, + "loss": 0.37826409935951233, + "step": 1116 + }, + { + "epoch": 2.346638655462185, + "grad_norm": 12.477810112402349, + "learning_rate": 1.3854223348203171e-06, + "loss": 0.3945717215538025, + "step": 1117 + }, + { + "epoch": 2.3487394957983194, + "grad_norm": 8.789544191123422, + "learning_rate": 1.376987072609065e-06, + "loss": 0.31352269649505615, + "step": 1118 + }, + { + "epoch": 2.350840336134454, + "grad_norm": 14.219313270123468, + "learning_rate": 1.368573465645599e-06, + "loss": 0.8024647235870361, + "step": 1119 + }, + { + "epoch": 2.3529411764705883, + "grad_norm": 10.007349065084831, + "learning_rate": 1.360181564219204e-06, + "loss": 0.7791054248809814, + "step": 1120 + }, + { + "epoch": 2.3550420168067228, + "grad_norm": 12.213364584526106, + "learning_rate": 1.351811418489436e-06, + "loss": 0.37381619215011597, + "step": 1121 + }, + { + "epoch": 2.357142857142857, + "grad_norm": 10.713765677783302, + "learning_rate": 1.3434630784858067e-06, + "loss": 0.3184419870376587, + "step": 1122 + }, + { + "epoch": 2.3592436974789917, + "grad_norm": 11.470256693930569, + "learning_rate": 1.335136594107498e-06, + "loss": 0.3431350886821747, + "step": 1123 + }, + { + "epoch": 2.361344537815126, + "grad_norm": 9.119684880351647, + "learning_rate": 1.3268320151230518e-06, + "loss": 0.4296434819698334, + "step": 1124 + }, + { + "epoch": 2.3634453781512605, + "grad_norm": 10.866853294417046, + "learning_rate": 1.3185493911700854e-06, + "loss": 0.48791950941085815, + "step": 1125 + }, + { + "epoch": 2.365546218487395, + "grad_norm": 9.540925370722046, + "learning_rate": 1.3102887717549812e-06, + "loss": 0.29711413383483887, + "step": 1126 + }, + { + "epoch": 2.3676470588235294, + "grad_norm": 11.627989144711366, + "learning_rate": 1.302050206252602e-06, + "loss": 0.39902636408805847, + "step": 1127 + }, + { + "epoch": 2.369747899159664, + "grad_norm": 6.365770038684127, + "learning_rate": 1.2938337439059868e-06, + "loss": 0.2864948511123657, + "step": 1128 + }, + { + "epoch": 2.3718487394957983, + "grad_norm": 12.606248234313094, + "learning_rate": 1.2856394338260691e-06, + "loss": 0.42151930928230286, + "step": 1129 + }, + { + "epoch": 2.3739495798319328, + "grad_norm": 8.544922775672411, + "learning_rate": 1.2774673249913656e-06, + "loss": 0.330949604511261, + "step": 1130 + }, + { + "epoch": 2.3760504201680672, + "grad_norm": 12.681787759512487, + "learning_rate": 1.2693174662477003e-06, + "loss": 0.832221508026123, + "step": 1131 + }, + { + "epoch": 2.3781512605042017, + "grad_norm": 16.15687539830067, + "learning_rate": 1.2611899063079002e-06, + "loss": 0.3243201971054077, + "step": 1132 + }, + { + "epoch": 2.380252100840336, + "grad_norm": 11.42137338593432, + "learning_rate": 1.253084693751514e-06, + "loss": 0.4209938049316406, + "step": 1133 + }, + { + "epoch": 2.3823529411764706, + "grad_norm": 10.49566833203582, + "learning_rate": 1.245001877024512e-06, + "loss": 0.1905173659324646, + "step": 1134 + }, + { + "epoch": 2.384453781512605, + "grad_norm": 9.325292405896798, + "learning_rate": 1.2369415044390055e-06, + "loss": 0.31655293703079224, + "step": 1135 + }, + { + "epoch": 2.3865546218487395, + "grad_norm": 12.150405014710023, + "learning_rate": 1.228903624172954e-06, + "loss": 0.2780379354953766, + "step": 1136 + }, + { + "epoch": 2.388655462184874, + "grad_norm": 7.132176058282011, + "learning_rate": 1.220888284269874e-06, + "loss": 0.5738459825515747, + "step": 1137 + }, + { + "epoch": 2.3907563025210083, + "grad_norm": 9.199984669814489, + "learning_rate": 1.2128955326385595e-06, + "loss": 0.4594503343105316, + "step": 1138 + }, + { + "epoch": 2.392857142857143, + "grad_norm": 246.0490199481034, + "learning_rate": 1.2049254170527857e-06, + "loss": 1.6502771377563477, + "step": 1139 + }, + { + "epoch": 2.3949579831932772, + "grad_norm": 10.645480745934366, + "learning_rate": 1.196977985151036e-06, + "loss": 0.7063793540000916, + "step": 1140 + }, + { + "epoch": 2.3970588235294117, + "grad_norm": 12.466682957005606, + "learning_rate": 1.1890532844362035e-06, + "loss": 0.4885460138320923, + "step": 1141 + }, + { + "epoch": 2.399159663865546, + "grad_norm": 8.222098406246245, + "learning_rate": 1.1811513622753196e-06, + "loss": 0.29537534713745117, + "step": 1142 + }, + { + "epoch": 2.4012605042016806, + "grad_norm": 10.08444013945275, + "learning_rate": 1.1732722658992597e-06, + "loss": 0.6734664440155029, + "step": 1143 + }, + { + "epoch": 2.403361344537815, + "grad_norm": 12.85839873964936, + "learning_rate": 1.1654160424024718e-06, + "loss": 0.39790263772010803, + "step": 1144 + }, + { + "epoch": 2.4054621848739495, + "grad_norm": 19.32478545248631, + "learning_rate": 1.1575827387426846e-06, + "loss": 0.2750331163406372, + "step": 1145 + }, + { + "epoch": 2.407563025210084, + "grad_norm": 9.972826363554564, + "learning_rate": 1.149772401740637e-06, + "loss": 0.44170406460762024, + "step": 1146 + }, + { + "epoch": 2.4096638655462184, + "grad_norm": 7.314481031395291, + "learning_rate": 1.1419850780797864e-06, + "loss": 0.19013899564743042, + "step": 1147 + }, + { + "epoch": 2.411764705882353, + "grad_norm": 7.432016042351664, + "learning_rate": 1.1342208143060423e-06, + "loss": 0.4140137732028961, + "step": 1148 + }, + { + "epoch": 2.4138655462184873, + "grad_norm": 11.414471382112064, + "learning_rate": 1.1264796568274811e-06, + "loss": 0.4861386716365814, + "step": 1149 + }, + { + "epoch": 2.4159663865546217, + "grad_norm": 13.684580354320987, + "learning_rate": 1.118761651914065e-06, + "loss": 0.3487178683280945, + "step": 1150 + }, + { + "epoch": 2.418067226890756, + "grad_norm": 8.714659720362214, + "learning_rate": 1.1110668456973761e-06, + "loss": 0.6119335889816284, + "step": 1151 + }, + { + "epoch": 2.4201680672268906, + "grad_norm": 10.585809423186294, + "learning_rate": 1.10339528417033e-06, + "loss": 0.24830467998981476, + "step": 1152 + }, + { + "epoch": 2.422268907563025, + "grad_norm": 6.6530689382799375, + "learning_rate": 1.0957470131869102e-06, + "loss": 0.20413950085639954, + "step": 1153 + }, + { + "epoch": 2.4243697478991595, + "grad_norm": 11.585229233250407, + "learning_rate": 1.088122078461884e-06, + "loss": 0.7759865522384644, + "step": 1154 + }, + { + "epoch": 2.426470588235294, + "grad_norm": 14.183804098321202, + "learning_rate": 1.0805205255705403e-06, + "loss": 0.9713194370269775, + "step": 1155 + }, + { + "epoch": 2.4285714285714284, + "grad_norm": 11.392423008755229, + "learning_rate": 1.0729423999484062e-06, + "loss": 0.3234805464744568, + "step": 1156 + }, + { + "epoch": 2.4306722689075633, + "grad_norm": 7.504753087219636, + "learning_rate": 1.0653877468909857e-06, + "loss": 0.2364063262939453, + "step": 1157 + }, + { + "epoch": 2.4327731092436977, + "grad_norm": 9.823099282463206, + "learning_rate": 1.0578566115534794e-06, + "loss": 0.4705219268798828, + "step": 1158 + }, + { + "epoch": 2.434873949579832, + "grad_norm": 9.451122750213175, + "learning_rate": 1.0503490389505244e-06, + "loss": 0.26277682185173035, + "step": 1159 + }, + { + "epoch": 2.4369747899159666, + "grad_norm": 9.336273451144258, + "learning_rate": 1.0428650739559138e-06, + "loss": 0.13882672786712646, + "step": 1160 + }, + { + "epoch": 2.439075630252101, + "grad_norm": 7.52407325404656, + "learning_rate": 1.0354047613023404e-06, + "loss": 0.5188834071159363, + "step": 1161 + }, + { + "epoch": 2.4411764705882355, + "grad_norm": 7.853041816369125, + "learning_rate": 1.0279681455811219e-06, + "loss": 0.24887529015541077, + "step": 1162 + }, + { + "epoch": 2.44327731092437, + "grad_norm": 10.755975449643415, + "learning_rate": 1.0205552712419343e-06, + "loss": 0.28220975399017334, + "step": 1163 + }, + { + "epoch": 2.4453781512605044, + "grad_norm": 10.623188982430918, + "learning_rate": 1.013166182592551e-06, + "loss": 0.24789491295814514, + "step": 1164 + }, + { + "epoch": 2.447478991596639, + "grad_norm": 10.265380274150749, + "learning_rate": 1.0058009237985721e-06, + "loss": 0.7892224788665771, + "step": 1165 + }, + { + "epoch": 2.4495798319327733, + "grad_norm": 11.896169947706998, + "learning_rate": 9.98459538883167e-07, + "loss": 0.26245754957199097, + "step": 1166 + }, + { + "epoch": 2.4516806722689077, + "grad_norm": 11.049089295820975, + "learning_rate": 9.911420717268023e-07, + "loss": 0.27979156374931335, + "step": 1167 + }, + { + "epoch": 2.453781512605042, + "grad_norm": 13.265137697114756, + "learning_rate": 9.838485660669906e-07, + "loss": 0.7934341430664062, + "step": 1168 + }, + { + "epoch": 2.4558823529411766, + "grad_norm": 10.018047542365926, + "learning_rate": 9.765790654980195e-07, + "loss": 0.45289355516433716, + "step": 1169 + }, + { + "epoch": 2.457983193277311, + "grad_norm": 13.567130161558774, + "learning_rate": 9.693336134706988e-07, + "loss": 0.992337703704834, + "step": 1170 + }, + { + "epoch": 2.4600840336134455, + "grad_norm": 9.387778498410693, + "learning_rate": 9.621122532920908e-07, + "loss": 0.29417842626571655, + "step": 1171 + }, + { + "epoch": 2.46218487394958, + "grad_norm": 9.114348977338564, + "learning_rate": 9.549150281252633e-07, + "loss": 0.5845852494239807, + "step": 1172 + }, + { + "epoch": 2.4642857142857144, + "grad_norm": 9.288921226395173, + "learning_rate": 9.477419809890215e-07, + "loss": 0.22582799196243286, + "step": 1173 + }, + { + "epoch": 2.466386554621849, + "grad_norm": 13.268912659944744, + "learning_rate": 9.405931547576591e-07, + "loss": 0.26232588291168213, + "step": 1174 + }, + { + "epoch": 2.4684873949579833, + "grad_norm": 9.072509999987034, + "learning_rate": 9.334685921606946e-07, + "loss": 0.9084593057632446, + "step": 1175 + }, + { + "epoch": 2.4705882352941178, + "grad_norm": 11.285010838093699, + "learning_rate": 9.26368335782622e-07, + "loss": 0.8386296629905701, + "step": 1176 + }, + { + "epoch": 2.472689075630252, + "grad_norm": 11.02721308505799, + "learning_rate": 9.192924280626514e-07, + "loss": 1.0152020454406738, + "step": 1177 + }, + { + "epoch": 2.4747899159663866, + "grad_norm": 12.924069581096365, + "learning_rate": 9.122409112944591e-07, + "loss": 0.42396751046180725, + "step": 1178 + }, + { + "epoch": 2.476890756302521, + "grad_norm": 13.79023717049261, + "learning_rate": 9.052138276259348e-07, + "loss": 0.3439130485057831, + "step": 1179 + }, + { + "epoch": 2.4789915966386555, + "grad_norm": 8.00992187627695, + "learning_rate": 8.982112190589237e-07, + "loss": 0.21849340200424194, + "step": 1180 + }, + { + "epoch": 2.48109243697479, + "grad_norm": 17.238112347826142, + "learning_rate": 8.912331274489855e-07, + "loss": 1.047693133354187, + "step": 1181 + }, + { + "epoch": 2.4831932773109244, + "grad_norm": 10.977700782429032, + "learning_rate": 8.842795945051335e-07, + "loss": 0.4458342492580414, + "step": 1182 + }, + { + "epoch": 2.485294117647059, + "grad_norm": 6.2173703827542735, + "learning_rate": 8.773506617895944e-07, + "loss": 0.26556795835494995, + "step": 1183 + }, + { + "epoch": 2.4873949579831933, + "grad_norm": 14.598955541616366, + "learning_rate": 8.704463707175526e-07, + "loss": 0.8663069605827332, + "step": 1184 + }, + { + "epoch": 2.4894957983193278, + "grad_norm": 9.599096123627477, + "learning_rate": 8.6356676255691e-07, + "loss": 0.7863715291023254, + "step": 1185 + }, + { + "epoch": 2.491596638655462, + "grad_norm": 7.756695128139413, + "learning_rate": 8.567118784280309e-07, + "loss": 0.2747763395309448, + "step": 1186 + }, + { + "epoch": 2.4936974789915967, + "grad_norm": 15.296434795066423, + "learning_rate": 8.498817593035053e-07, + "loss": 0.22008158266544342, + "step": 1187 + }, + { + "epoch": 2.495798319327731, + "grad_norm": 42.195018093662426, + "learning_rate": 8.430764460078938e-07, + "loss": 0.7790160179138184, + "step": 1188 + }, + { + "epoch": 2.4978991596638656, + "grad_norm": 14.930505610933327, + "learning_rate": 8.362959792174941e-07, + "loss": 0.3692745864391327, + "step": 1189 + }, + { + "epoch": 2.5, + "grad_norm": 15.547844843931736, + "learning_rate": 8.295403994600921e-07, + "loss": 0.5012900829315186, + "step": 1190 + }, + { + "epoch": 2.5021008403361344, + "grad_norm": 13.218952734739705, + "learning_rate": 8.228097471147167e-07, + "loss": 0.4049416780471802, + "step": 1191 + }, + { + "epoch": 2.504201680672269, + "grad_norm": 11.42318009744243, + "learning_rate": 8.161040624114075e-07, + "loss": 0.14171475172042847, + "step": 1192 + }, + { + "epoch": 2.5063025210084033, + "grad_norm": 8.26466575159723, + "learning_rate": 8.094233854309647e-07, + "loss": 0.32759952545166016, + "step": 1193 + }, + { + "epoch": 2.508403361344538, + "grad_norm": 13.359323997562882, + "learning_rate": 8.027677561047176e-07, + "loss": 0.5382500886917114, + "step": 1194 + }, + { + "epoch": 2.5105042016806722, + "grad_norm": 9.050399443504134, + "learning_rate": 7.961372142142776e-07, + "loss": 0.4815264940261841, + "step": 1195 + }, + { + "epoch": 2.5126050420168067, + "grad_norm": 8.2857361498368, + "learning_rate": 7.89531799391311e-07, + "loss": 0.28123000264167786, + "step": 1196 + }, + { + "epoch": 2.514705882352941, + "grad_norm": 14.813927596451204, + "learning_rate": 7.829515511172897e-07, + "loss": 0.5116557478904724, + "step": 1197 + }, + { + "epoch": 2.5168067226890756, + "grad_norm": 11.672590724543431, + "learning_rate": 7.763965087232678e-07, + "loss": 0.4502016603946686, + "step": 1198 + }, + { + "epoch": 2.51890756302521, + "grad_norm": 8.420294235923025, + "learning_rate": 7.698667113896346e-07, + "loss": 0.34997278451919556, + "step": 1199 + }, + { + "epoch": 2.5210084033613445, + "grad_norm": 4.856432012218632, + "learning_rate": 7.633621981458916e-07, + "loss": 0.15743517875671387, + "step": 1200 + }, + { + "epoch": 2.523109243697479, + "grad_norm": 10.116924629282346, + "learning_rate": 7.568830078704092e-07, + "loss": 0.4513791799545288, + "step": 1201 + }, + { + "epoch": 2.5252100840336134, + "grad_norm": 10.448219454906289, + "learning_rate": 7.504291792902024e-07, + "loss": 0.5203551054000854, + "step": 1202 + }, + { + "epoch": 2.527310924369748, + "grad_norm": 7.4896542285298, + "learning_rate": 7.440007509806946e-07, + "loss": 0.5805743932723999, + "step": 1203 + }, + { + "epoch": 2.5294117647058822, + "grad_norm": 6.637043733478462, + "learning_rate": 7.375977613654861e-07, + "loss": 0.21151217818260193, + "step": 1204 + }, + { + "epoch": 2.5315126050420167, + "grad_norm": 11.756396934264371, + "learning_rate": 7.312202487161318e-07, + "loss": 0.4486454725265503, + "step": 1205 + }, + { + "epoch": 2.533613445378151, + "grad_norm": 13.216341095384697, + "learning_rate": 7.248682511519006e-07, + "loss": 0.8350504040718079, + "step": 1206 + }, + { + "epoch": 2.5357142857142856, + "grad_norm": 14.368316188442714, + "learning_rate": 7.18541806639561e-07, + "loss": 0.37657079100608826, + "step": 1207 + }, + { + "epoch": 2.53781512605042, + "grad_norm": 10.572863577964558, + "learning_rate": 7.122409529931412e-07, + "loss": 0.5544061660766602, + "step": 1208 + }, + { + "epoch": 2.5399159663865545, + "grad_norm": 13.009489309703797, + "learning_rate": 7.059657278737136e-07, + "loss": 0.8755850791931152, + "step": 1209 + }, + { + "epoch": 2.542016806722689, + "grad_norm": 10.419835233671352, + "learning_rate": 6.997161687891635e-07, + "loss": 0.6084367036819458, + "step": 1210 + }, + { + "epoch": 2.5441176470588234, + "grad_norm": 7.424045502482636, + "learning_rate": 6.934923130939692e-07, + "loss": 0.3528558015823364, + "step": 1211 + }, + { + "epoch": 2.546218487394958, + "grad_norm": 22.05326914016899, + "learning_rate": 6.872941979889708e-07, + "loss": 0.3760122060775757, + "step": 1212 + }, + { + "epoch": 2.5483193277310923, + "grad_norm": 8.437103819513496, + "learning_rate": 6.811218605211606e-07, + "loss": 0.3798169195652008, + "step": 1213 + }, + { + "epoch": 2.5504201680672267, + "grad_norm": 15.105682353848836, + "learning_rate": 6.749753375834467e-07, + "loss": 0.20516347885131836, + "step": 1214 + }, + { + "epoch": 2.552521008403361, + "grad_norm": 15.328640967464176, + "learning_rate": 6.688546659144479e-07, + "loss": 0.39129936695098877, + "step": 1215 + }, + { + "epoch": 2.5546218487394956, + "grad_norm": 18.19539322746799, + "learning_rate": 6.627598820982595e-07, + "loss": 0.5815962553024292, + "step": 1216 + }, + { + "epoch": 2.55672268907563, + "grad_norm": 10.358040499956887, + "learning_rate": 6.566910225642475e-07, + "loss": 0.2462518960237503, + "step": 1217 + }, + { + "epoch": 2.5588235294117645, + "grad_norm": 23.882665351929745, + "learning_rate": 6.50648123586819e-07, + "loss": 0.7295534610748291, + "step": 1218 + }, + { + "epoch": 2.560924369747899, + "grad_norm": 11.419325337575849, + "learning_rate": 6.446312212852162e-07, + "loss": 0.4088057577610016, + "step": 1219 + }, + { + "epoch": 2.5630252100840334, + "grad_norm": 18.506668669014132, + "learning_rate": 6.386403516232948e-07, + "loss": 0.6498621106147766, + "step": 1220 + }, + { + "epoch": 2.565126050420168, + "grad_norm": 12.707186533109224, + "learning_rate": 6.326755504093063e-07, + "loss": 0.3554389476776123, + "step": 1221 + }, + { + "epoch": 2.5672268907563023, + "grad_norm": 12.462287833643975, + "learning_rate": 6.267368532956919e-07, + "loss": 1.3259708881378174, + "step": 1222 + }, + { + "epoch": 2.5693277310924367, + "grad_norm": 8.69258882253335, + "learning_rate": 6.208242957788613e-07, + "loss": 0.4336357116699219, + "step": 1223 + }, + { + "epoch": 2.571428571428571, + "grad_norm": 10.998188149878677, + "learning_rate": 6.14937913198988e-07, + "loss": 0.6199144124984741, + "step": 1224 + }, + { + "epoch": 2.5735294117647056, + "grad_norm": 20.134120954604086, + "learning_rate": 6.090777407397902e-07, + "loss": 1.075969934463501, + "step": 1225 + }, + { + "epoch": 2.57563025210084, + "grad_norm": 9.646318558023589, + "learning_rate": 6.032438134283286e-07, + "loss": 0.5996450185775757, + "step": 1226 + }, + { + "epoch": 2.5777310924369745, + "grad_norm": 10.633484513814087, + "learning_rate": 5.974361661347889e-07, + "loss": 0.37859058380126953, + "step": 1227 + }, + { + "epoch": 2.5798319327731094, + "grad_norm": 18.160538186398977, + "learning_rate": 5.916548335722822e-07, + "loss": 0.3595309853553772, + "step": 1228 + }, + { + "epoch": 2.581932773109244, + "grad_norm": 12.156397479975382, + "learning_rate": 5.858998502966273e-07, + "loss": 0.31986016035079956, + "step": 1229 + }, + { + "epoch": 2.5840336134453783, + "grad_norm": 12.635254524437713, + "learning_rate": 5.801712507061563e-07, + "loss": 0.3975721597671509, + "step": 1230 + }, + { + "epoch": 2.5861344537815127, + "grad_norm": 10.900463191925608, + "learning_rate": 5.74469069041495e-07, + "loss": 0.6717185974121094, + "step": 1231 + }, + { + "epoch": 2.588235294117647, + "grad_norm": 10.60292331277609, + "learning_rate": 5.687933393853718e-07, + "loss": 0.6171470880508423, + "step": 1232 + }, + { + "epoch": 2.5903361344537816, + "grad_norm": 11.817453815932138, + "learning_rate": 5.631440956624057e-07, + "loss": 0.47931092977523804, + "step": 1233 + }, + { + "epoch": 2.592436974789916, + "grad_norm": 14.65524897977516, + "learning_rate": 5.575213716389039e-07, + "loss": 0.44013679027557373, + "step": 1234 + }, + { + "epoch": 2.5945378151260505, + "grad_norm": 14.640686063418055, + "learning_rate": 5.519252009226639e-07, + "loss": 0.515785276889801, + "step": 1235 + }, + { + "epoch": 2.596638655462185, + "grad_norm": 9.51325634200356, + "learning_rate": 5.463556169627687e-07, + "loss": 0.3664918541908264, + "step": 1236 + }, + { + "epoch": 2.5987394957983194, + "grad_norm": 9.591516923545466, + "learning_rate": 5.408126530493918e-07, + "loss": 0.3711666762828827, + "step": 1237 + }, + { + "epoch": 2.600840336134454, + "grad_norm": 7.071071092917334, + "learning_rate": 5.352963423135893e-07, + "loss": 0.12698325514793396, + "step": 1238 + }, + { + "epoch": 2.6029411764705883, + "grad_norm": 8.042424735857201, + "learning_rate": 5.298067177271144e-07, + "loss": 0.3730424642562866, + "step": 1239 + }, + { + "epoch": 2.6050420168067228, + "grad_norm": 9.069780325522164, + "learning_rate": 5.243438121022077e-07, + "loss": 0.6243601441383362, + "step": 1240 + }, + { + "epoch": 2.607142857142857, + "grad_norm": 7.246887997362519, + "learning_rate": 5.18907658091411e-07, + "loss": 0.18001016974449158, + "step": 1241 + }, + { + "epoch": 2.6092436974789917, + "grad_norm": 15.652638965395807, + "learning_rate": 5.134982881873646e-07, + "loss": 0.6635949611663818, + "step": 1242 + }, + { + "epoch": 2.611344537815126, + "grad_norm": 9.642543803196963, + "learning_rate": 5.081157347226201e-07, + "loss": 0.4666215777397156, + "step": 1243 + }, + { + "epoch": 2.6134453781512605, + "grad_norm": 9.416633968819704, + "learning_rate": 5.027600298694397e-07, + "loss": 0.1682681143283844, + "step": 1244 + }, + { + "epoch": 2.615546218487395, + "grad_norm": 14.036854769880513, + "learning_rate": 4.974312056396113e-07, + "loss": 0.5077744722366333, + "step": 1245 + }, + { + "epoch": 2.6176470588235294, + "grad_norm": 11.722652840072532, + "learning_rate": 4.92129293884252e-07, + "loss": 0.44359397888183594, + "step": 1246 + }, + { + "epoch": 2.619747899159664, + "grad_norm": 15.585836072486865, + "learning_rate": 4.868543262936176e-07, + "loss": 1.2246967554092407, + "step": 1247 + }, + { + "epoch": 2.6218487394957983, + "grad_norm": 10.770044484279795, + "learning_rate": 4.816063343969196e-07, + "loss": 0.32194000482559204, + "step": 1248 + }, + { + "epoch": 2.6239495798319328, + "grad_norm": 11.639608924375384, + "learning_rate": 4.763853495621251e-07, + "loss": 0.5496278405189514, + "step": 1249 + }, + { + "epoch": 2.6260504201680672, + "grad_norm": 6.671350027648182, + "learning_rate": 4.7119140299578424e-07, + "loss": 0.21257492899894714, + "step": 1250 + }, + { + "epoch": 2.6281512605042017, + "grad_norm": 12.713785072488509, + "learning_rate": 4.660245257428297e-07, + "loss": 0.3104386329650879, + "step": 1251 + }, + { + "epoch": 2.630252100840336, + "grad_norm": 14.031766333020213, + "learning_rate": 4.6088474868640045e-07, + "loss": 0.8334522843360901, + "step": 1252 + }, + { + "epoch": 2.6323529411764706, + "grad_norm": 9.251230979164895, + "learning_rate": 4.557721025476508e-07, + "loss": 0.29882583022117615, + "step": 1253 + }, + { + "epoch": 2.634453781512605, + "grad_norm": 10.2580288266136, + "learning_rate": 4.5068661788557345e-07, + "loss": 0.3209346830844879, + "step": 1254 + }, + { + "epoch": 2.6365546218487395, + "grad_norm": 5.604118390936418, + "learning_rate": 4.4562832509680963e-07, + "loss": 0.15333116054534912, + "step": 1255 + }, + { + "epoch": 2.638655462184874, + "grad_norm": 19.802213443985696, + "learning_rate": 4.4059725441547464e-07, + "loss": 0.48582714796066284, + "step": 1256 + }, + { + "epoch": 2.6407563025210083, + "grad_norm": 11.514218359185726, + "learning_rate": 4.355934359129699e-07, + "loss": 0.4873425364494324, + "step": 1257 + }, + { + "epoch": 2.642857142857143, + "grad_norm": 11.373550533887446, + "learning_rate": 4.3061689949780995e-07, + "loss": 0.2611161768436432, + "step": 1258 + }, + { + "epoch": 2.6449579831932772, + "grad_norm": 13.616066692598451, + "learning_rate": 4.2566767491543706e-07, + "loss": 0.27621158957481384, + "step": 1259 + }, + { + "epoch": 2.6470588235294117, + "grad_norm": 13.034515066864026, + "learning_rate": 4.2074579174805173e-07, + "loss": 0.849486231803894, + "step": 1260 + }, + { + "epoch": 2.649159663865546, + "grad_norm": 11.86057949603211, + "learning_rate": 4.1585127941442536e-07, + "loss": 0.7652707099914551, + "step": 1261 + }, + { + "epoch": 2.6512605042016806, + "grad_norm": 9.803056978877574, + "learning_rate": 4.1098416716973457e-07, + "loss": 0.27856025099754333, + "step": 1262 + }, + { + "epoch": 2.653361344537815, + "grad_norm": 10.956379977903175, + "learning_rate": 4.0614448410538077e-07, + "loss": 0.3749684691429138, + "step": 1263 + }, + { + "epoch": 2.6554621848739495, + "grad_norm": 12.001506859449199, + "learning_rate": 4.01332259148815e-07, + "loss": 0.6064971685409546, + "step": 1264 + }, + { + "epoch": 2.657563025210084, + "grad_norm": 8.750382381092477, + "learning_rate": 3.965475210633718e-07, + "loss": 0.31089282035827637, + "step": 1265 + }, + { + "epoch": 2.6596638655462184, + "grad_norm": 11.062101410973414, + "learning_rate": 3.917902984480881e-07, + "loss": 0.3686492443084717, + "step": 1266 + }, + { + "epoch": 2.661764705882353, + "grad_norm": 9.181597675394137, + "learning_rate": 3.870606197375415e-07, + "loss": 0.5900052785873413, + "step": 1267 + }, + { + "epoch": 2.6638655462184873, + "grad_norm": 11.229435985209061, + "learning_rate": 3.823585132016711e-07, + "loss": 0.23156413435935974, + "step": 1268 + }, + { + "epoch": 2.6659663865546217, + "grad_norm": 14.580552525176778, + "learning_rate": 3.776840069456189e-07, + "loss": 1.1965575218200684, + "step": 1269 + }, + { + "epoch": 2.668067226890756, + "grad_norm": 11.440843191964541, + "learning_rate": 3.730371289095508e-07, + "loss": 0.5137308835983276, + "step": 1270 + }, + { + "epoch": 2.6701680672268906, + "grad_norm": 10.19938284065176, + "learning_rate": 3.6841790686849897e-07, + "loss": 0.2563337981700897, + "step": 1271 + }, + { + "epoch": 2.6722689075630255, + "grad_norm": 12.902940912955524, + "learning_rate": 3.6382636843218967e-07, + "loss": 0.5659809708595276, + "step": 1272 + }, + { + "epoch": 2.67436974789916, + "grad_norm": 10.012067877403453, + "learning_rate": 3.592625410448813e-07, + "loss": 0.4689119756221771, + "step": 1273 + }, + { + "epoch": 2.6764705882352944, + "grad_norm": 7.152049482781003, + "learning_rate": 3.5472645198520064e-07, + "loss": 0.623033881187439, + "step": 1274 + }, + { + "epoch": 2.678571428571429, + "grad_norm": 12.87568935637631, + "learning_rate": 3.502181283659756e-07, + "loss": 0.5805165767669678, + "step": 1275 + }, + { + "epoch": 2.6806722689075633, + "grad_norm": 9.41187997958309, + "learning_rate": 3.4573759713407927e-07, + "loss": 0.5375624299049377, + "step": 1276 + }, + { + "epoch": 2.6827731092436977, + "grad_norm": 9.91288200334237, + "learning_rate": 3.4128488507026327e-07, + "loss": 0.3185434341430664, + "step": 1277 + }, + { + "epoch": 2.684873949579832, + "grad_norm": 15.97191633077991, + "learning_rate": 3.3686001878900365e-07, + "loss": 2.561387538909912, + "step": 1278 + }, + { + "epoch": 2.6869747899159666, + "grad_norm": 15.172775416815085, + "learning_rate": 3.324630247383337e-07, + "loss": 0.5536858439445496, + "step": 1279 + }, + { + "epoch": 2.689075630252101, + "grad_norm": 8.67689739732767, + "learning_rate": 3.2809392919969483e-07, + "loss": 0.18657177686691284, + "step": 1280 + }, + { + "epoch": 2.6911764705882355, + "grad_norm": 12.844508734340609, + "learning_rate": 3.2375275828777253e-07, + "loss": 0.9441865086555481, + "step": 1281 + }, + { + "epoch": 2.69327731092437, + "grad_norm": 9.066706121878353, + "learning_rate": 3.194395379503451e-07, + "loss": 0.5320143103599548, + "step": 1282 + }, + { + "epoch": 2.6953781512605044, + "grad_norm": 8.980483143209002, + "learning_rate": 3.151542939681235e-07, + "loss": 0.5943700075149536, + "step": 1283 + }, + { + "epoch": 2.697478991596639, + "grad_norm": 54.073743939162, + "learning_rate": 3.108970519546034e-07, + "loss": 1.0508530139923096, + "step": 1284 + }, + { + "epoch": 2.6995798319327733, + "grad_norm": 10.409633106680213, + "learning_rate": 3.066678373559062e-07, + "loss": 0.3096291124820709, + "step": 1285 + }, + { + "epoch": 2.7016806722689077, + "grad_norm": 17.871716634928575, + "learning_rate": 3.0246667545063057e-07, + "loss": 1.133009910583496, + "step": 1286 + }, + { + "epoch": 2.703781512605042, + "grad_norm": 10.727929813588565, + "learning_rate": 2.9829359134970206e-07, + "loss": 0.3362637162208557, + "step": 1287 + }, + { + "epoch": 2.7058823529411766, + "grad_norm": 10.027811395629024, + "learning_rate": 2.9414860999621764e-07, + "loss": 0.9418044090270996, + "step": 1288 + }, + { + "epoch": 2.707983193277311, + "grad_norm": 8.072200583551933, + "learning_rate": 2.9003175616530264e-07, + "loss": 0.2674849033355713, + "step": 1289 + }, + { + "epoch": 2.7100840336134455, + "grad_norm": 7.662563052553184, + "learning_rate": 2.8594305446396245e-07, + "loss": 0.39476725459098816, + "step": 1290 + }, + { + "epoch": 2.71218487394958, + "grad_norm": 7.931717377933664, + "learning_rate": 2.818825293309274e-07, + "loss": 0.5461002588272095, + "step": 1291 + }, + { + "epoch": 2.7142857142857144, + "grad_norm": 9.069033415947747, + "learning_rate": 2.7785020503651783e-07, + "loss": 0.36206185817718506, + "step": 1292 + }, + { + "epoch": 2.716386554621849, + "grad_norm": 11.269854164923549, + "learning_rate": 2.7384610568249313e-07, + "loss": 0.33151179552078247, + "step": 1293 + }, + { + "epoch": 2.7184873949579833, + "grad_norm": 10.182183999098427, + "learning_rate": 2.698702552019045e-07, + "loss": 0.3465487062931061, + "step": 1294 + }, + { + "epoch": 2.7205882352941178, + "grad_norm": 12.712025830447253, + "learning_rate": 2.659226773589607e-07, + "loss": 0.22317005693912506, + "step": 1295 + }, + { + "epoch": 2.722689075630252, + "grad_norm": 11.83879887595397, + "learning_rate": 2.620033957488777e-07, + "loss": 0.34791454672813416, + "step": 1296 + }, + { + "epoch": 2.7247899159663866, + "grad_norm": 12.416917803129223, + "learning_rate": 2.581124337977425e-07, + "loss": 0.4211697578430176, + "step": 1297 + }, + { + "epoch": 2.726890756302521, + "grad_norm": 15.495534828622619, + "learning_rate": 2.542498147623701e-07, + "loss": 0.4095291495323181, + "step": 1298 + }, + { + "epoch": 2.7289915966386555, + "grad_norm": 6.6678037455089925, + "learning_rate": 2.50415561730169e-07, + "loss": 0.2518484592437744, + "step": 1299 + }, + { + "epoch": 2.73109243697479, + "grad_norm": 8.694983560441388, + "learning_rate": 2.4660969761899576e-07, + "loss": 0.21484610438346863, + "step": 1300 + }, + { + "epoch": 2.7331932773109244, + "grad_norm": 11.820763178851392, + "learning_rate": 2.428322451770276e-07, + "loss": 0.39412614703178406, + "step": 1301 + }, + { + "epoch": 2.735294117647059, + "grad_norm": 11.877133639126868, + "learning_rate": 2.3908322698261597e-07, + "loss": 0.34464430809020996, + "step": 1302 + }, + { + "epoch": 2.7373949579831933, + "grad_norm": 10.16702078484984, + "learning_rate": 2.3536266544416043e-07, + "loss": 0.5757449865341187, + "step": 1303 + }, + { + "epoch": 2.7394957983193278, + "grad_norm": 12.93026525257059, + "learning_rate": 2.3167058279997156e-07, + "loss": 0.7968210577964783, + "step": 1304 + }, + { + "epoch": 2.741596638655462, + "grad_norm": 10.635434378996248, + "learning_rate": 2.2800700111813456e-07, + "loss": 0.40927547216415405, + "step": 1305 + }, + { + "epoch": 2.7436974789915967, + "grad_norm": 9.037444336220418, + "learning_rate": 2.2437194229638415e-07, + "loss": 0.23368996381759644, + "step": 1306 + }, + { + "epoch": 2.745798319327731, + "grad_norm": 128.54979302169804, + "learning_rate": 2.2076542806196588e-07, + "loss": 0.7368482351303101, + "step": 1307 + }, + { + "epoch": 2.7478991596638656, + "grad_norm": 8.202648198989193, + "learning_rate": 2.17187479971514e-07, + "loss": 0.29558128118515015, + "step": 1308 + }, + { + "epoch": 2.75, + "grad_norm": 6.885187685182277, + "learning_rate": 2.136381194109166e-07, + "loss": 0.2764503061771393, + "step": 1309 + }, + { + "epoch": 2.7521008403361344, + "grad_norm": 8.730199073100707, + "learning_rate": 2.1011736759519286e-07, + "loss": 0.3793492615222931, + "step": 1310 + }, + { + "epoch": 2.754201680672269, + "grad_norm": 8.631276466119623, + "learning_rate": 2.0662524556835982e-07, + "loss": 0.5927262902259827, + "step": 1311 + }, + { + "epoch": 2.7563025210084033, + "grad_norm": 12.625981527108426, + "learning_rate": 2.0316177420331375e-07, + "loss": 0.4284164607524872, + "step": 1312 + }, + { + "epoch": 2.758403361344538, + "grad_norm": 9.329175719292097, + "learning_rate": 1.997269742016994e-07, + "loss": 0.4722291827201843, + "step": 1313 + }, + { + "epoch": 2.7605042016806722, + "grad_norm": 17.532238777546283, + "learning_rate": 1.9632086609379041e-07, + "loss": 0.6627257466316223, + "step": 1314 + }, + { + "epoch": 2.7626050420168067, + "grad_norm": 9.92918276948977, + "learning_rate": 1.929434702383648e-07, + "loss": 0.42083340883255005, + "step": 1315 + }, + { + "epoch": 2.764705882352941, + "grad_norm": 9.589305807880846, + "learning_rate": 1.895948068225828e-07, + "loss": 0.39910781383514404, + "step": 1316 + }, + { + "epoch": 2.7668067226890756, + "grad_norm": 11.560419759358716, + "learning_rate": 1.862748958618682e-07, + "loss": 0.2765321731567383, + "step": 1317 + }, + { + "epoch": 2.76890756302521, + "grad_norm": 6.28366130869059, + "learning_rate": 1.8298375719978501e-07, + "loss": 0.08827929198741913, + "step": 1318 + }, + { + "epoch": 2.7710084033613445, + "grad_norm": 10.943149316905583, + "learning_rate": 1.797214105079248e-07, + "loss": 0.5753570795059204, + "step": 1319 + }, + { + "epoch": 2.773109243697479, + "grad_norm": 13.46621194548743, + "learning_rate": 1.7648787528578127e-07, + "loss": 0.7518602013587952, + "step": 1320 + }, + { + "epoch": 2.7752100840336134, + "grad_norm": 9.047171390898557, + "learning_rate": 1.732831708606425e-07, + "loss": 0.6446128487586975, + "step": 1321 + }, + { + "epoch": 2.777310924369748, + "grad_norm": 13.738460244304907, + "learning_rate": 1.7010731638746668e-07, + "loss": 0.4714201092720032, + "step": 1322 + }, + { + "epoch": 2.7794117647058822, + "grad_norm": 9.086358928536246, + "learning_rate": 1.669603308487755e-07, + "loss": 0.23203890025615692, + "step": 1323 + }, + { + "epoch": 2.7815126050420167, + "grad_norm": 25.798347784352785, + "learning_rate": 1.6384223305453417e-07, + "loss": 0.5102007389068604, + "step": 1324 + }, + { + "epoch": 2.783613445378151, + "grad_norm": 11.210651055014003, + "learning_rate": 1.6075304164204385e-07, + "loss": 0.45608770847320557, + "step": 1325 + }, + { + "epoch": 2.7857142857142856, + "grad_norm": 7.6934549954682465, + "learning_rate": 1.5769277507582725e-07, + "loss": 0.5190253257751465, + "step": 1326 + }, + { + "epoch": 2.78781512605042, + "grad_norm": 13.485529024983622, + "learning_rate": 1.5466145164751977e-07, + "loss": 0.5670579075813293, + "step": 1327 + }, + { + "epoch": 2.7899159663865545, + "grad_norm": 8.323766066498216, + "learning_rate": 1.5165908947575914e-07, + "loss": 0.4676046073436737, + "step": 1328 + }, + { + "epoch": 2.792016806722689, + "grad_norm": 11.23683105022603, + "learning_rate": 1.4868570650607816e-07, + "loss": 0.2914016544818878, + "step": 1329 + }, + { + "epoch": 2.7941176470588234, + "grad_norm": 17.258281880666775, + "learning_rate": 1.4574132051079658e-07, + "loss": 1.312021017074585, + "step": 1330 + }, + { + "epoch": 2.796218487394958, + "grad_norm": 9.249285303088671, + "learning_rate": 1.4282594908891666e-07, + "loss": 0.3117330074310303, + "step": 1331 + }, + { + "epoch": 2.7983193277310923, + "grad_norm": 9.999090012754882, + "learning_rate": 1.3993960966601328e-07, + "loss": 0.2705899775028229, + "step": 1332 + }, + { + "epoch": 2.8004201680672267, + "grad_norm": 9.383011281190877, + "learning_rate": 1.3708231949413676e-07, + "loss": 0.2621600031852722, + "step": 1333 + }, + { + "epoch": 2.802521008403361, + "grad_norm": 11.854334740139995, + "learning_rate": 1.342540956517041e-07, + "loss": 0.40849626064300537, + "step": 1334 + }, + { + "epoch": 2.8046218487394956, + "grad_norm": 10.05169136975745, + "learning_rate": 1.3145495504339856e-07, + "loss": 0.2958400845527649, + "step": 1335 + }, + { + "epoch": 2.80672268907563, + "grad_norm": 13.23608329431821, + "learning_rate": 1.2868491440007015e-07, + "loss": 0.7148715257644653, + "step": 1336 + }, + { + "epoch": 2.8088235294117645, + "grad_norm": 11.059610717001991, + "learning_rate": 1.2594399027863302e-07, + "loss": 0.5344212055206299, + "step": 1337 + }, + { + "epoch": 2.810924369747899, + "grad_norm": 9.850144807315097, + "learning_rate": 1.232321990619695e-07, + "loss": 0.3390062749385834, + "step": 1338 + }, + { + "epoch": 2.8130252100840334, + "grad_norm": 12.782218028007712, + "learning_rate": 1.205495569588283e-07, + "loss": 0.6602462530136108, + "step": 1339 + }, + { + "epoch": 2.815126050420168, + "grad_norm": 9.16202056000073, + "learning_rate": 1.1789608000373209e-07, + "loss": 0.2165951430797577, + "step": 1340 + }, + { + "epoch": 2.8172268907563023, + "grad_norm": 9.639282432785762, + "learning_rate": 1.1527178405687845e-07, + "loss": 0.33785703778266907, + "step": 1341 + }, + { + "epoch": 2.8193277310924367, + "grad_norm": 16.018225078825093, + "learning_rate": 1.1267668480404559e-07, + "loss": 0.49403730034828186, + "step": 1342 + }, + { + "epoch": 2.821428571428571, + "grad_norm": 13.934169182843426, + "learning_rate": 1.1011079775649969e-07, + "loss": 0.5875406265258789, + "step": 1343 + }, + { + "epoch": 2.8235294117647056, + "grad_norm": 10.314949862812936, + "learning_rate": 1.0757413825090212e-07, + "loss": 0.4375740885734558, + "step": 1344 + }, + { + "epoch": 2.82563025210084, + "grad_norm": 11.258449104141572, + "learning_rate": 1.0506672144921515e-07, + "loss": 0.6797425746917725, + "step": 1345 + }, + { + "epoch": 2.8277310924369745, + "grad_norm": 10.94330965699598, + "learning_rate": 1.0258856233861524e-07, + "loss": 0.36085596680641174, + "step": 1346 + }, + { + "epoch": 2.8298319327731094, + "grad_norm": 9.174555872255727, + "learning_rate": 1.0013967573140216e-07, + "loss": 0.43387356400489807, + "step": 1347 + }, + { + "epoch": 2.831932773109244, + "grad_norm": 11.299994940843328, + "learning_rate": 9.77200762649072e-08, + "loss": 0.44897180795669556, + "step": 1348 + }, + { + "epoch": 2.8340336134453783, + "grad_norm": 10.295685178570979, + "learning_rate": 9.532977840141123e-08, + "loss": 0.22422294318675995, + "step": 1349 + }, + { + "epoch": 2.8361344537815127, + "grad_norm": 8.127889054633478, + "learning_rate": 9.29687964280529e-08, + "loss": 0.642038106918335, + "step": 1350 + }, + { + "epoch": 2.838235294117647, + "grad_norm": 11.9364629190832, + "learning_rate": 9.063714445674776e-08, + "loss": 0.8069763779640198, + "step": 1351 + }, + { + "epoch": 2.8403361344537816, + "grad_norm": 11.63460546823257, + "learning_rate": 8.833483642410101e-08, + "loss": 0.36828362941741943, + "step": 1352 + }, + { + "epoch": 2.842436974789916, + "grad_norm": 10.042654306225293, + "learning_rate": 8.606188609132593e-08, + "loss": 0.3019287586212158, + "step": 1353 + }, + { + "epoch": 2.8445378151260505, + "grad_norm": 10.265644800483537, + "learning_rate": 8.381830704415839e-08, + "loss": 0.8440870046615601, + "step": 1354 + }, + { + "epoch": 2.846638655462185, + "grad_norm": 11.67889502498505, + "learning_rate": 8.160411269278079e-08, + "loss": 2.0406436920166016, + "step": 1355 + }, + { + "epoch": 2.8487394957983194, + "grad_norm": 11.659752416837614, + "learning_rate": 7.941931627173827e-08, + "loss": 0.23328936100006104, + "step": 1356 + }, + { + "epoch": 2.850840336134454, + "grad_norm": 14.52369655098527, + "learning_rate": 7.726393083985929e-08, + "loss": 0.552147626876831, + "step": 1357 + }, + { + "epoch": 2.8529411764705883, + "grad_norm": 8.467901286703713, + "learning_rate": 7.513796928018069e-08, + "loss": 0.38458627462387085, + "step": 1358 + }, + { + "epoch": 2.8550420168067228, + "grad_norm": 7.6124021321848, + "learning_rate": 7.30414442998667e-08, + "loss": 0.3594217300415039, + "step": 1359 + }, + { + "epoch": 2.857142857142857, + "grad_norm": 12.272607778978339, + "learning_rate": 7.097436843013783e-08, + "loss": 0.5628789067268372, + "step": 1360 + }, + { + "epoch": 2.8592436974789917, + "grad_norm": 9.345724512814346, + "learning_rate": 6.893675402618982e-08, + "loss": 0.7206631898880005, + "step": 1361 + }, + { + "epoch": 2.861344537815126, + "grad_norm": 13.88429967852116, + "learning_rate": 6.692861326712652e-08, + "loss": 0.8038681745529175, + "step": 1362 + }, + { + "epoch": 2.8634453781512605, + "grad_norm": 15.55581945591023, + "learning_rate": 6.494995815588101e-08, + "loss": 0.7214268445968628, + "step": 1363 + }, + { + "epoch": 2.865546218487395, + "grad_norm": 10.920690128080313, + "learning_rate": 6.300080051914792e-08, + "loss": 0.3757812976837158, + "step": 1364 + }, + { + "epoch": 2.8676470588235294, + "grad_norm": 9.02181459032139, + "learning_rate": 6.108115200731069e-08, + "loss": 0.7154731154441833, + "step": 1365 + }, + { + "epoch": 2.869747899159664, + "grad_norm": 12.825891467379778, + "learning_rate": 5.9191024094374384e-08, + "loss": 0.6805951595306396, + "step": 1366 + }, + { + "epoch": 2.8718487394957983, + "grad_norm": 10.058469083040828, + "learning_rate": 5.7330428077893575e-08, + "loss": 0.41078895330429077, + "step": 1367 + }, + { + "epoch": 2.8739495798319328, + "grad_norm": 8.36551151872813, + "learning_rate": 5.5499375078906793e-08, + "loss": 0.35648801922798157, + "step": 1368 + }, + { + "epoch": 2.8760504201680672, + "grad_norm": 18.110033778975207, + "learning_rate": 5.369787604186993e-08, + "loss": 0.3897348642349243, + "step": 1369 + }, + { + "epoch": 2.8781512605042017, + "grad_norm": 8.750407331993259, + "learning_rate": 5.192594173459242e-08, + "loss": 0.613540530204773, + "step": 1370 + }, + { + "epoch": 2.880252100840336, + "grad_norm": 8.528139704622195, + "learning_rate": 5.018358274816892e-08, + "loss": 0.4445531964302063, + "step": 1371 + }, + { + "epoch": 2.8823529411764706, + "grad_norm": 11.859807560110708, + "learning_rate": 4.847080949691996e-08, + "loss": 0.5488522052764893, + "step": 1372 + }, + { + "epoch": 2.884453781512605, + "grad_norm": 10.23407853457865, + "learning_rate": 4.6787632218326385e-08, + "loss": 0.5596367716789246, + "step": 1373 + }, + { + "epoch": 2.8865546218487395, + "grad_norm": 11.296256406092558, + "learning_rate": 4.513406097297224e-08, + "loss": 0.38018864393234253, + "step": 1374 + }, + { + "epoch": 2.888655462184874, + "grad_norm": 12.156451974202069, + "learning_rate": 4.351010564447977e-08, + "loss": 0.661139726638794, + "step": 1375 + }, + { + "epoch": 2.8907563025210083, + "grad_norm": 7.3170273092091485, + "learning_rate": 4.1915775939454506e-08, + "loss": 0.2944487929344177, + "step": 1376 + }, + { + "epoch": 2.892857142857143, + "grad_norm": 9.331145503425732, + "learning_rate": 4.035108138742416e-08, + "loss": 0.23486556112766266, + "step": 1377 + }, + { + "epoch": 2.8949579831932772, + "grad_norm": 11.863919468865829, + "learning_rate": 3.881603134078482e-08, + "loss": 0.3030620813369751, + "step": 1378 + }, + { + "epoch": 2.8970588235294117, + "grad_norm": 12.573022210864796, + "learning_rate": 3.731063497474152e-08, + "loss": 0.3213701546192169, + "step": 1379 + }, + { + "epoch": 2.899159663865546, + "grad_norm": 6.674326596763006, + "learning_rate": 3.583490128725553e-08, + "loss": 0.22970488667488098, + "step": 1380 + }, + { + "epoch": 2.9012605042016806, + "grad_norm": 13.577742623896349, + "learning_rate": 3.4388839098992154e-08, + "loss": 0.32231050729751587, + "step": 1381 + }, + { + "epoch": 2.903361344537815, + "grad_norm": 16.538926889757885, + "learning_rate": 3.2972457053262466e-08, + "loss": 0.9544304609298706, + "step": 1382 + }, + { + "epoch": 2.9054621848739495, + "grad_norm": 20.22528777991979, + "learning_rate": 3.158576361597887e-08, + "loss": 0.7788558006286621, + "step": 1383 + }, + { + "epoch": 2.907563025210084, + "grad_norm": 16.130951952781945, + "learning_rate": 3.022876707559796e-08, + "loss": 0.2601931393146515, + "step": 1384 + }, + { + "epoch": 2.9096638655462184, + "grad_norm": 13.778242873434662, + "learning_rate": 2.890147554307665e-08, + "loss": 0.5957424640655518, + "step": 1385 + }, + { + "epoch": 2.911764705882353, + "grad_norm": 10.295105075509534, + "learning_rate": 2.7603896951817755e-08, + "loss": 0.2927376925945282, + "step": 1386 + }, + { + "epoch": 2.9138655462184873, + "grad_norm": 18.743122797679717, + "learning_rate": 2.633603905762838e-08, + "loss": 0.5990405082702637, + "step": 1387 + }, + { + "epoch": 2.9159663865546217, + "grad_norm": 14.887502358752755, + "learning_rate": 2.5097909438669964e-08, + "loss": 0.4513130784034729, + "step": 1388 + }, + { + "epoch": 2.918067226890756, + "grad_norm": 9.564277783357335, + "learning_rate": 2.3889515495413297e-08, + "loss": 0.6215352416038513, + "step": 1389 + }, + { + "epoch": 2.9201680672268906, + "grad_norm": 5.003008688132311, + "learning_rate": 2.2710864450596336e-08, + "loss": 0.33804643154144287, + "step": 1390 + }, + { + "epoch": 2.9222689075630255, + "grad_norm": 9.060022958520825, + "learning_rate": 2.1561963349178704e-08, + "loss": 0.4266011416912079, + "step": 1391 + }, + { + "epoch": 2.92436974789916, + "grad_norm": 9.49932040181115, + "learning_rate": 2.0442819058300588e-08, + "loss": 0.3738781809806824, + "step": 1392 + }, + { + "epoch": 2.9264705882352944, + "grad_norm": 11.474699381578137, + "learning_rate": 1.935343826724112e-08, + "loss": 0.26019287109375, + "step": 1393 + }, + { + "epoch": 2.928571428571429, + "grad_norm": 9.426307307224148, + "learning_rate": 1.8293827487380623e-08, + "loss": 0.3799281120300293, + "step": 1394 + }, + { + "epoch": 2.9306722689075633, + "grad_norm": 12.711822585165105, + "learning_rate": 1.726399305215787e-08, + "loss": 0.25459083914756775, + "step": 1395 + }, + { + "epoch": 2.9327731092436977, + "grad_norm": 12.88439286989085, + "learning_rate": 1.626394111703622e-08, + "loss": 0.4746205806732178, + "step": 1396 + }, + { + "epoch": 2.934873949579832, + "grad_norm": 15.570716719123634, + "learning_rate": 1.5293677659463104e-08, + "loss": 0.4622001647949219, + "step": 1397 + }, + { + "epoch": 2.9369747899159666, + "grad_norm": 6.94964938645385, + "learning_rate": 1.4353208478837256e-08, + "loss": 0.18047931790351868, + "step": 1398 + }, + { + "epoch": 2.939075630252101, + "grad_norm": 10.000416990177895, + "learning_rate": 1.3442539196472647e-08, + "loss": 0.37007540464401245, + "step": 1399 + }, + { + "epoch": 2.9411764705882355, + "grad_norm": 8.931832554567432, + "learning_rate": 1.2561675255564621e-08, + "loss": 0.7158060073852539, + "step": 1400 + }, + { + "epoch": 2.94327731092437, + "grad_norm": 11.017696540531707, + "learning_rate": 1.1710621921159904e-08, + "loss": 0.9123420119285583, + "step": 1401 + }, + { + "epoch": 2.9453781512605044, + "grad_norm": 13.459702577958145, + "learning_rate": 1.0889384280119985e-08, + "loss": 1.1057486534118652, + "step": 1402 + }, + { + "epoch": 2.947478991596639, + "grad_norm": 11.44996683672279, + "learning_rate": 1.009796724109613e-08, + "loss": 0.36926376819610596, + "step": 1403 + }, + { + "epoch": 2.9495798319327733, + "grad_norm": 8.32543080681241, + "learning_rate": 9.336375534497732e-09, + "loss": 0.5240511298179626, + "step": 1404 + }, + { + "epoch": 2.9516806722689077, + "grad_norm": 16.41897161685657, + "learning_rate": 8.60461371246235e-09, + "loss": 1.0361064672470093, + "step": 1405 + }, + { + "epoch": 2.953781512605042, + "grad_norm": 15.488903163881536, + "learning_rate": 7.902686148831273e-09, + "loss": 0.7314852476119995, + "step": 1406 + }, + { + "epoch": 2.9558823529411766, + "grad_norm": 10.609488526695282, + "learning_rate": 7.230597039123433e-09, + "loss": 0.5929103493690491, + "step": 1407 + }, + { + "epoch": 2.957983193277311, + "grad_norm": 9.545516911394982, + "learning_rate": 6.588350400507093e-09, + "loss": 0.24979953467845917, + "step": 1408 + }, + { + "epoch": 2.9600840336134455, + "grad_norm": 16.112825448357878, + "learning_rate": 5.975950071779313e-09, + "loss": 0.810958206653595, + "step": 1409 + }, + { + "epoch": 2.96218487394958, + "grad_norm": 8.6763799711489, + "learning_rate": 5.393399713341518e-09, + "loss": 0.4567590355873108, + "step": 1410 + }, + { + "epoch": 2.9642857142857144, + "grad_norm": 10.068385761335634, + "learning_rate": 4.8407028071773e-09, + "loss": 0.34989726543426514, + "step": 1411 + }, + { + "epoch": 2.966386554621849, + "grad_norm": 11.30284408928835, + "learning_rate": 4.317862656831873e-09, + "loss": 0.3826170563697815, + "step": 1412 + }, + { + "epoch": 2.9684873949579833, + "grad_norm": 13.404023548287954, + "learning_rate": 3.8248823873932026e-09, + "loss": 0.25103145837783813, + "step": 1413 + }, + { + "epoch": 2.9705882352941178, + "grad_norm": 10.423177049027613, + "learning_rate": 3.361764945473134e-09, + "loss": 0.33963871002197266, + "step": 1414 + }, + { + "epoch": 2.972689075630252, + "grad_norm": 9.701343246515489, + "learning_rate": 2.928513099187402e-09, + "loss": 0.5596168637275696, + "step": 1415 + }, + { + "epoch": 2.9747899159663866, + "grad_norm": 8.852327800983687, + "learning_rate": 2.52512943814176e-09, + "loss": 0.3114224374294281, + "step": 1416 + }, + { + "epoch": 2.976890756302521, + "grad_norm": 8.400624424787871, + "learning_rate": 2.151616373417542e-09, + "loss": 0.5350728631019592, + "step": 1417 + }, + { + "epoch": 2.9789915966386555, + "grad_norm": 10.794481012917993, + "learning_rate": 1.8079761375522365e-09, + "loss": 0.6644730567932129, + "step": 1418 + }, + { + "epoch": 2.98109243697479, + "grad_norm": 9.282496929164791, + "learning_rate": 1.4942107845317132e-09, + "loss": 0.2426847219467163, + "step": 1419 + }, + { + "epoch": 2.9831932773109244, + "grad_norm": 9.113139352861424, + "learning_rate": 1.210322189774682e-09, + "loss": 0.2127893567085266, + "step": 1420 + }, + { + "epoch": 2.985294117647059, + "grad_norm": 10.249299245135052, + "learning_rate": 9.563120501221434e-10, + "loss": 0.31507742404937744, + "step": 1421 + }, + { + "epoch": 2.9873949579831933, + "grad_norm": 10.643798027898825, + "learning_rate": 7.321818838279537e-10, + "loss": 0.49292629957199097, + "step": 1422 + }, + { + "epoch": 2.9894957983193278, + "grad_norm": 7.762285292055822, + "learning_rate": 5.379330305488317e-10, + "loss": 0.25357064604759216, + "step": 1423 + }, + { + "epoch": 2.991596638655462, + "grad_norm": 7.423869479037056, + "learning_rate": 3.735666513371428e-10, + "loss": 0.4229947328567505, + "step": 1424 + }, + { + "epoch": 2.9936974789915967, + "grad_norm": 10.794639890750766, + "learning_rate": 2.3908372863368223e-10, + "loss": 0.5679960250854492, + "step": 1425 + }, + { + "epoch": 2.995798319327731, + "grad_norm": 9.814210260546373, + "learning_rate": 1.344850662604591e-10, + "loss": 0.3406621515750885, + "step": 1426 + }, + { + "epoch": 2.9978991596638656, + "grad_norm": 7.52747077028302, + "learning_rate": 5.977128941903055e-11, + "loss": 0.3986052870750427, + "step": 1427 + }, + { + "epoch": 3.0, + "grad_norm": 8.379236977666347, + "learning_rate": 1.494284468384066e-11, + "loss": 0.49183082580566406, + "step": 1428 + }, + { + "epoch": 3.0, + "step": 1428, + "total_flos": 3902317486080.0, + "train_loss": 1.6620939874066776, + "train_runtime": 1853.0016, + "train_samples_per_second": 3.081, + "train_steps_per_second": 0.771 + } + ], + "logging_steps": 1, + "max_steps": 1428, + "num_input_tokens_seen": 0, + "num_train_epochs": 3, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 3902317486080.0, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..21c9801 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7b4e21a20ef01f690b3b8da223636f2e953c8c6f66982e3b5ba5df4d156a10c +size 7096 diff --git a/training_loss.png b/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..5fa782751961c0fcf30779bbc20f5ef3357ce6dd GIT binary patch literal 51056 zcmd>mg;$kZ`|Sn+K}t~R4pC|876b)RFli*Dq`ON}L`tPgQ3RFl?obgBk?uwsX{q}x z&Trf?eq-GK;C{n1&UcW#_xrB(toh72pZV^PyDB${&(NH~U@*i=it_g{7;Ik*25TH2 z4}K!lH9QUf5_eS4aC~56;^<;vZ;ZKP;Am@U<7oNRkjdHD-r=c@wEz!4ACD*(lbNHV zt%Eo(uhswk4IUeNQ{H-Qrw(`*0$W8*2MmVP0R4lNDUoYiu9#}o15yuM*|qs< z7wiBWY=S>dua`IWp9s8;ABZ0rh#6^@UhN~iV`5sfk^CyYQ##r}GX_`oEDro36EJI# z!t!Inhd*f^%vg&5{q#vBh7JA5?>WCBh8+E(Y!ek5hT!BE4T;EoPkwZkACKVL$&a2> z`QtF1yrcX}S?tJ@w_|Bx`v3Foa2{bOC@H75hiph^BS*fkPqp$}^m2Xp_|eaR%JXom zZzARX&p7@kcsE{Bk*z#+O|Ph+>C^L(x+)-0&qs80v{M`GBwae@E%72Wv{5`*(d64J zc6}wko!gfbCI5b9 z)hM@TPx1V#bTB7#TyGq!JKMb-78dsNkK^uUx9WAl>yv%8M?yiwv=l2(0|LH(za_c# z`+;=r+TqMpgv|Cob`G7+IQ;_GbweH3iNLQN9YOW_*T!nR>{{tvcG;eP{`}b%KJ2~C zSk3c@h?~bphwJn2BhqSWq%$3g2Q1@ce57e;Xx6@S=AK;hix)5aDk2nR+YfIBq{4;5 zdh-$aS5%1i4AG0(kw}ol`%+J@waBHtsjvbN^ zQt~`34r@1Q{QT(4+OR`spsVvr)!uC4e9xEINs;5vpRX(p6rNUFDVEYz=2mQsH259mit3c(K9g>Zj3_ zAMpZl(q7{CA3RuJD(p;yPvWiKBqyO0^<5q+y`J0m8Z$lq&`wJ$VZln+vfsD2S53!z zZ-zM``uJe2k(7@ntZa8Ov{C9pYUZa;>wjnzHETS@KHiQe|4Ah`Kfyjb{q6Oo%a`ki zY-;IOJ~iP)9lTr*6dCjEwi@VB*9(KgGBtL5B;vh4H0C~h1i#h%=|RTY;m%lShr*2; zcq!iho}ycQ((;nvyN-pqIc9g8=lS{D7tfKOJ9qtR$$(|h<6L#_BI=-LU1mhzbPPjW z#=IymT)0pMrMwp5b8vmjxl?+d3tr&7JQyhL^$&x&sFL(tnYa49atv4fh|AdW3byxD zn8?puJ(;G~)+duqA^mv<*RSzQaj2#=9qesHLHz^-;3WAR?ZL*z54q=7Z_@;kGKRws zKV)P)IoMs_-JOcq>(tiPUWXNVUsgti=Z~eSsadx9OF7?T$2!-cztEI)_D8(`n>Xj# z*x4suDf86#W^3~*XzNb!;j8BI0-Y_&|ffFF#dfKr$#B#8RAVT`zCHI|`u%;$?9fx)ymO?8# zJAM*+@c^gA-gOg$KUhV`jOn;b+` zd>FX?z`(%Wb{p?gq0N&eE5VH3&+VpKn5Cr|sHv%U2RgljUc5L{x>YrzKAd036)H07 z>Mz4nXN;>^WJZQZLWlpp>-mo#w{ItlU-+VyO}^at$I-C)#f3CVI4&Axw#?G|O9Di+ z!bI!q>v589SE1N27}vRE7e4(u3{}{TA94JR?dhdjW6fju01-BF)oFCEYI=C9ws`_=2$ zL8+|uYTJBD;BdM9%Yyx;vN9otNkT%qNK!MND@O3{@8O}!E>|gCOTmNkL#$v zl@8kzqIal*J=e(7$GWJR^0LNj|3!=I__NcIDJkJHhksPjjl)*DaOsqtP4)asfEi!) zIhHu-5`aN2wfpp#b^k7tLW8Y^9@p&wQ-vvEVPV6S;qtPHAX?k*J0cU^sxr;hJEMfv zk0apn&-pHrn!_sfm)Wtd)a+Xm(TkryO+r`4nOo%tge8RhNs8Mn^}z(GPaUzyuy5r` z1tD~2*X80qKCgd{P(8u520g>--5IK_K1Umj!|sdOCs?XqkL@jks12;D*sxQdZk(tc z3lv_S!<@>}Xfw-ioB_O8MMbM#hM- zqwP{ryGfkK9?L>a&CRm!yWZyKlc9wuu^xHBt{n3g7}M?)12kQ|&P0;_s01vS+JZ0n9-tVAPdmD34 zP(v{ddV^pdFsQY#Q#$lCqvu%wT-$TWBlQ(di)-IFQpe%M1^`x~9dF~QBpNEUaZ$d8 zs3i2M=ccJ%6kKiCcXuq+9F7lRcYsc`0=dHrZN`RLZVV>fcl1%R6Qzrj@({jwCm{ez zjNprUZc7_)?Mr~FsZo#BN5kO;RJY@=DzF9Yz{SJTnF-QBLk>CqTMHHVl3E~0Cgsr= zwF#g?sBJ{Pe(irfm}COhzWLqt;5?^AwbA~!YNmq1!jlDUJdMSDk3(s#%dk>?j>J-2 zCkaroIn4f8cRjGOvWgS7q6w!H^FyZ$j*^0|E`816wl>x@KFHzBdc*jUo*xyw_@RnGi*6S ztIC}_#;di*-nkBu_FFybh3?fU+}zwVv5(Z$3ch{&wgh{zkK=*8-YO@?y3g%*=Dj5-RUVHlxudmUnLJn~>nUm?ysmOYU^Fn6Dk>yHzkb09 z|ND(&q+ykc13^J}-h0p&8nN|j;b?dde2roq@bkkiDK3uID*--0;cNEe z)hlwiXgEkAv(h%Bk|kwjakZ37&JwU!@{3R-1p@;E;1`Ti{}O|1O}Krr*G#Yg)?K>x zWu1t6c`_$8XyG) zi{I8eeU4t=QC6NRJzY2IJYtS)l=}3gRxx>7sqi*glPp@`7h zAgrHwM2~s#()Vai&6wqiQD}6Jcj~2D101GZ z57t{XF$7xwsvQDeJ=lV_G#lTWs;K8E&hAHz;n<3c9Q5lqZpN2 zw;B*;|NU!EC+$h)%h@{#Kwq$OIlQPy5V4Nv=;+TotG1$u_)RW+$-MzfusZ|mSq7pu z-)`#0Xz@5_ijF};-2}V>k-d_mcnoe+>xlwMz)cpo7>87l;o4^&DW zcj<7$7@<}+1ze(U+x?-RKQWaf;UF{HDlYkn-K>j#`y^kZ%DeHAVZ9$NOX%qIdQ5B0hXzgLTx{mL{04z}L-fZ*R~1@})75^6_(!>}loY16F!62WzKdc=f_# z^}MOQ{%x*b&XfWIdyYe;3DGW3C_Pu;ZR=e(8NaoV&d$uNGhDvLT?TMs(75h8-g2U5YzRgofcXS+6+ht@4U}a7YohO87j- zv%@o7bl01kdUxDN6%EF+HNASu&`izv^RIk*Q~?b>Bjy0 zA8hU7>FMcz z3JD8iV|aP+h^UyfG&8#Q=*MgqeqTOHzhX51^WDK5>y4LnaIl{Bd{IX#n~F~#W73`w z2#uNg!N=PZrEZ9b0bah#%R7tY$8fnrJ}|zhyw~@&wL<|>&?-BVKuv+Zr;_$8>ufEt z9Ju-;L8z_$f{7qaSEY+hSHbV!4}rXw^{n2ya|hSuC=lOk8?zf*He7Mb;dR@uA8l<8 zgl8E9&CX)ft6KKvQX`-YrvQenTkGm^6&Yo`>A2bq$LpRIEZXtD(H~X^=SMIHS{xCL zAU?VQu)Knhn*>1qJP!o^K$hvBz1#44nDZ1A-+9y>QmS=X)2C)*lo;QDBB=w7 zVFxR5{=$U`=y3kvHi7cEqO}SuS%-+k`|CO;-(6W+xWZ>Tx)d=YjjR$ zbcX<;FfuVod-o1Y?Mw8rBxvwYpFSNNr2C9PjRO`vI1Kzoc~Y6_rY}W6SApF183(~8 zuc;ZY$Oo^j$X;D_!tw?FH=*kD?;Na}A1r6rKPc4$4LV9)M=}i35M>LWzwjA0;e+w8 z9!>dSl1oVF0x0zUqNnE&akd<(h<35i_1fw|rJ1G>Y72|-;?_B0D!#g9H_j@RYL6X? z=0~S;0?1bg)iR%2ThHqK@?A{15ajb!O8qpPR`}50y}c}em3lmfL+bmMYW~9x&3*gI zFNP(q0@Q5|XJ=<$2ulRr2!{#;5(NPP0jQ=^CY>o^z(4fCNkfXzBDWf^aNq}_>;z>7 z^i(dbB7Egoo|!QNx(41W=1xJw`;t;p^!q!jb3W=7vC7KIb|X%GZjv{Vwh^`&eF;eC zu9KUc9Twq$qjSR#H0p+*I#0}?rSK_RshdKUra!KUQUguCb?a81e^5rP;l}1mQ%Is55PENXVA^?02P#4Dk%8#|-ZC%&9xvUK$Rr zgpxbK`b%xy0xh)2H)HVHymvcQnx4^nmsu@GCj@9L;`h=c9HTkPPoG}qDW4|)-P1E+ zKMvV}L7GXKL|~UExm+`Bj4koUT2$Kk2cU zvZh7A?L6;8_asp}?75EQMv%~aP74qFErn4Nq!qTTi)6ko&$1CjYh8!zP^2B;q&0#2 z`uqZ?8s_X+2GmJ{>6c&CSwXFgK6D#%oxzWDZ@RgOeQ#^qV~YiQYgBIUmojh2c0GH( z-M4#>9zC*tqWBplm5RB{ztWe?DpypO_emBq$i(jKI$MoR>5tH+~4b;Q0jg z$jZztYezy8*0QXfLxb%Uht^KUGQ|6csV5JfM>T-o}1MjVO2~+j{r|tf2{>gj8>b5r%tI&(Z^ED~aM@cDU zp0)xk98FDXla8csyvnMovF*ZAP780$v{iQ`->%p^FD$yX!(kfra8Qq_GY-8qf*Vjx zQeA&Pe!O_k*X^w*tU#Uy*DefD6x8JPbY4O)Vc`rEEKJ?#c&M)4c80s-3=c6S62KZU z7n1cRoNg&AI}G(@-g__EAq23|+dLPMz9&+<7xp#q5^-=8p^KRF5*0Z)`T1%AI`hvD9?w^d* zJn#YUVZXkw7?mr2ogm$#+~@e{F}DYFAY}TETnWU~_2)m~H~)QUX{3@8!2WFYV)>4q zx3@I1Vv{9YDy(>KQ%#>Tg#k+hNG-0%RT`VE(CisMIZNG&mvG@Ju^9{J)-G9V1CM&t zYe)AyCFRCNkEd5kK#79ES69GgDNIX8609w$q^3sk_wQfHn9!f*#V~cCsM(vPy{8nk zuwd>9R5DK7>B{~4_dTU^K;oUAK0}BH)UJTH2>y$+B5cXIa(*ba$GjQYO9=7SFCrA{ zNRbL{4yCNL8tdw+Z(TxG2fVpPky%utLWr^EQ3Bpn&8tyH@FG#a_E|1BERTA~$<514 zin?L#@u5vrh&MP@o&+?POGn)~Nf@PHqVog{OlE(eQ$E#UOgwPTW2nR`tv2^=yB*jY z1r%{B`om>*abgY^k0U&+eWgHD!P^Y8O~Qq|6=hnclC#Rw^aE-=Xza;8DtjAk2= zaV)*L^*VEpb^*#B^Ss~!J;`abUZv~cbs0aI!FFpgE7mHl{RX&2WZIds<;G>RkJYsE z#KA!T$;K{s=Stme8?Y{xfld0(r;tCMix)8c8}m}uAMag7MFQ`;#&w`$V4Rv`)YQ}_ z!B?L2v3dHm9^K_j1}PdbF)^?tt@r;@ydJLg@u8D)e>g2ZT57{6Y&AG-Cm{xfb8)bg zZxi6N(Cn$+fyuXjo&{NG$Re#)2>ak%bxC z;lGb-Lt{r2$A_yv{H7grlDp&nU%!5>12e_9px`QUPd%CbWN8*6%`{Xt}@~4Td@*^a0k5rU6FA#s+_2^Z%NdZY7b_3 zT|u7j74X2tUxL02Zc`w5b+i#u+ZuOQz8EwH8Nl2X4Gpedy^8Eb=|_y1)F0=Ru+Q3- z-$H~C3?E#VVY}1F0{pj_`=seP8B2Y$9iSttfWSErt<-4XlaT%|FEMkL^=uK|#vxdohl}(tq#YN$F)(wfupKmtdBu-@p0*+eM`JIt1_yN zeTV5yprGD$|G9hrz8~y%q8{id#~Qr!yO@t3KCBrJ0MP#3*jNYYoR*b!ThQ9V;>(zL zBPD~+ft@FaBV-z`RBfodgqb)oF)?ab>+sJLu!PXKW29ti@Ignsz|H9Nt>dHBSK z9~ijz{zg93wIvJ)C7>~FgA~{l=K$klq|&9Z(6rO!^{ZF?FumM{i!&6l8RgQtX+<3e zq__an4>R9NFHn)C`LK7^ZO957xGDlBSK8l;I-k(!?RoEOPDZDE z*Mo=*QelozHh8#v43J-3rIc5=LLo_UiNH zL3!xcf?>K{v6%BD82n|4F(6?PxOHgdtW(93Rbal6I@37?_ESHq(rE`vb8|x{ar%8Y z4;5i^%G6X(HHp*rM`G74;;GukiN9II3JCW z^hQ5qW`3O#xB*)PYM{^3+M0)!k+D-H{%YVzfw8h;P8(oJTMASLa>7DGLkB1yyFNRF z90q#@2iTtbV6NvQxtjRuRYOa2b3QV5dA-*O9~s{h4F_-aq|)Hf%Cw+m1VgcO1Ho7! zq#KMnB~~TTvcX#0NvN>D=^zBN6vV~X?Zv)`p2e*t2sI2ubE*e@Ao>AA`%Z5_qNTcL zr}k={CcGL8Mvql~OD4{&$k@zXTRu#Gh<9U!{<4dnhaniwV59*nI4FRLTpp$$A`PWm zok?Pij{zi6-6tj_eD6q=NzKm6II1CxvUIDK&f3)d8TIFS4=aJ$?Fg3Hd=O5-#D#!;91|qI8y!De!=1`f2p3>MW|q z!oos@Eq9hc5J|Dgd%s`FZ3x4|Fnk?-~e;i482L z_m1Gt?Lzy>6Hiuo7<`rDp8MMAL`CnGv+r)MD09jNVBg~uEgV>yma~^>wOvdfj#${_v)b89NR?B@H zhKRbJ&!Ld>>gaNBFZZwmn@;tE#f60`lQlAVCP>-95QY)*C+=k#a+|jDpVD9;aEXhn z39jw?XpXM~s1xpy3Dt6yNEia_%iQbYH^%RvbR$dI@KrYbZntW7kQ&BSO& zMn?xi8!jGdO67GxX*72V7Q+8RW;k6NU9Nh8Cowa>d8PkXSZ(F70l!BSHbYH~MNBOI zmM{vo$-e>i3?qxE*w|JV_D~^34Bjgm@wK+~2^qOBR$aN*gZuaY3(3j9A#0n^&i}J}@xSbx z!T&2e_W}#uiy=ddu|eq&IED>U7g+FtsLnf9#D%YK{FkU>`IxVjo%#8*oQH=8tSC+t zpff0Qx!k^Bk1J#ZC#gFY6Fc!_;41!VUlblcW&lp78J0!|Z(FQ|))bf;IIMgop;8`x zC)qr*LXB)SSP`(KSeTiahr5~mVw=Bt1_b!B!_;J)U8l`YcuWyHD_{We(HU~^4|aHQ11 zyd?;#FhTF;0yYn%uFzNz4a;C>=esjVkz(i?Mq@SP=z+a7-C26&q?LU5lPu<&A#n_ zliGk|N#JcLmjq@Kn0N=LLMeG$fM`u_@RPsu*Qp~@OsjX&9Q?7(*BQWs&r*^nk+kbL z7oWGZAGD79^J&k3F%psPi`-nA1voG>#KM5yq=E=e1K?XQ!MTeV3>y9Fxc^CiF;%ra zXn|PpNsa*nUBHP85(SG#(5p_23E#HC9Y8C6$jVSjy7FO8A{DjP5Gq0m6)xS1^R;{J zHV^3;$=nq&H<-TN=riWmR62=|u7Gz1j;6u)HC)l=aXH2MqD8sZ%EbE~G_$h=^7;G;M zDBii#{3~5~9e7Ky5l?{6T_Sy)27+tn(D8b1eKVscU?!D!b9Ian)M%ox)nqIX!lnNF zQ^3<72;G2`P(fkgUK1I{R+J7lzf{#Bs=#f-1i88>B7p=xBq}F?#$bgh;V>4!np6?? zPvURf1^{@j$i~l42I7_%u}LE%qqnN5(kOb+H98uucQ8qb0ROWc%3Mf-pO3^gOuzk* z!3a)-K2^(VIWe8+*$max7Ptk(*15Dxi1fU+qQ|Dl-aSJr!uA}?QC!nZ@aUKsMR=uN zL+*qDm)fxb(DnRRK@NhDdW0p$VFFsp%(7hMigoq%=2o*V5GDKun;mk8M8Li#Fy zthUoX6oU`-!zZQ*!$W5%fZ!Y-a4$MhTMU}m|9p47QA&uVDH4|t+klGcUhefT1K};s z7G)U-=r`{|S5Sy=l3%(;QHLMMiTj|>gy3Z7@crhWMq*xGqvBH(EYpE;hY{9Gc1sct zI+gEjEU>e3gaq({QcS{EY%0!vdKJ%-4WgQU`V{F8r~@rs13WRHdWK;m)c;Y(e$Y>E zbkYz`UKM~9*?$?c_zn9chAkh-j79a%cI4V60yx}IGWyrywPY2(7TW)vs;;)>(y?#= zH}Ux?9ys8@Z)6!o)Sz!g@hPq>9o-u<34C232dVAn`2Q381$8`;a^@X2xi8rnQ>-Eh z%`13!5YEcqh0l7%NA$LbPjPm*?)+(V1&X_nYC^^|1O$O4)plW7eF(u<7p6vSXPsY8wcQO9; zzM#TUVB=s8{1;pdWFqh&lnfF(ZCwune$eY!-~-{UWGqW^)G{bSaY2bwffz%9Js9#C z03}LWj^)zy1Ifn3%#78i<3PNyxajYA@yR*3x!dMdZNxg=0Nxb(R6)n_#^07z&rbLn zYZhrQ8|=-sjd?wKbio=1;lplo$)fht_`Ny0q2R~HFit`2hw%z0XFj;e2g^1-jcBy3 zW7m8^QB}3I#A?VES;y+N|1NYS+4ay1#otE4^H+Cw{*zV`PtXd;=%C=y`MSCRgWuDS zz4wf(AimRI>m!4P7H%7}699P_l%+j|LCgvg#h$>f4@xY0vt$9E2+qcOE!Od z&GD|QY)KL%f-D%6y}5d%2q6*JLa8Q9JP4s6vWa&lWo;TPf5 z)~``q`;HSXR+ekbVLrIllOkZ2CVJP82?u#uu{!nyH^S*cP~r$;*=ClO(=v?Go}#=* zC~8T|dNX|5r_a0?NVhz2XUsSVd?Xm)ul1q(LGlUG&$18!gA(HhH0qLsY_uP|$~Acv zh_4$&5@9%hP(un4*x<%zU_~-tz8rE~YCR$jJ@oHJqTth4W>%P~@Gt@?d!Dy@YP8E=q8>A4+ZhB5m6^R~fF6Aw2a|5iS#t&$Y42?-h6*aDU z??|Be2<9v$C5Kk30o8!9N`}B%$d|hAnxVl#2xI13^zlR~;`n~}@WDD>j|-8Z2|Aw; zygo*`2bFi+j9D(ey>$(zONx)^{U9-|HC0gko68Rn%Az!x{Jnc*5b@xwZJ_~-hb$5H z>u*ikSdgm03A^DBBLt{QTo{)jDul8*-jy(sG=S~KV5%RJ*3CTL4upA8-GnXjbifUL zki^JgEd~*{g>G+r{%P!ReR2s#Irz7f;wl-=M2OW;$pqTvj${cKPCP}&DlWEe zQ5rLyt3e1pVR&5bY-@4L{O*{^v-U2jkM2OQSqi`;t%rmyzsrgaqM~3juOeph1O~C* zVX={sz96g7&=>M-b?|l(Fy+BPiT~OT#CXAsI}d4{+><$?Mn3kK_dYiYUSnXG=nDSu zdWXa+6S(y1x=zsxhqXXJ(S>^-F6up58?Q%p6#_7bWSz#Kxj!oH-By{SXW$)8fPdcv z0Z@oRy)|?v`?WC++$o z8;134M_ns++}$KB3;<7~2=j>oaX$}#Llt8j_1480+eJfH^N}-0=;v7y(M#M#t;~)~ z%DFtsPnl6OI}6RMK5zarp>at$`L&W*A^r9)tr}^%lP8n{a-nw_vk{t|W!2%VpIIrrXH@A2f8md27w z0jA~buMedE7?jVxll{`e!p%)ABqW5= zbG}lyE6Saq&x+OG_|AnyHXs;6G?;M(rY-?R$WG;QPmlodkk>eUcK$og3KOO6k8AHZ zak{)foDUD{fNx$8ipE1+{w!pQS=&-6fur;3U@ZLVo#GS3=j+dZxyvUY8^DmQrkwWd zIW^EIYy)JD6 zp2hvCIe($VI+gZhsk;yr3JAq=tVr>^IFP5j(=YjF!WNB}w9{&O9nNbl-b7>pG~<&f$5Qz!H&fEV^r z-srr3L02>Zmm`)#~KhY8u8%iPSfrctqeqaWTQuLU=yvI1zoOpS< zE!c|uzEY=DkE_$u+1WPiMQ3o{F5cIqSLvryX?j{&RQY2;{tavO2e!W_ zYe8N}Q3nHTNtmbaLfBqkkmixq20YxvEF=_ttgfL!^{V_E!L=tzL92KyPNyCa>31^4 zYXf-I6o)G1s`b>3v*jVr3D@Xk#B=3U{rkkpOUJ|u0_EzYfCIO`kWj7-@fy9D*k?7((YFw zOo(U1zTS2j@4x32^`2`|+J1Q7!}rs?2^XvIflmI5IjtWPapYu%0gv@|*v{VHL)fzR zT$AuE9S|Mjo%8aFi?VYcDuz3I+W&Jm{ML}nc3^X-JC4u!b<6>9Bw33wEl-*g8 z-yl-oR`{CBOW$;CS>mLL>5KmD+?K>bZ9~zmc++fZ$f1IOlO*Mwm-mOy#U32;@Ul$} zbVZGS??*;aacITF8`V8Oc!=>GV3^^z31E5DZgP*&44vSUC5RKv#uLCZE$5DiaL^Tg z9r!;_oua;a=G&dH)0l^XMZsB7S+5AK-pY38RF zopxD(i(z_x3D7Tq)wJiA^O%tdHh%LXu9Gx&kPl9Og?_^j7gi%YNxe{l+n0nR zl-D`AzTng&<}vlG?(U&lv|CZ903L4+9#di*2UkL|EGJsURLVRuwKF9fnO5e(QY^si?0B(-Od-gfRZKO#XHCNI7p8X8_Ht}`q)T~aO zN{NTOe%-EqLZL(wpUbwW^#>Iyv?yfcu-KvnJo?YB=xmNKTS_uiNY{+!lI-J5OnT@2UFUN;6A-nJW+3c53monZ96=Y91$B2wCN|_qupFV1@tyK7^LuMJV z*c#Uy$@JU4R6%6r&#=aQZd&9`xY8ec_c7RI`U34gM>*CMf)>E<6jx_xjCf%}}In?Ngyl1)E zT2d~tqFqbD*TlT{HF`o9G|d(oLp@oPHs--WjlpD_&^jlZ6Ajih8b^P&34KX44&}XT zt;gQXcH*6!A@{xKr#AUlXuc^n+@f@Qq~^+-p7Kf$f0)0j@VjOf;9gYT6`+7>PwTO4 z9enlESnC|BH5Vw%TR#=g>o|pKZhBO<1?V_1{f08W6&d6G zr-yn&gpGr``qd`JH=%dD^%FtZ{jrtorit${Z(p`;QAl_9lf7AoSK#~IB|Ulf^82NC zcp9<{2FmO_nO}w3VSI%Pk14KYybgTuF*~W~+}F_;7cn_;jn|{w&4h-AOa6q2YL1T& z%to%T21(Y*i(D_U^JDq|1wsCS-#1 zFYD^Lb@E$mGq&>DVRBzaLb5p) z?Fve`haWJ*jiM*irF>hqa}wM}uPS}Y2=;qpK*x=byDff25TUChfYtlwAzlLKWt6X042m;?K3`u@Q&7)K zdZb#GV=Ex`DdUk_Ytk~;YD2Wg`VHNHBJV|&4zfLdjdlxplI-z+n^jkS{WixQ)s|BdjP*gcNld=!=EjCBrDv?y&cys>wyV@cFY z-a^;>Zn8D=C`pB4Z1qb6Aa?=%g8;!|?RA8de-y)1H~x9{QG4buaxHnQ{p9%~;AXpu zj(mVPAS{_V*Nv7Adp?s&PecEuvuAE_l?O!V6AJqz<=#>g(OmpUDq)MSR^qOtb9s4b z^xo8U1FMOuAui|Aa;1G9PO_yBG_WEp+e|?9`4)6yf6wZ7>D#N;WIoN;pIR61GQHJs zJ-eS%tS_iScuVfmUB49WA-A_GYDt*xOAbfa@&2~7HzOxW76-Y^%p?pe&^fB8*!%-~QvUY96I$(oD396~J?n(&Iu{?VIq_8G%dfd;RMs2;kR*->VC z5(XU!4AJeb-xZ2syt{&R;uqRSVwMaPl|z3gPIEil@smHz&OND2uISR6C*fKmHqIZO zbb3hPABQ6%)Lq( zy-f3!y1B{@$K}Qdews%nf7~Z;zxS|z&WHCik%I8I-yD&jAw@Wh@e+otGOh2GXd!sU zISsHTXEhM1eeuG&jEGBrRSa>|IaaQ=@0Gq%iX{nZ0>ZKGD;@c>X4!o>gnDagL4n54 zirIx2=9=kW|NK1Xq$875*T8=&3@hs?|C6cpoF|5w`UB6d95{Z!i@rl|#{b|G6>Nwc zH5`h_q=&3GDB%gYnjyVFN;SIX(}`^t6xwqhgju&~^cFg)ieo3-TXQJ;JdHgx=o+atYMFMZ$;4*X;)sY=A^0Y*dKhQNd9k#yd#u`JP`HDMg>U=ZCUHXQP;jTthU=*?2B$4I`PO~dww(m~6 zW0l5_aJ$@!5mFsw?ys0k3byC0v9GGQvmU2`0mp1O#vw>0xVtb^LtKpshn1jdUs|q) z5LNUoW~~0}@e)@l8|@$bQ2lgrK!o9dTvrNaG!upY6vJ9O=qA@IyrmzHT+~=`laa%kR~nDE3V-`tsF*d* ziX=;1XW1cy@}`IeH4;tpK&6QyjebHs5!`AJP5N$U#`T5k?sR~H3ss`GsH;kE;G%SF z&bQ1ziESZ$!mz@(ZnheK$bAsNdFF|d%!(00;Q%+{)r4y;NZGJ0SL?yS^je0f% z@+k9uRhSDtN@V07v?QUB_&&18k3D(RQFHC&i(T#lt`kKj(nKhE31BevYEH!y+m8g_ zP3v$TSLOx$Fu9;aYi<{PouK6Hrj?`$N67cOfNK(a5+7yt>$lQFU;I8CF)T6Idv+!1 zv&fzZ8H+iAg7!^6rZie|U;c(nKS4}g$e?iCLygSui_P>>OW{0Q_9gtT#@cWt;p0w0 zr^f5CGnt6m7H(_!Wc6l<`^pVwJ4a=jmx@EyD~xsO_4i!0~>}FL&rr zMxi$lGUwwG)KR@-Vof>T^SyRH^IgHGQ$pFgN~9n89I@ANReAKY8|ZyL=3l>`sd;!* zGy32%`J>h^LwS?qVzslEg8BAKfsJ1jY&{at?bEs=M}*ikEr6=Mqn1+*eew-|{^Y}F zwIk{wPOavTtojU`#}=`+txu8;t5EW@QhcB>-L&nPlFxFf{9S!;=;-^eq+-NdEdU}f0a;VJ#7jtBO# zH=9%dx$5Ni*O-T|aVAMADo?e3(KaB%H;pCi_u>G-LGkRXguO~q2v^^vDlwV*`2@pX z(AXPp-6pIY-k^rQm*PLXFr?2g%sdr4THp9MNPCyds2dRo`Ne|}<} zZ$Y6Qt2lk@Yn()^S8eSXQyPi2*qNJ>7b%LgmozG-1j8SdUdegiH2X`OE@!jdc-bbg z_^#52c8-Po_f=#vu6Bf{>M|ra*A8C17qu;+PA|6lc?-wFA=rjTpCnPBAiD%%-VS*; zb{;&m4^a_G^z9rF9GiqMwrF{zt{VseoInqAX67y?3SVX6*eBf~;({*yKZgyjKL{pP zc1ddaetpiBxxef3_TTPFeo+Z(%v$^Ct%FswFtaR|-qeS~t1Z98mt?wMvM09fB{-X- zHnX$;Wo@FQTRKF%S==}4-?nvq9>$)!^3m1m@aUGgNrB_aL&4D@ji7VIISqX})i=@$ zq(+$zZvv*`hdjk{orzXQ&%9HK+A^U>&(K54;NkXHIKc>!g8T#aSqy-w9Du;_{=4rK zSrTfY4~Tg}8PtU@N~?svWRt2LU106`yyKz5e z<>^;zU;-EMR1ybxUKDOt)C6mMUpmivys@9y=9zHQ%}e65_ONyz(z*G{;EBPvlrUYs zOaR}D0pn~^G!}p_{J8BrGMC~(f}UThZD?q)PO;Lba?~33>B305u3tOYTOecTlX~18 z1Y#_6sc6)gomT&O_hd+0&?ReDZUOs``SiI*s>8J<&B0u~&az$Rg>28{zLs}fy62$9UkZ31X6pGrO8OV7YkFaaeZ)VnH|@=40MFu=_C|NOI-GYwag@F=6KDau zKi_Idco?z~W$^s5?e3bvfD=3;qyz)BjpHjSZYpnWU+C05cA-3LpKiXyfW5WJz?EC`D%NDPhP>;&{-xyvCVT>ZUJS(AP_6{N zZ)Kua8aOGo9t=?O07Etu8kX&ACTzD0GeUt*xH?+t0a=+P?p7AoVij9zZ=y5UyyRy4Rj63^Qon+qDc+%xw~n%@~{bl}TT#rrG4 zeeY>at zeY2rU-P`Vpu+y%p*Y4S4rCKf2(ORhJTc!%?$nfmirGl5&BFfEpDlRJXW@Qi03yLHO8>G8Ix?8$SNF!iQQ2f?;-s|(?hdna6e+%}1jZzVGA8>g=ZNPW)(RHy8x5*LfL`!wwyz_i% z+hWG4e%Hs7h0I~8-o^1}IDvexXZ(5KoymSTd`SQPgOJ2zUvI(Y*i)x>BysLgGgO}c3 z=}rx$$V+Pyk&*WIG{&_<=Y)9g#tz&dH@9#RgPwOZ2Muq9sxbVUD_JBC{vBY*q)5D| zjtm(Xt8iQ8{o29c@Y;(#mEIkR&2sasdT@R2X)NLRJA#9^;PpYf2532qD#jfq8ZdGy z+OO6<>$0)GOo^EC&X?#Ki_N9K>l^)}Svx`-o;w!uO4+5MxBi5;TQg2&ywJH;dgc*4 znUVzgFa?Ho5v2%>8(Fp8P`L`9DEKB4qu6rJ@p|1X7?*KD8^_B913qV%93Win3wa6Nq|%8PK7A+FKwqSW$}oA%cG8_SKuRm3mlYLp+@2x*s&s=I2e3+7r{ zTFiy``vovv)+qBHT}{)${hnG(oA2KnIYtPE)p@`8D}e`n2BAcjs`+z|#eN_ zJ85#orbfs#BzsQ(8!=@;`ZDxMU?^tS`*U`{KF# z$HHHWzt{R`Q;H#6DsdaIne9mjlNv&}v9Ib%I$?sBVRiGegS{%lrUEmD5n+4LcTwu^ zm2frUT_1E^o1~`e97}n1l`zPRyIX@4MY*UAPa=Sm4g$__)Wr$|=ciVBYE`#jy ztIrJ^&;;=oVd*4%!^JlvxH+Cg0bMBnE}gZ<^J>peK9;v!Uvu^wQ`_A5W_KooPdop) z>5B>bjENiL+401W?%a>t{!KES-VS~4;(Wc-#reC3x9uK1<5W@-%*R0jAd8XN#xV%g z6O=RlY7WSY*FtyUpcshBYUhmu-UY8pxXtrgJT}Gi_^=KqLzn{;g)xYDgM{HnwJb>E zb?Y)ZTC`AlUX8Q&Q>Oy8sezz_zdZiCJc86G%bg8kIEz<-`K(ueFyGXx7Cqd`NBDGo zR#DH%B$$fp-EK45eTBBGy_DF92rKR@xiqE!;VC`E%NnYWAqB&m&hHYy9UXdwfc}<= zj~+8x+cIyFmdZD9=9sx0gROt1WWKGCGKgsPiRgFnLKC+qe1tYX`>-m8${WvRGJifi zGt9kQdas3}T+zBp`jRr^!P)-B;PKg|ne6Eli|Os=v7uIX1(SFVuNE&9dBr2<7c^|M zj`8mQQrW8=cMt1)2IPm%%%G=gFCafgJTPzU2}&XDuEVaI_!e(C>N#h(zUoq9HOr86 zAlo{LPNv48! zl8U4dVUIEKwLl3jS;F?XCa{G<*9i5j4ab}B(;40c$_IuPv zYjYoC6elv1qvnh1LqZxhQI)i&zZ7gWwiiCC_>g@(3h{We#VLWM4vu6m zBlEnHj1YgHsjqN#b&BBJUJ&%!5ASuboi42g1bHhR$B~Y7wCHpM8p6E98SHi)wB_;n zHQU$vuNbC5QvM4%8Kslfl9lVTZ*sz-cj};D<*s889+hl$cZ4?$%m#r~}jndc#u{v_0Ckf z`T3w*mKt#u<6y4Lq+%BofITh)A&<;o0?EuhU{l5#t>6A^IkFZoGUSIpT>LU{8U&qBDl7IG? zl($Pxb9Ys|rzo>bBDoAC>vzv1p@cfkkx>f3EqXy)li6@!u`!bv8t@jn>hX$ z1U05gUDv>rO>|d%L!oBKJ3;#wZet8(C#y1JL`=i{dWt0;{{pzz*H^k-hTgL)TFVv} z5C%aWYM5pvSKmFBwtd(>e)QQ%nJmqUjjXA%c8=)kfHSFHhOW*oRBy%8NYq+>1n z6}U6>{mD$8YVCu}`?4*jsb0w^J~r3PatVsD1_xIrzM`yoVWY+GMC}6PzQR6>p-)nc zMb|%bz!}Zs1+-sRw3Xa#zQ@Xcq%Y z7I)j;qGlpjSy(E^Bo6eR(Qfz-a>nNdtHs9UaZ}>vs?3iEB95ZIVK{AoMa=PsT7;!J zejy&2jUM9*+!v*2T^3Va_j zmKdyGPOvJv%nWqKQO}|LQf(quWki-4uri{w)7f6|Z8h|@F9nXx8pts6wo3}MA{iScC% zQKTB;)yQUX=l*?e`+qo ze*KVr&qWt1ebc5gum!Ay(MwSWcgd&Mr`QzmKS0-zs30@6FXhhpk6KE75NAy)!1%haD+M5W2SH*OZ2#y zz&H5_Hlca>EtvE+k?^KzH2An~?Xo3i55_GO!)T$m)L^E}MA!y8vV0Y<$d2tHZn$}e z;K(@RV;jnPYCwMr16kwm#@c->eYaTWFvIKiW`I*%UvkUITLn@8&VsRFTA-%$SqY7% z|H0}-R_hcoAf?CfzbXMra-AU0-fcFtQ@f$fUNh>wv5%^lkEr#X++-(~a$8^T)&GKk zWiH`w9Ace$75xWq<`JD<2gb^b-p${7`&2!`wiVPhJ02w00#;iGuvWcS)w}bQOC~FY zb5}+>K_L-ckKcU2NU(>FZ0-?t8$~Q5rR~P=R@B}rkr@Njy|Dlz@nn76khs31L1QC1Kg8R># z{1+N50?}<3KpWix0TQ!3z5A^xp;bmkT4BoZjx8KyoK5c$gZ)@PI`eSJn^4(-LYZj??O06c9Ili zSm^SLu5Xm3(m@i;KrnUhKxeSiALEgQ8ne=2p^0S~|4tTlGl0eQ0Z`;CAjcN#)EfH$ z0$RUt$A!%Klb^IPGw3V;d!O-!j&>WSiE&=hJn?gM))^k0hR}Eg5~kF5T?Hd){_s#< zp&|Fogc?V9u}Wc3)At|`5&It|?-<`$29>gJnPyDK@B+oO|E@tcZ84``B)yQPvjPa& z-{=)ksE{O;G>0MDnwo$Cpkq)AjISh61_G2O3QgXFAR5x;UOP;X@rrLg;@iJiK}EE> zk%U3g6NL^DDwIw=PZ_DKBA>w=*L`39qpXd~#T#Z^J&EA5*#T_#^SP{}$;adqoM_H4 zdngj)w=oGkBua~giC^$CzXjNyOwxWRIn-}=Gy#h~rn)VRl7fO{K!6Bj3+jyhlxd6t z0dbb2qv&eU;_eJ3b&;AVGXcjG4jS>$Mh=tl-d>LJ&lPPCKE9ufL`w5z((YNR;f`t` zpNh@=T_aZo!4Gcxa@_zM24gxOBNUSKe7d1@wEtpq`{}RN`iYm*S(VI}NZ>qpQ=xBK z|5k?}^ypan69k$nfKt7;0pg(_cy~F0Zy3@G_>pRchGZLKw^;K?B2(oxq6c7PqpZhnOza7_}aM&IRLUS)z8%)J28+@!MeTml=Gwp;#D7 zHc^a2{L-DyP))uNZbws&76Nw#^RbU9FOYp*Giq6orSqkaR$0`&j6UsZN)EIRhBD04 z-pJX$T3t8lO)mY{FU|kjrJVKN?ZMo^!OmL`mB}iJ(pOZS7%mH>Q~{}o=um!Ttt0YfKtH&fEJv!BocXfB8?vZv6HnMFM zO?`+Ch!+45{Y_5~pw|(J_`Y`P{%r-AjghWaA}>@MD2cWe-@dp@Q5NT~rA#Lb3Vu>- z)JbvEKA$ktYgiZAyDIeqWtY*Z1aqfhDg7XoDh}M3+;gp!iQDODy8rdpZVnf{Uc+ts zieOlekGTB8w1Q7zDA{;JIW(3rZ53OEK8IBo0s%;qEw-?F$x(9%Twa)g zHzq~P;nnSv{l|Ftv^@L$_0ccLuA_3V3;Uuph>F|#=wPie#zW^;78H~N*K6R~Z0ei| zgkAB8mN<$YZk(b|aq99&`PINK0|&AAM3j_%W*o#hdwlGgv>ht~;xr903NZYDNG1Gu zRFcJQi2|kk0Iml-#N}+63jpeTR&t^(*4Ap7H;nqVzLFq<%@I4`f^CjRXb7or{E>jV@bYT1EE`T* z+g)qVZ zGNf;)OPOLG6*wNv-FlR++hMvTWh@>2m!14w1?}`%8B>^G*`!tK6e!{q2)ZxImp=cB zzx#EDVWEBP%a$YP08*6)YSwM;{CbIw_kZv|v5r4BohRnA-7UVX?9(dw`S%AO)&ypQvx6>VcMr6>cMIw^Dtee z?t<8xdSq=tD@H(RdRj~B)QsSGccxEwF&@Jh&oOPvx1y4=uA0Yptq4t4) z^Hm5`-R`<)MVZ6J^HX?XM|`JKp2Zqs`P$oB{lJA%q?$Bw$xPQ6g}W0^fp3*eH*gEM z`48j+Bwq`GHm!^%N-y9+nt}!+Kfv`OV!lL!K(i$vdL9iJ@kIdiVOC&fbG>AKz+$)C zCwctX;Uh-?s=vt=vZR<#?OTfQA&92X0 zMM0?NxKE9_eS50%u4tb7eR~mk8R?I%SfH$lq|H$yQBO!)qHRIbC4g*P0KHOWrgg&jhL)G0z#G^r82^|$i9#EB;fX!F3OK3PjHWiOCb%nde$t-i0ow#pr-edq96&lMO& z{Z#m_$J-TO%s1(W3KsPIJV0T{T+D&^bQ?1WEvZW>R}uq*w3LxSUBX-ssl2bSWabr6 zKbDObqZq8XTM076WuKA zGRM&-Dp=d!XvYS5{*-imz3!O+>lt!)njhZX)sAD~rZIFl{V}S|@Qn5l*6E^d8}vy3 z5-lvqODlM<$4oMM$UN>${yUaK2i4F;6VanQO;aLGbU7W^U4ZF777UAb0LBE0AMgjg zbp}dk`U9|0nD@WTNg}T|8kFs@QJeM|ldijBMkY$9_449g;c|lA-H=Cc>XHli@3;H= zx{@=nqFiNaM92D18~dhy1i9^-&W|=!93)KoaQAqj_8LJDeg8@S$SgNKGT6rcEmV;6 zQ{loSG}^eB8<7*FXEyzRqO0Wb_hp7aA&sC{igl3fDVBWq2VI+5niF}yrVR7!L+xE_ zm5l<2RM7ntXFTKYA(N%|f%?M0ETBGTjyR1EM}$;x0^@5AwbBHuoc_~F<`PAeo<4#2 zCiND@9t!(36C?YwJ>IHlbU8PbXVX{);!6L*;eovZ zhr7ttQ5d=;@^86g@Bqqng?HjmevrElFYGigRqIQ4my z-ge+WO||Y|iJFMVd@$A9bfFg2~gJf87fX0`pS+ zsFb1%13xufz|5^axLVM~&0v?Gw^!dh@FUCQxJ>t|BnP%kQ?-Qq;&nSDSu|5d22HpLzy}}VTAY`c1Kq3f4i{s?{o)HBcABh_0}DRgv@k<%pILuJzVF>X1y+z?IJ4v2GKIxTUwK=Mzd1 zi0$;kV|Phg;vi8`qI~RelBc8+jTV>1jNI4o@lU?$R|3wh{y4+y27->a=`zZ#--;U9 zM9-%T`fLU44Yk~(b{=PcKhn5_=gM)6C07uzuA1z3sT5;A-43A;runIG$};8$7h(7T z1>6H5KwyWL2rPk>ediQai*YveuP^G^`pdkZ!?2?YTvt5?e~yug&6%~nlQRk|o#-TP z@w~CeN63;oc)o5LkGy)Brs6zxOb=>Xm%7GDiYSnM8T-Ne55?xmiRZICgnvRi5Dwaaqbr~Vw`-%q+w(Q|5 zBwV{whWv+XKQi~3dl!Ep`?pd`>Kj>CM zdZ*~|DmF6Do<*X$o9<0o`=25XBg|`%seM6qE{)sXhZpqDK1fShAd3eXzev8rz}AC= zaq?})31Y>`o5=#KnaberziV+qPhlKv+oi>-D)7w6I6*sTFqv}t0j(sSjyuJpeR8k_ z2Gt9WZ)cYAJKCzN`q)0JR~!pgVK{Kui3OiO|2&KlKGT@YwIckO@^NHMpP0a;TIo zy{*}YPvc-Wy}m=y=8qWohPsdj++K0MbEH zUS2$4rWgV`F9;kX-+%QLPNsk(TKoIv1U1ziCQ1-_Ft<=!P^9nT_o?m2PfZ1>f{@K! zzJTli+BND5p?ahUCpjxgY0_kpH%dPApAohIkExo@dsPvgNz z=-W2qbacxEy>dQna2IVgc?flDin8{F52vsh_P?!~gk-wnJ8(@>#5?H%TB|RgJcON0 zW~QkgSX=o_bLsp8s*wL7FA&avhl6HN@+!*it-fNCAG^t?m}`=qJkNRj<_tJZ!&f zUZMQFc611G(le2Q=&3h^Tgwm~jq5qNN2T6=(aO!?ImcjFOrJ-&TOD|QK>jGOp+^?5 znQetfJnj>jzQ@SFV9n=ZveVTWvvfj7(B7eahb8jCwBuh)0cgpoT!3pE$b@~c07Y5L z@DL0s=$%OaYU?=b0t>_A)WpCX;wP}8rDRzl3SEK7W6ySTh^Qwr{WZ#$5v(#=?A3~@ ztUs0(AyL-u86k-EceegFBDGNNaN_b$+|A%&RYL`Xhvql)w*>7NghEw$N)-E5G8Ho6 z)%XLidO72uDgq$+c{p+yWF`*{<9fzE2^${oqgGi={I$+m$8nc4#*+Re35x~AXkP=! z*gKHrW@KbkGrRNF{8w9CTuf?BOgb1!YNpYH_G|2Fjf6D~X$W>nv3>odV5n@b z*+Q>yeW$yd@j$uG@WXS4eKkG4Oy5_Cto~8XtUqw=_CLS+4hqLu6Dx0i*U$Addl3!$ zk%aV_K%rhA{0gzqBLFy*K`15?ipd1mwbhQ?0=OG+RDy5UuLEpDO61FN|GGMcqV?1s zvfUe-{bFiURc2Bxk+1${?Y%Dch|kfEa}JY528L^tHX{S;41?xGrL)Nv9B<&JRz0{wIMF|yj71g%LR+ij zCsMqk>$~t0KGdHPC>QEt(WyIuF&8-MF9bhtYN|slGTIpmZ;t zSKzLUM7zBH!&!Mi({~o4%M=pMymc5wV7A-d6XC(pRUGJF#Hn7=2$r?2 zvJ#{IiatD__>T)0gF1eb=8Co=lRUZg&$`v+-}A*jSzr`6-nA#x611A4mZ`P+eNm8{ z3az210^v$*&c1lF(;C5GWW)v}x3$;xnE%|h8vQG4P2)lyc~P}r)(oq@vAc?@#Vn?i zLw*Sq^ejh}w1w=eo)RAZx#f`a{Tj(}0MG}CtB=Fre6HnmrDjXFKxd*`_*FZv4)-Vz z%C_<41zTXP{Fu=-5(Zp=pL9;dAnVIqTLf^4dcL6J#rlB#c}=} z5=Gmrwu-LT>qtN`K2vvMkEyWPXrOQ^((O+wGEe%;(*&Znc_6yc{%!+RId0fePwSQl zSu#QHs7C7HKbBikK_N(`BD1>N=>-;|0E12V!i994UOtOXj={~`Oir(Ka%^`;w?1Q) zD7^Tio$ZSH#?dNbalqID3{YaflsAz*d*~Nsih?f;GRELYE=i`PAIbuE?@+>zn8bp6 zWE)GWI$s2yUzy=VlP(Ct-cp-(JJP|b&1RLWicAWO;XodHxpd9bId6VhfM%1pi+FtC z(!k1_xo9?ZEDO@u5|*icRfnJqdmWm(*Ep0GZ6oMtQXaD1Jyry&>_Z zQ{59@QL7D8-fz`CLZdCgw1Sb+4nBHQY4)H(Mjvvjx;x}Rj~D#?oOi+1Vp0W$sBB@Y z6E+jF$Li#3wDj)F5bI^6aK+YeT3Bv!ErGa+0wPdOSWgk}-|47`olt-n_mB-v0rXZ| zGkO*}ZiQJ|5<_iqv$M>|I2cVVFY;z~m}S$3F9gbKz9f;`9bdodojsV}6RR_kw7GFN zRTKR2J7wzZK7h|-trXOr_J%oCU z<}O7Ya+T>+v8@V^4Xv^V^b(LZ<)%-Q(q{v9rdEGu;}%O+k`DB~yS6BTRM}n|bFSEV zn}ZRgE65h5j~<4H8AGbf%@x2)?5-UX^%$Xi&I^tXhn`Lv{%$bdu|r;Q*=^{(&QHOSN!yi}~RGab|5O)F*m0|T0ll1*u&k0LhKqOR>lR+%LUvVsork?!QxhrAGi+Tpw zF61L7IxqK^>>XNe)@_(ceq1lMYe0IB&&#-Oa*|)(@1JhQrCQb>e)V7PWFqP+=IxCaS`LMHUd|0*MjgQK>b%u?rDYJ<6-344g>WyO;<`<1PUd9Os5Cf zYcWCeGGuH&EQ>g#)K9(-9p_e=?l9PbT-BH-fP=7_v9p^&?U2-OLg%kp=gZ!oi76bI zMmkPaA9;o|Qg5lv=$kYYc1whjwHv>OsCsL+#_U&EWd`4Bd5z|CB+TmXPtEr>^saoy zfUcX~PZgcc({Rw32MF)yX=O*ev|#6CZYOAIUf37-^DL!e=kp7-f6Y7;l{!+xp62> z!ulx84l56|t|c$9S+R<#MU4IBE}CPGn-O12)IiOy!;NK7S!{;Js5q%P5cpJ?abiBA zGn}{_*Et*sMtqz%TDEH*F!$d2M4>2r0seEfga82>^A51f8XwXRVjVt<1gUv(0{{VV zQ$|XxjQzQBXS0Gv#b(+82;jpx@7`w;*T1c>z&f(5z7ZUNuiR>>fz3`bn`;8>!&JB` z@>tUFlF)b-#E76b14Brg;>$3ooS}rCDP~$a7wQkIi{{?U?ZHz`S?gDOkH4W_G(d*d}EZ`u&+^5BJXMi3n~2Cj1Ky@s$O}K zz`EKW58vXM=&g?oVyTQ1a=k!V2WYKENHEAtsbxvj_rPO+0Ar*-A@bynC+dcZ`=tfk z&Q~-+2MoPFx*?*n{qbIlG9uUZBBMnFhh~AbDh0BL+64!krTc;b>;i-e{WCc5aj^K zJyNhaBnF96XeAnSx)Bd)Bm9`TK7i-!eC@di#jqZ;u5t&MIs@Y_3?!@SLR(bz?|Xrk znn<&&y*#RizxxBw5S=Dw6N~^5A+agSWPC&I*LzsSLdlsU(!Wa;D|Sq9jZ%I8m5w6L z&Yo}}f7jL=H(1T7rSubNpQ zNS*5Rdzl)%#H29m-0St{8Vk(aFlHDW>91gV%~_H9(Sfq&9W*9oP^aDdaFzG1$d-V!)@jyy>~+(I3}_K({n z&+&&>++%pDkL?#d82GRtteR}Fbl_6lAaAJg>C3CW-HyLnoptTD<`gaUFLQZ_j$?e+ zTqR6erc`*o?&jYzTp#?-}jxy1u9EOU>LuvK#w8X?djm?df~&y z@f`0;lAM0IoefuHNn}CWZbvzM+LSfV2epM}(;%G^j({D*psI)!1~Qwr;7npk5>0bvPF zv;lAIFAluBC5~lk#@79qFDkAkA2nJ?0*10)wYw*S+vpaCsRp>)-wnM5K!x=^a ziIOWc$LjoD+^qV_T1YiR2diq?i8A8_9f9LQ{@>6xe(p&GG)NS)0SG>Q>22y-=H_jn zO#i1>2_u}IkgJv#f;_~&bjI=dP6kBQfK)AW3OEU_fjvqaJnu^@5M*9TAJoiUxP~4h z`-*Z&GD5sF_zK&H;?o}Z!74+&7Dg+}H>ukX? z*)g3gjbGMd!Rle-(6XZ_uVe-sHl!BZrF;eD`-wCwL=3ru#lsZ`)z4etxKSmd9hb{+ z7Xk*RB8y_-lI>OR5S--`F>3O#)+im^;e+fD73o;b~5RUOL1V@IU1XYV&H4rU;=MUgvxQm zM~7d30&YO9o8*9JFdRzE&(4{;K%4Cs|h|eM3dKsw30831kSht$yoC`3&KU+toMvR${_>qo3 zSQ_3an;&u+z7jNfeE|4Hdy5I|3=7d|llHvroXQ@KDfq1IvwMV)&ePmz$Iu6(gd>28 zgwBq+H~$P%O23YO@x@)tm^T;K)+rvy`n#hz*k^TzMXc6Bpq>Ck@ zC@?!%jq+sJXl4Rx3e0!X7?r#)^NJQYi?3@bbjmB5^6<>4j)BS1v_Y`$Q{&Mspdmyz zRJPd2_4{)wf|JJ03IwV__^n>H#wba0aIBc}7(e5374L_AZKe zLu8Vw%#%?qZE&H4a&Wq8gq-1Ng72(9@n6&kQds(9AMrfjqIcol&BLv8j&5|Lm=|Mv z$O}~8$;jAM4n~4>9|6M!YJ(G6kv^lX!AcO2RXWKH0Y0ixx%qc)|CAh((+r4{Gh@HO zSkWFe9ns7gE2AIYj}Lag`c9OSiU$0IHYzC1X^R6E^&NCs0Nho_I==KfZjRfO2odnY*e_0w?U@U=d8_v@N37MJx`rro|9!@^k@hz#Wu1V3@-TPr{lflOE->>V1{}= z`8%k$mx@w`jaZ=%OJ$;Y7_E8tjb!7 z;El%aZ>3$9squm6NfpMh2BSrFK#Fdoap!vHLh$Dk<16f*ZVxOI;hZ?vw9_a1hGnyQ zq2KmZpVMD%ed{N{saG|goEG7Oleh|=|AX)>FAYlX2bi=&KJ0ad9yR)w@8p=1z@f1a>{pn61DiZ58spOA+Sa=6-^|FsgGXxmIT8u zFuu!sHKq`I=qp|CIH5z$k*Vf`G5Wtxhm1JtZyGYyRNZL8&;eCd&yEG-f$OKPLV#5BI+Tc zC;=MxWb=4byDx-IrE)kbZtx?0;%!@QU;;ru`)(s*Tm~wFsdsBbI#zQET(GOm1p=Tr zY(~ViY>bnUMD~H_7L|H0-QCLAlEdpOeNQ!CUaEu41Qk&tzPsiQz<~UG5dmtz7cpA7q)2WwbGB?%P}Jgl9ui4V=!J1-WwfBix_f zGC@AMxCWEaL%%)Ge`gyS5D5ktvremM*qcuVt;JIc*EY$)+5=n7V=_c3sn9ruObpd? zG$U?R%f z-5?*J;QQ1A3$hgQuQ#IS>>iAJ$(BBRA0g~8lBWb^Mds=RO^D%mrR?Fhv?D2yU=t7T zw)Au|u7D86w*&}<>zL3j5^n~85wiu5YO6#Mdlxvg9b=N^XoijyY_JKyU9<5l-+GVw zJ$fSYqP}q$n-L+}Ub`A2P`(%{{xV?aUA$o-p%Tl*==#;;$A7Os^hyqt_7??{ONSs^GOc#MGItklHWpfuS;P|bW)6)Hwtm`;?`18 zv%&;5%HQ24+X1!%=V#TN5z(ol;cW}`RXd4Gi?B?;c;7x5QmA?ot^*9RvP}J)=Xl%%LhA=-X z{bB_RJD|GJ-%tH|c<)rf#mb?na)z`EnPNe5*0$qEpoDP33_Am!BtBQLVahW#o*Ig>T1t$OxxlWw_uCc(z>D;G9o4{Zt<>OOsQ;Y%54|Wz+yUxp| zpP}-t1BYQqMmvNe z4@%X}O}3S+$$yBv#BJw)Jz4BS-<$uTRLkzwgS-Q;_}f=XiB<`4c8v~}Q=K38LQBTw zkyIXS=*7yG{BD<=AX;DRXJWW=PITYKiN?v#z!|rnh)58@)F3=I`SM;11Qgip^Z{L7VH&s$5v+1? zUrg~<>WlqYTarG4e!y^2u;X2Ir$7XbX)j^DOfm|H@*ad#x#R}mBRtZzfAU1iw~L~h z`WV}!$bUvZ`w$Zl&_Umw1d0|}$WjPyl3lER)GOkmnY|zw7fRo??kDD)t8>wl4ke#R z@HPke^PaSqa~GFHo7{Hfo%He+1B!Zlfqk~&$lI1pC;?RS(Sk%S+Hzln1c`{?zLvhH zo|m|j$?jf|!RsgYu1o|lYf>b1P@+#;HJ6mO^8iK~H4#p*bW8FY(`(rGGgy7rcUKOE z!nBH-L@P`1$O7X9+E&>NeATtIN1nw>JI3;WBgT!3juP>qBSSz>`#KsIUB8shrzJrk zzo-fGH**H;@g<98Qf9p4B<%9%VOXLx;s~OMRC32pn#B(702c?Fbi@ml8^Cf;&7c6c z@5c;UCP00!j~LTwqH65UW1L534PF}`+w{g8fY97%BqtL^ArIBSW7XW5)?B@OH#qkW ze)Xq&2)`(os+##h#msM_0tOZBYb{EXSM-}@xBFL3LL>7beYSd;xpspO=2I8eCEaf! z`e!Z=l;Ir)9|!fn;LHYvGl0pm9;s4^?AOI3N#3nZr%rmwa0rWG@eddYq2b(+6?Siz zP2-qWS4pbJ_clL=l@)Esll38=*j>JCr7FW-b5E%aUyUVyBuKm-IyM%{D93Ni8_gJC zlnb=wc|l-Jhzy#r{UQ;CyB2zyyq@rR*UG=hpfhwklFxpwykB$XpJl4JMFG1TyXhAL zN8tXWFUL|;cr|ZFlw58`L^rOw6xh}Ft#p;)XnhwQ^%V{T^85IPxC5>s1=ddNP`;3v z3s7>qQumE^yDzeESKN+XlNhhHc=&k1p-y>vlkUx5Oj#szSmQbp@N91`LVK778gZW3 zvz`%1Vo){EWneB&qtex~V}rjaY0CH33g-3E>uJtjK;8+=*2oM6wG9lzTe&hCyzsTo zaLI5>y@d;j{78u&V&Cch0Jg%XR!7R)f(Yx=VyZsZOT^G$x~=@Z881y? z;%P(iM@B4dmcmEdkEg2FotoY#Q5@-pLzjj8=xQqkrHexx{{9Jl0W%uBV33I0j=YYL z!>4`gLalm%P5^r-yqhe)f5Q8aG+B(UG5eTgcW3qwBlqQS$nT(?kMk= z$TCaL23@-Q(M=E{^N4VL{fHyC5e9%7#YruOu)_3hOni15jl1UUl(xckS^stG6kr?{ zV7;W+l!yNYtNV~$ht$MzxR9F5hm%5Fs<)8`akyiKEHITd0U2w>0>sP@HLH7oiVKab z4N>ji(rkDBj;;OV87>_sTkUi#fY4ro45c!)ZlA_!Oy;wEg`h;8re+8Kgs(Amo*>JJ z0Gsje*A#8-L9_4cQ;5X3?eh2+uFR)i6?|JYd~dw8wotGnu_Et8t?d)}cY&)b6}{D~ z%3rpjw%CM0{s_4lRhJ1v6`B36u1xRX3}dk*Vq)p+N=}+RJRIpiK^TcFJG17hsOAnv zj9P5S@h|W`3R1-Vc>jZCEL?yNAPwv_j1c>mwB& zp8A!h?eTY6;<#}O&4OX&apGnRO5L}9Y<)RK#1VzXB~fs#v_mRYy>Sgf6?_vzgh9)j zarH5aAoz5tb_7^{W56|2KsSPt%h%pgM@RSS1W@TbDr@>p4fsf&(^(U1HYmL(d20du zoZ~T^W=i?azekYr?Hx8$@?6Exp@N7;%*t6tD-j|&@f;AdVvbl^1+h&LUEm>G_6R&XlU%{M-R zH~~692~5w|u=f7J=2Uo<@v>39Y!ZQtxt6xX+`+_2%GR*Fhpff{*&j;`dC+oweg3O1 z-l_mj5!Gk5;BNDJ-Rap`>c=-&BG|`qQwEsxfS6iC{5BX>(4hW3scN+P zVoH&|-F7mKqM=d$gX4Y1rr>XFMKbRc8WZqGZYg+n*d`ULEI9Xr=k;xn+=#PmM(n)% zw=Dp~k!kI13`((l)g7Ms57;9XaH$3vxZ)D;!WQs(OYUX>oEId6{aet~RWoXOH(u4 zPXT_0?cs(xX32h?Rei%a45(K4)qc;d+u@;eOs@N5p0KW~Wtp2WnN8I}m(ssZ^N$WB zUmB!g^e!x_j7E3jDKV;ytR=TKJavJv7*s)3YxYwr&QaV_-a>eb89$+l`*-pd&Z)_# z8S=8$X#hajB=Ad$dY}HZi;AtzhX8f|4{sjn#sya5_9fMQxCX~Y^wnz78%Y9j3Qi(4 zP9jFxkfYzNV)1Z(f(*oegXSN8p5W?3{;#sL4yv*X1N@~VrCUNmK)SmH1SF+9rMoT- z(kUS*N+=~D-Q6YKDR}`AkZ!3x*Kc=cc4zjFb#Rzr;J)WQ=gD)P^LsK`S*mE=z9_tE zM+<^-(6dRzD%@=vtt>p3TjFf%DD{t5DL$UpsBh4r1u-#mAiL$tZ&Cl|`qwojoOB4D zj@tEMWLZyJEqUIbIR(VWi|ayEf&G$QrD9SY=x0C#3F%P zt7ymSB&t_#Z(UF)rR)nE`!;(cop)t^9f;YTi@0~aZe6&7fZg9Q24 zoYiWW6y9J1>vR~6_BM~SIhng_r!1*WV~XHho_~-r4sAewnvP|mb(QlndDf1U(2D-3 zOi8s&ItX7qBtAoH2i&ro=dVwOg%znA=@LhQ)= zcWyBA08n*0KQ@nbecK$8H(tPDAn8aY|DrXWHtl&$petci4SQ_JkWZrN?#Gvr*a zpb_TNk=*a2f&G9)%p5;>UV#i5n~imumSZXlttcAwzhxGwkyf|&IxA;FWPr%tBxMUPoDQhd0o!g+_qkl|fD?`oFr&$%yamkfVVBR2`0p+&qzl9D< zv2%$Em>#L^A~G}q{vxsz6ZcaVbl_<`?6nyn^pDi|<*@k_Q0%IMyPu)VeCSBZg;pVe ztFRroIoNa*KDK3H$uWIi{(x5ko@&XaKABd&h5?a+Nk!#{k2ejkGE#Xp?&rA;kbf;s zi7N;3FlfU;o`#GrnDq2}*tUsx8HlXFR>qXVQ&2{$0wwLne=H34$V6<8ZSDGw&%|TG zSl7U*VH~rPR>?65x=X$+D9n=!{Jggv6XAvR<0Q+5mM9vFKz&d-@m*rSInmLCS0W?UhC{f?~4q}F5wgDngyJWU~- zy!&@@1)$rnHC52SJ}5Yl5G8J>)JS{u7zyj+*&#|^KI?DUd>H^p!r+0K)rtVJb-YPn z-k_hMLE-3k`CzmQ*gm&5AN1?YpFyiKTfSoQc6*6I`5PqEC+k<)ZCa|+9!3_;??EdL z?V48@5|{;R;37VtHI4GIe6gmzg1<0g@KC@Ui$a1KHzE@;2sAc87*48{_UqzPMG8t| zSqj+20o${Pkdzsy-Z0FPyF9;ut3l!E+n`Si;3mqUs7KfOFBV7JSu;=5*vMIr3*1%7 zwz_!$|0Ody6k>^?)Ev5~D#I5&chvsF>I^7YGckK2GQ^UXV{<9fSE8t0LGY{yp+oDb z&+HLJ+y^{KY2S)$T=H<*3B_eBG?JwqGd)xJcYByJ0R}pC#fHCX{fKRjMvDuv;&NtG zm+w>XqZ(ZEKa>E5myhx$D2XXtte1!?*t;VI8)b6MGjG9}XJ}PWSv7_PQuqP2o2S5z zYBA_*0Frgp9@q zJMO&Y7Zhiw4mfJrO>=JGAAr1$bOw7JfihmeGg{SYxm7ArMJ&l-fnsh$+<({jV5n`~ z)d}t~Bs{zENqFzj0eFi1UkXok`?=I!35LH8qaH+LKz>drw2#RR{9iX_`&CZtLNQ0^mXaezRc*BIZX40!^u>>LkvkY_b}WL;`UvJ=V>m zrr_vernNPnc4QqHl#;>E4ylYfM24P#{CZ(%zVaAKIPh;8yHL#s+_L3v(buK>CPjLu z5+aL_mvCOnp2Gz54j)EB7Ja0|dNH_c+&~uzIO?jUp(>1oNik%#Gl-p3qD$uSP?g}E zdBno6p7#1I>By0{50s^NL@pQHA%D`8_q8c>gd&n-MY~kAl>XIkbfNxm%f^D*oh4Us zfL*M;Hg@TBHIKroMt2FLxuFA7U}y<3WijnZw7o92wVIY9Sq#*s?68{>lL#_Ez+V9~ zB?1Nz6c8!LHoYTLG`q;&E*#;HgssLVR~%Fb zgF*r^SdWM5zcf7zXFPU*Qbom8yAnaq{L&pO>+Rn<}p>m1lrWYRQc6>Ct^WH zXL5rn>u*K>BRUdxb7`#W40{?5I;c)h?%K@-2?_b1BW~se_EB0ao|n~R~+{h zyQ#@Kx5(+#1{Zz7E9B3tUV?hWpsLaTPa5N^-G~j(oOi@tkp!SJ_DgU5@_Gt5tw2F& zcu>+2z+w+w&=@Z85SF@jT2mnXNg+5hUgpb`FWAa}v#^j;R4AB*Q+T`g5?J<85BPsqHg5(xU3LeHgz!zU1Jat2Wuu<}tfP3!-pvC$@+K_K= z)vi$oI0A-&GIv4kQhu*eOcNQ4){eV@MrpB+#b(WX%JWvxoI0(5CyjF94ltg~14rj8 zH=7yerAe!1q!G%x(Mqv|vgq@W++}c|1dv0Bum+SPREA6&2C)WpLt={v>?}$nq}0E$ zxVKa-#C;K7{*ZB#j8gpfSy0)+Ghg8GLf+_sYgxfn`iJb&5oZ2X^B5u~M~LG?{4mR? zj+w6o*ZLGHy$#|*VIj9|WOv8KJ9iMs%dy&qk}9cNZVPDD73eP^zUYMkZb%7E{buKe zezEHU;C-9w`Br@rvFWc2A;|v?EN=h(J5a>=bU<>ZIwi5s5s+yH%IX_yM(q=fgfdE4 z-oZOJ{K0_bFWW^buSsZY)I|~~N+WoKJ8B#cx*`14Zpv-g#RLVr&4yJ{&ym^E4)1xC zz3+nheW2etU^u^p%YgodoFNnDF+SxJ#|CjSsBsL*8b6y#B8PV^1c$Yv`o>QdOLB@Q zfh4BKejqgc@y{@49{0(=h$gzu@qbOl4s5B&OOBWr5=*8t}9{t!{4vJ z=To_Bqu2h$bRlSH&+I86po%)-&j}#fg4P;GlY{uID{90kJ}u4b^q^T_qqeTYJC*Ep zpL7o4SJU8ilSV$5Cim2N>Qc_TH{p4aO|aA#1B4*hh$iD>vl4yi#&Zx>XZ)M7*F4nO z*o^QsznaJ(as&aKYln<#_pJDc>c34JRPgjX5%MjYDMnF?=hSJsAd1g=uhoz}m*PSB zK+-%Gbzw9yUUsz=g7%-Z%luGtLplT((LN{ZgL*)wa)EUT167n7>Y_BES+aBzn{8s- ziOtl=vGr;r>!WkyPm2-U&A#rA&&5{)$%7tt1i?WgtBBgOzlOSgYEd--2Fk^Hl_jzG zuQ8uOHa+UxHkSso67^-a5-~bpN*}|IQ3qTx%#gq7Rkzwxcd`Dlm~otUX~F)fGC0Rd zj~EHxIYh?8&0+=R6pwnx>aza0m4C;h&r0kgyocV{rfJeY`N0JMRS&1fpS35f4Rzkb zQM2X~icG0ymGhJ~PC9l;+vW>z6(oniEMi*}onO>@j7 zrbZ1_K}rwpRUqp95G3k>4R7)R&II2`Y#Xj$n(#u}(-y}{QI7zbw!yKx;|*JY-GHebi%z|XAZEm&0v0xgH_pcr<4n&0qPY#}3U1kL^y#F-7&$B@AltGd< z0+}=Tb-Jb`m8@gs)>Fju`OsdSA}YlI|Cu`C?2BnTF>M3Cui`IRX2pX`IbukqDk7em z@l=(Yy^;=gNDL^uOc+@Dfl0P2anXgF63!zs&bl8+ogjzZcKt2s2w_a^D=xU1I-Ermr1A z`Xg7q7o3grYePX`7|e?$pfRw{ZHf zwardHRIO$vNxKx4G>-)?HlW zEFGYMxw7C%+{`)fNkdEOX*7tD^;7D6~RdJJsMS;rG^K@ zQNzZ!TIo3Tdqn<+d-%79D*(=wCc>&c`#iMJnrf|bvP@w1zy_OfEvvvgx0Xa}gKxNG zs_39CuwkZ_gUTdkU{pRZe1eQV|~az8c`JreD1lq=Q8PTSVsPM{PuiB7;a)~q>w z{ifBQS@vc3_xhfn5Xctag z;g*^$CgZE1NSDTMRG!A&yU@HvJd$6=qOXmof*+RssQg|n`cm8oOQhUxy!!^^fKhB& zRppsNny@e;HA%DICCs5uWjj}EP5`<{fFhZtYCT^{>y80C4qsx~F+OS}iQfUi&TsA=;*@N0CTg~zBS{3A4Xgs#A z`*H+|0iy%0x_Sw)*coqUD7y5WgJ$4Z7-{czZtk#}!hv$_%a@^Jt(L?yQKkTx;sk5B?>u?U5oCVq{b0(LAFThGU$ps3HU9m@!w6x?d1Tcqr-$E?kcnqj&RA=#Zzer1cNmJVtb&D-d>AoQP?ITy-rT`_*%KixVB!A!`=Cgr&sUlFWz03IVe}A zb1@H!2~5l`=6W^OA#en^A*(Kbih0N=OzftH03}npuU;v(94V~4IRChFO{QZb?iH8nIL-Tp$y3M#udxtfZR51FJ zZ54DEeXUCS7gTHKAjO>!HsKh~>u&v2DPI{$OCwE2QAgRz`i18YKB7SzTkqS`R2v(ox3AEAXb>Uu z1|)(qKbIcPNvL8uv~vqRqr7TV<&Wq3(l=6Q)QYt`ttM+Rze8Nws;~>#S=zr{qJ2|L zuIRBRI-A*Zd?KZ)fUP5XICmMRb5=4!e&}#{E<7anS%v*wUAjoiuc2z2o-b;l-D8)diO8cwwD8rH;K%O+oUz4#%7k*~H10T!Zbj%;V1nR~xni`w^=B zy;p|=rx&5ou2FU5m0Jdv8NIlfH#!B*YA8#w+ATZN%yE}Hj;~z9VC{$Gu_OZ2+M>o?IQ+Kow%|_D*C(L%5SxFJ&J*R2 zTs$;bjTV%d7xxH~7S)nYpDC|j4sy|q#u&gHnTnkxWgSCX=HJBWaF{uyRW94J+Ahx) z@SIk`j-)1hHsfpS+rGK!3NP8GR`#DP5w^hi7|$O3p-LZ3B7NT>Bt}I=l-w}(t=E5{ z*qLozX;m;|C~dI=eOqymAg5Iuu1Eev$idOkX3I{I3I&~x7PPKaIm8+->qmT^kXZD( zLlZ*f^1G_3iCMA;-poRU+m9~NbG~X7b22j{Z{(D^CFog?AuM4kI2d=@9#2~W8;=&| z!f|x8oSaX$s$5M+(-kI|jxLu;UZi5`9PL+It<8pFc`R!sO$v-H-l8zh>jHJN<7xWa z{bC+SFq-=f=vGX6bo!~t1^x1a6#Du%@%qq33%H8W4B1W7j*!LB8H)vIynMM<{9cFf za#@&J8c!D(g2HSzh;LUa&=KIY*tKWP4#I4fY~0qzdk^+`1e!zFRa8w+Db2C@JlZ^! z4b#w1t8S>ArkT-)+@0N=8K*{$P#acr3BOP^4$rpY1SH(-VXhJ_2?$AZU49^?U@J|E zObhTqUCNr4S?-6(%g7*XiSM$wlwYc;;O~+fsLf3yX3B*x{f>FFk6wI zyhv8B`%T zEE;|JkZiy7`2b#8^3w5z$V$^LUjB+1d=7$N7t`}zy09dbk$Tz*ZKj=*4-dt>I1XoC zO2uP~lz_;4M!;P5Ty0&=7)qK1C`nlM)+_2H0@=q4;%zmVZ&^7|g8hD^A%=KI)jC}+_kr42s1NNNp6Xcduc9%R*RgcbZ}sT5cKkg&(M=SG)em(U)IkB zVt}-_WQ8?lh4q$szcbu(Dzra#&#jB4D!Ql7zMC5*qkOAr&D568&nZ<{Ox1X>dr<5_ z1ZiFzOY}|n_gv=5rNBEfK_luUd30 zTqVoe%*#YXi+6`8kU}KFAI%tEj+dUUnFtlDoDh6Gb;;hybWTqXJk|{}S4w6XHfrrZD_^+vyQ4r zxxOJ{l2t2=H|Cg&cvul?u2|LlPB$G-;xl2n;G3SCAC1`zi&kp>2X|Q>wTG;_>KU&R5Wn6a zv2r}B9E~&6BF$v;Hb@>B+w1L3`YG){AaA+ia1^$K~`d5{m=s~yRuXzHL#xCB+R+1&oHtokq z{q(FjHsY9E5Pn~%CWi0l8dwUwZY8r)an~nAI9M6h?X|a?W~TR?!2EqfnMi-R&;rd{ zz?+P`drUy56on&TrkSG0RZ^Brza-2|@f@3{uU9vbbmF2dz?nh^a#^rmJ4BC%_xMTM z>43lAM_5-}%+c2J6A$+cBGfS*&l~$^GH0wVZ=OX+P5FAc_?Dn}#bkeX0SWVxSJO{q*2_ecBOWpUNmGn!v7R%(~N|*3>$U zzG3T17;Y=MaP6RT!gky=lfUa3H)M+{lE0iLuvW3FkcmgG)~YL+MZo1^@NuKjbPy>d zI;zmbX2ubHd^H-Uel^d~be&Rs(&7$PvRM7+whIbVccF1^-x<3~-tQf+x7xYHJg;+2 zC%?O1z2^JAm!1eilU*+=4m{LRcuR(@RZPDW;O>vghD8gk+?HTKG&_%qd9Nh+6| z=e0g|lX-HN75SU*#}n&Fl@T(#yZCO^T^C8t>E1%1%*I~R5a#c&r2I~; z5jsx5*$NlZ%>JK|B{szfJWh7)rLUmF4bL%5sLCb1lKt${LCOh_$9F2V^Mqbh?oDfD zlr^ku?Oi=l;NO{cdz!f%y0JR!`8fW;ThB*8__@O8G4|7}BHUaBANR5FzaEQ!k)8`ss`eJo@tmOGhF*^R@}S&;RS zzeKU4{Iu2NI;x(lo9XUQpjS>m(y*iBZ$)6ir623-VlCfzO5o;}0SCMTx<6>)Um{S* z{EL4~rSFjO3bYa?zek9p@S0e)J_2hB=(=)YpFHmHd0YI3e5bgGsdBn!_TpO??VSzd zP`EST`Q7YY4Rc^ z9-{(2@9sLKn3G$Yx=$`%r4g$sL&g{aBQ_WS3E3c1?PwQszv;##2vVZ%yLm`AUt57OTKn)9k8 z`KNyqu3P!ZBhBv>*4gK^-Lfk3+CUvKRQ&oCOsdZF^2n$tIiRZyYwnMV91o>e-NS4* z&2Yd&@DN;ZRG-w?^+r?ha--Zmh_~MV-IG^T4CyrO06dxszsrM8Cwx4-iLZ(D=*Q~} zX&!&5$#+78A#H#Y;(ao}czk<0W^uUEn#O5{Xf>JTf@MAQq&+?%lwSL;{S)m3 z1>~Y{cc$2^R(~tu>gwv>*zwd8P#hs~adBb#rE+?DpJ2yTRosG^D(z!Fe|HMhwX~iE zWr#qXo_Zc}obWakBupqR?et`0oW0Od}jcO5D=0o3zEj`<&(H z=QnJ9FgOC7ni>OAY4AwiWO->cuK9SnFkdU|>q0{QQ!5q5TVrnUO0&19h= z#lbfnTW;&H-dME9kHhH|5d4;RckO!m`!|*v-KFY360vz?_x+Bw8R` zKlnm~kirERl*gMvC_>JB#j=9#eSV++?Q|Lp#{9MTcCGA7ZS{pI!Eh~7Nl=9=9@>Au z`%fO>fAfF5=)ZU>is=U@1X~JTFqoX2Y|2T>`DT#t59rlakv`2>tW(~Xr|=$^oE)Qh z`5ov$Me;I%N^42O#3TVwGQsR1T2+&+KHOibYioaND9Fo026c9C2P{LDo%&;lSjLx@ zL=*GR7688QsRI574ik0>{z?0Gmvuxc|05|d*Bv&zv~+Yxeiwg|$}wq+6x!a*mGsk{>7O*x1;-FBYtmGBU7oC!!{D zUv7kx7^`K73BR^mt+YUeldF4rdL)zS9Tsa8T*cHpsQ_@Pe%b2@)*~d?#>VmFD~@xh zt-BZ-u(dw_)ko=M`j(SHmYDuX z_q*=TUuoXl{XLg1n2N5opNnyBzta{y`9arZRUHkayVFU(d?Z6iqr{+Ig^+|K_U`5~ zw)vpx6+JzD)Z(K4br$%zn5!%AB%lQse-`MRTF3wXjuB*$Wk}3SG z&S8NT02^smtF1=Jfz)Bi-g)EcDY2C{QkYHkx{1qSczVB4gB=PS%YfyE1nijKw$y6UDToQnVxPKLCG z%L9nll@1Hs*QdZ>;SmtfX_p&|MU`TdoSe8JNctc5l1QUn;wY4Avxo!G`*l`#Bn~Dd z=j&HVwDo(M+}A}iwzft7W1t?DhLt$h#>R$p9?>`Z+c&wqyu2vD_KX3LrXL6{d2?-U zTZ&u&g@#?;Y{4ZycqwvSIXI}8J-62jlz=e|7dD>#0x|gN?_T+qpZNWi1&u;- zgUh<~17BOhui;O0fwvpfEL6?FkoSh5V20t+)qAbt;uZ=&oE1n!S5$EJu3o3I=)?ef z5?EGvBaA6Y1=z2|ke-EV>u_AU0xufjvInphwEXY z$ivSb=D^yYuN9J+y>Bz6rwc+)zZ=eZje9y zamSDHKnOuL9;ibozUTTce?F zo4*i{@rbiC4~V3#?Q;*|%v+?1?&gEZ$=B_NvD=Gkb%A%jf0mm`fVMb69rNY_cc-7X z0BE?pf0RbsCI=f^__C9Z;hYUG8V(NitH`X!DInh#-zK@TEeq7s0evA90j0-8g1 zT&v-ytgP(4_7?SNSO<`KuK5u%Tv=IJ@ADa*O6Z}nd@}F+2o3cg1PWjN68(9T^J?I%XCYqD#NIeGlQgHjXU&7g`{; z7#tena)rs*@REZsxE5Y*P(Pr>%OOQ}bD7(t2LJwT6Zb?w<#>L+(n9_9YsCMi7b={| z#KECs=2b%RU6SaBz{Aa50Tk)>kF~^mzmS)1aJkubxreTy2U(A0_0Eywy{76SbBXxfbz4)UidOocIqANtssy*smQb;6jrb;9rGy(?qPy(1p z@STp4(HhraRzMm}^kUv(zQL7F{NdJ}o{^EI%=*n6u%yhp;=X50ii(PxP3~@PMjhDeag@_kcbaXT%cyrSd zL_o54Gcz+xtgM>TCVG0&IXSe~Spct0!Tu3bHtmMQtirs8!y+L$!FIaU^pjY07yuLj*bpH9g`pdP8m-~NQjn^@nze=0>;*;$RXj) z3MiG2#JYfINEPt0|SiJSgPjFre7o9)7Llnv%_J&LP|zX zF6PU_?e>WnUH--A&*YWPtK#tg2$C(gCxCg@7I30CCpoPLoC*bYq;7*tHWNELF$fV! z7~b2C*CXzfT=ezHxq{O7sD=i?%Akk9-Z6U?(YQcTOuHphF?%tLZuhd;;8XgacPg94pJJS0w{H1ePV4n6{A-Tb4Hr9X>>? zN1>#Ab}8P!K3NmCU%gb^2ReFsygl9e=-o*Of z@#g;{b_6L59ts(J3yL=9X*WpIq#Tc7y$!(ogWwqCY%%au`d^fZuda5rE%6WyO2SFw z<-kLpa&X`PweJ8{Hy%gg7B`t*3dC!xZIlofxHUZLK&n`90M@r3#L=$5hRLqaMa3f9 z|IU=-5)q-q_J)8sDyOp2)dho|b{Ap9R3JF2u-&N11O0S+tp629YuL>}GY%gg-+ZGx zBRr-{NlE$I)I<){3JDSx8JSyDgwA6wyg372sKCOh3GmnTBt>ksq@gHHH29WwjLaa3`;%1PryMB?J;D zM@LRhzUCpkb+hWTP1#_`ehWH8fYbosc=l#Ht*Xs#F7_KvM@0}IpkILfTv_;lW!Kg5 z#xbz!5p4lfN#Hs4BQL21T_B7q z8Im?OOv6?@;H#^eW9P8k zL}U_hP9%PJrqOb-Xb+btz`y@}c@KhA%QtV<0sY(&%Erw6y*(Yg?jaBeCMNmhFx#nb zW{Wkpa9n<3T3Qrnzyadm?EHLL*TbG@g5&#}!)~YgZu3fytIw#|6p}_plwdmk^(Wy> zABjpxIGodm5937#7zPnBF%0;(o-8pxwb!ph9zWqa3#rD{jk0$k%m3TmiII$^(!$#5tHm{-?3IAU@^#84ZpB`{N X@D161rT>Zn0sj