From f85638b9ed66dd365624284dc6c8dc19926625b8 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 3 Jun 2026 05:09:13 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: mlfoundations-dev/nemo_nano_code_300k Source: Original Platform --- .gitattributes | 56 + README.md | 61 + added_tokens.json | 24 + all_results.json | 8 + config.json | 29 + configuration.json | 1 + generation_config.json | 14 + merges.txt | 3 + model-00001-of-00004.safetensors | 3 + model-00002-of-00004.safetensors | 3 + model-00003-of-00004.safetensors | 3 + model-00004-of-00004.safetensors | 3 + model.safetensors.index.json | 346 + ....out.tfevents.1747065198.jrc0930.1144863.0 | 3 + ...s.out.tfevents.1747151728.jrc0914.177532.0 | 3 + ....out.tfevents.1747326457.jrc0913.1643946.0 | 3 + ...s.out.tfevents.1747412990.jrc0910.965145.0 | 3 + ....out.tfevents.1747499580.jrc0910.1185976.0 | 3 + special_tokens_map.json | 31 + start_end.json | 1 + tokenizer.json | 3 + tokenizer_config.json | 208 + train_results.json | 8 + trainer_log.jsonl | 1679 ++++ trainer_state.json | 7252 +++++++++++++++++ training_args.bin | 3 + training_loss.png | Bin 0 -> 39178 bytes vocab.json | 3 + 28 files changed, 9757 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 all_results.json create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 merges.txt create mode 100644 model-00001-of-00004.safetensors create mode 100644 model-00002-of-00004.safetensors create mode 100644 model-00003-of-00004.safetensors create mode 100644 model-00004-of-00004.safetensors create mode 100644 model.safetensors.index.json create mode 100644 runs/May12_17-48-34_jrc0930/events.out.tfevents.1747065198.jrc0930.1144863.0 create mode 100644 runs/May13_17-50-53_jrc0914/events.out.tfevents.1747151728.jrc0914.177532.0 create mode 100644 runs/May15_18-22-36_jrc0913/events.out.tfevents.1747326457.jrc0913.1643946.0 create mode 100644 runs/May16_18-25-09_jrc0910/events.out.tfevents.1747412990.jrc0910.965145.0 create mode 100644 runs/May17_18-28-14_jrc0910/events.out.tfevents.1747499580.jrc0910.1185976.0 create mode 100644 special_tokens_map.json create mode 100644 start_end.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_loss.png create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..a4b06e2 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,56 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text + + +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text + +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +model-00003-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +model-00002-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +model-00004-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +merges.txt filter=lfs diff=lfs merge=lfs -text +model-00001-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text +training_args.bin filter=lfs diff=lfs merge=lfs -text +vocab.json filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..c9965d0 --- /dev/null +++ b/README.md @@ -0,0 +1,61 @@ +--- +library_name: transformers +license: other +base_model: Qwen/Qwen2.5-7B-Instruct +tags: +- llama-factory +- full +- generated_from_trainer +model-index: +- name: nemo_nano_code_300k + results: [] +--- + + + +# nemo_nano_code_300k + +This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on the mlfoundations-dev/nemo_nano_code_300k dataset. + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 8e-05 +- train_batch_size: 1 +- eval_batch_size: 8 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 16 +- gradient_accumulation_steps: 32 +- total_train_batch_size: 512 +- total_eval_batch_size: 128 +- optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 5.0 + +### Training results + + + +### Framework versions + +- Transformers 4.46.1 +- Pytorch 2.5.0a0+b465a5843b.nv24.09 +- Datasets 3.5.0 +- Tokenizers 0.20.3 diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..482ced4 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,24 @@ +{ + "": 151658, + "": 151657, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..8bd8a3a --- /dev/null +++ b/all_results.json @@ -0,0 +1,8 @@ +{ + "epoch": 4.999242079733212, + "total_flos": 2.739131934768418e+19, + "train_loss": 0.07882811409755817, + "train_runtime": 48155.7887, + "train_samples_per_second": 10.958, + "train_steps_per_second": 0.021 +} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..a916f0b --- /dev/null +++ b/config.json @@ -0,0 +1,29 @@ +{ + "_name_or_path": "/p/data1/mmlaion/dcft/hub/models--Qwen--Qwen2.5-7B-Instruct/snapshots/a09a35458c702b33eeacc393d103063234e8bc28", + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "bos_token_id": 151643, + "eos_token_id": 151645, + "hidden_act": "silu", + "hidden_size": 3584, + "initializer_range": 0.02, + "intermediate_size": 18944, + "max_position_embeddings": 32768, + "max_window_layers": 28, + "model_type": "qwen2", + "num_attention_heads": 28, + "num_hidden_layers": 28, + "num_key_value_heads": 4, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.46.1", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 152064 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..a753841 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,14 @@ +{ + "bos_token_id": 151643, + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "repetition_penalty": 1.05, + "temperature": 0.7, + "top_k": 20, + "top_p": 0.8, + "transformers_version": "4.46.1" +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model-00001-of-00004.safetensors b/model-00001-of-00004.safetensors new file mode 100644 index 0000000..d343422 --- /dev/null +++ b/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82f4073a28450edeb7a680548acc45fecc0d2ff2d6ad53ab4a2766025139800 +size 4877660776 diff --git a/model-00002-of-00004.safetensors b/model-00002-of-00004.safetensors new file mode 100644 index 0000000..4097554 --- /dev/null +++ b/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8309e32dcbc3d1a072c6697df413c93d738611fdc1135feb38dc4a41b557ba66 +size 4932751008 diff --git a/model-00003-of-00004.safetensors b/model-00003-of-00004.safetensors new file mode 100644 index 0000000..8c33837 --- /dev/null +++ b/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09c24d59f0b88ba6bc3c4528927f8c57a1e8cc159dea981ccd402cd07b464f8 +size 4330865200 diff --git a/model-00004-of-00004.safetensors b/model-00004-of-00004.safetensors new file mode 100644 index 0000000..1e0bbb9 --- /dev/null +++ b/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb5059a0aba439c96bbcf7b864fe8504e242be4f42f5207ca66871755cd111a8 +size 1089994880 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..6ca5084 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,346 @@ +{ + "metadata": { + "total_size": 15231233024 + }, + "weight_map": { + "lm_head.weight": "model-00004-of-00004.safetensors", + "model.embed_tokens.weight": "model-00001-of-00004.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.18.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.19.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.19.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.19.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.20.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.8.self_attn.k_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.v_proj.bias": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.k_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.q_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.v_proj.bias": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.norm.weight": "model-00003-of-00004.safetensors" + } +} diff --git a/runs/May12_17-48-34_jrc0930/events.out.tfevents.1747065198.jrc0930.1144863.0 b/runs/May12_17-48-34_jrc0930/events.out.tfevents.1747065198.jrc0930.1144863.0 new file mode 100644 index 0000000..cbc930c --- /dev/null +++ b/runs/May12_17-48-34_jrc0930/events.out.tfevents.1747065198.jrc0930.1144863.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2285e28d6a703437dd5f2fb1ce3f3f907b4797cd10b425c70f6131e47ffa019a +size 82645 diff --git a/runs/May13_17-50-53_jrc0914/events.out.tfevents.1747151728.jrc0914.177532.0 b/runs/May13_17-50-53_jrc0914/events.out.tfevents.1747151728.jrc0914.177532.0 new file mode 100644 index 0000000..5a56658 --- /dev/null +++ b/runs/May13_17-50-53_jrc0914/events.out.tfevents.1747151728.jrc0914.177532.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1297f7cced014342ce106713be6d56c9a7358dc1b7a51dcaf1107c75dae0e1e9 +size 83219 diff --git a/runs/May15_18-22-36_jrc0913/events.out.tfevents.1747326457.jrc0913.1643946.0 b/runs/May15_18-22-36_jrc0913/events.out.tfevents.1747326457.jrc0913.1643946.0 new file mode 100644 index 0000000..50692fd --- /dev/null +++ b/runs/May15_18-22-36_jrc0913/events.out.tfevents.1747326457.jrc0913.1643946.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f788fa05798ddd111ca270e5a65920b52db44d7d23b15346b53f52ae226a68 +size 83219 diff --git a/runs/May16_18-25-09_jrc0910/events.out.tfevents.1747412990.jrc0910.965145.0 b/runs/May16_18-25-09_jrc0910/events.out.tfevents.1747412990.jrc0910.965145.0 new file mode 100644 index 0000000..64476a5 --- /dev/null +++ b/runs/May16_18-25-09_jrc0910/events.out.tfevents.1747412990.jrc0910.965145.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eafb01f86b19a07e44bc74b9ac0fb1c3f69716b34fe30dc3050d58ffa1d159fe +size 83219 diff --git a/runs/May17_18-28-14_jrc0910/events.out.tfevents.1747499580.jrc0910.1185976.0 b/runs/May17_18-28-14_jrc0910/events.out.tfevents.1747499580.jrc0910.1185976.0 new file mode 100644 index 0000000..436c319 --- /dev/null +++ b/runs/May17_18-28-14_jrc0910/events.out.tfevents.1747499580.jrc0910.1185976.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d079be3f4f68859b9433f7c9a76b2d616d2ac0331b01e9ef86d92868d9bb372 +size 49391 diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..17305b3 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/start_end.json b/start_end.json new file mode 100644 index 0000000..b1f38a9 --- /dev/null +++ b/start_end.json @@ -0,0 +1 @@ +{"start_time": "2025-05-17 18:28:14", "end_time": "2025-05-18 07:55:47"} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..51ebb3b --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..b84f53a --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,208 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "chat_template": "{%- if tools %}\n {{- '<|im_start|>system\\n' }}\n {%- if messages[0]['role'] == 'system' %}\n {{- messages[0]['content'] }}\n {%- else %}\n {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }}\n {%- endif %}\n {{- \"\\n\\n# Tools\\n\\nYou may call one or more functions to assist with the user query.\\n\\nYou are provided with function signatures within XML tags:\\n\" }}\n {%- for tool in tools %}\n {{- \"\\n\" }}\n {{- tool | tojson }}\n {%- endfor %}\n {{- \"\\n\\n\\nFor each function call, return a json object with function name and arguments within XML tags:\\n\\n{\\\"name\\\": , \\\"arguments\\\": }\\n<|im_end|>\\n\" }}\n{%- else %}\n {%- if messages[0]['role'] == 'system' %}\n {{- '<|im_start|>system\\n' + messages[0]['content'] + '<|im_end|>\\n' }}\n {%- else %}\n {{- '<|im_start|>system\\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\\n' }}\n {%- endif %}\n{%- endif %}\n{%- for message in messages %}\n {%- if (message.role == \"user\") or (message.role == \"system\" and not loop.first) or (message.role == \"assistant\" and not message.tool_calls) %}\n {{- '<|im_start|>' + message.role + '\\n' + message.content + '<|im_end|>' + '\\n' }}\n {%- elif message.role == \"assistant\" %}\n {{- '<|im_start|>' + message.role }}\n {%- if message.content %}\n {{- '\\n' + message.content }}\n {%- endif %}\n {%- for tool_call in message.tool_calls %}\n {%- if tool_call.function is defined %}\n {%- set tool_call = tool_call.function %}\n {%- endif %}\n {{- '\\n\\n{\"name\": \"' }}\n {{- tool_call.name }}\n {{- '\", \"arguments\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- '}\\n' }}\n {%- endfor %}\n {{- '<|im_end|>\\n' }}\n {%- elif message.role == \"tool\" %}\n {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != \"tool\") %}\n {{- '<|im_start|>user' }}\n {%- endif %}\n {{- '\\n\\n' }}\n {{- message.content }}\n {{- '\\n' }}\n {%- if loop.last or (messages[loop.index0 + 1].role != \"tool\") %}\n {{- '<|im_end|>\\n' }}\n {%- endif %}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|im_start|>assistant\\n' }}\n{%- endif %}\n", + "clean_up_tokenization_spaces": false, + "eos_token": "<|endoftext|>", + "errors": "replace", + "model_max_length": 131072, + "pad_token": "<|endoftext|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..8bd8a3a --- /dev/null +++ b/train_results.json @@ -0,0 +1,8 @@ +{ + "epoch": 4.999242079733212, + "total_flos": 2.739131934768418e+19, + "train_loss": 0.07882811409755817, + "train_runtime": 48155.7887, + "train_samples_per_second": 10.958, + "train_steps_per_second": 0.021 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..f298340 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,1679 @@ +{"current_steps": 1, "total_steps": 1030, "loss": 1.0147, "lr": 7.766990291262136e-07, "epoch": 0.004850689707442777, "percentage": 0.1, "elapsed_time": "0:04:11", "remaining_time": "2 days, 23:55:24"} +{"current_steps": 2, "total_steps": 1030, "loss": 1.0217, "lr": 1.5533980582524272e-06, "epoch": 0.009701379414885554, "percentage": 0.19, "elapsed_time": "0:08:05", "remaining_time": "2 days, 21:16:08"} +{"current_steps": 3, "total_steps": 1030, "loss": 1.0059, "lr": 2.330097087378641e-06, "epoch": 0.01455206912232833, "percentage": 0.29, "elapsed_time": "0:11:58", "remaining_time": "2 days, 20:21:14"} +{"current_steps": 4, "total_steps": 1030, "loss": 0.9987, "lr": 3.1067961165048544e-06, "epoch": 0.01940275882977111, "percentage": 0.39, "elapsed_time": "0:15:53", "remaining_time": "2 days, 19:54:39"} +{"current_steps": 5, "total_steps": 1030, "loss": 0.9654, "lr": 3.883495145631068e-06, "epoch": 0.024253448537213885, "percentage": 0.49, "elapsed_time": "0:19:46", "remaining_time": "2 days, 19:35:16"} +{"current_steps": 6, "total_steps": 1030, "loss": 0.9221, "lr": 4.660194174757282e-06, "epoch": 0.02910413824465666, "percentage": 0.58, "elapsed_time": "0:23:40", "remaining_time": "2 days, 19:21:29"} +{"current_steps": 7, "total_steps": 1030, "loss": 0.9118, "lr": 5.436893203883496e-06, "epoch": 0.03395482795209944, "percentage": 0.68, "elapsed_time": "0:27:34", "remaining_time": "2 days, 19:10:34"} +{"current_steps": 8, "total_steps": 1030, "loss": 0.8818, "lr": 6.213592233009709e-06, "epoch": 0.03880551765954222, "percentage": 0.78, "elapsed_time": "0:31:27", "remaining_time": "2 days, 18:58:10"} +{"current_steps": 9, "total_steps": 1030, "loss": 0.8912, "lr": 6.990291262135923e-06, "epoch": 0.04365620736698499, "percentage": 0.87, "elapsed_time": "0:35:20", "remaining_time": "2 days, 18:50:10"} +{"current_steps": 10, "total_steps": 1030, "loss": 0.8779, "lr": 7.766990291262136e-06, "epoch": 0.04850689707442777, "percentage": 0.97, "elapsed_time": "0:39:14", "remaining_time": "2 days, 18:43:09"} +{"current_steps": 11, "total_steps": 1030, "loss": 0.8328, "lr": 8.54368932038835e-06, "epoch": 0.053357586781870546, "percentage": 1.07, "elapsed_time": "0:43:07", "remaining_time": "2 days, 18:34:19"} +{"current_steps": 12, "total_steps": 1030, "loss": 0.8149, "lr": 9.320388349514565e-06, "epoch": 0.05820827648931332, "percentage": 1.17, "elapsed_time": "0:47:01", "remaining_time": "2 days, 18:28:38"} +{"current_steps": 13, "total_steps": 1030, "loss": 0.7941, "lr": 1.0097087378640778e-05, "epoch": 0.0630589661967561, "percentage": 1.26, "elapsed_time": "0:50:54", "remaining_time": "2 days, 18:23:05"} +{"current_steps": 14, "total_steps": 1030, "loss": 0.7751, "lr": 1.0873786407766991e-05, "epoch": 0.06790965590419888, "percentage": 1.36, "elapsed_time": "0:54:48", "remaining_time": "2 days, 18:17:57"} +{"current_steps": 15, "total_steps": 1030, "loss": 0.7603, "lr": 1.1650485436893204e-05, "epoch": 0.07276034561164166, "percentage": 1.46, "elapsed_time": "0:58:42", "remaining_time": "2 days, 18:12:28"} +{"current_steps": 16, "total_steps": 1030, "loss": 0.7456, "lr": 1.2427184466019418e-05, "epoch": 0.07761103531908443, "percentage": 1.55, "elapsed_time": "1:02:35", "remaining_time": "2 days, 18:06:25"} +{"current_steps": 17, "total_steps": 1030, "loss": 0.74, "lr": 1.3203883495145633e-05, "epoch": 0.08246172502652721, "percentage": 1.65, "elapsed_time": "1:06:28", "remaining_time": "2 days, 18:01:20"} +{"current_steps": 18, "total_steps": 1030, "loss": 0.7223, "lr": 1.3980582524271846e-05, "epoch": 0.08731241473396999, "percentage": 1.75, "elapsed_time": "1:10:22", "remaining_time": "2 days, 17:56:43"} +{"current_steps": 19, "total_steps": 1030, "loss": 0.7149, "lr": 1.475728155339806e-05, "epoch": 0.09216310444141276, "percentage": 1.84, "elapsed_time": "1:14:17", "remaining_time": "2 days, 17:52:46"} +{"current_steps": 20, "total_steps": 1030, "loss": 0.7032, "lr": 1.5533980582524273e-05, "epoch": 0.09701379414885554, "percentage": 1.94, "elapsed_time": "1:18:10", "remaining_time": "2 days, 17:48:04"} +{"current_steps": 21, "total_steps": 1030, "loss": 0.697, "lr": 1.6310679611650486e-05, "epoch": 0.10186448385629832, "percentage": 2.04, "elapsed_time": "1:22:03", "remaining_time": "2 days, 17:42:25"} +{"current_steps": 22, "total_steps": 1030, "loss": 0.6913, "lr": 1.70873786407767e-05, "epoch": 0.10671517356374109, "percentage": 2.14, "elapsed_time": "1:25:56", "remaining_time": "2 days, 17:37:47"} +{"current_steps": 23, "total_steps": 1030, "loss": 0.6844, "lr": 1.7864077669902916e-05, "epoch": 0.11156586327118387, "percentage": 2.23, "elapsed_time": "1:29:49", "remaining_time": "2 days, 17:33:02"} +{"current_steps": 24, "total_steps": 1030, "loss": 0.6807, "lr": 1.864077669902913e-05, "epoch": 0.11641655297862664, "percentage": 2.33, "elapsed_time": "1:33:43", "remaining_time": "2 days, 17:28:35"} +{"current_steps": 25, "total_steps": 1030, "loss": 0.6651, "lr": 1.9417475728155343e-05, "epoch": 0.12126724268606942, "percentage": 2.43, "elapsed_time": "1:37:36", "remaining_time": "2 days, 17:23:59"} +{"current_steps": 26, "total_steps": 1030, "loss": 0.6661, "lr": 2.0194174757281556e-05, "epoch": 0.1261179323935122, "percentage": 2.52, "elapsed_time": "1:41:29", "remaining_time": "2 days, 17:19:25"} +{"current_steps": 27, "total_steps": 1030, "loss": 0.6655, "lr": 2.097087378640777e-05, "epoch": 0.13096862210095497, "percentage": 2.62, "elapsed_time": "1:45:23", "remaining_time": "2 days, 17:14:49"} +{"current_steps": 28, "total_steps": 1030, "loss": 0.6541, "lr": 2.1747572815533982e-05, "epoch": 0.13581931180839776, "percentage": 2.72, "elapsed_time": "1:49:17", "remaining_time": "2 days, 17:10:52"} +{"current_steps": 29, "total_steps": 1030, "loss": 0.6534, "lr": 2.2524271844660196e-05, "epoch": 0.14067000151584053, "percentage": 2.82, "elapsed_time": "1:53:11", "remaining_time": "2 days, 17:06:48"} +{"current_steps": 30, "total_steps": 1030, "loss": 0.6536, "lr": 2.330097087378641e-05, "epoch": 0.14552069122328332, "percentage": 2.91, "elapsed_time": "1:57:05", "remaining_time": "2 days, 17:02:50"} +{"current_steps": 31, "total_steps": 1030, "loss": 0.6545, "lr": 2.4077669902912622e-05, "epoch": 0.15037138093072608, "percentage": 3.01, "elapsed_time": "2:00:59", "remaining_time": "2 days, 16:58:54"} +{"current_steps": 32, "total_steps": 1030, "loss": 0.6314, "lr": 2.4854368932038836e-05, "epoch": 0.15522207063816887, "percentage": 3.11, "elapsed_time": "2:04:52", "remaining_time": "2 days, 16:54:33"} +{"current_steps": 33, "total_steps": 1030, "loss": 0.6373, "lr": 2.5631067961165052e-05, "epoch": 0.16007276034561163, "percentage": 3.2, "elapsed_time": "2:08:45", "remaining_time": "2 days, 16:50:09"} +{"current_steps": 34, "total_steps": 1030, "loss": 0.63, "lr": 2.6407766990291266e-05, "epoch": 0.16492345005305442, "percentage": 3.3, "elapsed_time": "2:12:38", "remaining_time": "2 days, 16:45:35"} +{"current_steps": 35, "total_steps": 1030, "loss": 0.6456, "lr": 2.718446601941748e-05, "epoch": 0.16977413976049718, "percentage": 3.4, "elapsed_time": "2:16:31", "remaining_time": "2 days, 16:41:08"} +{"current_steps": 36, "total_steps": 1030, "loss": 0.6308, "lr": 2.7961165048543692e-05, "epoch": 0.17462482946793997, "percentage": 3.5, "elapsed_time": "2:20:24", "remaining_time": "2 days, 16:37:03"} +{"current_steps": 37, "total_steps": 1030, "loss": 0.6398, "lr": 2.8737864077669905e-05, "epoch": 0.17947551917538274, "percentage": 3.59, "elapsed_time": "2:24:18", "remaining_time": "2 days, 16:32:51"} +{"current_steps": 38, "total_steps": 1030, "loss": 0.6276, "lr": 2.951456310679612e-05, "epoch": 0.18432620888282553, "percentage": 3.69, "elapsed_time": "2:28:12", "remaining_time": "2 days, 16:28:50"} +{"current_steps": 39, "total_steps": 1030, "loss": 0.6218, "lr": 3.0291262135922332e-05, "epoch": 0.18917689859026832, "percentage": 3.79, "elapsed_time": "2:32:05", "remaining_time": "2 days, 16:24:47"} +{"current_steps": 40, "total_steps": 1030, "loss": 0.6253, "lr": 3.1067961165048545e-05, "epoch": 0.19402758829771108, "percentage": 3.88, "elapsed_time": "2:35:58", "remaining_time": "2 days, 16:20:30"} +{"current_steps": 41, "total_steps": 1030, "loss": 0.6281, "lr": 3.184466019417476e-05, "epoch": 0.19887827800515387, "percentage": 3.98, "elapsed_time": "2:39:51", "remaining_time": "2 days, 16:15:57"} +{"current_steps": 42, "total_steps": 1030, "loss": 0.6235, "lr": 3.262135922330097e-05, "epoch": 0.20372896771259663, "percentage": 4.08, "elapsed_time": "2:43:45", "remaining_time": "2 days, 16:12:05"} +{"current_steps": 43, "total_steps": 1030, "loss": 0.622, "lr": 3.339805825242719e-05, "epoch": 0.20857965742003942, "percentage": 4.17, "elapsed_time": "2:47:38", "remaining_time": "2 days, 16:08:03"} +{"current_steps": 44, "total_steps": 1030, "loss": 0.6107, "lr": 3.41747572815534e-05, "epoch": 0.21343034712748218, "percentage": 4.27, "elapsed_time": "2:51:31", "remaining_time": "2 days, 16:03:53"} +{"current_steps": 45, "total_steps": 1030, "loss": 0.6151, "lr": 3.4951456310679615e-05, "epoch": 0.21828103683492497, "percentage": 4.37, "elapsed_time": "2:55:25", "remaining_time": "2 days, 16:00:00"} +{"current_steps": 46, "total_steps": 1030, "loss": 0.6089, "lr": 3.572815533980583e-05, "epoch": 0.22313172654236774, "percentage": 4.47, "elapsed_time": "2:59:23", "remaining_time": "2 days, 15:57:24"} +{"current_steps": 47, "total_steps": 1030, "loss": 0.6165, "lr": 3.650485436893204e-05, "epoch": 0.22798241624981053, "percentage": 4.56, "elapsed_time": "3:03:16", "remaining_time": "2 days, 15:53:20"} +{"current_steps": 48, "total_steps": 1030, "loss": 0.6104, "lr": 3.728155339805826e-05, "epoch": 0.2328331059572533, "percentage": 4.66, "elapsed_time": "3:07:10", "remaining_time": "2 days, 15:49:21"} +{"current_steps": 49, "total_steps": 1030, "loss": 0.6086, "lr": 3.805825242718447e-05, "epoch": 0.23768379566469608, "percentage": 4.76, "elapsed_time": "3:11:04", "remaining_time": "2 days, 15:45:30"} +{"current_steps": 50, "total_steps": 1030, "loss": 0.6123, "lr": 3.8834951456310685e-05, "epoch": 0.24253448537213884, "percentage": 4.85, "elapsed_time": "3:14:58", "remaining_time": "2 days, 15:41:29"} +{"current_steps": 51, "total_steps": 1030, "loss": 0.5979, "lr": 3.9611650485436895e-05, "epoch": 0.24738517507958163, "percentage": 4.95, "elapsed_time": "3:18:51", "remaining_time": "2 days, 15:37:13"} +{"current_steps": 52, "total_steps": 1030, "loss": 0.6134, "lr": 4.038834951456311e-05, "epoch": 0.2522358647870244, "percentage": 5.05, "elapsed_time": "3:22:44", "remaining_time": "2 days, 15:33:12"} +{"current_steps": 53, "total_steps": 1030, "loss": 0.5987, "lr": 4.116504854368932e-05, "epoch": 0.25708655449446716, "percentage": 5.15, "elapsed_time": "3:26:39", "remaining_time": "2 days, 15:29:23"} +{"current_steps": 54, "total_steps": 1030, "loss": 0.6134, "lr": 4.194174757281554e-05, "epoch": 0.26193724420190995, "percentage": 5.24, "elapsed_time": "3:30:33", "remaining_time": "2 days, 15:25:34"} +{"current_steps": 55, "total_steps": 1030, "loss": 0.5978, "lr": 4.271844660194175e-05, "epoch": 0.26678793390935274, "percentage": 5.34, "elapsed_time": "3:34:26", "remaining_time": "2 days, 15:21:26"} +{"current_steps": 56, "total_steps": 1030, "loss": 0.5944, "lr": 4.3495145631067965e-05, "epoch": 0.2716386236167955, "percentage": 5.44, "elapsed_time": "3:38:21", "remaining_time": "2 days, 15:17:47"} +{"current_steps": 57, "total_steps": 1030, "loss": 0.6052, "lr": 4.4271844660194175e-05, "epoch": 0.2764893133242383, "percentage": 5.53, "elapsed_time": "3:42:14", "remaining_time": "2 days, 15:13:47"} +{"current_steps": 58, "total_steps": 1030, "loss": 0.6008, "lr": 4.504854368932039e-05, "epoch": 0.28134000303168105, "percentage": 5.63, "elapsed_time": "3:46:08", "remaining_time": "2 days, 15:09:55"} +{"current_steps": 59, "total_steps": 1030, "loss": 0.594, "lr": 4.58252427184466e-05, "epoch": 0.28619069273912384, "percentage": 5.73, "elapsed_time": "3:50:02", "remaining_time": "2 days, 15:05:58"} +{"current_steps": 60, "total_steps": 1030, "loss": 0.5892, "lr": 4.660194174757282e-05, "epoch": 0.29104138244656663, "percentage": 5.83, "elapsed_time": "3:53:55", "remaining_time": "2 days, 15:01:39"} +{"current_steps": 61, "total_steps": 1030, "loss": 0.5931, "lr": 4.737864077669903e-05, "epoch": 0.2958920721540094, "percentage": 5.92, "elapsed_time": "3:57:51", "remaining_time": "2 days, 14:58:18"} +{"current_steps": 62, "total_steps": 1030, "loss": 0.5932, "lr": 4.8155339805825245e-05, "epoch": 0.30074276186145216, "percentage": 6.02, "elapsed_time": "4:01:44", "remaining_time": "2 days, 14:54:22"} +{"current_steps": 63, "total_steps": 1030, "loss": 0.5948, "lr": 4.8932038834951454e-05, "epoch": 0.30559345156889495, "percentage": 6.12, "elapsed_time": "4:05:38", "remaining_time": "2 days, 14:50:19"} +{"current_steps": 64, "total_steps": 1030, "loss": 0.5897, "lr": 4.970873786407767e-05, "epoch": 0.31044414127633774, "percentage": 6.21, "elapsed_time": "4:09:31", "remaining_time": "2 days, 14:46:17"} +{"current_steps": 65, "total_steps": 1030, "loss": 0.5824, "lr": 5.0485436893203895e-05, "epoch": 0.3152948309837805, "percentage": 6.31, "elapsed_time": "4:13:25", "remaining_time": "2 days, 14:42:17"} +{"current_steps": 66, "total_steps": 1030, "loss": 0.5802, "lr": 5.1262135922330105e-05, "epoch": 0.32014552069122326, "percentage": 6.41, "elapsed_time": "4:17:19", "remaining_time": "2 days, 14:38:24"} +{"current_steps": 67, "total_steps": 1030, "loss": 0.5804, "lr": 5.203883495145632e-05, "epoch": 0.32499621039866605, "percentage": 6.5, "elapsed_time": "4:21:12", "remaining_time": "2 days, 14:34:28"} +{"current_steps": 68, "total_steps": 1030, "loss": 0.5812, "lr": 5.281553398058253e-05, "epoch": 0.32984690010610884, "percentage": 6.6, "elapsed_time": "4:25:06", "remaining_time": "2 days, 14:30:31"} +{"current_steps": 69, "total_steps": 1030, "loss": 0.5862, "lr": 5.359223300970875e-05, "epoch": 0.33469758981355163, "percentage": 6.7, "elapsed_time": "4:29:00", "remaining_time": "2 days, 14:26:43"} +{"current_steps": 70, "total_steps": 1030, "loss": 0.5912, "lr": 5.436893203883496e-05, "epoch": 0.33954827952099437, "percentage": 6.8, "elapsed_time": "4:32:55", "remaining_time": "2 days, 14:22:52"} +{"current_steps": 71, "total_steps": 1030, "loss": 0.5906, "lr": 5.5145631067961174e-05, "epoch": 0.34439896922843716, "percentage": 6.89, "elapsed_time": "4:36:49", "remaining_time": "2 days, 14:19:03"} +{"current_steps": 72, "total_steps": 1030, "loss": 0.5824, "lr": 5.5922330097087384e-05, "epoch": 0.34924965893587995, "percentage": 6.99, "elapsed_time": "4:40:42", "remaining_time": "2 days, 14:15:01"} +{"current_steps": 73, "total_steps": 1030, "loss": 0.6359, "lr": 5.66990291262136e-05, "epoch": 0.35410034864332274, "percentage": 7.09, "elapsed_time": "4:44:35", "remaining_time": "2 days, 14:10:47"} +{"current_steps": 74, "total_steps": 1030, "loss": 0.6486, "lr": 5.747572815533981e-05, "epoch": 0.3589510383507655, "percentage": 7.18, "elapsed_time": "4:48:29", "remaining_time": "2 days, 14:06:54"} +{"current_steps": 75, "total_steps": 1030, "loss": 0.595, "lr": 5.825242718446603e-05, "epoch": 0.36380172805820826, "percentage": 7.28, "elapsed_time": "4:52:23", "remaining_time": "2 days, 14:03:06"} +{"current_steps": 76, "total_steps": 1030, "loss": 0.6387, "lr": 5.902912621359224e-05, "epoch": 0.36865241776565105, "percentage": 7.38, "elapsed_time": "4:56:18", "remaining_time": "2 days, 13:59:22"} +{"current_steps": 77, "total_steps": 1030, "loss": 0.6344, "lr": 5.9805825242718454e-05, "epoch": 0.37350310747309384, "percentage": 7.48, "elapsed_time": "5:00:11", "remaining_time": "2 days, 13:55:17"} +{"current_steps": 78, "total_steps": 1030, "loss": 0.6048, "lr": 6.0582524271844664e-05, "epoch": 0.37835379718053663, "percentage": 7.57, "elapsed_time": "5:04:05", "remaining_time": "2 days, 13:51:28"} +{"current_steps": 79, "total_steps": 1030, "loss": 0.6203, "lr": 6.135922330097087e-05, "epoch": 0.38320448688797937, "percentage": 7.67, "elapsed_time": "5:07:58", "remaining_time": "2 days, 13:47:25"} +{"current_steps": 80, "total_steps": 1030, "loss": 0.6052, "lr": 6.213592233009709e-05, "epoch": 0.38805517659542216, "percentage": 7.77, "elapsed_time": "5:11:51", "remaining_time": "2 days, 13:43:16"} +{"current_steps": 81, "total_steps": 1030, "loss": 0.6112, "lr": 6.291262135922331e-05, "epoch": 0.39290586630286495, "percentage": 7.86, "elapsed_time": "5:15:44", "remaining_time": "2 days, 13:39:20"} +{"current_steps": 82, "total_steps": 1030, "loss": 0.5977, "lr": 6.368932038834952e-05, "epoch": 0.39775655601030774, "percentage": 7.96, "elapsed_time": "5:19:38", "remaining_time": "2 days, 13:35:26"} +{"current_steps": 83, "total_steps": 1030, "loss": 0.5914, "lr": 6.446601941747573e-05, "epoch": 0.4026072457177505, "percentage": 8.06, "elapsed_time": "5:23:33", "remaining_time": "2 days, 13:31:35"} +{"current_steps": 84, "total_steps": 1030, "loss": 0.5918, "lr": 6.524271844660194e-05, "epoch": 0.40745793542519326, "percentage": 8.16, "elapsed_time": "5:27:26", "remaining_time": "2 days, 13:27:39"} +{"current_steps": 85, "total_steps": 1030, "loss": 0.5948, "lr": 6.601941747572816e-05, "epoch": 0.41230862513263605, "percentage": 8.25, "elapsed_time": "5:31:18", "remaining_time": "2 days, 13:23:25"} +{"current_steps": 86, "total_steps": 1030, "loss": 0.5839, "lr": 6.679611650485438e-05, "epoch": 0.41715931484007884, "percentage": 8.35, "elapsed_time": "5:35:11", "remaining_time": "2 days, 13:19:13"} +{"current_steps": 87, "total_steps": 1030, "loss": 0.5833, "lr": 6.757281553398058e-05, "epoch": 0.4220100045475216, "percentage": 8.45, "elapsed_time": "5:39:04", "remaining_time": "2 days, 13:15:20"} +{"current_steps": 88, "total_steps": 1030, "loss": 0.5818, "lr": 6.83495145631068e-05, "epoch": 0.42686069425496437, "percentage": 8.54, "elapsed_time": "5:42:58", "remaining_time": "2 days, 13:11:21"} +{"current_steps": 89, "total_steps": 1030, "loss": 0.5863, "lr": 6.912621359223301e-05, "epoch": 0.43171138396240716, "percentage": 8.64, "elapsed_time": "5:46:50", "remaining_time": "2 days, 13:07:10"} +{"current_steps": 90, "total_steps": 1030, "loss": 0.5821, "lr": 6.990291262135923e-05, "epoch": 0.43656207366984995, "percentage": 8.74, "elapsed_time": "5:50:43", "remaining_time": "2 days, 13:03:04"} +{"current_steps": 91, "total_steps": 1030, "loss": 0.5814, "lr": 7.067961165048545e-05, "epoch": 0.4414127633772927, "percentage": 8.83, "elapsed_time": "5:54:37", "remaining_time": "2 days, 12:59:11"} +{"current_steps": 92, "total_steps": 1030, "loss": 0.5819, "lr": 7.145631067961166e-05, "epoch": 0.4462634530847355, "percentage": 8.93, "elapsed_time": "5:58:30", "remaining_time": "2 days, 12:55:16"} +{"current_steps": 93, "total_steps": 1030, "loss": 0.5752, "lr": 7.223300970873787e-05, "epoch": 0.45111414279217826, "percentage": 9.03, "elapsed_time": "6:02:23", "remaining_time": "2 days, 12:51:09"} +{"current_steps": 94, "total_steps": 1030, "loss": 0.5786, "lr": 7.300970873786408e-05, "epoch": 0.45596483249962105, "percentage": 9.13, "elapsed_time": "6:06:17", "remaining_time": "2 days, 12:47:17"} +{"current_steps": 95, "total_steps": 1030, "loss": 0.5789, "lr": 7.37864077669903e-05, "epoch": 0.46081552220706384, "percentage": 9.22, "elapsed_time": "6:10:10", "remaining_time": "2 days, 12:43:20"} +{"current_steps": 96, "total_steps": 1030, "loss": 0.5745, "lr": 7.456310679611652e-05, "epoch": 0.4656662119145066, "percentage": 9.32, "elapsed_time": "6:14:03", "remaining_time": "2 days, 12:39:13"} +{"current_steps": 97, "total_steps": 1030, "loss": 0.5775, "lr": 7.533980582524272e-05, "epoch": 0.47051690162194937, "percentage": 9.42, "elapsed_time": "6:17:57", "remaining_time": "2 days, 12:35:20"} +{"current_steps": 98, "total_steps": 1030, "loss": 0.5699, "lr": 7.611650485436894e-05, "epoch": 0.47536759132939216, "percentage": 9.51, "elapsed_time": "6:21:50", "remaining_time": "2 days, 12:31:26"} +{"current_steps": 99, "total_steps": 1030, "loss": 0.5733, "lr": 7.689320388349515e-05, "epoch": 0.48021828103683495, "percentage": 9.61, "elapsed_time": "6:25:43", "remaining_time": "2 days, 12:27:19"} +{"current_steps": 100, "total_steps": 1030, "loss": 0.5735, "lr": 7.766990291262137e-05, "epoch": 0.4850689707442777, "percentage": 9.71, "elapsed_time": "6:29:37", "remaining_time": "2 days, 12:23:26"} +{"current_steps": 101, "total_steps": 1030, "loss": 0.5733, "lr": 7.844660194174757e-05, "epoch": 0.4899196604517205, "percentage": 9.81, "elapsed_time": "6:33:30", "remaining_time": "2 days, 12:19:31"} +{"current_steps": 102, "total_steps": 1030, "loss": 0.576, "lr": 7.922330097087379e-05, "epoch": 0.49477035015916326, "percentage": 9.9, "elapsed_time": "6:37:22", "remaining_time": "2 days, 12:15:24"} +{"current_steps": 103, "total_steps": 1030, "loss": 0.5697, "lr": 8e-05, "epoch": 0.49962103986660605, "percentage": 10.0, "elapsed_time": "6:41:17", "remaining_time": "2 days, 12:11:35"} +{"current_steps": 104, "total_steps": 1030, "loss": 0.5799, "lr": 7.999977029531286e-05, "epoch": 0.5044717295740488, "percentage": 10.1, "elapsed_time": "6:45:10", "remaining_time": "2 days, 12:07:39"} +{"current_steps": 105, "total_steps": 1030, "loss": 0.5756, "lr": 7.999908118388965e-05, "epoch": 0.5093224192814916, "percentage": 10.19, "elapsed_time": "6:49:03", "remaining_time": "2 days, 12:03:33"} +{"current_steps": 106, "total_steps": 1030, "loss": 0.5713, "lr": 7.999793267364497e-05, "epoch": 0.5141731089889343, "percentage": 10.29, "elapsed_time": "6:52:56", "remaining_time": "2 days, 11:59:39"} +{"current_steps": 107, "total_steps": 1030, "loss": 0.5733, "lr": 7.999632477776974e-05, "epoch": 0.5190237986963772, "percentage": 10.39, "elapsed_time": "6:56:51", "remaining_time": "2 days, 11:55:51"} +{"current_steps": 108, "total_steps": 1030, "loss": 0.5661, "lr": 7.9994257514731e-05, "epoch": 0.5238744884038199, "percentage": 10.49, "elapsed_time": "7:00:45", "remaining_time": "2 days, 11:51:58"} +{"current_steps": 109, "total_steps": 1030, "loss": 0.5719, "lr": 7.999173090827177e-05, "epoch": 0.5287251781112627, "percentage": 10.58, "elapsed_time": "7:04:38", "remaining_time": "2 days, 11:48:01"} +{"current_steps": 110, "total_steps": 1030, "loss": 0.5695, "lr": 7.998874498741072e-05, "epoch": 0.5335758678187055, "percentage": 10.68, "elapsed_time": "7:08:31", "remaining_time": "2 days, 11:44:00"} +{"current_steps": 111, "total_steps": 1030, "loss": 0.5712, "lr": 7.998529978644183e-05, "epoch": 0.5384265575261482, "percentage": 10.78, "elapsed_time": "7:12:25", "remaining_time": "2 days, 11:40:06"} +{"current_steps": 112, "total_steps": 1030, "loss": 0.5609, "lr": 7.998139534493407e-05, "epoch": 0.543277247233591, "percentage": 10.87, "elapsed_time": "7:16:18", "remaining_time": "2 days, 11:36:13"} +{"current_steps": 113, "total_steps": 1030, "loss": 0.5648, "lr": 7.997703170773084e-05, "epoch": 0.5481279369410338, "percentage": 10.97, "elapsed_time": "7:20:16", "remaining_time": "2 days, 11:32:54"} +{"current_steps": 114, "total_steps": 1030, "loss": 0.5757, "lr": 7.997220892494955e-05, "epoch": 0.5529786266484766, "percentage": 11.07, "elapsed_time": "7:24:09", "remaining_time": "2 days, 11:28:53"} +{"current_steps": 115, "total_steps": 1030, "loss": 0.566, "lr": 7.996692705198097e-05, "epoch": 0.5578293163559194, "percentage": 11.17, "elapsed_time": "7:28:03", "remaining_time": "2 days, 11:24:55"} +{"current_steps": 116, "total_steps": 1030, "loss": 0.5757, "lr": 7.996118614948869e-05, "epoch": 0.5626800060633621, "percentage": 11.26, "elapsed_time": "7:31:56", "remaining_time": "2 days, 11:21:01"} +{"current_steps": 117, "total_steps": 1030, "loss": 0.5697, "lr": 7.995498628340827e-05, "epoch": 0.567530695770805, "percentage": 11.36, "elapsed_time": "7:35:49", "remaining_time": "2 days, 11:17:02"} +{"current_steps": 118, "total_steps": 1030, "loss": 0.5672, "lr": 7.994832752494667e-05, "epoch": 0.5723813854782477, "percentage": 11.46, "elapsed_time": "7:39:43", "remaining_time": "2 days, 11:13:05"} +{"current_steps": 119, "total_steps": 1030, "loss": 0.5624, "lr": 7.994120995058127e-05, "epoch": 0.5772320751856904, "percentage": 11.55, "elapsed_time": "7:43:36", "remaining_time": "2 days, 11:09:11"} +{"current_steps": 120, "total_steps": 1030, "loss": 0.554, "lr": 7.993363364205907e-05, "epoch": 0.5820827648931333, "percentage": 11.65, "elapsed_time": "7:47:30", "remaining_time": "2 days, 11:05:16"} +{"current_steps": 121, "total_steps": 1030, "loss": 0.556, "lr": 7.992559868639576e-05, "epoch": 0.586933454600576, "percentage": 11.75, "elapsed_time": "7:51:23", "remaining_time": "2 days, 11:01:14"} +{"current_steps": 122, "total_steps": 1030, "loss": 0.5526, "lr": 7.99171051758747e-05, "epoch": 0.5917841443080188, "percentage": 11.84, "elapsed_time": "7:55:16", "remaining_time": "2 days, 10:57:18"} +{"current_steps": 123, "total_steps": 1030, "loss": 0.5609, "lr": 7.990815320804583e-05, "epoch": 0.5966348340154616, "percentage": 11.94, "elapsed_time": "7:59:09", "remaining_time": "2 days, 10:53:21"} +{"current_steps": 124, "total_steps": 1030, "loss": 0.5586, "lr": 7.98987428857246e-05, "epoch": 0.6014855237229043, "percentage": 12.04, "elapsed_time": "8:03:03", "remaining_time": "2 days, 10:49:25"} +{"current_steps": 125, "total_steps": 1030, "loss": 0.5507, "lr": 7.988887431699079e-05, "epoch": 0.6063362134303472, "percentage": 12.14, "elapsed_time": "8:06:57", "remaining_time": "2 days, 10:45:34"} +{"current_steps": 126, "total_steps": 1030, "loss": 0.5568, "lr": 7.987854761518719e-05, "epoch": 0.6111869031377899, "percentage": 12.23, "elapsed_time": "8:10:51", "remaining_time": "2 days, 10:41:41"} +{"current_steps": 127, "total_steps": 1030, "loss": 0.5591, "lr": 7.986776289891842e-05, "epoch": 0.6160375928452326, "percentage": 12.33, "elapsed_time": "8:14:44", "remaining_time": "2 days, 10:37:45"} +{"current_steps": 128, "total_steps": 1030, "loss": 0.5563, "lr": 7.985652029204946e-05, "epoch": 0.6208882825526755, "percentage": 12.43, "elapsed_time": "8:18:37", "remaining_time": "2 days, 10:33:48"} +{"current_steps": 129, "total_steps": 1030, "loss": 0.5491, "lr": 7.984481992370429e-05, "epoch": 0.6257389722601182, "percentage": 12.52, "elapsed_time": "8:22:30", "remaining_time": "2 days, 10:29:49"} +{"current_steps": 130, "total_steps": 1030, "loss": 0.5418, "lr": 7.983266192826437e-05, "epoch": 0.630589661967561, "percentage": 12.62, "elapsed_time": "8:26:25", "remaining_time": "2 days, 10:25:59"} +{"current_steps": 131, "total_steps": 1030, "loss": 0.5441, "lr": 7.982004644536716e-05, "epoch": 0.6354403516750038, "percentage": 12.72, "elapsed_time": "8:30:18", "remaining_time": "2 days, 10:22:00"} +{"current_steps": 132, "total_steps": 1030, "loss": 0.5493, "lr": 7.98069736199044e-05, "epoch": 0.6402910413824465, "percentage": 12.82, "elapsed_time": "8:34:10", "remaining_time": "2 days, 10:17:59"} +{"current_steps": 133, "total_steps": 1030, "loss": 0.5465, "lr": 7.979344360202055e-05, "epoch": 0.6451417310898894, "percentage": 12.91, "elapsed_time": "8:38:05", "remaining_time": "2 days, 10:14:08"} +{"current_steps": 134, "total_steps": 1030, "loss": 0.5475, "lr": 7.977945654711108e-05, "epoch": 0.6499924207973321, "percentage": 13.01, "elapsed_time": "8:41:59", "remaining_time": "2 days, 10:10:19"} +{"current_steps": 135, "total_steps": 1030, "loss": 0.543, "lr": 7.976501261582056e-05, "epoch": 0.654843110504775, "percentage": 13.11, "elapsed_time": "8:45:53", "remaining_time": "2 days, 10:06:26"} +{"current_steps": 136, "total_steps": 1030, "loss": 0.5525, "lr": 7.975011197404092e-05, "epoch": 0.6596938002122177, "percentage": 13.2, "elapsed_time": "8:49:46", "remaining_time": "2 days, 10:02:31"} +{"current_steps": 137, "total_steps": 1030, "loss": 0.5518, "lr": 7.973475479290956e-05, "epoch": 0.6645444899196604, "percentage": 13.3, "elapsed_time": "8:53:39", "remaining_time": "2 days, 9:58:32"} +{"current_steps": 138, "total_steps": 1030, "loss": 0.5417, "lr": 7.971894124880727e-05, "epoch": 0.6693951796271033, "percentage": 13.4, "elapsed_time": "8:57:33", "remaining_time": "2 days, 9:54:37"} +{"current_steps": 139, "total_steps": 1030, "loss": 0.5464, "lr": 7.970267152335632e-05, "epoch": 0.674245869334546, "percentage": 13.5, "elapsed_time": "9:01:27", "remaining_time": "2 days, 9:50:45"} +{"current_steps": 140, "total_steps": 1030, "loss": 0.544, "lr": 7.968594580341832e-05, "epoch": 0.6790965590419887, "percentage": 13.59, "elapsed_time": "9:05:20", "remaining_time": "2 days, 9:46:51"} +{"current_steps": 141, "total_steps": 1030, "loss": 0.5351, "lr": 7.966876428109209e-05, "epoch": 0.6839472487494316, "percentage": 13.69, "elapsed_time": "9:09:15", "remaining_time": "2 days, 9:43:00"} +{"current_steps": 142, "total_steps": 1030, "loss": 0.5397, "lr": 7.965112715371144e-05, "epoch": 0.6887979384568743, "percentage": 13.79, "elapsed_time": "9:13:09", "remaining_time": "2 days, 9:39:09"} +{"current_steps": 143, "total_steps": 1030, "loss": 0.5346, "lr": 7.96330346238429e-05, "epoch": 0.6936486281643172, "percentage": 13.88, "elapsed_time": "9:17:02", "remaining_time": "2 days, 9:35:15"} +{"current_steps": 144, "total_steps": 1030, "loss": 0.5395, "lr": 7.961448689928341e-05, "epoch": 0.6984993178717599, "percentage": 13.98, "elapsed_time": "9:20:56", "remaining_time": "2 days, 9:31:23"} +{"current_steps": 145, "total_steps": 1030, "loss": 0.5447, "lr": 7.959548419305796e-05, "epoch": 0.7033500075792026, "percentage": 14.08, "elapsed_time": "9:24:49", "remaining_time": "2 days, 9:27:24"} +{"current_steps": 146, "total_steps": 1030, "loss": 0.5364, "lr": 7.957602672341707e-05, "epoch": 0.7082006972866455, "percentage": 14.17, "elapsed_time": "9:28:43", "remaining_time": "2 days, 9:23:29"} +{"current_steps": 147, "total_steps": 1030, "loss": 0.5381, "lr": 7.955611471383433e-05, "epoch": 0.7130513869940882, "percentage": 14.27, "elapsed_time": "9:32:37", "remaining_time": "2 days, 9:19:36"} +{"current_steps": 148, "total_steps": 1030, "loss": 0.5381, "lr": 7.953574839300385e-05, "epoch": 0.717902076701531, "percentage": 14.37, "elapsed_time": "9:36:30", "remaining_time": "2 days, 9:15:42"} +{"current_steps": 149, "total_steps": 1030, "loss": 0.5398, "lr": 7.95149279948376e-05, "epoch": 0.7227527664089738, "percentage": 14.47, "elapsed_time": "9:40:24", "remaining_time": "2 days, 9:11:51"} +{"current_steps": 150, "total_steps": 1030, "loss": 0.5386, "lr": 7.949365375846271e-05, "epoch": 0.7276034561164165, "percentage": 14.56, "elapsed_time": "9:44:18", "remaining_time": "2 days, 9:07:57"} +{"current_steps": 151, "total_steps": 1030, "loss": 0.5328, "lr": 7.94719259282188e-05, "epoch": 0.7324541458238594, "percentage": 14.66, "elapsed_time": "9:48:11", "remaining_time": "2 days, 9:03:57"} +{"current_steps": 152, "total_steps": 1030, "loss": 0.5406, "lr": 7.944974475365506e-05, "epoch": 0.7373048355313021, "percentage": 14.76, "elapsed_time": "9:52:05", "remaining_time": "2 days, 9:00:04"} +{"current_steps": 153, "total_steps": 1030, "loss": 0.5375, "lr": 7.94271104895275e-05, "epoch": 0.7421555252387448, "percentage": 14.85, "elapsed_time": "9:55:59", "remaining_time": "2 days, 8:56:11"} +{"current_steps": 154, "total_steps": 1030, "loss": 0.5322, "lr": 7.940402339579596e-05, "epoch": 0.7470062149461877, "percentage": 14.95, "elapsed_time": "9:59:52", "remaining_time": "2 days, 8:52:19"} +{"current_steps": 155, "total_steps": 1030, "loss": 0.5312, "lr": 7.93804837376211e-05, "epoch": 0.7518569046536304, "percentage": 15.05, "elapsed_time": "10:03:46", "remaining_time": "2 days, 8:48:25"} +{"current_steps": 156, "total_steps": 1030, "loss": 0.5362, "lr": 7.935649178536142e-05, "epoch": 0.7567075943610733, "percentage": 15.15, "elapsed_time": "10:07:40", "remaining_time": "2 days, 8:44:34"} +{"current_steps": 157, "total_steps": 1030, "loss": 0.5454, "lr": 7.93320478145701e-05, "epoch": 0.761558284068516, "percentage": 15.24, "elapsed_time": "10:11:34", "remaining_time": "2 days, 8:40:41"} +{"current_steps": 158, "total_steps": 1030, "loss": 0.5369, "lr": 7.93071521059919e-05, "epoch": 0.7664089737759587, "percentage": 15.34, "elapsed_time": "10:15:27", "remaining_time": "2 days, 8:36:41"} +{"current_steps": 159, "total_steps": 1030, "loss": 0.5255, "lr": 7.928180494555983e-05, "epoch": 0.7712596634834016, "percentage": 15.44, "elapsed_time": "10:19:21", "remaining_time": "2 days, 8:32:49"} +{"current_steps": 160, "total_steps": 1030, "loss": 0.535, "lr": 7.925600662439201e-05, "epoch": 0.7761103531908443, "percentage": 15.53, "elapsed_time": "10:23:15", "remaining_time": "2 days, 8:28:56"} +{"current_steps": 161, "total_steps": 1030, "loss": 0.5293, "lr": 7.922975743878817e-05, "epoch": 0.780961042898287, "percentage": 15.63, "elapsed_time": "10:27:09", "remaining_time": "2 days, 8:25:05"} +{"current_steps": 162, "total_steps": 1030, "loss": 0.5298, "lr": 7.92030576902264e-05, "epoch": 0.7858117326057299, "percentage": 15.73, "elapsed_time": "10:31:03", "remaining_time": "2 days, 8:21:11"} +{"current_steps": 163, "total_steps": 1030, "loss": 0.5315, "lr": 7.917590768535952e-05, "epoch": 0.7906624223131726, "percentage": 15.83, "elapsed_time": "10:34:57", "remaining_time": "2 days, 8:17:21"} +{"current_steps": 164, "total_steps": 1030, "loss": 0.5279, "lr": 7.914830773601173e-05, "epoch": 0.7955131120206155, "percentage": 15.92, "elapsed_time": "10:38:50", "remaining_time": "2 days, 8:13:25"} +{"current_steps": 165, "total_steps": 1030, "loss": 0.5372, "lr": 7.912025815917489e-05, "epoch": 0.8003638017280582, "percentage": 16.02, "elapsed_time": "10:42:45", "remaining_time": "2 days, 8:09:35"} +{"current_steps": 166, "total_steps": 1030, "loss": 0.535, "lr": 7.909175927700499e-05, "epoch": 0.805214491435501, "percentage": 16.12, "elapsed_time": "10:46:39", "remaining_time": "2 days, 8:05:46"} +{"current_steps": 167, "total_steps": 1030, "loss": 0.5333, "lr": 7.906281141681839e-05, "epoch": 0.8100651811429438, "percentage": 16.21, "elapsed_time": "10:50:33", "remaining_time": "2 days, 8:01:51"} +{"current_steps": 168, "total_steps": 1030, "loss": 0.5289, "lr": 7.903341491108798e-05, "epoch": 0.8149158708503865, "percentage": 16.31, "elapsed_time": "10:54:27", "remaining_time": "2 days, 7:57:57"} +{"current_steps": 169, "total_steps": 1030, "loss": 0.5331, "lr": 7.900357009743958e-05, "epoch": 0.8197665605578294, "percentage": 16.41, "elapsed_time": "10:58:21", "remaining_time": "2 days, 7:54:05"} +{"current_steps": 170, "total_steps": 1030, "loss": 0.5266, "lr": 7.897327731864784e-05, "epoch": 0.8246172502652721, "percentage": 16.5, "elapsed_time": "11:02:14", "remaining_time": "2 days, 7:50:11"} +{"current_steps": 171, "total_steps": 1030, "loss": 0.522, "lr": 7.894253692263244e-05, "epoch": 0.8294679399727148, "percentage": 16.6, "elapsed_time": "11:06:07", "remaining_time": "2 days, 7:46:13"} +{"current_steps": 172, "total_steps": 1030, "loss": 0.5297, "lr": 7.891134926245402e-05, "epoch": 0.8343186296801577, "percentage": 16.7, "elapsed_time": "11:10:00", "remaining_time": "2 days, 7:42:16"} +{"current_steps": 173, "total_steps": 1030, "loss": 0.5319, "lr": 7.887971469631016e-05, "epoch": 0.8391693193876004, "percentage": 16.8, "elapsed_time": "11:13:55", "remaining_time": "2 days, 7:38:25"} +{"current_steps": 174, "total_steps": 1030, "loss": 0.5408, "lr": 7.884763358753129e-05, "epoch": 0.8440200090950432, "percentage": 16.89, "elapsed_time": "11:17:48", "remaining_time": "2 days, 7:34:32"} +{"current_steps": 175, "total_steps": 1030, "loss": 0.5326, "lr": 7.881510630457643e-05, "epoch": 0.848870698802486, "percentage": 16.99, "elapsed_time": "11:21:42", "remaining_time": "2 days, 7:30:36"} +{"current_steps": 176, "total_steps": 1030, "loss": 0.5281, "lr": 7.878213322102908e-05, "epoch": 0.8537213885099287, "percentage": 17.09, "elapsed_time": "11:25:35", "remaining_time": "2 days, 7:26:41"} +{"current_steps": 177, "total_steps": 1030, "loss": 0.5269, "lr": 7.874871471559282e-05, "epoch": 0.8585720782173716, "percentage": 17.18, "elapsed_time": "11:29:29", "remaining_time": "2 days, 7:22:48"} +{"current_steps": 178, "total_steps": 1030, "loss": 0.5326, "lr": 7.8714851172087e-05, "epoch": 0.8634227679248143, "percentage": 17.28, "elapsed_time": "11:33:23", "remaining_time": "2 days, 7:18:54"} +{"current_steps": 179, "total_steps": 1030, "loss": 0.5312, "lr": 7.868054297944237e-05, "epoch": 0.868273457632257, "percentage": 17.38, "elapsed_time": "11:37:16", "remaining_time": "2 days, 7:15:00"} +{"current_steps": 180, "total_steps": 1030, "loss": 0.5265, "lr": 7.864579053169657e-05, "epoch": 0.8731241473396999, "percentage": 17.48, "elapsed_time": "11:41:10", "remaining_time": "2 days, 7:11:05"} +{"current_steps": 181, "total_steps": 1030, "loss": 0.5242, "lr": 7.86105942279896e-05, "epoch": 0.8779748370471426, "percentage": 17.57, "elapsed_time": "11:45:03", "remaining_time": "2 days, 7:07:07"} +{"current_steps": 182, "total_steps": 1030, "loss": 0.5117, "lr": 7.857495447255925e-05, "epoch": 0.8828255267545854, "percentage": 17.67, "elapsed_time": "11:48:57", "remaining_time": "2 days, 7:03:14"} +{"current_steps": 183, "total_steps": 1030, "loss": 0.5275, "lr": 7.853887167473646e-05, "epoch": 0.8876762164620282, "percentage": 17.77, "elapsed_time": "11:52:51", "remaining_time": "2 days, 6:59:23"} +{"current_steps": 184, "total_steps": 1030, "loss": 0.5236, "lr": 7.850234624894064e-05, "epoch": 0.892526906169471, "percentage": 17.86, "elapsed_time": "11:56:44", "remaining_time": "2 days, 6:55:29"} +{"current_steps": 185, "total_steps": 1030, "loss": 0.5269, "lr": 7.846537861467485e-05, "epoch": 0.8973775958769138, "percentage": 17.96, "elapsed_time": "12:00:38", "remaining_time": "2 days, 6:51:36"} +{"current_steps": 186, "total_steps": 1030, "loss": 0.5177, "lr": 7.842796919652104e-05, "epoch": 0.9022282855843565, "percentage": 18.06, "elapsed_time": "12:04:32", "remaining_time": "2 days, 6:47:44"} +{"current_steps": 187, "total_steps": 1030, "loss": 0.5236, "lr": 7.839011842413514e-05, "epoch": 0.9070789752917993, "percentage": 18.16, "elapsed_time": "12:08:27", "remaining_time": "2 days, 6:43:52"} +{"current_steps": 188, "total_steps": 1030, "loss": 0.5237, "lr": 7.835182673224212e-05, "epoch": 0.9119296649992421, "percentage": 18.25, "elapsed_time": "12:12:20", "remaining_time": "2 days, 6:39:57"} +{"current_steps": 189, "total_steps": 1030, "loss": 0.5193, "lr": 7.831309456063107e-05, "epoch": 0.9167803547066848, "percentage": 18.35, "elapsed_time": "12:16:13", "remaining_time": "2 days, 6:36:01"} +{"current_steps": 190, "total_steps": 1030, "loss": 0.5242, "lr": 7.827392235415005e-05, "epoch": 0.9216310444141277, "percentage": 18.45, "elapsed_time": "12:20:07", "remaining_time": "2 days, 6:32:07"} +{"current_steps": 191, "total_steps": 1030, "loss": 0.5223, "lr": 7.823431056270103e-05, "epoch": 0.9264817341215704, "percentage": 18.54, "elapsed_time": "12:24:00", "remaining_time": "2 days, 6:28:12"} +{"current_steps": 192, "total_steps": 1030, "loss": 0.522, "lr": 7.81942596412347e-05, "epoch": 0.9313324238290132, "percentage": 18.64, "elapsed_time": "12:27:53", "remaining_time": "2 days, 6:24:16"} +{"current_steps": 193, "total_steps": 1030, "loss": 0.509, "lr": 7.815377004974532e-05, "epoch": 0.936183113536456, "percentage": 18.74, "elapsed_time": "12:31:47", "remaining_time": "2 days, 6:20:20"} +{"current_steps": 194, "total_steps": 1030, "loss": 0.522, "lr": 7.811284225326529e-05, "epoch": 0.9410338032438987, "percentage": 18.83, "elapsed_time": "12:35:40", "remaining_time": "2 days, 6:16:25"} +{"current_steps": 195, "total_steps": 1030, "loss": 0.5258, "lr": 7.807147672185996e-05, "epoch": 0.9458844929513415, "percentage": 18.93, "elapsed_time": "12:39:34", "remaining_time": "2 days, 6:12:30"} +{"current_steps": 196, "total_steps": 1030, "loss": 0.524, "lr": 7.802967393062219e-05, "epoch": 0.9507351826587843, "percentage": 19.03, "elapsed_time": "12:43:31", "remaining_time": "2 days, 6:08:52"} +{"current_steps": 197, "total_steps": 1030, "loss": 0.5227, "lr": 7.798743435966676e-05, "epoch": 0.955585872366227, "percentage": 19.13, "elapsed_time": "12:47:25", "remaining_time": "2 days, 6:04:58"} +{"current_steps": 198, "total_steps": 1030, "loss": 0.5143, "lr": 7.794475849412512e-05, "epoch": 0.9604365620736699, "percentage": 19.22, "elapsed_time": "12:51:19", "remaining_time": "2 days, 6:01:05"} +{"current_steps": 199, "total_steps": 1030, "loss": 0.5186, "lr": 7.790164682413954e-05, "epoch": 0.9652872517811126, "percentage": 19.32, "elapsed_time": "12:55:12", "remaining_time": "2 days, 5:57:12"} +{"current_steps": 200, "total_steps": 1030, "loss": 0.5185, "lr": 7.785809984485765e-05, "epoch": 0.9701379414885554, "percentage": 19.42, "elapsed_time": "12:59:06", "remaining_time": "2 days, 5:53:19"} +{"current_steps": 201, "total_steps": 1030, "loss": 0.5179, "lr": 7.781411805642675e-05, "epoch": 0.9749886311959982, "percentage": 19.51, "elapsed_time": "13:03:01", "remaining_time": "2 days, 5:49:27"} +{"current_steps": 202, "total_steps": 1030, "loss": 0.5185, "lr": 7.776970196398795e-05, "epoch": 0.979839320903441, "percentage": 19.61, "elapsed_time": "13:06:54", "remaining_time": "2 days, 5:45:34"} +{"current_steps": 203, "total_steps": 1030, "loss": 0.5223, "lr": 7.77248520776705e-05, "epoch": 0.9846900106108837, "percentage": 19.71, "elapsed_time": "13:10:49", "remaining_time": "2 days, 5:41:42"} +{"current_steps": 204, "total_steps": 1030, "loss": 0.514, "lr": 7.767956891258585e-05, "epoch": 0.9895407003183265, "percentage": 19.81, "elapsed_time": "13:14:42", "remaining_time": "2 days, 5:37:48"} +{"current_steps": 205, "total_steps": 1030, "loss": 0.5227, "lr": 7.763385298882177e-05, "epoch": 0.9943913900257693, "percentage": 19.9, "elapsed_time": "13:18:35", "remaining_time": "2 days, 5:33:50"} +{"current_steps": 206, "total_steps": 1030, "loss": 0.5161, "lr": 7.758770483143634e-05, "epoch": 0.9992420797332121, "percentage": 20.0, "elapsed_time": "13:22:28", "remaining_time": "2 days, 5:29:55"} +{"current_steps": 207, "total_steps": 1030, "loss": 1.0269, "lr": 7.754112497045198e-05, "epoch": 1.0046991056540853, "percentage": 20.1, "elapsed_time": "13:26:50", "remaining_time": "2 days, 5:27:51"} +{"current_steps": 208, "total_steps": 1030, "loss": 0.5131, "lr": 7.749411394084931e-05, "epoch": 1.009549795361528, "percentage": 20.19, "elapsed_time": "13:30:44", "remaining_time": "2 days, 5:23:57"} +{"current_steps": 209, "total_steps": 1030, "loss": 0.5155, "lr": 7.744667228256102e-05, "epoch": 1.0144004850689707, "percentage": 20.29, "elapsed_time": "13:34:36", "remaining_time": "2 days, 5:19:59"} +{"current_steps": 210, "total_steps": 1030, "loss": 0.5066, "lr": 7.739880054046567e-05, "epoch": 1.0192511747764135, "percentage": 20.39, "elapsed_time": "13:38:30", "remaining_time": "2 days, 5:16:03"} +{"current_steps": 211, "total_steps": 1030, "loss": 0.5046, "lr": 7.735049926438143e-05, "epoch": 1.0241018644838562, "percentage": 20.49, "elapsed_time": "13:42:24", "remaining_time": "2 days, 5:12:09"} +{"current_steps": 212, "total_steps": 1030, "loss": 0.5057, "lr": 7.730176900905978e-05, "epoch": 1.0289525541912992, "percentage": 20.58, "elapsed_time": "13:46:16", "remaining_time": "2 days, 5:08:10"} +{"current_steps": 213, "total_steps": 1030, "loss": 0.5033, "lr": 7.725261033417914e-05, "epoch": 1.033803243898742, "percentage": 20.68, "elapsed_time": "13:50:10", "remaining_time": "2 days, 5:04:16"} +{"current_steps": 214, "total_steps": 1030, "loss": 0.5118, "lr": 7.720302380433838e-05, "epoch": 1.0386539336061846, "percentage": 20.78, "elapsed_time": "13:54:04", "remaining_time": "2 days, 5:00:22"} +{"current_steps": 215, "total_steps": 1030, "loss": 0.4943, "lr": 7.715300998905045e-05, "epoch": 1.0435046233136274, "percentage": 20.87, "elapsed_time": "13:57:56", "remaining_time": "2 days, 4:56:23"} +{"current_steps": 216, "total_steps": 1030, "loss": 0.5066, "lr": 7.710256946273572e-05, "epoch": 1.04835531302107, "percentage": 20.97, "elapsed_time": "14:01:50", "remaining_time": "2 days, 4:52:28"} +{"current_steps": 217, "total_steps": 1030, "loss": 0.4964, "lr": 7.705170280471546e-05, "epoch": 1.053206002728513, "percentage": 21.07, "elapsed_time": "14:05:43", "remaining_time": "2 days, 4:48:31"} +{"current_steps": 218, "total_steps": 1030, "loss": 0.4987, "lr": 7.700041059920516e-05, "epoch": 1.0580566924359558, "percentage": 21.17, "elapsed_time": "14:09:36", "remaining_time": "2 days, 4:44:35"} +{"current_steps": 219, "total_steps": 1030, "loss": 0.4984, "lr": 7.694869343530781e-05, "epoch": 1.0629073821433985, "percentage": 21.26, "elapsed_time": "14:13:30", "remaining_time": "2 days, 4:40:41"} +{"current_steps": 220, "total_steps": 1030, "loss": 0.4955, "lr": 7.689655190700719e-05, "epoch": 1.0677580718508413, "percentage": 21.36, "elapsed_time": "14:17:23", "remaining_time": "2 days, 4:36:45"} +{"current_steps": 221, "total_steps": 1030, "loss": 0.5072, "lr": 7.684398661316092e-05, "epoch": 1.072608761558284, "percentage": 21.46, "elapsed_time": "14:21:16", "remaining_time": "2 days, 4:32:50"} +{"current_steps": 222, "total_steps": 1030, "loss": 0.5078, "lr": 7.679099815749377e-05, "epoch": 1.0774594512657267, "percentage": 21.55, "elapsed_time": "14:25:10", "remaining_time": "2 days, 4:28:55"} +{"current_steps": 223, "total_steps": 1030, "loss": 0.5033, "lr": 7.673758714859052e-05, "epoch": 1.0823101409731697, "percentage": 21.65, "elapsed_time": "14:29:04", "remaining_time": "2 days, 4:25:03"} +{"current_steps": 224, "total_steps": 1030, "loss": 0.4998, "lr": 7.668375419988918e-05, "epoch": 1.0871608306806124, "percentage": 21.75, "elapsed_time": "14:32:58", "remaining_time": "2 days, 4:21:09"} +{"current_steps": 225, "total_steps": 1030, "loss": 0.4992, "lr": 7.662949992967375e-05, "epoch": 1.0920115203880552, "percentage": 21.84, "elapsed_time": "14:36:52", "remaining_time": "2 days, 4:17:14"} +{"current_steps": 226, "total_steps": 1030, "loss": 0.4994, "lr": 7.657482496106725e-05, "epoch": 1.096862210095498, "percentage": 21.94, "elapsed_time": "14:40:44", "remaining_time": "2 days, 4:13:16"} +{"current_steps": 227, "total_steps": 1030, "loss": 0.4936, "lr": 7.651972992202449e-05, "epoch": 1.1017128998029406, "percentage": 22.04, "elapsed_time": "14:44:38", "remaining_time": "2 days, 4:09:22"} +{"current_steps": 228, "total_steps": 1030, "loss": 0.502, "lr": 7.646421544532492e-05, "epoch": 1.1065635895103836, "percentage": 22.14, "elapsed_time": "14:48:32", "remaining_time": "2 days, 4:05:28"} +{"current_steps": 229, "total_steps": 1030, "loss": 0.502, "lr": 7.640828216856532e-05, "epoch": 1.1114142792178263, "percentage": 22.23, "elapsed_time": "14:52:25", "remaining_time": "2 days, 4:01:33"} +{"current_steps": 230, "total_steps": 1030, "loss": 0.4965, "lr": 7.635193073415246e-05, "epoch": 1.116264968925269, "percentage": 22.33, "elapsed_time": "14:56:19", "remaining_time": "2 days, 3:57:38"} +{"current_steps": 231, "total_steps": 1030, "loss": 0.4993, "lr": 7.62951617892958e-05, "epoch": 1.1211156586327118, "percentage": 22.43, "elapsed_time": "15:00:12", "remaining_time": "2 days, 3:53:41"} +{"current_steps": 232, "total_steps": 1030, "loss": 0.4921, "lr": 7.623797598599995e-05, "epoch": 1.1259663483401545, "percentage": 22.52, "elapsed_time": "15:04:05", "remaining_time": "2 days, 3:49:44"} +{"current_steps": 233, "total_steps": 1030, "loss": 0.4921, "lr": 7.618037398105728e-05, "epoch": 1.1308170380475975, "percentage": 22.62, "elapsed_time": "15:07:58", "remaining_time": "2 days, 3:45:48"} +{"current_steps": 234, "total_steps": 1030, "loss": 0.4963, "lr": 7.612235643604031e-05, "epoch": 1.1356677277550402, "percentage": 22.72, "elapsed_time": "15:11:52", "remaining_time": "2 days, 3:41:54"} +{"current_steps": 235, "total_steps": 1030, "loss": 0.4965, "lr": 7.606392401729415e-05, "epoch": 1.140518417462483, "percentage": 22.82, "elapsed_time": "15:15:44", "remaining_time": "2 days, 3:37:57"} +{"current_steps": 236, "total_steps": 1030, "loss": 0.5002, "lr": 7.600507739592879e-05, "epoch": 1.1453691071699257, "percentage": 22.91, "elapsed_time": "15:19:38", "remaining_time": "2 days, 3:34:02"} +{"current_steps": 237, "total_steps": 1030, "loss": 0.4978, "lr": 7.594581724781152e-05, "epoch": 1.1502197968773684, "percentage": 23.01, "elapsed_time": "15:23:32", "remaining_time": "2 days, 3:30:08"} +{"current_steps": 238, "total_steps": 1030, "loss": 0.4976, "lr": 7.588614425355898e-05, "epoch": 1.1550704865848114, "percentage": 23.11, "elapsed_time": "15:27:25", "remaining_time": "2 days, 3:26:11"} +{"current_steps": 239, "total_steps": 1030, "loss": 0.4907, "lr": 7.582605909852951e-05, "epoch": 1.159921176292254, "percentage": 23.2, "elapsed_time": "15:31:18", "remaining_time": "2 days, 3:22:16"} +{"current_steps": 240, "total_steps": 1030, "loss": 0.495, "lr": 7.576556247281522e-05, "epoch": 1.1647718659996968, "percentage": 23.3, "elapsed_time": "15:35:12", "remaining_time": "2 days, 3:18:24"} +{"current_steps": 241, "total_steps": 1030, "loss": 0.5027, "lr": 7.570465507123401e-05, "epoch": 1.1696225557071396, "percentage": 23.4, "elapsed_time": "15:39:06", "remaining_time": "2 days, 3:14:29"} +{"current_steps": 242, "total_steps": 1030, "loss": 0.4909, "lr": 7.564333759332167e-05, "epoch": 1.1744732454145823, "percentage": 23.5, "elapsed_time": "15:42:59", "remaining_time": "2 days, 3:10:33"} +{"current_steps": 243, "total_steps": 1030, "loss": 0.4951, "lr": 7.558161074332379e-05, "epoch": 1.1793239351220253, "percentage": 23.59, "elapsed_time": "15:46:52", "remaining_time": "2 days, 3:06:38"} +{"current_steps": 244, "total_steps": 1030, "loss": 0.499, "lr": 7.551947523018774e-05, "epoch": 1.184174624829468, "percentage": 23.69, "elapsed_time": "15:50:46", "remaining_time": "2 days, 3:02:43"} +{"current_steps": 245, "total_steps": 1030, "loss": 0.4948, "lr": 7.54569317675544e-05, "epoch": 1.1890253145369107, "percentage": 23.79, "elapsed_time": "15:54:39", "remaining_time": "2 days, 2:58:47"} +{"current_steps": 246, "total_steps": 1030, "loss": 0.4973, "lr": 7.539398107375015e-05, "epoch": 1.1938760042443535, "percentage": 23.88, "elapsed_time": "15:58:32", "remaining_time": "2 days, 2:54:50"} +{"current_steps": 247, "total_steps": 1030, "loss": 0.4976, "lr": 7.533062387177843e-05, "epoch": 1.1987266939517962, "percentage": 23.98, "elapsed_time": "16:02:24", "remaining_time": "2 days, 2:50:52"} +{"current_steps": 248, "total_steps": 1030, "loss": 0.4975, "lr": 7.526686088931156e-05, "epoch": 1.2035773836592392, "percentage": 24.08, "elapsed_time": "16:06:18", "remaining_time": "2 days, 2:46:58"} +{"current_steps": 249, "total_steps": 1030, "loss": 0.4918, "lr": 7.520269285868235e-05, "epoch": 1.208428073366682, "percentage": 24.17, "elapsed_time": "16:10:11", "remaining_time": "2 days, 2:43:02"} +{"current_steps": 250, "total_steps": 1030, "loss": 0.4901, "lr": 7.513812051687564e-05, "epoch": 1.2132787630741246, "percentage": 24.27, "elapsed_time": "16:14:04", "remaining_time": "2 days, 2:39:06"} +{"current_steps": 251, "total_steps": 1030, "loss": 0.4888, "lr": 7.507314460551993e-05, "epoch": 1.2181294527815674, "percentage": 24.37, "elapsed_time": "16:17:58", "remaining_time": "2 days, 2:35:13"} +{"current_steps": 252, "total_steps": 1030, "loss": 0.4933, "lr": 7.500776587087878e-05, "epoch": 1.22298014248901, "percentage": 24.47, "elapsed_time": "16:21:51", "remaining_time": "2 days, 2:31:18"} +{"current_steps": 253, "total_steps": 1030, "loss": 0.4805, "lr": 7.494198506384229e-05, "epoch": 1.2278308321964528, "percentage": 24.56, "elapsed_time": "16:25:44", "remaining_time": "2 days, 2:27:22"} +{"current_steps": 254, "total_steps": 1030, "loss": 0.5025, "lr": 7.487580293991844e-05, "epoch": 1.2326815219038958, "percentage": 24.66, "elapsed_time": "16:29:38", "remaining_time": "2 days, 2:23:27"} +{"current_steps": 255, "total_steps": 1030, "loss": 0.4975, "lr": 7.480922025922443e-05, "epoch": 1.2375322116113385, "percentage": 24.76, "elapsed_time": "16:33:33", "remaining_time": "2 days, 2:19:37"} +{"current_steps": 256, "total_steps": 1030, "loss": 0.4928, "lr": 7.474223778647796e-05, "epoch": 1.2423829013187813, "percentage": 24.85, "elapsed_time": "16:37:27", "remaining_time": "2 days, 2:15:45"} +{"current_steps": 257, "total_steps": 1030, "loss": 0.4912, "lr": 7.467485629098842e-05, "epoch": 1.247233591026224, "percentage": 24.95, "elapsed_time": "16:41:20", "remaining_time": "2 days, 2:11:48"} +{"current_steps": 258, "total_steps": 1030, "loss": 0.4979, "lr": 7.460707654664807e-05, "epoch": 1.252084280733667, "percentage": 25.05, "elapsed_time": "16:45:13", "remaining_time": "2 days, 2:07:54"} +{"current_steps": 259, "total_steps": 1030, "loss": 0.4891, "lr": 7.453889933192316e-05, "epoch": 1.2569349704411095, "percentage": 25.15, "elapsed_time": "16:49:07", "remaining_time": "2 days, 2:03:59"} +{"current_steps": 260, "total_steps": 1030, "loss": 0.4871, "lr": 7.447032542984502e-05, "epoch": 1.2617856601485524, "percentage": 25.24, "elapsed_time": "16:53:00", "remaining_time": "2 days, 2:00:04"} +{"current_steps": 261, "total_steps": 1030, "loss": 0.4854, "lr": 7.440135562800093e-05, "epoch": 1.2666363498559952, "percentage": 25.34, "elapsed_time": "16:56:54", "remaining_time": "2 days, 1:56:09"} +{"current_steps": 262, "total_steps": 1030, "loss": 0.4984, "lr": 7.433199071852526e-05, "epoch": 1.271487039563438, "percentage": 25.44, "elapsed_time": "17:00:47", "remaining_time": "2 days, 1:52:13"} +{"current_steps": 263, "total_steps": 1030, "loss": 0.4894, "lr": 7.426223149809023e-05, "epoch": 1.2763377292708806, "percentage": 25.53, "elapsed_time": "17:04:40", "remaining_time": "2 days, 1:48:17"} +{"current_steps": 264, "total_steps": 1030, "loss": 0.4855, "lr": 7.419207876789685e-05, "epoch": 1.2811884189783234, "percentage": 25.63, "elapsed_time": "17:08:32", "remaining_time": "2 days, 1:44:20"} +{"current_steps": 265, "total_steps": 1030, "loss": 0.4897, "lr": 7.412153333366567e-05, "epoch": 1.2860391086857663, "percentage": 25.73, "elapsed_time": "17:12:26", "remaining_time": "2 days, 1:40:26"} +{"current_steps": 266, "total_steps": 1030, "loss": 0.5014, "lr": 7.405059600562751e-05, "epoch": 1.290889798393209, "percentage": 25.83, "elapsed_time": "17:16:19", "remaining_time": "2 days, 1:36:31"} +{"current_steps": 267, "total_steps": 1030, "loss": 0.5003, "lr": 7.397926759851425e-05, "epoch": 1.2957404881006518, "percentage": 25.92, "elapsed_time": "17:20:12", "remaining_time": "2 days, 1:32:35"} +{"current_steps": 268, "total_steps": 1030, "loss": 0.4981, "lr": 7.390754893154933e-05, "epoch": 1.3005911778080945, "percentage": 26.02, "elapsed_time": "17:24:06", "remaining_time": "2 days, 1:28:40"} +{"current_steps": 269, "total_steps": 1030, "loss": 0.4991, "lr": 7.383544082843846e-05, "epoch": 1.3054418675155373, "percentage": 26.12, "elapsed_time": "17:27:59", "remaining_time": "2 days, 1:24:45"} +{"current_steps": 270, "total_steps": 1030, "loss": 0.4949, "lr": 7.376294411736009e-05, "epoch": 1.3102925572229802, "percentage": 26.21, "elapsed_time": "17:31:52", "remaining_time": "2 days, 1:20:51"} +{"current_steps": 271, "total_steps": 1030, "loss": 0.4967, "lr": 7.369005963095596e-05, "epoch": 1.315143246930423, "percentage": 26.31, "elapsed_time": "17:35:46", "remaining_time": "2 days, 1:16:55"} +{"current_steps": 272, "total_steps": 1030, "loss": 0.4946, "lr": 7.361678820632145e-05, "epoch": 1.3199939366378657, "percentage": 26.41, "elapsed_time": "17:39:40", "remaining_time": "2 days, 1:13:03"} +{"current_steps": 273, "total_steps": 1030, "loss": 0.4899, "lr": 7.354313068499607e-05, "epoch": 1.3248446263453084, "percentage": 26.5, "elapsed_time": "17:43:33", "remaining_time": "2 days, 1:09:09"} +{"current_steps": 274, "total_steps": 1030, "loss": 0.497, "lr": 7.346908791295369e-05, "epoch": 1.3296953160527512, "percentage": 26.6, "elapsed_time": "17:47:27", "remaining_time": "2 days, 1:05:14"} +{"current_steps": 275, "total_steps": 1030, "loss": 0.4858, "lr": 7.339466074059292e-05, "epoch": 1.334546005760194, "percentage": 26.7, "elapsed_time": "17:51:19", "remaining_time": "2 days, 1:01:17"} +{"current_steps": 276, "total_steps": 1030, "loss": 0.4993, "lr": 7.331985002272726e-05, "epoch": 1.3393966954676368, "percentage": 26.8, "elapsed_time": "17:55:12", "remaining_time": "2 days, 0:57:22"} +{"current_steps": 277, "total_steps": 1030, "loss": 0.4868, "lr": 7.324465661857534e-05, "epoch": 1.3442473851750796, "percentage": 26.89, "elapsed_time": "17:59:06", "remaining_time": "2 days, 0:53:27"} +{"current_steps": 278, "total_steps": 1030, "loss": 0.4928, "lr": 7.316908139175105e-05, "epoch": 1.3490980748825223, "percentage": 26.99, "elapsed_time": "18:03:00", "remaining_time": "2 days, 0:49:34"} +{"current_steps": 279, "total_steps": 1030, "loss": 0.4909, "lr": 7.309312521025356e-05, "epoch": 1.353948764589965, "percentage": 27.09, "elapsed_time": "18:06:54", "remaining_time": "2 days, 0:45:41"} +{"current_steps": 280, "total_steps": 1030, "loss": 0.4906, "lr": 7.301678894645742e-05, "epoch": 1.358799454297408, "percentage": 27.18, "elapsed_time": "18:10:48", "remaining_time": "2 days, 0:41:47"} +{"current_steps": 281, "total_steps": 1030, "loss": 0.4942, "lr": 7.294007347710251e-05, "epoch": 1.3636501440048507, "percentage": 27.28, "elapsed_time": "18:14:40", "remaining_time": "2 days, 0:37:49"} +{"current_steps": 282, "total_steps": 1030, "loss": 0.4826, "lr": 7.286297968328397e-05, "epoch": 1.3685008337122935, "percentage": 27.38, "elapsed_time": "18:18:34", "remaining_time": "2 days, 0:33:55"} +{"current_steps": 283, "total_steps": 1030, "loss": 0.4953, "lr": 7.27855084504421e-05, "epoch": 1.3733515234197362, "percentage": 27.48, "elapsed_time": "18:22:27", "remaining_time": "2 days, 0:30:00"} +{"current_steps": 284, "total_steps": 1030, "loss": 0.4901, "lr": 7.270766066835217e-05, "epoch": 1.378202213127179, "percentage": 27.57, "elapsed_time": "18:26:20", "remaining_time": "2 days, 0:26:05"} +{"current_steps": 285, "total_steps": 1030, "loss": 0.4893, "lr": 7.262943723111419e-05, "epoch": 1.383052902834622, "percentage": 27.67, "elapsed_time": "18:30:13", "remaining_time": "2 days, 0:22:09"} +{"current_steps": 286, "total_steps": 1030, "loss": 0.4887, "lr": 7.255083903714266e-05, "epoch": 1.3879035925420646, "percentage": 27.77, "elapsed_time": "18:34:07", "remaining_time": "2 days, 0:18:16"} +{"current_steps": 287, "total_steps": 1030, "loss": 0.4852, "lr": 7.247186698915625e-05, "epoch": 1.3927542822495074, "percentage": 27.86, "elapsed_time": "18:38:00", "remaining_time": "2 days, 0:14:22"} +{"current_steps": 288, "total_steps": 1030, "loss": 0.4808, "lr": 7.239252199416749e-05, "epoch": 1.39760497195695, "percentage": 27.96, "elapsed_time": "18:41:54", "remaining_time": "2 days, 0:10:27"} +{"current_steps": 289, "total_steps": 1030, "loss": 0.4813, "lr": 7.23128049634722e-05, "epoch": 1.4024556616643928, "percentage": 28.06, "elapsed_time": "18:45:46", "remaining_time": "2 days, 0:06:31"} +{"current_steps": 290, "total_steps": 1030, "loss": 0.4811, "lr": 7.223271681263916e-05, "epoch": 1.4073063513718358, "percentage": 28.16, "elapsed_time": "18:49:40", "remaining_time": "2 days, 0:02:37"} +{"current_steps": 291, "total_steps": 1030, "loss": 0.489, "lr": 7.215225846149957e-05, "epoch": 1.4121570410792785, "percentage": 28.25, "elapsed_time": "18:53:34", "remaining_time": "1 day, 23:58:43"} +{"current_steps": 292, "total_steps": 1030, "loss": 0.4855, "lr": 7.207143083413643e-05, "epoch": 1.4170077307867213, "percentage": 28.35, "elapsed_time": "18:57:27", "remaining_time": "1 day, 23:54:48"} +{"current_steps": 293, "total_steps": 1030, "loss": 0.4863, "lr": 7.1990234858874e-05, "epoch": 1.421858420494164, "percentage": 28.45, "elapsed_time": "19:01:20", "remaining_time": "1 day, 23:50:51"} +{"current_steps": 294, "total_steps": 1030, "loss": 0.4906, "lr": 7.190867146826707e-05, "epoch": 1.4267091102016067, "percentage": 28.54, "elapsed_time": "19:05:12", "remaining_time": "1 day, 23:46:54"} +{"current_steps": 295, "total_steps": 1030, "loss": 0.4842, "lr": 7.182674159909031e-05, "epoch": 1.4315597999090497, "percentage": 28.64, "elapsed_time": "19:09:06", "remaining_time": "1 day, 23:43:01"} +{"current_steps": 296, "total_steps": 1030, "loss": 0.4927, "lr": 7.174444619232745e-05, "epoch": 1.4364104896164924, "percentage": 28.74, "elapsed_time": "19:12:59", "remaining_time": "1 day, 23:39:06"} +{"current_steps": 297, "total_steps": 1030, "loss": 0.4906, "lr": 7.166178619316056e-05, "epoch": 1.4412611793239352, "percentage": 28.83, "elapsed_time": "19:16:52", "remaining_time": "1 day, 23:35:10"} +{"current_steps": 298, "total_steps": 1030, "loss": 0.4844, "lr": 7.157876255095906e-05, "epoch": 1.446111869031378, "percentage": 28.93, "elapsed_time": "19:20:45", "remaining_time": "1 day, 23:31:15"} +{"current_steps": 299, "total_steps": 1030, "loss": 0.488, "lr": 7.149537621926895e-05, "epoch": 1.4509625587388206, "percentage": 29.03, "elapsed_time": "19:24:38", "remaining_time": "1 day, 23:27:20"} +{"current_steps": 300, "total_steps": 1030, "loss": 0.4877, "lr": 7.14116281558018e-05, "epoch": 1.4558132484462636, "percentage": 29.13, "elapsed_time": "19:28:32", "remaining_time": "1 day, 23:23:26"} +{"current_steps": 301, "total_steps": 1030, "loss": 0.4971, "lr": 7.132751932242376e-05, "epoch": 1.460663938153706, "percentage": 29.22, "elapsed_time": "19:32:25", "remaining_time": "1 day, 23:19:31"} +{"current_steps": 302, "total_steps": 1030, "loss": 0.4864, "lr": 7.124305068514444e-05, "epoch": 1.465514627861149, "percentage": 29.32, "elapsed_time": "19:36:18", "remaining_time": "1 day, 23:15:35"} +{"current_steps": 303, "total_steps": 1030, "loss": 0.4861, "lr": 7.1158223214106e-05, "epoch": 1.4703653175685918, "percentage": 29.42, "elapsed_time": "19:40:12", "remaining_time": "1 day, 23:11:42"} +{"current_steps": 304, "total_steps": 1030, "loss": 0.482, "lr": 7.107303788357177e-05, "epoch": 1.4752160072760345, "percentage": 29.51, "elapsed_time": "19:44:04", "remaining_time": "1 day, 23:07:44"} +{"current_steps": 305, "total_steps": 1030, "loss": 0.4834, "lr": 7.098749567191527e-05, "epoch": 1.4800666969834773, "percentage": 29.61, "elapsed_time": "19:48:04", "remaining_time": "1 day, 23:04:06"} +{"current_steps": 306, "total_steps": 1030, "loss": 0.4881, "lr": 7.090159756160886e-05, "epoch": 1.48491738669092, "percentage": 29.71, "elapsed_time": "19:51:57", "remaining_time": "1 day, 23:00:11"} +{"current_steps": 307, "total_steps": 1030, "loss": 0.4854, "lr": 7.081534453921242e-05, "epoch": 1.489768076398363, "percentage": 29.81, "elapsed_time": "19:55:50", "remaining_time": "1 day, 22:56:16"} +{"current_steps": 308, "total_steps": 1030, "loss": 0.492, "lr": 7.072873759536217e-05, "epoch": 1.4946187661058057, "percentage": 29.9, "elapsed_time": "19:59:44", "remaining_time": "1 day, 22:52:21"} +{"current_steps": 309, "total_steps": 1030, "loss": 0.4795, "lr": 7.064177772475912e-05, "epoch": 1.4994694558132484, "percentage": 30.0, "elapsed_time": "20:03:36", "remaining_time": "1 day, 22:48:26"} +{"current_steps": 310, "total_steps": 1030, "loss": 0.4885, "lr": 7.05544659261578e-05, "epoch": 1.5043201455206914, "percentage": 30.1, "elapsed_time": "20:07:30", "remaining_time": "1 day, 22:44:31"} +{"current_steps": 311, "total_steps": 1030, "loss": 0.486, "lr": 7.046680320235466e-05, "epoch": 1.5091708352281339, "percentage": 30.19, "elapsed_time": "20:11:23", "remaining_time": "1 day, 22:40:36"} +{"current_steps": 312, "total_steps": 1030, "loss": 0.4881, "lr": 7.037879056017663e-05, "epoch": 1.5140215249355768, "percentage": 30.29, "elapsed_time": "20:15:16", "remaining_time": "1 day, 22:36:40"} +{"current_steps": 313, "total_steps": 1030, "loss": 0.4829, "lr": 7.029042901046952e-05, "epoch": 1.5188722146430196, "percentage": 30.39, "elapsed_time": "20:19:08", "remaining_time": "1 day, 22:32:43"} +{"current_steps": 314, "total_steps": 1030, "loss": 0.4873, "lr": 7.020171956808645e-05, "epoch": 1.5237229043504623, "percentage": 30.49, "elapsed_time": "20:23:02", "remaining_time": "1 day, 22:28:50"} +{"current_steps": 315, "total_steps": 1030, "loss": 0.4966, "lr": 7.011266325187615e-05, "epoch": 1.5285735940579053, "percentage": 30.58, "elapsed_time": "20:26:55", "remaining_time": "1 day, 22:24:55"} +{"current_steps": 316, "total_steps": 1030, "loss": 0.4869, "lr": 7.002326108467129e-05, "epoch": 1.5334242837653478, "percentage": 30.68, "elapsed_time": "20:30:48", "remaining_time": "1 day, 22:20:59"} +{"current_steps": 317, "total_steps": 1030, "loss": 0.4777, "lr": 6.993351409327672e-05, "epoch": 1.5382749734727907, "percentage": 30.78, "elapsed_time": "20:34:42", "remaining_time": "1 day, 22:17:06"} +{"current_steps": 318, "total_steps": 1030, "loss": 0.4922, "lr": 6.984342330845764e-05, "epoch": 1.5431256631802335, "percentage": 30.87, "elapsed_time": "20:38:35", "remaining_time": "1 day, 22:13:10"} +{"current_steps": 319, "total_steps": 1030, "loss": 0.4961, "lr": 6.975298976492785e-05, "epoch": 1.5479763528876762, "percentage": 30.97, "elapsed_time": "20:42:28", "remaining_time": "1 day, 22:09:16"} +{"current_steps": 320, "total_steps": 1030, "loss": 0.4893, "lr": 6.966221450133779e-05, "epoch": 1.552827042595119, "percentage": 31.07, "elapsed_time": "20:46:22", "remaining_time": "1 day, 22:05:23"} +{"current_steps": 321, "total_steps": 1030, "loss": 0.4925, "lr": 6.957109856026261e-05, "epoch": 1.5576777323025617, "percentage": 31.17, "elapsed_time": "20:50:15", "remaining_time": "1 day, 22:01:29"} +{"current_steps": 322, "total_steps": 1030, "loss": 0.4765, "lr": 6.94796429881903e-05, "epoch": 1.5625284220100046, "percentage": 31.26, "elapsed_time": "20:54:08", "remaining_time": "1 day, 21:57:33"} +{"current_steps": 323, "total_steps": 1030, "loss": 0.4878, "lr": 6.938784883550948e-05, "epoch": 1.5673791117174474, "percentage": 31.36, "elapsed_time": "20:58:02", "remaining_time": "1 day, 21:53:39"} +{"current_steps": 324, "total_steps": 1030, "loss": 0.4858, "lr": 6.929571715649755e-05, "epoch": 1.57222980142489, "percentage": 31.46, "elapsed_time": "21:01:55", "remaining_time": "1 day, 21:49:46"} +{"current_steps": 325, "total_steps": 1030, "loss": 0.4916, "lr": 6.920324900930842e-05, "epoch": 1.5770804911323328, "percentage": 31.55, "elapsed_time": "21:05:49", "remaining_time": "1 day, 21:45:51"} +{"current_steps": 326, "total_steps": 1030, "loss": 0.4831, "lr": 6.911044545596042e-05, "epoch": 1.5819311808397756, "percentage": 31.65, "elapsed_time": "21:09:42", "remaining_time": "1 day, 21:41:56"} +{"current_steps": 327, "total_steps": 1030, "loss": 0.4903, "lr": 6.901730756232411e-05, "epoch": 1.5867818705472185, "percentage": 31.75, "elapsed_time": "21:13:35", "remaining_time": "1 day, 21:38:00"} +{"current_steps": 328, "total_steps": 1030, "loss": 0.4943, "lr": 6.892383639811005e-05, "epoch": 1.591632560254661, "percentage": 31.84, "elapsed_time": "21:17:28", "remaining_time": "1 day, 21:34:05"} +{"current_steps": 329, "total_steps": 1030, "loss": 0.4835, "lr": 6.883003303685644e-05, "epoch": 1.596483249962104, "percentage": 31.94, "elapsed_time": "21:21:20", "remaining_time": "1 day, 21:30:09"} +{"current_steps": 330, "total_steps": 1030, "loss": 0.4871, "lr": 6.87358985559169e-05, "epoch": 1.6013339396695467, "percentage": 32.04, "elapsed_time": "21:25:14", "remaining_time": "1 day, 21:26:15"} +{"current_steps": 331, "total_steps": 1030, "loss": 0.4947, "lr": 6.864143403644797e-05, "epoch": 1.6061846293769895, "percentage": 32.14, "elapsed_time": "21:29:07", "remaining_time": "1 day, 21:22:21"} +{"current_steps": 332, "total_steps": 1030, "loss": 0.4856, "lr": 6.85466405633968e-05, "epoch": 1.6110353190844324, "percentage": 32.23, "elapsed_time": "21:33:00", "remaining_time": "1 day, 21:18:25"} +{"current_steps": 333, "total_steps": 1030, "loss": 0.4783, "lr": 6.845151922548865e-05, "epoch": 1.615886008791875, "percentage": 32.33, "elapsed_time": "21:36:54", "remaining_time": "1 day, 21:14:32"} +{"current_steps": 334, "total_steps": 1030, "loss": 0.4784, "lr": 6.835607111521439e-05, "epoch": 1.620736698499318, "percentage": 32.43, "elapsed_time": "21:40:47", "remaining_time": "1 day, 21:10:37"} +{"current_steps": 335, "total_steps": 1030, "loss": 0.494, "lr": 6.826029732881793e-05, "epoch": 1.6255873882067606, "percentage": 32.52, "elapsed_time": "21:44:40", "remaining_time": "1 day, 21:06:42"} +{"current_steps": 336, "total_steps": 1030, "loss": 0.4881, "lr": 6.816419896628363e-05, "epoch": 1.6304380779142034, "percentage": 32.62, "elapsed_time": "21:48:34", "remaining_time": "1 day, 21:02:49"} +{"current_steps": 337, "total_steps": 1030, "loss": 0.4814, "lr": 6.806777713132374e-05, "epoch": 1.6352887676216463, "percentage": 32.72, "elapsed_time": "21:52:27", "remaining_time": "1 day, 20:58:55"} +{"current_steps": 338, "total_steps": 1030, "loss": 0.4893, "lr": 6.79710329313656e-05, "epoch": 1.6401394573290888, "percentage": 32.82, "elapsed_time": "21:56:20", "remaining_time": "1 day, 20:55:00"} +{"current_steps": 339, "total_steps": 1030, "loss": 0.4745, "lr": 6.787396747753903e-05, "epoch": 1.6449901470365318, "percentage": 32.91, "elapsed_time": "22:00:14", "remaining_time": "1 day, 20:51:06"} +{"current_steps": 340, "total_steps": 1030, "loss": 0.4763, "lr": 6.777658188466354e-05, "epoch": 1.6498408367439745, "percentage": 33.01, "elapsed_time": "22:04:08", "remaining_time": "1 day, 20:47:13"} +{"current_steps": 341, "total_steps": 1030, "loss": 0.4926, "lr": 6.767887727123544e-05, "epoch": 1.6546915264514173, "percentage": 33.11, "elapsed_time": "22:08:00", "remaining_time": "1 day, 20:43:16"} +{"current_steps": 342, "total_steps": 1030, "loss": 0.4825, "lr": 6.758085475941516e-05, "epoch": 1.6595422161588602, "percentage": 33.2, "elapsed_time": "22:11:54", "remaining_time": "1 day, 20:39:22"} +{"current_steps": 343, "total_steps": 1030, "loss": 0.476, "lr": 6.748251547501418e-05, "epoch": 1.6643929058663027, "percentage": 33.3, "elapsed_time": "22:15:47", "remaining_time": "1 day, 20:35:28"} +{"current_steps": 344, "total_steps": 1030, "loss": 0.4822, "lr": 6.738386054748226e-05, "epoch": 1.6692435955737457, "percentage": 33.4, "elapsed_time": "22:19:41", "remaining_time": "1 day, 20:31:34"} +{"current_steps": 345, "total_steps": 1030, "loss": 0.4898, "lr": 6.728489110989434e-05, "epoch": 1.6740942852811884, "percentage": 33.5, "elapsed_time": "22:23:34", "remaining_time": "1 day, 20:27:41"} +{"current_steps": 346, "total_steps": 1030, "loss": 0.4779, "lr": 6.718560829893762e-05, "epoch": 1.6789449749886312, "percentage": 33.59, "elapsed_time": "22:27:28", "remaining_time": "1 day, 20:23:48"} +{"current_steps": 347, "total_steps": 1030, "loss": 0.4871, "lr": 6.708601325489844e-05, "epoch": 1.6837956646960741, "percentage": 33.69, "elapsed_time": "22:31:22", "remaining_time": "1 day, 20:19:54"} +{"current_steps": 348, "total_steps": 1030, "loss": 0.4851, "lr": 6.698610712164924e-05, "epoch": 1.6886463544035166, "percentage": 33.79, "elapsed_time": "22:35:16", "remaining_time": "1 day, 20:16:01"} +{"current_steps": 349, "total_steps": 1030, "loss": 0.473, "lr": 6.688589104663536e-05, "epoch": 1.6934970441109596, "percentage": 33.88, "elapsed_time": "22:39:08", "remaining_time": "1 day, 20:12:05"} +{"current_steps": 350, "total_steps": 1030, "loss": 0.4779, "lr": 6.67853661808619e-05, "epoch": 1.6983477338184023, "percentage": 33.98, "elapsed_time": "22:43:02", "remaining_time": "1 day, 20:08:11"} +{"current_steps": 351, "total_steps": 1030, "loss": 0.4841, "lr": 6.668453367888052e-05, "epoch": 1.703198423525845, "percentage": 34.08, "elapsed_time": "22:46:56", "remaining_time": "1 day, 20:04:19"} +{"current_steps": 352, "total_steps": 1030, "loss": 0.4791, "lr": 6.658339469877613e-05, "epoch": 1.708049113233288, "percentage": 34.17, "elapsed_time": "22:50:50", "remaining_time": "1 day, 20:00:25"} +{"current_steps": 353, "total_steps": 1030, "loss": 0.4826, "lr": 6.64819504021536e-05, "epoch": 1.7128998029407305, "percentage": 34.27, "elapsed_time": "22:54:44", "remaining_time": "1 day, 19:56:32"} +{"current_steps": 354, "total_steps": 1030, "loss": 0.4782, "lr": 6.638020195412448e-05, "epoch": 1.7177504926481735, "percentage": 34.37, "elapsed_time": "22:58:36", "remaining_time": "1 day, 19:52:36"} +{"current_steps": 355, "total_steps": 1030, "loss": 0.4933, "lr": 6.627815052329354e-05, "epoch": 1.7226011823556162, "percentage": 34.47, "elapsed_time": "23:02:30", "remaining_time": "1 day, 19:48:42"} +{"current_steps": 356, "total_steps": 1030, "loss": 0.4881, "lr": 6.617579728174535e-05, "epoch": 1.727451872063059, "percentage": 34.56, "elapsed_time": "23:06:23", "remaining_time": "1 day, 19:44:47"} +{"current_steps": 357, "total_steps": 1030, "loss": 0.4795, "lr": 6.60731434050309e-05, "epoch": 1.732302561770502, "percentage": 34.66, "elapsed_time": "23:10:16", "remaining_time": "1 day, 19:40:53"} +{"current_steps": 358, "total_steps": 1030, "loss": 0.4829, "lr": 6.597019007215401e-05, "epoch": 1.7371532514779444, "percentage": 34.76, "elapsed_time": "23:14:10", "remaining_time": "1 day, 19:36:59"} +{"current_steps": 359, "total_steps": 1030, "loss": 0.4773, "lr": 6.586693846555788e-05, "epoch": 1.7420039411853874, "percentage": 34.85, "elapsed_time": "23:18:03", "remaining_time": "1 day, 19:33:04"} +{"current_steps": 360, "total_steps": 1030, "loss": 0.48, "lr": 6.576338977111134e-05, "epoch": 1.74685463089283, "percentage": 34.95, "elapsed_time": "23:21:56", "remaining_time": "1 day, 19:29:09"} +{"current_steps": 361, "total_steps": 1030, "loss": 0.4766, "lr": 6.565954517809543e-05, "epoch": 1.7517053206002728, "percentage": 35.05, "elapsed_time": "23:25:48", "remaining_time": "1 day, 19:25:14"} +{"current_steps": 362, "total_steps": 1030, "loss": 0.4782, "lr": 6.555540587918968e-05, "epoch": 1.7565560103077156, "percentage": 35.15, "elapsed_time": "23:29:43", "remaining_time": "1 day, 19:21:22"} +{"current_steps": 363, "total_steps": 1030, "loss": 0.4808, "lr": 6.545097307045831e-05, "epoch": 1.7614067000151583, "percentage": 35.24, "elapsed_time": "23:33:36", "remaining_time": "1 day, 19:17:27"} +{"current_steps": 364, "total_steps": 1030, "loss": 0.4852, "lr": 6.534624795133662e-05, "epoch": 1.7662573897226013, "percentage": 35.34, "elapsed_time": "23:37:30", "remaining_time": "1 day, 19:13:34"} +{"current_steps": 365, "total_steps": 1030, "loss": 0.4785, "lr": 6.524123172461711e-05, "epoch": 1.771108079430044, "percentage": 35.44, "elapsed_time": "23:41:24", "remaining_time": "1 day, 19:09:40"} +{"current_steps": 366, "total_steps": 1030, "loss": 0.4789, "lr": 6.51359255964358e-05, "epoch": 1.7759587691374867, "percentage": 35.53, "elapsed_time": "23:45:18", "remaining_time": "1 day, 19:05:47"} +{"current_steps": 367, "total_steps": 1030, "loss": 0.4762, "lr": 6.503033077625824e-05, "epoch": 1.7808094588449295, "percentage": 35.63, "elapsed_time": "23:49:12", "remaining_time": "1 day, 19:01:55"} +{"current_steps": 368, "total_steps": 1030, "loss": 0.4837, "lr": 6.492444847686566e-05, "epoch": 1.7856601485523722, "percentage": 35.73, "elapsed_time": "23:53:06", "remaining_time": "1 day, 18:58:02"} +{"current_steps": 207, "total_steps": 1030, "loss": 0.5126, "lr": 7.754112497045198e-05, "epoch": 1.0048506897074427, "percentage": 20.1, "elapsed_time": "0:04:10", "remaining_time": "0:16:37"} +{"current_steps": 208, "total_steps": 1030, "loss": 0.5093, "lr": 7.749411394084931e-05, "epoch": 1.0097013794148855, "percentage": 20.19, "elapsed_time": "0:08:04", "remaining_time": "0:31:56"} +{"current_steps": 209, "total_steps": 1030, "loss": 0.5129, "lr": 7.744667228256102e-05, "epoch": 1.0145520691223284, "percentage": 20.29, "elapsed_time": "0:11:58", "remaining_time": "0:47:01"} +{"current_steps": 210, "total_steps": 1030, "loss": 0.504, "lr": 7.739880054046567e-05, "epoch": 1.0194027588297712, "percentage": 20.39, "elapsed_time": "0:15:51", "remaining_time": "1:01:56"} +{"current_steps": 211, "total_steps": 1030, "loss": 0.5008, "lr": 7.735049926438143e-05, "epoch": 1.024253448537214, "percentage": 20.49, "elapsed_time": "0:19:45", "remaining_time": "1:16:40"} +{"current_steps": 212, "total_steps": 1030, "loss": 0.5039, "lr": 7.730176900905978e-05, "epoch": 1.0291041382446566, "percentage": 20.58, "elapsed_time": "0:23:38", "remaining_time": "1:31:14"} +{"current_steps": 213, "total_steps": 1030, "loss": 0.4987, "lr": 7.725261033417914e-05, "epoch": 1.0339548279520994, "percentage": 20.68, "elapsed_time": "0:27:31", "remaining_time": "1:45:36"} +{"current_steps": 214, "total_steps": 1030, "loss": 0.5082, "lr": 7.720302380433838e-05, "epoch": 1.0388055176595423, "percentage": 20.78, "elapsed_time": "0:31:25", "remaining_time": "1:59:48"} +{"current_steps": 215, "total_steps": 1030, "loss": 0.4903, "lr": 7.715300998905045e-05, "epoch": 1.043656207366985, "percentage": 20.87, "elapsed_time": "0:35:19", "remaining_time": "2:13:53"} +{"current_steps": 216, "total_steps": 1030, "loss": 0.5061, "lr": 7.710256946273572e-05, "epoch": 1.0485068970744278, "percentage": 20.97, "elapsed_time": "0:39:13", "remaining_time": "2:27:48"} +{"current_steps": 217, "total_steps": 1030, "loss": 0.4923, "lr": 7.705170280471546e-05, "epoch": 1.0533575867818705, "percentage": 21.07, "elapsed_time": "0:43:07", "remaining_time": "2:41:33"} +{"current_steps": 218, "total_steps": 1030, "loss": 0.4958, "lr": 7.700041059920516e-05, "epoch": 1.0582082764893133, "percentage": 21.17, "elapsed_time": "0:47:00", "remaining_time": "2:55:07"} +{"current_steps": 219, "total_steps": 1030, "loss": 0.4949, "lr": 7.694869343530781e-05, "epoch": 1.0630589661967562, "percentage": 21.26, "elapsed_time": "0:50:54", "remaining_time": "3:08:30"} +{"current_steps": 220, "total_steps": 1030, "loss": 0.4958, "lr": 7.689655190700719e-05, "epoch": 1.067909655904199, "percentage": 21.36, "elapsed_time": "0:54:47", "remaining_time": "3:21:45"} +{"current_steps": 221, "total_steps": 1030, "loss": 0.5034, "lr": 7.684398661316092e-05, "epoch": 1.0727603456116417, "percentage": 21.46, "elapsed_time": "0:58:41", "remaining_time": "3:34:49"} +{"current_steps": 222, "total_steps": 1030, "loss": 0.508, "lr": 7.679099815749377e-05, "epoch": 1.0776110353190844, "percentage": 21.55, "elapsed_time": "1:02:34", "remaining_time": "3:47:46"} +{"current_steps": 223, "total_steps": 1030, "loss": 0.5012, "lr": 7.673758714859052e-05, "epoch": 1.0824617250265272, "percentage": 21.65, "elapsed_time": "1:06:28", "remaining_time": "4:00:34"} +{"current_steps": 224, "total_steps": 1030, "loss": 0.5003, "lr": 7.668375419988918e-05, "epoch": 1.08731241473397, "percentage": 21.75, "elapsed_time": "1:10:22", "remaining_time": "4:13:12"} +{"current_steps": 225, "total_steps": 1030, "loss": 0.4984, "lr": 7.662949992967375e-05, "epoch": 1.0921631044414128, "percentage": 21.84, "elapsed_time": "1:14:15", "remaining_time": "4:25:41"} +{"current_steps": 226, "total_steps": 1030, "loss": 0.499, "lr": 7.657482496106725e-05, "epoch": 1.0970137941488556, "percentage": 21.94, "elapsed_time": "1:18:09", "remaining_time": "4:38:02"} +{"current_steps": 227, "total_steps": 1030, "loss": 0.4964, "lr": 7.651972992202449e-05, "epoch": 1.1018644838562983, "percentage": 22.04, "elapsed_time": "1:22:04", "remaining_time": "4:50:18"} +{"current_steps": 228, "total_steps": 1030, "loss": 0.501, "lr": 7.646421544532492e-05, "epoch": 1.106715173563741, "percentage": 22.14, "elapsed_time": "1:25:57", "remaining_time": "5:02:20"} +{"current_steps": 229, "total_steps": 1030, "loss": 0.5019, "lr": 7.640828216856532e-05, "epoch": 1.1115658632711838, "percentage": 22.23, "elapsed_time": "1:29:51", "remaining_time": "5:14:17"} +{"current_steps": 230, "total_steps": 1030, "loss": 0.4954, "lr": 7.635193073415246e-05, "epoch": 1.1164165529786267, "percentage": 22.33, "elapsed_time": "1:33:45", "remaining_time": "5:26:05"} +{"current_steps": 231, "total_steps": 1030, "loss": 0.4966, "lr": 7.62951617892958e-05, "epoch": 1.1212672426860695, "percentage": 22.43, "elapsed_time": "1:37:39", "remaining_time": "5:37:46"} +{"current_steps": 232, "total_steps": 1030, "loss": 0.4869, "lr": 7.623797598599995e-05, "epoch": 1.1261179323935122, "percentage": 22.52, "elapsed_time": "1:41:32", "remaining_time": "5:49:17"} +{"current_steps": 233, "total_steps": 1030, "loss": 0.4876, "lr": 7.618037398105728e-05, "epoch": 1.130968622100955, "percentage": 22.62, "elapsed_time": "1:45:27", "remaining_time": "6:00:42"} +{"current_steps": 234, "total_steps": 1030, "loss": 0.495, "lr": 7.612235643604031e-05, "epoch": 1.1358193118083977, "percentage": 22.72, "elapsed_time": "1:49:21", "remaining_time": "6:11:58"} +{"current_steps": 235, "total_steps": 1030, "loss": 0.4953, "lr": 7.606392401729415e-05, "epoch": 1.1406700015158404, "percentage": 22.82, "elapsed_time": "1:53:15", "remaining_time": "6:23:08"} +{"current_steps": 236, "total_steps": 1030, "loss": 0.4972, "lr": 7.600507739592879e-05, "epoch": 1.1455206912232834, "percentage": 22.91, "elapsed_time": "1:57:09", "remaining_time": "6:34:09"} +{"current_steps": 237, "total_steps": 1030, "loss": 0.4957, "lr": 7.594581724781152e-05, "epoch": 1.150371380930726, "percentage": 23.01, "elapsed_time": "2:01:03", "remaining_time": "6:45:03"} +{"current_steps": 238, "total_steps": 1030, "loss": 0.4955, "lr": 7.588614425355898e-05, "epoch": 1.1552220706381688, "percentage": 23.11, "elapsed_time": "2:04:57", "remaining_time": "6:55:48"} +{"current_steps": 239, "total_steps": 1030, "loss": 0.4937, "lr": 7.582605909852951e-05, "epoch": 1.1600727603456116, "percentage": 23.2, "elapsed_time": "2:08:51", "remaining_time": "7:06:26"} +{"current_steps": 240, "total_steps": 1030, "loss": 0.4969, "lr": 7.576556247281522e-05, "epoch": 1.1649234500530543, "percentage": 23.3, "elapsed_time": "2:12:44", "remaining_time": "7:16:56"} +{"current_steps": 241, "total_steps": 1030, "loss": 0.5042, "lr": 7.570465507123401e-05, "epoch": 1.1697741397604973, "percentage": 23.4, "elapsed_time": "2:16:38", "remaining_time": "7:27:19"} +{"current_steps": 242, "total_steps": 1030, "loss": 0.4906, "lr": 7.564333759332167e-05, "epoch": 1.17462482946794, "percentage": 23.5, "elapsed_time": "2:20:31", "remaining_time": "7:37:34"} +{"current_steps": 243, "total_steps": 1030, "loss": 0.4966, "lr": 7.558161074332379e-05, "epoch": 1.1794755191753827, "percentage": 23.59, "elapsed_time": "2:24:25", "remaining_time": "7:47:43"} +{"current_steps": 244, "total_steps": 1030, "loss": 0.4997, "lr": 7.551947523018774e-05, "epoch": 1.1843262088828255, "percentage": 23.69, "elapsed_time": "2:28:19", "remaining_time": "7:57:47"} +{"current_steps": 245, "total_steps": 1030, "loss": 0.4954, "lr": 7.54569317675544e-05, "epoch": 1.1891768985902682, "percentage": 23.79, "elapsed_time": "2:32:13", "remaining_time": "8:07:43"} +{"current_steps": 246, "total_steps": 1030, "loss": 0.4979, "lr": 7.539398107375015e-05, "epoch": 1.1940275882977112, "percentage": 23.88, "elapsed_time": "2:36:07", "remaining_time": "8:17:33"} +{"current_steps": 247, "total_steps": 1030, "loss": 0.4982, "lr": 7.533062387177843e-05, "epoch": 1.198878278005154, "percentage": 23.98, "elapsed_time": "2:40:01", "remaining_time": "8:27:16"} +{"current_steps": 248, "total_steps": 1030, "loss": 0.4991, "lr": 7.526686088931156e-05, "epoch": 1.2037289677125966, "percentage": 24.08, "elapsed_time": "2:43:55", "remaining_time": "8:36:53"} +{"current_steps": 249, "total_steps": 1030, "loss": 0.4908, "lr": 7.520269285868235e-05, "epoch": 1.2085796574200394, "percentage": 24.17, "elapsed_time": "2:47:49", "remaining_time": "8:46:22"} +{"current_steps": 250, "total_steps": 1030, "loss": 0.4917, "lr": 7.513812051687564e-05, "epoch": 1.213430347127482, "percentage": 24.27, "elapsed_time": "2:51:43", "remaining_time": "8:55:46"} +{"current_steps": 251, "total_steps": 1030, "loss": 0.4898, "lr": 7.507314460551993e-05, "epoch": 1.218281036834925, "percentage": 24.37, "elapsed_time": "2:55:37", "remaining_time": "9:05:03"} +{"current_steps": 252, "total_steps": 1030, "loss": 0.4929, "lr": 7.500776587087878e-05, "epoch": 1.2231317265423678, "percentage": 24.47, "elapsed_time": "2:59:31", "remaining_time": "9:14:13"} +{"current_steps": 253, "total_steps": 1030, "loss": 0.4826, "lr": 7.494198506384229e-05, "epoch": 1.2279824162498105, "percentage": 24.56, "elapsed_time": "3:03:25", "remaining_time": "9:23:18"} +{"current_steps": 254, "total_steps": 1030, "loss": 0.5021, "lr": 7.487580293991844e-05, "epoch": 1.2328331059572533, "percentage": 24.66, "elapsed_time": "3:07:18", "remaining_time": "9:32:15"} +{"current_steps": 255, "total_steps": 1030, "loss": 0.4974, "lr": 7.480922025922443e-05, "epoch": 1.237683795664696, "percentage": 24.76, "elapsed_time": "3:11:11", "remaining_time": "9:41:04"} +{"current_steps": 256, "total_steps": 1030, "loss": 0.4934, "lr": 7.474223778647796e-05, "epoch": 1.242534485372139, "percentage": 24.85, "elapsed_time": "3:15:05", "remaining_time": "9:49:49"} +{"current_steps": 257, "total_steps": 1030, "loss": 0.4907, "lr": 7.467485629098842e-05, "epoch": 1.2473851750795817, "percentage": 24.95, "elapsed_time": "3:18:59", "remaining_time": "9:58:30"} +{"current_steps": 258, "total_steps": 1030, "loss": 0.4974, "lr": 7.460707654664807e-05, "epoch": 1.2522358647870244, "percentage": 25.05, "elapsed_time": "3:22:53", "remaining_time": "10:07:04"} +{"current_steps": 259, "total_steps": 1030, "loss": 0.4893, "lr": 7.453889933192316e-05, "epoch": 1.2570865544944672, "percentage": 25.15, "elapsed_time": "3:26:47", "remaining_time": "10:15:34"} +{"current_steps": 260, "total_steps": 1030, "loss": 0.4882, "lr": 7.447032542984502e-05, "epoch": 1.26193724420191, "percentage": 25.24, "elapsed_time": "3:30:41", "remaining_time": "10:23:57"} +{"current_steps": 261, "total_steps": 1030, "loss": 0.487, "lr": 7.440135562800093e-05, "epoch": 1.2667879339093528, "percentage": 25.34, "elapsed_time": "3:34:34", "remaining_time": "10:32:13"} +{"current_steps": 262, "total_steps": 1030, "loss": 0.4965, "lr": 7.433199071852526e-05, "epoch": 1.2716386236167956, "percentage": 25.44, "elapsed_time": "3:38:27", "remaining_time": "10:40:22"} +{"current_steps": 263, "total_steps": 1030, "loss": 0.4922, "lr": 7.426223149809023e-05, "epoch": 1.2764893133242383, "percentage": 25.53, "elapsed_time": "3:42:21", "remaining_time": "10:48:27"} +{"current_steps": 264, "total_steps": 1030, "loss": 0.4844, "lr": 7.419207876789685e-05, "epoch": 1.281340003031681, "percentage": 25.63, "elapsed_time": "3:46:15", "remaining_time": "10:56:28"} +{"current_steps": 265, "total_steps": 1030, "loss": 0.4887, "lr": 7.412153333366567e-05, "epoch": 1.2861906927391238, "percentage": 25.73, "elapsed_time": "3:50:09", "remaining_time": "11:04:24"} +{"current_steps": 266, "total_steps": 1030, "loss": 0.4974, "lr": 7.405059600562751e-05, "epoch": 1.2910413824465667, "percentage": 25.83, "elapsed_time": "3:54:03", "remaining_time": "11:12:15"} +{"current_steps": 267, "total_steps": 1030, "loss": 0.4946, "lr": 7.397926759851425e-05, "epoch": 1.2958920721540095, "percentage": 25.92, "elapsed_time": "3:57:57", "remaining_time": "11:20:00"} +{"current_steps": 268, "total_steps": 1030, "loss": 0.4914, "lr": 7.390754893154933e-05, "epoch": 1.3007427618614522, "percentage": 26.02, "elapsed_time": "4:01:51", "remaining_time": "11:27:40"} +{"current_steps": 269, "total_steps": 1030, "loss": 0.4906, "lr": 7.383544082843846e-05, "epoch": 1.305593451568895, "percentage": 26.12, "elapsed_time": "4:05:45", "remaining_time": "11:35:15"} +{"current_steps": 270, "total_steps": 1030, "loss": 0.4877, "lr": 7.376294411736009e-05, "epoch": 1.3104441412763377, "percentage": 26.21, "elapsed_time": "4:09:39", "remaining_time": "11:42:43"} +{"current_steps": 271, "total_steps": 1030, "loss": 0.4962, "lr": 7.369005963095596e-05, "epoch": 1.3152948309837806, "percentage": 26.31, "elapsed_time": "4:13:33", "remaining_time": "11:50:09"} +{"current_steps": 272, "total_steps": 1030, "loss": 0.4918, "lr": 7.361678820632145e-05, "epoch": 1.3201455206912232, "percentage": 26.41, "elapsed_time": "4:17:27", "remaining_time": "11:57:28"} +{"current_steps": 273, "total_steps": 1030, "loss": 0.4892, "lr": 7.354313068499607e-05, "epoch": 1.324996210398666, "percentage": 26.5, "elapsed_time": "4:21:21", "remaining_time": "12:04:42"} +{"current_steps": 274, "total_steps": 1030, "loss": 0.495, "lr": 7.346908791295369e-05, "epoch": 1.3298469001061088, "percentage": 26.6, "elapsed_time": "4:25:15", "remaining_time": "12:11:52"} +{"current_steps": 275, "total_steps": 1030, "loss": 0.4862, "lr": 7.339466074059292e-05, "epoch": 1.3346975898135516, "percentage": 26.7, "elapsed_time": "4:29:09", "remaining_time": "12:18:57"} +{"current_steps": 276, "total_steps": 1030, "loss": 0.4986, "lr": 7.331985002272726e-05, "epoch": 1.3395482795209943, "percentage": 26.8, "elapsed_time": "4:33:02", "remaining_time": "12:25:56"} +{"current_steps": 277, "total_steps": 1030, "loss": 0.4868, "lr": 7.324465661857534e-05, "epoch": 1.344398969228437, "percentage": 26.89, "elapsed_time": "4:36:56", "remaining_time": "12:32:49"} +{"current_steps": 278, "total_steps": 1030, "loss": 0.4886, "lr": 7.316908139175105e-05, "epoch": 1.34924965893588, "percentage": 26.99, "elapsed_time": "4:40:49", "remaining_time": "12:39:38"} +{"current_steps": 279, "total_steps": 1030, "loss": 0.4909, "lr": 7.309312521025356e-05, "epoch": 1.3541003486433227, "percentage": 27.09, "elapsed_time": "4:44:44", "remaining_time": "12:46:26"} +{"current_steps": 280, "total_steps": 1030, "loss": 0.4915, "lr": 7.301678894645742e-05, "epoch": 1.3589510383507655, "percentage": 27.18, "elapsed_time": "4:48:38", "remaining_time": "12:53:09"} +{"current_steps": 281, "total_steps": 1030, "loss": 0.4935, "lr": 7.294007347710251e-05, "epoch": 1.3638017280582082, "percentage": 27.28, "elapsed_time": "4:52:32", "remaining_time": "12:59:45"} +{"current_steps": 282, "total_steps": 1030, "loss": 0.4834, "lr": 7.286297968328397e-05, "epoch": 1.368652417765651, "percentage": 27.38, "elapsed_time": "4:56:26", "remaining_time": "13:06:18"} +{"current_steps": 283, "total_steps": 1030, "loss": 0.4953, "lr": 7.27855084504421e-05, "epoch": 1.373503107473094, "percentage": 27.48, "elapsed_time": "5:00:20", "remaining_time": "13:12:45"} +{"current_steps": 284, "total_steps": 1030, "loss": 0.4872, "lr": 7.270766066835217e-05, "epoch": 1.3783537971805366, "percentage": 27.57, "elapsed_time": "5:04:13", "remaining_time": "13:19:07"} +{"current_steps": 285, "total_steps": 1030, "loss": 0.4916, "lr": 7.262943723111419e-05, "epoch": 1.3832044868879794, "percentage": 27.67, "elapsed_time": "5:08:08", "remaining_time": "13:25:30"} +{"current_steps": 286, "total_steps": 1030, "loss": 0.4866, "lr": 7.255083903714266e-05, "epoch": 1.388055176595422, "percentage": 27.77, "elapsed_time": "5:12:02", "remaining_time": "13:31:44"} +{"current_steps": 287, "total_steps": 1030, "loss": 0.4879, "lr": 7.247186698915625e-05, "epoch": 1.3929058663028648, "percentage": 27.86, "elapsed_time": "5:15:55", "remaining_time": "13:37:52"} +{"current_steps": 288, "total_steps": 1030, "loss": 0.4812, "lr": 7.239252199416749e-05, "epoch": 1.3977565560103078, "percentage": 27.96, "elapsed_time": "5:19:48", "remaining_time": "13:43:58"} +{"current_steps": 289, "total_steps": 1030, "loss": 0.4809, "lr": 7.23128049634722e-05, "epoch": 1.4026072457177505, "percentage": 28.06, "elapsed_time": "5:23:42", "remaining_time": "13:49:59"} +{"current_steps": 290, "total_steps": 1030, "loss": 0.4839, "lr": 7.223271681263916e-05, "epoch": 1.4074579354251933, "percentage": 28.16, "elapsed_time": "5:27:35", "remaining_time": "13:55:56"} +{"current_steps": 291, "total_steps": 1030, "loss": 0.4899, "lr": 7.215225846149957e-05, "epoch": 1.412308625132636, "percentage": 28.25, "elapsed_time": "5:31:29", "remaining_time": "14:01:49"} +{"current_steps": 292, "total_steps": 1030, "loss": 0.4865, "lr": 7.207143083413643e-05, "epoch": 1.4171593148400787, "percentage": 28.35, "elapsed_time": "5:35:23", "remaining_time": "14:07:39"} +{"current_steps": 293, "total_steps": 1030, "loss": 0.4876, "lr": 7.1990234858874e-05, "epoch": 1.4220100045475217, "percentage": 28.45, "elapsed_time": "5:39:17", "remaining_time": "14:13:25"} +{"current_steps": 294, "total_steps": 1030, "loss": 0.4936, "lr": 7.190867146826707e-05, "epoch": 1.4268606942549644, "percentage": 28.54, "elapsed_time": "5:43:10", "remaining_time": "14:19:07"} +{"current_steps": 295, "total_steps": 1030, "loss": 0.4845, "lr": 7.182674159909031e-05, "epoch": 1.4317113839624072, "percentage": 28.64, "elapsed_time": "5:47:04", "remaining_time": "14:24:43"} +{"current_steps": 296, "total_steps": 1030, "loss": 0.4952, "lr": 7.174444619232745e-05, "epoch": 1.43656207366985, "percentage": 28.74, "elapsed_time": "5:50:57", "remaining_time": "14:30:16"} +{"current_steps": 297, "total_steps": 1030, "loss": 0.4912, "lr": 7.166178619316056e-05, "epoch": 1.4414127633772926, "percentage": 28.83, "elapsed_time": "5:54:51", "remaining_time": "14:35:47"} +{"current_steps": 298, "total_steps": 1030, "loss": 0.4875, "lr": 7.157876255095906e-05, "epoch": 1.4462634530847356, "percentage": 28.93, "elapsed_time": "5:58:45", "remaining_time": "14:41:14"} +{"current_steps": 299, "total_steps": 1030, "loss": 0.4862, "lr": 7.149537621926895e-05, "epoch": 1.4511141427921783, "percentage": 29.03, "elapsed_time": "6:02:39", "remaining_time": "14:46:37"} +{"current_steps": 300, "total_steps": 1030, "loss": 0.4879, "lr": 7.14116281558018e-05, "epoch": 1.455964832499621, "percentage": 29.13, "elapsed_time": "6:06:32", "remaining_time": "14:51:56"} +{"current_steps": 301, "total_steps": 1030, "loss": 0.4984, "lr": 7.132751932242376e-05, "epoch": 1.4608155222070638, "percentage": 29.22, "elapsed_time": "6:10:26", "remaining_time": "14:57:11"} +{"current_steps": 302, "total_steps": 1030, "loss": 0.487, "lr": 7.124305068514444e-05, "epoch": 1.4656662119145065, "percentage": 29.32, "elapsed_time": "6:14:20", "remaining_time": "15:02:22"} +{"current_steps": 303, "total_steps": 1030, "loss": 0.4878, "lr": 7.1158223214106e-05, "epoch": 1.4705169016219495, "percentage": 29.42, "elapsed_time": "6:18:13", "remaining_time": "15:07:29"} +{"current_steps": 304, "total_steps": 1030, "loss": 0.4819, "lr": 7.107303788357177e-05, "epoch": 1.4753675913293922, "percentage": 29.51, "elapsed_time": "6:22:07", "remaining_time": "15:12:34"} +{"current_steps": 305, "total_steps": 1030, "loss": 0.4852, "lr": 7.098749567191527e-05, "epoch": 1.480218281036835, "percentage": 29.61, "elapsed_time": "6:26:01", "remaining_time": "15:17:35"} +{"current_steps": 306, "total_steps": 1030, "loss": 0.4877, "lr": 7.090159756160886e-05, "epoch": 1.4850689707442777, "percentage": 29.71, "elapsed_time": "6:29:55", "remaining_time": "15:22:34"} +{"current_steps": 307, "total_steps": 1030, "loss": 0.4852, "lr": 7.081534453921242e-05, "epoch": 1.4899196604517204, "percentage": 29.81, "elapsed_time": "6:33:49", "remaining_time": "15:27:28"} +{"current_steps": 308, "total_steps": 1030, "loss": 0.4913, "lr": 7.072873759536217e-05, "epoch": 1.4947703501591634, "percentage": 29.9, "elapsed_time": "6:37:43", "remaining_time": "15:32:19"} +{"current_steps": 309, "total_steps": 1030, "loss": 0.4798, "lr": 7.064177772475912e-05, "epoch": 1.499621039866606, "percentage": 30.0, "elapsed_time": "6:41:37", "remaining_time": "15:37:07"} +{"current_steps": 310, "total_steps": 1030, "loss": 0.4867, "lr": 7.05544659261578e-05, "epoch": 1.5044717295740488, "percentage": 30.1, "elapsed_time": "6:45:30", "remaining_time": "15:41:50"} +{"current_steps": 311, "total_steps": 1030, "loss": 0.4871, "lr": 7.046680320235466e-05, "epoch": 1.5093224192814916, "percentage": 30.19, "elapsed_time": "6:49:24", "remaining_time": "15:46:30"} +{"current_steps": 312, "total_steps": 1030, "loss": 0.4842, "lr": 7.037879056017663e-05, "epoch": 1.5141731089889343, "percentage": 30.29, "elapsed_time": "6:53:18", "remaining_time": "15:51:07"} +{"current_steps": 313, "total_steps": 1030, "loss": 0.4802, "lr": 7.029042901046952e-05, "epoch": 1.5190237986963773, "percentage": 30.39, "elapsed_time": "6:57:11", "remaining_time": "15:55:40"} +{"current_steps": 314, "total_steps": 1030, "loss": 0.4859, "lr": 7.020171956808645e-05, "epoch": 1.5238744884038198, "percentage": 30.49, "elapsed_time": "7:01:05", "remaining_time": "16:00:11"} +{"current_steps": 315, "total_steps": 1030, "loss": 0.496, "lr": 7.011266325187615e-05, "epoch": 1.5287251781112627, "percentage": 30.58, "elapsed_time": "7:04:58", "remaining_time": "16:04:38"} +{"current_steps": 316, "total_steps": 1030, "loss": 0.4864, "lr": 7.002326108467129e-05, "epoch": 1.5335758678187055, "percentage": 30.68, "elapsed_time": "7:08:51", "remaining_time": "16:09:00"} +{"current_steps": 317, "total_steps": 1030, "loss": 0.4763, "lr": 6.993351409327672e-05, "epoch": 1.5384265575261482, "percentage": 30.78, "elapsed_time": "7:12:45", "remaining_time": "16:13:22"} +{"current_steps": 318, "total_steps": 1030, "loss": 0.4952, "lr": 6.984342330845764e-05, "epoch": 1.5432772472335912, "percentage": 30.87, "elapsed_time": "7:16:39", "remaining_time": "16:17:40"} +{"current_steps": 319, "total_steps": 1030, "loss": 0.4952, "lr": 6.975298976492785e-05, "epoch": 1.5481279369410337, "percentage": 30.97, "elapsed_time": "7:20:33", "remaining_time": "16:21:56"} +{"current_steps": 320, "total_steps": 1030, "loss": 0.4901, "lr": 6.966221450133779e-05, "epoch": 1.5529786266484766, "percentage": 31.07, "elapsed_time": "7:24:27", "remaining_time": "16:26:08"} +{"current_steps": 321, "total_steps": 1030, "loss": 0.4917, "lr": 6.957109856026261e-05, "epoch": 1.5578293163559194, "percentage": 31.17, "elapsed_time": "7:28:21", "remaining_time": "16:30:17"} +{"current_steps": 322, "total_steps": 1030, "loss": 0.4771, "lr": 6.94796429881903e-05, "epoch": 1.562680006063362, "percentage": 31.26, "elapsed_time": "7:32:13", "remaining_time": "16:34:20"} +{"current_steps": 323, "total_steps": 1030, "loss": 0.4889, "lr": 6.938784883550948e-05, "epoch": 1.567530695770805, "percentage": 31.36, "elapsed_time": "7:36:07", "remaining_time": "16:38:23"} +{"current_steps": 324, "total_steps": 1030, "loss": 0.4866, "lr": 6.929571715649755e-05, "epoch": 1.5723813854782476, "percentage": 31.46, "elapsed_time": "7:40:01", "remaining_time": "16:42:25"} +{"current_steps": 325, "total_steps": 1030, "loss": 0.4907, "lr": 6.920324900930842e-05, "epoch": 1.5772320751856905, "percentage": 31.55, "elapsed_time": "7:43:55", "remaining_time": "16:46:22"} +{"current_steps": 326, "total_steps": 1030, "loss": 0.4854, "lr": 6.911044545596042e-05, "epoch": 1.5820827648931333, "percentage": 31.65, "elapsed_time": "7:47:49", "remaining_time": "16:50:15"} +{"current_steps": 327, "total_steps": 1030, "loss": 0.4895, "lr": 6.901730756232411e-05, "epoch": 1.586933454600576, "percentage": 31.75, "elapsed_time": "7:51:43", "remaining_time": "16:54:07"} +{"current_steps": 328, "total_steps": 1030, "loss": 0.4958, "lr": 6.892383639811005e-05, "epoch": 1.591784144308019, "percentage": 31.84, "elapsed_time": "7:55:37", "remaining_time": "16:57:56"} +{"current_steps": 329, "total_steps": 1030, "loss": 0.4844, "lr": 6.883003303685644e-05, "epoch": 1.5966348340154615, "percentage": 31.94, "elapsed_time": "7:59:31", "remaining_time": "17:01:42"} +{"current_steps": 330, "total_steps": 1030, "loss": 0.489, "lr": 6.87358985559169e-05, "epoch": 1.6014855237229044, "percentage": 32.04, "elapsed_time": "8:03:24", "remaining_time": "17:05:25"} +{"current_steps": 331, "total_steps": 1030, "loss": 0.4945, "lr": 6.864143403644797e-05, "epoch": 1.6063362134303472, "percentage": 32.14, "elapsed_time": "8:07:17", "remaining_time": "17:09:03"} +{"current_steps": 332, "total_steps": 1030, "loss": 0.4855, "lr": 6.85466405633968e-05, "epoch": 1.61118690313779, "percentage": 32.23, "elapsed_time": "8:11:11", "remaining_time": "17:12:40"} +{"current_steps": 333, "total_steps": 1030, "loss": 0.4783, "lr": 6.845151922548865e-05, "epoch": 1.6160375928452326, "percentage": 32.33, "elapsed_time": "8:15:04", "remaining_time": "17:16:14"} +{"current_steps": 334, "total_steps": 1030, "loss": 0.4796, "lr": 6.835607111521439e-05, "epoch": 1.6208882825526754, "percentage": 32.43, "elapsed_time": "8:18:57", "remaining_time": "17:19:45"} +{"current_steps": 335, "total_steps": 1030, "loss": 0.4928, "lr": 6.826029732881793e-05, "epoch": 1.6257389722601183, "percentage": 32.52, "elapsed_time": "8:22:51", "remaining_time": "17:23:14"} +{"current_steps": 336, "total_steps": 1030, "loss": 0.4851, "lr": 6.816419896628363e-05, "epoch": 1.630589661967561, "percentage": 32.62, "elapsed_time": "8:26:45", "remaining_time": "17:26:41"} +{"current_steps": 337, "total_steps": 1030, "loss": 0.4826, "lr": 6.806777713132374e-05, "epoch": 1.6354403516750038, "percentage": 32.72, "elapsed_time": "8:30:39", "remaining_time": "17:30:06"} +{"current_steps": 338, "total_steps": 1030, "loss": 0.4873, "lr": 6.79710329313656e-05, "epoch": 1.6402910413824465, "percentage": 32.82, "elapsed_time": "8:34:33", "remaining_time": "17:33:28"} +{"current_steps": 339, "total_steps": 1030, "loss": 0.4744, "lr": 6.787396747753903e-05, "epoch": 1.6451417310898893, "percentage": 32.91, "elapsed_time": "8:38:27", "remaining_time": "17:36:47"} +{"current_steps": 340, "total_steps": 1030, "loss": 0.4765, "lr": 6.777658188466354e-05, "epoch": 1.6499924207973322, "percentage": 33.01, "elapsed_time": "8:42:21", "remaining_time": "17:40:04"} +{"current_steps": 341, "total_steps": 1030, "loss": 0.4931, "lr": 6.767887727123544e-05, "epoch": 1.654843110504775, "percentage": 33.11, "elapsed_time": "8:46:15", "remaining_time": "17:43:18"} +{"current_steps": 342, "total_steps": 1030, "loss": 0.4875, "lr": 6.758085475941516e-05, "epoch": 1.6596938002122177, "percentage": 33.2, "elapsed_time": "8:50:09", "remaining_time": "17:46:30"} +{"current_steps": 343, "total_steps": 1030, "loss": 0.4783, "lr": 6.748251547501418e-05, "epoch": 1.6645444899196604, "percentage": 33.3, "elapsed_time": "8:54:03", "remaining_time": "17:49:40"} +{"current_steps": 344, "total_steps": 1030, "loss": 0.4836, "lr": 6.738386054748226e-05, "epoch": 1.6693951796271032, "percentage": 33.4, "elapsed_time": "8:57:57", "remaining_time": "17:52:46"} +{"current_steps": 345, "total_steps": 1030, "loss": 0.4883, "lr": 6.728489110989434e-05, "epoch": 1.674245869334546, "percentage": 33.5, "elapsed_time": "9:01:50", "remaining_time": "17:55:50"} +{"current_steps": 346, "total_steps": 1030, "loss": 0.4799, "lr": 6.718560829893762e-05, "epoch": 1.6790965590419886, "percentage": 33.59, "elapsed_time": "9:05:43", "remaining_time": "17:58:50"} +{"current_steps": 347, "total_steps": 1030, "loss": 0.4872, "lr": 6.708601325489844e-05, "epoch": 1.6839472487494316, "percentage": 33.69, "elapsed_time": "9:09:36", "remaining_time": "18:01:48"} +{"current_steps": 348, "total_steps": 1030, "loss": 0.4864, "lr": 6.698610712164924e-05, "epoch": 1.6887979384568743, "percentage": 33.79, "elapsed_time": "9:13:30", "remaining_time": "18:04:44"} +{"current_steps": 349, "total_steps": 1030, "loss": 0.4731, "lr": 6.688589104663536e-05, "epoch": 1.693648628164317, "percentage": 33.88, "elapsed_time": "9:17:23", "remaining_time": "18:07:37"} +{"current_steps": 350, "total_steps": 1030, "loss": 0.4771, "lr": 6.67853661808619e-05, "epoch": 1.69849931787176, "percentage": 33.98, "elapsed_time": "9:21:17", "remaining_time": "18:10:30"} +{"current_steps": 351, "total_steps": 1030, "loss": 0.4867, "lr": 6.668453367888052e-05, "epoch": 1.7033500075792025, "percentage": 34.08, "elapsed_time": "9:25:11", "remaining_time": "18:13:21"} +{"current_steps": 352, "total_steps": 1030, "loss": 0.478, "lr": 6.658339469877613e-05, "epoch": 1.7082006972866455, "percentage": 34.17, "elapsed_time": "9:29:04", "remaining_time": "18:16:07"} +{"current_steps": 353, "total_steps": 1030, "loss": 0.4814, "lr": 6.64819504021536e-05, "epoch": 1.7130513869940882, "percentage": 34.27, "elapsed_time": "9:32:58", "remaining_time": "18:18:52"} +{"current_steps": 354, "total_steps": 1030, "loss": 0.4771, "lr": 6.638020195412448e-05, "epoch": 1.717902076701531, "percentage": 34.37, "elapsed_time": "9:36:51", "remaining_time": "18:21:33"} +{"current_steps": 355, "total_steps": 1030, "loss": 0.4925, "lr": 6.627815052329354e-05, "epoch": 1.722752766408974, "percentage": 34.47, "elapsed_time": "9:40:45", "remaining_time": "18:24:15"} +{"current_steps": 356, "total_steps": 1030, "loss": 0.4854, "lr": 6.617579728174535e-05, "epoch": 1.7276034561164164, "percentage": 34.56, "elapsed_time": "9:44:39", "remaining_time": "18:26:53"} +{"current_steps": 357, "total_steps": 1030, "loss": 0.4777, "lr": 6.60731434050309e-05, "epoch": 1.7324541458238594, "percentage": 34.66, "elapsed_time": "9:48:33", "remaining_time": "18:29:31"} +{"current_steps": 358, "total_steps": 1030, "loss": 0.4783, "lr": 6.597019007215401e-05, "epoch": 1.737304835531302, "percentage": 34.76, "elapsed_time": "9:52:27", "remaining_time": "18:32:06"} +{"current_steps": 359, "total_steps": 1030, "loss": 0.4743, "lr": 6.586693846555788e-05, "epoch": 1.7421555252387448, "percentage": 34.85, "elapsed_time": "9:56:21", "remaining_time": "18:34:37"} +{"current_steps": 360, "total_steps": 1030, "loss": 0.48, "lr": 6.576338977111134e-05, "epoch": 1.7470062149461878, "percentage": 34.95, "elapsed_time": "10:00:15", "remaining_time": "18:37:08"} +{"current_steps": 361, "total_steps": 1030, "loss": 0.4747, "lr": 6.565954517809543e-05, "epoch": 1.7518569046536303, "percentage": 35.05, "elapsed_time": "10:04:09", "remaining_time": "18:39:36"} +{"current_steps": 362, "total_steps": 1030, "loss": 0.4778, "lr": 6.555540587918968e-05, "epoch": 1.7567075943610733, "percentage": 35.15, "elapsed_time": "10:08:03", "remaining_time": "18:42:03"} +{"current_steps": 363, "total_steps": 1030, "loss": 0.4795, "lr": 6.545097307045831e-05, "epoch": 1.761558284068516, "percentage": 35.24, "elapsed_time": "10:11:57", "remaining_time": "18:44:26"} +{"current_steps": 364, "total_steps": 1030, "loss": 0.4851, "lr": 6.534624795133662e-05, "epoch": 1.7664089737759587, "percentage": 35.34, "elapsed_time": "10:15:51", "remaining_time": "18:46:48"} +{"current_steps": 365, "total_steps": 1030, "loss": 0.4794, "lr": 6.524123172461711e-05, "epoch": 1.7712596634834017, "percentage": 35.44, "elapsed_time": "10:19:45", "remaining_time": "18:49:08"} +{"current_steps": 366, "total_steps": 1030, "loss": 0.4774, "lr": 6.51359255964358e-05, "epoch": 1.7761103531908442, "percentage": 35.53, "elapsed_time": "10:23:39", "remaining_time": "18:51:26"} +{"current_steps": 367, "total_steps": 1030, "loss": 0.4746, "lr": 6.503033077625824e-05, "epoch": 1.7809610428982872, "percentage": 35.63, "elapsed_time": "10:27:32", "remaining_time": "18:53:41"} +{"current_steps": 368, "total_steps": 1030, "loss": 0.4849, "lr": 6.492444847686566e-05, "epoch": 1.78581173260573, "percentage": 35.73, "elapsed_time": "10:31:26", "remaining_time": "18:55:54"} +{"current_steps": 369, "total_steps": 1030, "loss": 0.4814, "lr": 6.481827991434111e-05, "epoch": 1.7906624223131726, "percentage": 35.83, "elapsed_time": "10:35:19", "remaining_time": "18:58:04"} +{"current_steps": 370, "total_steps": 1030, "loss": 0.4813, "lr": 6.471182630805538e-05, "epoch": 1.7955131120206156, "percentage": 35.92, "elapsed_time": "10:39:13", "remaining_time": "19:00:14"} +{"current_steps": 371, "total_steps": 1030, "loss": 0.4865, "lr": 6.460508888065314e-05, "epoch": 1.800363801728058, "percentage": 36.02, "elapsed_time": "10:43:07", "remaining_time": "19:02:22"} +{"current_steps": 372, "total_steps": 1030, "loss": 0.4752, "lr": 6.449806885803873e-05, "epoch": 1.805214491435501, "percentage": 36.12, "elapsed_time": "10:47:01", "remaining_time": "19:04:27"} +{"current_steps": 373, "total_steps": 1030, "loss": 0.4776, "lr": 6.439076746936219e-05, "epoch": 1.8100651811429438, "percentage": 36.21, "elapsed_time": "10:50:55", "remaining_time": "19:06:32"} +{"current_steps": 374, "total_steps": 1030, "loss": 0.4833, "lr": 6.428318594700509e-05, "epoch": 1.8149158708503865, "percentage": 36.31, "elapsed_time": "10:54:49", "remaining_time": "19:08:33"} +{"current_steps": 375, "total_steps": 1030, "loss": 0.4808, "lr": 6.417532552656647e-05, "epoch": 1.8197665605578295, "percentage": 36.41, "elapsed_time": "10:58:43", "remaining_time": "19:10:34"} +{"current_steps": 376, "total_steps": 1030, "loss": 0.475, "lr": 6.406718744684851e-05, "epoch": 1.824617250265272, "percentage": 36.5, "elapsed_time": "11:02:37", "remaining_time": "19:12:32"} +{"current_steps": 377, "total_steps": 1030, "loss": 0.4718, "lr": 6.395877294984241e-05, "epoch": 1.829467939972715, "percentage": 36.6, "elapsed_time": "11:06:31", "remaining_time": "19:14:28"} +{"current_steps": 378, "total_steps": 1030, "loss": 0.4858, "lr": 6.385008328071406e-05, "epoch": 1.8343186296801577, "percentage": 36.7, "elapsed_time": "11:10:25", "remaining_time": "19:16:23"} +{"current_steps": 379, "total_steps": 1030, "loss": 0.4797, "lr": 6.374111968778982e-05, "epoch": 1.8391693193876004, "percentage": 36.8, "elapsed_time": "11:14:19", "remaining_time": "19:18:15"} +{"current_steps": 380, "total_steps": 1030, "loss": 0.4819, "lr": 6.363188342254206e-05, "epoch": 1.8440200090950432, "percentage": 36.89, "elapsed_time": "11:18:13", "remaining_time": "19:20:07"} +{"current_steps": 381, "total_steps": 1030, "loss": 0.4777, "lr": 6.352237573957488e-05, "epoch": 1.848870698802486, "percentage": 36.99, "elapsed_time": "11:22:07", "remaining_time": "19:21:56"} +{"current_steps": 382, "total_steps": 1030, "loss": 0.4812, "lr": 6.341259789660969e-05, "epoch": 1.8537213885099288, "percentage": 37.09, "elapsed_time": "11:26:01", "remaining_time": "19:23:43"} +{"current_steps": 383, "total_steps": 1030, "loss": 0.4722, "lr": 6.330255115447076e-05, "epoch": 1.8585720782173716, "percentage": 37.18, "elapsed_time": "11:29:55", "remaining_time": "19:25:28"} +{"current_steps": 384, "total_steps": 1030, "loss": 0.4786, "lr": 6.319223677707069e-05, "epoch": 1.8634227679248143, "percentage": 37.28, "elapsed_time": "11:33:49", "remaining_time": "19:27:12"} +{"current_steps": 385, "total_steps": 1030, "loss": 0.4766, "lr": 6.308165603139598e-05, "epoch": 1.868273457632257, "percentage": 37.38, "elapsed_time": "11:37:43", "remaining_time": "19:28:54"} +{"current_steps": 386, "total_steps": 1030, "loss": 0.4746, "lr": 6.29708101874924e-05, "epoch": 1.8731241473396998, "percentage": 37.48, "elapsed_time": "11:41:37", "remaining_time": "19:30:35"} +{"current_steps": 387, "total_steps": 1030, "loss": 0.4777, "lr": 6.285970051845045e-05, "epoch": 1.8779748370471427, "percentage": 37.57, "elapsed_time": "11:45:31", "remaining_time": "19:32:13"} +{"current_steps": 388, "total_steps": 1030, "loss": 0.4762, "lr": 6.274832830039071e-05, "epoch": 1.8828255267545853, "percentage": 37.67, "elapsed_time": "11:49:25", "remaining_time": "19:33:50"} +{"current_steps": 389, "total_steps": 1030, "loss": 0.4882, "lr": 6.26366948124492e-05, "epoch": 1.8876762164620282, "percentage": 37.77, "elapsed_time": "11:53:19", "remaining_time": "19:35:24"} +{"current_steps": 390, "total_steps": 1030, "loss": 0.4746, "lr": 6.25248013367627e-05, "epoch": 1.892526906169471, "percentage": 37.86, "elapsed_time": "11:57:11", "remaining_time": "19:36:55"} +{"current_steps": 391, "total_steps": 1030, "loss": 0.4863, "lr": 6.241264915845401e-05, "epoch": 1.8973775958769137, "percentage": 37.96, "elapsed_time": "12:01:05", "remaining_time": "19:38:26"} +{"current_steps": 392, "total_steps": 1030, "loss": 0.4803, "lr": 6.230023956561716e-05, "epoch": 1.9022282855843566, "percentage": 38.06, "elapsed_time": "12:04:58", "remaining_time": "19:39:56"} +{"current_steps": 393, "total_steps": 1030, "loss": 0.4769, "lr": 6.218757384930268e-05, "epoch": 1.9070789752917991, "percentage": 38.16, "elapsed_time": "12:08:51", "remaining_time": "19:41:22"} +{"current_steps": 394, "total_steps": 1030, "loss": 0.4798, "lr": 6.207465330350273e-05, "epoch": 1.911929664999242, "percentage": 38.25, "elapsed_time": "12:12:45", "remaining_time": "19:42:49"} +{"current_steps": 395, "total_steps": 1030, "loss": 0.479, "lr": 6.196147922513623e-05, "epoch": 1.9167803547066848, "percentage": 38.35, "elapsed_time": "12:16:39", "remaining_time": "19:44:14"} +{"current_steps": 396, "total_steps": 1030, "loss": 0.4776, "lr": 6.184805291403402e-05, "epoch": 1.9216310444141276, "percentage": 38.45, "elapsed_time": "12:20:33", "remaining_time": "19:45:38"} +{"current_steps": 397, "total_steps": 1030, "loss": 0.475, "lr": 6.173437567292383e-05, "epoch": 1.9264817341215705, "percentage": 38.54, "elapsed_time": "12:24:27", "remaining_time": "19:47:00"} +{"current_steps": 398, "total_steps": 1030, "loss": 0.4719, "lr": 6.162044880741544e-05, "epoch": 1.931332423829013, "percentage": 38.64, "elapsed_time": "12:28:21", "remaining_time": "19:48:20"} +{"current_steps": 399, "total_steps": 1030, "loss": 0.4871, "lr": 6.150627362598557e-05, "epoch": 1.936183113536456, "percentage": 38.74, "elapsed_time": "12:32:15", "remaining_time": "19:49:39"} +{"current_steps": 400, "total_steps": 1030, "loss": 0.4806, "lr": 6.139185143996298e-05, "epoch": 1.9410338032438987, "percentage": 38.83, "elapsed_time": "12:36:09", "remaining_time": "19:50:56"} +{"current_steps": 401, "total_steps": 1030, "loss": 0.478, "lr": 6.127718356351326e-05, "epoch": 1.9458844929513415, "percentage": 38.93, "elapsed_time": "12:40:03", "remaining_time": "19:52:11"} +{"current_steps": 402, "total_steps": 1030, "loss": 0.4714, "lr": 6.116227131362385e-05, "epoch": 1.9507351826587844, "percentage": 39.03, "elapsed_time": "12:43:57", "remaining_time": "19:53:26"} +{"current_steps": 403, "total_steps": 1030, "loss": 0.4779, "lr": 6.104711601008888e-05, "epoch": 1.955585872366227, "percentage": 39.13, "elapsed_time": "12:47:51", "remaining_time": "19:54:38"} +{"current_steps": 404, "total_steps": 1030, "loss": 0.4846, "lr": 6.0931718975493985e-05, "epoch": 1.96043656207367, "percentage": 39.22, "elapsed_time": "12:51:44", "remaining_time": "19:55:49"} +{"current_steps": 405, "total_steps": 1030, "loss": 0.4691, "lr": 6.081608153520117e-05, "epoch": 1.9652872517811126, "percentage": 39.32, "elapsed_time": "12:55:38", "remaining_time": "19:56:58"} +{"current_steps": 406, "total_steps": 1030, "loss": 0.4787, "lr": 6.0700205017333525e-05, "epoch": 1.9701379414885554, "percentage": 39.42, "elapsed_time": "12:59:31", "remaining_time": "19:58:04"} +{"current_steps": 407, "total_steps": 1030, "loss": 0.4689, "lr": 6.058409075276002e-05, "epoch": 1.9749886311959983, "percentage": 39.51, "elapsed_time": "13:03:25", "remaining_time": "19:59:11"} +{"current_steps": 408, "total_steps": 1030, "loss": 0.475, "lr": 6.046774007508019e-05, "epoch": 1.9798393209034408, "percentage": 39.61, "elapsed_time": "13:07:19", "remaining_time": "20:00:16"} +{"current_steps": 409, "total_steps": 1030, "loss": 0.4747, "lr": 6.035115432060883e-05, "epoch": 1.9846900106108838, "percentage": 39.71, "elapsed_time": "13:11:13", "remaining_time": "20:01:20"} +{"current_steps": 410, "total_steps": 1030, "loss": 0.4786, "lr": 6.0234334828360655e-05, "epoch": 1.9895407003183265, "percentage": 39.81, "elapsed_time": "13:15:07", "remaining_time": "20:02:22"} +{"current_steps": 411, "total_steps": 1030, "loss": 0.4802, "lr": 6.011728294003494e-05, "epoch": 1.9943913900257693, "percentage": 39.9, "elapsed_time": "13:19:01", "remaining_time": "20:03:24"} +{"current_steps": 412, "total_steps": 1030, "loss": 0.4768, "lr": 6.000000000000001e-05, "epoch": 1.9992420797332122, "percentage": 40.0, "elapsed_time": "13:22:55", "remaining_time": "20:04:22"} +{"current_steps": 413, "total_steps": 1030, "loss": 0.8958, "lr": 5.988248735527793e-05, "epoch": 2.004699105654085, "percentage": 40.1, "elapsed_time": "13:27:16", "remaining_time": "20:06:01"} +{"current_steps": 414, "total_steps": 1030, "loss": 0.4703, "lr": 5.9764746355528994e-05, "epoch": 2.009549795361528, "percentage": 40.19, "elapsed_time": "13:31:10", "remaining_time": "20:06:57"} +{"current_steps": 415, "total_steps": 1030, "loss": 0.4736, "lr": 5.964677835303615e-05, "epoch": 2.014400485068971, "percentage": 40.29, "elapsed_time": "13:35:03", "remaining_time": "20:07:50"} +{"current_steps": 416, "total_steps": 1030, "loss": 0.4636, "lr": 5.952858470268955e-05, "epoch": 2.0192511747764135, "percentage": 40.39, "elapsed_time": "13:38:56", "remaining_time": "20:08:43"} +{"current_steps": 417, "total_steps": 1030, "loss": 0.4688, "lr": 5.941016676197098e-05, "epoch": 2.0241018644838564, "percentage": 40.49, "elapsed_time": "13:42:48", "remaining_time": "20:09:33"} +{"current_steps": 418, "total_steps": 1030, "loss": 0.471, "lr": 5.929152589093825e-05, "epoch": 2.028952554191299, "percentage": 40.58, "elapsed_time": "13:46:42", "remaining_time": "20:10:23"} +{"current_steps": 419, "total_steps": 1030, "loss": 0.4661, "lr": 5.9172663452209554e-05, "epoch": 2.033803243898742, "percentage": 40.68, "elapsed_time": "13:50:35", "remaining_time": "20:11:11"} +{"current_steps": 420, "total_steps": 1030, "loss": 0.4704, "lr": 5.9053580810947845e-05, "epoch": 2.0386539336061844, "percentage": 40.78, "elapsed_time": "13:54:28", "remaining_time": "20:11:58"} +{"current_steps": 421, "total_steps": 1030, "loss": 0.4707, "lr": 5.89342793348452e-05, "epoch": 2.0435046233136274, "percentage": 40.87, "elapsed_time": "13:58:20", "remaining_time": "20:12:43"} +{"current_steps": 422, "total_steps": 1030, "loss": 0.4662, "lr": 5.881476039410699e-05, "epoch": 2.0483553130210703, "percentage": 40.97, "elapsed_time": "14:02:14", "remaining_time": "20:13:28"} +{"current_steps": 423, "total_steps": 1030, "loss": 0.4586, "lr": 5.869502536143629e-05, "epoch": 2.053206002728513, "percentage": 41.07, "elapsed_time": "14:06:08", "remaining_time": "20:14:12"} +{"current_steps": 424, "total_steps": 1030, "loss": 0.4628, "lr": 5.857507561201802e-05, "epoch": 2.058056692435956, "percentage": 41.17, "elapsed_time": "14:10:01", "remaining_time": "20:14:53"} +{"current_steps": 425, "total_steps": 1030, "loss": 0.4598, "lr": 5.845491252350312e-05, "epoch": 2.0629073821433983, "percentage": 41.26, "elapsed_time": "14:13:54", "remaining_time": "20:15:33"} +{"current_steps": 426, "total_steps": 1030, "loss": 0.4557, "lr": 5.833453747599286e-05, "epoch": 2.0677580718508413, "percentage": 41.36, "elapsed_time": "14:17:48", "remaining_time": "20:16:14"} +{"current_steps": 427, "total_steps": 1030, "loss": 0.4606, "lr": 5.821395185202285e-05, "epoch": 2.072608761558284, "percentage": 41.46, "elapsed_time": "14:21:42", "remaining_time": "20:16:52"} +{"current_steps": 428, "total_steps": 1030, "loss": 0.466, "lr": 5.809315703654726e-05, "epoch": 2.0774594512657267, "percentage": 41.55, "elapsed_time": "14:25:35", "remaining_time": "20:17:29"} +{"current_steps": 429, "total_steps": 1030, "loss": 0.4623, "lr": 5.797215441692284e-05, "epoch": 2.0823101409731697, "percentage": 41.65, "elapsed_time": "14:29:28", "remaining_time": "20:18:04"} +{"current_steps": 430, "total_steps": 1030, "loss": 0.4612, "lr": 5.785094538289304e-05, "epoch": 2.087160830680612, "percentage": 41.75, "elapsed_time": "14:33:22", "remaining_time": "20:18:39"} +{"current_steps": 431, "total_steps": 1030, "loss": 0.4622, "lr": 5.772953132657202e-05, "epoch": 2.092011520388055, "percentage": 41.84, "elapsed_time": "14:37:16", "remaining_time": "20:19:13"} +{"current_steps": 432, "total_steps": 1030, "loss": 0.4508, "lr": 5.7607913642428666e-05, "epoch": 2.096862210095498, "percentage": 41.94, "elapsed_time": "14:41:08", "remaining_time": "20:19:44"} +{"current_steps": 433, "total_steps": 1030, "loss": 0.451, "lr": 5.7486093727270606e-05, "epoch": 2.1017128998029406, "percentage": 42.04, "elapsed_time": "14:45:02", "remaining_time": "20:20:15"} +{"current_steps": 434, "total_steps": 1030, "loss": 0.4491, "lr": 5.736407298022809e-05, "epoch": 2.1065635895103836, "percentage": 42.14, "elapsed_time": "14:48:55", "remaining_time": "20:20:44"} +{"current_steps": 435, "total_steps": 1030, "loss": 0.459, "lr": 5.7241852802738e-05, "epoch": 2.111414279217826, "percentage": 42.23, "elapsed_time": "14:52:48", "remaining_time": "20:21:12"} +{"current_steps": 436, "total_steps": 1030, "loss": 0.4471, "lr": 5.711943459852772e-05, "epoch": 2.116264968925269, "percentage": 42.33, "elapsed_time": "14:56:42", "remaining_time": "20:21:39"} +{"current_steps": 437, "total_steps": 1030, "loss": 0.4447, "lr": 5.699681977359902e-05, "epoch": 2.121115658632712, "percentage": 42.43, "elapsed_time": "15:00:35", "remaining_time": "20:22:05"} +{"current_steps": 438, "total_steps": 1030, "loss": 0.4515, "lr": 5.6874009736211896e-05, "epoch": 2.1259663483401545, "percentage": 42.52, "elapsed_time": "15:04:28", "remaining_time": "20:22:29"} +{"current_steps": 439, "total_steps": 1030, "loss": 0.4503, "lr": 5.675100589686839e-05, "epoch": 2.1308170380475975, "percentage": 42.62, "elapsed_time": "15:08:22", "remaining_time": "20:22:54"} +{"current_steps": 440, "total_steps": 1030, "loss": 0.4552, "lr": 5.662780966829646e-05, "epoch": 2.13566772775504, "percentage": 42.72, "elapsed_time": "15:12:16", "remaining_time": "20:23:16"} +{"current_steps": 441, "total_steps": 1030, "loss": 0.4555, "lr": 5.650442246543364e-05, "epoch": 2.140518417462483, "percentage": 42.82, "elapsed_time": "15:16:10", "remaining_time": "20:23:38"} +{"current_steps": 442, "total_steps": 1030, "loss": 0.4484, "lr": 5.638084570541088e-05, "epoch": 2.145369107169926, "percentage": 42.91, "elapsed_time": "15:20:04", "remaining_time": "20:23:59"} +{"current_steps": 443, "total_steps": 1030, "loss": 0.4586, "lr": 5.625708080753621e-05, "epoch": 2.1502197968773684, "percentage": 43.01, "elapsed_time": "15:23:58", "remaining_time": "20:24:19"} +{"current_steps": 444, "total_steps": 1030, "loss": 0.4484, "lr": 5.6133129193278525e-05, "epoch": 2.1550704865848114, "percentage": 43.11, "elapsed_time": "15:27:52", "remaining_time": "20:24:37"} +{"current_steps": 445, "total_steps": 1030, "loss": 0.4521, "lr": 5.600899228625112e-05, "epoch": 2.159921176292254, "percentage": 43.2, "elapsed_time": "15:31:46", "remaining_time": "20:24:55"} +{"current_steps": 446, "total_steps": 1030, "loss": 0.4529, "lr": 5.588467151219549e-05, "epoch": 2.164771865999697, "percentage": 43.3, "elapsed_time": "15:35:39", "remaining_time": "20:25:10"} +{"current_steps": 447, "total_steps": 1030, "loss": 0.4411, "lr": 5.5760168298964874e-05, "epoch": 2.16962255570714, "percentage": 43.4, "elapsed_time": "15:39:32", "remaining_time": "20:25:24"} +{"current_steps": 448, "total_steps": 1030, "loss": 0.4484, "lr": 5.563548407650782e-05, "epoch": 2.1744732454145823, "percentage": 43.5, "elapsed_time": "15:43:26", "remaining_time": "20:25:37"} +{"current_steps": 449, "total_steps": 1030, "loss": 0.4506, "lr": 5.551062027685187e-05, "epoch": 2.1793239351220253, "percentage": 43.59, "elapsed_time": "15:47:20", "remaining_time": "20:25:50"} +{"current_steps": 450, "total_steps": 1030, "loss": 0.4508, "lr": 5.5385578334087006e-05, "epoch": 2.184174624829468, "percentage": 43.69, "elapsed_time": "15:51:12", "remaining_time": "20:26:00"} +{"current_steps": 451, "total_steps": 1030, "loss": 0.4491, "lr": 5.526035968434927e-05, "epoch": 2.1890253145369107, "percentage": 43.79, "elapsed_time": "15:55:06", "remaining_time": "20:26:11"} +{"current_steps": 452, "total_steps": 1030, "loss": 0.461, "lr": 5.513496576580418e-05, "epoch": 2.1938760042443537, "percentage": 43.88, "elapsed_time": "15:59:00", "remaining_time": "20:26:20"} +{"current_steps": 453, "total_steps": 1030, "loss": 0.4525, "lr": 5.5009398018630276e-05, "epoch": 2.198726693951796, "percentage": 43.98, "elapsed_time": "16:02:54", "remaining_time": "20:26:29"} +{"current_steps": 454, "total_steps": 1030, "loss": 0.447, "lr": 5.4883657885002575e-05, "epoch": 2.203577383659239, "percentage": 44.08, "elapsed_time": "16:06:48", "remaining_time": "20:26:37"} +{"current_steps": 455, "total_steps": 1030, "loss": 0.4441, "lr": 5.475774680907597e-05, "epoch": 2.2084280733666817, "percentage": 44.17, "elapsed_time": "16:10:43", "remaining_time": "20:26:44"} +{"current_steps": 456, "total_steps": 1030, "loss": 0.4444, "lr": 5.463166623696868e-05, "epoch": 2.2132787630741246, "percentage": 44.27, "elapsed_time": "16:14:36", "remaining_time": "20:26:49"} +{"current_steps": 457, "total_steps": 1030, "loss": 0.4471, "lr": 5.450541761674562e-05, "epoch": 2.218129452781567, "percentage": 44.37, "elapsed_time": "16:18:30", "remaining_time": "20:26:52"} +{"current_steps": 458, "total_steps": 1030, "loss": 0.448, "lr": 5.437900239840179e-05, "epoch": 2.22298014248901, "percentage": 44.47, "elapsed_time": "16:22:23", "remaining_time": "20:26:55"} +{"current_steps": 459, "total_steps": 1030, "loss": 0.4448, "lr": 5.42524220338456e-05, "epoch": 2.227830832196453, "percentage": 44.56, "elapsed_time": "16:26:17", "remaining_time": "20:26:56"} +{"current_steps": 460, "total_steps": 1030, "loss": 0.4542, "lr": 5.412567797688219e-05, "epoch": 2.2326815219038956, "percentage": 44.66, "elapsed_time": "16:30:11", "remaining_time": "20:26:58"} +{"current_steps": 461, "total_steps": 1030, "loss": 0.4541, "lr": 5.3998771683196754e-05, "epoch": 2.2375322116113385, "percentage": 44.76, "elapsed_time": "16:34:04", "remaining_time": "20:26:58"} +{"current_steps": 462, "total_steps": 1030, "loss": 0.4449, "lr": 5.3871704610337836e-05, "epoch": 2.2423829013187815, "percentage": 44.85, "elapsed_time": "16:37:58", "remaining_time": "20:26:57"} +{"current_steps": 463, "total_steps": 1030, "loss": 0.4454, "lr": 5.374447821770053e-05, "epoch": 2.247233591026224, "percentage": 44.95, "elapsed_time": "16:41:52", "remaining_time": "20:26:55"} +{"current_steps": 464, "total_steps": 1030, "loss": 0.4418, "lr": 5.361709396650977e-05, "epoch": 2.252084280733667, "percentage": 45.05, "elapsed_time": "16:45:46", "remaining_time": "20:26:52"} +{"current_steps": 465, "total_steps": 1030, "loss": 0.4485, "lr": 5.3489553319803566e-05, "epoch": 2.2569349704411095, "percentage": 45.15, "elapsed_time": "16:49:40", "remaining_time": "20:26:48"} +{"current_steps": 466, "total_steps": 1030, "loss": 0.4497, "lr": 5.336185774241609e-05, "epoch": 2.2617856601485524, "percentage": 45.24, "elapsed_time": "16:53:33", "remaining_time": "20:26:42"} +{"current_steps": 467, "total_steps": 1030, "loss": 0.4514, "lr": 5.3234008700961e-05, "epoch": 2.266636349855995, "percentage": 45.34, "elapsed_time": "16:57:26", "remaining_time": "20:26:35"} +{"current_steps": 468, "total_steps": 1030, "loss": 0.4406, "lr": 5.3106007663814505e-05, "epoch": 2.271487039563438, "percentage": 45.44, "elapsed_time": "17:01:20", "remaining_time": "20:26:29"} +{"current_steps": 469, "total_steps": 1030, "loss": 0.4548, "lr": 5.2977856101098484e-05, "epoch": 2.276337729270881, "percentage": 45.53, "elapsed_time": "17:05:14", "remaining_time": "20:26:21"} +{"current_steps": 470, "total_steps": 1030, "loss": 0.4605, "lr": 5.284955548466371e-05, "epoch": 2.2811884189783234, "percentage": 45.63, "elapsed_time": "17:09:08", "remaining_time": "20:26:12"} +{"current_steps": 471, "total_steps": 1030, "loss": 0.4471, "lr": 5.272110728807279e-05, "epoch": 2.2860391086857663, "percentage": 45.73, "elapsed_time": "17:13:03", "remaining_time": "20:26:03"} +{"current_steps": 472, "total_steps": 1030, "loss": 0.4511, "lr": 5.25925129865834e-05, "epoch": 2.2908897983932093, "percentage": 45.83, "elapsed_time": "17:16:56", "remaining_time": "20:25:52"} +{"current_steps": 473, "total_steps": 1030, "loss": 0.4438, "lr": 5.246377405713121e-05, "epoch": 2.295740488100652, "percentage": 45.92, "elapsed_time": "17:20:50", "remaining_time": "20:25:41"} +{"current_steps": 474, "total_steps": 1030, "loss": 0.4434, "lr": 5.2334891978313006e-05, "epoch": 2.3005911778080947, "percentage": 46.02, "elapsed_time": "17:24:44", "remaining_time": "20:25:28"} +{"current_steps": 475, "total_steps": 1030, "loss": 0.4493, "lr": 5.220586823036966e-05, "epoch": 2.3054418675155373, "percentage": 46.12, "elapsed_time": "17:28:38", "remaining_time": "20:25:15"} +{"current_steps": 476, "total_steps": 1030, "loss": 0.4426, "lr": 5.207670429516915e-05, "epoch": 2.31029255722298, "percentage": 46.21, "elapsed_time": "17:32:31", "remaining_time": "20:25:00"} +{"current_steps": 477, "total_steps": 1030, "loss": 0.4589, "lr": 5.1947401656189546e-05, "epoch": 2.3151432469304227, "percentage": 46.31, "elapsed_time": "17:36:24", "remaining_time": "20:24:43"} +{"current_steps": 478, "total_steps": 1030, "loss": 0.4461, "lr": 5.181796179850197e-05, "epoch": 2.3199939366378657, "percentage": 46.41, "elapsed_time": "17:40:18", "remaining_time": "20:24:27"} +{"current_steps": 479, "total_steps": 1030, "loss": 0.4494, "lr": 5.168838620875352e-05, "epoch": 2.3248446263453086, "percentage": 46.5, "elapsed_time": "17:44:11", "remaining_time": "20:24:09"} +{"current_steps": 480, "total_steps": 1030, "loss": 0.4513, "lr": 5.155867637515019e-05, "epoch": 2.329695316052751, "percentage": 46.6, "elapsed_time": "17:48:05", "remaining_time": "20:23:50"} +{"current_steps": 481, "total_steps": 1030, "loss": 0.4518, "lr": 5.142883378743984e-05, "epoch": 2.334546005760194, "percentage": 46.7, "elapsed_time": "17:51:58", "remaining_time": "20:23:31"} +{"current_steps": 482, "total_steps": 1030, "loss": 0.4497, "lr": 5.129885993689502e-05, "epoch": 2.3393966954676366, "percentage": 46.8, "elapsed_time": "17:55:52", "remaining_time": "20:23:11"} +{"current_steps": 483, "total_steps": 1030, "loss": 0.4463, "lr": 5.116875631629585e-05, "epoch": 2.3442473851750796, "percentage": 46.89, "elapsed_time": "17:59:45", "remaining_time": "20:22:49"} +{"current_steps": 484, "total_steps": 1030, "loss": 0.44, "lr": 5.10385244199129e-05, "epoch": 2.3490980748825225, "percentage": 46.99, "elapsed_time": "18:03:38", "remaining_time": "20:22:27"} +{"current_steps": 485, "total_steps": 1030, "loss": 0.4481, "lr": 5.0908165743490047e-05, "epoch": 2.353948764589965, "percentage": 47.09, "elapsed_time": "18:07:32", "remaining_time": "20:22:05"} +{"current_steps": 486, "total_steps": 1030, "loss": 0.4518, "lr": 5.0777681784227224e-05, "epoch": 2.358799454297408, "percentage": 47.18, "elapsed_time": "18:11:26", "remaining_time": "20:21:42"} +{"current_steps": 487, "total_steps": 1030, "loss": 0.4485, "lr": 5.064707404076327e-05, "epoch": 2.3636501440048505, "percentage": 47.28, "elapsed_time": "18:15:20", "remaining_time": "20:21:17"} +{"current_steps": 488, "total_steps": 1030, "loss": 0.4485, "lr": 5.051634401315875e-05, "epoch": 2.3685008337122935, "percentage": 47.38, "elapsed_time": "18:19:14", "remaining_time": "20:20:52"} +{"current_steps": 489, "total_steps": 1030, "loss": 0.4418, "lr": 5.0385493202878656e-05, "epoch": 2.3733515234197364, "percentage": 47.48, "elapsed_time": "18:23:08", "remaining_time": "20:20:27"} +{"current_steps": 490, "total_steps": 1030, "loss": 0.4426, "lr": 5.025452311277522e-05, "epoch": 2.378202213127179, "percentage": 47.57, "elapsed_time": "18:27:03", "remaining_time": "20:20:00"} +{"current_steps": 491, "total_steps": 1030, "loss": 0.4475, "lr": 5.01234352470706e-05, "epoch": 2.383052902834622, "percentage": 47.67, "elapsed_time": "18:30:56", "remaining_time": "20:19:33"} +{"current_steps": 492, "total_steps": 1030, "loss": 0.4427, "lr": 4.999223111133968e-05, "epoch": 2.3879035925420644, "percentage": 47.77, "elapsed_time": "18:34:50", "remaining_time": "20:19:04"} +{"current_steps": 493, "total_steps": 1030, "loss": 0.4384, "lr": 4.986091221249269e-05, "epoch": 2.3927542822495074, "percentage": 47.86, "elapsed_time": "18:38:44", "remaining_time": "20:18:35"} +{"current_steps": 494, "total_steps": 1030, "loss": 0.4441, "lr": 4.972948005875796e-05, "epoch": 2.39760497195695, "percentage": 47.96, "elapsed_time": "18:42:39", "remaining_time": "20:18:06"} +{"current_steps": 495, "total_steps": 1030, "loss": 0.4399, "lr": 4.959793615966459e-05, "epoch": 2.402455661664393, "percentage": 48.06, "elapsed_time": "18:46:32", "remaining_time": "20:17:34"} +{"current_steps": 496, "total_steps": 1030, "loss": 0.4532, "lr": 4.946628202602508e-05, "epoch": 2.407306351371836, "percentage": 48.16, "elapsed_time": "18:50:26", "remaining_time": "20:17:02"} +{"current_steps": 497, "total_steps": 1030, "loss": 0.4493, "lr": 4.933451916991802e-05, "epoch": 2.4121570410792783, "percentage": 48.25, "elapsed_time": "18:54:20", "remaining_time": "20:16:29"} +{"current_steps": 498, "total_steps": 1030, "loss": 0.4476, "lr": 4.920264910467066e-05, "epoch": 2.4170077307867213, "percentage": 48.35, "elapsed_time": "18:58:12", "remaining_time": "20:15:55"} +{"current_steps": 499, "total_steps": 1030, "loss": 0.4483, "lr": 4.9070673344841645e-05, "epoch": 2.421858420494164, "percentage": 48.45, "elapsed_time": "19:02:06", "remaining_time": "20:15:20"} +{"current_steps": 500, "total_steps": 1030, "loss": 0.4513, "lr": 4.893859340620348e-05, "epoch": 2.4267091102016067, "percentage": 48.54, "elapsed_time": "19:05:59", "remaining_time": "20:14:45"} +{"current_steps": 501, "total_steps": 1030, "loss": 0.4439, "lr": 4.880641080572522e-05, "epoch": 2.4315597999090497, "percentage": 48.64, "elapsed_time": "19:09:52", "remaining_time": "20:14:08"} +{"current_steps": 502, "total_steps": 1030, "loss": 0.4486, "lr": 4.8674127061555025e-05, "epoch": 2.436410489616492, "percentage": 48.74, "elapsed_time": "19:13:46", "remaining_time": "20:13:32"} +{"current_steps": 503, "total_steps": 1030, "loss": 0.4598, "lr": 4.8541743693002676e-05, "epoch": 2.441261179323935, "percentage": 48.83, "elapsed_time": "19:17:40", "remaining_time": "20:12:54"} +{"current_steps": 504, "total_steps": 1030, "loss": 0.4485, "lr": 4.8409262220522196e-05, "epoch": 2.4461118690313777, "percentage": 48.93, "elapsed_time": "19:21:34", "remaining_time": "20:12:16"} +{"current_steps": 505, "total_steps": 1030, "loss": 0.4454, "lr": 4.8276684165694336e-05, "epoch": 2.4509625587388206, "percentage": 49.03, "elapsed_time": "19:25:28", "remaining_time": "20:11:38"} +{"current_steps": 506, "total_steps": 1030, "loss": 0.4502, "lr": 4.814401105120914e-05, "epoch": 2.4558132484462636, "percentage": 49.13, "elapsed_time": "19:29:22", "remaining_time": "20:10:58"} +{"current_steps": 507, "total_steps": 1030, "loss": 0.4455, "lr": 4.8011244400848414e-05, "epoch": 2.460663938153706, "percentage": 49.22, "elapsed_time": "19:33:16", "remaining_time": "20:10:18"} +{"current_steps": 508, "total_steps": 1030, "loss": 0.4522, "lr": 4.787838573946825e-05, "epoch": 2.465514627861149, "percentage": 49.32, "elapsed_time": "19:37:11", "remaining_time": "20:09:37"} +{"current_steps": 509, "total_steps": 1030, "loss": 0.4422, "lr": 4.774543659298152e-05, "epoch": 2.470365317568592, "percentage": 49.42, "elapsed_time": "19:41:04", "remaining_time": "20:08:55"} +{"current_steps": 510, "total_steps": 1030, "loss": 0.4456, "lr": 4.761239848834031e-05, "epoch": 2.4752160072760345, "percentage": 49.51, "elapsed_time": "19:44:58", "remaining_time": "20:08:12"} +{"current_steps": 511, "total_steps": 1030, "loss": 0.447, "lr": 4.747927295351845e-05, "epoch": 2.4800666969834775, "percentage": 49.61, "elapsed_time": "19:48:52", "remaining_time": "20:07:29"} +{"current_steps": 512, "total_steps": 1030, "loss": 0.4494, "lr": 4.734606151749389e-05, "epoch": 2.48491738669092, "percentage": 49.71, "elapsed_time": "19:52:46", "remaining_time": "20:06:45"} +{"current_steps": 513, "total_steps": 1030, "loss": 0.4467, "lr": 4.7212765710231204e-05, "epoch": 2.489768076398363, "percentage": 49.81, "elapsed_time": "19:56:40", "remaining_time": "20:06:00"} +{"current_steps": 514, "total_steps": 1030, "loss": 0.4492, "lr": 4.707938706266397e-05, "epoch": 2.4946187661058055, "percentage": 49.9, "elapsed_time": "20:00:34", "remaining_time": "20:05:14"} +{"current_steps": 515, "total_steps": 1030, "loss": 0.4434, "lr": 4.694592710667723e-05, "epoch": 2.4994694558132484, "percentage": 50.0, "elapsed_time": "20:04:28", "remaining_time": "20:04:28"} +{"current_steps": 516, "total_steps": 1030, "loss": 0.444, "lr": 4.681238737508983e-05, "epoch": 2.5043201455206914, "percentage": 50.1, "elapsed_time": "20:08:22", "remaining_time": "20:03:41"} +{"current_steps": 517, "total_steps": 1030, "loss": 0.4429, "lr": 4.6678769401636894e-05, "epoch": 2.509170835228134, "percentage": 50.19, "elapsed_time": "20:12:16", "remaining_time": "20:02:54"} +{"current_steps": 518, "total_steps": 1030, "loss": 0.4566, "lr": 4.6545074720952166e-05, "epoch": 2.514021524935577, "percentage": 50.29, "elapsed_time": "20:16:10", "remaining_time": "20:02:05"} +{"current_steps": 519, "total_steps": 1030, "loss": 0.4397, "lr": 4.641130486855038e-05, "epoch": 2.51887221464302, "percentage": 50.39, "elapsed_time": "20:20:04", "remaining_time": "20:01:16"} +{"current_steps": 520, "total_steps": 1030, "loss": 0.4442, "lr": 4.627746138080966e-05, "epoch": 2.5237229043504623, "percentage": 50.49, "elapsed_time": "20:23:58", "remaining_time": "20:00:26"} +{"current_steps": 521, "total_steps": 1030, "loss": 0.4452, "lr": 4.614354579495379e-05, "epoch": 2.5285735940579053, "percentage": 50.58, "elapsed_time": "20:27:52", "remaining_time": "19:59:35"} +{"current_steps": 522, "total_steps": 1030, "loss": 0.4445, "lr": 4.6009559649034695e-05, "epoch": 2.533424283765348, "percentage": 50.68, "elapsed_time": "20:31:45", "remaining_time": "19:58:43"} +{"current_steps": 523, "total_steps": 1030, "loss": 0.4457, "lr": 4.587550448191465e-05, "epoch": 2.5382749734727907, "percentage": 50.78, "elapsed_time": "20:35:39", "remaining_time": "19:57:51"} +{"current_steps": 524, "total_steps": 1030, "loss": 0.457, "lr": 4.5741381833248655e-05, "epoch": 2.5431256631802333, "percentage": 50.87, "elapsed_time": "20:39:32", "remaining_time": "19:56:58"} +{"current_steps": 525, "total_steps": 1030, "loss": 0.4457, "lr": 4.560719324346677e-05, "epoch": 2.547976352887676, "percentage": 50.97, "elapsed_time": "20:43:26", "remaining_time": "19:56:04"} +{"current_steps": 526, "total_steps": 1030, "loss": 0.4471, "lr": 4.547294025375641e-05, "epoch": 2.552827042595119, "percentage": 51.07, "elapsed_time": "20:47:20", "remaining_time": "19:55:10"} +{"current_steps": 527, "total_steps": 1030, "loss": 0.4485, "lr": 4.533862440604461e-05, "epoch": 2.5576777323025617, "percentage": 51.17, "elapsed_time": "20:51:13", "remaining_time": "19:54:14"} +{"current_steps": 528, "total_steps": 1030, "loss": 0.4394, "lr": 4.520424724298036e-05, "epoch": 2.5625284220100046, "percentage": 51.26, "elapsed_time": "20:55:06", "remaining_time": "19:53:18"} +{"current_steps": 529, "total_steps": 1030, "loss": 0.446, "lr": 4.5069810307916874e-05, "epoch": 2.5673791117174476, "percentage": 51.36, "elapsed_time": "20:59:00", "remaining_time": "19:52:22"} +{"current_steps": 530, "total_steps": 1030, "loss": 0.4414, "lr": 4.493531514489385e-05, "epoch": 2.57222980142489, "percentage": 51.46, "elapsed_time": "21:02:54", "remaining_time": "19:51:25"} +{"current_steps": 531, "total_steps": 1030, "loss": 0.4442, "lr": 4.480076329861977e-05, "epoch": 2.5770804911323326, "percentage": 51.55, "elapsed_time": "21:06:47", "remaining_time": "19:50:27"} +{"current_steps": 532, "total_steps": 1030, "loss": 0.4498, "lr": 4.46661563144541e-05, "epoch": 2.5819311808397756, "percentage": 51.65, "elapsed_time": "21:10:40", "remaining_time": "19:49:28"} +{"current_steps": 533, "total_steps": 1030, "loss": 0.4439, "lr": 4.453149573838962e-05, "epoch": 2.5867818705472185, "percentage": 51.75, "elapsed_time": "21:14:34", "remaining_time": "19:48:28"} +{"current_steps": 534, "total_steps": 1030, "loss": 0.4507, "lr": 4.43967831170346e-05, "epoch": 2.591632560254661, "percentage": 51.84, "elapsed_time": "21:18:27", "remaining_time": "19:47:29"} +{"current_steps": 535, "total_steps": 1030, "loss": 0.4481, "lr": 4.426201999759505e-05, "epoch": 2.596483249962104, "percentage": 51.94, "elapsed_time": "21:22:20", "remaining_time": "19:46:28"} +{"current_steps": 536, "total_steps": 1030, "loss": 0.441, "lr": 4.4127207927857e-05, "epoch": 2.601333939669547, "percentage": 52.04, "elapsed_time": "21:26:14", "remaining_time": "19:45:27"} +{"current_steps": 537, "total_steps": 1030, "loss": 0.4577, "lr": 4.3992348456168666e-05, "epoch": 2.6061846293769895, "percentage": 52.14, "elapsed_time": "21:30:07", "remaining_time": "19:44:24"} +{"current_steps": 538, "total_steps": 1030, "loss": 0.4434, "lr": 4.385744313142267e-05, "epoch": 2.6110353190844324, "percentage": 52.23, "elapsed_time": "21:34:00", "remaining_time": "19:43:22"} +{"current_steps": 539, "total_steps": 1030, "loss": 0.4411, "lr": 4.372249350303828e-05, "epoch": 2.615886008791875, "percentage": 52.33, "elapsed_time": "21:37:54", "remaining_time": "19:42:19"} +{"current_steps": 540, "total_steps": 1030, "loss": 0.456, "lr": 4.358750112094363e-05, "epoch": 2.620736698499318, "percentage": 52.43, "elapsed_time": "21:41:47", "remaining_time": "19:41:15"} +{"current_steps": 541, "total_steps": 1030, "loss": 0.4345, "lr": 4.3452467535557846e-05, "epoch": 2.6255873882067604, "percentage": 52.52, "elapsed_time": "21:45:40", "remaining_time": "19:40:10"} +{"current_steps": 542, "total_steps": 1030, "loss": 0.4542, "lr": 4.3317394297773304e-05, "epoch": 2.6304380779142034, "percentage": 52.62, "elapsed_time": "21:49:35", "remaining_time": "19:39:06"} +{"current_steps": 543, "total_steps": 1030, "loss": 0.4333, "lr": 4.3182282958937816e-05, "epoch": 2.6352887676216463, "percentage": 52.72, "elapsed_time": "21:53:28", "remaining_time": "19:38:01"} +{"current_steps": 544, "total_steps": 1030, "loss": 0.4476, "lr": 4.304713507083673e-05, "epoch": 2.640139457329089, "percentage": 52.82, "elapsed_time": "21:57:22", "remaining_time": "19:36:55"} +{"current_steps": 545, "total_steps": 1030, "loss": 0.4469, "lr": 4.291195218567523e-05, "epoch": 2.644990147036532, "percentage": 52.91, "elapsed_time": "22:01:16", "remaining_time": "19:35:48"} +{"current_steps": 546, "total_steps": 1030, "loss": 0.4402, "lr": 4.277673585606046e-05, "epoch": 2.6498408367439747, "percentage": 53.01, "elapsed_time": "22:05:09", "remaining_time": "19:34:41"} +{"current_steps": 547, "total_steps": 1030, "loss": 0.4597, "lr": 4.264148763498364e-05, "epoch": 2.6546915264514173, "percentage": 53.11, "elapsed_time": "22:09:03", "remaining_time": "19:33:33"} +{"current_steps": 548, "total_steps": 1030, "loss": 0.4401, "lr": 4.250620907580226e-05, "epoch": 2.65954221615886, "percentage": 53.2, "elapsed_time": "22:12:57", "remaining_time": "19:32:24"} +{"current_steps": 549, "total_steps": 1030, "loss": 0.4483, "lr": 4.237090173222231e-05, "epoch": 2.6643929058663027, "percentage": 53.3, "elapsed_time": "22:16:51", "remaining_time": "19:31:16"} +{"current_steps": 550, "total_steps": 1030, "loss": 0.4499, "lr": 4.223556715828033e-05, "epoch": 2.6692435955737457, "percentage": 53.4, "elapsed_time": "22:20:45", "remaining_time": "19:30:06"} +{"current_steps": 551, "total_steps": 1030, "loss": 0.4507, "lr": 4.2100206908325603e-05, "epoch": 2.674094285281188, "percentage": 53.5, "elapsed_time": "22:24:38", "remaining_time": "19:28:56"} +{"current_steps": 552, "total_steps": 1030, "loss": 0.4409, "lr": 4.196482253700235e-05, "epoch": 2.678944974988631, "percentage": 53.59, "elapsed_time": "22:28:32", "remaining_time": "19:27:45"} +{"current_steps": 553, "total_steps": 1030, "loss": 0.4446, "lr": 4.182941559923179e-05, "epoch": 2.683795664696074, "percentage": 53.69, "elapsed_time": "22:32:26", "remaining_time": "19:26:34"} +{"current_steps": 554, "total_steps": 1030, "loss": 0.4437, "lr": 4.169398765019433e-05, "epoch": 2.6886463544035166, "percentage": 53.79, "elapsed_time": "22:36:19", "remaining_time": "19:25:21"} +{"current_steps": 555, "total_steps": 1030, "loss": 0.442, "lr": 4.15585402453117e-05, "epoch": 2.6934970441109596, "percentage": 53.88, "elapsed_time": "22:40:12", "remaining_time": "19:24:08"} +{"current_steps": 556, "total_steps": 1030, "loss": 0.4418, "lr": 4.14230749402291e-05, "epoch": 2.6983477338184025, "percentage": 53.98, "elapsed_time": "22:44:06", "remaining_time": "19:22:55"} +{"current_steps": 557, "total_steps": 1030, "loss": 0.4338, "lr": 4.128759329079732e-05, "epoch": 2.703198423525845, "percentage": 54.08, "elapsed_time": "22:48:00", "remaining_time": "19:21:41"} +{"current_steps": 558, "total_steps": 1030, "loss": 0.4355, "lr": 4.115209685305482e-05, "epoch": 2.708049113233288, "percentage": 54.17, "elapsed_time": "22:51:53", "remaining_time": "19:20:26"} +{"current_steps": 559, "total_steps": 1030, "loss": 0.4423, "lr": 4.101658718320998e-05, "epoch": 2.7128998029407305, "percentage": 54.27, "elapsed_time": "22:55:46", "remaining_time": "19:19:11"} +{"current_steps": 560, "total_steps": 1030, "loss": 0.4468, "lr": 4.088106583762309e-05, "epoch": 2.7177504926481735, "percentage": 54.37, "elapsed_time": "22:59:40", "remaining_time": "19:17:56"} +{"current_steps": 561, "total_steps": 1030, "loss": 0.449, "lr": 4.074553437278857e-05, "epoch": 2.722601182355616, "percentage": 54.47, "elapsed_time": "23:03:34", "remaining_time": "19:16:40"} +{"current_steps": 562, "total_steps": 1030, "loss": 0.4466, "lr": 4.060999434531704e-05, "epoch": 2.727451872063059, "percentage": 54.56, "elapsed_time": "23:07:28", "remaining_time": "19:15:24"} +{"current_steps": 563, "total_steps": 1030, "loss": 0.4432, "lr": 4.047444731191751e-05, "epoch": 2.732302561770502, "percentage": 54.66, "elapsed_time": "23:11:22", "remaining_time": "19:14:07"} +{"current_steps": 564, "total_steps": 1030, "loss": 0.4448, "lr": 4.033889482937943e-05, "epoch": 2.7371532514779444, "percentage": 54.76, "elapsed_time": "23:15:16", "remaining_time": "19:12:50"} +{"current_steps": 565, "total_steps": 1030, "loss": 0.4557, "lr": 4.020333845455478e-05, "epoch": 2.7420039411853874, "percentage": 54.85, "elapsed_time": "23:19:10", "remaining_time": "19:11:31"} +{"current_steps": 566, "total_steps": 1030, "loss": 0.4449, "lr": 4.0067779744340345e-05, "epoch": 2.7468546308928303, "percentage": 54.95, "elapsed_time": "23:23:03", "remaining_time": "19:10:12"} +{"current_steps": 567, "total_steps": 1030, "loss": 0.4471, "lr": 3.993222025565966e-05, "epoch": 2.751705320600273, "percentage": 55.05, "elapsed_time": "23:26:56", "remaining_time": "19:08:52"} +{"current_steps": 568, "total_steps": 1030, "loss": 0.4453, "lr": 3.979666154544522e-05, "epoch": 2.7565560103077154, "percentage": 55.15, "elapsed_time": "23:30:50", "remaining_time": "19:07:33"} +{"current_steps": 569, "total_steps": 1030, "loss": 0.4428, "lr": 3.96611051706206e-05, "epoch": 2.7614067000151583, "percentage": 55.24, "elapsed_time": "23:34:44", "remaining_time": "19:06:12"} +{"current_steps": 570, "total_steps": 1030, "loss": 0.4502, "lr": 3.9525552688082494e-05, "epoch": 2.7662573897226013, "percentage": 55.34, "elapsed_time": "23:38:37", "remaining_time": "19:04:50"} +{"current_steps": 571, "total_steps": 1030, "loss": 0.4432, "lr": 3.939000565468297e-05, "epoch": 2.771108079430044, "percentage": 55.44, "elapsed_time": "23:42:30", "remaining_time": "19:03:29"} +{"current_steps": 572, "total_steps": 1030, "loss": 0.4463, "lr": 3.9254465627211444e-05, "epoch": 2.7759587691374867, "percentage": 55.53, "elapsed_time": "23:46:24", "remaining_time": "19:02:07"} +{"current_steps": 573, "total_steps": 1030, "loss": 0.4438, "lr": 3.911893416237693e-05, "epoch": 2.7808094588449297, "percentage": 55.63, "elapsed_time": "23:50:18", "remaining_time": "19:00:45"} +{"current_steps": 574, "total_steps": 1030, "loss": 0.4405, "lr": 3.8983412816790045e-05, "epoch": 2.785660148552372, "percentage": 55.73, "elapsed_time": "23:54:12", "remaining_time": "18:59:22"} +{"current_steps": 413, "total_steps": 1030, "loss": 0.4473, "lr": 5.988248735527793e-05, "epoch": 2.004850689707443, "percentage": 40.1, "elapsed_time": "0:04:10", "remaining_time": "0:06:14"} +{"current_steps": 414, "total_steps": 1030, "loss": 0.4501, "lr": 5.9764746355528994e-05, "epoch": 2.0097013794148855, "percentage": 40.19, "elapsed_time": "0:08:04", "remaining_time": "0:12:00"} +{"current_steps": 415, "total_steps": 1030, "loss": 0.4483, "lr": 5.964677835303615e-05, "epoch": 2.0145520691223284, "percentage": 40.29, "elapsed_time": "0:11:57", "remaining_time": "0:17:43"} +{"current_steps": 416, "total_steps": 1030, "loss": 0.4468, "lr": 5.952858470268955e-05, "epoch": 2.019402758829771, "percentage": 40.39, "elapsed_time": "0:15:51", "remaining_time": "0:23:24"} +{"current_steps": 417, "total_steps": 1030, "loss": 0.4499, "lr": 5.941016676197098e-05, "epoch": 2.024253448537214, "percentage": 40.49, "elapsed_time": "0:19:45", "remaining_time": "0:29:02"} +{"current_steps": 418, "total_steps": 1030, "loss": 0.4498, "lr": 5.929152589093825e-05, "epoch": 2.029104138244657, "percentage": 40.58, "elapsed_time": "0:23:39", "remaining_time": "0:34:38"} +{"current_steps": 419, "total_steps": 1030, "loss": 0.449, "lr": 5.9172663452209554e-05, "epoch": 2.0339548279520994, "percentage": 40.68, "elapsed_time": "0:27:33", "remaining_time": "0:40:10"} +{"current_steps": 420, "total_steps": 1030, "loss": 0.4555, "lr": 5.9053580810947845e-05, "epoch": 2.0388055176595423, "percentage": 40.78, "elapsed_time": "0:31:26", "remaining_time": "0:45:39"} +{"current_steps": 421, "total_steps": 1030, "loss": 0.4537, "lr": 5.89342793348452e-05, "epoch": 2.043656207366985, "percentage": 40.87, "elapsed_time": "0:35:19", "remaining_time": "0:51:06"} +{"current_steps": 422, "total_steps": 1030, "loss": 0.4579, "lr": 5.881476039410699e-05, "epoch": 2.048506897074428, "percentage": 40.97, "elapsed_time": "0:39:13", "remaining_time": "0:56:31"} +{"current_steps": 423, "total_steps": 1030, "loss": 0.4478, "lr": 5.869502536143629e-05, "epoch": 2.0533575867818707, "percentage": 41.07, "elapsed_time": "0:43:18", "remaining_time": "1:02:09"} +{"current_steps": 424, "total_steps": 1030, "loss": 0.4501, "lr": 5.857507561201802e-05, "epoch": 2.0582082764893133, "percentage": 41.17, "elapsed_time": "0:47:11", "remaining_time": "1:07:27"} +{"current_steps": 425, "total_steps": 1030, "loss": 0.4479, "lr": 5.845491252350312e-05, "epoch": 2.063058966196756, "percentage": 41.26, "elapsed_time": "0:51:05", "remaining_time": "1:12:43"} +{"current_steps": 426, "total_steps": 1030, "loss": 0.4466, "lr": 5.833453747599286e-05, "epoch": 2.0679096559041987, "percentage": 41.36, "elapsed_time": "0:54:59", "remaining_time": "1:17:58"} +{"current_steps": 427, "total_steps": 1030, "loss": 0.449, "lr": 5.821395185202285e-05, "epoch": 2.0727603456116417, "percentage": 41.46, "elapsed_time": "0:58:53", "remaining_time": "1:23:10"} +{"current_steps": 428, "total_steps": 1030, "loss": 0.4581, "lr": 5.809315703654726e-05, "epoch": 2.0776110353190846, "percentage": 41.55, "elapsed_time": "1:02:47", "remaining_time": "1:28:19"} +{"current_steps": 429, "total_steps": 1030, "loss": 0.4534, "lr": 5.797215441692284e-05, "epoch": 2.082461725026527, "percentage": 41.65, "elapsed_time": "1:06:41", "remaining_time": "1:33:26"} +{"current_steps": 430, "total_steps": 1030, "loss": 0.4537, "lr": 5.785094538289304e-05, "epoch": 2.08731241473397, "percentage": 41.75, "elapsed_time": "1:10:35", "remaining_time": "1:38:30"} +{"current_steps": 431, "total_steps": 1030, "loss": 0.4553, "lr": 5.772953132657202e-05, "epoch": 2.0921631044414126, "percentage": 41.84, "elapsed_time": "1:14:29", "remaining_time": "1:43:31"} +{"current_steps": 432, "total_steps": 1030, "loss": 0.4424, "lr": 5.7607913642428666e-05, "epoch": 2.0970137941488556, "percentage": 41.94, "elapsed_time": "1:18:23", "remaining_time": "1:48:31"} +{"current_steps": 433, "total_steps": 1030, "loss": 0.4462, "lr": 5.7486093727270606e-05, "epoch": 2.101864483856298, "percentage": 42.04, "elapsed_time": "1:22:17", "remaining_time": "1:53:27"} +{"current_steps": 434, "total_steps": 1030, "loss": 0.4434, "lr": 5.736407298022809e-05, "epoch": 2.106715173563741, "percentage": 42.14, "elapsed_time": "1:26:11", "remaining_time": "1:58:21"} +{"current_steps": 435, "total_steps": 1030, "loss": 0.4533, "lr": 5.7241852802738e-05, "epoch": 2.111565863271184, "percentage": 42.23, "elapsed_time": "1:30:05", "remaining_time": "2:03:13"} +{"current_steps": 436, "total_steps": 1030, "loss": 0.4427, "lr": 5.711943459852772e-05, "epoch": 2.1164165529786265, "percentage": 42.33, "elapsed_time": "1:33:59", "remaining_time": "2:08:03"} +{"current_steps": 437, "total_steps": 1030, "loss": 0.4385, "lr": 5.699681977359902e-05, "epoch": 2.1212672426860695, "percentage": 42.43, "elapsed_time": "1:37:53", "remaining_time": "2:12:49"} +{"current_steps": 438, "total_steps": 1030, "loss": 0.4465, "lr": 5.6874009736211896e-05, "epoch": 2.1261179323935124, "percentage": 42.52, "elapsed_time": "1:41:47", "remaining_time": "2:17:34"} +{"current_steps": 439, "total_steps": 1030, "loss": 0.4472, "lr": 5.675100589686839e-05, "epoch": 2.130968622100955, "percentage": 42.62, "elapsed_time": "1:45:41", "remaining_time": "2:22:16"} +{"current_steps": 440, "total_steps": 1030, "loss": 0.4486, "lr": 5.662780966829646e-05, "epoch": 2.135819311808398, "percentage": 42.72, "elapsed_time": "1:49:35", "remaining_time": "2:26:57"} +{"current_steps": 441, "total_steps": 1030, "loss": 0.4525, "lr": 5.650442246543364e-05, "epoch": 2.1406700015158404, "percentage": 42.82, "elapsed_time": "1:53:29", "remaining_time": "2:31:34"} +{"current_steps": 442, "total_steps": 1030, "loss": 0.4451, "lr": 5.638084570541088e-05, "epoch": 2.1455206912232834, "percentage": 42.91, "elapsed_time": "1:57:23", "remaining_time": "2:36:10"} +{"current_steps": 443, "total_steps": 1030, "loss": 0.455, "lr": 5.625708080753621e-05, "epoch": 2.150371380930726, "percentage": 43.01, "elapsed_time": "2:01:17", "remaining_time": "2:40:43"} +{"current_steps": 444, "total_steps": 1030, "loss": 0.4453, "lr": 5.6133129193278525e-05, "epoch": 2.155222070638169, "percentage": 43.11, "elapsed_time": "2:05:12", "remaining_time": "2:45:14"} +{"current_steps": 445, "total_steps": 1030, "loss": 0.4523, "lr": 5.600899228625112e-05, "epoch": 2.160072760345612, "percentage": 43.2, "elapsed_time": "2:09:05", "remaining_time": "2:49:41"} +{"current_steps": 446, "total_steps": 1030, "loss": 0.4481, "lr": 5.588467151219549e-05, "epoch": 2.1649234500530543, "percentage": 43.3, "elapsed_time": "2:12:58", "remaining_time": "2:54:06"} +{"current_steps": 447, "total_steps": 1030, "loss": 0.4397, "lr": 5.5760168298964874e-05, "epoch": 2.1697741397604973, "percentage": 43.4, "elapsed_time": "2:16:51", "remaining_time": "2:58:29"} +{"current_steps": 448, "total_steps": 1030, "loss": 0.4464, "lr": 5.563548407650782e-05, "epoch": 2.17462482946794, "percentage": 43.5, "elapsed_time": "2:20:45", "remaining_time": "3:02:50"} +{"current_steps": 449, "total_steps": 1030, "loss": 0.4487, "lr": 5.551062027685187e-05, "epoch": 2.1794755191753827, "percentage": 43.59, "elapsed_time": "2:24:38", "remaining_time": "3:07:10"} +{"current_steps": 450, "total_steps": 1030, "loss": 0.4481, "lr": 5.5385578334087006e-05, "epoch": 2.1843262088828257, "percentage": 43.69, "elapsed_time": "2:28:31", "remaining_time": "3:11:26"} +{"current_steps": 451, "total_steps": 1030, "loss": 0.4469, "lr": 5.526035968434927e-05, "epoch": 2.189176898590268, "percentage": 43.79, "elapsed_time": "2:32:25", "remaining_time": "3:15:40"} +{"current_steps": 452, "total_steps": 1030, "loss": 0.4573, "lr": 5.513496576580418e-05, "epoch": 2.194027588297711, "percentage": 43.88, "elapsed_time": "2:36:19", "remaining_time": "3:19:54"} +{"current_steps": 453, "total_steps": 1030, "loss": 0.4498, "lr": 5.5009398018630276e-05, "epoch": 2.1988782780051537, "percentage": 43.98, "elapsed_time": "2:40:13", "remaining_time": "3:24:04"} +{"current_steps": 454, "total_steps": 1030, "loss": 0.4449, "lr": 5.4883657885002575e-05, "epoch": 2.2037289677125966, "percentage": 44.08, "elapsed_time": "2:44:06", "remaining_time": "3:28:12"} +{"current_steps": 455, "total_steps": 1030, "loss": 0.443, "lr": 5.475774680907597e-05, "epoch": 2.2085796574200396, "percentage": 44.17, "elapsed_time": "2:48:00", "remaining_time": "3:32:18"} +{"current_steps": 456, "total_steps": 1030, "loss": 0.4434, "lr": 5.463166623696868e-05, "epoch": 2.213430347127482, "percentage": 44.27, "elapsed_time": "2:51:53", "remaining_time": "3:36:21"} +{"current_steps": 457, "total_steps": 1030, "loss": 0.4445, "lr": 5.450541761674562e-05, "epoch": 2.218281036834925, "percentage": 44.37, "elapsed_time": "2:55:47", "remaining_time": "3:40:24"} +{"current_steps": 458, "total_steps": 1030, "loss": 0.4465, "lr": 5.437900239840179e-05, "epoch": 2.2231317265423676, "percentage": 44.47, "elapsed_time": "2:59:40", "remaining_time": "3:44:23"} +{"current_steps": 459, "total_steps": 1030, "loss": 0.4453, "lr": 5.42524220338456e-05, "epoch": 2.2279824162498105, "percentage": 44.56, "elapsed_time": "3:03:33", "remaining_time": "3:48:20"} +{"current_steps": 460, "total_steps": 1030, "loss": 0.4498, "lr": 5.412567797688219e-05, "epoch": 2.2328331059572535, "percentage": 44.66, "elapsed_time": "3:07:27", "remaining_time": "3:52:16"} +{"current_steps": 461, "total_steps": 1030, "loss": 0.4527, "lr": 5.3998771683196754e-05, "epoch": 2.237683795664696, "percentage": 44.76, "elapsed_time": "3:11:21", "remaining_time": "3:56:11"} +{"current_steps": 462, "total_steps": 1030, "loss": 0.4444, "lr": 5.3871704610337836e-05, "epoch": 2.242534485372139, "percentage": 44.85, "elapsed_time": "3:15:15", "remaining_time": "4:00:03"} +{"current_steps": 463, "total_steps": 1030, "loss": 0.4431, "lr": 5.374447821770053e-05, "epoch": 2.2473851750795815, "percentage": 44.95, "elapsed_time": "3:19:09", "remaining_time": "4:03:53"} +{"current_steps": 464, "total_steps": 1030, "loss": 0.4404, "lr": 5.361709396650977e-05, "epoch": 2.2522358647870244, "percentage": 45.05, "elapsed_time": "3:23:03", "remaining_time": "4:07:42"} +{"current_steps": 465, "total_steps": 1030, "loss": 0.4496, "lr": 5.3489553319803566e-05, "epoch": 2.2570865544944674, "percentage": 45.15, "elapsed_time": "3:26:57", "remaining_time": "4:11:27"} +{"current_steps": 466, "total_steps": 1030, "loss": 0.4469, "lr": 5.336185774241609e-05, "epoch": 2.26193724420191, "percentage": 45.24, "elapsed_time": "3:30:50", "remaining_time": "4:15:10"} +{"current_steps": 467, "total_steps": 1030, "loss": 0.4505, "lr": 5.3234008700961e-05, "epoch": 2.266787933909353, "percentage": 45.34, "elapsed_time": "3:34:43", "remaining_time": "4:18:52"} +{"current_steps": 468, "total_steps": 1030, "loss": 0.4406, "lr": 5.3106007663814505e-05, "epoch": 2.2716386236167954, "percentage": 45.44, "elapsed_time": "3:38:37", "remaining_time": "4:22:31"} +{"current_steps": 469, "total_steps": 1030, "loss": 0.4525, "lr": 5.2977856101098484e-05, "epoch": 2.2764893133242383, "percentage": 45.53, "elapsed_time": "3:42:30", "remaining_time": "4:26:09"} +{"current_steps": 470, "total_steps": 1030, "loss": 0.4592, "lr": 5.284955548466371e-05, "epoch": 2.281340003031681, "percentage": 45.63, "elapsed_time": "3:46:23", "remaining_time": "4:29:45"} +{"current_steps": 471, "total_steps": 1030, "loss": 0.4459, "lr": 5.272110728807279e-05, "epoch": 2.286190692739124, "percentage": 45.73, "elapsed_time": "3:50:17", "remaining_time": "4:33:18"} +{"current_steps": 472, "total_steps": 1030, "loss": 0.4523, "lr": 5.25925129865834e-05, "epoch": 2.2910413824465667, "percentage": 45.83, "elapsed_time": "3:54:10", "remaining_time": "4:36:50"} +{"current_steps": 473, "total_steps": 1030, "loss": 0.4426, "lr": 5.246377405713121e-05, "epoch": 2.2958920721540093, "percentage": 45.92, "elapsed_time": "3:58:03", "remaining_time": "4:40:20"} +{"current_steps": 474, "total_steps": 1030, "loss": 0.4426, "lr": 5.2334891978313006e-05, "epoch": 2.300742761861452, "percentage": 46.02, "elapsed_time": "4:01:57", "remaining_time": "4:43:48"} +{"current_steps": 475, "total_steps": 1030, "loss": 0.4458, "lr": 5.220586823036966e-05, "epoch": 2.305593451568895, "percentage": 46.12, "elapsed_time": "4:05:51", "remaining_time": "4:47:16"} +{"current_steps": 476, "total_steps": 1030, "loss": 0.4433, "lr": 5.207670429516915e-05, "epoch": 2.3104441412763377, "percentage": 46.21, "elapsed_time": "4:09:45", "remaining_time": "4:50:40"} +{"current_steps": 477, "total_steps": 1030, "loss": 0.4593, "lr": 5.1947401656189546e-05, "epoch": 2.3152948309837806, "percentage": 46.31, "elapsed_time": "4:13:39", "remaining_time": "4:54:04"} +{"current_steps": 478, "total_steps": 1030, "loss": 0.4424, "lr": 5.181796179850197e-05, "epoch": 2.320145520691223, "percentage": 46.41, "elapsed_time": "4:17:33", "remaining_time": "4:57:25"} +{"current_steps": 479, "total_steps": 1030, "loss": 0.4503, "lr": 5.168838620875352e-05, "epoch": 2.324996210398666, "percentage": 46.5, "elapsed_time": "4:21:26", "remaining_time": "5:00:44"} +{"current_steps": 480, "total_steps": 1030, "loss": 0.4506, "lr": 5.155867637515019e-05, "epoch": 2.3298469001061086, "percentage": 46.6, "elapsed_time": "4:25:19", "remaining_time": "5:04:01"} +{"current_steps": 481, "total_steps": 1030, "loss": 0.4513, "lr": 5.142883378743984e-05, "epoch": 2.3346975898135516, "percentage": 46.7, "elapsed_time": "4:29:13", "remaining_time": "5:07:17"} +{"current_steps": 482, "total_steps": 1030, "loss": 0.4488, "lr": 5.129885993689502e-05, "epoch": 2.3395482795209945, "percentage": 46.8, "elapsed_time": "4:33:07", "remaining_time": "5:10:31"} +{"current_steps": 483, "total_steps": 1030, "loss": 0.4456, "lr": 5.116875631629585e-05, "epoch": 2.344398969228437, "percentage": 46.89, "elapsed_time": "4:37:01", "remaining_time": "5:13:43"} +{"current_steps": 484, "total_steps": 1030, "loss": 0.4386, "lr": 5.10385244199129e-05, "epoch": 2.34924965893588, "percentage": 46.99, "elapsed_time": "4:40:56", "remaining_time": "5:16:55"} +{"current_steps": 485, "total_steps": 1030, "loss": 0.4482, "lr": 5.0908165743490047e-05, "epoch": 2.354100348643323, "percentage": 47.09, "elapsed_time": "4:44:50", "remaining_time": "5:20:04"} +{"current_steps": 486, "total_steps": 1030, "loss": 0.4496, "lr": 5.0777681784227224e-05, "epoch": 2.3589510383507655, "percentage": 47.18, "elapsed_time": "4:48:45", "remaining_time": "5:23:12"} +{"current_steps": 487, "total_steps": 1030, "loss": 0.4502, "lr": 5.064707404076327e-05, "epoch": 2.3638017280582084, "percentage": 47.28, "elapsed_time": "4:52:39", "remaining_time": "5:26:18"} +{"current_steps": 488, "total_steps": 1030, "loss": 0.448, "lr": 5.051634401315875e-05, "epoch": 2.368652417765651, "percentage": 47.38, "elapsed_time": "4:56:33", "remaining_time": "5:29:22"} +{"current_steps": 489, "total_steps": 1030, "loss": 0.4416, "lr": 5.0385493202878656e-05, "epoch": 2.373503107473094, "percentage": 47.48, "elapsed_time": "5:00:27", "remaining_time": "5:32:24"} +{"current_steps": 490, "total_steps": 1030, "loss": 0.4413, "lr": 5.025452311277522e-05, "epoch": 2.3783537971805364, "percentage": 47.57, "elapsed_time": "5:04:21", "remaining_time": "5:35:24"} +{"current_steps": 491, "total_steps": 1030, "loss": 0.4472, "lr": 5.01234352470706e-05, "epoch": 2.3832044868879794, "percentage": 47.67, "elapsed_time": "5:08:15", "remaining_time": "5:38:23"} +{"current_steps": 492, "total_steps": 1030, "loss": 0.4405, "lr": 4.999223111133968e-05, "epoch": 2.3880551765954223, "percentage": 47.77, "elapsed_time": "5:12:10", "remaining_time": "5:41:22"} +{"current_steps": 493, "total_steps": 1030, "loss": 0.44, "lr": 4.986091221249269e-05, "epoch": 2.392905866302865, "percentage": 47.86, "elapsed_time": "5:16:03", "remaining_time": "5:44:16"} +{"current_steps": 494, "total_steps": 1030, "loss": 0.4432, "lr": 4.972948005875796e-05, "epoch": 2.397756556010308, "percentage": 47.96, "elapsed_time": "5:19:57", "remaining_time": "5:47:09"} +{"current_steps": 495, "total_steps": 1030, "loss": 0.4401, "lr": 4.959793615966459e-05, "epoch": 2.4026072457177503, "percentage": 48.06, "elapsed_time": "5:23:51", "remaining_time": "5:50:01"} +{"current_steps": 496, "total_steps": 1030, "loss": 0.4526, "lr": 4.946628202602508e-05, "epoch": 2.4074579354251933, "percentage": 48.16, "elapsed_time": "5:27:44", "remaining_time": "5:52:51"} +{"current_steps": 497, "total_steps": 1030, "loss": 0.4474, "lr": 4.933451916991802e-05, "epoch": 2.412308625132636, "percentage": 48.25, "elapsed_time": "5:31:39", "remaining_time": "5:55:40"} +{"current_steps": 498, "total_steps": 1030, "loss": 0.4485, "lr": 4.920264910467066e-05, "epoch": 2.4171593148400787, "percentage": 48.35, "elapsed_time": "5:35:31", "remaining_time": "5:58:26"} +{"current_steps": 499, "total_steps": 1030, "loss": 0.4471, "lr": 4.9070673344841645e-05, "epoch": 2.4220100045475217, "percentage": 48.45, "elapsed_time": "5:39:25", "remaining_time": "6:01:11"} +{"current_steps": 500, "total_steps": 1030, "loss": 0.4518, "lr": 4.893859340620348e-05, "epoch": 2.426860694254964, "percentage": 48.54, "elapsed_time": "5:43:19", "remaining_time": "6:03:55"} +{"current_steps": 501, "total_steps": 1030, "loss": 0.4426, "lr": 4.880641080572522e-05, "epoch": 2.431711383962407, "percentage": 48.64, "elapsed_time": "5:47:12", "remaining_time": "6:06:36"} +{"current_steps": 502, "total_steps": 1030, "loss": 0.4492, "lr": 4.8674127061555025e-05, "epoch": 2.43656207366985, "percentage": 48.74, "elapsed_time": "5:51:06", "remaining_time": "6:09:17"} +{"current_steps": 503, "total_steps": 1030, "loss": 0.4576, "lr": 4.8541743693002676e-05, "epoch": 2.4414127633772926, "percentage": 48.83, "elapsed_time": "5:54:59", "remaining_time": "6:11:56"} +{"current_steps": 504, "total_steps": 1030, "loss": 0.4476, "lr": 4.8409262220522196e-05, "epoch": 2.4462634530847356, "percentage": 48.93, "elapsed_time": "5:58:53", "remaining_time": "6:14:33"} +{"current_steps": 505, "total_steps": 1030, "loss": 0.4479, "lr": 4.8276684165694336e-05, "epoch": 2.451114142792178, "percentage": 49.03, "elapsed_time": "6:02:47", "remaining_time": "6:17:09"} +{"current_steps": 506, "total_steps": 1030, "loss": 0.4479, "lr": 4.814401105120914e-05, "epoch": 2.455964832499621, "percentage": 49.13, "elapsed_time": "6:06:41", "remaining_time": "6:19:43"} +{"current_steps": 507, "total_steps": 1030, "loss": 0.4466, "lr": 4.8011244400848414e-05, "epoch": 2.460815522207064, "percentage": 49.22, "elapsed_time": "6:10:34", "remaining_time": "6:22:16"} +{"current_steps": 508, "total_steps": 1030, "loss": 0.4503, "lr": 4.787838573946825e-05, "epoch": 2.4656662119145065, "percentage": 49.32, "elapsed_time": "6:14:27", "remaining_time": "6:24:47"} +{"current_steps": 509, "total_steps": 1030, "loss": 0.4419, "lr": 4.774543659298152e-05, "epoch": 2.4705169016219495, "percentage": 49.42, "elapsed_time": "6:18:21", "remaining_time": "6:27:16"} +{"current_steps": 510, "total_steps": 1030, "loss": 0.4443, "lr": 4.761239848834031e-05, "epoch": 2.475367591329392, "percentage": 49.51, "elapsed_time": "6:22:15", "remaining_time": "6:29:45"} +{"current_steps": 511, "total_steps": 1030, "loss": 0.4474, "lr": 4.747927295351845e-05, "epoch": 2.480218281036835, "percentage": 49.61, "elapsed_time": "6:26:09", "remaining_time": "6:32:12"} +{"current_steps": 512, "total_steps": 1030, "loss": 0.4473, "lr": 4.734606151749389e-05, "epoch": 2.485068970744278, "percentage": 49.71, "elapsed_time": "6:30:03", "remaining_time": "6:34:38"} +{"current_steps": 513, "total_steps": 1030, "loss": 0.4481, "lr": 4.7212765710231204e-05, "epoch": 2.4899196604517204, "percentage": 49.81, "elapsed_time": "6:33:57", "remaining_time": "6:37:01"} +{"current_steps": 514, "total_steps": 1030, "loss": 0.4484, "lr": 4.707938706266397e-05, "epoch": 2.4947703501591634, "percentage": 49.9, "elapsed_time": "6:37:52", "remaining_time": "6:39:24"} +{"current_steps": 515, "total_steps": 1030, "loss": 0.444, "lr": 4.694592710667723e-05, "epoch": 2.499621039866606, "percentage": 50.0, "elapsed_time": "6:41:45", "remaining_time": "6:41:45"} +{"current_steps": 516, "total_steps": 1030, "loss": 0.4424, "lr": 4.681238737508983e-05, "epoch": 2.504471729574049, "percentage": 50.1, "elapsed_time": "6:45:39", "remaining_time": "6:44:05"} +{"current_steps": 517, "total_steps": 1030, "loss": 0.4444, "lr": 4.6678769401636894e-05, "epoch": 2.5093224192814914, "percentage": 50.19, "elapsed_time": "6:49:33", "remaining_time": "6:46:23"} +{"current_steps": 518, "total_steps": 1030, "loss": 0.456, "lr": 4.6545074720952166e-05, "epoch": 2.5141731089889343, "percentage": 50.29, "elapsed_time": "6:53:27", "remaining_time": "6:48:40"} +{"current_steps": 519, "total_steps": 1030, "loss": 0.4396, "lr": 4.641130486855038e-05, "epoch": 2.5190237986963773, "percentage": 50.39, "elapsed_time": "6:57:21", "remaining_time": "6:50:55"} +{"current_steps": 520, "total_steps": 1030, "loss": 0.4432, "lr": 4.627746138080966e-05, "epoch": 2.52387448840382, "percentage": 50.49, "elapsed_time": "7:01:15", "remaining_time": "6:53:09"} +{"current_steps": 521, "total_steps": 1030, "loss": 0.4448, "lr": 4.614354579495379e-05, "epoch": 2.5287251781112627, "percentage": 50.58, "elapsed_time": "7:05:09", "remaining_time": "6:55:21"} +{"current_steps": 522, "total_steps": 1030, "loss": 0.4432, "lr": 4.6009559649034695e-05, "epoch": 2.5335758678187057, "percentage": 50.68, "elapsed_time": "7:09:03", "remaining_time": "6:57:32"} +{"current_steps": 523, "total_steps": 1030, "loss": 0.4474, "lr": 4.587550448191465e-05, "epoch": 2.538426557526148, "percentage": 50.78, "elapsed_time": "7:12:56", "remaining_time": "6:59:41"} +{"current_steps": 524, "total_steps": 1030, "loss": 0.455, "lr": 4.5741381833248655e-05, "epoch": 2.543277247233591, "percentage": 50.87, "elapsed_time": "7:16:49", "remaining_time": "7:01:48"} +{"current_steps": 525, "total_steps": 1030, "loss": 0.4457, "lr": 4.560719324346677e-05, "epoch": 2.5481279369410337, "percentage": 50.97, "elapsed_time": "7:20:43", "remaining_time": "7:03:56"} +{"current_steps": 526, "total_steps": 1030, "loss": 0.4478, "lr": 4.547294025375641e-05, "epoch": 2.5529786266484766, "percentage": 51.07, "elapsed_time": "7:24:37", "remaining_time": "7:06:01"} +{"current_steps": 527, "total_steps": 1030, "loss": 0.447, "lr": 4.533862440604461e-05, "epoch": 2.557829316355919, "percentage": 51.17, "elapsed_time": "7:28:31", "remaining_time": "7:08:05"} +{"current_steps": 528, "total_steps": 1030, "loss": 0.4408, "lr": 4.520424724298036e-05, "epoch": 2.562680006063362, "percentage": 51.26, "elapsed_time": "7:32:25", "remaining_time": "7:10:08"} +{"current_steps": 529, "total_steps": 1030, "loss": 0.4441, "lr": 4.5069810307916874e-05, "epoch": 2.567530695770805, "percentage": 51.36, "elapsed_time": "7:36:19", "remaining_time": "7:12:09"} +{"current_steps": 530, "total_steps": 1030, "loss": 0.4425, "lr": 4.493531514489385e-05, "epoch": 2.5723813854782476, "percentage": 51.46, "elapsed_time": "7:40:12", "remaining_time": "7:14:09"} +{"current_steps": 531, "total_steps": 1030, "loss": 0.4433, "lr": 4.480076329861977e-05, "epoch": 2.5772320751856905, "percentage": 51.55, "elapsed_time": "7:44:05", "remaining_time": "7:16:07"} +{"current_steps": 532, "total_steps": 1030, "loss": 0.4487, "lr": 4.46661563144541e-05, "epoch": 2.5820827648931335, "percentage": 51.65, "elapsed_time": "7:47:59", "remaining_time": "7:18:04"} +{"current_steps": 533, "total_steps": 1030, "loss": 0.4445, "lr": 4.453149573838962e-05, "epoch": 2.586933454600576, "percentage": 51.75, "elapsed_time": "7:51:53", "remaining_time": "7:20:00"} +{"current_steps": 534, "total_steps": 1030, "loss": 0.4494, "lr": 4.43967831170346e-05, "epoch": 2.591784144308019, "percentage": 51.84, "elapsed_time": "7:55:47", "remaining_time": "7:21:56"} +{"current_steps": 535, "total_steps": 1030, "loss": 0.4484, "lr": 4.426201999759505e-05, "epoch": 2.5966348340154615, "percentage": 51.94, "elapsed_time": "7:59:41", "remaining_time": "7:23:49"} +{"current_steps": 536, "total_steps": 1030, "loss": 0.4419, "lr": 4.4127207927857e-05, "epoch": 2.6014855237229044, "percentage": 52.04, "elapsed_time": "8:03:35", "remaining_time": "7:25:41"} +{"current_steps": 537, "total_steps": 1030, "loss": 0.4568, "lr": 4.3992348456168666e-05, "epoch": 2.606336213430347, "percentage": 52.14, "elapsed_time": "8:07:29", "remaining_time": "7:27:32"} +{"current_steps": 538, "total_steps": 1030, "loss": 0.4427, "lr": 4.385744313142267e-05, "epoch": 2.61118690313779, "percentage": 52.23, "elapsed_time": "8:11:23", "remaining_time": "7:29:23"} +{"current_steps": 539, "total_steps": 1030, "loss": 0.4418, "lr": 4.372249350303828e-05, "epoch": 2.616037592845233, "percentage": 52.33, "elapsed_time": "8:15:17", "remaining_time": "7:31:10"} +{"current_steps": 540, "total_steps": 1030, "loss": 0.4544, "lr": 4.358750112094363e-05, "epoch": 2.6208882825526754, "percentage": 52.43, "elapsed_time": "8:19:11", "remaining_time": "7:32:58"} +{"current_steps": 541, "total_steps": 1030, "loss": 0.4372, "lr": 4.3452467535557846e-05, "epoch": 2.6257389722601183, "percentage": 52.52, "elapsed_time": "8:23:05", "remaining_time": "7:34:43"} +{"current_steps": 542, "total_steps": 1030, "loss": 0.4517, "lr": 4.3317394297773304e-05, "epoch": 2.6305896619675613, "percentage": 52.62, "elapsed_time": "8:26:58", "remaining_time": "7:36:28"} +{"current_steps": 543, "total_steps": 1030, "loss": 0.4333, "lr": 4.3182282958937816e-05, "epoch": 2.635440351675004, "percentage": 52.72, "elapsed_time": "8:30:52", "remaining_time": "7:38:11"} +{"current_steps": 544, "total_steps": 1030, "loss": 0.4481, "lr": 4.304713507083673e-05, "epoch": 2.6402910413824463, "percentage": 52.82, "elapsed_time": "8:34:45", "remaining_time": "7:39:52"} +{"current_steps": 545, "total_steps": 1030, "loss": 0.4466, "lr": 4.291195218567523e-05, "epoch": 2.6451417310898893, "percentage": 52.91, "elapsed_time": "8:38:39", "remaining_time": "7:41:33"} +{"current_steps": 546, "total_steps": 1030, "loss": 0.4405, "lr": 4.277673585606046e-05, "epoch": 2.649992420797332, "percentage": 53.01, "elapsed_time": "8:42:32", "remaining_time": "7:43:12"} +{"current_steps": 547, "total_steps": 1030, "loss": 0.4566, "lr": 4.264148763498364e-05, "epoch": 2.6548431105047747, "percentage": 53.11, "elapsed_time": "8:46:26", "remaining_time": "7:44:50"} +{"current_steps": 548, "total_steps": 1030, "loss": 0.4407, "lr": 4.250620907580226e-05, "epoch": 2.6596938002122177, "percentage": 53.2, "elapsed_time": "8:50:19", "remaining_time": "7:46:27"} +{"current_steps": 549, "total_steps": 1030, "loss": 0.4493, "lr": 4.237090173222231e-05, "epoch": 2.6645444899196606, "percentage": 53.3, "elapsed_time": "8:54:13", "remaining_time": "7:48:03"} +{"current_steps": 550, "total_steps": 1030, "loss": 0.4511, "lr": 4.223556715828033e-05, "epoch": 2.669395179627103, "percentage": 53.4, "elapsed_time": "8:58:07", "remaining_time": "7:49:38"} +{"current_steps": 551, "total_steps": 1030, "loss": 0.447, "lr": 4.2100206908325603e-05, "epoch": 2.674245869334546, "percentage": 53.5, "elapsed_time": "9:02:01", "remaining_time": "7:51:11"} +{"current_steps": 552, "total_steps": 1030, "loss": 0.4415, "lr": 4.196482253700235e-05, "epoch": 2.6790965590419886, "percentage": 53.59, "elapsed_time": "9:05:55", "remaining_time": "7:52:44"} +{"current_steps": 553, "total_steps": 1030, "loss": 0.4457, "lr": 4.182941559923179e-05, "epoch": 2.6839472487494316, "percentage": 53.69, "elapsed_time": "9:09:49", "remaining_time": "7:54:15"} +{"current_steps": 554, "total_steps": 1030, "loss": 0.4422, "lr": 4.169398765019433e-05, "epoch": 2.688797938456874, "percentage": 53.79, "elapsed_time": "9:13:43", "remaining_time": "7:55:45"} +{"current_steps": 555, "total_steps": 1030, "loss": 0.4429, "lr": 4.15585402453117e-05, "epoch": 2.693648628164317, "percentage": 53.88, "elapsed_time": "9:17:37", "remaining_time": "7:57:14"} +{"current_steps": 556, "total_steps": 1030, "loss": 0.4421, "lr": 4.14230749402291e-05, "epoch": 2.69849931787176, "percentage": 53.98, "elapsed_time": "9:21:31", "remaining_time": "7:58:42"} +{"current_steps": 557, "total_steps": 1030, "loss": 0.4318, "lr": 4.128759329079732e-05, "epoch": 2.7033500075792025, "percentage": 54.08, "elapsed_time": "9:25:25", "remaining_time": "8:00:09"} +{"current_steps": 558, "total_steps": 1030, "loss": 0.4374, "lr": 4.115209685305482e-05, "epoch": 2.7082006972866455, "percentage": 54.17, "elapsed_time": "9:29:19", "remaining_time": "8:01:34"} +{"current_steps": 559, "total_steps": 1030, "loss": 0.4429, "lr": 4.101658718320998e-05, "epoch": 2.7130513869940884, "percentage": 54.27, "elapsed_time": "9:33:13", "remaining_time": "8:02:59"} +{"current_steps": 560, "total_steps": 1030, "loss": 0.4456, "lr": 4.088106583762309e-05, "epoch": 2.717902076701531, "percentage": 54.37, "elapsed_time": "9:37:07", "remaining_time": "8:04:22"} +{"current_steps": 561, "total_steps": 1030, "loss": 0.4494, "lr": 4.074553437278857e-05, "epoch": 2.722752766408974, "percentage": 54.47, "elapsed_time": "9:41:01", "remaining_time": "8:05:44"} +{"current_steps": 562, "total_steps": 1030, "loss": 0.4449, "lr": 4.060999434531704e-05, "epoch": 2.7276034561164164, "percentage": 54.56, "elapsed_time": "9:44:55", "remaining_time": "8:07:05"} +{"current_steps": 563, "total_steps": 1030, "loss": 0.4426, "lr": 4.047444731191751e-05, "epoch": 2.7324541458238594, "percentage": 54.66, "elapsed_time": "9:48:49", "remaining_time": "8:08:25"} +{"current_steps": 564, "total_steps": 1030, "loss": 0.4445, "lr": 4.033889482937943e-05, "epoch": 2.737304835531302, "percentage": 54.76, "elapsed_time": "9:52:43", "remaining_time": "8:09:43"} +{"current_steps": 565, "total_steps": 1030, "loss": 0.4565, "lr": 4.020333845455478e-05, "epoch": 2.742155525238745, "percentage": 54.85, "elapsed_time": "9:56:37", "remaining_time": "8:11:01"} +{"current_steps": 566, "total_steps": 1030, "loss": 0.4459, "lr": 4.0067779744340345e-05, "epoch": 2.747006214946188, "percentage": 54.95, "elapsed_time": "10:00:31", "remaining_time": "8:12:18"} +{"current_steps": 567, "total_steps": 1030, "loss": 0.4447, "lr": 3.993222025565966e-05, "epoch": 2.7518569046536303, "percentage": 55.05, "elapsed_time": "10:04:25", "remaining_time": "8:13:33"} +{"current_steps": 568, "total_steps": 1030, "loss": 0.4452, "lr": 3.979666154544522e-05, "epoch": 2.7567075943610733, "percentage": 55.15, "elapsed_time": "10:08:19", "remaining_time": "8:14:48"} +{"current_steps": 569, "total_steps": 1030, "loss": 0.4421, "lr": 3.96611051706206e-05, "epoch": 2.7615582840685162, "percentage": 55.24, "elapsed_time": "10:12:13", "remaining_time": "8:16:01"} +{"current_steps": 570, "total_steps": 1030, "loss": 0.4509, "lr": 3.9525552688082494e-05, "epoch": 2.7664089737759587, "percentage": 55.34, "elapsed_time": "10:16:07", "remaining_time": "8:17:13"} +{"current_steps": 571, "total_steps": 1030, "loss": 0.4442, "lr": 3.939000565468297e-05, "epoch": 2.7712596634834017, "percentage": 55.44, "elapsed_time": "10:20:01", "remaining_time": "8:18:24"} +{"current_steps": 572, "total_steps": 1030, "loss": 0.4458, "lr": 3.9254465627211444e-05, "epoch": 2.776110353190844, "percentage": 55.53, "elapsed_time": "10:23:56", "remaining_time": "8:19:35"} +{"current_steps": 573, "total_steps": 1030, "loss": 0.4423, "lr": 3.911893416237693e-05, "epoch": 2.780961042898287, "percentage": 55.63, "elapsed_time": "10:27:49", "remaining_time": "8:20:43"} +{"current_steps": 574, "total_steps": 1030, "loss": 0.4415, "lr": 3.8983412816790045e-05, "epoch": 2.7858117326057297, "percentage": 55.73, "elapsed_time": "10:31:43", "remaining_time": "8:21:51"} +{"current_steps": 575, "total_steps": 1030, "loss": 0.4419, "lr": 3.8847903146945186e-05, "epoch": 2.7906624223131726, "percentage": 55.83, "elapsed_time": "10:35:37", "remaining_time": "8:22:58"} +{"current_steps": 576, "total_steps": 1030, "loss": 0.4477, "lr": 3.871240670920269e-05, "epoch": 2.7955131120206156, "percentage": 55.92, "elapsed_time": "10:39:32", "remaining_time": "8:24:04"} +{"current_steps": 577, "total_steps": 1030, "loss": 0.4458, "lr": 3.85769250597709e-05, "epoch": 2.800363801728058, "percentage": 56.02, "elapsed_time": "10:43:25", "remaining_time": "8:25:09"} +{"current_steps": 578, "total_steps": 1030, "loss": 0.4403, "lr": 3.844145975468832e-05, "epoch": 2.805214491435501, "percentage": 56.12, "elapsed_time": "10:47:19", "remaining_time": "8:26:13"} +{"current_steps": 579, "total_steps": 1030, "loss": 0.4509, "lr": 3.830601234980569e-05, "epoch": 2.810065181142944, "percentage": 56.21, "elapsed_time": "10:51:13", "remaining_time": "8:27:15"} +{"current_steps": 580, "total_steps": 1030, "loss": 0.4492, "lr": 3.8170584400768224e-05, "epoch": 2.8149158708503865, "percentage": 56.31, "elapsed_time": "10:55:07", "remaining_time": "8:28:17"} +{"current_steps": 581, "total_steps": 1030, "loss": 0.4475, "lr": 3.8035177462997664e-05, "epoch": 2.8197665605578295, "percentage": 56.41, "elapsed_time": "10:59:01", "remaining_time": "8:29:17"} +{"current_steps": 582, "total_steps": 1030, "loss": 0.4419, "lr": 3.7899793091674396e-05, "epoch": 2.824617250265272, "percentage": 56.5, "elapsed_time": "11:02:54", "remaining_time": "8:30:16"} +{"current_steps": 583, "total_steps": 1030, "loss": 0.4421, "lr": 3.776443284171969e-05, "epoch": 2.829467939972715, "percentage": 56.6, "elapsed_time": "11:06:47", "remaining_time": "8:31:14"} +{"current_steps": 584, "total_steps": 1030, "loss": 0.4399, "lr": 3.7629098267777706e-05, "epoch": 2.8343186296801575, "percentage": 56.7, "elapsed_time": "11:10:41", "remaining_time": "8:32:12"} +{"current_steps": 585, "total_steps": 1030, "loss": 0.4328, "lr": 3.7493790924197746e-05, "epoch": 2.8391693193876004, "percentage": 56.8, "elapsed_time": "11:14:35", "remaining_time": "8:33:09"} +{"current_steps": 586, "total_steps": 1030, "loss": 0.4403, "lr": 3.735851236501637e-05, "epoch": 2.8440200090950434, "percentage": 56.89, "elapsed_time": "11:18:29", "remaining_time": "8:34:04"} +{"current_steps": 587, "total_steps": 1030, "loss": 0.4375, "lr": 3.722326414393954e-05, "epoch": 2.848870698802486, "percentage": 56.99, "elapsed_time": "11:22:23", "remaining_time": "8:34:59"} +{"current_steps": 588, "total_steps": 1030, "loss": 0.4465, "lr": 3.708804781432478e-05, "epoch": 2.853721388509929, "percentage": 57.09, "elapsed_time": "11:26:17", "remaining_time": "8:35:53"} +{"current_steps": 589, "total_steps": 1030, "loss": 0.4478, "lr": 3.6952864929163286e-05, "epoch": 2.858572078217372, "percentage": 57.18, "elapsed_time": "11:30:11", "remaining_time": "8:36:45"} +{"current_steps": 590, "total_steps": 1030, "loss": 0.4433, "lr": 3.6817717041062204e-05, "epoch": 2.8634227679248143, "percentage": 57.28, "elapsed_time": "11:34:05", "remaining_time": "8:37:37"} +{"current_steps": 591, "total_steps": 1030, "loss": 0.4426, "lr": 3.66826057022267e-05, "epoch": 2.868273457632257, "percentage": 57.38, "elapsed_time": "11:37:58", "remaining_time": "8:38:27"} +{"current_steps": 592, "total_steps": 1030, "loss": 0.437, "lr": 3.654753246444217e-05, "epoch": 2.8731241473397, "percentage": 57.48, "elapsed_time": "11:41:51", "remaining_time": "8:39:17"} +{"current_steps": 593, "total_steps": 1030, "loss": 0.4404, "lr": 3.641249887905638e-05, "epoch": 2.8779748370471427, "percentage": 57.57, "elapsed_time": "11:45:45", "remaining_time": "8:40:05"} +{"current_steps": 594, "total_steps": 1030, "loss": 0.4418, "lr": 3.627750649696173e-05, "epoch": 2.8828255267545853, "percentage": 57.67, "elapsed_time": "11:49:39", "remaining_time": "8:40:53"} +{"current_steps": 595, "total_steps": 1030, "loss": 0.4482, "lr": 3.614255686857734e-05, "epoch": 2.887676216462028, "percentage": 57.77, "elapsed_time": "11:53:33", "remaining_time": "8:41:40"} +{"current_steps": 596, "total_steps": 1030, "loss": 0.4407, "lr": 3.600765154383134e-05, "epoch": 2.892526906169471, "percentage": 57.86, "elapsed_time": "11:57:27", "remaining_time": "8:42:26"} +{"current_steps": 597, "total_steps": 1030, "loss": 0.4502, "lr": 3.587279207214301e-05, "epoch": 2.8973775958769137, "percentage": 57.96, "elapsed_time": "12:01:21", "remaining_time": "8:43:11"} +{"current_steps": 598, "total_steps": 1030, "loss": 0.4504, "lr": 3.5737980002404965e-05, "epoch": 2.9022282855843566, "percentage": 58.06, "elapsed_time": "12:05:15", "remaining_time": "8:43:55"} +{"current_steps": 599, "total_steps": 1030, "loss": 0.4444, "lr": 3.5603216882965415e-05, "epoch": 2.907078975291799, "percentage": 58.16, "elapsed_time": "12:09:09", "remaining_time": "8:44:38"} +{"current_steps": 600, "total_steps": 1030, "loss": 0.4497, "lr": 3.5468504261610387e-05, "epoch": 2.911929664999242, "percentage": 58.25, "elapsed_time": "12:13:03", "remaining_time": "8:45:21"} +{"current_steps": 601, "total_steps": 1030, "loss": 0.4449, "lr": 3.5333843685545914e-05, "epoch": 2.9167803547066846, "percentage": 58.35, "elapsed_time": "12:16:57", "remaining_time": "8:46:02"} +{"current_steps": 602, "total_steps": 1030, "loss": 0.4434, "lr": 3.519923670138025e-05, "epoch": 2.9216310444141276, "percentage": 58.45, "elapsed_time": "12:20:51", "remaining_time": "8:46:43"} +{"current_steps": 603, "total_steps": 1030, "loss": 0.4394, "lr": 3.506468485510616e-05, "epoch": 2.9264817341215705, "percentage": 58.54, "elapsed_time": "12:24:45", "remaining_time": "8:47:22"} +{"current_steps": 604, "total_steps": 1030, "loss": 0.4513, "lr": 3.493018969208314e-05, "epoch": 2.931332423829013, "percentage": 58.64, "elapsed_time": "12:28:39", "remaining_time": "8:48:01"} +{"current_steps": 605, "total_steps": 1030, "loss": 0.4425, "lr": 3.479575275701965e-05, "epoch": 2.936183113536456, "percentage": 58.74, "elapsed_time": "12:32:33", "remaining_time": "8:48:39"} +{"current_steps": 606, "total_steps": 1030, "loss": 0.4384, "lr": 3.4661375593955405e-05, "epoch": 2.941033803243899, "percentage": 58.83, "elapsed_time": "12:36:27", "remaining_time": "8:49:16"} +{"current_steps": 607, "total_steps": 1030, "loss": 0.4451, "lr": 3.45270597462436e-05, "epoch": 2.9458844929513415, "percentage": 58.93, "elapsed_time": "12:40:21", "remaining_time": "8:49:52"} +{"current_steps": 608, "total_steps": 1030, "loss": 0.4383, "lr": 3.4392806756533233e-05, "epoch": 2.9507351826587844, "percentage": 59.03, "elapsed_time": "12:44:15", "remaining_time": "8:50:27"} +{"current_steps": 609, "total_steps": 1030, "loss": 0.4453, "lr": 3.425861816675135e-05, "epoch": 2.955585872366227, "percentage": 59.13, "elapsed_time": "12:48:09", "remaining_time": "8:51:01"} +{"current_steps": 610, "total_steps": 1030, "loss": 0.436, "lr": 3.4124495518085366e-05, "epoch": 2.96043656207367, "percentage": 59.22, "elapsed_time": "12:52:03", "remaining_time": "8:51:34"} +{"current_steps": 611, "total_steps": 1030, "loss": 0.4467, "lr": 3.399044035096532e-05, "epoch": 2.9652872517811124, "percentage": 59.32, "elapsed_time": "12:55:57", "remaining_time": "8:52:07"} +{"current_steps": 612, "total_steps": 1030, "loss": 0.4364, "lr": 3.3856454205046223e-05, "epoch": 2.9701379414885554, "percentage": 59.42, "elapsed_time": "12:59:51", "remaining_time": "8:52:38"} +{"current_steps": 613, "total_steps": 1030, "loss": 0.4517, "lr": 3.372253861919036e-05, "epoch": 2.9749886311959983, "percentage": 59.51, "elapsed_time": "13:03:45", "remaining_time": "8:53:09"} +{"current_steps": 614, "total_steps": 1030, "loss": 0.4464, "lr": 3.3588695131449626e-05, "epoch": 2.979839320903441, "percentage": 59.61, "elapsed_time": "13:07:38", "remaining_time": "8:53:38"} +{"current_steps": 615, "total_steps": 1030, "loss": 0.4446, "lr": 3.3454925279047854e-05, "epoch": 2.984690010610884, "percentage": 59.71, "elapsed_time": "13:11:31", "remaining_time": "8:54:07"} +{"current_steps": 616, "total_steps": 1030, "loss": 0.4449, "lr": 3.3321230598363126e-05, "epoch": 2.9895407003183267, "percentage": 59.81, "elapsed_time": "13:15:27", "remaining_time": "8:54:36"} +{"current_steps": 617, "total_steps": 1030, "loss": 0.4457, "lr": 3.3187612624910185e-05, "epoch": 2.9943913900257693, "percentage": 59.9, "elapsed_time": "13:19:21", "remaining_time": "8:55:03"} +{"current_steps": 618, "total_steps": 1030, "loss": 0.4524, "lr": 3.305407289332279e-05, "epoch": 2.999242079733212, "percentage": 60.0, "elapsed_time": "13:23:14", "remaining_time": "8:55:29"} +{"current_steps": 619, "total_steps": 1030, "loss": 0.8623, "lr": 3.2920612937336035e-05, "epoch": 3.004699105654085, "percentage": 60.1, "elapsed_time": "13:27:37", "remaining_time": "8:56:14"} +{"current_steps": 620, "total_steps": 1030, "loss": 0.4236, "lr": 3.2787234289768816e-05, "epoch": 3.009549795361528, "percentage": 60.19, "elapsed_time": "13:31:30", "remaining_time": "8:56:38"} +{"current_steps": 621, "total_steps": 1030, "loss": 0.43, "lr": 3.2653938482506125e-05, "epoch": 3.014400485068971, "percentage": 60.29, "elapsed_time": "13:35:24", "remaining_time": "8:57:02"} +{"current_steps": 622, "total_steps": 1030, "loss": 0.422, "lr": 3.252072704648157e-05, "epoch": 3.0192511747764135, "percentage": 60.39, "elapsed_time": "13:39:18", "remaining_time": "8:57:25"} +{"current_steps": 623, "total_steps": 1030, "loss": 0.4178, "lr": 3.2387601511659695e-05, "epoch": 3.0241018644838564, "percentage": 60.49, "elapsed_time": "13:43:12", "remaining_time": "8:57:47"} +{"current_steps": 624, "total_steps": 1030, "loss": 0.4226, "lr": 3.22545634070185e-05, "epoch": 3.028952554191299, "percentage": 60.58, "elapsed_time": "13:47:05", "remaining_time": "8:58:08"} +{"current_steps": 625, "total_steps": 1030, "loss": 0.4171, "lr": 3.212161426053177e-05, "epoch": 3.033803243898742, "percentage": 60.68, "elapsed_time": "13:50:59", "remaining_time": "8:58:29"} +{"current_steps": 626, "total_steps": 1030, "loss": 0.4214, "lr": 3.19887555991516e-05, "epoch": 3.0386539336061844, "percentage": 60.78, "elapsed_time": "13:54:53", "remaining_time": "8:58:48"} +{"current_steps": 627, "total_steps": 1030, "loss": 0.4266, "lr": 3.1855988948790866e-05, "epoch": 3.0435046233136274, "percentage": 60.87, "elapsed_time": "13:58:46", "remaining_time": "8:59:07"} +{"current_steps": 628, "total_steps": 1030, "loss": 0.4232, "lr": 3.172331583430567e-05, "epoch": 3.0483553130210703, "percentage": 60.97, "elapsed_time": "14:02:40", "remaining_time": "8:59:25"} +{"current_steps": 629, "total_steps": 1030, "loss": 0.4248, "lr": 3.1590737779477825e-05, "epoch": 3.053206002728513, "percentage": 61.07, "elapsed_time": "14:06:34", "remaining_time": "8:59:42"} +{"current_steps": 630, "total_steps": 1030, "loss": 0.4201, "lr": 3.145825630699734e-05, "epoch": 3.058056692435956, "percentage": 61.17, "elapsed_time": "14:10:27", "remaining_time": "8:59:58"} +{"current_steps": 631, "total_steps": 1030, "loss": 0.4324, "lr": 3.1325872938444995e-05, "epoch": 3.0629073821433983, "percentage": 61.26, "elapsed_time": "14:14:20", "remaining_time": "9:00:13"} +{"current_steps": 632, "total_steps": 1030, "loss": 0.4238, "lr": 3.119358919427478e-05, "epoch": 3.0677580718508413, "percentage": 61.36, "elapsed_time": "14:18:14", "remaining_time": "9:00:28"} +{"current_steps": 633, "total_steps": 1030, "loss": 0.428, "lr": 3.106140659379652e-05, "epoch": 3.072608761558284, "percentage": 61.46, "elapsed_time": "14:22:08", "remaining_time": "9:00:42"} +{"current_steps": 634, "total_steps": 1030, "loss": 0.4184, "lr": 3.092932665515837e-05, "epoch": 3.0774594512657267, "percentage": 61.55, "elapsed_time": "14:26:01", "remaining_time": "9:00:55"} +{"current_steps": 635, "total_steps": 1030, "loss": 0.4141, "lr": 3.079735089532935e-05, "epoch": 3.0823101409731697, "percentage": 61.65, "elapsed_time": "14:29:54", "remaining_time": "9:01:07"} +{"current_steps": 636, "total_steps": 1030, "loss": 0.4221, "lr": 3.0665480830082e-05, "epoch": 3.087160830680612, "percentage": 61.75, "elapsed_time": "14:33:47", "remaining_time": "9:01:18"} +{"current_steps": 637, "total_steps": 1030, "loss": 0.4211, "lr": 3.0533717973974924e-05, "epoch": 3.092011520388055, "percentage": 61.84, "elapsed_time": "14:37:40", "remaining_time": "9:01:29"} +{"current_steps": 638, "total_steps": 1030, "loss": 0.4184, "lr": 3.040206384033542e-05, "epoch": 3.096862210095498, "percentage": 61.94, "elapsed_time": "14:41:34", "remaining_time": "9:01:39"} +{"current_steps": 639, "total_steps": 1030, "loss": 0.407, "lr": 3.0270519941242052e-05, "epoch": 3.1017128998029406, "percentage": 62.04, "elapsed_time": "14:45:27", "remaining_time": "9:01:48"} +{"current_steps": 640, "total_steps": 1030, "loss": 0.4199, "lr": 3.0139087787507323e-05, "epoch": 3.1065635895103836, "percentage": 62.14, "elapsed_time": "14:49:21", "remaining_time": "9:01:57"} +{"current_steps": 641, "total_steps": 1030, "loss": 0.4191, "lr": 3.0007768888660337e-05, "epoch": 3.111414279217826, "percentage": 62.23, "elapsed_time": "14:53:14", "remaining_time": "9:02:04"} +{"current_steps": 642, "total_steps": 1030, "loss": 0.4266, "lr": 2.9876564752929406e-05, "epoch": 3.116264968925269, "percentage": 62.33, "elapsed_time": "14:57:08", "remaining_time": "9:02:11"} +{"current_steps": 643, "total_steps": 1030, "loss": 0.4214, "lr": 2.9745476887224806e-05, "epoch": 3.121115658632712, "percentage": 62.43, "elapsed_time": "15:01:02", "remaining_time": "9:02:18"} +{"current_steps": 644, "total_steps": 1030, "loss": 0.4175, "lr": 2.961450679712135e-05, "epoch": 3.1259663483401545, "percentage": 62.52, "elapsed_time": "15:04:56", "remaining_time": "9:02:24"} +{"current_steps": 645, "total_steps": 1030, "loss": 0.4215, "lr": 2.9483655986841265e-05, "epoch": 3.1308170380475975, "percentage": 62.62, "elapsed_time": "15:08:49", "remaining_time": "9:02:28"} +{"current_steps": 646, "total_steps": 1030, "loss": 0.423, "lr": 2.9352925959236732e-05, "epoch": 3.13566772775504, "percentage": 62.72, "elapsed_time": "15:12:42", "remaining_time": "9:02:32"} +{"current_steps": 647, "total_steps": 1030, "loss": 0.4202, "lr": 2.92223182157728e-05, "epoch": 3.140518417462483, "percentage": 62.82, "elapsed_time": "15:16:35", "remaining_time": "9:02:35"} +{"current_steps": 648, "total_steps": 1030, "loss": 0.417, "lr": 2.909183425650996e-05, "epoch": 3.145369107169926, "percentage": 62.91, "elapsed_time": "15:20:29", "remaining_time": "9:02:37"} +{"current_steps": 649, "total_steps": 1030, "loss": 0.4076, "lr": 2.8961475580087108e-05, "epoch": 3.1502197968773684, "percentage": 63.01, "elapsed_time": "15:24:22", "remaining_time": "9:02:39"} +{"current_steps": 650, "total_steps": 1030, "loss": 0.4207, "lr": 2.8831243683704162e-05, "epoch": 3.1550704865848114, "percentage": 63.11, "elapsed_time": "15:28:15", "remaining_time": "9:02:40"} +{"current_steps": 651, "total_steps": 1030, "loss": 0.4157, "lr": 2.8701140063104996e-05, "epoch": 3.159921176292254, "percentage": 63.2, "elapsed_time": "15:32:08", "remaining_time": "9:02:40"} +{"current_steps": 652, "total_steps": 1030, "loss": 0.4105, "lr": 2.857116621256018e-05, "epoch": 3.164771865999697, "percentage": 63.3, "elapsed_time": "15:36:02", "remaining_time": "9:02:40"} +{"current_steps": 653, "total_steps": 1030, "loss": 0.4077, "lr": 2.8441323624849827e-05, "epoch": 3.16962255570714, "percentage": 63.4, "elapsed_time": "15:39:57", "remaining_time": "9:02:40"} +{"current_steps": 654, "total_steps": 1030, "loss": 0.4171, "lr": 2.83116137912465e-05, "epoch": 3.1744732454145823, "percentage": 63.5, "elapsed_time": "15:43:50", "remaining_time": "9:02:38"} +{"current_steps": 655, "total_steps": 1030, "loss": 0.4197, "lr": 2.8182038201498038e-05, "epoch": 3.1793239351220253, "percentage": 63.59, "elapsed_time": "15:47:44", "remaining_time": "9:02:35"} +{"current_steps": 656, "total_steps": 1030, "loss": 0.4098, "lr": 2.8052598343810474e-05, "epoch": 3.184174624829468, "percentage": 63.69, "elapsed_time": "15:51:37", "remaining_time": "9:02:32"} +{"current_steps": 657, "total_steps": 1030, "loss": 0.4221, "lr": 2.7923295704830868e-05, "epoch": 3.1890253145369107, "percentage": 63.79, "elapsed_time": "15:55:31", "remaining_time": "9:02:28"} +{"current_steps": 658, "total_steps": 1030, "loss": 0.4233, "lr": 2.7794131769630355e-05, "epoch": 3.1938760042443537, "percentage": 63.88, "elapsed_time": "15:59:25", "remaining_time": "9:02:24"} +{"current_steps": 659, "total_steps": 1030, "loss": 0.4212, "lr": 2.7665108021687007e-05, "epoch": 3.198726693951796, "percentage": 63.98, "elapsed_time": "16:03:18", "remaining_time": "9:02:19"} +{"current_steps": 660, "total_steps": 1030, "loss": 0.4182, "lr": 2.753622594286879e-05, "epoch": 3.203577383659239, "percentage": 64.08, "elapsed_time": "16:07:11", "remaining_time": "9:02:12"} +{"current_steps": 661, "total_steps": 1030, "loss": 0.4082, "lr": 2.7407487013416615e-05, "epoch": 3.2084280733666817, "percentage": 64.17, "elapsed_time": "16:11:05", "remaining_time": "9:02:06"} +{"current_steps": 662, "total_steps": 1030, "loss": 0.4186, "lr": 2.727889271192722e-05, "epoch": 3.2132787630741246, "percentage": 64.27, "elapsed_time": "16:14:58", "remaining_time": "9:01:58"} +{"current_steps": 663, "total_steps": 1030, "loss": 0.4192, "lr": 2.715044451533631e-05, "epoch": 3.218129452781567, "percentage": 64.37, "elapsed_time": "16:18:52", "remaining_time": "9:01:51"} +{"current_steps": 664, "total_steps": 1030, "loss": 0.4147, "lr": 2.702214389890152e-05, "epoch": 3.22298014248901, "percentage": 64.47, "elapsed_time": "16:22:45", "remaining_time": "9:01:42"} +{"current_steps": 665, "total_steps": 1030, "loss": 0.4041, "lr": 2.6893992336185512e-05, "epoch": 3.227830832196453, "percentage": 64.56, "elapsed_time": "16:26:38", "remaining_time": "9:01:32"} +{"current_steps": 666, "total_steps": 1030, "loss": 0.4141, "lr": 2.6765991299039025e-05, "epoch": 3.2326815219038956, "percentage": 64.66, "elapsed_time": "16:30:33", "remaining_time": "9:01:22"} +{"current_steps": 667, "total_steps": 1030, "loss": 0.4146, "lr": 2.663814225758393e-05, "epoch": 3.2375322116113385, "percentage": 64.76, "elapsed_time": "16:34:26", "remaining_time": "9:01:12"} +{"current_steps": 668, "total_steps": 1030, "loss": 0.418, "lr": 2.6510446680196448e-05, "epoch": 3.2423829013187815, "percentage": 64.85, "elapsed_time": "16:38:19", "remaining_time": "9:01:00"} +{"current_steps": 669, "total_steps": 1030, "loss": 0.4208, "lr": 2.638290603349023e-05, "epoch": 3.247233591026224, "percentage": 64.95, "elapsed_time": "16:42:12", "remaining_time": "9:00:48"} +{"current_steps": 670, "total_steps": 1030, "loss": 0.4194, "lr": 2.625552178229949e-05, "epoch": 3.252084280733667, "percentage": 65.05, "elapsed_time": "16:46:06", "remaining_time": "9:00:35"} +{"current_steps": 671, "total_steps": 1030, "loss": 0.4109, "lr": 2.612829538966218e-05, "epoch": 3.2569349704411095, "percentage": 65.15, "elapsed_time": "16:50:00", "remaining_time": "9:00:22"} +{"current_steps": 672, "total_steps": 1030, "loss": 0.42, "lr": 2.6001228316803256e-05, "epoch": 3.2617856601485524, "percentage": 65.24, "elapsed_time": "16:53:54", "remaining_time": "9:00:08"} +{"current_steps": 673, "total_steps": 1030, "loss": 0.4165, "lr": 2.5874322023117824e-05, "epoch": 3.266636349855995, "percentage": 65.34, "elapsed_time": "16:57:47", "remaining_time": "8:59:53"} +{"current_steps": 674, "total_steps": 1030, "loss": 0.418, "lr": 2.5747577966154404e-05, "epoch": 3.271487039563438, "percentage": 65.44, "elapsed_time": "17:01:41", "remaining_time": "8:59:38"} +{"current_steps": 675, "total_steps": 1030, "loss": 0.409, "lr": 2.5620997601598215e-05, "epoch": 3.276337729270881, "percentage": 65.53, "elapsed_time": "17:05:34", "remaining_time": "8:59:22"} +{"current_steps": 676, "total_steps": 1030, "loss": 0.4174, "lr": 2.5494582383254388e-05, "epoch": 3.2811884189783234, "percentage": 65.63, "elapsed_time": "17:09:29", "remaining_time": "8:59:06"} +{"current_steps": 677, "total_steps": 1030, "loss": 0.4134, "lr": 2.5368333763031324e-05, "epoch": 3.2860391086857663, "percentage": 65.73, "elapsed_time": "17:13:22", "remaining_time": "8:58:49"} +{"current_steps": 678, "total_steps": 1030, "loss": 0.4097, "lr": 2.5242253190924034e-05, "epoch": 3.2908897983932093, "percentage": 65.83, "elapsed_time": "17:17:16", "remaining_time": "8:58:31"} +{"current_steps": 679, "total_steps": 1030, "loss": 0.411, "lr": 2.5116342114997442e-05, "epoch": 3.295740488100652, "percentage": 65.92, "elapsed_time": "17:21:09", "remaining_time": "8:58:12"} +{"current_steps": 680, "total_steps": 1030, "loss": 0.421, "lr": 2.4990601981369737e-05, "epoch": 3.3005911778080947, "percentage": 66.02, "elapsed_time": "17:25:02", "remaining_time": "8:57:53"} +{"current_steps": 681, "total_steps": 1030, "loss": 0.4101, "lr": 2.4865034234195834e-05, "epoch": 3.3054418675155373, "percentage": 66.12, "elapsed_time": "17:28:56", "remaining_time": "8:57:34"} +{"current_steps": 682, "total_steps": 1030, "loss": 0.4166, "lr": 2.4739640315650747e-05, "epoch": 3.31029255722298, "percentage": 66.21, "elapsed_time": "17:32:50", "remaining_time": "8:57:13"} +{"current_steps": 683, "total_steps": 1030, "loss": 0.4207, "lr": 2.4614421665912997e-05, "epoch": 3.3151432469304227, "percentage": 66.31, "elapsed_time": "17:36:44", "remaining_time": "8:56:52"} +{"current_steps": 684, "total_steps": 1030, "loss": 0.4147, "lr": 2.4489379723148147e-05, "epoch": 3.3199939366378657, "percentage": 66.41, "elapsed_time": "17:40:37", "remaining_time": "8:56:30"} +{"current_steps": 685, "total_steps": 1030, "loss": 0.4196, "lr": 2.4364515923492187e-05, "epoch": 3.3248446263453086, "percentage": 66.5, "elapsed_time": "17:44:30", "remaining_time": "8:56:08"} +{"current_steps": 686, "total_steps": 1030, "loss": 0.4163, "lr": 2.4239831701035143e-05, "epoch": 3.329695316052751, "percentage": 66.6, "elapsed_time": "17:48:24", "remaining_time": "8:55:45"} +{"current_steps": 687, "total_steps": 1030, "loss": 0.4192, "lr": 2.411532848780451e-05, "epoch": 3.334546005760194, "percentage": 66.7, "elapsed_time": "17:52:18", "remaining_time": "8:55:22"} +{"current_steps": 688, "total_steps": 1030, "loss": 0.4144, "lr": 2.399100771374888e-05, "epoch": 3.3393966954676366, "percentage": 66.8, "elapsed_time": "17:56:11", "remaining_time": "8:54:58"} +{"current_steps": 689, "total_steps": 1030, "loss": 0.4112, "lr": 2.3866870806721495e-05, "epoch": 3.3442473851750796, "percentage": 66.89, "elapsed_time": "18:00:05", "remaining_time": "8:54:33"} +{"current_steps": 690, "total_steps": 1030, "loss": 0.4215, "lr": 2.37429191924638e-05, "epoch": 3.3490980748825225, "percentage": 66.99, "elapsed_time": "18:03:58", "remaining_time": "8:54:08"} +{"current_steps": 691, "total_steps": 1030, "loss": 0.4171, "lr": 2.361915429458913e-05, "epoch": 3.353948764589965, "percentage": 67.09, "elapsed_time": "18:07:52", "remaining_time": "8:53:42"} +{"current_steps": 692, "total_steps": 1030, "loss": 0.417, "lr": 2.349557753456637e-05, "epoch": 3.358799454297408, "percentage": 67.18, "elapsed_time": "18:11:46", "remaining_time": "8:53:15"} +{"current_steps": 693, "total_steps": 1030, "loss": 0.4195, "lr": 2.3372190331703556e-05, "epoch": 3.3636501440048505, "percentage": 67.28, "elapsed_time": "18:15:40", "remaining_time": "8:52:48"} +{"current_steps": 694, "total_steps": 1030, "loss": 0.4123, "lr": 2.324899410313161e-05, "epoch": 3.3685008337122935, "percentage": 67.38, "elapsed_time": "18:19:33", "remaining_time": "8:52:20"} +{"current_steps": 695, "total_steps": 1030, "loss": 0.4201, "lr": 2.3125990263788118e-05, "epoch": 3.3733515234197364, "percentage": 67.48, "elapsed_time": "18:23:26", "remaining_time": "8:51:52"} +{"current_steps": 696, "total_steps": 1030, "loss": 0.4128, "lr": 2.3003180226400986e-05, "epoch": 3.378202213127179, "percentage": 67.57, "elapsed_time": "18:27:20", "remaining_time": "8:51:24"} +{"current_steps": 697, "total_steps": 1030, "loss": 0.4121, "lr": 2.288056540147229e-05, "epoch": 3.383052902834622, "percentage": 67.67, "elapsed_time": "18:31:14", "remaining_time": "8:50:54"} +{"current_steps": 698, "total_steps": 1030, "loss": 0.4145, "lr": 2.275814719726201e-05, "epoch": 3.3879035925420644, "percentage": 67.77, "elapsed_time": "18:35:09", "remaining_time": "8:50:24"} +{"current_steps": 699, "total_steps": 1030, "loss": 0.4221, "lr": 2.263592701977193e-05, "epoch": 3.3927542822495074, "percentage": 67.86, "elapsed_time": "18:39:02", "remaining_time": "8:49:54"} +{"current_steps": 700, "total_steps": 1030, "loss": 0.414, "lr": 2.2513906272729397e-05, "epoch": 3.39760497195695, "percentage": 67.96, "elapsed_time": "18:42:56", "remaining_time": "8:49:23"} +{"current_steps": 701, "total_steps": 1030, "loss": 0.4176, "lr": 2.239208635757133e-05, "epoch": 3.402455661664393, "percentage": 68.06, "elapsed_time": "18:46:48", "remaining_time": "8:48:50"} +{"current_steps": 702, "total_steps": 1030, "loss": 0.4268, "lr": 2.2270468673428004e-05, "epoch": 3.407306351371836, "percentage": 68.16, "elapsed_time": "18:50:42", "remaining_time": "8:48:18"} +{"current_steps": 703, "total_steps": 1030, "loss": 0.407, "lr": 2.2149054617106974e-05, "epoch": 3.4121570410792783, "percentage": 68.25, "elapsed_time": "18:54:35", "remaining_time": "8:47:45"} +{"current_steps": 704, "total_steps": 1030, "loss": 0.4246, "lr": 2.2027845583077175e-05, "epoch": 3.4170077307867213, "percentage": 68.35, "elapsed_time": "18:58:28", "remaining_time": "8:47:11"} +{"current_steps": 705, "total_steps": 1030, "loss": 0.406, "lr": 2.1906842963452757e-05, "epoch": 3.421858420494164, "percentage": 68.45, "elapsed_time": "19:02:22", "remaining_time": "8:46:37"} +{"current_steps": 706, "total_steps": 1030, "loss": 0.4154, "lr": 2.178604814797715e-05, "epoch": 3.4267091102016067, "percentage": 68.54, "elapsed_time": "19:06:15", "remaining_time": "8:46:02"} +{"current_steps": 707, "total_steps": 1030, "loss": 0.4134, "lr": 2.1665462524007162e-05, "epoch": 3.4315597999090497, "percentage": 68.64, "elapsed_time": "19:10:09", "remaining_time": "8:45:27"} +{"current_steps": 708, "total_steps": 1030, "loss": 0.4211, "lr": 2.1545087476496903e-05, "epoch": 3.436410489616492, "percentage": 68.74, "elapsed_time": "19:14:02", "remaining_time": "8:44:51"} +{"current_steps": 709, "total_steps": 1030, "loss": 0.4235, "lr": 2.1424924387981996e-05, "epoch": 3.441261179323935, "percentage": 68.83, "elapsed_time": "19:17:55", "remaining_time": "8:44:15"} +{"current_steps": 710, "total_steps": 1030, "loss": 0.4118, "lr": 2.1304974638563715e-05, "epoch": 3.4461118690313777, "percentage": 68.93, "elapsed_time": "19:21:49", "remaining_time": "8:43:38"} +{"current_steps": 711, "total_steps": 1030, "loss": 0.4228, "lr": 2.1185239605893013e-05, "epoch": 3.4509625587388206, "percentage": 69.03, "elapsed_time": "19:25:42", "remaining_time": "8:43:00"} +{"current_steps": 712, "total_steps": 1030, "loss": 0.4209, "lr": 2.106572066515482e-05, "epoch": 3.4558132484462636, "percentage": 69.13, "elapsed_time": "19:29:36", "remaining_time": "8:42:22"} +{"current_steps": 713, "total_steps": 1030, "loss": 0.4137, "lr": 2.0946419189052162e-05, "epoch": 3.460663938153706, "percentage": 69.22, "elapsed_time": "19:33:28", "remaining_time": "8:41:43"} +{"current_steps": 714, "total_steps": 1030, "loss": 0.4217, "lr": 2.0827336547790452e-05, "epoch": 3.465514627861149, "percentage": 69.32, "elapsed_time": "19:37:22", "remaining_time": "8:41:04"} +{"current_steps": 715, "total_steps": 1030, "loss": 0.4173, "lr": 2.0708474109061752e-05, "epoch": 3.470365317568592, "percentage": 69.42, "elapsed_time": "19:41:16", "remaining_time": "8:40:25"} +{"current_steps": 716, "total_steps": 1030, "loss": 0.4017, "lr": 2.0589833238029032e-05, "epoch": 3.4752160072760345, "percentage": 69.51, "elapsed_time": "19:45:09", "remaining_time": "8:39:44"} +{"current_steps": 717, "total_steps": 1030, "loss": 0.415, "lr": 2.0471415297310455e-05, "epoch": 3.4800666969834775, "percentage": 69.61, "elapsed_time": "19:49:02", "remaining_time": "8:39:04"} +{"current_steps": 718, "total_steps": 1030, "loss": 0.4107, "lr": 2.0353221646963864e-05, "epoch": 3.48491738669092, "percentage": 69.71, "elapsed_time": "19:52:56", "remaining_time": "8:38:22"} +{"current_steps": 719, "total_steps": 1030, "loss": 0.4227, "lr": 2.0235253644471012e-05, "epoch": 3.489768076398363, "percentage": 69.81, "elapsed_time": "19:56:50", "remaining_time": "8:37:41"} +{"current_steps": 720, "total_steps": 1030, "loss": 0.4155, "lr": 2.011751264472206e-05, "epoch": 3.4946187661058055, "percentage": 69.9, "elapsed_time": "20:00:43", "remaining_time": "8:36:58"} +{"current_steps": 721, "total_steps": 1030, "loss": 0.4185, "lr": 2.0000000000000012e-05, "epoch": 3.4994694558132484, "percentage": 70.0, "elapsed_time": "20:04:37", "remaining_time": "8:36:15"} +{"current_steps": 722, "total_steps": 1030, "loss": 0.4257, "lr": 1.9882717059965086e-05, "epoch": 3.5043201455206914, "percentage": 70.1, "elapsed_time": "20:08:30", "remaining_time": "8:35:32"} +{"current_steps": 723, "total_steps": 1030, "loss": 0.4139, "lr": 1.9765665171639345e-05, "epoch": 3.509170835228134, "percentage": 70.19, "elapsed_time": "20:12:24", "remaining_time": "8:34:48"} +{"current_steps": 724, "total_steps": 1030, "loss": 0.404, "lr": 1.964884567939118e-05, "epoch": 3.514021524935577, "percentage": 70.29, "elapsed_time": "20:16:18", "remaining_time": "8:34:04"} +{"current_steps": 725, "total_steps": 1030, "loss": 0.4151, "lr": 1.9532259924919823e-05, "epoch": 3.51887221464302, "percentage": 70.39, "elapsed_time": "20:20:12", "remaining_time": "8:33:19"} +{"current_steps": 726, "total_steps": 1030, "loss": 0.4186, "lr": 1.9415909247239996e-05, "epoch": 3.5237229043504623, "percentage": 70.49, "elapsed_time": "20:24:05", "remaining_time": "8:32:33"} +{"current_steps": 727, "total_steps": 1030, "loss": 0.4097, "lr": 1.9299794982666485e-05, "epoch": 3.5285735940579053, "percentage": 70.58, "elapsed_time": "20:27:58", "remaining_time": "8:31:47"} +{"current_steps": 728, "total_steps": 1030, "loss": 0.4077, "lr": 1.9183918464798837e-05, "epoch": 3.533424283765348, "percentage": 70.68, "elapsed_time": "20:31:52", "remaining_time": "8:31:01"} +{"current_steps": 729, "total_steps": 1030, "loss": 0.4147, "lr": 1.906828102450601e-05, "epoch": 3.5382749734727907, "percentage": 70.78, "elapsed_time": "20:35:46", "remaining_time": "8:30:14"} +{"current_steps": 730, "total_steps": 1030, "loss": 0.41, "lr": 1.895288398991114e-05, "epoch": 3.5431256631802333, "percentage": 70.87, "elapsed_time": "20:39:40", "remaining_time": "8:29:27"} +{"current_steps": 731, "total_steps": 1030, "loss": 0.4171, "lr": 1.8837728686376158e-05, "epoch": 3.547976352887676, "percentage": 70.97, "elapsed_time": "20:43:33", "remaining_time": "8:28:38"} +{"current_steps": 732, "total_steps": 1030, "loss": 0.4258, "lr": 1.8722816436486754e-05, "epoch": 3.552827042595119, "percentage": 71.07, "elapsed_time": "20:47:26", "remaining_time": "8:27:50"} +{"current_steps": 733, "total_steps": 1030, "loss": 0.4227, "lr": 1.8608148560037036e-05, "epoch": 3.5576777323025617, "percentage": 71.17, "elapsed_time": "20:51:20", "remaining_time": "8:27:01"} +{"current_steps": 734, "total_steps": 1030, "loss": 0.4074, "lr": 1.8493726374014442e-05, "epoch": 3.5625284220100046, "percentage": 71.26, "elapsed_time": "20:55:14", "remaining_time": "8:26:12"} +{"current_steps": 735, "total_steps": 1030, "loss": 0.4078, "lr": 1.8379551192584588e-05, "epoch": 3.5673791117174476, "percentage": 71.36, "elapsed_time": "20:59:08", "remaining_time": "8:25:22"} +{"current_steps": 736, "total_steps": 1030, "loss": 0.4192, "lr": 1.826562432707619e-05, "epoch": 3.57222980142489, "percentage": 71.46, "elapsed_time": "21:03:02", "remaining_time": "8:24:31"} +{"current_steps": 737, "total_steps": 1030, "loss": 0.4158, "lr": 1.8151947085965994e-05, "epoch": 3.5770804911323326, "percentage": 71.55, "elapsed_time": "21:06:55", "remaining_time": "8:23:40"} +{"current_steps": 738, "total_steps": 1030, "loss": 0.4134, "lr": 1.803852077486377e-05, "epoch": 3.5819311808397756, "percentage": 71.65, "elapsed_time": "21:10:49", "remaining_time": "8:22:49"} +{"current_steps": 739, "total_steps": 1030, "loss": 0.4097, "lr": 1.7925346696497295e-05, "epoch": 3.5867818705472185, "percentage": 71.75, "elapsed_time": "21:14:42", "remaining_time": "8:21:56"} +{"current_steps": 740, "total_steps": 1030, "loss": 0.4148, "lr": 1.781242615069733e-05, "epoch": 3.591632560254661, "percentage": 71.84, "elapsed_time": "21:18:36", "remaining_time": "8:21:04"} +{"current_steps": 741, "total_steps": 1030, "loss": 0.4097, "lr": 1.7699760434382853e-05, "epoch": 3.596483249962104, "percentage": 71.94, "elapsed_time": "21:22:29", "remaining_time": "8:20:11"} +{"current_steps": 742, "total_steps": 1030, "loss": 0.4192, "lr": 1.758735084154601e-05, "epoch": 3.601333939669547, "percentage": 72.04, "elapsed_time": "21:26:22", "remaining_time": "8:19:17"} +{"current_steps": 743, "total_steps": 1030, "loss": 0.4134, "lr": 1.7475198663237297e-05, "epoch": 3.6061846293769895, "percentage": 72.14, "elapsed_time": "21:30:16", "remaining_time": "8:18:23"} +{"current_steps": 744, "total_steps": 1030, "loss": 0.4161, "lr": 1.736330518755082e-05, "epoch": 3.6110353190844324, "percentage": 72.23, "elapsed_time": "21:34:10", "remaining_time": "8:17:29"} +{"current_steps": 745, "total_steps": 1030, "loss": 0.4181, "lr": 1.7251671699609313e-05, "epoch": 3.615886008791875, "percentage": 72.33, "elapsed_time": "21:38:04", "remaining_time": "8:16:34"} +{"current_steps": 746, "total_steps": 1030, "loss": 0.42, "lr": 1.7140299481549557e-05, "epoch": 3.620736698499318, "percentage": 72.43, "elapsed_time": "21:41:57", "remaining_time": "8:15:38"} +{"current_steps": 747, "total_steps": 1030, "loss": 0.4236, "lr": 1.7029189812507603e-05, "epoch": 3.6255873882067604, "percentage": 72.52, "elapsed_time": "21:45:50", "remaining_time": "8:14:42"} +{"current_steps": 748, "total_steps": 1030, "loss": 0.4118, "lr": 1.6918343968604027e-05, "epoch": 3.6304380779142034, "percentage": 72.62, "elapsed_time": "21:49:43", "remaining_time": "8:13:46"} +{"current_steps": 749, "total_steps": 1030, "loss": 0.4093, "lr": 1.6807763222929315e-05, "epoch": 3.6352887676216463, "percentage": 72.72, "elapsed_time": "21:53:37", "remaining_time": "8:12:49"} +{"current_steps": 750, "total_steps": 1030, "loss": 0.4166, "lr": 1.669744884552926e-05, "epoch": 3.640139457329089, "percentage": 72.82, "elapsed_time": "21:57:30", "remaining_time": "8:11:52"} +{"current_steps": 751, "total_steps": 1030, "loss": 0.4147, "lr": 1.6587402103390314e-05, "epoch": 3.644990147036532, "percentage": 72.91, "elapsed_time": "22:01:25", "remaining_time": "8:10:54"} +{"current_steps": 752, "total_steps": 1030, "loss": 0.4187, "lr": 1.6477624260425137e-05, "epoch": 3.6498408367439747, "percentage": 73.01, "elapsed_time": "22:05:18", "remaining_time": "8:09:56"} +{"current_steps": 753, "total_steps": 1030, "loss": 0.4131, "lr": 1.6368116577457973e-05, "epoch": 3.6546915264514173, "percentage": 73.11, "elapsed_time": "22:09:13", "remaining_time": "8:08:58"} +{"current_steps": 754, "total_steps": 1030, "loss": 0.4146, "lr": 1.6258880312210195e-05, "epoch": 3.65954221615886, "percentage": 73.2, "elapsed_time": "22:13:07", "remaining_time": "8:07:59"} +{"current_steps": 755, "total_steps": 1030, "loss": 0.4159, "lr": 1.6149916719285942e-05, "epoch": 3.6643929058663027, "percentage": 73.3, "elapsed_time": "22:17:01", "remaining_time": "8:06:59"} +{"current_steps": 756, "total_steps": 1030, "loss": 0.4094, "lr": 1.6041227050157607e-05, "epoch": 3.6692435955737457, "percentage": 73.4, "elapsed_time": "22:20:55", "remaining_time": "8:05:59"} +{"current_steps": 757, "total_steps": 1030, "loss": 0.4129, "lr": 1.5932812553151506e-05, "epoch": 3.674094285281188, "percentage": 73.5, "elapsed_time": "22:24:49", "remaining_time": "8:04:59"} +{"current_steps": 758, "total_steps": 1030, "loss": 0.4184, "lr": 1.582467447343355e-05, "epoch": 3.678944974988631, "percentage": 73.59, "elapsed_time": "22:28:42", "remaining_time": "8:03:58"} +{"current_steps": 759, "total_steps": 1030, "loss": 0.4158, "lr": 1.5716814052994928e-05, "epoch": 3.683795664696074, "percentage": 73.69, "elapsed_time": "22:32:37", "remaining_time": "8:02:57"} +{"current_steps": 760, "total_steps": 1030, "loss": 0.405, "lr": 1.5609232530637827e-05, "epoch": 3.6886463544035166, "percentage": 73.79, "elapsed_time": "22:36:30", "remaining_time": "8:01:55"} +{"current_steps": 761, "total_steps": 1030, "loss": 0.4149, "lr": 1.5501931141961278e-05, "epoch": 3.6934970441109596, "percentage": 73.88, "elapsed_time": "22:40:24", "remaining_time": "8:00:52"} +{"current_steps": 762, "total_steps": 1030, "loss": 0.4106, "lr": 1.539491111934686e-05, "epoch": 3.6983477338184025, "percentage": 73.98, "elapsed_time": "22:44:18", "remaining_time": "7:59:50"} +{"current_steps": 763, "total_steps": 1030, "loss": 0.4187, "lr": 1.5288173691944613e-05, "epoch": 3.703198423525845, "percentage": 74.08, "elapsed_time": "22:48:12", "remaining_time": "7:58:47"} +{"current_steps": 764, "total_steps": 1030, "loss": 0.4132, "lr": 1.5181720085658906e-05, "epoch": 3.708049113233288, "percentage": 74.17, "elapsed_time": "22:52:06", "remaining_time": "7:57:43"} +{"current_steps": 765, "total_steps": 1030, "loss": 0.4113, "lr": 1.5075551523134358e-05, "epoch": 3.7128998029407305, "percentage": 74.27, "elapsed_time": "22:56:00", "remaining_time": "7:56:39"} +{"current_steps": 766, "total_steps": 1030, "loss": 0.4085, "lr": 1.4969669223741771e-05, "epoch": 3.7177504926481735, "percentage": 74.37, "elapsed_time": "22:59:53", "remaining_time": "7:55:34"} +{"current_steps": 767, "total_steps": 1030, "loss": 0.4169, "lr": 1.4864074403564216e-05, "epoch": 3.722601182355616, "percentage": 74.47, "elapsed_time": "23:03:46", "remaining_time": "7:54:29"} +{"current_steps": 768, "total_steps": 1030, "loss": 0.4178, "lr": 1.4758768275382887e-05, "epoch": 3.727451872063059, "percentage": 74.56, "elapsed_time": "23:07:40", "remaining_time": "7:53:24"} +{"current_steps": 769, "total_steps": 1030, "loss": 0.4137, "lr": 1.4653752048663394e-05, "epoch": 3.732302561770502, "percentage": 74.66, "elapsed_time": "23:11:34", "remaining_time": "7:52:18"} +{"current_steps": 770, "total_steps": 1030, "loss": 0.4149, "lr": 1.4549026929541693e-05, "epoch": 3.7371532514779444, "percentage": 74.76, "elapsed_time": "23:15:28", "remaining_time": "7:51:11"} +{"current_steps": 771, "total_steps": 1030, "loss": 0.4122, "lr": 1.4444594120810326e-05, "epoch": 3.7420039411853874, "percentage": 74.85, "elapsed_time": "23:19:21", "remaining_time": "7:50:04"} +{"current_steps": 772, "total_steps": 1030, "loss": 0.4209, "lr": 1.4340454821904573e-05, "epoch": 3.7468546308928303, "percentage": 74.95, "elapsed_time": "23:23:14", "remaining_time": "7:48:57"} +{"current_steps": 773, "total_steps": 1030, "loss": 0.4133, "lr": 1.4236610228888683e-05, "epoch": 3.751705320600273, "percentage": 75.05, "elapsed_time": "23:27:08", "remaining_time": "7:47:50"} +{"current_steps": 774, "total_steps": 1030, "loss": 0.4121, "lr": 1.4133061534442133e-05, "epoch": 3.7565560103077154, "percentage": 75.15, "elapsed_time": "23:31:02", "remaining_time": "7:46:42"} +{"current_steps": 775, "total_steps": 1030, "loss": 0.4152, "lr": 1.4029809927845981e-05, "epoch": 3.7614067000151583, "percentage": 75.24, "elapsed_time": "23:34:57", "remaining_time": "7:45:33"} +{"current_steps": 776, "total_steps": 1030, "loss": 0.4125, "lr": 1.3926856594969115e-05, "epoch": 3.7662573897226013, "percentage": 75.34, "elapsed_time": "23:38:51", "remaining_time": "7:44:25"} +{"current_steps": 777, "total_steps": 1030, "loss": 0.411, "lr": 1.3824202718254655e-05, "epoch": 3.771108079430044, "percentage": 75.44, "elapsed_time": "23:42:45", "remaining_time": "7:43:15"} +{"current_steps": 778, "total_steps": 1030, "loss": 0.4108, "lr": 1.3721849476706477e-05, "epoch": 3.7759587691374867, "percentage": 75.53, "elapsed_time": "23:46:38", "remaining_time": "7:42:06"} +{"current_steps": 779, "total_steps": 1030, "loss": 0.4133, "lr": 1.3619798045875529e-05, "epoch": 3.7808094588449297, "percentage": 75.63, "elapsed_time": "23:50:33", "remaining_time": "7:40:56"} +{"current_steps": 780, "total_steps": 1030, "loss": 0.4088, "lr": 1.3518049597846412e-05, "epoch": 3.785660148552372, "percentage": 75.73, "elapsed_time": "23:54:28", "remaining_time": "7:39:45"} +{"current_steps": 619, "total_steps": 1030, "loss": 0.4186, "lr": 3.2920612937336035e-05, "epoch": 3.004850689707443, "percentage": 60.1, "elapsed_time": "0:04:11", "remaining_time": "0:02:46"} +{"current_steps": 620, "total_steps": 1030, "loss": 0.4198, "lr": 3.2787234289768816e-05, "epoch": 3.0097013794148855, "percentage": 60.19, "elapsed_time": "0:08:04", "remaining_time": "0:05:20"} +{"current_steps": 621, "total_steps": 1030, "loss": 0.4257, "lr": 3.2653938482506125e-05, "epoch": 3.0145520691223284, "percentage": 60.29, "elapsed_time": "0:11:58", "remaining_time": "0:07:53"} +{"current_steps": 622, "total_steps": 1030, "loss": 0.4165, "lr": 3.252072704648157e-05, "epoch": 3.019402758829771, "percentage": 60.39, "elapsed_time": "0:15:52", "remaining_time": "0:10:24"} +{"current_steps": 623, "total_steps": 1030, "loss": 0.4099, "lr": 3.2387601511659695e-05, "epoch": 3.024253448537214, "percentage": 60.49, "elapsed_time": "0:19:45", "remaining_time": "0:12:54"} +{"current_steps": 624, "total_steps": 1030, "loss": 0.4152, "lr": 3.22545634070185e-05, "epoch": 3.029104138244657, "percentage": 60.58, "elapsed_time": "0:23:39", "remaining_time": "0:15:23"} +{"current_steps": 625, "total_steps": 1030, "loss": 0.4128, "lr": 3.212161426053177e-05, "epoch": 3.0339548279520994, "percentage": 60.68, "elapsed_time": "0:27:32", "remaining_time": "0:17:51"} +{"current_steps": 626, "total_steps": 1030, "loss": 0.4129, "lr": 3.19887555991516e-05, "epoch": 3.0388055176595423, "percentage": 60.78, "elapsed_time": "0:31:26", "remaining_time": "0:20:17"} +{"current_steps": 627, "total_steps": 1030, "loss": 0.419, "lr": 3.1855988948790866e-05, "epoch": 3.043656207366985, "percentage": 60.87, "elapsed_time": "0:35:19", "remaining_time": "0:22:42"} +{"current_steps": 628, "total_steps": 1030, "loss": 0.4179, "lr": 3.172331583430567e-05, "epoch": 3.048506897074428, "percentage": 60.97, "elapsed_time": "0:39:13", "remaining_time": "0:25:06"} +{"current_steps": 629, "total_steps": 1030, "loss": 0.4187, "lr": 3.1590737779477825e-05, "epoch": 3.0533575867818707, "percentage": 61.07, "elapsed_time": "0:43:07", "remaining_time": "0:27:29"} +{"current_steps": 630, "total_steps": 1030, "loss": 0.4145, "lr": 3.145825630699734e-05, "epoch": 3.0582082764893133, "percentage": 61.17, "elapsed_time": "0:47:00", "remaining_time": "0:29:51"} +{"current_steps": 631, "total_steps": 1030, "loss": 0.4269, "lr": 3.1325872938444995e-05, "epoch": 3.063058966196756, "percentage": 61.26, "elapsed_time": "0:50:54", "remaining_time": "0:32:11"} +{"current_steps": 632, "total_steps": 1030, "loss": 0.4189, "lr": 3.119358919427478e-05, "epoch": 3.0679096559041987, "percentage": 61.36, "elapsed_time": "0:54:48", "remaining_time": "0:34:30"} +{"current_steps": 633, "total_steps": 1030, "loss": 0.4218, "lr": 3.106140659379652e-05, "epoch": 3.0727603456116417, "percentage": 61.46, "elapsed_time": "0:58:41", "remaining_time": "0:36:48"} +{"current_steps": 634, "total_steps": 1030, "loss": 0.4142, "lr": 3.092932665515837e-05, "epoch": 3.0776110353190846, "percentage": 61.55, "elapsed_time": "1:02:35", "remaining_time": "0:39:05"} +{"current_steps": 635, "total_steps": 1030, "loss": 0.4092, "lr": 3.079735089532935e-05, "epoch": 3.082461725026527, "percentage": 61.65, "elapsed_time": "1:06:28", "remaining_time": "0:41:21"} +{"current_steps": 636, "total_steps": 1030, "loss": 0.4176, "lr": 3.0665480830082e-05, "epoch": 3.08731241473397, "percentage": 61.75, "elapsed_time": "1:10:22", "remaining_time": "0:43:36"} +{"current_steps": 637, "total_steps": 1030, "loss": 0.4171, "lr": 3.0533717973974924e-05, "epoch": 3.0921631044414126, "percentage": 61.84, "elapsed_time": "1:14:16", "remaining_time": "0:45:49"} +{"current_steps": 638, "total_steps": 1030, "loss": 0.4142, "lr": 3.040206384033542e-05, "epoch": 3.0970137941488556, "percentage": 61.94, "elapsed_time": "1:18:09", "remaining_time": "0:48:01"} +{"current_steps": 639, "total_steps": 1030, "loss": 0.4045, "lr": 3.0270519941242052e-05, "epoch": 3.101864483856298, "percentage": 62.04, "elapsed_time": "1:22:03", "remaining_time": "0:50:12"} +{"current_steps": 640, "total_steps": 1030, "loss": 0.4162, "lr": 3.0139087787507323e-05, "epoch": 3.106715173563741, "percentage": 62.14, "elapsed_time": "1:25:57", "remaining_time": "0:52:22"} +{"current_steps": 641, "total_steps": 1030, "loss": 0.4162, "lr": 3.0007768888660337e-05, "epoch": 3.111565863271184, "percentage": 62.23, "elapsed_time": "1:29:50", "remaining_time": "0:54:31"} +{"current_steps": 642, "total_steps": 1030, "loss": 0.423, "lr": 2.9876564752929406e-05, "epoch": 3.1164165529786265, "percentage": 62.33, "elapsed_time": "1:33:43", "remaining_time": "0:56:38"} +{"current_steps": 643, "total_steps": 1030, "loss": 0.4186, "lr": 2.9745476887224806e-05, "epoch": 3.1212672426860695, "percentage": 62.43, "elapsed_time": "1:37:36", "remaining_time": "0:58:45"} +{"current_steps": 644, "total_steps": 1030, "loss": 0.4149, "lr": 2.961450679712135e-05, "epoch": 3.1261179323935124, "percentage": 62.52, "elapsed_time": "1:41:31", "remaining_time": "1:00:51"} +{"current_steps": 645, "total_steps": 1030, "loss": 0.4185, "lr": 2.9483655986841265e-05, "epoch": 3.130968622100955, "percentage": 62.62, "elapsed_time": "1:45:25", "remaining_time": "1:02:55"} +{"current_steps": 646, "total_steps": 1030, "loss": 0.4199, "lr": 2.9352925959236732e-05, "epoch": 3.135819311808398, "percentage": 62.72, "elapsed_time": "1:49:19", "remaining_time": "1:04:58"} +{"current_steps": 647, "total_steps": 1030, "loss": 0.4187, "lr": 2.92223182157728e-05, "epoch": 3.1406700015158404, "percentage": 62.82, "elapsed_time": "1:53:13", "remaining_time": "1:07:01"} +{"current_steps": 648, "total_steps": 1030, "loss": 0.4144, "lr": 2.909183425650996e-05, "epoch": 3.1455206912232834, "percentage": 62.91, "elapsed_time": "1:57:08", "remaining_time": "1:09:03"} +{"current_steps": 649, "total_steps": 1030, "loss": 0.4065, "lr": 2.8961475580087108e-05, "epoch": 3.150371380930726, "percentage": 63.01, "elapsed_time": "2:01:01", "remaining_time": "1:11:02"} +{"current_steps": 650, "total_steps": 1030, "loss": 0.4167, "lr": 2.8831243683704162e-05, "epoch": 3.155222070638169, "percentage": 63.11, "elapsed_time": "2:04:54", "remaining_time": "1:13:01"} +{"current_steps": 651, "total_steps": 1030, "loss": 0.4163, "lr": 2.8701140063104996e-05, "epoch": 3.160072760345612, "percentage": 63.2, "elapsed_time": "2:08:48", "remaining_time": "1:14:59"} +{"current_steps": 652, "total_steps": 1030, "loss": 0.4066, "lr": 2.857116621256018e-05, "epoch": 3.1649234500530543, "percentage": 63.3, "elapsed_time": "2:12:42", "remaining_time": "1:16:56"} +{"current_steps": 653, "total_steps": 1030, "loss": 0.4073, "lr": 2.8441323624849827e-05, "epoch": 3.1697741397604973, "percentage": 63.4, "elapsed_time": "2:16:35", "remaining_time": "1:18:51"} +{"current_steps": 654, "total_steps": 1030, "loss": 0.4148, "lr": 2.83116137912465e-05, "epoch": 3.17462482946794, "percentage": 63.5, "elapsed_time": "2:20:28", "remaining_time": "1:20:46"} +{"current_steps": 655, "total_steps": 1030, "loss": 0.4185, "lr": 2.8182038201498038e-05, "epoch": 3.1794755191753827, "percentage": 63.59, "elapsed_time": "2:24:22", "remaining_time": "1:22:39"} +{"current_steps": 656, "total_steps": 1030, "loss": 0.4084, "lr": 2.8052598343810474e-05, "epoch": 3.1843262088828257, "percentage": 63.69, "elapsed_time": "2:28:15", "remaining_time": "1:24:31"} +{"current_steps": 657, "total_steps": 1030, "loss": 0.4209, "lr": 2.7923295704830868e-05, "epoch": 3.189176898590268, "percentage": 63.79, "elapsed_time": "2:32:08", "remaining_time": "1:26:22"} +{"current_steps": 658, "total_steps": 1030, "loss": 0.4203, "lr": 2.7794131769630355e-05, "epoch": 3.194027588297711, "percentage": 63.88, "elapsed_time": "2:36:02", "remaining_time": "1:28:13"} +{"current_steps": 659, "total_steps": 1030, "loss": 0.4229, "lr": 2.7665108021687007e-05, "epoch": 3.1988782780051537, "percentage": 63.98, "elapsed_time": "2:39:57", "remaining_time": "1:30:02"} +{"current_steps": 660, "total_steps": 1030, "loss": 0.4145, "lr": 2.753622594286879e-05, "epoch": 3.2037289677125966, "percentage": 64.08, "elapsed_time": "2:43:50", "remaining_time": "1:31:51"} +{"current_steps": 661, "total_steps": 1030, "loss": 0.4083, "lr": 2.7407487013416615e-05, "epoch": 3.2085796574200396, "percentage": 64.17, "elapsed_time": "2:47:43", "remaining_time": "1:33:37"} +{"current_steps": 662, "total_steps": 1030, "loss": 0.4187, "lr": 2.727889271192722e-05, "epoch": 3.213430347127482, "percentage": 64.27, "elapsed_time": "2:51:37", "remaining_time": "1:35:24"} +{"current_steps": 663, "total_steps": 1030, "loss": 0.4164, "lr": 2.715044451533631e-05, "epoch": 3.218281036834925, "percentage": 64.37, "elapsed_time": "2:55:31", "remaining_time": "1:37:09"} +{"current_steps": 664, "total_steps": 1030, "loss": 0.413, "lr": 2.702214389890152e-05, "epoch": 3.2231317265423676, "percentage": 64.47, "elapsed_time": "2:59:25", "remaining_time": "1:38:53"} +{"current_steps": 665, "total_steps": 1030, "loss": 0.4035, "lr": 2.6893992336185512e-05, "epoch": 3.2279824162498105, "percentage": 64.56, "elapsed_time": "3:03:19", "remaining_time": "1:40:37"} +{"current_steps": 666, "total_steps": 1030, "loss": 0.4145, "lr": 2.6765991299039025e-05, "epoch": 3.2328331059572535, "percentage": 64.66, "elapsed_time": "3:07:12", "remaining_time": "1:42:19"} +{"current_steps": 667, "total_steps": 1030, "loss": 0.4117, "lr": 2.663814225758393e-05, "epoch": 3.237683795664696, "percentage": 64.76, "elapsed_time": "3:11:07", "remaining_time": "1:44:00"} +{"current_steps": 668, "total_steps": 1030, "loss": 0.4195, "lr": 2.6510446680196448e-05, "epoch": 3.242534485372139, "percentage": 64.85, "elapsed_time": "3:15:00", "remaining_time": "1:45:40"} +{"current_steps": 669, "total_steps": 1030, "loss": 0.4203, "lr": 2.638290603349023e-05, "epoch": 3.2473851750795815, "percentage": 64.95, "elapsed_time": "3:18:54", "remaining_time": "1:47:20"} +{"current_steps": 670, "total_steps": 1030, "loss": 0.4159, "lr": 2.625552178229949e-05, "epoch": 3.2522358647870244, "percentage": 65.05, "elapsed_time": "3:22:49", "remaining_time": "1:48:58"} +{"current_steps": 671, "total_steps": 1030, "loss": 0.4111, "lr": 2.612829538966218e-05, "epoch": 3.2570865544944674, "percentage": 65.15, "elapsed_time": "3:26:43", "remaining_time": "1:50:36"} +{"current_steps": 672, "total_steps": 1030, "loss": 0.4196, "lr": 2.6001228316803256e-05, "epoch": 3.26193724420191, "percentage": 65.24, "elapsed_time": "3:30:36", "remaining_time": "1:52:12"} +{"current_steps": 673, "total_steps": 1030, "loss": 0.4162, "lr": 2.5874322023117824e-05, "epoch": 3.266787933909353, "percentage": 65.34, "elapsed_time": "3:34:29", "remaining_time": "1:53:46"} +{"current_steps": 674, "total_steps": 1030, "loss": 0.4165, "lr": 2.5747577966154404e-05, "epoch": 3.2716386236167954, "percentage": 65.44, "elapsed_time": "3:38:23", "remaining_time": "1:55:20"} +{"current_steps": 675, "total_steps": 1030, "loss": 0.4076, "lr": 2.5620997601598215e-05, "epoch": 3.2764893133242383, "percentage": 65.53, "elapsed_time": "3:42:16", "remaining_time": "1:56:53"} +{"current_steps": 676, "total_steps": 1030, "loss": 0.4174, "lr": 2.5494582383254388e-05, "epoch": 3.281340003031681, "percentage": 65.63, "elapsed_time": "3:46:09", "remaining_time": "1:58:25"} +{"current_steps": 677, "total_steps": 1030, "loss": 0.4131, "lr": 2.5368333763031324e-05, "epoch": 3.286190692739124, "percentage": 65.73, "elapsed_time": "3:50:03", "remaining_time": "1:59:57"} +{"current_steps": 678, "total_steps": 1030, "loss": 0.4092, "lr": 2.5242253190924034e-05, "epoch": 3.2910413824465667, "percentage": 65.83, "elapsed_time": "3:53:56", "remaining_time": "2:01:27"} +{"current_steps": 679, "total_steps": 1030, "loss": 0.409, "lr": 2.5116342114997442e-05, "epoch": 3.2958920721540093, "percentage": 65.92, "elapsed_time": "3:57:51", "remaining_time": "2:02:57"} +{"current_steps": 680, "total_steps": 1030, "loss": 0.4201, "lr": 2.4990601981369737e-05, "epoch": 3.300742761861452, "percentage": 66.02, "elapsed_time": "4:01:44", "remaining_time": "2:04:25"} +{"current_steps": 681, "total_steps": 1030, "loss": 0.4107, "lr": 2.4865034234195834e-05, "epoch": 3.305593451568895, "percentage": 66.12, "elapsed_time": "4:05:37", "remaining_time": "2:05:52"} +{"current_steps": 682, "total_steps": 1030, "loss": 0.4145, "lr": 2.4739640315650747e-05, "epoch": 3.3104441412763377, "percentage": 66.21, "elapsed_time": "4:09:31", "remaining_time": "2:07:19"} +{"current_steps": 683, "total_steps": 1030, "loss": 0.4213, "lr": 2.4614421665912997e-05, "epoch": 3.3152948309837806, "percentage": 66.31, "elapsed_time": "4:13:25", "remaining_time": "2:08:44"} +{"current_steps": 684, "total_steps": 1030, "loss": 0.4129, "lr": 2.4489379723148147e-05, "epoch": 3.320145520691223, "percentage": 66.41, "elapsed_time": "4:17:23", "remaining_time": "2:10:11"} +{"current_steps": 685, "total_steps": 1030, "loss": 0.4193, "lr": 2.4364515923492187e-05, "epoch": 3.324996210398666, "percentage": 66.5, "elapsed_time": "4:21:16", "remaining_time": "2:11:35"} +{"current_steps": 686, "total_steps": 1030, "loss": 0.418, "lr": 2.4239831701035143e-05, "epoch": 3.3298469001061086, "percentage": 66.6, "elapsed_time": "4:25:11", "remaining_time": "2:12:58"} +{"current_steps": 687, "total_steps": 1030, "loss": 0.4166, "lr": 2.411532848780451e-05, "epoch": 3.3346975898135516, "percentage": 66.7, "elapsed_time": "4:29:04", "remaining_time": "2:14:20"} +{"current_steps": 688, "total_steps": 1030, "loss": 0.4138, "lr": 2.399100771374888e-05, "epoch": 3.3395482795209945, "percentage": 66.8, "elapsed_time": "4:32:59", "remaining_time": "2:15:41"} +{"current_steps": 689, "total_steps": 1030, "loss": 0.4111, "lr": 2.3866870806721495e-05, "epoch": 3.344398969228437, "percentage": 66.89, "elapsed_time": "4:36:55", "remaining_time": "2:17:03"} +{"current_steps": 690, "total_steps": 1030, "loss": 0.42, "lr": 2.37429191924638e-05, "epoch": 3.34924965893588, "percentage": 66.99, "elapsed_time": "4:40:49", "remaining_time": "2:18:22"} +{"current_steps": 691, "total_steps": 1030, "loss": 0.417, "lr": 2.361915429458913e-05, "epoch": 3.354100348643323, "percentage": 67.09, "elapsed_time": "4:44:43", "remaining_time": "2:19:40"} +{"current_steps": 692, "total_steps": 1030, "loss": 0.4168, "lr": 2.349557753456637e-05, "epoch": 3.3589510383507655, "percentage": 67.18, "elapsed_time": "4:48:38", "remaining_time": "2:20:58"} +{"current_steps": 693, "total_steps": 1030, "loss": 0.4189, "lr": 2.3372190331703556e-05, "epoch": 3.3638017280582084, "percentage": 67.28, "elapsed_time": "4:52:32", "remaining_time": "2:22:15"} +{"current_steps": 694, "total_steps": 1030, "loss": 0.4125, "lr": 2.324899410313161e-05, "epoch": 3.368652417765651, "percentage": 67.38, "elapsed_time": "4:56:25", "remaining_time": "2:23:30"} +{"current_steps": 695, "total_steps": 1030, "loss": 0.4186, "lr": 2.3125990263788118e-05, "epoch": 3.373503107473094, "percentage": 67.48, "elapsed_time": "5:00:19", "remaining_time": "2:24:45"} +{"current_steps": 696, "total_steps": 1030, "loss": 0.4123, "lr": 2.3003180226400986e-05, "epoch": 3.3783537971805364, "percentage": 67.57, "elapsed_time": "5:04:13", "remaining_time": "2:25:59"} +{"current_steps": 697, "total_steps": 1030, "loss": 0.4129, "lr": 2.288056540147229e-05, "epoch": 3.3832044868879794, "percentage": 67.67, "elapsed_time": "5:08:06", "remaining_time": "2:27:12"} +{"current_steps": 698, "total_steps": 1030, "loss": 0.4133, "lr": 2.275814719726201e-05, "epoch": 3.3880551765954223, "percentage": 67.77, "elapsed_time": "5:12:01", "remaining_time": "2:28:24"} +{"current_steps": 699, "total_steps": 1030, "loss": 0.4219, "lr": 2.263592701977193e-05, "epoch": 3.392905866302865, "percentage": 67.86, "elapsed_time": "5:15:55", "remaining_time": "2:29:36"} +{"current_steps": 700, "total_steps": 1030, "loss": 0.4143, "lr": 2.2513906272729397e-05, "epoch": 3.397756556010308, "percentage": 67.96, "elapsed_time": "5:19:48", "remaining_time": "2:30:46"} +{"current_steps": 701, "total_steps": 1030, "loss": 0.4166, "lr": 2.239208635757133e-05, "epoch": 3.4026072457177503, "percentage": 68.06, "elapsed_time": "5:23:43", "remaining_time": "2:31:55"} +{"current_steps": 702, "total_steps": 1030, "loss": 0.4259, "lr": 2.2270468673428004e-05, "epoch": 3.4074579354251933, "percentage": 68.16, "elapsed_time": "5:27:37", "remaining_time": "2:33:04"} +{"current_steps": 703, "total_steps": 1030, "loss": 0.407, "lr": 2.2149054617106974e-05, "epoch": 3.412308625132636, "percentage": 68.25, "elapsed_time": "5:31:31", "remaining_time": "2:34:12"} +{"current_steps": 704, "total_steps": 1030, "loss": 0.4231, "lr": 2.2027845583077175e-05, "epoch": 3.4171593148400787, "percentage": 68.35, "elapsed_time": "5:35:24", "remaining_time": "2:35:19"} +{"current_steps": 705, "total_steps": 1030, "loss": 0.4069, "lr": 2.1906842963452757e-05, "epoch": 3.4220100045475217, "percentage": 68.45, "elapsed_time": "5:39:19", "remaining_time": "2:36:25"} +{"current_steps": 706, "total_steps": 1030, "loss": 0.4149, "lr": 2.178604814797715e-05, "epoch": 3.426860694254964, "percentage": 68.54, "elapsed_time": "5:43:13", "remaining_time": "2:37:30"} +{"current_steps": 707, "total_steps": 1030, "loss": 0.4125, "lr": 2.1665462524007162e-05, "epoch": 3.431711383962407, "percentage": 68.64, "elapsed_time": "5:47:07", "remaining_time": "2:38:35"} +{"current_steps": 708, "total_steps": 1030, "loss": 0.4216, "lr": 2.1545087476496903e-05, "epoch": 3.43656207366985, "percentage": 68.74, "elapsed_time": "5:51:01", "remaining_time": "2:39:38"} +{"current_steps": 709, "total_steps": 1030, "loss": 0.4227, "lr": 2.1424924387981996e-05, "epoch": 3.4414127633772926, "percentage": 68.83, "elapsed_time": "5:54:54", "remaining_time": "2:40:41"} +{"current_steps": 710, "total_steps": 1030, "loss": 0.4116, "lr": 2.1304974638563715e-05, "epoch": 3.4462634530847356, "percentage": 68.93, "elapsed_time": "5:58:48", "remaining_time": "2:41:43"} +{"current_steps": 711, "total_steps": 1030, "loss": 0.4217, "lr": 2.1185239605893013e-05, "epoch": 3.451114142792178, "percentage": 69.03, "elapsed_time": "6:02:41", "remaining_time": "2:42:43"} +{"current_steps": 712, "total_steps": 1030, "loss": 0.4193, "lr": 2.106572066515482e-05, "epoch": 3.455964832499621, "percentage": 69.13, "elapsed_time": "6:06:35", "remaining_time": "2:43:43"} +{"current_steps": 713, "total_steps": 1030, "loss": 0.4147, "lr": 2.0946419189052162e-05, "epoch": 3.460815522207064, "percentage": 69.22, "elapsed_time": "6:10:28", "remaining_time": "2:44:43"} +{"current_steps": 714, "total_steps": 1030, "loss": 0.4214, "lr": 2.0827336547790452e-05, "epoch": 3.4656662119145065, "percentage": 69.32, "elapsed_time": "6:14:23", "remaining_time": "2:45:41"} +{"current_steps": 715, "total_steps": 1030, "loss": 0.416, "lr": 2.0708474109061752e-05, "epoch": 3.4705169016219495, "percentage": 69.42, "elapsed_time": "6:18:16", "remaining_time": "2:46:39"} +{"current_steps": 716, "total_steps": 1030, "loss": 0.4001, "lr": 2.0589833238029032e-05, "epoch": 3.475367591329392, "percentage": 69.51, "elapsed_time": "6:22:12", "remaining_time": "2:47:37"} +{"current_steps": 717, "total_steps": 1030, "loss": 0.4158, "lr": 2.0471415297310455e-05, "epoch": 3.480218281036835, "percentage": 69.61, "elapsed_time": "6:26:05", "remaining_time": "2:48:32"} +{"current_steps": 718, "total_steps": 1030, "loss": 0.41, "lr": 2.0353221646963864e-05, "epoch": 3.485068970744278, "percentage": 69.71, "elapsed_time": "6:29:58", "remaining_time": "2:49:27"} +{"current_steps": 719, "total_steps": 1030, "loss": 0.4226, "lr": 2.0235253644471012e-05, "epoch": 3.4899196604517204, "percentage": 69.81, "elapsed_time": "6:33:52", "remaining_time": "2:50:22"} +{"current_steps": 720, "total_steps": 1030, "loss": 0.4163, "lr": 2.011751264472206e-05, "epoch": 3.4947703501591634, "percentage": 69.9, "elapsed_time": "6:37:45", "remaining_time": "2:51:15"} +{"current_steps": 721, "total_steps": 1030, "loss": 0.4185, "lr": 2.0000000000000012e-05, "epoch": 3.499621039866606, "percentage": 70.0, "elapsed_time": "6:41:39", "remaining_time": "2:52:08"} +{"current_steps": 722, "total_steps": 1030, "loss": 0.4243, "lr": 1.9882717059965086e-05, "epoch": 3.504471729574049, "percentage": 70.1, "elapsed_time": "6:45:33", "remaining_time": "2:53:00"} +{"current_steps": 723, "total_steps": 1030, "loss": 0.4139, "lr": 1.9765665171639345e-05, "epoch": 3.5093224192814914, "percentage": 70.19, "elapsed_time": "6:49:27", "remaining_time": "2:53:51"} +{"current_steps": 724, "total_steps": 1030, "loss": 0.4023, "lr": 1.964884567939118e-05, "epoch": 3.5141731089889343, "percentage": 70.29, "elapsed_time": "6:53:20", "remaining_time": "2:54:42"} +{"current_steps": 725, "total_steps": 1030, "loss": 0.416, "lr": 1.9532259924919823e-05, "epoch": 3.5190237986963773, "percentage": 70.39, "elapsed_time": "6:57:13", "remaining_time": "2:55:31"} +{"current_steps": 726, "total_steps": 1030, "loss": 0.4198, "lr": 1.9415909247239996e-05, "epoch": 3.52387448840382, "percentage": 70.49, "elapsed_time": "7:01:08", "remaining_time": "2:56:20"} +{"current_steps": 727, "total_steps": 1030, "loss": 0.4084, "lr": 1.9299794982666485e-05, "epoch": 3.5287251781112627, "percentage": 70.58, "elapsed_time": "7:05:01", "remaining_time": "2:57:08"} +{"current_steps": 728, "total_steps": 1030, "loss": 0.408, "lr": 1.9183918464798837e-05, "epoch": 3.5335758678187057, "percentage": 70.68, "elapsed_time": "7:08:55", "remaining_time": "2:57:55"} +{"current_steps": 729, "total_steps": 1030, "loss": 0.4131, "lr": 1.906828102450601e-05, "epoch": 3.538426557526148, "percentage": 70.78, "elapsed_time": "7:12:48", "remaining_time": "2:58:42"} +{"current_steps": 730, "total_steps": 1030, "loss": 0.4102, "lr": 1.895288398991114e-05, "epoch": 3.543277247233591, "percentage": 70.87, "elapsed_time": "7:16:42", "remaining_time": "2:59:28"} +{"current_steps": 731, "total_steps": 1030, "loss": 0.4176, "lr": 1.8837728686376158e-05, "epoch": 3.5481279369410337, "percentage": 70.97, "elapsed_time": "7:20:36", "remaining_time": "3:00:13"} +{"current_steps": 732, "total_steps": 1030, "loss": 0.4238, "lr": 1.8722816436486754e-05, "epoch": 3.5529786266484766, "percentage": 71.07, "elapsed_time": "7:24:29", "remaining_time": "3:00:57"} +{"current_steps": 733, "total_steps": 1030, "loss": 0.4248, "lr": 1.8608148560037036e-05, "epoch": 3.557829316355919, "percentage": 71.17, "elapsed_time": "7:28:23", "remaining_time": "3:01:40"} +{"current_steps": 734, "total_steps": 1030, "loss": 0.4047, "lr": 1.8493726374014442e-05, "epoch": 3.562680006063362, "percentage": 71.26, "elapsed_time": "7:32:16", "remaining_time": "3:02:23"} +{"current_steps": 735, "total_steps": 1030, "loss": 0.4105, "lr": 1.8379551192584588e-05, "epoch": 3.567530695770805, "percentage": 71.36, "elapsed_time": "7:36:11", "remaining_time": "3:03:05"} +{"current_steps": 736, "total_steps": 1030, "loss": 0.4158, "lr": 1.826562432707619e-05, "epoch": 3.5723813854782476, "percentage": 71.46, "elapsed_time": "7:40:04", "remaining_time": "3:03:46"} +{"current_steps": 737, "total_steps": 1030, "loss": 0.4157, "lr": 1.8151947085965994e-05, "epoch": 3.5772320751856905, "percentage": 71.55, "elapsed_time": "7:43:57", "remaining_time": "3:04:26"} +{"current_steps": 738, "total_steps": 1030, "loss": 0.4144, "lr": 1.803852077486377e-05, "epoch": 3.5820827648931335, "percentage": 71.65, "elapsed_time": "7:47:51", "remaining_time": "3:05:06"} +{"current_steps": 739, "total_steps": 1030, "loss": 0.4082, "lr": 1.7925346696497295e-05, "epoch": 3.586933454600576, "percentage": 71.75, "elapsed_time": "7:51:44", "remaining_time": "3:05:45"} +{"current_steps": 740, "total_steps": 1030, "loss": 0.4137, "lr": 1.781242615069733e-05, "epoch": 3.591784144308019, "percentage": 71.84, "elapsed_time": "7:55:38", "remaining_time": "3:06:24"} +{"current_steps": 741, "total_steps": 1030, "loss": 0.4108, "lr": 1.7699760434382853e-05, "epoch": 3.5966348340154615, "percentage": 71.94, "elapsed_time": "7:59:31", "remaining_time": "3:07:01"} +{"current_steps": 742, "total_steps": 1030, "loss": 0.4189, "lr": 1.758735084154601e-05, "epoch": 3.6014855237229044, "percentage": 72.04, "elapsed_time": "8:03:25", "remaining_time": "3:07:38"} +{"current_steps": 743, "total_steps": 1030, "loss": 0.4123, "lr": 1.7475198663237297e-05, "epoch": 3.606336213430347, "percentage": 72.14, "elapsed_time": "8:07:19", "remaining_time": "3:08:14"} +{"current_steps": 744, "total_steps": 1030, "loss": 0.4158, "lr": 1.736330518755082e-05, "epoch": 3.61118690313779, "percentage": 72.23, "elapsed_time": "8:11:12", "remaining_time": "3:08:49"} +{"current_steps": 745, "total_steps": 1030, "loss": 0.4182, "lr": 1.7251671699609313e-05, "epoch": 3.616037592845233, "percentage": 72.33, "elapsed_time": "8:15:06", "remaining_time": "3:09:24"} +{"current_steps": 746, "total_steps": 1030, "loss": 0.4213, "lr": 1.7140299481549557e-05, "epoch": 3.6208882825526754, "percentage": 72.43, "elapsed_time": "8:18:59", "remaining_time": "3:09:57"} +{"current_steps": 747, "total_steps": 1030, "loss": 0.4224, "lr": 1.7029189812507603e-05, "epoch": 3.6257389722601183, "percentage": 72.52, "elapsed_time": "8:22:52", "remaining_time": "3:10:30"} +{"current_steps": 748, "total_steps": 1030, "loss": 0.4106, "lr": 1.6918343968604027e-05, "epoch": 3.6305896619675613, "percentage": 72.62, "elapsed_time": "8:26:46", "remaining_time": "3:11:03"} +{"current_steps": 749, "total_steps": 1030, "loss": 0.408, "lr": 1.6807763222929315e-05, "epoch": 3.635440351675004, "percentage": 72.72, "elapsed_time": "8:30:39", "remaining_time": "3:11:35"} +{"current_steps": 750, "total_steps": 1030, "loss": 0.4169, "lr": 1.669744884552926e-05, "epoch": 3.6402910413824463, "percentage": 72.82, "elapsed_time": "8:34:32", "remaining_time": "3:12:05"} +{"current_steps": 751, "total_steps": 1030, "loss": 0.4162, "lr": 1.6587402103390314e-05, "epoch": 3.6451417310898893, "percentage": 72.91, "elapsed_time": "8:38:26", "remaining_time": "3:12:36"} +{"current_steps": 752, "total_steps": 1030, "loss": 0.4179, "lr": 1.6477624260425137e-05, "epoch": 3.649992420797332, "percentage": 73.01, "elapsed_time": "8:42:20", "remaining_time": "3:13:05"} +{"current_steps": 753, "total_steps": 1030, "loss": 0.4124, "lr": 1.6368116577457973e-05, "epoch": 3.6548431105047747, "percentage": 73.11, "elapsed_time": "8:46:13", "remaining_time": "3:13:34"} +{"current_steps": 754, "total_steps": 1030, "loss": 0.4152, "lr": 1.6258880312210195e-05, "epoch": 3.6596938002122177, "percentage": 73.2, "elapsed_time": "8:50:07", "remaining_time": "3:14:02"} +{"current_steps": 755, "total_steps": 1030, "loss": 0.4147, "lr": 1.6149916719285942e-05, "epoch": 3.6645444899196606, "percentage": 73.3, "elapsed_time": "8:54:00", "remaining_time": "3:14:30"} +{"current_steps": 756, "total_steps": 1030, "loss": 0.4096, "lr": 1.6041227050157607e-05, "epoch": 3.669395179627103, "percentage": 73.4, "elapsed_time": "8:57:53", "remaining_time": "3:14:56"} +{"current_steps": 757, "total_steps": 1030, "loss": 0.4128, "lr": 1.5932812553151506e-05, "epoch": 3.674245869334546, "percentage": 73.5, "elapsed_time": "9:01:47", "remaining_time": "3:15:23"} +{"current_steps": 758, "total_steps": 1030, "loss": 0.4179, "lr": 1.582467447343355e-05, "epoch": 3.6790965590419886, "percentage": 73.59, "elapsed_time": "9:05:40", "remaining_time": "3:15:48"} +{"current_steps": 759, "total_steps": 1030, "loss": 0.4153, "lr": 1.5716814052994928e-05, "epoch": 3.6839472487494316, "percentage": 73.69, "elapsed_time": "9:09:33", "remaining_time": "3:16:13"} +{"current_steps": 760, "total_steps": 1030, "loss": 0.4065, "lr": 1.5609232530637827e-05, "epoch": 3.688797938456874, "percentage": 73.79, "elapsed_time": "9:13:27", "remaining_time": "3:16:37"} +{"current_steps": 761, "total_steps": 1030, "loss": 0.4135, "lr": 1.5501931141961278e-05, "epoch": 3.693648628164317, "percentage": 73.88, "elapsed_time": "9:17:20", "remaining_time": "3:17:00"} +{"current_steps": 762, "total_steps": 1030, "loss": 0.4102, "lr": 1.539491111934686e-05, "epoch": 3.69849931787176, "percentage": 73.98, "elapsed_time": "9:21:14", "remaining_time": "3:17:23"} +{"current_steps": 763, "total_steps": 1030, "loss": 0.4193, "lr": 1.5288173691944613e-05, "epoch": 3.7033500075792025, "percentage": 74.08, "elapsed_time": "9:25:08", "remaining_time": "3:17:45"} +{"current_steps": 764, "total_steps": 1030, "loss": 0.4131, "lr": 1.5181720085658906e-05, "epoch": 3.7082006972866455, "percentage": 74.17, "elapsed_time": "9:29:02", "remaining_time": "3:18:07"} +{"current_steps": 765, "total_steps": 1030, "loss": 0.4107, "lr": 1.5075551523134358e-05, "epoch": 3.7130513869940884, "percentage": 74.27, "elapsed_time": "9:32:55", "remaining_time": "3:18:27"} +{"current_steps": 766, "total_steps": 1030, "loss": 0.4093, "lr": 1.4969669223741771e-05, "epoch": 3.717902076701531, "percentage": 74.37, "elapsed_time": "9:36:48", "remaining_time": "3:18:47"} +{"current_steps": 767, "total_steps": 1030, "loss": 0.4142, "lr": 1.4864074403564216e-05, "epoch": 3.722752766408974, "percentage": 74.47, "elapsed_time": "9:40:43", "remaining_time": "3:19:07"} +{"current_steps": 768, "total_steps": 1030, "loss": 0.4205, "lr": 1.4758768275382887e-05, "epoch": 3.7276034561164164, "percentage": 74.56, "elapsed_time": "9:44:36", "remaining_time": "3:19:26"} +{"current_steps": 769, "total_steps": 1030, "loss": 0.412, "lr": 1.4653752048663394e-05, "epoch": 3.7324541458238594, "percentage": 74.66, "elapsed_time": "9:48:30", "remaining_time": "3:19:44"} +{"current_steps": 770, "total_steps": 1030, "loss": 0.4148, "lr": 1.4549026929541693e-05, "epoch": 3.737304835531302, "percentage": 74.76, "elapsed_time": "9:52:24", "remaining_time": "3:20:02"} +{"current_steps": 771, "total_steps": 1030, "loss": 0.4115, "lr": 1.4444594120810326e-05, "epoch": 3.742155525238745, "percentage": 74.85, "elapsed_time": "9:56:17", "remaining_time": "3:20:18"} +{"current_steps": 772, "total_steps": 1030, "loss": 0.4194, "lr": 1.4340454821904573e-05, "epoch": 3.747006214946188, "percentage": 74.95, "elapsed_time": "10:00:10", "remaining_time": "3:20:34"} +{"current_steps": 773, "total_steps": 1030, "loss": 0.4143, "lr": 1.4236610228888683e-05, "epoch": 3.7518569046536303, "percentage": 75.05, "elapsed_time": "10:04:05", "remaining_time": "3:20:50"} +{"current_steps": 774, "total_steps": 1030, "loss": 0.4121, "lr": 1.4133061534442133e-05, "epoch": 3.7567075943610733, "percentage": 75.15, "elapsed_time": "10:07:59", "remaining_time": "3:21:05"} +{"current_steps": 775, "total_steps": 1030, "loss": 0.4146, "lr": 1.4029809927845981e-05, "epoch": 3.7615582840685162, "percentage": 75.24, "elapsed_time": "10:11:53", "remaining_time": "3:21:19"} +{"current_steps": 776, "total_steps": 1030, "loss": 0.4125, "lr": 1.3926856594969115e-05, "epoch": 3.7664089737759587, "percentage": 75.34, "elapsed_time": "10:15:47", "remaining_time": "3:21:33"} +{"current_steps": 777, "total_steps": 1030, "loss": 0.4081, "lr": 1.3824202718254655e-05, "epoch": 3.7712596634834017, "percentage": 75.44, "elapsed_time": "10:19:40", "remaining_time": "3:21:46"} +{"current_steps": 778, "total_steps": 1030, "loss": 0.413, "lr": 1.3721849476706477e-05, "epoch": 3.776110353190844, "percentage": 75.53, "elapsed_time": "10:23:34", "remaining_time": "3:21:58"} +{"current_steps": 779, "total_steps": 1030, "loss": 0.4117, "lr": 1.3619798045875529e-05, "epoch": 3.780961042898287, "percentage": 75.63, "elapsed_time": "10:27:27", "remaining_time": "3:22:10"} +{"current_steps": 780, "total_steps": 1030, "loss": 0.4097, "lr": 1.3518049597846412e-05, "epoch": 3.7858117326057297, "percentage": 75.73, "elapsed_time": "10:31:21", "remaining_time": "3:22:21"} +{"current_steps": 781, "total_steps": 1030, "loss": 0.4146, "lr": 1.3416605301223893e-05, "epoch": 3.7906624223131726, "percentage": 75.83, "elapsed_time": "10:35:14", "remaining_time": "3:22:31"} +{"current_steps": 782, "total_steps": 1030, "loss": 0.415, "lr": 1.3315466321119486e-05, "epoch": 3.7955131120206156, "percentage": 75.92, "elapsed_time": "10:39:09", "remaining_time": "3:22:42"} +{"current_steps": 783, "total_steps": 1030, "loss": 0.4187, "lr": 1.3214633819138105e-05, "epoch": 3.800363801728058, "percentage": 76.02, "elapsed_time": "10:43:03", "remaining_time": "3:22:51"} +{"current_steps": 784, "total_steps": 1030, "loss": 0.4083, "lr": 1.3114108953364655e-05, "epoch": 3.805214491435501, "percentage": 76.12, "elapsed_time": "10:46:57", "remaining_time": "3:22:59"} +{"current_steps": 785, "total_steps": 1030, "loss": 0.415, "lr": 1.3013892878350771e-05, "epoch": 3.810065181142944, "percentage": 76.21, "elapsed_time": "10:50:51", "remaining_time": "3:23:08"} +{"current_steps": 786, "total_steps": 1030, "loss": 0.4082, "lr": 1.2913986745101567e-05, "epoch": 3.8149158708503865, "percentage": 76.31, "elapsed_time": "10:54:44", "remaining_time": "3:23:15"} +{"current_steps": 787, "total_steps": 1030, "loss": 0.416, "lr": 1.2814391701062392e-05, "epoch": 3.8197665605578295, "percentage": 76.41, "elapsed_time": "10:58:38", "remaining_time": "3:23:22"} +{"current_steps": 788, "total_steps": 1030, "loss": 0.4118, "lr": 1.2715108890105663e-05, "epoch": 3.824617250265272, "percentage": 76.5, "elapsed_time": "11:02:31", "remaining_time": "3:23:28"} +{"current_steps": 789, "total_steps": 1030, "loss": 0.4202, "lr": 1.2616139452517748e-05, "epoch": 3.829467939972715, "percentage": 76.6, "elapsed_time": "11:06:25", "remaining_time": "3:23:33"} +{"current_steps": 790, "total_steps": 1030, "loss": 0.414, "lr": 1.2517484524985836e-05, "epoch": 3.8343186296801575, "percentage": 76.7, "elapsed_time": "11:10:19", "remaining_time": "3:23:38"} +{"current_steps": 791, "total_steps": 1030, "loss": 0.4169, "lr": 1.2419145240584856e-05, "epoch": 3.8391693193876004, "percentage": 76.8, "elapsed_time": "11:14:12", "remaining_time": "3:23:42"} +{"current_steps": 792, "total_steps": 1030, "loss": 0.4121, "lr": 1.2321122728764566e-05, "epoch": 3.8440200090950434, "percentage": 76.89, "elapsed_time": "11:18:07", "remaining_time": "3:23:46"} +{"current_steps": 793, "total_steps": 1030, "loss": 0.4177, "lr": 1.222341811533648e-05, "epoch": 3.848870698802486, "percentage": 76.99, "elapsed_time": "11:22:00", "remaining_time": "3:23:49"} +{"current_steps": 794, "total_steps": 1030, "loss": 0.4211, "lr": 1.2126032522460975e-05, "epoch": 3.853721388509929, "percentage": 77.09, "elapsed_time": "11:25:54", "remaining_time": "3:23:52"} +{"current_steps": 795, "total_steps": 1030, "loss": 0.4204, "lr": 1.2028967068634417e-05, "epoch": 3.858572078217372, "percentage": 77.18, "elapsed_time": "11:29:49", "remaining_time": "3:23:54"} +{"current_steps": 796, "total_steps": 1030, "loss": 0.4119, "lr": 1.193222286867628e-05, "epoch": 3.8634227679248143, "percentage": 77.28, "elapsed_time": "11:33:43", "remaining_time": "3:23:55"} +{"current_steps": 797, "total_steps": 1030, "loss": 0.4086, "lr": 1.1835801033716372e-05, "epoch": 3.868273457632257, "percentage": 77.38, "elapsed_time": "11:37:37", "remaining_time": "3:23:56"} +{"current_steps": 798, "total_steps": 1030, "loss": 0.4214, "lr": 1.1739702671182083e-05, "epoch": 3.8731241473397, "percentage": 77.48, "elapsed_time": "11:41:31", "remaining_time": "3:23:57"} +{"current_steps": 799, "total_steps": 1030, "loss": 0.4095, "lr": 1.1643928884785618e-05, "epoch": 3.8779748370471427, "percentage": 77.57, "elapsed_time": "11:45:24", "remaining_time": "3:23:56"} +{"current_steps": 800, "total_steps": 1030, "loss": 0.4218, "lr": 1.1548480774511353e-05, "epoch": 3.8828255267545853, "percentage": 77.67, "elapsed_time": "11:49:18", "remaining_time": "3:23:55"} +{"current_steps": 801, "total_steps": 1030, "loss": 0.4218, "lr": 1.1453359436603213e-05, "epoch": 3.887676216462028, "percentage": 77.77, "elapsed_time": "11:53:13", "remaining_time": "3:23:54"} +{"current_steps": 802, "total_steps": 1030, "loss": 0.421, "lr": 1.1358565963552039e-05, "epoch": 3.892526906169471, "percentage": 77.86, "elapsed_time": "11:57:06", "remaining_time": "3:23:52"} +{"current_steps": 803, "total_steps": 1030, "loss": 0.4088, "lr": 1.126410144408312e-05, "epoch": 3.8973775958769137, "percentage": 77.96, "elapsed_time": "12:01:00", "remaining_time": "3:23:49"} +{"current_steps": 804, "total_steps": 1030, "loss": 0.4105, "lr": 1.1169966963143568e-05, "epoch": 3.9022282855843566, "percentage": 78.06, "elapsed_time": "12:04:55", "remaining_time": "3:23:46"} +{"current_steps": 805, "total_steps": 1030, "loss": 0.4114, "lr": 1.1076163601889953e-05, "epoch": 3.907078975291799, "percentage": 78.16, "elapsed_time": "12:08:48", "remaining_time": "3:23:42"} +{"current_steps": 806, "total_steps": 1030, "loss": 0.4099, "lr": 1.098269243767589e-05, "epoch": 3.911929664999242, "percentage": 78.25, "elapsed_time": "12:12:43", "remaining_time": "3:23:38"} +{"current_steps": 807, "total_steps": 1030, "loss": 0.417, "lr": 1.0889554544039593e-05, "epoch": 3.9167803547066846, "percentage": 78.35, "elapsed_time": "12:16:37", "remaining_time": "3:23:33"} +{"current_steps": 808, "total_steps": 1030, "loss": 0.4092, "lr": 1.0796750990691596e-05, "epoch": 3.9216310444141276, "percentage": 78.45, "elapsed_time": "12:20:31", "remaining_time": "3:23:27"} +{"current_steps": 809, "total_steps": 1030, "loss": 0.4156, "lr": 1.0704282843502459e-05, "epoch": 3.9264817341215705, "percentage": 78.54, "elapsed_time": "12:24:25", "remaining_time": "3:23:21"} +{"current_steps": 810, "total_steps": 1030, "loss": 0.4209, "lr": 1.0612151164490525e-05, "epoch": 3.931332423829013, "percentage": 78.64, "elapsed_time": "12:28:18", "remaining_time": "3:23:14"} +{"current_steps": 811, "total_steps": 1030, "loss": 0.4193, "lr": 1.0520357011809707e-05, "epoch": 3.936183113536456, "percentage": 78.74, "elapsed_time": "12:32:13", "remaining_time": "3:23:07"} +{"current_steps": 812, "total_steps": 1030, "loss": 0.415, "lr": 1.0428901439737387e-05, "epoch": 3.941033803243899, "percentage": 78.83, "elapsed_time": "12:36:07", "remaining_time": "3:22:59"} +{"current_steps": 813, "total_steps": 1030, "loss": 0.4152, "lr": 1.0337785498662223e-05, "epoch": 3.9458844929513415, "percentage": 78.93, "elapsed_time": "12:40:01", "remaining_time": "3:22:51"} +{"current_steps": 814, "total_steps": 1030, "loss": 0.4153, "lr": 1.024701023507216e-05, "epoch": 3.9507351826587844, "percentage": 79.03, "elapsed_time": "12:43:55", "remaining_time": "3:22:42"} +{"current_steps": 815, "total_steps": 1030, "loss": 0.4156, "lr": 1.015657669154237e-05, "epoch": 3.955585872366227, "percentage": 79.13, "elapsed_time": "12:47:49", "remaining_time": "3:22:33"} +{"current_steps": 816, "total_steps": 1030, "loss": 0.4109, "lr": 1.00664859067233e-05, "epoch": 3.96043656207367, "percentage": 79.22, "elapsed_time": "12:51:42", "remaining_time": "3:22:23"} +{"current_steps": 817, "total_steps": 1030, "loss": 0.4107, "lr": 9.976738915328719e-06, "epoch": 3.9652872517811124, "percentage": 79.32, "elapsed_time": "12:55:36", "remaining_time": "3:22:12"} +{"current_steps": 818, "total_steps": 1030, "loss": 0.4178, "lr": 9.887336748123864e-06, "epoch": 3.9701379414885554, "percentage": 79.42, "elapsed_time": "12:59:29", "remaining_time": "3:22:01"} +{"current_steps": 819, "total_steps": 1030, "loss": 0.4202, "lr": 9.798280431913558e-06, "epoch": 3.9749886311959983, "percentage": 79.51, "elapsed_time": "13:03:22", "remaining_time": "3:21:49"} +{"current_steps": 820, "total_steps": 1030, "loss": 0.4123, "lr": 9.709570989530493e-06, "epoch": 3.979839320903441, "percentage": 79.61, "elapsed_time": "13:07:16", "remaining_time": "3:21:37"} +{"current_steps": 821, "total_steps": 1030, "loss": 0.4132, "lr": 9.621209439823388e-06, "epoch": 3.984690010610884, "percentage": 79.71, "elapsed_time": "13:11:09", "remaining_time": "3:21:24"} +{"current_steps": 822, "total_steps": 1030, "loss": 0.4101, "lr": 9.533196797645354e-06, "epoch": 3.9895407003183267, "percentage": 79.81, "elapsed_time": "13:15:03", "remaining_time": "3:21:10"} +{"current_steps": 823, "total_steps": 1030, "loss": 0.412, "lr": 9.44553407384221e-06, "epoch": 3.9943913900257693, "percentage": 79.9, "elapsed_time": "13:18:56", "remaining_time": "3:20:56"} +{"current_steps": 824, "total_steps": 1030, "loss": 0.4113, "lr": 9.358222275240884e-06, "epoch": 3.999242079733212, "percentage": 80.0, "elapsed_time": "13:22:49", "remaining_time": "3:20:42"} +{"current_steps": 825, "total_steps": 1030, "loss": 0.8099, "lr": 9.271262404637835e-06, "epoch": 4.004699105654085, "percentage": 80.1, "elapsed_time": "13:27:13", "remaining_time": "3:20:35"} +{"current_steps": 826, "total_steps": 1030, "loss": 0.3979, "lr": 9.184655460787591e-06, "epoch": 4.009549795361528, "percentage": 80.19, "elapsed_time": "13:31:06", "remaining_time": "3:20:19"} +{"current_steps": 827, "total_steps": 1030, "loss": 0.3951, "lr": 9.098402438391161e-06, "epoch": 4.014400485068971, "percentage": 80.29, "elapsed_time": "13:35:00", "remaining_time": "3:20:03"} +{"current_steps": 828, "total_steps": 1030, "loss": 0.4017, "lr": 9.012504328084724e-06, "epoch": 4.0192511747764135, "percentage": 80.39, "elapsed_time": "13:38:53", "remaining_time": "3:19:46"} +{"current_steps": 829, "total_steps": 1030, "loss": 0.4025, "lr": 8.926962116428228e-06, "epoch": 4.024101864483856, "percentage": 80.49, "elapsed_time": "13:42:46", "remaining_time": "3:19:29"} +{"current_steps": 830, "total_steps": 1030, "loss": 0.4009, "lr": 8.841776785894014e-06, "epoch": 4.028952554191299, "percentage": 80.58, "elapsed_time": "13:46:40", "remaining_time": "3:19:11"} +{"current_steps": 831, "total_steps": 1030, "loss": 0.3992, "lr": 8.756949314855565e-06, "epoch": 4.033803243898742, "percentage": 80.68, "elapsed_time": "13:50:33", "remaining_time": "3:18:53"} +{"current_steps": 832, "total_steps": 1030, "loss": 0.3919, "lr": 8.672480677576267e-06, "epoch": 4.038653933606184, "percentage": 80.78, "elapsed_time": "13:54:26", "remaining_time": "3:18:34"} +{"current_steps": 833, "total_steps": 1030, "loss": 0.3919, "lr": 8.58837184419821e-06, "epoch": 4.043504623313628, "percentage": 80.87, "elapsed_time": "13:58:20", "remaining_time": "3:18:15"} +{"current_steps": 834, "total_steps": 1030, "loss": 0.3921, "lr": 8.504623780731056e-06, "epoch": 4.04835531302107, "percentage": 80.97, "elapsed_time": "14:02:13", "remaining_time": "3:17:56"} +{"current_steps": 835, "total_steps": 1030, "loss": 0.3979, "lr": 8.421237449040962e-06, "epoch": 4.053206002728513, "percentage": 81.07, "elapsed_time": "14:06:06", "remaining_time": "3:17:35"} +{"current_steps": 836, "total_steps": 1030, "loss": 0.3948, "lr": 8.338213806839453e-06, "epoch": 4.058056692435955, "percentage": 81.17, "elapsed_time": "14:10:00", "remaining_time": "3:17:15"} +{"current_steps": 837, "total_steps": 1030, "loss": 0.3907, "lr": 8.255553807672547e-06, "epoch": 4.062907382143399, "percentage": 81.26, "elapsed_time": "14:13:54", "remaining_time": "3:16:53"} +{"current_steps": 838, "total_steps": 1030, "loss": 0.3905, "lr": 8.1732584009097e-06, "epoch": 4.067758071850841, "percentage": 81.36, "elapsed_time": "14:17:48", "remaining_time": "3:16:32"} +{"current_steps": 839, "total_steps": 1030, "loss": 0.3958, "lr": 8.091328531732925e-06, "epoch": 4.072608761558284, "percentage": 81.46, "elapsed_time": "14:21:41", "remaining_time": "3:16:09"} +{"current_steps": 840, "total_steps": 1030, "loss": 0.3919, "lr": 8.009765141126014e-06, "epoch": 4.077459451265727, "percentage": 81.55, "elapsed_time": "14:25:34", "remaining_time": "3:15:47"} +{"current_steps": 841, "total_steps": 1030, "loss": 0.3919, "lr": 7.928569165863584e-06, "epoch": 4.08231014097317, "percentage": 81.65, "elapsed_time": "14:29:27", "remaining_time": "3:15:23"} +{"current_steps": 842, "total_steps": 1030, "loss": 0.3875, "lr": 7.847741538500439e-06, "epoch": 4.087160830680612, "percentage": 81.75, "elapsed_time": "14:33:21", "remaining_time": "3:15:00"} +{"current_steps": 843, "total_steps": 1030, "loss": 0.3947, "lr": 7.767283187360846e-06, "epoch": 4.092011520388056, "percentage": 81.84, "elapsed_time": "14:37:14", "remaining_time": "3:14:35"} +{"current_steps": 844, "total_steps": 1030, "loss": 0.394, "lr": 7.687195036527813e-06, "epoch": 4.096862210095498, "percentage": 81.94, "elapsed_time": "14:41:08", "remaining_time": "3:14:11"} +{"current_steps": 845, "total_steps": 1030, "loss": 0.4012, "lr": 7.60747800583252e-06, "epoch": 4.101712899802941, "percentage": 82.04, "elapsed_time": "14:45:01", "remaining_time": "3:13:45"} +{"current_steps": 846, "total_steps": 1030, "loss": 0.3974, "lr": 7.52813301084375e-06, "epoch": 4.106563589510383, "percentage": 82.14, "elapsed_time": "14:48:54", "remaining_time": "3:13:19"} +{"current_steps": 847, "total_steps": 1030, "loss": 0.3947, "lr": 7.449160962857358e-06, "epoch": 4.1114142792178265, "percentage": 82.23, "elapsed_time": "14:52:48", "remaining_time": "3:12:53"} +{"current_steps": 848, "total_steps": 1030, "loss": 0.3959, "lr": 7.370562768885823e-06, "epoch": 4.116264968925269, "percentage": 82.33, "elapsed_time": "14:56:42", "remaining_time": "3:12:27"} +{"current_steps": 849, "total_steps": 1030, "loss": 0.3956, "lr": 7.292339331647848e-06, "epoch": 4.121115658632712, "percentage": 82.43, "elapsed_time": "15:00:34", "remaining_time": "3:11:59"} +{"current_steps": 850, "total_steps": 1030, "loss": 0.3992, "lr": 7.214491549557898e-06, "epoch": 4.125966348340155, "percentage": 82.52, "elapsed_time": "15:04:28", "remaining_time": "3:11:32"} +{"current_steps": 851, "total_steps": 1030, "loss": 0.3928, "lr": 7.1370203167160326e-06, "epoch": 4.1308170380475975, "percentage": 82.62, "elapsed_time": "15:08:22", "remaining_time": "3:11:04"} +{"current_steps": 852, "total_steps": 1030, "loss": 0.3972, "lr": 7.0599265228975e-06, "epoch": 4.13566772775504, "percentage": 82.72, "elapsed_time": "15:12:16", "remaining_time": "3:10:35"} +{"current_steps": 853, "total_steps": 1030, "loss": 0.402, "lr": 6.983211053542591e-06, "epoch": 4.1405184174624825, "percentage": 82.82, "elapsed_time": "15:16:10", "remaining_time": "3:10:06"} +{"current_steps": 854, "total_steps": 1030, "loss": 0.4034, "lr": 6.9068747897464535e-06, "epoch": 4.145369107169926, "percentage": 82.91, "elapsed_time": "15:20:04", "remaining_time": "3:09:37"} +{"current_steps": 855, "total_steps": 1030, "loss": 0.4021, "lr": 6.830918608248964e-06, "epoch": 4.150219796877368, "percentage": 83.01, "elapsed_time": "15:23:57", "remaining_time": "3:09:06"} +{"current_steps": 856, "total_steps": 1030, "loss": 0.397, "lr": 6.755343381424659e-06, "epoch": 4.155070486584811, "percentage": 83.11, "elapsed_time": "15:27:50", "remaining_time": "3:08:36"} +{"current_steps": 857, "total_steps": 1030, "loss": 0.3911, "lr": 6.68014997727275e-06, "epoch": 4.159921176292254, "percentage": 83.2, "elapsed_time": "15:31:44", "remaining_time": "3:08:05"} +{"current_steps": 858, "total_steps": 1030, "loss": 0.3898, "lr": 6.605339259407104e-06, "epoch": 4.164771865999697, "percentage": 83.3, "elapsed_time": "15:35:37", "remaining_time": "3:07:33"} +{"current_steps": 859, "total_steps": 1030, "loss": 0.3933, "lr": 6.530912087046317e-06, "epoch": 4.169622555707139, "percentage": 83.4, "elapsed_time": "15:39:30", "remaining_time": "3:07:01"} +{"current_steps": 860, "total_steps": 1030, "loss": 0.3962, "lr": 6.456869315003946e-06, "epoch": 4.174473245414583, "percentage": 83.5, "elapsed_time": "15:43:24", "remaining_time": "3:06:29"} +{"current_steps": 861, "total_steps": 1030, "loss": 0.3989, "lr": 6.3832117936785564e-06, "epoch": 4.179323935122025, "percentage": 83.59, "elapsed_time": "15:47:18", "remaining_time": "3:05:56"} +{"current_steps": 862, "total_steps": 1030, "loss": 0.3939, "lr": 6.309940369044047e-06, "epoch": 4.184174624829468, "percentage": 83.69, "elapsed_time": "15:51:12", "remaining_time": "3:05:23"} +{"current_steps": 863, "total_steps": 1030, "loss": 0.3907, "lr": 6.23705588263992e-06, "epoch": 4.18902531453691, "percentage": 83.79, "elapsed_time": "15:55:05", "remaining_time": "3:04:49"} +{"current_steps": 864, "total_steps": 1030, "loss": 0.3941, "lr": 6.164559171561553e-06, "epoch": 4.193876004244354, "percentage": 83.88, "elapsed_time": "15:59:00", "remaining_time": "3:04:15"} +{"current_steps": 865, "total_steps": 1030, "loss": 0.3982, "lr": 6.092451068450671e-06, "epoch": 4.198726693951796, "percentage": 83.98, "elapsed_time": "16:02:54", "remaining_time": "3:03:40"} +{"current_steps": 866, "total_steps": 1030, "loss": 0.3928, "lr": 6.020732401485751e-06, "epoch": 4.203577383659239, "percentage": 84.08, "elapsed_time": "16:06:49", "remaining_time": "3:03:05"} +{"current_steps": 867, "total_steps": 1030, "loss": 0.4001, "lr": 5.9494039943724845e-06, "epoch": 4.208428073366682, "percentage": 84.17, "elapsed_time": "16:10:42", "remaining_time": "3:02:29"} +{"current_steps": 868, "total_steps": 1030, "loss": 0.3977, "lr": 5.878466666334341e-06, "epoch": 4.213278763074125, "percentage": 84.27, "elapsed_time": "16:14:36", "remaining_time": "3:01:53"} +{"current_steps": 869, "total_steps": 1030, "loss": 0.3906, "lr": 5.80792123210316e-06, "epoch": 4.218129452781567, "percentage": 84.37, "elapsed_time": "16:18:30", "remaining_time": "3:01:17"} +{"current_steps": 870, "total_steps": 1030, "loss": 0.3952, "lr": 5.737768501909773e-06, "epoch": 4.2229801424890105, "percentage": 84.47, "elapsed_time": "16:22:23", "remaining_time": "3:00:40"} +{"current_steps": 871, "total_steps": 1030, "loss": 0.386, "lr": 5.668009281474751e-06, "epoch": 4.227830832196453, "percentage": 84.56, "elapsed_time": "16:26:17", "remaining_time": "3:00:02"} +{"current_steps": 872, "total_steps": 1030, "loss": 0.391, "lr": 5.598644371999085e-06, "epoch": 4.232681521903896, "percentage": 84.66, "elapsed_time": "16:30:11", "remaining_time": "2:59:24"} +{"current_steps": 873, "total_steps": 1030, "loss": 0.3947, "lr": 5.5296745701549906e-06, "epoch": 4.237532211611338, "percentage": 84.76, "elapsed_time": "16:34:05", "remaining_time": "2:58:46"} +{"current_steps": 874, "total_steps": 1030, "loss": 0.4001, "lr": 5.4611006680768305e-06, "epoch": 4.2423829013187815, "percentage": 84.85, "elapsed_time": "16:37:58", "remaining_time": "2:58:07"} +{"current_steps": 875, "total_steps": 1030, "loss": 0.3889, "lr": 5.3929234533519345e-06, "epoch": 4.247233591026224, "percentage": 84.95, "elapsed_time": "16:41:51", "remaining_time": "2:57:28"} +{"current_steps": 876, "total_steps": 1030, "loss": 0.3948, "lr": 5.325143709011587e-06, "epoch": 4.2520842807336665, "percentage": 85.05, "elapsed_time": "16:45:46", "remaining_time": "2:56:48"} +{"current_steps": 877, "total_steps": 1030, "loss": 0.3927, "lr": 5.257762213522055e-06, "epoch": 4.25693497044111, "percentage": 85.15, "elapsed_time": "16:49:39", "remaining_time": "2:56:08"} +{"current_steps": 878, "total_steps": 1030, "loss": 0.3904, "lr": 5.19077974077558e-06, "epoch": 4.261785660148552, "percentage": 85.24, "elapsed_time": "16:53:33", "remaining_time": "2:55:28"} +{"current_steps": 879, "total_steps": 1030, "loss": 0.3997, "lr": 5.124197060081564e-06, "epoch": 4.266636349855995, "percentage": 85.34, "elapsed_time": "16:57:26", "remaining_time": "2:54:46"} +{"current_steps": 880, "total_steps": 1030, "loss": 0.3971, "lr": 5.058014936157714e-06, "epoch": 4.271487039563438, "percentage": 85.44, "elapsed_time": "17:01:20", "remaining_time": "2:54:05"} +{"current_steps": 881, "total_steps": 1030, "loss": 0.4, "lr": 4.992234129121225e-06, "epoch": 4.276337729270881, "percentage": 85.53, "elapsed_time": "17:05:14", "remaining_time": "2:53:23"} +{"current_steps": 882, "total_steps": 1030, "loss": 0.3949, "lr": 4.926855394480079e-06, "epoch": 4.281188418978323, "percentage": 85.63, "elapsed_time": "17:09:06", "remaining_time": "2:52:41"} +{"current_steps": 883, "total_steps": 1030, "loss": 0.3896, "lr": 4.861879483124372e-06, "epoch": 4.286039108685766, "percentage": 85.73, "elapsed_time": "17:13:00", "remaining_time": "2:51:58"} +{"current_steps": 884, "total_steps": 1030, "loss": 0.3976, "lr": 4.797307141317666e-06, "epoch": 4.290889798393209, "percentage": 85.83, "elapsed_time": "17:16:53", "remaining_time": "2:51:15"} +{"current_steps": 885, "total_steps": 1030, "loss": 0.3951, "lr": 4.7331391106884364e-06, "epoch": 4.295740488100652, "percentage": 85.92, "elapsed_time": "17:20:46", "remaining_time": "2:50:31"} +{"current_steps": 886, "total_steps": 1030, "loss": 0.3923, "lr": 4.6693761282215766e-06, "epoch": 4.300591177808094, "percentage": 86.02, "elapsed_time": "17:24:40", "remaining_time": "2:49:47"} +{"current_steps": 887, "total_steps": 1030, "loss": 0.3894, "lr": 4.606018926249851e-06, "epoch": 4.305441867515538, "percentage": 86.12, "elapsed_time": "17:28:34", "remaining_time": "2:49:02"} +{"current_steps": 888, "total_steps": 1030, "loss": 0.3953, "lr": 4.543068232445596e-06, "epoch": 4.31029255722298, "percentage": 86.21, "elapsed_time": "17:32:26", "remaining_time": "2:48:17"} +{"current_steps": 889, "total_steps": 1030, "loss": 0.3959, "lr": 4.480524769812276e-06, "epoch": 4.315143246930423, "percentage": 86.31, "elapsed_time": "17:36:21", "remaining_time": "2:47:32"} +{"current_steps": 890, "total_steps": 1030, "loss": 0.3946, "lr": 4.418389256676206e-06, "epoch": 4.319993936637866, "percentage": 86.41, "elapsed_time": "17:40:14", "remaining_time": "2:46:46"} +{"current_steps": 891, "total_steps": 1030, "loss": 0.3885, "lr": 4.35666240667834e-06, "epoch": 4.324844626345309, "percentage": 86.5, "elapsed_time": "17:44:08", "remaining_time": "2:46:00"} +{"current_steps": 892, "total_steps": 1030, "loss": 0.3948, "lr": 4.295344928765999e-06, "epoch": 4.329695316052751, "percentage": 86.6, "elapsed_time": "17:48:02", "remaining_time": "2:45:14"} +{"current_steps": 893, "total_steps": 1030, "loss": 0.3992, "lr": 4.234437527184785e-06, "epoch": 4.334546005760194, "percentage": 86.7, "elapsed_time": "17:51:56", "remaining_time": "2:44:27"} +{"current_steps": 894, "total_steps": 1030, "loss": 0.3964, "lr": 4.173940901470488e-06, "epoch": 4.339396695467637, "percentage": 86.8, "elapsed_time": "17:55:49", "remaining_time": "2:43:39"} +{"current_steps": 895, "total_steps": 1030, "loss": 0.3882, "lr": 4.11385574644104e-06, "epoch": 4.34424738517508, "percentage": 86.89, "elapsed_time": "17:59:42", "remaining_time": "2:42:51"} +{"current_steps": 896, "total_steps": 1030, "loss": 0.3952, "lr": 4.054182752188501e-06, "epoch": 4.349098074882522, "percentage": 86.99, "elapsed_time": "18:03:36", "remaining_time": "2:42:03"} +{"current_steps": 897, "total_steps": 1030, "loss": 0.3935, "lr": 3.994922604071217e-06, "epoch": 4.3539487645899655, "percentage": 87.09, "elapsed_time": "18:07:30", "remaining_time": "2:41:14"} +{"current_steps": 898, "total_steps": 1030, "loss": 0.4, "lr": 3.936075982705871e-06, "epoch": 4.358799454297408, "percentage": 87.18, "elapsed_time": "18:11:24", "remaining_time": "2:40:25"} +{"current_steps": 899, "total_steps": 1030, "loss": 0.3986, "lr": 3.877643563959694e-06, "epoch": 4.3636501440048505, "percentage": 87.28, "elapsed_time": "18:15:18", "remaining_time": "2:39:36"} +{"current_steps": 900, "total_steps": 1030, "loss": 0.3963, "lr": 3.819626018942732e-06, "epoch": 4.368500833712293, "percentage": 87.38, "elapsed_time": "18:19:10", "remaining_time": "2:38:46"} +{"current_steps": 901, "total_steps": 1030, "loss": 0.3983, "lr": 3.762024014000054e-06, "epoch": 4.373351523419736, "percentage": 87.48, "elapsed_time": "18:23:02", "remaining_time": "2:37:55"} +{"current_steps": 902, "total_steps": 1030, "loss": 0.3844, "lr": 3.7048382107042113e-06, "epoch": 4.378202213127179, "percentage": 87.57, "elapsed_time": "18:26:56", "remaining_time": "2:37:04"} +{"current_steps": 903, "total_steps": 1030, "loss": 0.3922, "lr": 3.6480692658475446e-06, "epoch": 4.3830529028346215, "percentage": 87.67, "elapsed_time": "18:30:50", "remaining_time": "2:36:13"} +{"current_steps": 904, "total_steps": 1030, "loss": 0.3971, "lr": 3.5917178314346955e-06, "epoch": 4.387903592542065, "percentage": 87.77, "elapsed_time": "18:34:42", "remaining_time": "2:35:22"} +{"current_steps": 905, "total_steps": 1030, "loss": 0.395, "lr": 3.535784554675088e-06, "epoch": 4.392754282249507, "percentage": 87.86, "elapsed_time": "18:38:37", "remaining_time": "2:34:30"} +{"current_steps": 906, "total_steps": 1030, "loss": 0.3941, "lr": 3.480270077975525e-06, "epoch": 4.39760497195695, "percentage": 87.96, "elapsed_time": "18:42:30", "remaining_time": "2:33:37"} +{"current_steps": 907, "total_steps": 1030, "loss": 0.3884, "lr": 3.42517503893276e-06, "epoch": 4.402455661664393, "percentage": 88.06, "elapsed_time": "18:46:24", "remaining_time": "2:32:45"} +{"current_steps": 908, "total_steps": 1030, "loss": 0.3839, "lr": 3.370500070326257e-06, "epoch": 4.407306351371836, "percentage": 88.16, "elapsed_time": "18:50:18", "remaining_time": "2:31:52"} +{"current_steps": 909, "total_steps": 1030, "loss": 0.387, "lr": 3.3162458001108332e-06, "epoch": 4.412157041079278, "percentage": 88.25, "elapsed_time": "18:54:11", "remaining_time": "2:30:58"} +{"current_steps": 910, "total_steps": 1030, "loss": 0.391, "lr": 3.2624128514094778e-06, "epoch": 4.417007730786722, "percentage": 88.35, "elapsed_time": "18:58:04", "remaining_time": "2:30:04"} +{"current_steps": 911, "total_steps": 1030, "loss": 0.3939, "lr": 3.20900184250625e-06, "epoch": 4.421858420494164, "percentage": 88.45, "elapsed_time": "19:01:58", "remaining_time": "2:29:10"} +{"current_steps": 912, "total_steps": 1030, "loss": 0.4037, "lr": 3.1560133868390895e-06, "epoch": 4.426709110201607, "percentage": 88.54, "elapsed_time": "19:05:52", "remaining_time": "2:28:15"} +{"current_steps": 913, "total_steps": 1030, "loss": 0.3994, "lr": 3.1034480929928333e-06, "epoch": 4.431559799909049, "percentage": 88.64, "elapsed_time": "19:09:46", "remaining_time": "2:27:20"} +{"current_steps": 914, "total_steps": 1030, "loss": 0.3944, "lr": 3.0513065646921957e-06, "epoch": 4.436410489616493, "percentage": 88.74, "elapsed_time": "19:13:38", "remaining_time": "2:26:24"} +{"current_steps": 915, "total_steps": 1030, "loss": 0.394, "lr": 2.999589400794851e-06, "epoch": 4.441261179323935, "percentage": 88.83, "elapsed_time": "19:17:32", "remaining_time": "2:25:29"} +{"current_steps": 916, "total_steps": 1030, "loss": 0.3905, "lr": 2.948297195284546e-06, "epoch": 4.446111869031378, "percentage": 88.93, "elapsed_time": "19:21:25", "remaining_time": "2:24:32"} +{"current_steps": 917, "total_steps": 1030, "loss": 0.3948, "lr": 2.897430537264283e-06, "epoch": 4.450962558738821, "percentage": 89.03, "elapsed_time": "19:25:18", "remaining_time": "2:23:35"} +{"current_steps": 918, "total_steps": 1030, "loss": 0.3936, "lr": 2.8469900109495553e-06, "epoch": 4.455813248446264, "percentage": 89.13, "elapsed_time": "19:29:12", "remaining_time": "2:22:38"} +{"current_steps": 919, "total_steps": 1030, "loss": 0.3891, "lr": 2.79697619566162e-06, "epoch": 4.460663938153706, "percentage": 89.22, "elapsed_time": "19:33:06", "remaining_time": "2:21:41"} +{"current_steps": 920, "total_steps": 1030, "loss": 0.3912, "lr": 2.7473896658208743e-06, "epoch": 4.465514627861149, "percentage": 89.32, "elapsed_time": "19:36:58", "remaining_time": "2:20:43"} +{"current_steps": 921, "total_steps": 1030, "loss": 0.394, "lr": 2.6982309909402293e-06, "epoch": 4.470365317568592, "percentage": 89.42, "elapsed_time": "19:40:52", "remaining_time": "2:19:45"} +{"current_steps": 922, "total_steps": 1030, "loss": 0.3983, "lr": 2.649500735618582e-06, "epoch": 4.4752160072760345, "percentage": 89.51, "elapsed_time": "19:44:45", "remaining_time": "2:18:46"} +{"current_steps": 923, "total_steps": 1030, "loss": 0.3958, "lr": 2.6011994595343516e-06, "epoch": 4.480066696983477, "percentage": 89.61, "elapsed_time": "19:48:38", "remaining_time": "2:17:47"} +{"current_steps": 924, "total_steps": 1030, "loss": 0.3947, "lr": 2.5533277174389916e-06, "epoch": 4.48491738669092, "percentage": 89.71, "elapsed_time": "19:52:32", "remaining_time": "2:16:48"} +{"current_steps": 925, "total_steps": 1030, "loss": 0.3914, "lr": 2.5058860591506973e-06, "epoch": 4.489768076398363, "percentage": 89.81, "elapsed_time": "19:56:25", "remaining_time": "2:15:48"} +{"current_steps": 926, "total_steps": 1030, "loss": 0.3908, "lr": 2.4588750295480246e-06, "epoch": 4.4946187661058055, "percentage": 89.9, "elapsed_time": "20:00:18", "remaining_time": "2:14:48"} +{"current_steps": 927, "total_steps": 1030, "loss": 0.3899, "lr": 2.4122951685636674e-06, "epoch": 4.499469455813248, "percentage": 90.0, "elapsed_time": "20:04:12", "remaining_time": "2:13:48"} +{"current_steps": 928, "total_steps": 1030, "loss": 0.3984, "lr": 2.366147011178246e-06, "epoch": 4.504320145520691, "percentage": 90.1, "elapsed_time": "20:08:05", "remaining_time": "2:12:47"} +{"current_steps": 929, "total_steps": 1030, "loss": 0.3837, "lr": 2.320431087414159e-06, "epoch": 4.509170835228134, "percentage": 90.19, "elapsed_time": "20:11:58", "remaining_time": "2:11:45"} +{"current_steps": 930, "total_steps": 1030, "loss": 0.3924, "lr": 2.275147922329506e-06, "epoch": 4.514021524935576, "percentage": 90.29, "elapsed_time": "20:15:52", "remaining_time": "2:10:44"} +{"current_steps": 931, "total_steps": 1030, "loss": 0.3908, "lr": 2.230298036012055e-06, "epoch": 4.51887221464302, "percentage": 90.39, "elapsed_time": "20:19:45", "remaining_time": "2:09:42"} +{"current_steps": 932, "total_steps": 1030, "loss": 0.397, "lr": 2.1858819435732583e-06, "epoch": 4.523722904350462, "percentage": 90.49, "elapsed_time": "20:23:38", "remaining_time": "2:08:39"} +{"current_steps": 933, "total_steps": 1030, "loss": 0.3942, "lr": 2.141900155142351e-06, "epoch": 4.528573594057905, "percentage": 90.58, "elapsed_time": "20:27:30", "remaining_time": "2:07:37"} +{"current_steps": 934, "total_steps": 1030, "loss": 0.4008, "lr": 2.0983531758604726e-06, "epoch": 4.533424283765348, "percentage": 90.68, "elapsed_time": "20:31:24", "remaining_time": "2:06:34"} +{"current_steps": 935, "total_steps": 1030, "loss": 0.4009, "lr": 2.055241505874892e-06, "epoch": 4.538274973472791, "percentage": 90.78, "elapsed_time": "20:35:18", "remaining_time": "2:05:30"} +{"current_steps": 936, "total_steps": 1030, "loss": 0.3976, "lr": 2.0125656403332396e-06, "epoch": 4.543125663180233, "percentage": 90.87, "elapsed_time": "20:39:10", "remaining_time": "2:04:26"} +{"current_steps": 937, "total_steps": 1030, "loss": 0.3998, "lr": 1.970326069377828e-06, "epoch": 4.547976352887677, "percentage": 90.97, "elapsed_time": "20:43:04", "remaining_time": "2:03:22"} +{"current_steps": 938, "total_steps": 1030, "loss": 0.3948, "lr": 1.928523278140033e-06, "epoch": 4.552827042595119, "percentage": 91.07, "elapsed_time": "20:46:57", "remaining_time": "2:02:18"} +{"current_steps": 939, "total_steps": 1030, "loss": 0.3971, "lr": 1.887157746734718e-06, "epoch": 4.557677732302562, "percentage": 91.17, "elapsed_time": "20:50:50", "remaining_time": "2:01:13"} +{"current_steps": 940, "total_steps": 1030, "loss": 0.3902, "lr": 1.846229950254692e-06, "epoch": 4.562528422010004, "percentage": 91.26, "elapsed_time": "20:54:44", "remaining_time": "2:00:08"} +{"current_steps": 941, "total_steps": 1030, "loss": 0.3869, "lr": 1.8057403587652977e-06, "epoch": 4.567379111717448, "percentage": 91.36, "elapsed_time": "20:58:36", "remaining_time": "1:59:02"} +{"current_steps": 942, "total_steps": 1030, "loss": 0.4004, "lr": 1.7656894372989785e-06, "epoch": 4.57222980142489, "percentage": 91.46, "elapsed_time": "21:02:29", "remaining_time": "1:57:56"} +{"current_steps": 943, "total_steps": 1030, "loss": 0.4041, "lr": 1.726077645849955e-06, "epoch": 4.577080491132333, "percentage": 91.55, "elapsed_time": "21:06:22", "remaining_time": "1:56:50"} +{"current_steps": 944, "total_steps": 1030, "loss": 0.3938, "lr": 1.6869054393689265e-06, "epoch": 4.581931180839776, "percentage": 91.65, "elapsed_time": "21:10:14", "remaining_time": "1:55:43"} +{"current_steps": 945, "total_steps": 1030, "loss": 0.4032, "lr": 1.6481732677578798e-06, "epoch": 4.5867818705472185, "percentage": 91.75, "elapsed_time": "21:14:08", "remaining_time": "1:54:36"} +{"current_steps": 946, "total_steps": 1030, "loss": 0.378, "lr": 1.60988157586488e-06, "epoch": 4.591632560254661, "percentage": 91.84, "elapsed_time": "21:18:01", "remaining_time": "1:53:28"} +{"current_steps": 947, "total_steps": 1030, "loss": 0.3904, "lr": 1.5720308034789721e-06, "epoch": 4.596483249962104, "percentage": 91.94, "elapsed_time": "21:21:54", "remaining_time": "1:52:21"} +{"current_steps": 948, "total_steps": 1030, "loss": 0.3999, "lr": 1.5346213853251546e-06, "epoch": 4.601333939669547, "percentage": 92.04, "elapsed_time": "21:25:48", "remaining_time": "1:51:13"} +{"current_steps": 949, "total_steps": 1030, "loss": 0.3981, "lr": 1.4976537510593646e-06, "epoch": 4.6061846293769895, "percentage": 92.14, "elapsed_time": "21:29:41", "remaining_time": "1:50:04"} +{"current_steps": 950, "total_steps": 1030, "loss": 0.4038, "lr": 1.4611283252635412e-06, "epoch": 4.611035319084432, "percentage": 92.23, "elapsed_time": "21:33:33", "remaining_time": "1:48:55"} +{"current_steps": 951, "total_steps": 1030, "loss": 0.3963, "lr": 1.425045527440756e-06, "epoch": 4.615886008791875, "percentage": 92.33, "elapsed_time": "21:37:27", "remaining_time": "1:47:46"} +{"current_steps": 952, "total_steps": 1030, "loss": 0.399, "lr": 1.3894057720104104e-06, "epoch": 4.620736698499318, "percentage": 92.43, "elapsed_time": "21:41:20", "remaining_time": "1:46:37"} +{"current_steps": 953, "total_steps": 1030, "loss": 0.3838, "lr": 1.354209468303429e-06, "epoch": 4.62558738820676, "percentage": 92.52, "elapsed_time": "21:45:14", "remaining_time": "1:45:27"} +{"current_steps": 954, "total_steps": 1030, "loss": 0.3934, "lr": 1.3194570205576284e-06, "epoch": 4.630438077914204, "percentage": 92.62, "elapsed_time": "21:49:06", "remaining_time": "1:44:17"} +{"current_steps": 955, "total_steps": 1030, "loss": 0.3885, "lr": 1.2851488279130053e-06, "epoch": 4.635288767621646, "percentage": 92.72, "elapsed_time": "21:53:00", "remaining_time": "1:43:06"} +{"current_steps": 956, "total_steps": 1030, "loss": 0.3943, "lr": 1.2512852844071933e-06, "epoch": 4.640139457329089, "percentage": 92.82, "elapsed_time": "21:56:53", "remaining_time": "1:41:56"} +{"current_steps": 957, "total_steps": 1030, "loss": 0.3928, "lr": 1.2178667789709287e-06, "epoch": 4.644990147036532, "percentage": 92.91, "elapsed_time": "22:00:46", "remaining_time": "1:40:44"} +{"current_steps": 958, "total_steps": 1030, "loss": 0.3952, "lr": 1.1848936954235702e-06, "epoch": 4.649840836743975, "percentage": 93.01, "elapsed_time": "22:04:40", "remaining_time": "1:39:33"} +{"current_steps": 959, "total_steps": 1030, "loss": 0.4, "lr": 1.1523664124687284e-06, "epoch": 4.654691526451417, "percentage": 93.11, "elapsed_time": "22:08:34", "remaining_time": "1:38:21"} +{"current_steps": 960, "total_steps": 1030, "loss": 0.3981, "lr": 1.1202853036898476e-06, "epoch": 4.65954221615886, "percentage": 93.2, "elapsed_time": "22:12:27", "remaining_time": "1:37:09"} +{"current_steps": 961, "total_steps": 1030, "loss": 0.3984, "lr": 1.0886507375459908e-06, "epoch": 4.664392905866303, "percentage": 93.3, "elapsed_time": "22:16:21", "remaining_time": "1:35:57"} +{"current_steps": 962, "total_steps": 1030, "loss": 0.3848, "lr": 1.0574630773675687e-06, "epoch": 4.669243595573746, "percentage": 93.4, "elapsed_time": "22:20:15", "remaining_time": "1:34:44"} +{"current_steps": 963, "total_steps": 1030, "loss": 0.3852, "lr": 1.0267226813521635e-06, "epoch": 4.674094285281188, "percentage": 93.5, "elapsed_time": "22:24:09", "remaining_time": "1:33:31"} +{"current_steps": 964, "total_steps": 1030, "loss": 0.3943, "lr": 9.964299025604274e-07, "epoch": 4.678944974988632, "percentage": 93.59, "elapsed_time": "22:28:02", "remaining_time": "1:32:17"} +{"current_steps": 965, "total_steps": 1030, "loss": 0.3962, "lr": 9.66585088912022e-07, "epoch": 4.683795664696074, "percentage": 93.69, "elapsed_time": "22:31:56", "remaining_time": "1:31:03"} +{"current_steps": 966, "total_steps": 1030, "loss": 0.3942, "lr": 9.371885831816319e-07, "epoch": 4.688646354403517, "percentage": 93.79, "elapsed_time": "22:35:49", "remaining_time": "1:29:49"} +{"current_steps": 967, "total_steps": 1030, "loss": 0.3989, "lr": 9.082407229950018e-07, "epoch": 4.693497044110959, "percentage": 93.88, "elapsed_time": "22:39:42", "remaining_time": "1:28:35"} +{"current_steps": 968, "total_steps": 1030, "loss": 0.3919, "lr": 8.797418408251101e-07, "epoch": 4.6983477338184025, "percentage": 93.98, "elapsed_time": "22:43:36", "remaining_time": "1:27:20"} +{"current_steps": 969, "total_steps": 1030, "loss": 0.3911, "lr": 8.516922639882819e-07, "epoch": 4.703198423525845, "percentage": 94.08, "elapsed_time": "22:47:29", "remaining_time": "1:26:05"} +{"current_steps": 970, "total_steps": 1030, "loss": 0.3897, "lr": 8.2409231464049e-07, "epoch": 4.708049113233288, "percentage": 94.17, "elapsed_time": "22:51:22", "remaining_time": "1:24:49"} +{"current_steps": 971, "total_steps": 1030, "loss": 0.3925, "lr": 7.969423097736162e-07, "epoch": 4.712899802940731, "percentage": 94.27, "elapsed_time": "22:55:16", "remaining_time": "1:23:33"} +{"current_steps": 972, "total_steps": 1030, "loss": 0.3967, "lr": 7.702425612118269e-07, "epoch": 4.7177504926481735, "percentage": 94.37, "elapsed_time": "22:59:09", "remaining_time": "1:22:17"} +{"current_steps": 973, "total_steps": 1030, "loss": 0.3905, "lr": 7.439933756079942e-07, "epoch": 4.722601182355616, "percentage": 94.47, "elapsed_time": "23:03:02", "remaining_time": "1:21:01"} +{"current_steps": 974, "total_steps": 1030, "loss": 0.3932, "lr": 7.181950544401695e-07, "epoch": 4.7274518720630585, "percentage": 94.56, "elapsed_time": "23:06:56", "remaining_time": "1:19:44"} +{"current_steps": 975, "total_steps": 1030, "loss": 0.3995, "lr": 6.928478940081107e-07, "epoch": 4.732302561770502, "percentage": 94.66, "elapsed_time": "23:10:49", "remaining_time": "1:18:27"} +{"current_steps": 976, "total_steps": 1030, "loss": 0.3917, "lr": 6.679521854299032e-07, "epoch": 4.737153251477944, "percentage": 94.76, "elapsed_time": "23:14:42", "remaining_time": "1:17:09"} +{"current_steps": 977, "total_steps": 1030, "loss": 0.3929, "lr": 6.435082146385885e-07, "epoch": 4.742003941185387, "percentage": 94.85, "elapsed_time": "23:18:36", "remaining_time": "1:15:52"} +{"current_steps": 978, "total_steps": 1030, "loss": 0.3906, "lr": 6.195162623789052e-07, "epoch": 4.74685463089283, "percentage": 94.95, "elapsed_time": "23:22:29", "remaining_time": "1:14:34"} +{"current_steps": 979, "total_steps": 1030, "loss": 0.3879, "lr": 5.959766042040426e-07, "epoch": 4.751705320600273, "percentage": 95.05, "elapsed_time": "23:26:22", "remaining_time": "1:13:15"} +{"current_steps": 980, "total_steps": 1030, "loss": 0.3953, "lr": 5.728895104724963e-07, "epoch": 4.756556010307715, "percentage": 95.15, "elapsed_time": "23:30:16", "remaining_time": "1:11:57"} +{"current_steps": 981, "total_steps": 1030, "loss": 0.3991, "lr": 5.502552463449418e-07, "epoch": 4.761406700015159, "percentage": 95.24, "elapsed_time": "23:34:10", "remaining_time": "1:10:38"} +{"current_steps": 982, "total_steps": 1030, "loss": 0.3975, "lr": 5.280740717812149e-07, "epoch": 4.766257389722601, "percentage": 95.34, "elapsed_time": "23:38:02", "remaining_time": "1:09:18"} +{"current_steps": 983, "total_steps": 1030, "loss": 0.3957, "lr": 5.063462415372967e-07, "epoch": 4.771108079430044, "percentage": 95.44, "elapsed_time": "23:41:56", "remaining_time": "1:07:59"} +{"current_steps": 984, "total_steps": 1030, "loss": 0.3919, "lr": 4.850720051624124e-07, "epoch": 4.775958769137487, "percentage": 95.53, "elapsed_time": "23:45:49", "remaining_time": "1:06:39"} +{"current_steps": 985, "total_steps": 1030, "loss": 0.3909, "lr": 4.642516069961556e-07, "epoch": 4.78080945884493, "percentage": 95.63, "elapsed_time": "23:49:42", "remaining_time": "1:05:18"} +{"current_steps": 986, "total_steps": 1030, "loss": 0.3945, "lr": 4.438852861656751e-07, "epoch": 4.785660148552372, "percentage": 95.73, "elapsed_time": "23:53:36", "remaining_time": "1:03:58"} +{"current_steps": 825, "total_steps": 1030, "loss": 0.4032, "lr": 9.271262404637835e-06, "epoch": 4.0048506897074425, "percentage": 80.1, "elapsed_time": "0:04:11", "remaining_time": "0:01:02"} +{"current_steps": 826, "total_steps": 1030, "loss": 0.3988, "lr": 9.184655460787591e-06, "epoch": 4.009701379414886, "percentage": 80.19, "elapsed_time": "0:08:05", "remaining_time": "0:01:59"} +{"current_steps": 827, "total_steps": 1030, "loss": 0.3943, "lr": 9.098402438391161e-06, "epoch": 4.014552069122328, "percentage": 80.29, "elapsed_time": "0:11:58", "remaining_time": "0:02:56"} +{"current_steps": 828, "total_steps": 1030, "loss": 0.4024, "lr": 9.012504328084724e-06, "epoch": 4.019402758829771, "percentage": 80.39, "elapsed_time": "0:15:51", "remaining_time": "0:03:52"} +{"current_steps": 829, "total_steps": 1030, "loss": 0.4, "lr": 8.926962116428228e-06, "epoch": 4.0242534485372135, "percentage": 80.49, "elapsed_time": "0:19:45", "remaining_time": "0:04:47"} +{"current_steps": 830, "total_steps": 1030, "loss": 0.3994, "lr": 8.841776785894014e-06, "epoch": 4.029104138244657, "percentage": 80.58, "elapsed_time": "0:23:39", "remaining_time": "0:05:42"} +{"current_steps": 831, "total_steps": 1030, "loss": 0.3977, "lr": 8.756949314855565e-06, "epoch": 4.033954827952099, "percentage": 80.68, "elapsed_time": "0:27:33", "remaining_time": "0:06:35"} +{"current_steps": 832, "total_steps": 1030, "loss": 0.3906, "lr": 8.672480677576267e-06, "epoch": 4.038805517659542, "percentage": 80.78, "elapsed_time": "0:31:26", "remaining_time": "0:07:28"} +{"current_steps": 833, "total_steps": 1030, "loss": 0.388, "lr": 8.58837184419821e-06, "epoch": 4.043656207366985, "percentage": 80.87, "elapsed_time": "0:35:19", "remaining_time": "0:08:21"} +{"current_steps": 834, "total_steps": 1030, "loss": 0.3918, "lr": 8.504623780731056e-06, "epoch": 4.048506897074428, "percentage": 80.97, "elapsed_time": "0:39:13", "remaining_time": "0:09:13"} +{"current_steps": 835, "total_steps": 1030, "loss": 0.397, "lr": 8.421237449040962e-06, "epoch": 4.05335758678187, "percentage": 81.07, "elapsed_time": "0:43:07", "remaining_time": "0:10:04"} +{"current_steps": 836, "total_steps": 1030, "loss": 0.393, "lr": 8.338213806839453e-06, "epoch": 4.058208276489314, "percentage": 81.17, "elapsed_time": "0:47:01", "remaining_time": "0:10:54"} +{"current_steps": 837, "total_steps": 1030, "loss": 0.3897, "lr": 8.255553807672547e-06, "epoch": 4.063058966196756, "percentage": 81.26, "elapsed_time": "0:50:55", "remaining_time": "0:11:44"} +{"current_steps": 838, "total_steps": 1030, "loss": 0.3882, "lr": 8.1732584009097e-06, "epoch": 4.067909655904199, "percentage": 81.36, "elapsed_time": "0:54:49", "remaining_time": "0:12:33"} +{"current_steps": 839, "total_steps": 1030, "loss": 0.3959, "lr": 8.091328531732925e-06, "epoch": 4.072760345611641, "percentage": 81.46, "elapsed_time": "0:58:43", "remaining_time": "0:13:22"} +{"current_steps": 840, "total_steps": 1030, "loss": 0.3891, "lr": 8.009765141126014e-06, "epoch": 4.077611035319085, "percentage": 81.55, "elapsed_time": "1:02:37", "remaining_time": "0:14:09"} +{"current_steps": 841, "total_steps": 1030, "loss": 0.3909, "lr": 7.928569165863584e-06, "epoch": 4.082461725026527, "percentage": 81.65, "elapsed_time": "1:06:31", "remaining_time": "0:14:57"} +{"current_steps": 842, "total_steps": 1030, "loss": 0.3875, "lr": 7.847741538500439e-06, "epoch": 4.08731241473397, "percentage": 81.75, "elapsed_time": "1:10:25", "remaining_time": "0:15:43"} +{"current_steps": 843, "total_steps": 1030, "loss": 0.3929, "lr": 7.767283187360846e-06, "epoch": 4.092163104441413, "percentage": 81.84, "elapsed_time": "1:14:18", "remaining_time": "0:16:29"} +{"current_steps": 844, "total_steps": 1030, "loss": 0.3928, "lr": 7.687195036527813e-06, "epoch": 4.097013794148856, "percentage": 81.94, "elapsed_time": "1:18:13", "remaining_time": "0:17:14"} +{"current_steps": 845, "total_steps": 1030, "loss": 0.4002, "lr": 7.60747800583252e-06, "epoch": 4.101864483856298, "percentage": 82.04, "elapsed_time": "1:22:06", "remaining_time": "0:17:58"} +{"current_steps": 846, "total_steps": 1030, "loss": 0.3961, "lr": 7.52813301084375e-06, "epoch": 4.1067151735637415, "percentage": 82.14, "elapsed_time": "1:25:59", "remaining_time": "0:18:42"} +{"current_steps": 847, "total_steps": 1030, "loss": 0.3946, "lr": 7.449160962857358e-06, "epoch": 4.111565863271184, "percentage": 82.23, "elapsed_time": "1:29:56", "remaining_time": "0:19:25"} +{"current_steps": 848, "total_steps": 1030, "loss": 0.3937, "lr": 7.370562768885823e-06, "epoch": 4.1164165529786265, "percentage": 82.33, "elapsed_time": "1:33:49", "remaining_time": "0:20:08"} +{"current_steps": 849, "total_steps": 1030, "loss": 0.3957, "lr": 7.292339331647848e-06, "epoch": 4.121267242686069, "percentage": 82.43, "elapsed_time": "1:37:43", "remaining_time": "0:20:50"} +{"current_steps": 850, "total_steps": 1030, "loss": 0.3969, "lr": 7.214491549557898e-06, "epoch": 4.126117932393512, "percentage": 82.52, "elapsed_time": "1:41:35", "remaining_time": "0:21:30"} +{"current_steps": 851, "total_steps": 1030, "loss": 0.3937, "lr": 7.1370203167160326e-06, "epoch": 4.130968622100955, "percentage": 82.62, "elapsed_time": "1:45:29", "remaining_time": "0:22:11"} +{"current_steps": 852, "total_steps": 1030, "loss": 0.3965, "lr": 7.0599265228975e-06, "epoch": 4.1358193118083975, "percentage": 82.72, "elapsed_time": "1:49:23", "remaining_time": "0:22:51"} +{"current_steps": 853, "total_steps": 1030, "loss": 0.4008, "lr": 6.983211053542591e-06, "epoch": 4.140670001515841, "percentage": 82.82, "elapsed_time": "1:53:17", "remaining_time": "0:23:30"} +{"current_steps": 854, "total_steps": 1030, "loss": 0.4032, "lr": 6.9068747897464535e-06, "epoch": 4.145520691223283, "percentage": 82.91, "elapsed_time": "1:57:10", "remaining_time": "0:24:09"} +{"current_steps": 855, "total_steps": 1030, "loss": 0.4002, "lr": 6.830918608248964e-06, "epoch": 4.150371380930726, "percentage": 83.01, "elapsed_time": "2:01:04", "remaining_time": "0:24:46"} +{"current_steps": 856, "total_steps": 1030, "loss": 0.3976, "lr": 6.755343381424659e-06, "epoch": 4.155222070638169, "percentage": 83.11, "elapsed_time": "2:04:58", "remaining_time": "0:25:24"} +{"current_steps": 857, "total_steps": 1030, "loss": 0.3921, "lr": 6.68014997727275e-06, "epoch": 4.160072760345612, "percentage": 83.2, "elapsed_time": "2:08:52", "remaining_time": "0:26:00"} +{"current_steps": 858, "total_steps": 1030, "loss": 0.3852, "lr": 6.605339259407104e-06, "epoch": 4.164923450053054, "percentage": 83.3, "elapsed_time": "2:12:45", "remaining_time": "0:26:36"} +{"current_steps": 859, "total_steps": 1030, "loss": 0.395, "lr": 6.530912087046317e-06, "epoch": 4.169774139760497, "percentage": 83.4, "elapsed_time": "2:16:39", "remaining_time": "0:27:12"} +{"current_steps": 860, "total_steps": 1030, "loss": 0.3941, "lr": 6.456869315003946e-06, "epoch": 4.17462482946794, "percentage": 83.5, "elapsed_time": "2:20:32", "remaining_time": "0:27:46"} +{"current_steps": 861, "total_steps": 1030, "loss": 0.3997, "lr": 6.3832117936785564e-06, "epoch": 4.179475519175383, "percentage": 83.59, "elapsed_time": "2:24:26", "remaining_time": "0:28:21"} +{"current_steps": 862, "total_steps": 1030, "loss": 0.3945, "lr": 6.309940369044047e-06, "epoch": 4.184326208882825, "percentage": 83.69, "elapsed_time": "2:28:19", "remaining_time": "0:28:54"} +{"current_steps": 863, "total_steps": 1030, "loss": 0.3881, "lr": 6.23705588263992e-06, "epoch": 4.189176898590269, "percentage": 83.79, "elapsed_time": "2:32:13", "remaining_time": "0:29:27"} +{"current_steps": 864, "total_steps": 1030, "loss": 0.3957, "lr": 6.164559171561553e-06, "epoch": 4.194027588297711, "percentage": 83.88, "elapsed_time": "2:36:07", "remaining_time": "0:29:59"} +{"current_steps": 865, "total_steps": 1030, "loss": 0.3969, "lr": 6.092451068450671e-06, "epoch": 4.198878278005154, "percentage": 83.98, "elapsed_time": "2:40:01", "remaining_time": "0:30:31"} +{"current_steps": 866, "total_steps": 1030, "loss": 0.3896, "lr": 6.020732401485751e-06, "epoch": 4.203728967712596, "percentage": 84.08, "elapsed_time": "2:43:54", "remaining_time": "0:31:02"} +{"current_steps": 867, "total_steps": 1030, "loss": 0.4025, "lr": 5.9494039943724845e-06, "epoch": 4.20857965742004, "percentage": 84.17, "elapsed_time": "2:47:47", "remaining_time": "0:31:32"} +{"current_steps": 868, "total_steps": 1030, "loss": 0.3954, "lr": 5.878466666334341e-06, "epoch": 4.213430347127482, "percentage": 84.27, "elapsed_time": "2:51:41", "remaining_time": "0:32:02"} +{"current_steps": 869, "total_steps": 1030, "loss": 0.391, "lr": 5.80792123210316e-06, "epoch": 4.218281036834925, "percentage": 84.37, "elapsed_time": "2:55:35", "remaining_time": "0:32:31"} +{"current_steps": 870, "total_steps": 1030, "loss": 0.3965, "lr": 5.737768501909773e-06, "epoch": 4.223131726542368, "percentage": 84.47, "elapsed_time": "2:59:29", "remaining_time": "0:33:00"} +{"current_steps": 871, "total_steps": 1030, "loss": 0.3846, "lr": 5.668009281474751e-06, "epoch": 4.2279824162498105, "percentage": 84.56, "elapsed_time": "3:03:22", "remaining_time": "0:33:28"} +{"current_steps": 872, "total_steps": 1030, "loss": 0.3919, "lr": 5.598644371999085e-06, "epoch": 4.232833105957253, "percentage": 84.66, "elapsed_time": "3:07:15", "remaining_time": "0:33:55"} +{"current_steps": 873, "total_steps": 1030, "loss": 0.394, "lr": 5.5296745701549906e-06, "epoch": 4.237683795664696, "percentage": 84.76, "elapsed_time": "3:11:07", "remaining_time": "0:34:22"} +{"current_steps": 874, "total_steps": 1030, "loss": 0.3994, "lr": 5.4611006680768305e-06, "epoch": 4.242534485372139, "percentage": 84.85, "elapsed_time": "3:15:01", "remaining_time": "0:34:48"} +{"current_steps": 875, "total_steps": 1030, "loss": 0.388, "lr": 5.3929234533519345e-06, "epoch": 4.2473851750795815, "percentage": 84.95, "elapsed_time": "3:18:55", "remaining_time": "0:35:14"} +{"current_steps": 876, "total_steps": 1030, "loss": 0.3942, "lr": 5.325143709011587e-06, "epoch": 4.252235864787025, "percentage": 85.05, "elapsed_time": "3:22:49", "remaining_time": "0:35:39"} +{"current_steps": 877, "total_steps": 1030, "loss": 0.3907, "lr": 5.257762213522055e-06, "epoch": 4.257086554494467, "percentage": 85.15, "elapsed_time": "3:26:43", "remaining_time": "0:36:03"} +{"current_steps": 878, "total_steps": 1030, "loss": 0.3927, "lr": 5.19077974077558e-06, "epoch": 4.26193724420191, "percentage": 85.24, "elapsed_time": "3:30:37", "remaining_time": "0:36:27"} +{"current_steps": 879, "total_steps": 1030, "loss": 0.3981, "lr": 5.124197060081564e-06, "epoch": 4.266787933909352, "percentage": 85.34, "elapsed_time": "3:34:30", "remaining_time": "0:36:50"} +{"current_steps": 880, "total_steps": 1030, "loss": 0.3987, "lr": 5.058014936157714e-06, "epoch": 4.271638623616796, "percentage": 85.44, "elapsed_time": "3:38:23", "remaining_time": "0:37:13"} +{"current_steps": 881, "total_steps": 1030, "loss": 0.3993, "lr": 4.992234129121225e-06, "epoch": 4.276489313324238, "percentage": 85.53, "elapsed_time": "3:42:17", "remaining_time": "0:37:35"} +{"current_steps": 882, "total_steps": 1030, "loss": 0.394, "lr": 4.926855394480079e-06, "epoch": 4.281340003031681, "percentage": 85.63, "elapsed_time": "3:46:11", "remaining_time": "0:37:57"} +{"current_steps": 883, "total_steps": 1030, "loss": 0.3888, "lr": 4.861879483124372e-06, "epoch": 4.286190692739124, "percentage": 85.73, "elapsed_time": "3:50:04", "remaining_time": "0:38:18"} +{"current_steps": 884, "total_steps": 1030, "loss": 0.3978, "lr": 4.797307141317666e-06, "epoch": 4.291041382446567, "percentage": 85.83, "elapsed_time": "3:53:57", "remaining_time": "0:38:38"} +{"current_steps": 885, "total_steps": 1030, "loss": 0.3949, "lr": 4.7331391106884364e-06, "epoch": 4.295892072154009, "percentage": 85.92, "elapsed_time": "3:57:50", "remaining_time": "0:38:58"} +{"current_steps": 886, "total_steps": 1030, "loss": 0.3922, "lr": 4.6693761282215766e-06, "epoch": 4.300742761861452, "percentage": 86.02, "elapsed_time": "4:01:43", "remaining_time": "0:39:17"} +{"current_steps": 887, "total_steps": 1030, "loss": 0.389, "lr": 4.606018926249851e-06, "epoch": 4.305593451568895, "percentage": 86.12, "elapsed_time": "4:05:37", "remaining_time": "0:39:35"} +{"current_steps": 888, "total_steps": 1030, "loss": 0.3956, "lr": 4.543068232445596e-06, "epoch": 4.310444141276338, "percentage": 86.21, "elapsed_time": "4:09:30", "remaining_time": "0:39:53"} +{"current_steps": 889, "total_steps": 1030, "loss": 0.3938, "lr": 4.480524769812276e-06, "epoch": 4.31529483098378, "percentage": 86.31, "elapsed_time": "4:13:23", "remaining_time": "0:40:11"} +{"current_steps": 890, "total_steps": 1030, "loss": 0.3947, "lr": 4.418389256676206e-06, "epoch": 4.320145520691224, "percentage": 86.41, "elapsed_time": "4:17:17", "remaining_time": "0:40:28"} +{"current_steps": 891, "total_steps": 1030, "loss": 0.3907, "lr": 4.35666240667834e-06, "epoch": 4.324996210398666, "percentage": 86.5, "elapsed_time": "4:21:10", "remaining_time": "0:40:44"} +{"current_steps": 892, "total_steps": 1030, "loss": 0.3939, "lr": 4.295344928765999e-06, "epoch": 4.329846900106109, "percentage": 86.6, "elapsed_time": "4:25:03", "remaining_time": "0:41:00"} +{"current_steps": 893, "total_steps": 1030, "loss": 0.3985, "lr": 4.234437527184785e-06, "epoch": 4.334697589813552, "percentage": 86.7, "elapsed_time": "4:28:57", "remaining_time": "0:41:15"} +{"current_steps": 894, "total_steps": 1030, "loss": 0.395, "lr": 4.173940901470488e-06, "epoch": 4.3395482795209945, "percentage": 86.8, "elapsed_time": "4:32:50", "remaining_time": "0:41:30"} +{"current_steps": 895, "total_steps": 1030, "loss": 0.39, "lr": 4.11385574644104e-06, "epoch": 4.344398969228437, "percentage": 86.89, "elapsed_time": "4:36:43", "remaining_time": "0:41:44"} +{"current_steps": 896, "total_steps": 1030, "loss": 0.3948, "lr": 4.054182752188501e-06, "epoch": 4.34924965893588, "percentage": 86.99, "elapsed_time": "4:40:37", "remaining_time": "0:41:58"} +{"current_steps": 897, "total_steps": 1030, "loss": 0.3941, "lr": 3.994922604071217e-06, "epoch": 4.354100348643323, "percentage": 87.09, "elapsed_time": "4:44:31", "remaining_time": "0:42:11"} +{"current_steps": 898, "total_steps": 1030, "loss": 0.3982, "lr": 3.936075982705871e-06, "epoch": 4.3589510383507655, "percentage": 87.18, "elapsed_time": "4:48:26", "remaining_time": "0:42:23"} +{"current_steps": 899, "total_steps": 1030, "loss": 0.3986, "lr": 3.877643563959694e-06, "epoch": 4.363801728058208, "percentage": 87.28, "elapsed_time": "4:52:19", "remaining_time": "0:42:35"} +{"current_steps": 900, "total_steps": 1030, "loss": 0.3962, "lr": 3.819626018942732e-06, "epoch": 4.368652417765651, "percentage": 87.38, "elapsed_time": "4:56:13", "remaining_time": "0:42:47"} +{"current_steps": 901, "total_steps": 1030, "loss": 0.3974, "lr": 3.762024014000054e-06, "epoch": 4.373503107473094, "percentage": 87.48, "elapsed_time": "5:00:07", "remaining_time": "0:42:58"} +{"current_steps": 902, "total_steps": 1030, "loss": 0.3849, "lr": 3.7048382107042113e-06, "epoch": 4.378353797180536, "percentage": 87.57, "elapsed_time": "5:04:01", "remaining_time": "0:43:08"} +{"current_steps": 903, "total_steps": 1030, "loss": 0.3908, "lr": 3.6480692658475446e-06, "epoch": 4.38320448688798, "percentage": 87.67, "elapsed_time": "5:07:54", "remaining_time": "0:43:18"} +{"current_steps": 904, "total_steps": 1030, "loss": 0.398, "lr": 3.5917178314346955e-06, "epoch": 4.388055176595422, "percentage": 87.77, "elapsed_time": "5:11:47", "remaining_time": "0:43:27"} +{"current_steps": 905, "total_steps": 1030, "loss": 0.3941, "lr": 3.535784554675088e-06, "epoch": 4.392905866302865, "percentage": 87.86, "elapsed_time": "5:15:39", "remaining_time": "0:43:36"} +{"current_steps": 906, "total_steps": 1030, "loss": 0.395, "lr": 3.480270077975525e-06, "epoch": 4.397756556010307, "percentage": 87.96, "elapsed_time": "5:19:33", "remaining_time": "0:43:44"} +{"current_steps": 907, "total_steps": 1030, "loss": 0.3879, "lr": 3.42517503893276e-06, "epoch": 4.402607245717751, "percentage": 88.06, "elapsed_time": "5:23:26", "remaining_time": "0:43:51"} +{"current_steps": 908, "total_steps": 1030, "loss": 0.3832, "lr": 3.370500070326257e-06, "epoch": 4.407457935425193, "percentage": 88.16, "elapsed_time": "5:27:19", "remaining_time": "0:43:58"} +{"current_steps": 909, "total_steps": 1030, "loss": 0.3858, "lr": 3.3162458001108332e-06, "epoch": 4.412308625132636, "percentage": 88.25, "elapsed_time": "5:31:13", "remaining_time": "0:44:05"} +{"current_steps": 910, "total_steps": 1030, "loss": 0.3923, "lr": 3.2624128514094778e-06, "epoch": 4.417159314840079, "percentage": 88.35, "elapsed_time": "5:35:06", "remaining_time": "0:44:11"} +{"current_steps": 911, "total_steps": 1030, "loss": 0.3933, "lr": 3.20900184250625e-06, "epoch": 4.422010004547522, "percentage": 88.45, "elapsed_time": "5:38:59", "remaining_time": "0:44:16"} +{"current_steps": 912, "total_steps": 1030, "loss": 0.4023, "lr": 3.1560133868390895e-06, "epoch": 4.426860694254964, "percentage": 88.54, "elapsed_time": "5:42:54", "remaining_time": "0:44:22"} +{"current_steps": 913, "total_steps": 1030, "loss": 0.399, "lr": 3.1034480929928333e-06, "epoch": 4.431711383962407, "percentage": 88.64, "elapsed_time": "5:46:47", "remaining_time": "0:44:26"} +{"current_steps": 914, "total_steps": 1030, "loss": 0.3946, "lr": 3.0513065646921957e-06, "epoch": 4.43656207366985, "percentage": 88.74, "elapsed_time": "5:50:41", "remaining_time": "0:44:30"} +{"current_steps": 915, "total_steps": 1030, "loss": 0.392, "lr": 2.999589400794851e-06, "epoch": 4.441412763377293, "percentage": 88.83, "elapsed_time": "5:54:34", "remaining_time": "0:44:33"} +{"current_steps": 916, "total_steps": 1030, "loss": 0.3916, "lr": 2.948297195284546e-06, "epoch": 4.446263453084735, "percentage": 88.93, "elapsed_time": "5:58:27", "remaining_time": "0:44:36"} +{"current_steps": 917, "total_steps": 1030, "loss": 0.3947, "lr": 2.897430537264283e-06, "epoch": 4.4511141427921785, "percentage": 89.03, "elapsed_time": "6:02:19", "remaining_time": "0:44:38"} +{"current_steps": 918, "total_steps": 1030, "loss": 0.3942, "lr": 2.8469900109495553e-06, "epoch": 4.455964832499621, "percentage": 89.13, "elapsed_time": "6:06:13", "remaining_time": "0:44:40"} +{"current_steps": 919, "total_steps": 1030, "loss": 0.3888, "lr": 2.79697619566162e-06, "epoch": 4.460815522207064, "percentage": 89.22, "elapsed_time": "6:10:07", "remaining_time": "0:44:42"} +{"current_steps": 920, "total_steps": 1030, "loss": 0.391, "lr": 2.7473896658208743e-06, "epoch": 4.465666211914507, "percentage": 89.32, "elapsed_time": "6:14:01", "remaining_time": "0:44:43"} +{"current_steps": 921, "total_steps": 1030, "loss": 0.3936, "lr": 2.6982309909402293e-06, "epoch": 4.4705169016219495, "percentage": 89.42, "elapsed_time": "6:17:55", "remaining_time": "0:44:43"} +{"current_steps": 922, "total_steps": 1030, "loss": 0.3993, "lr": 2.649500735618582e-06, "epoch": 4.475367591329392, "percentage": 89.51, "elapsed_time": "6:21:49", "remaining_time": "0:44:43"} +{"current_steps": 923, "total_steps": 1030, "loss": 0.3965, "lr": 2.6011994595343516e-06, "epoch": 4.480218281036835, "percentage": 89.61, "elapsed_time": "6:25:43", "remaining_time": "0:44:42"} +{"current_steps": 924, "total_steps": 1030, "loss": 0.3927, "lr": 2.5533277174389916e-06, "epoch": 4.485068970744278, "percentage": 89.71, "elapsed_time": "6:29:37", "remaining_time": "0:44:41"} +{"current_steps": 925, "total_steps": 1030, "loss": 0.3927, "lr": 2.5058860591506973e-06, "epoch": 4.48991966045172, "percentage": 89.81, "elapsed_time": "6:33:31", "remaining_time": "0:44:40"} +{"current_steps": 926, "total_steps": 1030, "loss": 0.3888, "lr": 2.4588750295480246e-06, "epoch": 4.494770350159163, "percentage": 89.9, "elapsed_time": "6:37:23", "remaining_time": "0:44:37"} +{"current_steps": 927, "total_steps": 1030, "loss": 0.3896, "lr": 2.4122951685636674e-06, "epoch": 4.499621039866606, "percentage": 90.0, "elapsed_time": "6:41:17", "remaining_time": "0:44:35"} +{"current_steps": 928, "total_steps": 1030, "loss": 0.398, "lr": 2.366147011178246e-06, "epoch": 4.504471729574049, "percentage": 90.1, "elapsed_time": "6:45:11", "remaining_time": "0:44:32"} +{"current_steps": 929, "total_steps": 1030, "loss": 0.3838, "lr": 2.320431087414159e-06, "epoch": 4.509322419281491, "percentage": 90.19, "elapsed_time": "6:49:04", "remaining_time": "0:44:28"} +{"current_steps": 930, "total_steps": 1030, "loss": 0.3935, "lr": 2.275147922329506e-06, "epoch": 4.514173108988935, "percentage": 90.29, "elapsed_time": "6:52:57", "remaining_time": "0:44:24"} +{"current_steps": 931, "total_steps": 1030, "loss": 0.3913, "lr": 2.230298036012055e-06, "epoch": 4.519023798696377, "percentage": 90.39, "elapsed_time": "6:56:51", "remaining_time": "0:44:19"} +{"current_steps": 932, "total_steps": 1030, "loss": 0.395, "lr": 2.1858819435732583e-06, "epoch": 4.52387448840382, "percentage": 90.49, "elapsed_time": "7:00:43", "remaining_time": "0:44:14"} +{"current_steps": 933, "total_steps": 1030, "loss": 0.3951, "lr": 2.141900155142351e-06, "epoch": 4.528725178111262, "percentage": 90.58, "elapsed_time": "7:04:37", "remaining_time": "0:44:08"} +{"current_steps": 934, "total_steps": 1030, "loss": 0.4011, "lr": 2.0983531758604726e-06, "epoch": 4.533575867818706, "percentage": 90.68, "elapsed_time": "7:08:31", "remaining_time": "0:44:02"} +{"current_steps": 935, "total_steps": 1030, "loss": 0.3999, "lr": 2.055241505874892e-06, "epoch": 4.538426557526148, "percentage": 90.78, "elapsed_time": "7:12:25", "remaining_time": "0:43:56"} +{"current_steps": 936, "total_steps": 1030, "loss": 0.3968, "lr": 2.0125656403332396e-06, "epoch": 4.543277247233591, "percentage": 90.87, "elapsed_time": "7:16:18", "remaining_time": "0:43:49"} +{"current_steps": 937, "total_steps": 1030, "loss": 0.4001, "lr": 1.970326069377828e-06, "epoch": 4.548127936941034, "percentage": 90.97, "elapsed_time": "7:20:11", "remaining_time": "0:43:41"} +{"current_steps": 938, "total_steps": 1030, "loss": 0.3943, "lr": 1.928523278140033e-06, "epoch": 4.552978626648477, "percentage": 91.07, "elapsed_time": "7:24:05", "remaining_time": "0:43:33"} +{"current_steps": 939, "total_steps": 1030, "loss": 0.3972, "lr": 1.887157746734718e-06, "epoch": 4.557829316355919, "percentage": 91.17, "elapsed_time": "7:27:59", "remaining_time": "0:43:24"} +{"current_steps": 940, "total_steps": 1030, "loss": 0.3888, "lr": 1.846229950254692e-06, "epoch": 4.562680006063362, "percentage": 91.26, "elapsed_time": "7:31:53", "remaining_time": "0:43:15"} +{"current_steps": 941, "total_steps": 1030, "loss": 0.3892, "lr": 1.8057403587652977e-06, "epoch": 4.567530695770805, "percentage": 91.36, "elapsed_time": "7:35:46", "remaining_time": "0:43:06"} +{"current_steps": 942, "total_steps": 1030, "loss": 0.3991, "lr": 1.7656894372989785e-06, "epoch": 4.572381385478248, "percentage": 91.46, "elapsed_time": "7:39:39", "remaining_time": "0:42:56"} +{"current_steps": 943, "total_steps": 1030, "loss": 0.4033, "lr": 1.726077645849955e-06, "epoch": 4.57723207518569, "percentage": 91.55, "elapsed_time": "7:43:33", "remaining_time": "0:42:46"} +{"current_steps": 944, "total_steps": 1030, "loss": 0.394, "lr": 1.6869054393689265e-06, "epoch": 4.5820827648931335, "percentage": 91.65, "elapsed_time": "7:47:27", "remaining_time": "0:42:35"} +{"current_steps": 945, "total_steps": 1030, "loss": 0.4026, "lr": 1.6481732677578798e-06, "epoch": 4.586933454600576, "percentage": 91.75, "elapsed_time": "7:51:21", "remaining_time": "0:42:23"} +{"current_steps": 946, "total_steps": 1030, "loss": 0.378, "lr": 1.60988157586488e-06, "epoch": 4.5917841443080185, "percentage": 91.84, "elapsed_time": "7:55:14", "remaining_time": "0:42:11"} +{"current_steps": 947, "total_steps": 1030, "loss": 0.391, "lr": 1.5720308034789721e-06, "epoch": 4.596634834015462, "percentage": 91.94, "elapsed_time": "7:59:07", "remaining_time": "0:41:59"} +{"current_steps": 948, "total_steps": 1030, "loss": 0.3978, "lr": 1.5346213853251546e-06, "epoch": 4.601485523722904, "percentage": 92.04, "elapsed_time": "8:02:59", "remaining_time": "0:41:46"} +{"current_steps": 949, "total_steps": 1030, "loss": 0.3995, "lr": 1.4976537510593646e-06, "epoch": 4.606336213430347, "percentage": 92.14, "elapsed_time": "8:06:53", "remaining_time": "0:41:33"} +{"current_steps": 950, "total_steps": 1030, "loss": 0.4038, "lr": 1.4611283252635412e-06, "epoch": 4.61118690313779, "percentage": 92.23, "elapsed_time": "8:10:46", "remaining_time": "0:41:19"} +{"current_steps": 951, "total_steps": 1030, "loss": 0.3956, "lr": 1.425045527440756e-06, "epoch": 4.616037592845233, "percentage": 92.33, "elapsed_time": "8:14:40", "remaining_time": "0:41:05"} +{"current_steps": 952, "total_steps": 1030, "loss": 0.399, "lr": 1.3894057720104104e-06, "epoch": 4.620888282552675, "percentage": 92.43, "elapsed_time": "8:18:33", "remaining_time": "0:40:50"} +{"current_steps": 953, "total_steps": 1030, "loss": 0.3828, "lr": 1.354209468303429e-06, "epoch": 4.625738972260118, "percentage": 92.52, "elapsed_time": "8:22:27", "remaining_time": "0:40:35"} +{"current_steps": 954, "total_steps": 1030, "loss": 0.3954, "lr": 1.3194570205576284e-06, "epoch": 4.630589661967561, "percentage": 92.62, "elapsed_time": "8:26:19", "remaining_time": "0:40:20"} +{"current_steps": 955, "total_steps": 1030, "loss": 0.3876, "lr": 1.2851488279130053e-06, "epoch": 4.635440351675004, "percentage": 92.72, "elapsed_time": "8:30:13", "remaining_time": "0:40:04"} +{"current_steps": 956, "total_steps": 1030, "loss": 0.3949, "lr": 1.2512852844071933e-06, "epoch": 4.640291041382446, "percentage": 92.82, "elapsed_time": "8:34:06", "remaining_time": "0:39:47"} +{"current_steps": 957, "total_steps": 1030, "loss": 0.3919, "lr": 1.2178667789709287e-06, "epoch": 4.64514173108989, "percentage": 92.91, "elapsed_time": "8:37:59", "remaining_time": "0:39:30"} +{"current_steps": 958, "total_steps": 1030, "loss": 0.395, "lr": 1.1848936954235702e-06, "epoch": 4.649992420797332, "percentage": 93.01, "elapsed_time": "8:41:51", "remaining_time": "0:39:13"} +{"current_steps": 959, "total_steps": 1030, "loss": 0.3997, "lr": 1.1523664124687284e-06, "epoch": 4.654843110504775, "percentage": 93.11, "elapsed_time": "8:45:45", "remaining_time": "0:38:55"} +{"current_steps": 960, "total_steps": 1030, "loss": 0.3974, "lr": 1.1202853036898476e-06, "epoch": 4.659693800212217, "percentage": 93.2, "elapsed_time": "8:49:38", "remaining_time": "0:38:37"} +{"current_steps": 961, "total_steps": 1030, "loss": 0.3981, "lr": 1.0886507375459908e-06, "epoch": 4.664544489919661, "percentage": 93.3, "elapsed_time": "8:53:31", "remaining_time": "0:38:18"} +{"current_steps": 962, "total_steps": 1030, "loss": 0.3839, "lr": 1.0574630773675687e-06, "epoch": 4.669395179627103, "percentage": 93.4, "elapsed_time": "8:57:23", "remaining_time": "0:37:59"} +{"current_steps": 963, "total_steps": 1030, "loss": 0.3877, "lr": 1.0267226813521635e-06, "epoch": 4.674245869334546, "percentage": 93.5, "elapsed_time": "9:01:17", "remaining_time": "0:37:39"} +{"current_steps": 964, "total_steps": 1030, "loss": 0.3921, "lr": 9.964299025604274e-07, "epoch": 4.679096559041989, "percentage": 93.59, "elapsed_time": "9:05:10", "remaining_time": "0:37:19"} +{"current_steps": 965, "total_steps": 1030, "loss": 0.3967, "lr": 9.66585088912022e-07, "epoch": 4.683947248749432, "percentage": 93.69, "elapsed_time": "9:09:03", "remaining_time": "0:36:58"} +{"current_steps": 966, "total_steps": 1030, "loss": 0.395, "lr": 9.371885831816319e-07, "epoch": 4.688797938456874, "percentage": 93.79, "elapsed_time": "9:12:57", "remaining_time": "0:36:38"} +{"current_steps": 967, "total_steps": 1030, "loss": 0.3976, "lr": 9.082407229950018e-07, "epoch": 4.6936486281643175, "percentage": 93.88, "elapsed_time": "9:16:50", "remaining_time": "0:36:16"} +{"current_steps": 968, "total_steps": 1030, "loss": 0.3918, "lr": 8.797418408251101e-07, "epoch": 4.69849931787176, "percentage": 93.98, "elapsed_time": "9:20:43", "remaining_time": "0:35:54"} +{"current_steps": 969, "total_steps": 1030, "loss": 0.3897, "lr": 8.516922639882819e-07, "epoch": 4.7033500075792025, "percentage": 94.08, "elapsed_time": "9:24:35", "remaining_time": "0:35:32"} +{"current_steps": 970, "total_steps": 1030, "loss": 0.3901, "lr": 8.2409231464049e-07, "epoch": 4.708200697286646, "percentage": 94.17, "elapsed_time": "9:28:29", "remaining_time": "0:35:09"} +{"current_steps": 971, "total_steps": 1030, "loss": 0.3931, "lr": 7.969423097736162e-07, "epoch": 4.713051386994088, "percentage": 94.27, "elapsed_time": "9:32:23", "remaining_time": "0:34:46"} +{"current_steps": 972, "total_steps": 1030, "loss": 0.3962, "lr": 7.702425612118269e-07, "epoch": 4.717902076701531, "percentage": 94.37, "elapsed_time": "9:36:15", "remaining_time": "0:34:23"} +{"current_steps": 973, "total_steps": 1030, "loss": 0.3913, "lr": 7.439933756079942e-07, "epoch": 4.7227527664089735, "percentage": 94.47, "elapsed_time": "9:40:09", "remaining_time": "0:33:59"} +{"current_steps": 974, "total_steps": 1030, "loss": 0.3935, "lr": 7.181950544401695e-07, "epoch": 4.727603456116417, "percentage": 94.56, "elapsed_time": "9:44:02", "remaining_time": "0:33:34"} +{"current_steps": 975, "total_steps": 1030, "loss": 0.3984, "lr": 6.928478940081107e-07, "epoch": 4.732454145823859, "percentage": 94.66, "elapsed_time": "9:47:55", "remaining_time": "0:33:09"} +{"current_steps": 976, "total_steps": 1030, "loss": 0.3914, "lr": 6.679521854299032e-07, "epoch": 4.737304835531302, "percentage": 94.76, "elapsed_time": "9:51:49", "remaining_time": "0:32:44"} +{"current_steps": 977, "total_steps": 1030, "loss": 0.3901, "lr": 6.435082146385885e-07, "epoch": 4.742155525238745, "percentage": 94.85, "elapsed_time": "9:55:43", "remaining_time": "0:32:19"} +{"current_steps": 978, "total_steps": 1030, "loss": 0.393, "lr": 6.195162623789052e-07, "epoch": 4.747006214946188, "percentage": 94.95, "elapsed_time": "9:59:37", "remaining_time": "0:31:52"} +{"current_steps": 979, "total_steps": 1030, "loss": 0.3879, "lr": 5.959766042040426e-07, "epoch": 4.75185690465363, "percentage": 95.05, "elapsed_time": "10:03:30", "remaining_time": "0:31:26"} +{"current_steps": 980, "total_steps": 1030, "loss": 0.3959, "lr": 5.728895104724963e-07, "epoch": 4.756707594361073, "percentage": 95.15, "elapsed_time": "10:07:23", "remaining_time": "0:30:59"} +{"current_steps": 981, "total_steps": 1030, "loss": 0.3984, "lr": 5.502552463449418e-07, "epoch": 4.761558284068516, "percentage": 95.24, "elapsed_time": "10:11:17", "remaining_time": "0:30:32"} +{"current_steps": 982, "total_steps": 1030, "loss": 0.3977, "lr": 5.280740717812149e-07, "epoch": 4.766408973775959, "percentage": 95.34, "elapsed_time": "10:15:11", "remaining_time": "0:30:04"} +{"current_steps": 983, "total_steps": 1030, "loss": 0.3948, "lr": 5.063462415372967e-07, "epoch": 4.771259663483401, "percentage": 95.44, "elapsed_time": "10:19:03", "remaining_time": "0:29:35"} +{"current_steps": 984, "total_steps": 1030, "loss": 0.3914, "lr": 4.850720051624124e-07, "epoch": 4.776110353190845, "percentage": 95.53, "elapsed_time": "10:22:57", "remaining_time": "0:29:07"} +{"current_steps": 985, "total_steps": 1030, "loss": 0.392, "lr": 4.642516069961556e-07, "epoch": 4.780961042898287, "percentage": 95.63, "elapsed_time": "10:26:51", "remaining_time": "0:28:38"} +{"current_steps": 986, "total_steps": 1030, "loss": 0.3951, "lr": 4.438852861656751e-07, "epoch": 4.78581173260573, "percentage": 95.73, "elapsed_time": "10:30:45", "remaining_time": "0:28:08"} +{"current_steps": 987, "total_steps": 1030, "loss": 0.3899, "lr": 4.2397327658294076e-07, "epoch": 4.790662422313172, "percentage": 95.83, "elapsed_time": "10:34:39", "remaining_time": "0:27:38"} +{"current_steps": 988, "total_steps": 1030, "loss": 0.3963, "lr": 4.045158069420474e-07, "epoch": 4.795513112020616, "percentage": 95.92, "elapsed_time": "10:38:32", "remaining_time": "0:27:08"} +{"current_steps": 989, "total_steps": 1030, "loss": 0.3975, "lr": 3.8551310071659023e-07, "epoch": 4.800363801728058, "percentage": 96.02, "elapsed_time": "10:42:26", "remaining_time": "0:26:37"} +{"current_steps": 990, "total_steps": 1030, "loss": 0.3968, "lr": 3.6696537615711124e-07, "epoch": 4.805214491435501, "percentage": 96.12, "elapsed_time": "10:46:19", "remaining_time": "0:26:06"} +{"current_steps": 991, "total_steps": 1030, "loss": 0.3932, "lr": 3.4887284628857266e-07, "epoch": 4.810065181142944, "percentage": 96.21, "elapsed_time": "10:50:13", "remaining_time": "0:25:35"} +{"current_steps": 992, "total_steps": 1030, "loss": 0.3887, "lr": 3.3123571890791405e-07, "epoch": 4.8149158708503865, "percentage": 96.31, "elapsed_time": "10:54:07", "remaining_time": "0:25:03"} +{"current_steps": 993, "total_steps": 1030, "loss": 0.394, "lr": 3.1405419658168125e-07, "epoch": 4.819766560557829, "percentage": 96.41, "elapsed_time": "10:58:01", "remaining_time": "0:24:31"} +{"current_steps": 994, "total_steps": 1030, "loss": 0.3917, "lr": 2.973284766436857e-07, "epoch": 4.824617250265272, "percentage": 96.5, "elapsed_time": "11:01:54", "remaining_time": "0:23:58"} +{"current_steps": 995, "total_steps": 1030, "loss": 0.3901, "lr": 2.810587511927354e-07, "epoch": 4.829467939972715, "percentage": 96.6, "elapsed_time": "11:05:47", "remaining_time": "0:23:25"} +{"current_steps": 996, "total_steps": 1030, "loss": 0.3923, "lr": 2.652452070904499e-07, "epoch": 4.8343186296801575, "percentage": 96.7, "elapsed_time": "11:09:41", "remaining_time": "0:22:51"} +{"current_steps": 997, "total_steps": 1030, "loss": 0.3944, "lr": 2.498880259590797e-07, "epoch": 4.839169319387601, "percentage": 96.8, "elapsed_time": "11:13:35", "remaining_time": "0:22:17"} +{"current_steps": 998, "total_steps": 1030, "loss": 0.3975, "lr": 2.3498738417945034e-07, "epoch": 4.844020009095043, "percentage": 96.89, "elapsed_time": "11:17:29", "remaining_time": "0:21:43"} +{"current_steps": 999, "total_steps": 1030, "loss": 0.3971, "lr": 2.205434528889283e-07, "epoch": 4.848870698802486, "percentage": 96.99, "elapsed_time": "11:21:22", "remaining_time": "0:21:08"} +{"current_steps": 1000, "total_steps": 1030, "loss": 0.3903, "lr": 2.0655639797944937e-07, "epoch": 4.853721388509928, "percentage": 97.09, "elapsed_time": "11:25:15", "remaining_time": "0:20:33"} +{"current_steps": 1001, "total_steps": 1030, "loss": 0.396, "lr": 1.9302638009561782e-07, "epoch": 4.858572078217372, "percentage": 97.18, "elapsed_time": "11:29:09", "remaining_time": "0:19:57"} +{"current_steps": 1002, "total_steps": 1030, "loss": 0.3965, "lr": 1.7995355463285457e-07, "epoch": 4.863422767924814, "percentage": 97.28, "elapsed_time": "11:33:02", "remaining_time": "0:19:21"} +{"current_steps": 1003, "total_steps": 1030, "loss": 0.3913, "lr": 1.6733807173562988e-07, "epoch": 4.868273457632257, "percentage": 97.38, "elapsed_time": "11:36:55", "remaining_time": "0:18:45"} +{"current_steps": 1004, "total_steps": 1030, "loss": 0.3995, "lr": 1.5518007629571342e-07, "epoch": 4.8731241473397, "percentage": 97.48, "elapsed_time": "11:40:49", "remaining_time": "0:18:08"} +{"current_steps": 1005, "total_steps": 1030, "loss": 0.3967, "lr": 1.4347970795054456e-07, "epoch": 4.877974837047143, "percentage": 97.57, "elapsed_time": "11:44:42", "remaining_time": "0:17:31"} +{"current_steps": 1006, "total_steps": 1030, "loss": 0.3965, "lr": 1.3223710108158483e-07, "epoch": 4.882825526754585, "percentage": 97.67, "elapsed_time": "11:48:35", "remaining_time": "0:16:54"} +{"current_steps": 1007, "total_steps": 1030, "loss": 0.3971, "lr": 1.214523848128124e-07, "epoch": 4.887676216462028, "percentage": 97.77, "elapsed_time": "11:52:29", "remaining_time": "0:16:16"} +{"current_steps": 1008, "total_steps": 1030, "loss": 0.3996, "lr": 1.111256830092211e-07, "epoch": 4.892526906169471, "percentage": 97.86, "elapsed_time": "11:56:23", "remaining_time": "0:15:38"} +{"current_steps": 1009, "total_steps": 1030, "loss": 0.3949, "lr": 1.0125711427540374e-07, "epoch": 4.897377595876914, "percentage": 97.96, "elapsed_time": "12:00:15", "remaining_time": "0:14:59"} +{"current_steps": 1010, "total_steps": 1030, "loss": 0.3889, "lr": 9.184679195417989e-08, "epoch": 4.902228285584356, "percentage": 98.06, "elapsed_time": "12:04:09", "remaining_time": "0:14:20"} +{"current_steps": 1011, "total_steps": 1030, "loss": 0.3984, "lr": 8.289482412531246e-08, "epoch": 4.9070789752918, "percentage": 98.16, "elapsed_time": "12:08:03", "remaining_time": "0:13:40"} +{"current_steps": 1012, "total_steps": 1030, "loss": 0.3887, "lr": 7.440131360424652e-08, "epoch": 4.911929664999242, "percentage": 98.25, "elapsed_time": "12:11:57", "remaining_time": "0:13:01"} +{"current_steps": 1013, "total_steps": 1030, "loss": 0.3908, "lr": 6.636635794094126e-08, "epoch": 4.916780354706685, "percentage": 98.35, "elapsed_time": "12:15:51", "remaining_time": "0:12:20"} +{"current_steps": 1014, "total_steps": 1030, "loss": 0.3951, "lr": 5.879004941874655e-08, "epoch": 4.921631044414128, "percentage": 98.45, "elapsed_time": "12:19:45", "remaining_time": "0:11:40"} +{"current_steps": 1015, "total_steps": 1030, "loss": 0.398, "lr": 5.16724750533415e-08, "epoch": 4.9264817341215705, "percentage": 98.54, "elapsed_time": "12:23:38", "remaining_time": "0:10:59"} +{"current_steps": 1016, "total_steps": 1030, "loss": 0.3944, "lr": 4.5013716591730815e-08, "epoch": 4.931332423829013, "percentage": 98.64, "elapsed_time": "12:27:31", "remaining_time": "0:10:18"} +{"current_steps": 1017, "total_steps": 1030, "loss": 0.3997, "lr": 3.881385051132114e-08, "epoch": 4.9361831135364564, "percentage": 98.74, "elapsed_time": "12:31:25", "remaining_time": "0:09:36"} +{"current_steps": 1018, "total_steps": 1030, "loss": 0.3968, "lr": 3.307294801902838e-08, "epoch": 4.941033803243899, "percentage": 98.83, "elapsed_time": "12:35:19", "remaining_time": "0:08:54"} +{"current_steps": 1019, "total_steps": 1030, "loss": 0.3977, "lr": 2.7791075050460636e-08, "epoch": 4.9458844929513415, "percentage": 98.93, "elapsed_time": "12:39:13", "remaining_time": "0:08:11"} +{"current_steps": 1020, "total_steps": 1030, "loss": 0.3978, "lr": 2.2968292269167637e-08, "epoch": 4.950735182658784, "percentage": 99.03, "elapsed_time": "12:43:07", "remaining_time": "0:07:28"} +{"current_steps": 1021, "total_steps": 1030, "loss": 0.3888, "lr": 1.8604655065939116e-08, "epoch": 4.955585872366227, "percentage": 99.13, "elapsed_time": "12:47:00", "remaining_time": "0:06:45"} +{"current_steps": 1022, "total_steps": 1030, "loss": 0.3952, "lr": 1.470021355816975e-08, "epoch": 4.96043656207367, "percentage": 99.22, "elapsed_time": "12:50:53", "remaining_time": "0:06:02"} +{"current_steps": 1023, "total_steps": 1030, "loss": 0.3988, "lr": 1.1255012589286297e-08, "epoch": 4.965287251781112, "percentage": 99.32, "elapsed_time": "12:54:47", "remaining_time": "0:05:18"} +{"current_steps": 1024, "total_steps": 1030, "loss": 0.3858, "lr": 8.269091728232426e-09, "epoch": 4.970137941488556, "percentage": 99.42, "elapsed_time": "12:58:41", "remaining_time": "0:04:33"} +{"current_steps": 1025, "total_steps": 1030, "loss": 0.3976, "lr": 5.742485269006892e-09, "epoch": 4.974988631195998, "percentage": 99.51, "elapsed_time": "13:02:34", "remaining_time": "0:03:49"} +{"current_steps": 1026, "total_steps": 1030, "loss": 0.3922, "lr": 3.6752222302727238e-09, "epoch": 4.979839320903441, "percentage": 99.61, "elapsed_time": "13:06:27", "remaining_time": "0:03:03"} +{"current_steps": 1027, "total_steps": 1030, "loss": 0.3894, "lr": 2.06732635503748e-09, "epoch": 4.984690010610883, "percentage": 99.71, "elapsed_time": "13:10:21", "remaining_time": "0:02:18"} +{"current_steps": 1028, "total_steps": 1030, "loss": 0.3893, "lr": 9.188161103557136e-10, "epoch": 4.989540700318327, "percentage": 99.81, "elapsed_time": "13:14:15", "remaining_time": "0:01:32"} +{"current_steps": 1029, "total_steps": 1030, "loss": 0.3934, "lr": 2.2970468714245132e-10, "epoch": 4.994391390025769, "percentage": 99.9, "elapsed_time": "13:18:09", "remaining_time": "0:00:46"} +{"current_steps": 1030, "total_steps": 1030, "loss": 0.3877, "lr": 0.0, "epoch": 4.999242079733212, "percentage": 100.0, "elapsed_time": "13:22:02", "remaining_time": "0:00:00"} +{"current_steps": 1030, "total_steps": 1030, "epoch": 4.999242079733212, "percentage": 100.0, "elapsed_time": "13:22:33", "remaining_time": "0:00:00"} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..835aa94 --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,7252 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 4.999242079733212, + "eval_steps": 500, + "global_step": 1030, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.004850689707442777, + "grad_norm": 6.339065858846749, + "learning_rate": 7.766990291262136e-07, + "loss": 1.0147, + "step": 1 + }, + { + "epoch": 0.009701379414885554, + "grad_norm": 6.370901874406726, + "learning_rate": 1.5533980582524272e-06, + "loss": 1.0217, + "step": 2 + }, + { + "epoch": 0.01455206912232833, + "grad_norm": 6.253076167725343, + "learning_rate": 2.330097087378641e-06, + "loss": 1.0059, + "step": 3 + }, + { + "epoch": 0.01940275882977111, + "grad_norm": 5.8627331903052005, + "learning_rate": 3.1067961165048544e-06, + "loss": 0.9987, + "step": 4 + }, + { + "epoch": 0.024253448537213885, + "grad_norm": 4.624724616975588, + "learning_rate": 3.883495145631068e-06, + "loss": 0.9654, + "step": 5 + }, + { + "epoch": 0.02910413824465666, + "grad_norm": 2.701973440331149, + "learning_rate": 4.660194174757282e-06, + "loss": 0.9221, + "step": 6 + }, + { + "epoch": 0.03395482795209944, + "grad_norm": 2.5821400220833683, + "learning_rate": 5.436893203883496e-06, + "loss": 0.9118, + "step": 7 + }, + { + "epoch": 0.03880551765954222, + "grad_norm": 3.1473551148693146, + "learning_rate": 6.213592233009709e-06, + "loss": 0.8818, + "step": 8 + }, + { + "epoch": 0.04365620736698499, + "grad_norm": 3.8230150062051638, + "learning_rate": 6.990291262135923e-06, + "loss": 0.8912, + "step": 9 + }, + { + "epoch": 0.04850689707442777, + "grad_norm": 3.4669236063777715, + "learning_rate": 7.766990291262136e-06, + "loss": 0.8779, + "step": 10 + }, + { + "epoch": 0.053357586781870546, + "grad_norm": 2.712055876575345, + "learning_rate": 8.54368932038835e-06, + "loss": 0.8328, + "step": 11 + }, + { + "epoch": 0.05820827648931332, + "grad_norm": 2.574263966000136, + "learning_rate": 9.320388349514565e-06, + "loss": 0.8149, + "step": 12 + }, + { + "epoch": 0.0630589661967561, + "grad_norm": 1.8016385817876701, + "learning_rate": 1.0097087378640778e-05, + "loss": 0.7941, + "step": 13 + }, + { + "epoch": 0.06790965590419888, + "grad_norm": 1.16110696712433, + "learning_rate": 1.0873786407766991e-05, + "loss": 0.7751, + "step": 14 + }, + { + "epoch": 0.07276034561164166, + "grad_norm": 1.5441894400920566, + "learning_rate": 1.1650485436893204e-05, + "loss": 0.7603, + "step": 15 + }, + { + "epoch": 0.07761103531908443, + "grad_norm": 1.3570174190036193, + "learning_rate": 1.2427184466019418e-05, + "loss": 0.7456, + "step": 16 + }, + { + "epoch": 0.08246172502652721, + "grad_norm": 1.0160879152766609, + "learning_rate": 1.3203883495145633e-05, + "loss": 0.74, + "step": 17 + }, + { + "epoch": 0.08731241473396999, + "grad_norm": 1.195923679791525, + "learning_rate": 1.3980582524271846e-05, + "loss": 0.7223, + "step": 18 + }, + { + "epoch": 0.09216310444141276, + "grad_norm": 1.0381307779091873, + "learning_rate": 1.475728155339806e-05, + "loss": 0.7149, + "step": 19 + }, + { + "epoch": 0.09701379414885554, + "grad_norm": 0.9191697728302082, + "learning_rate": 1.5533980582524273e-05, + "loss": 0.7032, + "step": 20 + }, + { + "epoch": 0.10186448385629832, + "grad_norm": 1.0389109685950821, + "learning_rate": 1.6310679611650486e-05, + "loss": 0.697, + "step": 21 + }, + { + "epoch": 0.10671517356374109, + "grad_norm": 0.8528569833940303, + "learning_rate": 1.70873786407767e-05, + "loss": 0.6913, + "step": 22 + }, + { + "epoch": 0.11156586327118387, + "grad_norm": 0.7397574673832126, + "learning_rate": 1.7864077669902916e-05, + "loss": 0.6844, + "step": 23 + }, + { + "epoch": 0.11641655297862664, + "grad_norm": 0.6762376097915315, + "learning_rate": 1.864077669902913e-05, + "loss": 0.6807, + "step": 24 + }, + { + "epoch": 0.12126724268606942, + "grad_norm": 0.6801312007046909, + "learning_rate": 1.9417475728155343e-05, + "loss": 0.6651, + "step": 25 + }, + { + "epoch": 0.1261179323935122, + "grad_norm": 0.5373129321939298, + "learning_rate": 2.0194174757281556e-05, + "loss": 0.6661, + "step": 26 + }, + { + "epoch": 0.13096862210095497, + "grad_norm": 0.6155691125010336, + "learning_rate": 2.097087378640777e-05, + "loss": 0.6655, + "step": 27 + }, + { + "epoch": 0.13581931180839776, + "grad_norm": 0.5373412410981904, + "learning_rate": 2.1747572815533982e-05, + "loss": 0.6541, + "step": 28 + }, + { + "epoch": 0.14067000151584053, + "grad_norm": 0.5722094683121568, + "learning_rate": 2.2524271844660196e-05, + "loss": 0.6534, + "step": 29 + }, + { + "epoch": 0.14552069122328332, + "grad_norm": 0.6369873796903149, + "learning_rate": 2.330097087378641e-05, + "loss": 0.6536, + "step": 30 + }, + { + "epoch": 0.15037138093072608, + "grad_norm": 0.5246684440675834, + "learning_rate": 2.4077669902912622e-05, + "loss": 0.6545, + "step": 31 + }, + { + "epoch": 0.15522207063816887, + "grad_norm": 0.504247506683658, + "learning_rate": 2.4854368932038836e-05, + "loss": 0.6314, + "step": 32 + }, + { + "epoch": 0.16007276034561163, + "grad_norm": 0.5566944063536889, + "learning_rate": 2.5631067961165052e-05, + "loss": 0.6373, + "step": 33 + }, + { + "epoch": 0.16492345005305442, + "grad_norm": 0.8570989167580252, + "learning_rate": 2.6407766990291266e-05, + "loss": 0.63, + "step": 34 + }, + { + "epoch": 0.16977413976049718, + "grad_norm": 1.8667995731915865, + "learning_rate": 2.718446601941748e-05, + "loss": 0.6456, + "step": 35 + }, + { + "epoch": 0.17462482946793997, + "grad_norm": 0.5164194413667431, + "learning_rate": 2.7961165048543692e-05, + "loss": 0.6308, + "step": 36 + }, + { + "epoch": 0.17947551917538274, + "grad_norm": 1.6098330943831782, + "learning_rate": 2.8737864077669905e-05, + "loss": 0.6398, + "step": 37 + }, + { + "epoch": 0.18432620888282553, + "grad_norm": 1.1492129920694993, + "learning_rate": 2.951456310679612e-05, + "loss": 0.6276, + "step": 38 + }, + { + "epoch": 0.18917689859026832, + "grad_norm": 0.7127614761088336, + "learning_rate": 3.0291262135922332e-05, + "loss": 0.6218, + "step": 39 + }, + { + "epoch": 0.19402758829771108, + "grad_norm": 1.0312378150228299, + "learning_rate": 3.1067961165048545e-05, + "loss": 0.6253, + "step": 40 + }, + { + "epoch": 0.19887827800515387, + "grad_norm": 1.7574387168351864, + "learning_rate": 3.184466019417476e-05, + "loss": 0.6281, + "step": 41 + }, + { + "epoch": 0.20372896771259663, + "grad_norm": 0.9416599187328968, + "learning_rate": 3.262135922330097e-05, + "loss": 0.6235, + "step": 42 + }, + { + "epoch": 0.20857965742003942, + "grad_norm": 1.8301787236679616, + "learning_rate": 3.339805825242719e-05, + "loss": 0.622, + "step": 43 + }, + { + "epoch": 0.21343034712748218, + "grad_norm": 0.9292078210446757, + "learning_rate": 3.41747572815534e-05, + "loss": 0.6107, + "step": 44 + }, + { + "epoch": 0.21828103683492497, + "grad_norm": 1.994214362456412, + "learning_rate": 3.4951456310679615e-05, + "loss": 0.6151, + "step": 45 + }, + { + "epoch": 0.22313172654236774, + "grad_norm": 1.3619344540131681, + "learning_rate": 3.572815533980583e-05, + "loss": 0.6089, + "step": 46 + }, + { + "epoch": 0.22798241624981053, + "grad_norm": 1.6323821476629805, + "learning_rate": 3.650485436893204e-05, + "loss": 0.6165, + "step": 47 + }, + { + "epoch": 0.2328331059572533, + "grad_norm": 1.1474300438640261, + "learning_rate": 3.728155339805826e-05, + "loss": 0.6104, + "step": 48 + }, + { + "epoch": 0.23768379566469608, + "grad_norm": 1.1936059623728144, + "learning_rate": 3.805825242718447e-05, + "loss": 0.6086, + "step": 49 + }, + { + "epoch": 0.24253448537213884, + "grad_norm": 1.4126137333521573, + "learning_rate": 3.8834951456310685e-05, + "loss": 0.6123, + "step": 50 + }, + { + "epoch": 0.24738517507958163, + "grad_norm": 0.7835607330331523, + "learning_rate": 3.9611650485436895e-05, + "loss": 0.5979, + "step": 51 + }, + { + "epoch": 0.2522358647870244, + "grad_norm": 1.3575257469759314, + "learning_rate": 4.038834951456311e-05, + "loss": 0.6134, + "step": 52 + }, + { + "epoch": 0.25708655449446716, + "grad_norm": 0.9580505107131282, + "learning_rate": 4.116504854368932e-05, + "loss": 0.5987, + "step": 53 + }, + { + "epoch": 0.26193724420190995, + "grad_norm": 1.1647956860260527, + "learning_rate": 4.194174757281554e-05, + "loss": 0.6134, + "step": 54 + }, + { + "epoch": 0.26678793390935274, + "grad_norm": 0.9133078407230598, + "learning_rate": 4.271844660194175e-05, + "loss": 0.5978, + "step": 55 + }, + { + "epoch": 0.2716386236167955, + "grad_norm": 1.3505836368180404, + "learning_rate": 4.3495145631067965e-05, + "loss": 0.5944, + "step": 56 + }, + { + "epoch": 0.2764893133242383, + "grad_norm": 1.1628512424723636, + "learning_rate": 4.4271844660194175e-05, + "loss": 0.6052, + "step": 57 + }, + { + "epoch": 0.28134000303168105, + "grad_norm": 1.6421048813051027, + "learning_rate": 4.504854368932039e-05, + "loss": 0.6008, + "step": 58 + }, + { + "epoch": 0.28619069273912384, + "grad_norm": 1.3019802198524983, + "learning_rate": 4.58252427184466e-05, + "loss": 0.594, + "step": 59 + }, + { + "epoch": 0.29104138244656663, + "grad_norm": 1.2774402772060065, + "learning_rate": 4.660194174757282e-05, + "loss": 0.5892, + "step": 60 + }, + { + "epoch": 0.2958920721540094, + "grad_norm": 1.4435670386305743, + "learning_rate": 4.737864077669903e-05, + "loss": 0.5931, + "step": 61 + }, + { + "epoch": 0.30074276186145216, + "grad_norm": 1.0284857540916943, + "learning_rate": 4.8155339805825245e-05, + "loss": 0.5932, + "step": 62 + }, + { + "epoch": 0.30559345156889495, + "grad_norm": 1.1698103896183938, + "learning_rate": 4.8932038834951454e-05, + "loss": 0.5948, + "step": 63 + }, + { + "epoch": 0.31044414127633774, + "grad_norm": 1.434142725222452, + "learning_rate": 4.970873786407767e-05, + "loss": 0.5897, + "step": 64 + }, + { + "epoch": 0.3152948309837805, + "grad_norm": 1.3482179068151203, + "learning_rate": 5.0485436893203895e-05, + "loss": 0.5824, + "step": 65 + }, + { + "epoch": 0.32014552069122326, + "grad_norm": 1.3069227496554443, + "learning_rate": 5.1262135922330105e-05, + "loss": 0.5802, + "step": 66 + }, + { + "epoch": 0.32499621039866605, + "grad_norm": 1.1366236056516827, + "learning_rate": 5.203883495145632e-05, + "loss": 0.5804, + "step": 67 + }, + { + "epoch": 0.32984690010610884, + "grad_norm": 1.6243350603336242, + "learning_rate": 5.281553398058253e-05, + "loss": 0.5812, + "step": 68 + }, + { + "epoch": 0.33469758981355163, + "grad_norm": 1.0822457196908746, + "learning_rate": 5.359223300970875e-05, + "loss": 0.5862, + "step": 69 + }, + { + "epoch": 0.33954827952099437, + "grad_norm": 1.6360957248140573, + "learning_rate": 5.436893203883496e-05, + "loss": 0.5912, + "step": 70 + }, + { + "epoch": 0.34439896922843716, + "grad_norm": 2.3477845490488813, + "learning_rate": 5.5145631067961174e-05, + "loss": 0.5906, + "step": 71 + }, + { + "epoch": 0.34924965893587995, + "grad_norm": 1.105543560593242, + "learning_rate": 5.5922330097087384e-05, + "loss": 0.5824, + "step": 72 + }, + { + "epoch": 0.35410034864332274, + "grad_norm": 4.137098681881185, + "learning_rate": 5.66990291262136e-05, + "loss": 0.6359, + "step": 73 + }, + { + "epoch": 0.3589510383507655, + "grad_norm": 3.8847979837997033, + "learning_rate": 5.747572815533981e-05, + "loss": 0.6486, + "step": 74 + }, + { + "epoch": 0.36380172805820826, + "grad_norm": 1.1747128429519862, + "learning_rate": 5.825242718446603e-05, + "loss": 0.595, + "step": 75 + }, + { + "epoch": 0.36865241776565105, + "grad_norm": 3.008245900701061, + "learning_rate": 5.902912621359224e-05, + "loss": 0.6387, + "step": 76 + }, + { + "epoch": 0.37350310747309384, + "grad_norm": 2.3713075132931554, + "learning_rate": 5.9805825242718454e-05, + "loss": 0.6344, + "step": 77 + }, + { + "epoch": 0.37835379718053663, + "grad_norm": 1.6213053074921984, + "learning_rate": 6.0582524271844664e-05, + "loss": 0.6048, + "step": 78 + }, + { + "epoch": 0.38320448688797937, + "grad_norm": 1.6024154837501339, + "learning_rate": 6.135922330097087e-05, + "loss": 0.6203, + "step": 79 + }, + { + "epoch": 0.38805517659542216, + "grad_norm": 1.1825030677591377, + "learning_rate": 6.213592233009709e-05, + "loss": 0.6052, + "step": 80 + }, + { + "epoch": 0.39290586630286495, + "grad_norm": 1.3964525731128163, + "learning_rate": 6.291262135922331e-05, + "loss": 0.6112, + "step": 81 + }, + { + "epoch": 0.39775655601030774, + "grad_norm": 1.1205074621871551, + "learning_rate": 6.368932038834952e-05, + "loss": 0.5977, + "step": 82 + }, + { + "epoch": 0.4026072457177505, + "grad_norm": 1.045620374565707, + "learning_rate": 6.446601941747573e-05, + "loss": 0.5914, + "step": 83 + }, + { + "epoch": 0.40745793542519326, + "grad_norm": 1.3974586249408472, + "learning_rate": 6.524271844660194e-05, + "loss": 0.5918, + "step": 84 + }, + { + "epoch": 0.41230862513263605, + "grad_norm": 1.0818483302602913, + "learning_rate": 6.601941747572816e-05, + "loss": 0.5948, + "step": 85 + }, + { + "epoch": 0.41715931484007884, + "grad_norm": 0.9808456957793906, + "learning_rate": 6.679611650485438e-05, + "loss": 0.5839, + "step": 86 + }, + { + "epoch": 0.4220100045475216, + "grad_norm": 1.2035779456517084, + "learning_rate": 6.757281553398058e-05, + "loss": 0.5833, + "step": 87 + }, + { + "epoch": 0.42686069425496437, + "grad_norm": 1.6887623926979713, + "learning_rate": 6.83495145631068e-05, + "loss": 0.5818, + "step": 88 + }, + { + "epoch": 0.43171138396240716, + "grad_norm": 0.8023218391013366, + "learning_rate": 6.912621359223301e-05, + "loss": 0.5863, + "step": 89 + }, + { + "epoch": 0.43656207366984995, + "grad_norm": 1.574900348178855, + "learning_rate": 6.990291262135923e-05, + "loss": 0.5821, + "step": 90 + }, + { + "epoch": 0.4414127633772927, + "grad_norm": 0.9288518542917786, + "learning_rate": 7.067961165048545e-05, + "loss": 0.5814, + "step": 91 + }, + { + "epoch": 0.4462634530847355, + "grad_norm": 1.6871845487045471, + "learning_rate": 7.145631067961166e-05, + "loss": 0.5819, + "step": 92 + }, + { + "epoch": 0.45111414279217826, + "grad_norm": 1.147490028185953, + "learning_rate": 7.223300970873787e-05, + "loss": 0.5752, + "step": 93 + }, + { + "epoch": 0.45596483249962105, + "grad_norm": 1.0734179177901382, + "learning_rate": 7.300970873786408e-05, + "loss": 0.5786, + "step": 94 + }, + { + "epoch": 0.46081552220706384, + "grad_norm": 1.2263367009960806, + "learning_rate": 7.37864077669903e-05, + "loss": 0.5789, + "step": 95 + }, + { + "epoch": 0.4656662119145066, + "grad_norm": 1.4570032389620742, + "learning_rate": 7.456310679611652e-05, + "loss": 0.5745, + "step": 96 + }, + { + "epoch": 0.47051690162194937, + "grad_norm": 1.3246870726440927, + "learning_rate": 7.533980582524272e-05, + "loss": 0.5775, + "step": 97 + }, + { + "epoch": 0.47536759132939216, + "grad_norm": 0.9415857506868542, + "learning_rate": 7.611650485436894e-05, + "loss": 0.5699, + "step": 98 + }, + { + "epoch": 0.48021828103683495, + "grad_norm": 1.2384384474151087, + "learning_rate": 7.689320388349515e-05, + "loss": 0.5733, + "step": 99 + }, + { + "epoch": 0.4850689707442777, + "grad_norm": 1.5627749991572353, + "learning_rate": 7.766990291262137e-05, + "loss": 0.5735, + "step": 100 + }, + { + "epoch": 0.4899196604517205, + "grad_norm": 1.0078484211944914, + "learning_rate": 7.844660194174757e-05, + "loss": 0.5733, + "step": 101 + }, + { + "epoch": 0.49477035015916326, + "grad_norm": 1.6421211712488573, + "learning_rate": 7.922330097087379e-05, + "loss": 0.576, + "step": 102 + }, + { + "epoch": 0.49962103986660605, + "grad_norm": 0.8416126904816602, + "learning_rate": 8e-05, + "loss": 0.5697, + "step": 103 + }, + { + "epoch": 0.5044717295740488, + "grad_norm": 1.7540458195736903, + "learning_rate": 7.999977029531286e-05, + "loss": 0.5799, + "step": 104 + }, + { + "epoch": 0.5093224192814916, + "grad_norm": 1.050447231844734, + "learning_rate": 7.999908118388965e-05, + "loss": 0.5756, + "step": 105 + }, + { + "epoch": 0.5141731089889343, + "grad_norm": 1.394330877960354, + "learning_rate": 7.999793267364497e-05, + "loss": 0.5713, + "step": 106 + }, + { + "epoch": 0.5190237986963772, + "grad_norm": 1.5873678777006228, + "learning_rate": 7.999632477776974e-05, + "loss": 0.5733, + "step": 107 + }, + { + "epoch": 0.5238744884038199, + "grad_norm": 0.8115732123781836, + "learning_rate": 7.9994257514731e-05, + "loss": 0.5661, + "step": 108 + }, + { + "epoch": 0.5287251781112627, + "grad_norm": 1.1857754936411384, + "learning_rate": 7.999173090827177e-05, + "loss": 0.5719, + "step": 109 + }, + { + "epoch": 0.5335758678187055, + "grad_norm": 0.8066157800150973, + "learning_rate": 7.998874498741072e-05, + "loss": 0.5695, + "step": 110 + }, + { + "epoch": 0.5384265575261482, + "grad_norm": 1.4739854945603235, + "learning_rate": 7.998529978644183e-05, + "loss": 0.5712, + "step": 111 + }, + { + "epoch": 0.543277247233591, + "grad_norm": 0.778875512416499, + "learning_rate": 7.998139534493407e-05, + "loss": 0.5609, + "step": 112 + }, + { + "epoch": 0.5481279369410338, + "grad_norm": 0.9919152170469479, + "learning_rate": 7.997703170773084e-05, + "loss": 0.5648, + "step": 113 + }, + { + "epoch": 0.5529786266484766, + "grad_norm": 1.3093959851041357, + "learning_rate": 7.997220892494955e-05, + "loss": 0.5757, + "step": 114 + }, + { + "epoch": 0.5578293163559194, + "grad_norm": 0.9066117120369992, + "learning_rate": 7.996692705198097e-05, + "loss": 0.566, + "step": 115 + }, + { + "epoch": 0.5626800060633621, + "grad_norm": 1.2498381901490132, + "learning_rate": 7.996118614948869e-05, + "loss": 0.5757, + "step": 116 + }, + { + "epoch": 0.567530695770805, + "grad_norm": 1.0385189418340641, + "learning_rate": 7.995498628340827e-05, + "loss": 0.5697, + "step": 117 + }, + { + "epoch": 0.5723813854782477, + "grad_norm": 1.3065564110858372, + "learning_rate": 7.994832752494667e-05, + "loss": 0.5672, + "step": 118 + }, + { + "epoch": 0.5772320751856904, + "grad_norm": 0.9524061899396458, + "learning_rate": 7.994120995058127e-05, + "loss": 0.5624, + "step": 119 + }, + { + "epoch": 0.5820827648931333, + "grad_norm": 1.018979775317657, + "learning_rate": 7.993363364205907e-05, + "loss": 0.554, + "step": 120 + }, + { + "epoch": 0.586933454600576, + "grad_norm": 0.9276898951496916, + "learning_rate": 7.992559868639576e-05, + "loss": 0.556, + "step": 121 + }, + { + "epoch": 0.5917841443080188, + "grad_norm": 1.1930439188526805, + "learning_rate": 7.99171051758747e-05, + "loss": 0.5526, + "step": 122 + }, + { + "epoch": 0.5966348340154616, + "grad_norm": 0.6826863389197481, + "learning_rate": 7.990815320804583e-05, + "loss": 0.5609, + "step": 123 + }, + { + "epoch": 0.6014855237229043, + "grad_norm": 0.8061980858751947, + "learning_rate": 7.98987428857246e-05, + "loss": 0.5586, + "step": 124 + }, + { + "epoch": 0.6063362134303472, + "grad_norm": 0.9239948149603757, + "learning_rate": 7.988887431699079e-05, + "loss": 0.5507, + "step": 125 + }, + { + "epoch": 0.6111869031377899, + "grad_norm": 1.0465957889843347, + "learning_rate": 7.987854761518719e-05, + "loss": 0.5568, + "step": 126 + }, + { + "epoch": 0.6160375928452326, + "grad_norm": 0.8308130357408615, + "learning_rate": 7.986776289891842e-05, + "loss": 0.5591, + "step": 127 + }, + { + "epoch": 0.6208882825526755, + "grad_norm": 1.0246744766037437, + "learning_rate": 7.985652029204946e-05, + "loss": 0.5563, + "step": 128 + }, + { + "epoch": 0.6257389722601182, + "grad_norm": 1.3238612418839921, + "learning_rate": 7.984481992370429e-05, + "loss": 0.5491, + "step": 129 + }, + { + "epoch": 0.630589661967561, + "grad_norm": 0.6948258976249133, + "learning_rate": 7.983266192826437e-05, + "loss": 0.5418, + "step": 130 + }, + { + "epoch": 0.6354403516750038, + "grad_norm": 0.7288790333090353, + "learning_rate": 7.982004644536716e-05, + "loss": 0.5441, + "step": 131 + }, + { + "epoch": 0.6402910413824465, + "grad_norm": 1.0943204811023435, + "learning_rate": 7.98069736199044e-05, + "loss": 0.5493, + "step": 132 + }, + { + "epoch": 0.6451417310898894, + "grad_norm": 0.8706827515570799, + "learning_rate": 7.979344360202055e-05, + "loss": 0.5465, + "step": 133 + }, + { + "epoch": 0.6499924207973321, + "grad_norm": 0.9127380693761118, + "learning_rate": 7.977945654711108e-05, + "loss": 0.5475, + "step": 134 + }, + { + "epoch": 0.654843110504775, + "grad_norm": 0.9510188119086359, + "learning_rate": 7.976501261582056e-05, + "loss": 0.543, + "step": 135 + }, + { + "epoch": 0.6596938002122177, + "grad_norm": 0.9350726421156861, + "learning_rate": 7.975011197404092e-05, + "loss": 0.5525, + "step": 136 + }, + { + "epoch": 0.6645444899196604, + "grad_norm": 1.272258773056705, + "learning_rate": 7.973475479290956e-05, + "loss": 0.5518, + "step": 137 + }, + { + "epoch": 0.6693951796271033, + "grad_norm": 0.9765265325518906, + "learning_rate": 7.971894124880727e-05, + "loss": 0.5417, + "step": 138 + }, + { + "epoch": 0.674245869334546, + "grad_norm": 1.1917501609756302, + "learning_rate": 7.970267152335632e-05, + "loss": 0.5464, + "step": 139 + }, + { + "epoch": 0.6790965590419887, + "grad_norm": 0.6719257463868904, + "learning_rate": 7.968594580341832e-05, + "loss": 0.544, + "step": 140 + }, + { + "epoch": 0.6839472487494316, + "grad_norm": 0.7137208028607956, + "learning_rate": 7.966876428109209e-05, + "loss": 0.5351, + "step": 141 + }, + { + "epoch": 0.6887979384568743, + "grad_norm": 0.7449688014358767, + "learning_rate": 7.965112715371144e-05, + "loss": 0.5397, + "step": 142 + }, + { + "epoch": 0.6936486281643172, + "grad_norm": 0.5377305872108858, + "learning_rate": 7.96330346238429e-05, + "loss": 0.5346, + "step": 143 + }, + { + "epoch": 0.6984993178717599, + "grad_norm": 0.5856757070627496, + "learning_rate": 7.961448689928341e-05, + "loss": 0.5395, + "step": 144 + }, + { + "epoch": 0.7033500075792026, + "grad_norm": 0.6000325566823206, + "learning_rate": 7.959548419305796e-05, + "loss": 0.5447, + "step": 145 + }, + { + "epoch": 0.7082006972866455, + "grad_norm": 0.7819963257560868, + "learning_rate": 7.957602672341707e-05, + "loss": 0.5364, + "step": 146 + }, + { + "epoch": 0.7130513869940882, + "grad_norm": 1.1223449508846108, + "learning_rate": 7.955611471383433e-05, + "loss": 0.5381, + "step": 147 + }, + { + "epoch": 0.717902076701531, + "grad_norm": 1.1418981667975974, + "learning_rate": 7.953574839300385e-05, + "loss": 0.5381, + "step": 148 + }, + { + "epoch": 0.7227527664089738, + "grad_norm": 0.758286759296052, + "learning_rate": 7.95149279948376e-05, + "loss": 0.5398, + "step": 149 + }, + { + "epoch": 0.7276034561164165, + "grad_norm": 0.7637204957772546, + "learning_rate": 7.949365375846271e-05, + "loss": 0.5386, + "step": 150 + }, + { + "epoch": 0.7324541458238594, + "grad_norm": 0.6982030938329856, + "learning_rate": 7.94719259282188e-05, + "loss": 0.5328, + "step": 151 + }, + { + "epoch": 0.7373048355313021, + "grad_norm": 0.7115887055025976, + "learning_rate": 7.944974475365506e-05, + "loss": 0.5406, + "step": 152 + }, + { + "epoch": 0.7421555252387448, + "grad_norm": 0.6914212445412167, + "learning_rate": 7.94271104895275e-05, + "loss": 0.5375, + "step": 153 + }, + { + "epoch": 0.7470062149461877, + "grad_norm": 0.6376946136665823, + "learning_rate": 7.940402339579596e-05, + "loss": 0.5322, + "step": 154 + }, + { + "epoch": 0.7518569046536304, + "grad_norm": 0.662468788270689, + "learning_rate": 7.93804837376211e-05, + "loss": 0.5312, + "step": 155 + }, + { + "epoch": 0.7567075943610733, + "grad_norm": 0.8116591959883654, + "learning_rate": 7.935649178536142e-05, + "loss": 0.5362, + "step": 156 + }, + { + "epoch": 0.761558284068516, + "grad_norm": 1.2251954995336705, + "learning_rate": 7.93320478145701e-05, + "loss": 0.5454, + "step": 157 + }, + { + "epoch": 0.7664089737759587, + "grad_norm": 1.1753293382340935, + "learning_rate": 7.93071521059919e-05, + "loss": 0.5369, + "step": 158 + }, + { + "epoch": 0.7712596634834016, + "grad_norm": 0.5797209510428332, + "learning_rate": 7.928180494555983e-05, + "loss": 0.5255, + "step": 159 + }, + { + "epoch": 0.7761103531908443, + "grad_norm": 0.9260629876609666, + "learning_rate": 7.925600662439201e-05, + "loss": 0.535, + "step": 160 + }, + { + "epoch": 0.780961042898287, + "grad_norm": 1.2828815170548864, + "learning_rate": 7.922975743878817e-05, + "loss": 0.5293, + "step": 161 + }, + { + "epoch": 0.7858117326057299, + "grad_norm": 0.5171701751512903, + "learning_rate": 7.92030576902264e-05, + "loss": 0.5298, + "step": 162 + }, + { + "epoch": 0.7906624223131726, + "grad_norm": 0.9531992162184508, + "learning_rate": 7.917590768535952e-05, + "loss": 0.5315, + "step": 163 + }, + { + "epoch": 0.7955131120206155, + "grad_norm": 1.1106333536493764, + "learning_rate": 7.914830773601173e-05, + "loss": 0.5279, + "step": 164 + }, + { + "epoch": 0.8003638017280582, + "grad_norm": 0.45675301699833715, + "learning_rate": 7.912025815917489e-05, + "loss": 0.5372, + "step": 165 + }, + { + "epoch": 0.805214491435501, + "grad_norm": 0.7189143844280501, + "learning_rate": 7.909175927700499e-05, + "loss": 0.535, + "step": 166 + }, + { + "epoch": 0.8100651811429438, + "grad_norm": 0.8686823215812186, + "learning_rate": 7.906281141681839e-05, + "loss": 0.5333, + "step": 167 + }, + { + "epoch": 0.8149158708503865, + "grad_norm": 0.588440050652225, + "learning_rate": 7.903341491108798e-05, + "loss": 0.5289, + "step": 168 + }, + { + "epoch": 0.8197665605578294, + "grad_norm": 0.563873615495661, + "learning_rate": 7.900357009743958e-05, + "loss": 0.5331, + "step": 169 + }, + { + "epoch": 0.8246172502652721, + "grad_norm": 0.545022127050129, + "learning_rate": 7.897327731864784e-05, + "loss": 0.5266, + "step": 170 + }, + { + "epoch": 0.8294679399727148, + "grad_norm": 0.5592040867673563, + "learning_rate": 7.894253692263244e-05, + "loss": 0.522, + "step": 171 + }, + { + "epoch": 0.8343186296801577, + "grad_norm": 0.6324827822327501, + "learning_rate": 7.891134926245402e-05, + "loss": 0.5297, + "step": 172 + }, + { + "epoch": 0.8391693193876004, + "grad_norm": 0.8244822385641454, + "learning_rate": 7.887971469631016e-05, + "loss": 0.5319, + "step": 173 + }, + { + "epoch": 0.8440200090950432, + "grad_norm": 1.2087031591715138, + "learning_rate": 7.884763358753129e-05, + "loss": 0.5408, + "step": 174 + }, + { + "epoch": 0.848870698802486, + "grad_norm": 0.7427926592130248, + "learning_rate": 7.881510630457643e-05, + "loss": 0.5326, + "step": 175 + }, + { + "epoch": 0.8537213885099287, + "grad_norm": 0.5074413186000275, + "learning_rate": 7.878213322102908e-05, + "loss": 0.5281, + "step": 176 + }, + { + "epoch": 0.8585720782173716, + "grad_norm": 0.7191422226961306, + "learning_rate": 7.874871471559282e-05, + "loss": 0.5269, + "step": 177 + }, + { + "epoch": 0.8634227679248143, + "grad_norm": 0.7351841845171684, + "learning_rate": 7.8714851172087e-05, + "loss": 0.5326, + "step": 178 + }, + { + "epoch": 0.868273457632257, + "grad_norm": 0.661668481852005, + "learning_rate": 7.868054297944237e-05, + "loss": 0.5312, + "step": 179 + }, + { + "epoch": 0.8731241473396999, + "grad_norm": 0.6257843185205204, + "learning_rate": 7.864579053169657e-05, + "loss": 0.5265, + "step": 180 + }, + { + "epoch": 0.8779748370471426, + "grad_norm": 0.6272508186215946, + "learning_rate": 7.86105942279896e-05, + "loss": 0.5242, + "step": 181 + }, + { + "epoch": 0.8828255267545854, + "grad_norm": 0.5859524441087289, + "learning_rate": 7.857495447255925e-05, + "loss": 0.5117, + "step": 182 + }, + { + "epoch": 0.8876762164620282, + "grad_norm": 0.5314342493506371, + "learning_rate": 7.853887167473646e-05, + "loss": 0.5275, + "step": 183 + }, + { + "epoch": 0.892526906169471, + "grad_norm": 0.5894396606474899, + "learning_rate": 7.850234624894064e-05, + "loss": 0.5236, + "step": 184 + }, + { + "epoch": 0.8973775958769138, + "grad_norm": 0.7789309413273731, + "learning_rate": 7.846537861467485e-05, + "loss": 0.5269, + "step": 185 + }, + { + "epoch": 0.9022282855843565, + "grad_norm": 0.9749399305462054, + "learning_rate": 7.842796919652104e-05, + "loss": 0.5177, + "step": 186 + }, + { + "epoch": 0.9070789752917993, + "grad_norm": 0.8944031183061603, + "learning_rate": 7.839011842413514e-05, + "loss": 0.5236, + "step": 187 + }, + { + "epoch": 0.9119296649992421, + "grad_norm": 0.6072136307213187, + "learning_rate": 7.835182673224212e-05, + "loss": 0.5237, + "step": 188 + }, + { + "epoch": 0.9167803547066848, + "grad_norm": 0.44815995922956803, + "learning_rate": 7.831309456063107e-05, + "loss": 0.5193, + "step": 189 + }, + { + "epoch": 0.9216310444141277, + "grad_norm": 0.5362363058315522, + "learning_rate": 7.827392235415005e-05, + "loss": 0.5242, + "step": 190 + }, + { + "epoch": 0.9264817341215704, + "grad_norm": 0.5675209533538658, + "learning_rate": 7.823431056270103e-05, + "loss": 0.5223, + "step": 191 + }, + { + "epoch": 0.9313324238290132, + "grad_norm": 0.5087214285921436, + "learning_rate": 7.81942596412347e-05, + "loss": 0.522, + "step": 192 + }, + { + "epoch": 0.936183113536456, + "grad_norm": 0.46687413642954234, + "learning_rate": 7.815377004974532e-05, + "loss": 0.509, + "step": 193 + }, + { + "epoch": 0.9410338032438987, + "grad_norm": 0.43127006261715695, + "learning_rate": 7.811284225326529e-05, + "loss": 0.522, + "step": 194 + }, + { + "epoch": 0.9458844929513415, + "grad_norm": 0.43502529088952246, + "learning_rate": 7.807147672185996e-05, + "loss": 0.5258, + "step": 195 + }, + { + "epoch": 0.9507351826587843, + "grad_norm": 0.5247431038277521, + "learning_rate": 7.802967393062219e-05, + "loss": 0.524, + "step": 196 + }, + { + "epoch": 0.955585872366227, + "grad_norm": 0.6873590048364063, + "learning_rate": 7.798743435966676e-05, + "loss": 0.5227, + "step": 197 + }, + { + "epoch": 0.9604365620736699, + "grad_norm": 0.8978763261543932, + "learning_rate": 7.794475849412512e-05, + "loss": 0.5143, + "step": 198 + }, + { + "epoch": 0.9652872517811126, + "grad_norm": 0.8491329782406589, + "learning_rate": 7.790164682413954e-05, + "loss": 0.5186, + "step": 199 + }, + { + "epoch": 0.9701379414885554, + "grad_norm": 0.5004070361840594, + "learning_rate": 7.785809984485765e-05, + "loss": 0.5185, + "step": 200 + }, + { + "epoch": 0.9749886311959982, + "grad_norm": 0.4620691718653308, + "learning_rate": 7.781411805642675e-05, + "loss": 0.5179, + "step": 201 + }, + { + "epoch": 0.979839320903441, + "grad_norm": 0.6078145800613444, + "learning_rate": 7.776970196398795e-05, + "loss": 0.5185, + "step": 202 + }, + { + "epoch": 0.9846900106108837, + "grad_norm": 0.6744449960922595, + "learning_rate": 7.77248520776705e-05, + "loss": 0.5223, + "step": 203 + }, + { + "epoch": 0.9895407003183265, + "grad_norm": 0.769858159356013, + "learning_rate": 7.767956891258585e-05, + "loss": 0.514, + "step": 204 + }, + { + "epoch": 0.9943913900257693, + "grad_norm": 0.9703823352556248, + "learning_rate": 7.763385298882177e-05, + "loss": 0.5227, + "step": 205 + }, + { + "epoch": 0.9992420797332121, + "grad_norm": 1.0790500827883502, + "learning_rate": 7.758770483143634e-05, + "loss": 0.5161, + "step": 206 + }, + { + "epoch": 1.0048506897074427, + "grad_norm": 0.979399858326228, + "learning_rate": 7.754112497045198e-05, + "loss": 0.5126, + "step": 207 + }, + { + "epoch": 1.0097013794148855, + "grad_norm": 0.8061955074549858, + "learning_rate": 7.749411394084931e-05, + "loss": 0.5093, + "step": 208 + }, + { + "epoch": 1.0145520691223284, + "grad_norm": 0.769561002371883, + "learning_rate": 7.744667228256102e-05, + "loss": 0.5129, + "step": 209 + }, + { + "epoch": 1.0194027588297712, + "grad_norm": 0.7563794216226459, + "learning_rate": 7.739880054046567e-05, + "loss": 0.504, + "step": 210 + }, + { + "epoch": 1.024253448537214, + "grad_norm": 0.4861095042439798, + "learning_rate": 7.735049926438143e-05, + "loss": 0.5008, + "step": 211 + }, + { + "epoch": 1.0291041382446566, + "grad_norm": 0.521763707621908, + "learning_rate": 7.730176900905978e-05, + "loss": 0.5039, + "step": 212 + }, + { + "epoch": 1.0339548279520994, + "grad_norm": 0.6847654097095645, + "learning_rate": 7.725261033417914e-05, + "loss": 0.4987, + "step": 213 + }, + { + "epoch": 1.0388055176595423, + "grad_norm": 0.45617035587869154, + "learning_rate": 7.720302380433838e-05, + "loss": 0.5082, + "step": 214 + }, + { + "epoch": 1.043656207366985, + "grad_norm": 0.5136841747695677, + "learning_rate": 7.715300998905045e-05, + "loss": 0.4903, + "step": 215 + }, + { + "epoch": 1.0485068970744278, + "grad_norm": 0.5201029165395914, + "learning_rate": 7.710256946273572e-05, + "loss": 0.5061, + "step": 216 + }, + { + "epoch": 1.0533575867818705, + "grad_norm": 0.5369451831716502, + "learning_rate": 7.705170280471546e-05, + "loss": 0.4923, + "step": 217 + }, + { + "epoch": 1.0582082764893133, + "grad_norm": 0.5292650633659572, + "learning_rate": 7.700041059920516e-05, + "loss": 0.4958, + "step": 218 + }, + { + "epoch": 1.0630589661967562, + "grad_norm": 0.38347803199441816, + "learning_rate": 7.694869343530781e-05, + "loss": 0.4949, + "step": 219 + }, + { + "epoch": 1.067909655904199, + "grad_norm": 0.42205008813365347, + "learning_rate": 7.689655190700719e-05, + "loss": 0.4958, + "step": 220 + }, + { + "epoch": 1.0727603456116417, + "grad_norm": 0.43326896920779806, + "learning_rate": 7.684398661316092e-05, + "loss": 0.5034, + "step": 221 + }, + { + "epoch": 1.0776110353190844, + "grad_norm": 0.3610486041319715, + "learning_rate": 7.679099815749377e-05, + "loss": 0.508, + "step": 222 + }, + { + "epoch": 1.0824617250265272, + "grad_norm": 0.4631910613487445, + "learning_rate": 7.673758714859052e-05, + "loss": 0.5012, + "step": 223 + }, + { + "epoch": 1.08731241473397, + "grad_norm": 0.5933537887890846, + "learning_rate": 7.668375419988918e-05, + "loss": 0.5003, + "step": 224 + }, + { + "epoch": 1.0921631044414128, + "grad_norm": 0.7536616463697116, + "learning_rate": 7.662949992967375e-05, + "loss": 0.4984, + "step": 225 + }, + { + "epoch": 1.0970137941488556, + "grad_norm": 0.8908783317227219, + "learning_rate": 7.657482496106725e-05, + "loss": 0.499, + "step": 226 + }, + { + "epoch": 1.1018644838562983, + "grad_norm": 0.8949365262495667, + "learning_rate": 7.651972992202449e-05, + "loss": 0.4964, + "step": 227 + }, + { + "epoch": 1.106715173563741, + "grad_norm": 0.7666080530207662, + "learning_rate": 7.646421544532492e-05, + "loss": 0.501, + "step": 228 + }, + { + "epoch": 1.1115658632711838, + "grad_norm": 0.5974548399149405, + "learning_rate": 7.640828216856532e-05, + "loss": 0.5019, + "step": 229 + }, + { + "epoch": 1.1164165529786267, + "grad_norm": 0.5208576739553936, + "learning_rate": 7.635193073415246e-05, + "loss": 0.4954, + "step": 230 + }, + { + "epoch": 1.1212672426860695, + "grad_norm": 0.4449218126901089, + "learning_rate": 7.62951617892958e-05, + "loss": 0.4966, + "step": 231 + }, + { + "epoch": 1.1261179323935122, + "grad_norm": 0.3413546355163314, + "learning_rate": 7.623797598599995e-05, + "loss": 0.4869, + "step": 232 + }, + { + "epoch": 1.130968622100955, + "grad_norm": 0.4021494906350838, + "learning_rate": 7.618037398105728e-05, + "loss": 0.4876, + "step": 233 + }, + { + "epoch": 1.1358193118083977, + "grad_norm": 0.5401093810240136, + "learning_rate": 7.612235643604031e-05, + "loss": 0.495, + "step": 234 + }, + { + "epoch": 1.1406700015158404, + "grad_norm": 0.6450843987922678, + "learning_rate": 7.606392401729415e-05, + "loss": 0.4953, + "step": 235 + }, + { + "epoch": 1.1455206912232834, + "grad_norm": 0.6413460171528268, + "learning_rate": 7.600507739592879e-05, + "loss": 0.4972, + "step": 236 + }, + { + "epoch": 1.150371380930726, + "grad_norm": 0.6276158556341717, + "learning_rate": 7.594581724781152e-05, + "loss": 0.4957, + "step": 237 + }, + { + "epoch": 1.1552220706381688, + "grad_norm": 0.7553018024510589, + "learning_rate": 7.588614425355898e-05, + "loss": 0.4955, + "step": 238 + }, + { + "epoch": 1.1600727603456116, + "grad_norm": 0.8968837770832118, + "learning_rate": 7.582605909852951e-05, + "loss": 0.4937, + "step": 239 + }, + { + "epoch": 1.1649234500530543, + "grad_norm": 0.7618870978199445, + "learning_rate": 7.576556247281522e-05, + "loss": 0.4969, + "step": 240 + }, + { + "epoch": 1.1697741397604973, + "grad_norm": 0.6531717186517569, + "learning_rate": 7.570465507123401e-05, + "loss": 0.5042, + "step": 241 + }, + { + "epoch": 1.17462482946794, + "grad_norm": 0.591515239054212, + "learning_rate": 7.564333759332167e-05, + "loss": 0.4906, + "step": 242 + }, + { + "epoch": 1.1794755191753827, + "grad_norm": 0.49797581923871925, + "learning_rate": 7.558161074332379e-05, + "loss": 0.4966, + "step": 243 + }, + { + "epoch": 1.1843262088828255, + "grad_norm": 0.5865910810734263, + "learning_rate": 7.551947523018774e-05, + "loss": 0.4997, + "step": 244 + }, + { + "epoch": 1.1891768985902682, + "grad_norm": 0.5003536808662635, + "learning_rate": 7.54569317675544e-05, + "loss": 0.4954, + "step": 245 + }, + { + "epoch": 1.1940275882977112, + "grad_norm": 0.4328856052217075, + "learning_rate": 7.539398107375015e-05, + "loss": 0.4979, + "step": 246 + }, + { + "epoch": 1.198878278005154, + "grad_norm": 0.5623661241326378, + "learning_rate": 7.533062387177843e-05, + "loss": 0.4982, + "step": 247 + }, + { + "epoch": 1.2037289677125966, + "grad_norm": 0.542587238982675, + "learning_rate": 7.526686088931156e-05, + "loss": 0.4991, + "step": 248 + }, + { + "epoch": 1.2085796574200394, + "grad_norm": 0.4949553127282243, + "learning_rate": 7.520269285868235e-05, + "loss": 0.4908, + "step": 249 + }, + { + "epoch": 1.213430347127482, + "grad_norm": 0.39917468694971237, + "learning_rate": 7.513812051687564e-05, + "loss": 0.4917, + "step": 250 + }, + { + "epoch": 1.218281036834925, + "grad_norm": 0.44831825611716425, + "learning_rate": 7.507314460551993e-05, + "loss": 0.4898, + "step": 251 + }, + { + "epoch": 1.2231317265423678, + "grad_norm": 0.4694728642442923, + "learning_rate": 7.500776587087878e-05, + "loss": 0.4929, + "step": 252 + }, + { + "epoch": 1.2279824162498105, + "grad_norm": 0.4548469944052975, + "learning_rate": 7.494198506384229e-05, + "loss": 0.4826, + "step": 253 + }, + { + "epoch": 1.2328331059572533, + "grad_norm": 0.6666754202357293, + "learning_rate": 7.487580293991844e-05, + "loss": 0.5021, + "step": 254 + }, + { + "epoch": 1.237683795664696, + "grad_norm": 0.6791995766586792, + "learning_rate": 7.480922025922443e-05, + "loss": 0.4974, + "step": 255 + }, + { + "epoch": 1.242534485372139, + "grad_norm": 0.48795487898431833, + "learning_rate": 7.474223778647796e-05, + "loss": 0.4934, + "step": 256 + }, + { + "epoch": 1.2473851750795817, + "grad_norm": 0.32007742081193336, + "learning_rate": 7.467485629098842e-05, + "loss": 0.4907, + "step": 257 + }, + { + "epoch": 1.2522358647870244, + "grad_norm": 0.2948779105297471, + "learning_rate": 7.460707654664807e-05, + "loss": 0.4974, + "step": 258 + }, + { + "epoch": 1.2570865544944672, + "grad_norm": 0.2954711132741566, + "learning_rate": 7.453889933192316e-05, + "loss": 0.4893, + "step": 259 + }, + { + "epoch": 1.26193724420191, + "grad_norm": 0.3234156565448516, + "learning_rate": 7.447032542984502e-05, + "loss": 0.4882, + "step": 260 + }, + { + "epoch": 1.2667879339093528, + "grad_norm": 0.37736907562809757, + "learning_rate": 7.440135562800093e-05, + "loss": 0.487, + "step": 261 + }, + { + "epoch": 1.2716386236167956, + "grad_norm": 0.4380964102542513, + "learning_rate": 7.433199071852526e-05, + "loss": 0.4965, + "step": 262 + }, + { + "epoch": 1.2764893133242383, + "grad_norm": 0.5377640268616285, + "learning_rate": 7.426223149809023e-05, + "loss": 0.4922, + "step": 263 + }, + { + "epoch": 1.281340003031681, + "grad_norm": 0.5447192325063156, + "learning_rate": 7.419207876789685e-05, + "loss": 0.4844, + "step": 264 + }, + { + "epoch": 1.2861906927391238, + "grad_norm": 0.5569387883590096, + "learning_rate": 7.412153333366567e-05, + "loss": 0.4887, + "step": 265 + }, + { + "epoch": 1.2910413824465667, + "grad_norm": 0.6127559785319273, + "learning_rate": 7.405059600562751e-05, + "loss": 0.4974, + "step": 266 + }, + { + "epoch": 1.2958920721540095, + "grad_norm": 0.5372861059475705, + "learning_rate": 7.397926759851425e-05, + "loss": 0.4946, + "step": 267 + }, + { + "epoch": 1.3007427618614522, + "grad_norm": 0.3715441206816088, + "learning_rate": 7.390754893154933e-05, + "loss": 0.4914, + "step": 268 + }, + { + "epoch": 1.305593451568895, + "grad_norm": 0.3468457624853246, + "learning_rate": 7.383544082843846e-05, + "loss": 0.4906, + "step": 269 + }, + { + "epoch": 1.3104441412763377, + "grad_norm": 0.37917435116867076, + "learning_rate": 7.376294411736009e-05, + "loss": 0.4877, + "step": 270 + }, + { + "epoch": 1.3152948309837806, + "grad_norm": 0.44133896758740837, + "learning_rate": 7.369005963095596e-05, + "loss": 0.4962, + "step": 271 + }, + { + "epoch": 1.3201455206912232, + "grad_norm": 0.5453886771483799, + "learning_rate": 7.361678820632145e-05, + "loss": 0.4918, + "step": 272 + }, + { + "epoch": 1.324996210398666, + "grad_norm": 0.6036321305780495, + "learning_rate": 7.354313068499607e-05, + "loss": 0.4892, + "step": 273 + }, + { + "epoch": 1.3298469001061088, + "grad_norm": 0.620838391242342, + "learning_rate": 7.346908791295369e-05, + "loss": 0.495, + "step": 274 + }, + { + "epoch": 1.3346975898135516, + "grad_norm": 0.5848284090531766, + "learning_rate": 7.339466074059292e-05, + "loss": 0.4862, + "step": 275 + }, + { + "epoch": 1.3395482795209943, + "grad_norm": 0.5915616847361488, + "learning_rate": 7.331985002272726e-05, + "loss": 0.4986, + "step": 276 + }, + { + "epoch": 1.344398969228437, + "grad_norm": 0.5871009859314463, + "learning_rate": 7.324465661857534e-05, + "loss": 0.4868, + "step": 277 + }, + { + "epoch": 1.34924965893588, + "grad_norm": 0.4325881770640798, + "learning_rate": 7.316908139175105e-05, + "loss": 0.4886, + "step": 278 + }, + { + "epoch": 1.3541003486433227, + "grad_norm": 0.342133338929163, + "learning_rate": 7.309312521025356e-05, + "loss": 0.4909, + "step": 279 + }, + { + "epoch": 1.3589510383507655, + "grad_norm": 0.4415991996544984, + "learning_rate": 7.301678894645742e-05, + "loss": 0.4915, + "step": 280 + }, + { + "epoch": 1.3638017280582082, + "grad_norm": 0.510599069072842, + "learning_rate": 7.294007347710251e-05, + "loss": 0.4935, + "step": 281 + }, + { + "epoch": 1.368652417765651, + "grad_norm": 0.5220646005978747, + "learning_rate": 7.286297968328397e-05, + "loss": 0.4834, + "step": 282 + }, + { + "epoch": 1.373503107473094, + "grad_norm": 0.4836929320122624, + "learning_rate": 7.27855084504421e-05, + "loss": 0.4953, + "step": 283 + }, + { + "epoch": 1.3783537971805366, + "grad_norm": 0.4678184328008887, + "learning_rate": 7.270766066835217e-05, + "loss": 0.4872, + "step": 284 + }, + { + "epoch": 1.3832044868879794, + "grad_norm": 0.4479819209137706, + "learning_rate": 7.262943723111419e-05, + "loss": 0.4916, + "step": 285 + }, + { + "epoch": 1.388055176595422, + "grad_norm": 0.44661460126650243, + "learning_rate": 7.255083903714266e-05, + "loss": 0.4866, + "step": 286 + }, + { + "epoch": 1.3929058663028648, + "grad_norm": 0.46700839086853646, + "learning_rate": 7.247186698915625e-05, + "loss": 0.4879, + "step": 287 + }, + { + "epoch": 1.3977565560103078, + "grad_norm": 0.5111356334340853, + "learning_rate": 7.239252199416749e-05, + "loss": 0.4812, + "step": 288 + }, + { + "epoch": 1.4026072457177505, + "grad_norm": 0.5198819509993116, + "learning_rate": 7.23128049634722e-05, + "loss": 0.4809, + "step": 289 + }, + { + "epoch": 1.4074579354251933, + "grad_norm": 0.5071119674882796, + "learning_rate": 7.223271681263916e-05, + "loss": 0.4839, + "step": 290 + }, + { + "epoch": 1.412308625132636, + "grad_norm": 0.4871736388487796, + "learning_rate": 7.215225846149957e-05, + "loss": 0.4899, + "step": 291 + }, + { + "epoch": 1.4171593148400787, + "grad_norm": 0.4644477177967194, + "learning_rate": 7.207143083413643e-05, + "loss": 0.4865, + "step": 292 + }, + { + "epoch": 1.4220100045475217, + "grad_norm": 0.5305010693129898, + "learning_rate": 7.1990234858874e-05, + "loss": 0.4876, + "step": 293 + }, + { + "epoch": 1.4268606942549644, + "grad_norm": 0.5381812012245146, + "learning_rate": 7.190867146826707e-05, + "loss": 0.4936, + "step": 294 + }, + { + "epoch": 1.4317113839624072, + "grad_norm": 0.42926452605809334, + "learning_rate": 7.182674159909031e-05, + "loss": 0.4845, + "step": 295 + }, + { + "epoch": 1.43656207366985, + "grad_norm": 0.42959757228135126, + "learning_rate": 7.174444619232745e-05, + "loss": 0.4952, + "step": 296 + }, + { + "epoch": 1.4414127633772926, + "grad_norm": 0.4994771109955089, + "learning_rate": 7.166178619316056e-05, + "loss": 0.4912, + "step": 297 + }, + { + "epoch": 1.4462634530847356, + "grad_norm": 0.4676921077663137, + "learning_rate": 7.157876255095906e-05, + "loss": 0.4875, + "step": 298 + }, + { + "epoch": 1.4511141427921783, + "grad_norm": 0.430209471088095, + "learning_rate": 7.149537621926895e-05, + "loss": 0.4862, + "step": 299 + }, + { + "epoch": 1.455964832499621, + "grad_norm": 0.5267214852499816, + "learning_rate": 7.14116281558018e-05, + "loss": 0.4879, + "step": 300 + }, + { + "epoch": 1.4608155222070638, + "grad_norm": 0.5169308603441447, + "learning_rate": 7.132751932242376e-05, + "loss": 0.4984, + "step": 301 + }, + { + "epoch": 1.4656662119145065, + "grad_norm": 0.3435076728807633, + "learning_rate": 7.124305068514444e-05, + "loss": 0.487, + "step": 302 + }, + { + "epoch": 1.4705169016219495, + "grad_norm": 0.2662958717194974, + "learning_rate": 7.1158223214106e-05, + "loss": 0.4878, + "step": 303 + }, + { + "epoch": 1.4753675913293922, + "grad_norm": 0.31770648802942325, + "learning_rate": 7.107303788357177e-05, + "loss": 0.4819, + "step": 304 + }, + { + "epoch": 1.480218281036835, + "grad_norm": 0.29599579651368213, + "learning_rate": 7.098749567191527e-05, + "loss": 0.4852, + "step": 305 + }, + { + "epoch": 1.4850689707442777, + "grad_norm": 0.3093179833213525, + "learning_rate": 7.090159756160886e-05, + "loss": 0.4877, + "step": 306 + }, + { + "epoch": 1.4899196604517204, + "grad_norm": 0.38971280696993216, + "learning_rate": 7.081534453921242e-05, + "loss": 0.4852, + "step": 307 + }, + { + "epoch": 1.4947703501591634, + "grad_norm": 0.3825128078756503, + "learning_rate": 7.072873759536217e-05, + "loss": 0.4913, + "step": 308 + }, + { + "epoch": 1.499621039866606, + "grad_norm": 0.2886624346515238, + "learning_rate": 7.064177772475912e-05, + "loss": 0.4798, + "step": 309 + }, + { + "epoch": 1.5044717295740488, + "grad_norm": 0.3712678777863381, + "learning_rate": 7.05544659261578e-05, + "loss": 0.4867, + "step": 310 + }, + { + "epoch": 1.5093224192814916, + "grad_norm": 0.42331161544955054, + "learning_rate": 7.046680320235466e-05, + "loss": 0.4871, + "step": 311 + }, + { + "epoch": 1.5141731089889343, + "grad_norm": 0.4018226592697959, + "learning_rate": 7.037879056017663e-05, + "loss": 0.4842, + "step": 312 + }, + { + "epoch": 1.5190237986963773, + "grad_norm": 0.3959692369182176, + "learning_rate": 7.029042901046952e-05, + "loss": 0.4802, + "step": 313 + }, + { + "epoch": 1.5238744884038198, + "grad_norm": 0.4052319536586186, + "learning_rate": 7.020171956808645e-05, + "loss": 0.4859, + "step": 314 + }, + { + "epoch": 1.5287251781112627, + "grad_norm": 0.40673400305291324, + "learning_rate": 7.011266325187615e-05, + "loss": 0.496, + "step": 315 + }, + { + "epoch": 1.5335758678187055, + "grad_norm": 0.44258718402573904, + "learning_rate": 7.002326108467129e-05, + "loss": 0.4864, + "step": 316 + }, + { + "epoch": 1.5384265575261482, + "grad_norm": 0.4022422201093314, + "learning_rate": 6.993351409327672e-05, + "loss": 0.4763, + "step": 317 + }, + { + "epoch": 1.5432772472335912, + "grad_norm": 0.39107692009497685, + "learning_rate": 6.984342330845764e-05, + "loss": 0.4952, + "step": 318 + }, + { + "epoch": 1.5481279369410337, + "grad_norm": 0.36401667233363455, + "learning_rate": 6.975298976492785e-05, + "loss": 0.4952, + "step": 319 + }, + { + "epoch": 1.5529786266484766, + "grad_norm": 0.3964209144895704, + "learning_rate": 6.966221450133779e-05, + "loss": 0.4901, + "step": 320 + }, + { + "epoch": 1.5578293163559194, + "grad_norm": 0.41002635948711413, + "learning_rate": 6.957109856026261e-05, + "loss": 0.4917, + "step": 321 + }, + { + "epoch": 1.562680006063362, + "grad_norm": 0.33043042887382146, + "learning_rate": 6.94796429881903e-05, + "loss": 0.4771, + "step": 322 + }, + { + "epoch": 1.567530695770805, + "grad_norm": 0.3258167342621945, + "learning_rate": 6.938784883550948e-05, + "loss": 0.4889, + "step": 323 + }, + { + "epoch": 1.5723813854782476, + "grad_norm": 0.33864970777234993, + "learning_rate": 6.929571715649755e-05, + "loss": 0.4866, + "step": 324 + }, + { + "epoch": 1.5772320751856905, + "grad_norm": 0.3799335436470155, + "learning_rate": 6.920324900930842e-05, + "loss": 0.4907, + "step": 325 + }, + { + "epoch": 1.5820827648931333, + "grad_norm": 0.38649667346458383, + "learning_rate": 6.911044545596042e-05, + "loss": 0.4854, + "step": 326 + }, + { + "epoch": 1.586933454600576, + "grad_norm": 0.3332457174533195, + "learning_rate": 6.901730756232411e-05, + "loss": 0.4895, + "step": 327 + }, + { + "epoch": 1.591784144308019, + "grad_norm": 0.3688581464993942, + "learning_rate": 6.892383639811005e-05, + "loss": 0.4958, + "step": 328 + }, + { + "epoch": 1.5966348340154615, + "grad_norm": 0.43127701691860393, + "learning_rate": 6.883003303685644e-05, + "loss": 0.4844, + "step": 329 + }, + { + "epoch": 1.6014855237229044, + "grad_norm": 0.5098788849460419, + "learning_rate": 6.87358985559169e-05, + "loss": 0.489, + "step": 330 + }, + { + "epoch": 1.6063362134303472, + "grad_norm": 0.531466303384909, + "learning_rate": 6.864143403644797e-05, + "loss": 0.4945, + "step": 331 + }, + { + "epoch": 1.61118690313779, + "grad_norm": 0.4575057116450561, + "learning_rate": 6.85466405633968e-05, + "loss": 0.4855, + "step": 332 + }, + { + "epoch": 1.6160375928452326, + "grad_norm": 0.42418027914564915, + "learning_rate": 6.845151922548865e-05, + "loss": 0.4783, + "step": 333 + }, + { + "epoch": 1.6208882825526754, + "grad_norm": 0.38431703300530295, + "learning_rate": 6.835607111521439e-05, + "loss": 0.4796, + "step": 334 + }, + { + "epoch": 1.6257389722601183, + "grad_norm": 0.325044588754403, + "learning_rate": 6.826029732881793e-05, + "loss": 0.4928, + "step": 335 + }, + { + "epoch": 1.630589661967561, + "grad_norm": 0.2723847494193817, + "learning_rate": 6.816419896628363e-05, + "loss": 0.4851, + "step": 336 + }, + { + "epoch": 1.6354403516750038, + "grad_norm": 0.25325170865464947, + "learning_rate": 6.806777713132374e-05, + "loss": 0.4826, + "step": 337 + }, + { + "epoch": 1.6402910413824465, + "grad_norm": 0.2793387163645126, + "learning_rate": 6.79710329313656e-05, + "loss": 0.4873, + "step": 338 + }, + { + "epoch": 1.6451417310898893, + "grad_norm": 0.38835730960557174, + "learning_rate": 6.787396747753903e-05, + "loss": 0.4744, + "step": 339 + }, + { + "epoch": 1.6499924207973322, + "grad_norm": 0.5896470389457479, + "learning_rate": 6.777658188466354e-05, + "loss": 0.4765, + "step": 340 + }, + { + "epoch": 1.654843110504775, + "grad_norm": 0.7717199781637745, + "learning_rate": 6.767887727123544e-05, + "loss": 0.4931, + "step": 341 + }, + { + "epoch": 1.6596938002122177, + "grad_norm": 1.0491183054565791, + "learning_rate": 6.758085475941516e-05, + "loss": 0.4875, + "step": 342 + }, + { + "epoch": 1.6645444899196604, + "grad_norm": 1.0963514331569248, + "learning_rate": 6.748251547501418e-05, + "loss": 0.4783, + "step": 343 + }, + { + "epoch": 1.6693951796271032, + "grad_norm": 0.6008540810802777, + "learning_rate": 6.738386054748226e-05, + "loss": 0.4836, + "step": 344 + }, + { + "epoch": 1.674245869334546, + "grad_norm": 0.4448291346545642, + "learning_rate": 6.728489110989434e-05, + "loss": 0.4883, + "step": 345 + }, + { + "epoch": 1.6790965590419886, + "grad_norm": 0.4942617693141126, + "learning_rate": 6.718560829893762e-05, + "loss": 0.4799, + "step": 346 + }, + { + "epoch": 1.6839472487494316, + "grad_norm": 0.4996733158915889, + "learning_rate": 6.708601325489844e-05, + "loss": 0.4872, + "step": 347 + }, + { + "epoch": 1.6887979384568743, + "grad_norm": 0.3715020675799419, + "learning_rate": 6.698610712164924e-05, + "loss": 0.4864, + "step": 348 + }, + { + "epoch": 1.693648628164317, + "grad_norm": 0.27977348496462506, + "learning_rate": 6.688589104663536e-05, + "loss": 0.4731, + "step": 349 + }, + { + "epoch": 1.69849931787176, + "grad_norm": 0.3329757061053683, + "learning_rate": 6.67853661808619e-05, + "loss": 0.4771, + "step": 350 + }, + { + "epoch": 1.7033500075792025, + "grad_norm": 0.35849519050184514, + "learning_rate": 6.668453367888052e-05, + "loss": 0.4867, + "step": 351 + }, + { + "epoch": 1.7082006972866455, + "grad_norm": 0.3093064728603477, + "learning_rate": 6.658339469877613e-05, + "loss": 0.478, + "step": 352 + }, + { + "epoch": 1.7130513869940882, + "grad_norm": 0.2983932071893944, + "learning_rate": 6.64819504021536e-05, + "loss": 0.4814, + "step": 353 + }, + { + "epoch": 1.717902076701531, + "grad_norm": 0.32895472335219694, + "learning_rate": 6.638020195412448e-05, + "loss": 0.4771, + "step": 354 + }, + { + "epoch": 1.722752766408974, + "grad_norm": 0.4277599821762847, + "learning_rate": 6.627815052329354e-05, + "loss": 0.4925, + "step": 355 + }, + { + "epoch": 1.7276034561164164, + "grad_norm": 0.4690652488456737, + "learning_rate": 6.617579728174535e-05, + "loss": 0.4854, + "step": 356 + }, + { + "epoch": 1.7324541458238594, + "grad_norm": 0.43487992599318925, + "learning_rate": 6.60731434050309e-05, + "loss": 0.4777, + "step": 357 + }, + { + "epoch": 1.737304835531302, + "grad_norm": 0.4398837483674929, + "learning_rate": 6.597019007215401e-05, + "loss": 0.4783, + "step": 358 + }, + { + "epoch": 1.7421555252387448, + "grad_norm": 0.43050412759021583, + "learning_rate": 6.586693846555788e-05, + "loss": 0.4743, + "step": 359 + }, + { + "epoch": 1.7470062149461878, + "grad_norm": 0.40202174280112624, + "learning_rate": 6.576338977111134e-05, + "loss": 0.48, + "step": 360 + }, + { + "epoch": 1.7518569046536303, + "grad_norm": 0.36259944082265505, + "learning_rate": 6.565954517809543e-05, + "loss": 0.4747, + "step": 361 + }, + { + "epoch": 1.7567075943610733, + "grad_norm": 0.28300782787905476, + "learning_rate": 6.555540587918968e-05, + "loss": 0.4778, + "step": 362 + }, + { + "epoch": 1.761558284068516, + "grad_norm": 0.27286805994349533, + "learning_rate": 6.545097307045831e-05, + "loss": 0.4795, + "step": 363 + }, + { + "epoch": 1.7664089737759587, + "grad_norm": 0.31934491384929364, + "learning_rate": 6.534624795133662e-05, + "loss": 0.4851, + "step": 364 + }, + { + "epoch": 1.7712596634834017, + "grad_norm": 0.35245692182661065, + "learning_rate": 6.524123172461711e-05, + "loss": 0.4794, + "step": 365 + }, + { + "epoch": 1.7761103531908442, + "grad_norm": 0.3396944161317505, + "learning_rate": 6.51359255964358e-05, + "loss": 0.4774, + "step": 366 + }, + { + "epoch": 1.7809610428982872, + "grad_norm": 0.2877754553279699, + "learning_rate": 6.503033077625824e-05, + "loss": 0.4746, + "step": 367 + }, + { + "epoch": 1.78581173260573, + "grad_norm": 0.3326775146217252, + "learning_rate": 6.492444847686566e-05, + "loss": 0.4849, + "step": 368 + }, + { + "epoch": 1.7906624223131726, + "grad_norm": 0.419702080624426, + "learning_rate": 6.481827991434111e-05, + "loss": 0.4814, + "step": 369 + }, + { + "epoch": 1.7955131120206156, + "grad_norm": 0.43780909545325103, + "learning_rate": 6.471182630805538e-05, + "loss": 0.4813, + "step": 370 + }, + { + "epoch": 1.800363801728058, + "grad_norm": 0.5080371772111751, + "learning_rate": 6.460508888065314e-05, + "loss": 0.4865, + "step": 371 + }, + { + "epoch": 1.805214491435501, + "grad_norm": 0.5541771901573003, + "learning_rate": 6.449806885803873e-05, + "loss": 0.4752, + "step": 372 + }, + { + "epoch": 1.8100651811429438, + "grad_norm": 0.5077930985424878, + "learning_rate": 6.439076746936219e-05, + "loss": 0.4776, + "step": 373 + }, + { + "epoch": 1.8149158708503865, + "grad_norm": 0.3974055597915673, + "learning_rate": 6.428318594700509e-05, + "loss": 0.4833, + "step": 374 + }, + { + "epoch": 1.8197665605578295, + "grad_norm": 0.27838793632255576, + "learning_rate": 6.417532552656647e-05, + "loss": 0.4808, + "step": 375 + }, + { + "epoch": 1.824617250265272, + "grad_norm": 0.25531453372215107, + "learning_rate": 6.406718744684851e-05, + "loss": 0.475, + "step": 376 + }, + { + "epoch": 1.829467939972715, + "grad_norm": 0.37619306197372576, + "learning_rate": 6.395877294984241e-05, + "loss": 0.4718, + "step": 377 + }, + { + "epoch": 1.8343186296801577, + "grad_norm": 0.45314622671289495, + "learning_rate": 6.385008328071406e-05, + "loss": 0.4858, + "step": 378 + }, + { + "epoch": 1.8391693193876004, + "grad_norm": 0.4091697946782105, + "learning_rate": 6.374111968778982e-05, + "loss": 0.4797, + "step": 379 + }, + { + "epoch": 1.8440200090950432, + "grad_norm": 0.31229108750141443, + "learning_rate": 6.363188342254206e-05, + "loss": 0.4819, + "step": 380 + }, + { + "epoch": 1.848870698802486, + "grad_norm": 0.29389799920114323, + "learning_rate": 6.352237573957488e-05, + "loss": 0.4777, + "step": 381 + }, + { + "epoch": 1.8537213885099288, + "grad_norm": 0.31830405845533455, + "learning_rate": 6.341259789660969e-05, + "loss": 0.4812, + "step": 382 + }, + { + "epoch": 1.8585720782173716, + "grad_norm": 0.2783419658252336, + "learning_rate": 6.330255115447076e-05, + "loss": 0.4722, + "step": 383 + }, + { + "epoch": 1.8634227679248143, + "grad_norm": 0.252195902565345, + "learning_rate": 6.319223677707069e-05, + "loss": 0.4786, + "step": 384 + }, + { + "epoch": 1.868273457632257, + "grad_norm": 0.24931429544692238, + "learning_rate": 6.308165603139598e-05, + "loss": 0.4766, + "step": 385 + }, + { + "epoch": 1.8731241473396998, + "grad_norm": 0.343056469344131, + "learning_rate": 6.29708101874924e-05, + "loss": 0.4746, + "step": 386 + }, + { + "epoch": 1.8779748370471427, + "grad_norm": 0.39163026769861153, + "learning_rate": 6.285970051845045e-05, + "loss": 0.4777, + "step": 387 + }, + { + "epoch": 1.8828255267545853, + "grad_norm": 0.3925083138992103, + "learning_rate": 6.274832830039071e-05, + "loss": 0.4762, + "step": 388 + }, + { + "epoch": 1.8876762164620282, + "grad_norm": 0.3908015146094751, + "learning_rate": 6.26366948124492e-05, + "loss": 0.4882, + "step": 389 + }, + { + "epoch": 1.892526906169471, + "grad_norm": 0.38768255703534454, + "learning_rate": 6.25248013367627e-05, + "loss": 0.4746, + "step": 390 + }, + { + "epoch": 1.8973775958769137, + "grad_norm": 0.34797592572865116, + "learning_rate": 6.241264915845401e-05, + "loss": 0.4863, + "step": 391 + }, + { + "epoch": 1.9022282855843566, + "grad_norm": 0.2939167601152598, + "learning_rate": 6.230023956561716e-05, + "loss": 0.4803, + "step": 392 + }, + { + "epoch": 1.9070789752917991, + "grad_norm": 0.2683598696324213, + "learning_rate": 6.218757384930268e-05, + "loss": 0.4769, + "step": 393 + }, + { + "epoch": 1.911929664999242, + "grad_norm": 0.2963955328357841, + "learning_rate": 6.207465330350273e-05, + "loss": 0.4798, + "step": 394 + }, + { + "epoch": 1.9167803547066848, + "grad_norm": 0.34936564317737695, + "learning_rate": 6.196147922513623e-05, + "loss": 0.479, + "step": 395 + }, + { + "epoch": 1.9216310444141276, + "grad_norm": 0.3023947037005716, + "learning_rate": 6.184805291403402e-05, + "loss": 0.4776, + "step": 396 + }, + { + "epoch": 1.9264817341215705, + "grad_norm": 0.23472105439779495, + "learning_rate": 6.173437567292383e-05, + "loss": 0.475, + "step": 397 + }, + { + "epoch": 1.931332423829013, + "grad_norm": 0.30151702935680424, + "learning_rate": 6.162044880741544e-05, + "loss": 0.4719, + "step": 398 + }, + { + "epoch": 1.936183113536456, + "grad_norm": 0.4380813843564537, + "learning_rate": 6.150627362598557e-05, + "loss": 0.4871, + "step": 399 + }, + { + "epoch": 1.9410338032438987, + "grad_norm": 0.5034940901090467, + "learning_rate": 6.139185143996298e-05, + "loss": 0.4806, + "step": 400 + }, + { + "epoch": 1.9458844929513415, + "grad_norm": 0.44831770290541656, + "learning_rate": 6.127718356351326e-05, + "loss": 0.478, + "step": 401 + }, + { + "epoch": 1.9507351826587844, + "grad_norm": 0.3881020850233725, + "learning_rate": 6.116227131362385e-05, + "loss": 0.4714, + "step": 402 + }, + { + "epoch": 1.955585872366227, + "grad_norm": 0.3382903208345561, + "learning_rate": 6.104711601008888e-05, + "loss": 0.4779, + "step": 403 + }, + { + "epoch": 1.96043656207367, + "grad_norm": 0.2830781275191087, + "learning_rate": 6.0931718975493985e-05, + "loss": 0.4846, + "step": 404 + }, + { + "epoch": 1.9652872517811126, + "grad_norm": 0.27767803820547865, + "learning_rate": 6.081608153520117e-05, + "loss": 0.4691, + "step": 405 + }, + { + "epoch": 1.9701379414885554, + "grad_norm": 0.35527234014372044, + "learning_rate": 6.0700205017333525e-05, + "loss": 0.4787, + "step": 406 + }, + { + "epoch": 1.9749886311959983, + "grad_norm": 0.34300192919407774, + "learning_rate": 6.058409075276002e-05, + "loss": 0.4689, + "step": 407 + }, + { + "epoch": 1.9798393209034408, + "grad_norm": 0.2964726842271146, + "learning_rate": 6.046774007508019e-05, + "loss": 0.475, + "step": 408 + }, + { + "epoch": 1.9846900106108838, + "grad_norm": 0.2502113324820329, + "learning_rate": 6.035115432060883e-05, + "loss": 0.4747, + "step": 409 + }, + { + "epoch": 1.9895407003183265, + "grad_norm": 0.23471156048166733, + "learning_rate": 6.0234334828360655e-05, + "loss": 0.4786, + "step": 410 + }, + { + "epoch": 1.9943913900257693, + "grad_norm": 0.27137410563019304, + "learning_rate": 6.011728294003494e-05, + "loss": 0.4802, + "step": 411 + }, + { + "epoch": 1.9992420797332122, + "grad_norm": 0.2960970008273601, + "learning_rate": 6.000000000000001e-05, + "loss": 0.4768, + "step": 412 + }, + { + "epoch": 2.004850689707443, + "grad_norm": 0.33644070901215145, + "learning_rate": 5.988248735527793e-05, + "loss": 0.4473, + "step": 413 + }, + { + "epoch": 2.0097013794148855, + "grad_norm": 0.39546749871672404, + "learning_rate": 5.9764746355528994e-05, + "loss": 0.4501, + "step": 414 + }, + { + "epoch": 2.0145520691223284, + "grad_norm": 0.47967552460987467, + "learning_rate": 5.964677835303615e-05, + "loss": 0.4483, + "step": 415 + }, + { + "epoch": 2.019402758829771, + "grad_norm": 0.43081443925289625, + "learning_rate": 5.952858470268955e-05, + "loss": 0.4468, + "step": 416 + }, + { + "epoch": 2.024253448537214, + "grad_norm": 0.42692273173821377, + "learning_rate": 5.941016676197098e-05, + "loss": 0.4499, + "step": 417 + }, + { + "epoch": 2.029104138244657, + "grad_norm": 0.5203095933335755, + "learning_rate": 5.929152589093825e-05, + "loss": 0.4498, + "step": 418 + }, + { + "epoch": 2.0339548279520994, + "grad_norm": 0.5390774215298352, + "learning_rate": 5.9172663452209554e-05, + "loss": 0.449, + "step": 419 + }, + { + "epoch": 2.0388055176595423, + "grad_norm": 0.5618164866931807, + "learning_rate": 5.9053580810947845e-05, + "loss": 0.4555, + "step": 420 + }, + { + "epoch": 2.043656207366985, + "grad_norm": 0.6473211411897097, + "learning_rate": 5.89342793348452e-05, + "loss": 0.4537, + "step": 421 + }, + { + "epoch": 2.048506897074428, + "grad_norm": 0.7641174380933736, + "learning_rate": 5.881476039410699e-05, + "loss": 0.4579, + "step": 422 + }, + { + "epoch": 2.0533575867818707, + "grad_norm": 0.6589276143277975, + "learning_rate": 5.869502536143629e-05, + "loss": 0.4478, + "step": 423 + }, + { + "epoch": 2.0582082764893133, + "grad_norm": 0.4055360078631115, + "learning_rate": 5.857507561201802e-05, + "loss": 0.4501, + "step": 424 + }, + { + "epoch": 2.063058966196756, + "grad_norm": 0.3576976481492298, + "learning_rate": 5.845491252350312e-05, + "loss": 0.4479, + "step": 425 + }, + { + "epoch": 2.0679096559041987, + "grad_norm": 0.444390387775824, + "learning_rate": 5.833453747599286e-05, + "loss": 0.4466, + "step": 426 + }, + { + "epoch": 2.0727603456116417, + "grad_norm": 0.38706062123939283, + "learning_rate": 5.821395185202285e-05, + "loss": 0.449, + "step": 427 + }, + { + "epoch": 2.0776110353190846, + "grad_norm": 0.3243650769978332, + "learning_rate": 5.809315703654726e-05, + "loss": 0.4581, + "step": 428 + }, + { + "epoch": 2.082461725026527, + "grad_norm": 0.35862489527477903, + "learning_rate": 5.797215441692284e-05, + "loss": 0.4534, + "step": 429 + }, + { + "epoch": 2.08731241473397, + "grad_norm": 0.3353344776943914, + "learning_rate": 5.785094538289304e-05, + "loss": 0.4537, + "step": 430 + }, + { + "epoch": 2.0921631044414126, + "grad_norm": 0.3620686259692887, + "learning_rate": 5.772953132657202e-05, + "loss": 0.4553, + "step": 431 + }, + { + "epoch": 2.0970137941488556, + "grad_norm": 0.307403523851727, + "learning_rate": 5.7607913642428666e-05, + "loss": 0.4424, + "step": 432 + }, + { + "epoch": 2.101864483856298, + "grad_norm": 0.28710201149568576, + "learning_rate": 5.7486093727270606e-05, + "loss": 0.4462, + "step": 433 + }, + { + "epoch": 2.106715173563741, + "grad_norm": 0.31451691469735704, + "learning_rate": 5.736407298022809e-05, + "loss": 0.4434, + "step": 434 + }, + { + "epoch": 2.111565863271184, + "grad_norm": 0.3105010146819863, + "learning_rate": 5.7241852802738e-05, + "loss": 0.4533, + "step": 435 + }, + { + "epoch": 2.1164165529786265, + "grad_norm": 0.2878408032383936, + "learning_rate": 5.711943459852772e-05, + "loss": 0.4427, + "step": 436 + }, + { + "epoch": 2.1212672426860695, + "grad_norm": 0.3026608573456508, + "learning_rate": 5.699681977359902e-05, + "loss": 0.4385, + "step": 437 + }, + { + "epoch": 2.1261179323935124, + "grad_norm": 0.2857208984253648, + "learning_rate": 5.6874009736211896e-05, + "loss": 0.4465, + "step": 438 + }, + { + "epoch": 2.130968622100955, + "grad_norm": 0.28786201316205207, + "learning_rate": 5.675100589686839e-05, + "loss": 0.4472, + "step": 439 + }, + { + "epoch": 2.135819311808398, + "grad_norm": 0.3397455432854385, + "learning_rate": 5.662780966829646e-05, + "loss": 0.4486, + "step": 440 + }, + { + "epoch": 2.1406700015158404, + "grad_norm": 0.3060713829784068, + "learning_rate": 5.650442246543364e-05, + "loss": 0.4525, + "step": 441 + }, + { + "epoch": 2.1455206912232834, + "grad_norm": 0.2554715156912105, + "learning_rate": 5.638084570541088e-05, + "loss": 0.4451, + "step": 442 + }, + { + "epoch": 2.150371380930726, + "grad_norm": 0.31763468046624377, + "learning_rate": 5.625708080753621e-05, + "loss": 0.455, + "step": 443 + }, + { + "epoch": 2.155222070638169, + "grad_norm": 0.3288505103534938, + "learning_rate": 5.6133129193278525e-05, + "loss": 0.4453, + "step": 444 + }, + { + "epoch": 2.160072760345612, + "grad_norm": 0.27302062189682574, + "learning_rate": 5.600899228625112e-05, + "loss": 0.4523, + "step": 445 + }, + { + "epoch": 2.1649234500530543, + "grad_norm": 0.2367917713116079, + "learning_rate": 5.588467151219549e-05, + "loss": 0.4481, + "step": 446 + }, + { + "epoch": 2.1697741397604973, + "grad_norm": 0.27892881990044693, + "learning_rate": 5.5760168298964874e-05, + "loss": 0.4397, + "step": 447 + }, + { + "epoch": 2.17462482946794, + "grad_norm": 0.3659363982261399, + "learning_rate": 5.563548407650782e-05, + "loss": 0.4464, + "step": 448 + }, + { + "epoch": 2.1794755191753827, + "grad_norm": 0.3139974928184246, + "learning_rate": 5.551062027685187e-05, + "loss": 0.4487, + "step": 449 + }, + { + "epoch": 2.1843262088828257, + "grad_norm": 0.25894377780084493, + "learning_rate": 5.5385578334087006e-05, + "loss": 0.4481, + "step": 450 + }, + { + "epoch": 2.189176898590268, + "grad_norm": 0.17951964246489394, + "learning_rate": 5.526035968434927e-05, + "loss": 0.4469, + "step": 451 + }, + { + "epoch": 2.194027588297711, + "grad_norm": 0.21554515294483917, + "learning_rate": 5.513496576580418e-05, + "loss": 0.4573, + "step": 452 + }, + { + "epoch": 2.1988782780051537, + "grad_norm": 0.24799983544152385, + "learning_rate": 5.5009398018630276e-05, + "loss": 0.4498, + "step": 453 + }, + { + "epoch": 2.2037289677125966, + "grad_norm": 0.186973375547793, + "learning_rate": 5.4883657885002575e-05, + "loss": 0.4449, + "step": 454 + }, + { + "epoch": 2.2085796574200396, + "grad_norm": 0.1888483688795653, + "learning_rate": 5.475774680907597e-05, + "loss": 0.443, + "step": 455 + }, + { + "epoch": 2.213430347127482, + "grad_norm": 0.18914695692387654, + "learning_rate": 5.463166623696868e-05, + "loss": 0.4434, + "step": 456 + }, + { + "epoch": 2.218281036834925, + "grad_norm": 0.19070268199404652, + "learning_rate": 5.450541761674562e-05, + "loss": 0.4445, + "step": 457 + }, + { + "epoch": 2.2231317265423676, + "grad_norm": 0.2259939851217927, + "learning_rate": 5.437900239840179e-05, + "loss": 0.4465, + "step": 458 + }, + { + "epoch": 2.2279824162498105, + "grad_norm": 0.18023421500987896, + "learning_rate": 5.42524220338456e-05, + "loss": 0.4453, + "step": 459 + }, + { + "epoch": 2.2328331059572535, + "grad_norm": 0.16598518940751159, + "learning_rate": 5.412567797688219e-05, + "loss": 0.4498, + "step": 460 + }, + { + "epoch": 2.237683795664696, + "grad_norm": 0.16004882092407235, + "learning_rate": 5.3998771683196754e-05, + "loss": 0.4527, + "step": 461 + }, + { + "epoch": 2.242534485372139, + "grad_norm": 0.17890202722776521, + "learning_rate": 5.3871704610337836e-05, + "loss": 0.4444, + "step": 462 + }, + { + "epoch": 2.2473851750795815, + "grad_norm": 0.182744670257566, + "learning_rate": 5.374447821770053e-05, + "loss": 0.4431, + "step": 463 + }, + { + "epoch": 2.2522358647870244, + "grad_norm": 0.19342699163866056, + "learning_rate": 5.361709396650977e-05, + "loss": 0.4404, + "step": 464 + }, + { + "epoch": 2.2570865544944674, + "grad_norm": 0.20442779398031627, + "learning_rate": 5.3489553319803566e-05, + "loss": 0.4496, + "step": 465 + }, + { + "epoch": 2.26193724420191, + "grad_norm": 0.23359410284964036, + "learning_rate": 5.336185774241609e-05, + "loss": 0.4469, + "step": 466 + }, + { + "epoch": 2.266787933909353, + "grad_norm": 0.23295417695606166, + "learning_rate": 5.3234008700961e-05, + "loss": 0.4505, + "step": 467 + }, + { + "epoch": 2.2716386236167954, + "grad_norm": 0.20207094824496044, + "learning_rate": 5.3106007663814505e-05, + "loss": 0.4406, + "step": 468 + }, + { + "epoch": 2.2764893133242383, + "grad_norm": 0.1850252157104855, + "learning_rate": 5.2977856101098484e-05, + "loss": 0.4525, + "step": 469 + }, + { + "epoch": 2.281340003031681, + "grad_norm": 0.1821206965545461, + "learning_rate": 5.284955548466371e-05, + "loss": 0.4592, + "step": 470 + }, + { + "epoch": 2.286190692739124, + "grad_norm": 0.1913435003815255, + "learning_rate": 5.272110728807279e-05, + "loss": 0.4459, + "step": 471 + }, + { + "epoch": 2.2910413824465667, + "grad_norm": 0.17908151714339782, + "learning_rate": 5.25925129865834e-05, + "loss": 0.4523, + "step": 472 + }, + { + "epoch": 2.2958920721540093, + "grad_norm": 0.17796456682985312, + "learning_rate": 5.246377405713121e-05, + "loss": 0.4426, + "step": 473 + }, + { + "epoch": 2.300742761861452, + "grad_norm": 0.16950491734508644, + "learning_rate": 5.2334891978313006e-05, + "loss": 0.4426, + "step": 474 + }, + { + "epoch": 2.305593451568895, + "grad_norm": 0.18036359667208995, + "learning_rate": 5.220586823036966e-05, + "loss": 0.4458, + "step": 475 + }, + { + "epoch": 2.3104441412763377, + "grad_norm": 0.1873060682555774, + "learning_rate": 5.207670429516915e-05, + "loss": 0.4433, + "step": 476 + }, + { + "epoch": 2.3152948309837806, + "grad_norm": 0.1986452939709168, + "learning_rate": 5.1947401656189546e-05, + "loss": 0.4593, + "step": 477 + }, + { + "epoch": 2.320145520691223, + "grad_norm": 0.20494449288937291, + "learning_rate": 5.181796179850197e-05, + "loss": 0.4424, + "step": 478 + }, + { + "epoch": 2.324996210398666, + "grad_norm": 0.17952910191793728, + "learning_rate": 5.168838620875352e-05, + "loss": 0.4503, + "step": 479 + }, + { + "epoch": 2.3298469001061086, + "grad_norm": 0.1909701609269039, + "learning_rate": 5.155867637515019e-05, + "loss": 0.4506, + "step": 480 + }, + { + "epoch": 2.3346975898135516, + "grad_norm": 0.1838298898954926, + "learning_rate": 5.142883378743984e-05, + "loss": 0.4513, + "step": 481 + }, + { + "epoch": 2.3395482795209945, + "grad_norm": 0.1818267641683358, + "learning_rate": 5.129885993689502e-05, + "loss": 0.4488, + "step": 482 + }, + { + "epoch": 2.344398969228437, + "grad_norm": 0.21197375880432345, + "learning_rate": 5.116875631629585e-05, + "loss": 0.4456, + "step": 483 + }, + { + "epoch": 2.34924965893588, + "grad_norm": 0.21240893965447508, + "learning_rate": 5.10385244199129e-05, + "loss": 0.4386, + "step": 484 + }, + { + "epoch": 2.354100348643323, + "grad_norm": 0.19244612255162405, + "learning_rate": 5.0908165743490047e-05, + "loss": 0.4482, + "step": 485 + }, + { + "epoch": 2.3589510383507655, + "grad_norm": 0.22440529731925618, + "learning_rate": 5.0777681784227224e-05, + "loss": 0.4496, + "step": 486 + }, + { + "epoch": 2.3638017280582084, + "grad_norm": 0.249440062974833, + "learning_rate": 5.064707404076327e-05, + "loss": 0.4502, + "step": 487 + }, + { + "epoch": 2.368652417765651, + "grad_norm": 0.2374206142112278, + "learning_rate": 5.051634401315875e-05, + "loss": 0.448, + "step": 488 + }, + { + "epoch": 2.373503107473094, + "grad_norm": 0.21044332969367502, + "learning_rate": 5.0385493202878656e-05, + "loss": 0.4416, + "step": 489 + }, + { + "epoch": 2.3783537971805364, + "grad_norm": 0.15343545111269605, + "learning_rate": 5.025452311277522e-05, + "loss": 0.4413, + "step": 490 + }, + { + "epoch": 2.3832044868879794, + "grad_norm": 0.17472771019103053, + "learning_rate": 5.01234352470706e-05, + "loss": 0.4472, + "step": 491 + }, + { + "epoch": 2.3880551765954223, + "grad_norm": 0.2225509747823868, + "learning_rate": 4.999223111133968e-05, + "loss": 0.4405, + "step": 492 + }, + { + "epoch": 2.392905866302865, + "grad_norm": 0.27110633436791925, + "learning_rate": 4.986091221249269e-05, + "loss": 0.44, + "step": 493 + }, + { + "epoch": 2.397756556010308, + "grad_norm": 0.24255464597168586, + "learning_rate": 4.972948005875796e-05, + "loss": 0.4432, + "step": 494 + }, + { + "epoch": 2.4026072457177503, + "grad_norm": 0.2496648842091371, + "learning_rate": 4.959793615966459e-05, + "loss": 0.4401, + "step": 495 + }, + { + "epoch": 2.4074579354251933, + "grad_norm": 0.24806426439634907, + "learning_rate": 4.946628202602508e-05, + "loss": 0.4526, + "step": 496 + }, + { + "epoch": 2.412308625132636, + "grad_norm": 0.21808090914084832, + "learning_rate": 4.933451916991802e-05, + "loss": 0.4474, + "step": 497 + }, + { + "epoch": 2.4171593148400787, + "grad_norm": 0.19833835766366836, + "learning_rate": 4.920264910467066e-05, + "loss": 0.4485, + "step": 498 + }, + { + "epoch": 2.4220100045475217, + "grad_norm": 0.1904056029579938, + "learning_rate": 4.9070673344841645e-05, + "loss": 0.4471, + "step": 499 + }, + { + "epoch": 2.426860694254964, + "grad_norm": 0.17821880940044135, + "learning_rate": 4.893859340620348e-05, + "loss": 0.4518, + "step": 500 + }, + { + "epoch": 2.431711383962407, + "grad_norm": 0.16242846601925154, + "learning_rate": 4.880641080572522e-05, + "loss": 0.4426, + "step": 501 + }, + { + "epoch": 2.43656207366985, + "grad_norm": 0.16230843192633562, + "learning_rate": 4.8674127061555025e-05, + "loss": 0.4492, + "step": 502 + }, + { + "epoch": 2.4414127633772926, + "grad_norm": 0.18692985874064466, + "learning_rate": 4.8541743693002676e-05, + "loss": 0.4576, + "step": 503 + }, + { + "epoch": 2.4462634530847356, + "grad_norm": 0.17489245993778632, + "learning_rate": 4.8409262220522196e-05, + "loss": 0.4476, + "step": 504 + }, + { + "epoch": 2.451114142792178, + "grad_norm": 0.14061959670906948, + "learning_rate": 4.8276684165694336e-05, + "loss": 0.4479, + "step": 505 + }, + { + "epoch": 2.455964832499621, + "grad_norm": 0.17289206898304424, + "learning_rate": 4.814401105120914e-05, + "loss": 0.4479, + "step": 506 + }, + { + "epoch": 2.460815522207064, + "grad_norm": 0.21063084112901795, + "learning_rate": 4.8011244400848414e-05, + "loss": 0.4466, + "step": 507 + }, + { + "epoch": 2.4656662119145065, + "grad_norm": 0.2134287283629687, + "learning_rate": 4.787838573946825e-05, + "loss": 0.4503, + "step": 508 + }, + { + "epoch": 2.4705169016219495, + "grad_norm": 0.19387557882251144, + "learning_rate": 4.774543659298152e-05, + "loss": 0.4419, + "step": 509 + }, + { + "epoch": 2.475367591329392, + "grad_norm": 0.1690053079886072, + "learning_rate": 4.761239848834031e-05, + "loss": 0.4443, + "step": 510 + }, + { + "epoch": 2.480218281036835, + "grad_norm": 0.17406180900609755, + "learning_rate": 4.747927295351845e-05, + "loss": 0.4474, + "step": 511 + }, + { + "epoch": 2.485068970744278, + "grad_norm": 0.2024050850623432, + "learning_rate": 4.734606151749389e-05, + "loss": 0.4473, + "step": 512 + }, + { + "epoch": 2.4899196604517204, + "grad_norm": 0.22659357369802574, + "learning_rate": 4.7212765710231204e-05, + "loss": 0.4481, + "step": 513 + }, + { + "epoch": 2.4947703501591634, + "grad_norm": 0.23595309939097722, + "learning_rate": 4.707938706266397e-05, + "loss": 0.4484, + "step": 514 + }, + { + "epoch": 2.499621039866606, + "grad_norm": 0.19918584163751257, + "learning_rate": 4.694592710667723e-05, + "loss": 0.444, + "step": 515 + }, + { + "epoch": 2.504471729574049, + "grad_norm": 0.18418670752131802, + "learning_rate": 4.681238737508983e-05, + "loss": 0.4424, + "step": 516 + }, + { + "epoch": 2.5093224192814914, + "grad_norm": 0.1926237495649244, + "learning_rate": 4.6678769401636894e-05, + "loss": 0.4444, + "step": 517 + }, + { + "epoch": 2.5141731089889343, + "grad_norm": 0.20706125086296728, + "learning_rate": 4.6545074720952166e-05, + "loss": 0.456, + "step": 518 + }, + { + "epoch": 2.5190237986963773, + "grad_norm": 0.17699664563372686, + "learning_rate": 4.641130486855038e-05, + "loss": 0.4396, + "step": 519 + }, + { + "epoch": 2.52387448840382, + "grad_norm": 0.18317752602670304, + "learning_rate": 4.627746138080966e-05, + "loss": 0.4432, + "step": 520 + }, + { + "epoch": 2.5287251781112627, + "grad_norm": 0.2190424482227647, + "learning_rate": 4.614354579495379e-05, + "loss": 0.4448, + "step": 521 + }, + { + "epoch": 2.5335758678187057, + "grad_norm": 0.20135719119048615, + "learning_rate": 4.6009559649034695e-05, + "loss": 0.4432, + "step": 522 + }, + { + "epoch": 2.538426557526148, + "grad_norm": 0.20782420010728125, + "learning_rate": 4.587550448191465e-05, + "loss": 0.4474, + "step": 523 + }, + { + "epoch": 2.543277247233591, + "grad_norm": 0.18668296726800496, + "learning_rate": 4.5741381833248655e-05, + "loss": 0.455, + "step": 524 + }, + { + "epoch": 2.5481279369410337, + "grad_norm": 0.17935132627421838, + "learning_rate": 4.560719324346677e-05, + "loss": 0.4457, + "step": 525 + }, + { + "epoch": 2.5529786266484766, + "grad_norm": 0.16835981784522308, + "learning_rate": 4.547294025375641e-05, + "loss": 0.4478, + "step": 526 + }, + { + "epoch": 2.557829316355919, + "grad_norm": 0.18084487512355504, + "learning_rate": 4.533862440604461e-05, + "loss": 0.447, + "step": 527 + }, + { + "epoch": 2.562680006063362, + "grad_norm": 0.17384784743298828, + "learning_rate": 4.520424724298036e-05, + "loss": 0.4408, + "step": 528 + }, + { + "epoch": 2.567530695770805, + "grad_norm": 0.20150460275113774, + "learning_rate": 4.5069810307916874e-05, + "loss": 0.4441, + "step": 529 + }, + { + "epoch": 2.5723813854782476, + "grad_norm": 0.2240004858996321, + "learning_rate": 4.493531514489385e-05, + "loss": 0.4425, + "step": 530 + }, + { + "epoch": 2.5772320751856905, + "grad_norm": 0.2286831099325836, + "learning_rate": 4.480076329861977e-05, + "loss": 0.4433, + "step": 531 + }, + { + "epoch": 2.5820827648931335, + "grad_norm": 0.2048648110357608, + "learning_rate": 4.46661563144541e-05, + "loss": 0.4487, + "step": 532 + }, + { + "epoch": 2.586933454600576, + "grad_norm": 0.2121488428415987, + "learning_rate": 4.453149573838962e-05, + "loss": 0.4445, + "step": 533 + }, + { + "epoch": 2.591784144308019, + "grad_norm": 0.18541474138380978, + "learning_rate": 4.43967831170346e-05, + "loss": 0.4494, + "step": 534 + }, + { + "epoch": 2.5966348340154615, + "grad_norm": 0.17452762694525445, + "learning_rate": 4.426201999759505e-05, + "loss": 0.4484, + "step": 535 + }, + { + "epoch": 2.6014855237229044, + "grad_norm": 0.21944224068377363, + "learning_rate": 4.4127207927857e-05, + "loss": 0.4419, + "step": 536 + }, + { + "epoch": 2.606336213430347, + "grad_norm": 0.17656272332454842, + "learning_rate": 4.3992348456168666e-05, + "loss": 0.4568, + "step": 537 + }, + { + "epoch": 2.61118690313779, + "grad_norm": 0.1892562653364182, + "learning_rate": 4.385744313142267e-05, + "loss": 0.4427, + "step": 538 + }, + { + "epoch": 2.616037592845233, + "grad_norm": 0.21611454670373548, + "learning_rate": 4.372249350303828e-05, + "loss": 0.4418, + "step": 539 + }, + { + "epoch": 2.6208882825526754, + "grad_norm": 0.17168747953224547, + "learning_rate": 4.358750112094363e-05, + "loss": 0.4544, + "step": 540 + }, + { + "epoch": 2.6257389722601183, + "grad_norm": 0.17941819138400728, + "learning_rate": 4.3452467535557846e-05, + "loss": 0.4372, + "step": 541 + }, + { + "epoch": 2.6305896619675613, + "grad_norm": 0.2025265834742146, + "learning_rate": 4.3317394297773304e-05, + "loss": 0.4517, + "step": 542 + }, + { + "epoch": 2.635440351675004, + "grad_norm": 0.20441246530938206, + "learning_rate": 4.3182282958937816e-05, + "loss": 0.4333, + "step": 543 + }, + { + "epoch": 2.6402910413824463, + "grad_norm": 0.2334105452950634, + "learning_rate": 4.304713507083673e-05, + "loss": 0.4481, + "step": 544 + }, + { + "epoch": 2.6451417310898893, + "grad_norm": 0.26291969340773214, + "learning_rate": 4.291195218567523e-05, + "loss": 0.4466, + "step": 545 + }, + { + "epoch": 2.649992420797332, + "grad_norm": 0.1863631298156993, + "learning_rate": 4.277673585606046e-05, + "loss": 0.4405, + "step": 546 + }, + { + "epoch": 2.6548431105047747, + "grad_norm": 0.23226855973797117, + "learning_rate": 4.264148763498364e-05, + "loss": 0.4566, + "step": 547 + }, + { + "epoch": 2.6596938002122177, + "grad_norm": 0.30482274820740174, + "learning_rate": 4.250620907580226e-05, + "loss": 0.4407, + "step": 548 + }, + { + "epoch": 2.6645444899196606, + "grad_norm": 0.23781311620065457, + "learning_rate": 4.237090173222231e-05, + "loss": 0.4493, + "step": 549 + }, + { + "epoch": 2.669395179627103, + "grad_norm": 0.1808214801234254, + "learning_rate": 4.223556715828033e-05, + "loss": 0.4511, + "step": 550 + }, + { + "epoch": 2.674245869334546, + "grad_norm": 0.26315804734468673, + "learning_rate": 4.2100206908325603e-05, + "loss": 0.447, + "step": 551 + }, + { + "epoch": 2.6790965590419886, + "grad_norm": 0.25781234163394623, + "learning_rate": 4.196482253700235e-05, + "loss": 0.4415, + "step": 552 + }, + { + "epoch": 2.6839472487494316, + "grad_norm": 0.17133762584152984, + "learning_rate": 4.182941559923179e-05, + "loss": 0.4457, + "step": 553 + }, + { + "epoch": 2.688797938456874, + "grad_norm": 0.2266803612041648, + "learning_rate": 4.169398765019433e-05, + "loss": 0.4422, + "step": 554 + }, + { + "epoch": 2.693648628164317, + "grad_norm": 0.23286738752123257, + "learning_rate": 4.15585402453117e-05, + "loss": 0.4429, + "step": 555 + }, + { + "epoch": 2.69849931787176, + "grad_norm": 0.20226496811604636, + "learning_rate": 4.14230749402291e-05, + "loss": 0.4421, + "step": 556 + }, + { + "epoch": 2.7033500075792025, + "grad_norm": 0.21746634743317236, + "learning_rate": 4.128759329079732e-05, + "loss": 0.4318, + "step": 557 + }, + { + "epoch": 2.7082006972866455, + "grad_norm": 0.24285493960537577, + "learning_rate": 4.115209685305482e-05, + "loss": 0.4374, + "step": 558 + }, + { + "epoch": 2.7130513869940884, + "grad_norm": 0.20035101285126697, + "learning_rate": 4.101658718320998e-05, + "loss": 0.4429, + "step": 559 + }, + { + "epoch": 2.717902076701531, + "grad_norm": 0.1733102653989901, + "learning_rate": 4.088106583762309e-05, + "loss": 0.4456, + "step": 560 + }, + { + "epoch": 2.722752766408974, + "grad_norm": 0.25116764609287723, + "learning_rate": 4.074553437278857e-05, + "loss": 0.4494, + "step": 561 + }, + { + "epoch": 2.7276034561164164, + "grad_norm": 0.19896329775589092, + "learning_rate": 4.060999434531704e-05, + "loss": 0.4449, + "step": 562 + }, + { + "epoch": 2.7324541458238594, + "grad_norm": 0.16517536428811208, + "learning_rate": 4.047444731191751e-05, + "loss": 0.4426, + "step": 563 + }, + { + "epoch": 2.737304835531302, + "grad_norm": 0.1656807626865065, + "learning_rate": 4.033889482937943e-05, + "loss": 0.4445, + "step": 564 + }, + { + "epoch": 2.742155525238745, + "grad_norm": 0.15103159619749504, + "learning_rate": 4.020333845455478e-05, + "loss": 0.4565, + "step": 565 + }, + { + "epoch": 2.747006214946188, + "grad_norm": 0.16996820086522443, + "learning_rate": 4.0067779744340345e-05, + "loss": 0.4459, + "step": 566 + }, + { + "epoch": 2.7518569046536303, + "grad_norm": 0.1495970266083701, + "learning_rate": 3.993222025565966e-05, + "loss": 0.4447, + "step": 567 + }, + { + "epoch": 2.7567075943610733, + "grad_norm": 0.15458974892236554, + "learning_rate": 3.979666154544522e-05, + "loss": 0.4452, + "step": 568 + }, + { + "epoch": 2.7615582840685162, + "grad_norm": 0.1741093401099396, + "learning_rate": 3.96611051706206e-05, + "loss": 0.4421, + "step": 569 + }, + { + "epoch": 2.7664089737759587, + "grad_norm": 0.1819530197226333, + "learning_rate": 3.9525552688082494e-05, + "loss": 0.4509, + "step": 570 + }, + { + "epoch": 2.7712596634834017, + "grad_norm": 0.14996389947080183, + "learning_rate": 3.939000565468297e-05, + "loss": 0.4442, + "step": 571 + }, + { + "epoch": 2.776110353190844, + "grad_norm": 0.19015205226216172, + "learning_rate": 3.9254465627211444e-05, + "loss": 0.4458, + "step": 572 + }, + { + "epoch": 2.780961042898287, + "grad_norm": 0.2147271939320094, + "learning_rate": 3.911893416237693e-05, + "loss": 0.4423, + "step": 573 + }, + { + "epoch": 2.7858117326057297, + "grad_norm": 0.17368493707493848, + "learning_rate": 3.8983412816790045e-05, + "loss": 0.4415, + "step": 574 + }, + { + "epoch": 2.7906624223131726, + "grad_norm": 0.18366782229193682, + "learning_rate": 3.8847903146945186e-05, + "loss": 0.4419, + "step": 575 + }, + { + "epoch": 2.7955131120206156, + "grad_norm": 0.1770373720928735, + "learning_rate": 3.871240670920269e-05, + "loss": 0.4477, + "step": 576 + }, + { + "epoch": 2.800363801728058, + "grad_norm": 0.15508137985676013, + "learning_rate": 3.85769250597709e-05, + "loss": 0.4458, + "step": 577 + }, + { + "epoch": 2.805214491435501, + "grad_norm": 0.15518418619016236, + "learning_rate": 3.844145975468832e-05, + "loss": 0.4403, + "step": 578 + }, + { + "epoch": 2.810065181142944, + "grad_norm": 0.13016021632650948, + "learning_rate": 3.830601234980569e-05, + "loss": 0.4509, + "step": 579 + }, + { + "epoch": 2.8149158708503865, + "grad_norm": 0.17125198843453068, + "learning_rate": 3.8170584400768224e-05, + "loss": 0.4492, + "step": 580 + }, + { + "epoch": 2.8197665605578295, + "grad_norm": 0.18182599605587274, + "learning_rate": 3.8035177462997664e-05, + "loss": 0.4475, + "step": 581 + }, + { + "epoch": 2.824617250265272, + "grad_norm": 0.16612208849559923, + "learning_rate": 3.7899793091674396e-05, + "loss": 0.4419, + "step": 582 + }, + { + "epoch": 2.829467939972715, + "grad_norm": 0.15504382692612345, + "learning_rate": 3.776443284171969e-05, + "loss": 0.4421, + "step": 583 + }, + { + "epoch": 2.8343186296801575, + "grad_norm": 0.14158493240403466, + "learning_rate": 3.7629098267777706e-05, + "loss": 0.4399, + "step": 584 + }, + { + "epoch": 2.8391693193876004, + "grad_norm": 0.14521790840725082, + "learning_rate": 3.7493790924197746e-05, + "loss": 0.4328, + "step": 585 + }, + { + "epoch": 2.8440200090950434, + "grad_norm": 0.14223117063886642, + "learning_rate": 3.735851236501637e-05, + "loss": 0.4403, + "step": 586 + }, + { + "epoch": 2.848870698802486, + "grad_norm": 0.13716153813556975, + "learning_rate": 3.722326414393954e-05, + "loss": 0.4375, + "step": 587 + }, + { + "epoch": 2.853721388509929, + "grad_norm": 0.13481835773066367, + "learning_rate": 3.708804781432478e-05, + "loss": 0.4465, + "step": 588 + }, + { + "epoch": 2.858572078217372, + "grad_norm": 0.15098861155914894, + "learning_rate": 3.6952864929163286e-05, + "loss": 0.4478, + "step": 589 + }, + { + "epoch": 2.8634227679248143, + "grad_norm": 0.14428029096945075, + "learning_rate": 3.6817717041062204e-05, + "loss": 0.4433, + "step": 590 + }, + { + "epoch": 2.868273457632257, + "grad_norm": 0.14941685817838865, + "learning_rate": 3.66826057022267e-05, + "loss": 0.4426, + "step": 591 + }, + { + "epoch": 2.8731241473397, + "grad_norm": 0.15814915640950794, + "learning_rate": 3.654753246444217e-05, + "loss": 0.437, + "step": 592 + }, + { + "epoch": 2.8779748370471427, + "grad_norm": 0.1666350361712344, + "learning_rate": 3.641249887905638e-05, + "loss": 0.4404, + "step": 593 + }, + { + "epoch": 2.8828255267545853, + "grad_norm": 0.14761581189993908, + "learning_rate": 3.627750649696173e-05, + "loss": 0.4418, + "step": 594 + }, + { + "epoch": 2.887676216462028, + "grad_norm": 0.16433140815176697, + "learning_rate": 3.614255686857734e-05, + "loss": 0.4482, + "step": 595 + }, + { + "epoch": 2.892526906169471, + "grad_norm": 0.14898117787478918, + "learning_rate": 3.600765154383134e-05, + "loss": 0.4407, + "step": 596 + }, + { + "epoch": 2.8973775958769137, + "grad_norm": 0.1576311183401583, + "learning_rate": 3.587279207214301e-05, + "loss": 0.4502, + "step": 597 + }, + { + "epoch": 2.9022282855843566, + "grad_norm": 0.12713739329535242, + "learning_rate": 3.5737980002404965e-05, + "loss": 0.4504, + "step": 598 + }, + { + "epoch": 2.907078975291799, + "grad_norm": 0.1407162797770253, + "learning_rate": 3.5603216882965415e-05, + "loss": 0.4444, + "step": 599 + }, + { + "epoch": 2.911929664999242, + "grad_norm": 0.15096239269549241, + "learning_rate": 3.5468504261610387e-05, + "loss": 0.4497, + "step": 600 + }, + { + "epoch": 2.9167803547066846, + "grad_norm": 0.1341187523707445, + "learning_rate": 3.5333843685545914e-05, + "loss": 0.4449, + "step": 601 + }, + { + "epoch": 2.9216310444141276, + "grad_norm": 0.1619335943958044, + "learning_rate": 3.519923670138025e-05, + "loss": 0.4434, + "step": 602 + }, + { + "epoch": 2.9264817341215705, + "grad_norm": 0.16211928956809254, + "learning_rate": 3.506468485510616e-05, + "loss": 0.4394, + "step": 603 + }, + { + "epoch": 2.931332423829013, + "grad_norm": 0.13565985896740923, + "learning_rate": 3.493018969208314e-05, + "loss": 0.4513, + "step": 604 + }, + { + "epoch": 2.936183113536456, + "grad_norm": 0.14551792578562125, + "learning_rate": 3.479575275701965e-05, + "loss": 0.4425, + "step": 605 + }, + { + "epoch": 2.941033803243899, + "grad_norm": 0.17680002225930672, + "learning_rate": 3.4661375593955405e-05, + "loss": 0.4384, + "step": 606 + }, + { + "epoch": 2.9458844929513415, + "grad_norm": 0.16447736465809054, + "learning_rate": 3.45270597462436e-05, + "loss": 0.4451, + "step": 607 + }, + { + "epoch": 2.9507351826587844, + "grad_norm": 0.15299942108774958, + "learning_rate": 3.4392806756533233e-05, + "loss": 0.4383, + "step": 608 + }, + { + "epoch": 2.955585872366227, + "grad_norm": 0.1536623395643003, + "learning_rate": 3.425861816675135e-05, + "loss": 0.4453, + "step": 609 + }, + { + "epoch": 2.96043656207367, + "grad_norm": 0.15727509499916784, + "learning_rate": 3.4124495518085366e-05, + "loss": 0.436, + "step": 610 + }, + { + "epoch": 2.9652872517811124, + "grad_norm": 0.17906600408772821, + "learning_rate": 3.399044035096532e-05, + "loss": 0.4467, + "step": 611 + }, + { + "epoch": 2.9701379414885554, + "grad_norm": 0.16243556143131102, + "learning_rate": 3.3856454205046223e-05, + "loss": 0.4364, + "step": 612 + }, + { + "epoch": 2.9749886311959983, + "grad_norm": 0.1608114743453715, + "learning_rate": 3.372253861919036e-05, + "loss": 0.4517, + "step": 613 + }, + { + "epoch": 2.979839320903441, + "grad_norm": 0.16249676695986184, + "learning_rate": 3.3588695131449626e-05, + "loss": 0.4464, + "step": 614 + }, + { + "epoch": 2.984690010610884, + "grad_norm": 0.14682205641070967, + "learning_rate": 3.3454925279047854e-05, + "loss": 0.4446, + "step": 615 + }, + { + "epoch": 2.9895407003183267, + "grad_norm": 0.158750060737996, + "learning_rate": 3.3321230598363126e-05, + "loss": 0.4449, + "step": 616 + }, + { + "epoch": 2.9943913900257693, + "grad_norm": 0.15103569523913019, + "learning_rate": 3.3187612624910185e-05, + "loss": 0.4457, + "step": 617 + }, + { + "epoch": 2.999242079733212, + "grad_norm": 0.13279281722008607, + "learning_rate": 3.305407289332279e-05, + "loss": 0.4524, + "step": 618 + }, + { + "epoch": 3.004850689707443, + "grad_norm": 0.21786343264375474, + "learning_rate": 3.2920612937336035e-05, + "loss": 0.4186, + "step": 619 + }, + { + "epoch": 3.0097013794148855, + "grad_norm": 0.1940657522375173, + "learning_rate": 3.2787234289768816e-05, + "loss": 0.4198, + "step": 620 + }, + { + "epoch": 3.0145520691223284, + "grad_norm": 0.21773031084989108, + "learning_rate": 3.2653938482506125e-05, + "loss": 0.4257, + "step": 621 + }, + { + "epoch": 3.019402758829771, + "grad_norm": 0.20326547030411232, + "learning_rate": 3.252072704648157e-05, + "loss": 0.4165, + "step": 622 + }, + { + "epoch": 3.024253448537214, + "grad_norm": 0.1952882443077655, + "learning_rate": 3.2387601511659695e-05, + "loss": 0.4099, + "step": 623 + }, + { + "epoch": 3.029104138244657, + "grad_norm": 0.1918042514566916, + "learning_rate": 3.22545634070185e-05, + "loss": 0.4152, + "step": 624 + }, + { + "epoch": 3.0339548279520994, + "grad_norm": 0.19705116304049744, + "learning_rate": 3.212161426053177e-05, + "loss": 0.4128, + "step": 625 + }, + { + "epoch": 3.0388055176595423, + "grad_norm": 0.19649678060258355, + "learning_rate": 3.19887555991516e-05, + "loss": 0.4129, + "step": 626 + }, + { + "epoch": 3.043656207366985, + "grad_norm": 0.21708556979200094, + "learning_rate": 3.1855988948790866e-05, + "loss": 0.419, + "step": 627 + }, + { + "epoch": 3.048506897074428, + "grad_norm": 0.1975715363358727, + "learning_rate": 3.172331583430567e-05, + "loss": 0.4179, + "step": 628 + }, + { + "epoch": 3.0533575867818707, + "grad_norm": 0.23335868145268443, + "learning_rate": 3.1590737779477825e-05, + "loss": 0.4187, + "step": 629 + }, + { + "epoch": 3.0582082764893133, + "grad_norm": 0.16312780113553543, + "learning_rate": 3.145825630699734e-05, + "loss": 0.4145, + "step": 630 + }, + { + "epoch": 3.063058966196756, + "grad_norm": 0.1995031684584169, + "learning_rate": 3.1325872938444995e-05, + "loss": 0.4269, + "step": 631 + }, + { + "epoch": 3.0679096559041987, + "grad_norm": 0.16321617015370155, + "learning_rate": 3.119358919427478e-05, + "loss": 0.4189, + "step": 632 + }, + { + "epoch": 3.0727603456116417, + "grad_norm": 0.18410001775256316, + "learning_rate": 3.106140659379652e-05, + "loss": 0.4218, + "step": 633 + }, + { + "epoch": 3.0776110353190846, + "grad_norm": 0.15016856412332835, + "learning_rate": 3.092932665515837e-05, + "loss": 0.4142, + "step": 634 + }, + { + "epoch": 3.082461725026527, + "grad_norm": 0.1502499895895468, + "learning_rate": 3.079735089532935e-05, + "loss": 0.4092, + "step": 635 + }, + { + "epoch": 3.08731241473397, + "grad_norm": 0.1564011362374121, + "learning_rate": 3.0665480830082e-05, + "loss": 0.4176, + "step": 636 + }, + { + "epoch": 3.0921631044414126, + "grad_norm": 0.15490177035198396, + "learning_rate": 3.0533717973974924e-05, + "loss": 0.4171, + "step": 637 + }, + { + "epoch": 3.0970137941488556, + "grad_norm": 0.16842243538179394, + "learning_rate": 3.040206384033542e-05, + "loss": 0.4142, + "step": 638 + }, + { + "epoch": 3.101864483856298, + "grad_norm": 0.15647723657119908, + "learning_rate": 3.0270519941242052e-05, + "loss": 0.4045, + "step": 639 + }, + { + "epoch": 3.106715173563741, + "grad_norm": 0.14187950473293476, + "learning_rate": 3.0139087787507323e-05, + "loss": 0.4162, + "step": 640 + }, + { + "epoch": 3.111565863271184, + "grad_norm": 0.1486994798612613, + "learning_rate": 3.0007768888660337e-05, + "loss": 0.4162, + "step": 641 + }, + { + "epoch": 3.1164165529786265, + "grad_norm": 0.14045982542928215, + "learning_rate": 2.9876564752929406e-05, + "loss": 0.423, + "step": 642 + }, + { + "epoch": 3.1212672426860695, + "grad_norm": 0.14911944405394412, + "learning_rate": 2.9745476887224806e-05, + "loss": 0.4186, + "step": 643 + }, + { + "epoch": 3.1261179323935124, + "grad_norm": 0.130768356118423, + "learning_rate": 2.961450679712135e-05, + "loss": 0.4149, + "step": 644 + }, + { + "epoch": 3.130968622100955, + "grad_norm": 0.15344876789210227, + "learning_rate": 2.9483655986841265e-05, + "loss": 0.4185, + "step": 645 + }, + { + "epoch": 3.135819311808398, + "grad_norm": 0.16373681347456412, + "learning_rate": 2.9352925959236732e-05, + "loss": 0.4199, + "step": 646 + }, + { + "epoch": 3.1406700015158404, + "grad_norm": 0.13681917154319687, + "learning_rate": 2.92223182157728e-05, + "loss": 0.4187, + "step": 647 + }, + { + "epoch": 3.1455206912232834, + "grad_norm": 0.16376916195733163, + "learning_rate": 2.909183425650996e-05, + "loss": 0.4144, + "step": 648 + }, + { + "epoch": 3.150371380930726, + "grad_norm": 0.15231760580025508, + "learning_rate": 2.8961475580087108e-05, + "loss": 0.4065, + "step": 649 + }, + { + "epoch": 3.155222070638169, + "grad_norm": 0.1482250629623317, + "learning_rate": 2.8831243683704162e-05, + "loss": 0.4167, + "step": 650 + }, + { + "epoch": 3.160072760345612, + "grad_norm": 0.1279306947970543, + "learning_rate": 2.8701140063104996e-05, + "loss": 0.4163, + "step": 651 + }, + { + "epoch": 3.1649234500530543, + "grad_norm": 0.14839352063841615, + "learning_rate": 2.857116621256018e-05, + "loss": 0.4066, + "step": 652 + }, + { + "epoch": 3.1697741397604973, + "grad_norm": 0.14182099741632095, + "learning_rate": 2.8441323624849827e-05, + "loss": 0.4073, + "step": 653 + }, + { + "epoch": 3.17462482946794, + "grad_norm": 0.14062989686711488, + "learning_rate": 2.83116137912465e-05, + "loss": 0.4148, + "step": 654 + }, + { + "epoch": 3.1794755191753827, + "grad_norm": 0.13350262763245205, + "learning_rate": 2.8182038201498038e-05, + "loss": 0.4185, + "step": 655 + }, + { + "epoch": 3.1843262088828257, + "grad_norm": 0.14000623741594295, + "learning_rate": 2.8052598343810474e-05, + "loss": 0.4084, + "step": 656 + }, + { + "epoch": 3.189176898590268, + "grad_norm": 0.13922618624994615, + "learning_rate": 2.7923295704830868e-05, + "loss": 0.4209, + "step": 657 + }, + { + "epoch": 3.194027588297711, + "grad_norm": 0.13424360868636123, + "learning_rate": 2.7794131769630355e-05, + "loss": 0.4203, + "step": 658 + }, + { + "epoch": 3.1988782780051537, + "grad_norm": 0.1410971557670894, + "learning_rate": 2.7665108021687007e-05, + "loss": 0.4229, + "step": 659 + }, + { + "epoch": 3.2037289677125966, + "grad_norm": 0.15216131334925778, + "learning_rate": 2.753622594286879e-05, + "loss": 0.4145, + "step": 660 + }, + { + "epoch": 3.2085796574200396, + "grad_norm": 0.1261567069468345, + "learning_rate": 2.7407487013416615e-05, + "loss": 0.4083, + "step": 661 + }, + { + "epoch": 3.213430347127482, + "grad_norm": 0.15853568579534694, + "learning_rate": 2.727889271192722e-05, + "loss": 0.4187, + "step": 662 + }, + { + "epoch": 3.218281036834925, + "grad_norm": 0.1151093763460037, + "learning_rate": 2.715044451533631e-05, + "loss": 0.4164, + "step": 663 + }, + { + "epoch": 3.2231317265423676, + "grad_norm": 0.14296777545925654, + "learning_rate": 2.702214389890152e-05, + "loss": 0.413, + "step": 664 + }, + { + "epoch": 3.2279824162498105, + "grad_norm": 0.12844538251966497, + "learning_rate": 2.6893992336185512e-05, + "loss": 0.4035, + "step": 665 + }, + { + "epoch": 3.2328331059572535, + "grad_norm": 0.13036276585432338, + "learning_rate": 2.6765991299039025e-05, + "loss": 0.4145, + "step": 666 + }, + { + "epoch": 3.237683795664696, + "grad_norm": 0.12243507743746514, + "learning_rate": 2.663814225758393e-05, + "loss": 0.4117, + "step": 667 + }, + { + "epoch": 3.242534485372139, + "grad_norm": 0.14245972122975337, + "learning_rate": 2.6510446680196448e-05, + "loss": 0.4195, + "step": 668 + }, + { + "epoch": 3.2473851750795815, + "grad_norm": 0.12799039988824565, + "learning_rate": 2.638290603349023e-05, + "loss": 0.4203, + "step": 669 + }, + { + "epoch": 3.2522358647870244, + "grad_norm": 0.12961756855915293, + "learning_rate": 2.625552178229949e-05, + "loss": 0.4159, + "step": 670 + }, + { + "epoch": 3.2570865544944674, + "grad_norm": 0.1296944618260485, + "learning_rate": 2.612829538966218e-05, + "loss": 0.4111, + "step": 671 + }, + { + "epoch": 3.26193724420191, + "grad_norm": 0.14508116679367689, + "learning_rate": 2.6001228316803256e-05, + "loss": 0.4196, + "step": 672 + }, + { + "epoch": 3.266787933909353, + "grad_norm": 0.1216509600449271, + "learning_rate": 2.5874322023117824e-05, + "loss": 0.4162, + "step": 673 + }, + { + "epoch": 3.2716386236167954, + "grad_norm": 0.1407698696044201, + "learning_rate": 2.5747577966154404e-05, + "loss": 0.4165, + "step": 674 + }, + { + "epoch": 3.2764893133242383, + "grad_norm": 0.1142728140236527, + "learning_rate": 2.5620997601598215e-05, + "loss": 0.4076, + "step": 675 + }, + { + "epoch": 3.281340003031681, + "grad_norm": 0.14212475123175447, + "learning_rate": 2.5494582383254388e-05, + "loss": 0.4174, + "step": 676 + }, + { + "epoch": 3.286190692739124, + "grad_norm": 0.11798282133422631, + "learning_rate": 2.5368333763031324e-05, + "loss": 0.4131, + "step": 677 + }, + { + "epoch": 3.2910413824465667, + "grad_norm": 0.14618443390836333, + "learning_rate": 2.5242253190924034e-05, + "loss": 0.4092, + "step": 678 + }, + { + "epoch": 3.2958920721540093, + "grad_norm": 0.12815235524330332, + "learning_rate": 2.5116342114997442e-05, + "loss": 0.409, + "step": 679 + }, + { + "epoch": 3.300742761861452, + "grad_norm": 0.1346079173937725, + "learning_rate": 2.4990601981369737e-05, + "loss": 0.4201, + "step": 680 + }, + { + "epoch": 3.305593451568895, + "grad_norm": 0.12020401678661803, + "learning_rate": 2.4865034234195834e-05, + "loss": 0.4107, + "step": 681 + }, + { + "epoch": 3.3104441412763377, + "grad_norm": 0.1342860022847603, + "learning_rate": 2.4739640315650747e-05, + "loss": 0.4145, + "step": 682 + }, + { + "epoch": 3.3152948309837806, + "grad_norm": 0.11394559661374248, + "learning_rate": 2.4614421665912997e-05, + "loss": 0.4213, + "step": 683 + }, + { + "epoch": 3.320145520691223, + "grad_norm": 0.126805017438777, + "learning_rate": 2.4489379723148147e-05, + "loss": 0.4129, + "step": 684 + }, + { + "epoch": 3.324996210398666, + "grad_norm": 0.11817811298525939, + "learning_rate": 2.4364515923492187e-05, + "loss": 0.4193, + "step": 685 + }, + { + "epoch": 3.3298469001061086, + "grad_norm": 0.1342332761111468, + "learning_rate": 2.4239831701035143e-05, + "loss": 0.418, + "step": 686 + }, + { + "epoch": 3.3346975898135516, + "grad_norm": 0.12474527460295737, + "learning_rate": 2.411532848780451e-05, + "loss": 0.4166, + "step": 687 + }, + { + "epoch": 3.3395482795209945, + "grad_norm": 0.1329059048345405, + "learning_rate": 2.399100771374888e-05, + "loss": 0.4138, + "step": 688 + }, + { + "epoch": 3.344398969228437, + "grad_norm": 0.11628441384991241, + "learning_rate": 2.3866870806721495e-05, + "loss": 0.4111, + "step": 689 + }, + { + "epoch": 3.34924965893588, + "grad_norm": 0.1453864432398833, + "learning_rate": 2.37429191924638e-05, + "loss": 0.42, + "step": 690 + }, + { + "epoch": 3.354100348643323, + "grad_norm": 0.11264715608612798, + "learning_rate": 2.361915429458913e-05, + "loss": 0.417, + "step": 691 + }, + { + "epoch": 3.3589510383507655, + "grad_norm": 0.14248256005839127, + "learning_rate": 2.349557753456637e-05, + "loss": 0.4168, + "step": 692 + }, + { + "epoch": 3.3638017280582084, + "grad_norm": 0.12398727462550883, + "learning_rate": 2.3372190331703556e-05, + "loss": 0.4189, + "step": 693 + }, + { + "epoch": 3.368652417765651, + "grad_norm": 0.11869463547338541, + "learning_rate": 2.324899410313161e-05, + "loss": 0.4125, + "step": 694 + }, + { + "epoch": 3.373503107473094, + "grad_norm": 0.12377753865053726, + "learning_rate": 2.3125990263788118e-05, + "loss": 0.4186, + "step": 695 + }, + { + "epoch": 3.3783537971805364, + "grad_norm": 0.13141561076446406, + "learning_rate": 2.3003180226400986e-05, + "loss": 0.4123, + "step": 696 + }, + { + "epoch": 3.3832044868879794, + "grad_norm": 0.11816327910326484, + "learning_rate": 2.288056540147229e-05, + "loss": 0.4129, + "step": 697 + }, + { + "epoch": 3.3880551765954223, + "grad_norm": 0.12260669143866527, + "learning_rate": 2.275814719726201e-05, + "loss": 0.4133, + "step": 698 + }, + { + "epoch": 3.392905866302865, + "grad_norm": 0.133084483131333, + "learning_rate": 2.263592701977193e-05, + "loss": 0.4219, + "step": 699 + }, + { + "epoch": 3.397756556010308, + "grad_norm": 0.11848073628628028, + "learning_rate": 2.2513906272729397e-05, + "loss": 0.4143, + "step": 700 + }, + { + "epoch": 3.4026072457177503, + "grad_norm": 0.12858950370510128, + "learning_rate": 2.239208635757133e-05, + "loss": 0.4166, + "step": 701 + }, + { + "epoch": 3.4074579354251933, + "grad_norm": 0.11722692816596028, + "learning_rate": 2.2270468673428004e-05, + "loss": 0.4259, + "step": 702 + }, + { + "epoch": 3.412308625132636, + "grad_norm": 0.11830608786302087, + "learning_rate": 2.2149054617106974e-05, + "loss": 0.407, + "step": 703 + }, + { + "epoch": 3.4171593148400787, + "grad_norm": 0.12285165179780408, + "learning_rate": 2.2027845583077175e-05, + "loss": 0.4231, + "step": 704 + }, + { + "epoch": 3.4220100045475217, + "grad_norm": 0.12884220459818324, + "learning_rate": 2.1906842963452757e-05, + "loss": 0.4069, + "step": 705 + }, + { + "epoch": 3.426860694254964, + "grad_norm": 0.10700415399515635, + "learning_rate": 2.178604814797715e-05, + "loss": 0.4149, + "step": 706 + }, + { + "epoch": 3.431711383962407, + "grad_norm": 0.11853515304365536, + "learning_rate": 2.1665462524007162e-05, + "loss": 0.4125, + "step": 707 + }, + { + "epoch": 3.43656207366985, + "grad_norm": 0.10772813217204756, + "learning_rate": 2.1545087476496903e-05, + "loss": 0.4216, + "step": 708 + }, + { + "epoch": 3.4414127633772926, + "grad_norm": 0.12946073793938545, + "learning_rate": 2.1424924387981996e-05, + "loss": 0.4227, + "step": 709 + }, + { + "epoch": 3.4462634530847356, + "grad_norm": 0.11256888467579416, + "learning_rate": 2.1304974638563715e-05, + "loss": 0.4116, + "step": 710 + }, + { + "epoch": 3.451114142792178, + "grad_norm": 0.12334394272902899, + "learning_rate": 2.1185239605893013e-05, + "loss": 0.4217, + "step": 711 + }, + { + "epoch": 3.455964832499621, + "grad_norm": 0.11467056354627854, + "learning_rate": 2.106572066515482e-05, + "loss": 0.4193, + "step": 712 + }, + { + "epoch": 3.460815522207064, + "grad_norm": 0.11248104529388973, + "learning_rate": 2.0946419189052162e-05, + "loss": 0.4147, + "step": 713 + }, + { + "epoch": 3.4656662119145065, + "grad_norm": 0.11839620237634582, + "learning_rate": 2.0827336547790452e-05, + "loss": 0.4214, + "step": 714 + }, + { + "epoch": 3.4705169016219495, + "grad_norm": 0.11350680266976185, + "learning_rate": 2.0708474109061752e-05, + "loss": 0.416, + "step": 715 + }, + { + "epoch": 3.475367591329392, + "grad_norm": 0.11310394993568851, + "learning_rate": 2.0589833238029032e-05, + "loss": 0.4001, + "step": 716 + }, + { + "epoch": 3.480218281036835, + "grad_norm": 0.1142115014102716, + "learning_rate": 2.0471415297310455e-05, + "loss": 0.4158, + "step": 717 + }, + { + "epoch": 3.485068970744278, + "grad_norm": 0.12114855144347077, + "learning_rate": 2.0353221646963864e-05, + "loss": 0.41, + "step": 718 + }, + { + "epoch": 3.4899196604517204, + "grad_norm": 0.11155618948058961, + "learning_rate": 2.0235253644471012e-05, + "loss": 0.4226, + "step": 719 + }, + { + "epoch": 3.4947703501591634, + "grad_norm": 0.12346483161916652, + "learning_rate": 2.011751264472206e-05, + "loss": 0.4163, + "step": 720 + }, + { + "epoch": 3.499621039866606, + "grad_norm": 0.1314504891806893, + "learning_rate": 2.0000000000000012e-05, + "loss": 0.4185, + "step": 721 + }, + { + "epoch": 3.504471729574049, + "grad_norm": 0.11587490363769114, + "learning_rate": 1.9882717059965086e-05, + "loss": 0.4243, + "step": 722 + }, + { + "epoch": 3.5093224192814914, + "grad_norm": 0.147492515392888, + "learning_rate": 1.9765665171639345e-05, + "loss": 0.4139, + "step": 723 + }, + { + "epoch": 3.5141731089889343, + "grad_norm": 0.13161876983358525, + "learning_rate": 1.964884567939118e-05, + "loss": 0.4023, + "step": 724 + }, + { + "epoch": 3.5190237986963773, + "grad_norm": 0.1288012773595963, + "learning_rate": 1.9532259924919823e-05, + "loss": 0.416, + "step": 725 + }, + { + "epoch": 3.52387448840382, + "grad_norm": 0.10979902623938809, + "learning_rate": 1.9415909247239996e-05, + "loss": 0.4198, + "step": 726 + }, + { + "epoch": 3.5287251781112627, + "grad_norm": 0.12273321372911124, + "learning_rate": 1.9299794982666485e-05, + "loss": 0.4084, + "step": 727 + }, + { + "epoch": 3.5335758678187057, + "grad_norm": 0.11485189001172974, + "learning_rate": 1.9183918464798837e-05, + "loss": 0.408, + "step": 728 + }, + { + "epoch": 3.538426557526148, + "grad_norm": 0.1142263107632135, + "learning_rate": 1.906828102450601e-05, + "loss": 0.4131, + "step": 729 + }, + { + "epoch": 3.543277247233591, + "grad_norm": 0.11235720950088848, + "learning_rate": 1.895288398991114e-05, + "loss": 0.4102, + "step": 730 + }, + { + "epoch": 3.5481279369410337, + "grad_norm": 0.11476446551397697, + "learning_rate": 1.8837728686376158e-05, + "loss": 0.4176, + "step": 731 + }, + { + "epoch": 3.5529786266484766, + "grad_norm": 0.12252689326129268, + "learning_rate": 1.8722816436486754e-05, + "loss": 0.4238, + "step": 732 + }, + { + "epoch": 3.557829316355919, + "grad_norm": 0.10742367387279236, + "learning_rate": 1.8608148560037036e-05, + "loss": 0.4248, + "step": 733 + }, + { + "epoch": 3.562680006063362, + "grad_norm": 0.11202485484827082, + "learning_rate": 1.8493726374014442e-05, + "loss": 0.4047, + "step": 734 + }, + { + "epoch": 3.567530695770805, + "grad_norm": 0.10619927645163178, + "learning_rate": 1.8379551192584588e-05, + "loss": 0.4105, + "step": 735 + }, + { + "epoch": 3.5723813854782476, + "grad_norm": 0.1104031551739802, + "learning_rate": 1.826562432707619e-05, + "loss": 0.4158, + "step": 736 + }, + { + "epoch": 3.5772320751856905, + "grad_norm": 0.10920848831138874, + "learning_rate": 1.8151947085965994e-05, + "loss": 0.4157, + "step": 737 + }, + { + "epoch": 3.5820827648931335, + "grad_norm": 0.10703865180962287, + "learning_rate": 1.803852077486377e-05, + "loss": 0.4144, + "step": 738 + }, + { + "epoch": 3.586933454600576, + "grad_norm": 0.1043548569854331, + "learning_rate": 1.7925346696497295e-05, + "loss": 0.4082, + "step": 739 + }, + { + "epoch": 3.591784144308019, + "grad_norm": 0.11138455070453787, + "learning_rate": 1.781242615069733e-05, + "loss": 0.4137, + "step": 740 + }, + { + "epoch": 3.5966348340154615, + "grad_norm": 0.11820322046978973, + "learning_rate": 1.7699760434382853e-05, + "loss": 0.4108, + "step": 741 + }, + { + "epoch": 3.6014855237229044, + "grad_norm": 0.11278678223744326, + "learning_rate": 1.758735084154601e-05, + "loss": 0.4189, + "step": 742 + }, + { + "epoch": 3.606336213430347, + "grad_norm": 0.11323272041806605, + "learning_rate": 1.7475198663237297e-05, + "loss": 0.4123, + "step": 743 + }, + { + "epoch": 3.61118690313779, + "grad_norm": 0.10904989882061365, + "learning_rate": 1.736330518755082e-05, + "loss": 0.4158, + "step": 744 + }, + { + "epoch": 3.616037592845233, + "grad_norm": 0.11229772775053595, + "learning_rate": 1.7251671699609313e-05, + "loss": 0.4182, + "step": 745 + }, + { + "epoch": 3.6208882825526754, + "grad_norm": 0.10951334908001022, + "learning_rate": 1.7140299481549557e-05, + "loss": 0.4213, + "step": 746 + }, + { + "epoch": 3.6257389722601183, + "grad_norm": 0.11434493342191, + "learning_rate": 1.7029189812507603e-05, + "loss": 0.4224, + "step": 747 + }, + { + "epoch": 3.6305896619675613, + "grad_norm": 0.10344385368037658, + "learning_rate": 1.6918343968604027e-05, + "loss": 0.4106, + "step": 748 + }, + { + "epoch": 3.635440351675004, + "grad_norm": 0.11168549168378746, + "learning_rate": 1.6807763222929315e-05, + "loss": 0.408, + "step": 749 + }, + { + "epoch": 3.6402910413824463, + "grad_norm": 0.11594040802990377, + "learning_rate": 1.669744884552926e-05, + "loss": 0.4169, + "step": 750 + }, + { + "epoch": 3.6451417310898893, + "grad_norm": 0.11452998735643415, + "learning_rate": 1.6587402103390314e-05, + "loss": 0.4162, + "step": 751 + }, + { + "epoch": 3.649992420797332, + "grad_norm": 0.11033578052460767, + "learning_rate": 1.6477624260425137e-05, + "loss": 0.4179, + "step": 752 + }, + { + "epoch": 3.6548431105047747, + "grad_norm": 0.1198668006175803, + "learning_rate": 1.6368116577457973e-05, + "loss": 0.4124, + "step": 753 + }, + { + "epoch": 3.6596938002122177, + "grad_norm": 0.10884921001547737, + "learning_rate": 1.6258880312210195e-05, + "loss": 0.4152, + "step": 754 + }, + { + "epoch": 3.6645444899196606, + "grad_norm": 0.12009675101549108, + "learning_rate": 1.6149916719285942e-05, + "loss": 0.4147, + "step": 755 + }, + { + "epoch": 3.669395179627103, + "grad_norm": 0.11742205741912104, + "learning_rate": 1.6041227050157607e-05, + "loss": 0.4096, + "step": 756 + }, + { + "epoch": 3.674245869334546, + "grad_norm": 0.1123251375365744, + "learning_rate": 1.5932812553151506e-05, + "loss": 0.4128, + "step": 757 + }, + { + "epoch": 3.6790965590419886, + "grad_norm": 0.12009728599563303, + "learning_rate": 1.582467447343355e-05, + "loss": 0.4179, + "step": 758 + }, + { + "epoch": 3.6839472487494316, + "grad_norm": 0.10679356522304362, + "learning_rate": 1.5716814052994928e-05, + "loss": 0.4153, + "step": 759 + }, + { + "epoch": 3.688797938456874, + "grad_norm": 0.11287526417521035, + "learning_rate": 1.5609232530637827e-05, + "loss": 0.4065, + "step": 760 + }, + { + "epoch": 3.693648628164317, + "grad_norm": 0.10604174975295146, + "learning_rate": 1.5501931141961278e-05, + "loss": 0.4135, + "step": 761 + }, + { + "epoch": 3.69849931787176, + "grad_norm": 0.10895447717123838, + "learning_rate": 1.539491111934686e-05, + "loss": 0.4102, + "step": 762 + }, + { + "epoch": 3.7033500075792025, + "grad_norm": 0.11522106117016057, + "learning_rate": 1.5288173691944613e-05, + "loss": 0.4193, + "step": 763 + }, + { + "epoch": 3.7082006972866455, + "grad_norm": 0.11668799730823959, + "learning_rate": 1.5181720085658906e-05, + "loss": 0.4131, + "step": 764 + }, + { + "epoch": 3.7130513869940884, + "grad_norm": 0.1179757070897769, + "learning_rate": 1.5075551523134358e-05, + "loss": 0.4107, + "step": 765 + }, + { + "epoch": 3.717902076701531, + "grad_norm": 0.11352197320512793, + "learning_rate": 1.4969669223741771e-05, + "loss": 0.4093, + "step": 766 + }, + { + "epoch": 3.722752766408974, + "grad_norm": 0.11945491424386492, + "learning_rate": 1.4864074403564216e-05, + "loss": 0.4142, + "step": 767 + }, + { + "epoch": 3.7276034561164164, + "grad_norm": 0.10892285815783607, + "learning_rate": 1.4758768275382887e-05, + "loss": 0.4205, + "step": 768 + }, + { + "epoch": 3.7324541458238594, + "grad_norm": 0.12765157069597566, + "learning_rate": 1.4653752048663394e-05, + "loss": 0.412, + "step": 769 + }, + { + "epoch": 3.737304835531302, + "grad_norm": 0.10956587187939422, + "learning_rate": 1.4549026929541693e-05, + "loss": 0.4148, + "step": 770 + }, + { + "epoch": 3.742155525238745, + "grad_norm": 0.12138544117757244, + "learning_rate": 1.4444594120810326e-05, + "loss": 0.4115, + "step": 771 + }, + { + "epoch": 3.747006214946188, + "grad_norm": 0.10697996518645103, + "learning_rate": 1.4340454821904573e-05, + "loss": 0.4194, + "step": 772 + }, + { + "epoch": 3.7518569046536303, + "grad_norm": 0.10998535306961314, + "learning_rate": 1.4236610228888683e-05, + "loss": 0.4143, + "step": 773 + }, + { + "epoch": 3.7567075943610733, + "grad_norm": 0.10998459629638649, + "learning_rate": 1.4133061534442133e-05, + "loss": 0.4121, + "step": 774 + }, + { + "epoch": 3.7615582840685162, + "grad_norm": 0.1056241184630642, + "learning_rate": 1.4029809927845981e-05, + "loss": 0.4146, + "step": 775 + }, + { + "epoch": 3.7664089737759587, + "grad_norm": 0.11617390368347923, + "learning_rate": 1.3926856594969115e-05, + "loss": 0.4125, + "step": 776 + }, + { + "epoch": 3.7712596634834017, + "grad_norm": 0.10105741678809248, + "learning_rate": 1.3824202718254655e-05, + "loss": 0.4081, + "step": 777 + }, + { + "epoch": 3.776110353190844, + "grad_norm": 0.12303653861990478, + "learning_rate": 1.3721849476706477e-05, + "loss": 0.413, + "step": 778 + }, + { + "epoch": 3.780961042898287, + "grad_norm": 0.10128855312982177, + "learning_rate": 1.3619798045875529e-05, + "loss": 0.4117, + "step": 779 + }, + { + "epoch": 3.7858117326057297, + "grad_norm": 0.1118697000457396, + "learning_rate": 1.3518049597846412e-05, + "loss": 0.4097, + "step": 780 + }, + { + "epoch": 3.7906624223131726, + "grad_norm": 0.10689143155371568, + "learning_rate": 1.3416605301223893e-05, + "loss": 0.4146, + "step": 781 + }, + { + "epoch": 3.7955131120206156, + "grad_norm": 0.09942573069367382, + "learning_rate": 1.3315466321119486e-05, + "loss": 0.415, + "step": 782 + }, + { + "epoch": 3.800363801728058, + "grad_norm": 0.112223020708749, + "learning_rate": 1.3214633819138105e-05, + "loss": 0.4187, + "step": 783 + }, + { + "epoch": 3.805214491435501, + "grad_norm": 0.09509376603334437, + "learning_rate": 1.3114108953364655e-05, + "loss": 0.4083, + "step": 784 + }, + { + "epoch": 3.810065181142944, + "grad_norm": 0.1039694903593983, + "learning_rate": 1.3013892878350771e-05, + "loss": 0.415, + "step": 785 + }, + { + "epoch": 3.8149158708503865, + "grad_norm": 0.09799457517015436, + "learning_rate": 1.2913986745101567e-05, + "loss": 0.4082, + "step": 786 + }, + { + "epoch": 3.8197665605578295, + "grad_norm": 0.0994744466895985, + "learning_rate": 1.2814391701062392e-05, + "loss": 0.416, + "step": 787 + }, + { + "epoch": 3.824617250265272, + "grad_norm": 0.09937882084294014, + "learning_rate": 1.2715108890105663e-05, + "loss": 0.4118, + "step": 788 + }, + { + "epoch": 3.829467939972715, + "grad_norm": 0.09366936781008306, + "learning_rate": 1.2616139452517748e-05, + "loss": 0.4202, + "step": 789 + }, + { + "epoch": 3.8343186296801575, + "grad_norm": 0.10103247526201467, + "learning_rate": 1.2517484524985836e-05, + "loss": 0.414, + "step": 790 + }, + { + "epoch": 3.8391693193876004, + "grad_norm": 0.10154281976161658, + "learning_rate": 1.2419145240584856e-05, + "loss": 0.4169, + "step": 791 + }, + { + "epoch": 3.8440200090950434, + "grad_norm": 0.09917419975099584, + "learning_rate": 1.2321122728764566e-05, + "loss": 0.4121, + "step": 792 + }, + { + "epoch": 3.848870698802486, + "grad_norm": 0.10067017561953691, + "learning_rate": 1.222341811533648e-05, + "loss": 0.4177, + "step": 793 + }, + { + "epoch": 3.853721388509929, + "grad_norm": 0.10318548830281854, + "learning_rate": 1.2126032522460975e-05, + "loss": 0.4211, + "step": 794 + }, + { + "epoch": 3.858572078217372, + "grad_norm": 0.09616344349182201, + "learning_rate": 1.2028967068634417e-05, + "loss": 0.4204, + "step": 795 + }, + { + "epoch": 3.8634227679248143, + "grad_norm": 0.10489574786705688, + "learning_rate": 1.193222286867628e-05, + "loss": 0.4119, + "step": 796 + }, + { + "epoch": 3.868273457632257, + "grad_norm": 0.1008569871750799, + "learning_rate": 1.1835801033716372e-05, + "loss": 0.4086, + "step": 797 + }, + { + "epoch": 3.8731241473397, + "grad_norm": 0.09122317803788128, + "learning_rate": 1.1739702671182083e-05, + "loss": 0.4214, + "step": 798 + }, + { + "epoch": 3.8779748370471427, + "grad_norm": 0.0991904412555539, + "learning_rate": 1.1643928884785618e-05, + "loss": 0.4095, + "step": 799 + }, + { + "epoch": 3.8828255267545853, + "grad_norm": 0.0959491624589887, + "learning_rate": 1.1548480774511353e-05, + "loss": 0.4218, + "step": 800 + }, + { + "epoch": 3.887676216462028, + "grad_norm": 0.09541302821779325, + "learning_rate": 1.1453359436603213e-05, + "loss": 0.4218, + "step": 801 + }, + { + "epoch": 3.892526906169471, + "grad_norm": 0.09054297930670004, + "learning_rate": 1.1358565963552039e-05, + "loss": 0.421, + "step": 802 + }, + { + "epoch": 3.8973775958769137, + "grad_norm": 0.09175434223796135, + "learning_rate": 1.126410144408312e-05, + "loss": 0.4088, + "step": 803 + }, + { + "epoch": 3.9022282855843566, + "grad_norm": 0.0933968969265613, + "learning_rate": 1.1169966963143568e-05, + "loss": 0.4105, + "step": 804 + }, + { + "epoch": 3.907078975291799, + "grad_norm": 0.09827723734859882, + "learning_rate": 1.1076163601889953e-05, + "loss": 0.4114, + "step": 805 + }, + { + "epoch": 3.911929664999242, + "grad_norm": 0.09185288445531155, + "learning_rate": 1.098269243767589e-05, + "loss": 0.4099, + "step": 806 + }, + { + "epoch": 3.9167803547066846, + "grad_norm": 0.10344811490009215, + "learning_rate": 1.0889554544039593e-05, + "loss": 0.417, + "step": 807 + }, + { + "epoch": 3.9216310444141276, + "grad_norm": 0.09584223413813131, + "learning_rate": 1.0796750990691596e-05, + "loss": 0.4092, + "step": 808 + }, + { + "epoch": 3.9264817341215705, + "grad_norm": 0.10225202685968936, + "learning_rate": 1.0704282843502459e-05, + "loss": 0.4156, + "step": 809 + }, + { + "epoch": 3.931332423829013, + "grad_norm": 0.10087206295646214, + "learning_rate": 1.0612151164490525e-05, + "loss": 0.4209, + "step": 810 + }, + { + "epoch": 3.936183113536456, + "grad_norm": 0.09495839512641314, + "learning_rate": 1.0520357011809707e-05, + "loss": 0.4193, + "step": 811 + }, + { + "epoch": 3.941033803243899, + "grad_norm": 0.10115287872844174, + "learning_rate": 1.0428901439737387e-05, + "loss": 0.415, + "step": 812 + }, + { + "epoch": 3.9458844929513415, + "grad_norm": 0.09538434619439141, + "learning_rate": 1.0337785498662223e-05, + "loss": 0.4152, + "step": 813 + }, + { + "epoch": 3.9507351826587844, + "grad_norm": 0.0955931932252973, + "learning_rate": 1.024701023507216e-05, + "loss": 0.4153, + "step": 814 + }, + { + "epoch": 3.955585872366227, + "grad_norm": 0.10045702643945939, + "learning_rate": 1.015657669154237e-05, + "loss": 0.4156, + "step": 815 + }, + { + "epoch": 3.96043656207367, + "grad_norm": 0.09335473216661304, + "learning_rate": 1.00664859067233e-05, + "loss": 0.4109, + "step": 816 + }, + { + "epoch": 3.9652872517811124, + "grad_norm": 0.09645722262367523, + "learning_rate": 9.976738915328719e-06, + "loss": 0.4107, + "step": 817 + }, + { + "epoch": 3.9701379414885554, + "grad_norm": 0.09446841411423582, + "learning_rate": 9.887336748123864e-06, + "loss": 0.4178, + "step": 818 + }, + { + "epoch": 3.9749886311959983, + "grad_norm": 0.0903235693705833, + "learning_rate": 9.798280431913558e-06, + "loss": 0.4202, + "step": 819 + }, + { + "epoch": 3.979839320903441, + "grad_norm": 0.0948091272844266, + "learning_rate": 9.709570989530493e-06, + "loss": 0.4123, + "step": 820 + }, + { + "epoch": 3.984690010610884, + "grad_norm": 0.10103242493534337, + "learning_rate": 9.621209439823388e-06, + "loss": 0.4132, + "step": 821 + }, + { + "epoch": 3.9895407003183267, + "grad_norm": 0.09199808648298305, + "learning_rate": 9.533196797645354e-06, + "loss": 0.4101, + "step": 822 + }, + { + "epoch": 3.9943913900257693, + "grad_norm": 0.09866422487619428, + "learning_rate": 9.44553407384221e-06, + "loss": 0.412, + "step": 823 + }, + { + "epoch": 3.999242079733212, + "grad_norm": 0.09950215009808663, + "learning_rate": 9.358222275240884e-06, + "loss": 0.4113, + "step": 824 + }, + { + "epoch": 4.0048506897074425, + "grad_norm": 0.16227668213643984, + "learning_rate": 9.271262404637835e-06, + "loss": 0.4032, + "step": 825 + }, + { + "epoch": 4.009701379414886, + "grad_norm": 0.11430363283166092, + "learning_rate": 9.184655460787591e-06, + "loss": 0.3988, + "step": 826 + }, + { + "epoch": 4.014552069122328, + "grad_norm": 0.11751760908320912, + "learning_rate": 9.098402438391161e-06, + "loss": 0.3943, + "step": 827 + }, + { + "epoch": 4.019402758829771, + "grad_norm": 0.13225951402360853, + "learning_rate": 9.012504328084724e-06, + "loss": 0.4024, + "step": 828 + }, + { + "epoch": 4.0242534485372135, + "grad_norm": 0.1269725744791709, + "learning_rate": 8.926962116428228e-06, + "loss": 0.4, + "step": 829 + }, + { + "epoch": 4.029104138244657, + "grad_norm": 0.12436207204015083, + "learning_rate": 8.841776785894014e-06, + "loss": 0.3994, + "step": 830 + }, + { + "epoch": 4.033954827952099, + "grad_norm": 0.12882961013897004, + "learning_rate": 8.756949314855565e-06, + "loss": 0.3977, + "step": 831 + }, + { + "epoch": 4.038805517659542, + "grad_norm": 0.11685196489455994, + "learning_rate": 8.672480677576267e-06, + "loss": 0.3906, + "step": 832 + }, + { + "epoch": 4.043656207366985, + "grad_norm": 0.106568471380297, + "learning_rate": 8.58837184419821e-06, + "loss": 0.388, + "step": 833 + }, + { + "epoch": 4.048506897074428, + "grad_norm": 0.1134401036269532, + "learning_rate": 8.504623780731056e-06, + "loss": 0.3918, + "step": 834 + }, + { + "epoch": 4.05335758678187, + "grad_norm": 0.12093411095557142, + "learning_rate": 8.421237449040962e-06, + "loss": 0.397, + "step": 835 + }, + { + "epoch": 4.058208276489314, + "grad_norm": 0.11674197768223235, + "learning_rate": 8.338213806839453e-06, + "loss": 0.393, + "step": 836 + }, + { + "epoch": 4.063058966196756, + "grad_norm": 0.10082248897884766, + "learning_rate": 8.255553807672547e-06, + "loss": 0.3897, + "step": 837 + }, + { + "epoch": 4.067909655904199, + "grad_norm": 0.11069126863357161, + "learning_rate": 8.1732584009097e-06, + "loss": 0.3882, + "step": 838 + }, + { + "epoch": 4.072760345611641, + "grad_norm": 0.11738423041846735, + "learning_rate": 8.091328531732925e-06, + "loss": 0.3959, + "step": 839 + }, + { + "epoch": 4.077611035319085, + "grad_norm": 0.10387395387726432, + "learning_rate": 8.009765141126014e-06, + "loss": 0.3891, + "step": 840 + }, + { + "epoch": 4.082461725026527, + "grad_norm": 0.10003982048853301, + "learning_rate": 7.928569165863584e-06, + "loss": 0.3909, + "step": 841 + }, + { + "epoch": 4.08731241473397, + "grad_norm": 0.10549262492820612, + "learning_rate": 7.847741538500439e-06, + "loss": 0.3875, + "step": 842 + }, + { + "epoch": 4.092163104441413, + "grad_norm": 0.10986857014715488, + "learning_rate": 7.767283187360846e-06, + "loss": 0.3929, + "step": 843 + }, + { + "epoch": 4.097013794148856, + "grad_norm": 0.09674503227632227, + "learning_rate": 7.687195036527813e-06, + "loss": 0.3928, + "step": 844 + }, + { + "epoch": 4.101864483856298, + "grad_norm": 0.10305617355184506, + "learning_rate": 7.60747800583252e-06, + "loss": 0.4002, + "step": 845 + }, + { + "epoch": 4.1067151735637415, + "grad_norm": 0.09835145173574618, + "learning_rate": 7.52813301084375e-06, + "loss": 0.3961, + "step": 846 + }, + { + "epoch": 4.111565863271184, + "grad_norm": 0.09426867245890704, + "learning_rate": 7.449160962857358e-06, + "loss": 0.3946, + "step": 847 + }, + { + "epoch": 4.1164165529786265, + "grad_norm": 0.0993123791236732, + "learning_rate": 7.370562768885823e-06, + "loss": 0.3937, + "step": 848 + }, + { + "epoch": 4.121267242686069, + "grad_norm": 0.09692548506896993, + "learning_rate": 7.292339331647848e-06, + "loss": 0.3957, + "step": 849 + }, + { + "epoch": 4.126117932393512, + "grad_norm": 0.0977639150148905, + "learning_rate": 7.214491549557898e-06, + "loss": 0.3969, + "step": 850 + }, + { + "epoch": 4.130968622100955, + "grad_norm": 0.10100358672328608, + "learning_rate": 7.1370203167160326e-06, + "loss": 0.3937, + "step": 851 + }, + { + "epoch": 4.1358193118083975, + "grad_norm": 0.0961508995875077, + "learning_rate": 7.0599265228975e-06, + "loss": 0.3965, + "step": 852 + }, + { + "epoch": 4.140670001515841, + "grad_norm": 0.09450992963252156, + "learning_rate": 6.983211053542591e-06, + "loss": 0.4008, + "step": 853 + }, + { + "epoch": 4.145520691223283, + "grad_norm": 0.10411768031595499, + "learning_rate": 6.9068747897464535e-06, + "loss": 0.4032, + "step": 854 + }, + { + "epoch": 4.150371380930726, + "grad_norm": 0.09981896937364662, + "learning_rate": 6.830918608248964e-06, + "loss": 0.4002, + "step": 855 + }, + { + "epoch": 4.155222070638169, + "grad_norm": 0.08754517232013051, + "learning_rate": 6.755343381424659e-06, + "loss": 0.3976, + "step": 856 + }, + { + "epoch": 4.160072760345612, + "grad_norm": 0.09520671649907132, + "learning_rate": 6.68014997727275e-06, + "loss": 0.3921, + "step": 857 + }, + { + "epoch": 4.164923450053054, + "grad_norm": 0.09719121632502135, + "learning_rate": 6.605339259407104e-06, + "loss": 0.3852, + "step": 858 + }, + { + "epoch": 4.169774139760497, + "grad_norm": 0.08870928687089744, + "learning_rate": 6.530912087046317e-06, + "loss": 0.395, + "step": 859 + }, + { + "epoch": 4.17462482946794, + "grad_norm": 0.08685694037296439, + "learning_rate": 6.456869315003946e-06, + "loss": 0.3941, + "step": 860 + }, + { + "epoch": 4.179475519175383, + "grad_norm": 0.08904997313439429, + "learning_rate": 6.3832117936785564e-06, + "loss": 0.3997, + "step": 861 + }, + { + "epoch": 4.184326208882825, + "grad_norm": 0.0910482544729166, + "learning_rate": 6.309940369044047e-06, + "loss": 0.3945, + "step": 862 + }, + { + "epoch": 4.189176898590269, + "grad_norm": 0.0887134263309384, + "learning_rate": 6.23705588263992e-06, + "loss": 0.3881, + "step": 863 + }, + { + "epoch": 4.194027588297711, + "grad_norm": 0.08977043998387933, + "learning_rate": 6.164559171561553e-06, + "loss": 0.3957, + "step": 864 + }, + { + "epoch": 4.198878278005154, + "grad_norm": 0.09216637353138708, + "learning_rate": 6.092451068450671e-06, + "loss": 0.3969, + "step": 865 + }, + { + "epoch": 4.203728967712596, + "grad_norm": 0.08464526503746563, + "learning_rate": 6.020732401485751e-06, + "loss": 0.3896, + "step": 866 + }, + { + "epoch": 4.20857965742004, + "grad_norm": 0.08983668958241023, + "learning_rate": 5.9494039943724845e-06, + "loss": 0.4025, + "step": 867 + }, + { + "epoch": 4.213430347127482, + "grad_norm": 0.08753368121579265, + "learning_rate": 5.878466666334341e-06, + "loss": 0.3954, + "step": 868 + }, + { + "epoch": 4.218281036834925, + "grad_norm": 0.08687937990016806, + "learning_rate": 5.80792123210316e-06, + "loss": 0.391, + "step": 869 + }, + { + "epoch": 4.223131726542368, + "grad_norm": 0.08701962255264487, + "learning_rate": 5.737768501909773e-06, + "loss": 0.3965, + "step": 870 + }, + { + "epoch": 4.2279824162498105, + "grad_norm": 0.08811499746627446, + "learning_rate": 5.668009281474751e-06, + "loss": 0.3846, + "step": 871 + }, + { + "epoch": 4.232833105957253, + "grad_norm": 0.08561633996061273, + "learning_rate": 5.598644371999085e-06, + "loss": 0.3919, + "step": 872 + }, + { + "epoch": 4.237683795664696, + "grad_norm": 0.08321419945310787, + "learning_rate": 5.5296745701549906e-06, + "loss": 0.394, + "step": 873 + }, + { + "epoch": 4.242534485372139, + "grad_norm": 0.08724643182123827, + "learning_rate": 5.4611006680768305e-06, + "loss": 0.3994, + "step": 874 + }, + { + "epoch": 4.2473851750795815, + "grad_norm": 0.08361301460174729, + "learning_rate": 5.3929234533519345e-06, + "loss": 0.388, + "step": 875 + }, + { + "epoch": 4.252235864787025, + "grad_norm": 0.0862576560444418, + "learning_rate": 5.325143709011587e-06, + "loss": 0.3942, + "step": 876 + }, + { + "epoch": 4.257086554494467, + "grad_norm": 0.082606577377262, + "learning_rate": 5.257762213522055e-06, + "loss": 0.3907, + "step": 877 + }, + { + "epoch": 4.26193724420191, + "grad_norm": 0.08601520095290771, + "learning_rate": 5.19077974077558e-06, + "loss": 0.3927, + "step": 878 + }, + { + "epoch": 4.266787933909352, + "grad_norm": 0.08144847498379731, + "learning_rate": 5.124197060081564e-06, + "loss": 0.3981, + "step": 879 + }, + { + "epoch": 4.271638623616796, + "grad_norm": 0.08369648223405692, + "learning_rate": 5.058014936157714e-06, + "loss": 0.3987, + "step": 880 + }, + { + "epoch": 4.276489313324238, + "grad_norm": 0.08487450387282452, + "learning_rate": 4.992234129121225e-06, + "loss": 0.3993, + "step": 881 + }, + { + "epoch": 4.281340003031681, + "grad_norm": 0.0835928002976722, + "learning_rate": 4.926855394480079e-06, + "loss": 0.394, + "step": 882 + }, + { + "epoch": 4.286190692739124, + "grad_norm": 0.0877663910781713, + "learning_rate": 4.861879483124372e-06, + "loss": 0.3888, + "step": 883 + }, + { + "epoch": 4.291041382446567, + "grad_norm": 0.08201902566316537, + "learning_rate": 4.797307141317666e-06, + "loss": 0.3978, + "step": 884 + }, + { + "epoch": 4.295892072154009, + "grad_norm": 0.08252391090570044, + "learning_rate": 4.7331391106884364e-06, + "loss": 0.3949, + "step": 885 + }, + { + "epoch": 4.300742761861452, + "grad_norm": 0.08121494056766716, + "learning_rate": 4.6693761282215766e-06, + "loss": 0.3922, + "step": 886 + }, + { + "epoch": 4.305593451568895, + "grad_norm": 0.08414265476669228, + "learning_rate": 4.606018926249851e-06, + "loss": 0.389, + "step": 887 + }, + { + "epoch": 4.310444141276338, + "grad_norm": 0.08528892500629966, + "learning_rate": 4.543068232445596e-06, + "loss": 0.3956, + "step": 888 + }, + { + "epoch": 4.31529483098378, + "grad_norm": 0.08280199210655267, + "learning_rate": 4.480524769812276e-06, + "loss": 0.3938, + "step": 889 + }, + { + "epoch": 4.320145520691224, + "grad_norm": 0.08884076809121294, + "learning_rate": 4.418389256676206e-06, + "loss": 0.3947, + "step": 890 + }, + { + "epoch": 4.324996210398666, + "grad_norm": 0.08902762031211295, + "learning_rate": 4.35666240667834e-06, + "loss": 0.3907, + "step": 891 + }, + { + "epoch": 4.329846900106109, + "grad_norm": 0.08464410835355753, + "learning_rate": 4.295344928765999e-06, + "loss": 0.3939, + "step": 892 + }, + { + "epoch": 4.334697589813552, + "grad_norm": 0.08347421805827179, + "learning_rate": 4.234437527184785e-06, + "loss": 0.3985, + "step": 893 + }, + { + "epoch": 4.3395482795209945, + "grad_norm": 0.08770395898608876, + "learning_rate": 4.173940901470488e-06, + "loss": 0.395, + "step": 894 + }, + { + "epoch": 4.344398969228437, + "grad_norm": 0.08139356257791996, + "learning_rate": 4.11385574644104e-06, + "loss": 0.39, + "step": 895 + }, + { + "epoch": 4.34924965893588, + "grad_norm": 0.0818047074224124, + "learning_rate": 4.054182752188501e-06, + "loss": 0.3948, + "step": 896 + }, + { + "epoch": 4.354100348643323, + "grad_norm": 0.08370905382784635, + "learning_rate": 3.994922604071217e-06, + "loss": 0.3941, + "step": 897 + }, + { + "epoch": 4.3589510383507655, + "grad_norm": 0.08543140680473625, + "learning_rate": 3.936075982705871e-06, + "loss": 0.3982, + "step": 898 + }, + { + "epoch": 4.363801728058208, + "grad_norm": 0.08330546263387466, + "learning_rate": 3.877643563959694e-06, + "loss": 0.3986, + "step": 899 + }, + { + "epoch": 4.368652417765651, + "grad_norm": 0.08181359063571672, + "learning_rate": 3.819626018942732e-06, + "loss": 0.3962, + "step": 900 + }, + { + "epoch": 4.373503107473094, + "grad_norm": 0.08458157848919085, + "learning_rate": 3.762024014000054e-06, + "loss": 0.3974, + "step": 901 + }, + { + "epoch": 4.378353797180536, + "grad_norm": 0.0797245693813596, + "learning_rate": 3.7048382107042113e-06, + "loss": 0.3849, + "step": 902 + }, + { + "epoch": 4.38320448688798, + "grad_norm": 0.08552325047075819, + "learning_rate": 3.6480692658475446e-06, + "loss": 0.3908, + "step": 903 + }, + { + "epoch": 4.388055176595422, + "grad_norm": 0.08191614537028945, + "learning_rate": 3.5917178314346955e-06, + "loss": 0.398, + "step": 904 + }, + { + "epoch": 4.392905866302865, + "grad_norm": 0.08324472646577967, + "learning_rate": 3.535784554675088e-06, + "loss": 0.3941, + "step": 905 + }, + { + "epoch": 4.397756556010307, + "grad_norm": 0.08386476178169076, + "learning_rate": 3.480270077975525e-06, + "loss": 0.395, + "step": 906 + }, + { + "epoch": 4.402607245717751, + "grad_norm": 0.08759720428686872, + "learning_rate": 3.42517503893276e-06, + "loss": 0.3879, + "step": 907 + }, + { + "epoch": 4.407457935425193, + "grad_norm": 0.0834695533465509, + "learning_rate": 3.370500070326257e-06, + "loss": 0.3832, + "step": 908 + }, + { + "epoch": 4.412308625132636, + "grad_norm": 0.080547419306159, + "learning_rate": 3.3162458001108332e-06, + "loss": 0.3858, + "step": 909 + }, + { + "epoch": 4.417159314840079, + "grad_norm": 0.08406690651169581, + "learning_rate": 3.2624128514094778e-06, + "loss": 0.3923, + "step": 910 + }, + { + "epoch": 4.422010004547522, + "grad_norm": 0.08417275645743631, + "learning_rate": 3.20900184250625e-06, + "loss": 0.3933, + "step": 911 + }, + { + "epoch": 4.426860694254964, + "grad_norm": 0.08104238775596306, + "learning_rate": 3.1560133868390895e-06, + "loss": 0.4023, + "step": 912 + }, + { + "epoch": 4.431711383962407, + "grad_norm": 0.08376361425082632, + "learning_rate": 3.1034480929928333e-06, + "loss": 0.399, + "step": 913 + }, + { + "epoch": 4.43656207366985, + "grad_norm": 0.08058350379685782, + "learning_rate": 3.0513065646921957e-06, + "loss": 0.3946, + "step": 914 + }, + { + "epoch": 4.441412763377293, + "grad_norm": 0.08013760556674378, + "learning_rate": 2.999589400794851e-06, + "loss": 0.392, + "step": 915 + }, + { + "epoch": 4.446263453084735, + "grad_norm": 0.08082216615145961, + "learning_rate": 2.948297195284546e-06, + "loss": 0.3916, + "step": 916 + }, + { + "epoch": 4.4511141427921785, + "grad_norm": 0.09007717527915819, + "learning_rate": 2.897430537264283e-06, + "loss": 0.3947, + "step": 917 + }, + { + "epoch": 4.455964832499621, + "grad_norm": 0.0866390993026153, + "learning_rate": 2.8469900109495553e-06, + "loss": 0.3942, + "step": 918 + }, + { + "epoch": 4.460815522207064, + "grad_norm": 0.08034663815912857, + "learning_rate": 2.79697619566162e-06, + "loss": 0.3888, + "step": 919 + }, + { + "epoch": 4.465666211914507, + "grad_norm": 0.08423465438674188, + "learning_rate": 2.7473896658208743e-06, + "loss": 0.391, + "step": 920 + }, + { + "epoch": 4.4705169016219495, + "grad_norm": 0.08769412223500794, + "learning_rate": 2.6982309909402293e-06, + "loss": 0.3936, + "step": 921 + }, + { + "epoch": 4.475367591329392, + "grad_norm": 0.0794092004599977, + "learning_rate": 2.649500735618582e-06, + "loss": 0.3993, + "step": 922 + }, + { + "epoch": 4.480218281036835, + "grad_norm": 0.08321318361659834, + "learning_rate": 2.6011994595343516e-06, + "loss": 0.3965, + "step": 923 + }, + { + "epoch": 4.485068970744278, + "grad_norm": 0.08400144661884966, + "learning_rate": 2.5533277174389916e-06, + "loss": 0.3927, + "step": 924 + }, + { + "epoch": 4.48991966045172, + "grad_norm": 0.08039773750467258, + "learning_rate": 2.5058860591506973e-06, + "loss": 0.3927, + "step": 925 + }, + { + "epoch": 4.494770350159163, + "grad_norm": 0.08132175209524008, + "learning_rate": 2.4588750295480246e-06, + "loss": 0.3888, + "step": 926 + }, + { + "epoch": 4.499621039866606, + "grad_norm": 0.07920562392368859, + "learning_rate": 2.4122951685636674e-06, + "loss": 0.3896, + "step": 927 + }, + { + "epoch": 4.504471729574049, + "grad_norm": 0.07833571502263627, + "learning_rate": 2.366147011178246e-06, + "loss": 0.398, + "step": 928 + }, + { + "epoch": 4.509322419281491, + "grad_norm": 0.08232920047142565, + "learning_rate": 2.320431087414159e-06, + "loss": 0.3838, + "step": 929 + }, + { + "epoch": 4.514173108988935, + "grad_norm": 0.08136833742803433, + "learning_rate": 2.275147922329506e-06, + "loss": 0.3935, + "step": 930 + }, + { + "epoch": 4.519023798696377, + "grad_norm": 0.08383396678636225, + "learning_rate": 2.230298036012055e-06, + "loss": 0.3913, + "step": 931 + }, + { + "epoch": 4.52387448840382, + "grad_norm": 0.08000391439211, + "learning_rate": 2.1858819435732583e-06, + "loss": 0.395, + "step": 932 + }, + { + "epoch": 4.528725178111262, + "grad_norm": 0.080147749223563, + "learning_rate": 2.141900155142351e-06, + "loss": 0.3951, + "step": 933 + }, + { + "epoch": 4.533575867818706, + "grad_norm": 0.07978655829531454, + "learning_rate": 2.0983531758604726e-06, + "loss": 0.4011, + "step": 934 + }, + { + "epoch": 4.538426557526148, + "grad_norm": 0.08386421814730027, + "learning_rate": 2.055241505874892e-06, + "loss": 0.3999, + "step": 935 + }, + { + "epoch": 4.543277247233591, + "grad_norm": 0.08174904946083562, + "learning_rate": 2.0125656403332396e-06, + "loss": 0.3968, + "step": 936 + }, + { + "epoch": 4.548127936941034, + "grad_norm": 0.07927025601942647, + "learning_rate": 1.970326069377828e-06, + "loss": 0.4001, + "step": 937 + }, + { + "epoch": 4.552978626648477, + "grad_norm": 0.0783638905343862, + "learning_rate": 1.928523278140033e-06, + "loss": 0.3943, + "step": 938 + }, + { + "epoch": 4.557829316355919, + "grad_norm": 0.08012821453349714, + "learning_rate": 1.887157746734718e-06, + "loss": 0.3972, + "step": 939 + }, + { + "epoch": 4.562680006063362, + "grad_norm": 0.08022389886437123, + "learning_rate": 1.846229950254692e-06, + "loss": 0.3888, + "step": 940 + }, + { + "epoch": 4.567530695770805, + "grad_norm": 0.07938938767749412, + "learning_rate": 1.8057403587652977e-06, + "loss": 0.3892, + "step": 941 + }, + { + "epoch": 4.572381385478248, + "grad_norm": 0.07979264917062728, + "learning_rate": 1.7656894372989785e-06, + "loss": 0.3991, + "step": 942 + }, + { + "epoch": 4.57723207518569, + "grad_norm": 0.07900416574598519, + "learning_rate": 1.726077645849955e-06, + "loss": 0.4033, + "step": 943 + }, + { + "epoch": 4.5820827648931335, + "grad_norm": 0.0816244017270053, + "learning_rate": 1.6869054393689265e-06, + "loss": 0.394, + "step": 944 + }, + { + "epoch": 4.586933454600576, + "grad_norm": 0.07678354405433441, + "learning_rate": 1.6481732677578798e-06, + "loss": 0.4026, + "step": 945 + }, + { + "epoch": 4.5917841443080185, + "grad_norm": 0.07913436605637802, + "learning_rate": 1.60988157586488e-06, + "loss": 0.378, + "step": 946 + }, + { + "epoch": 4.596634834015462, + "grad_norm": 0.0793297266554538, + "learning_rate": 1.5720308034789721e-06, + "loss": 0.391, + "step": 947 + }, + { + "epoch": 4.601485523722904, + "grad_norm": 0.07767980761029898, + "learning_rate": 1.5346213853251546e-06, + "loss": 0.3978, + "step": 948 + }, + { + "epoch": 4.606336213430347, + "grad_norm": 0.08494507410525762, + "learning_rate": 1.4976537510593646e-06, + "loss": 0.3995, + "step": 949 + }, + { + "epoch": 4.61118690313779, + "grad_norm": 0.08237577571806884, + "learning_rate": 1.4611283252635412e-06, + "loss": 0.4038, + "step": 950 + }, + { + "epoch": 4.616037592845233, + "grad_norm": 0.07590194142960284, + "learning_rate": 1.425045527440756e-06, + "loss": 0.3956, + "step": 951 + }, + { + "epoch": 4.620888282552675, + "grad_norm": 0.07954982455169565, + "learning_rate": 1.3894057720104104e-06, + "loss": 0.399, + "step": 952 + }, + { + "epoch": 4.625738972260118, + "grad_norm": 0.07731849776688487, + "learning_rate": 1.354209468303429e-06, + "loss": 0.3828, + "step": 953 + }, + { + "epoch": 4.630589661967561, + "grad_norm": 0.07970299041030604, + "learning_rate": 1.3194570205576284e-06, + "loss": 0.3954, + "step": 954 + }, + { + "epoch": 4.635440351675004, + "grad_norm": 0.07874124868840192, + "learning_rate": 1.2851488279130053e-06, + "loss": 0.3876, + "step": 955 + }, + { + "epoch": 4.640291041382446, + "grad_norm": 0.07691612719760402, + "learning_rate": 1.2512852844071933e-06, + "loss": 0.3949, + "step": 956 + }, + { + "epoch": 4.64514173108989, + "grad_norm": 0.08126016720695953, + "learning_rate": 1.2178667789709287e-06, + "loss": 0.3919, + "step": 957 + }, + { + "epoch": 4.649992420797332, + "grad_norm": 0.08002643782323322, + "learning_rate": 1.1848936954235702e-06, + "loss": 0.395, + "step": 958 + }, + { + "epoch": 4.654843110504775, + "grad_norm": 0.08026194265591635, + "learning_rate": 1.1523664124687284e-06, + "loss": 0.3997, + "step": 959 + }, + { + "epoch": 4.659693800212217, + "grad_norm": 0.07660352848559206, + "learning_rate": 1.1202853036898476e-06, + "loss": 0.3974, + "step": 960 + }, + { + "epoch": 4.664544489919661, + "grad_norm": 0.08113236962163348, + "learning_rate": 1.0886507375459908e-06, + "loss": 0.3981, + "step": 961 + }, + { + "epoch": 4.669395179627103, + "grad_norm": 0.07701309756204706, + "learning_rate": 1.0574630773675687e-06, + "loss": 0.3839, + "step": 962 + }, + { + "epoch": 4.674245869334546, + "grad_norm": 0.07891978078549244, + "learning_rate": 1.0267226813521635e-06, + "loss": 0.3877, + "step": 963 + }, + { + "epoch": 4.679096559041989, + "grad_norm": 0.07852321868608765, + "learning_rate": 9.964299025604274e-07, + "loss": 0.3921, + "step": 964 + }, + { + "epoch": 4.683947248749432, + "grad_norm": 0.07818107376466682, + "learning_rate": 9.66585088912022e-07, + "loss": 0.3967, + "step": 965 + }, + { + "epoch": 4.688797938456874, + "grad_norm": 0.076600770628096, + "learning_rate": 9.371885831816319e-07, + "loss": 0.395, + "step": 966 + }, + { + "epoch": 4.6936486281643175, + "grad_norm": 0.07627250485843899, + "learning_rate": 9.082407229950018e-07, + "loss": 0.3976, + "step": 967 + }, + { + "epoch": 4.69849931787176, + "grad_norm": 0.07905168555654667, + "learning_rate": 8.797418408251101e-07, + "loss": 0.3918, + "step": 968 + }, + { + "epoch": 4.7033500075792025, + "grad_norm": 0.07625038396328788, + "learning_rate": 8.516922639882819e-07, + "loss": 0.3897, + "step": 969 + }, + { + "epoch": 4.708200697286646, + "grad_norm": 0.08055085830124646, + "learning_rate": 8.2409231464049e-07, + "loss": 0.3901, + "step": 970 + }, + { + "epoch": 4.713051386994088, + "grad_norm": 0.07599467665769233, + "learning_rate": 7.969423097736162e-07, + "loss": 0.3931, + "step": 971 + }, + { + "epoch": 4.717902076701531, + "grad_norm": 0.08049982038815076, + "learning_rate": 7.702425612118269e-07, + "loss": 0.3962, + "step": 972 + }, + { + "epoch": 4.7227527664089735, + "grad_norm": 0.07817439712988589, + "learning_rate": 7.439933756079942e-07, + "loss": 0.3913, + "step": 973 + }, + { + "epoch": 4.727603456116417, + "grad_norm": 0.08001209525722262, + "learning_rate": 7.181950544401695e-07, + "loss": 0.3935, + "step": 974 + }, + { + "epoch": 4.732454145823859, + "grad_norm": 0.07544329449164154, + "learning_rate": 6.928478940081107e-07, + "loss": 0.3984, + "step": 975 + }, + { + "epoch": 4.737304835531302, + "grad_norm": 0.07792056514995602, + "learning_rate": 6.679521854299032e-07, + "loss": 0.3914, + "step": 976 + }, + { + "epoch": 4.742155525238745, + "grad_norm": 0.07777159770613211, + "learning_rate": 6.435082146385885e-07, + "loss": 0.3901, + "step": 977 + }, + { + "epoch": 4.747006214946188, + "grad_norm": 0.07684966968716175, + "learning_rate": 6.195162623789052e-07, + "loss": 0.393, + "step": 978 + }, + { + "epoch": 4.75185690465363, + "grad_norm": 0.07663626226452194, + "learning_rate": 5.959766042040426e-07, + "loss": 0.3879, + "step": 979 + }, + { + "epoch": 4.756707594361073, + "grad_norm": 0.07653692258850123, + "learning_rate": 5.728895104724963e-07, + "loss": 0.3959, + "step": 980 + }, + { + "epoch": 4.761558284068516, + "grad_norm": 0.07731590848782262, + "learning_rate": 5.502552463449418e-07, + "loss": 0.3984, + "step": 981 + }, + { + "epoch": 4.766408973775959, + "grad_norm": 0.07715742201671594, + "learning_rate": 5.280740717812149e-07, + "loss": 0.3977, + "step": 982 + }, + { + "epoch": 4.771259663483401, + "grad_norm": 0.07733908081214975, + "learning_rate": 5.063462415372967e-07, + "loss": 0.3948, + "step": 983 + }, + { + "epoch": 4.776110353190845, + "grad_norm": 0.07797117300936077, + "learning_rate": 4.850720051624124e-07, + "loss": 0.3914, + "step": 984 + }, + { + "epoch": 4.780961042898287, + "grad_norm": 0.07721734718928677, + "learning_rate": 4.642516069961556e-07, + "loss": 0.392, + "step": 985 + }, + { + "epoch": 4.78581173260573, + "grad_norm": 0.07648551851063208, + "learning_rate": 4.438852861656751e-07, + "loss": 0.3951, + "step": 986 + }, + { + "epoch": 4.790662422313172, + "grad_norm": 0.07521119037010907, + "learning_rate": 4.2397327658294076e-07, + "loss": 0.3899, + "step": 987 + }, + { + "epoch": 4.795513112020616, + "grad_norm": 0.07655879860272995, + "learning_rate": 4.045158069420474e-07, + "loss": 0.3963, + "step": 988 + }, + { + "epoch": 4.800363801728058, + "grad_norm": 0.07622760847546149, + "learning_rate": 3.8551310071659023e-07, + "loss": 0.3975, + "step": 989 + }, + { + "epoch": 4.805214491435501, + "grad_norm": 0.0750428400819878, + "learning_rate": 3.6696537615711124e-07, + "loss": 0.3968, + "step": 990 + }, + { + "epoch": 4.810065181142944, + "grad_norm": 0.07852243689578567, + "learning_rate": 3.4887284628857266e-07, + "loss": 0.3932, + "step": 991 + }, + { + "epoch": 4.8149158708503865, + "grad_norm": 0.0771348195411035, + "learning_rate": 3.3123571890791405e-07, + "loss": 0.3887, + "step": 992 + }, + { + "epoch": 4.819766560557829, + "grad_norm": 0.07614331045752255, + "learning_rate": 3.1405419658168125e-07, + "loss": 0.394, + "step": 993 + }, + { + "epoch": 4.824617250265272, + "grad_norm": 0.07563944264490313, + "learning_rate": 2.973284766436857e-07, + "loss": 0.3917, + "step": 994 + }, + { + "epoch": 4.829467939972715, + "grad_norm": 0.07503164664083585, + "learning_rate": 2.810587511927354e-07, + "loss": 0.3901, + "step": 995 + }, + { + "epoch": 4.8343186296801575, + "grad_norm": 0.07663595734772072, + "learning_rate": 2.652452070904499e-07, + "loss": 0.3923, + "step": 996 + }, + { + "epoch": 4.839169319387601, + "grad_norm": 0.07606961706547127, + "learning_rate": 2.498880259590797e-07, + "loss": 0.3944, + "step": 997 + }, + { + "epoch": 4.844020009095043, + "grad_norm": 0.0761182148197196, + "learning_rate": 2.3498738417945034e-07, + "loss": 0.3975, + "step": 998 + }, + { + "epoch": 4.848870698802486, + "grad_norm": 0.08039104985634041, + "learning_rate": 2.205434528889283e-07, + "loss": 0.3971, + "step": 999 + }, + { + "epoch": 4.853721388509928, + "grad_norm": 0.07775606427920397, + "learning_rate": 2.0655639797944937e-07, + "loss": 0.3903, + "step": 1000 + }, + { + "epoch": 4.858572078217372, + "grad_norm": 0.07610940999590161, + "learning_rate": 1.9302638009561782e-07, + "loss": 0.396, + "step": 1001 + }, + { + "epoch": 4.863422767924814, + "grad_norm": 0.07569450912275462, + "learning_rate": 1.7995355463285457e-07, + "loss": 0.3965, + "step": 1002 + }, + { + "epoch": 4.868273457632257, + "grad_norm": 0.07643720956773195, + "learning_rate": 1.6733807173562988e-07, + "loss": 0.3913, + "step": 1003 + }, + { + "epoch": 4.8731241473397, + "grad_norm": 0.07571887859535044, + "learning_rate": 1.5518007629571342e-07, + "loss": 0.3995, + "step": 1004 + }, + { + "epoch": 4.877974837047143, + "grad_norm": 0.07657090064859913, + "learning_rate": 1.4347970795054456e-07, + "loss": 0.3967, + "step": 1005 + }, + { + "epoch": 4.882825526754585, + "grad_norm": 0.07475277823538463, + "learning_rate": 1.3223710108158483e-07, + "loss": 0.3965, + "step": 1006 + }, + { + "epoch": 4.887676216462028, + "grad_norm": 0.07465351831333361, + "learning_rate": 1.214523848128124e-07, + "loss": 0.3971, + "step": 1007 + }, + { + "epoch": 4.892526906169471, + "grad_norm": 0.07637388169909817, + "learning_rate": 1.111256830092211e-07, + "loss": 0.3996, + "step": 1008 + }, + { + "epoch": 4.897377595876914, + "grad_norm": 0.07639665552172381, + "learning_rate": 1.0125711427540374e-07, + "loss": 0.3949, + "step": 1009 + }, + { + "epoch": 4.902228285584356, + "grad_norm": 0.07373092012101537, + "learning_rate": 9.184679195417989e-08, + "loss": 0.3889, + "step": 1010 + }, + { + "epoch": 4.9070789752918, + "grad_norm": 0.07583698163385665, + "learning_rate": 8.289482412531246e-08, + "loss": 0.3984, + "step": 1011 + }, + { + "epoch": 4.911929664999242, + "grad_norm": 0.07647787343235872, + "learning_rate": 7.440131360424652e-08, + "loss": 0.3887, + "step": 1012 + }, + { + "epoch": 4.916780354706685, + "grad_norm": 0.07751142464425709, + "learning_rate": 6.636635794094126e-08, + "loss": 0.3908, + "step": 1013 + }, + { + "epoch": 4.921631044414128, + "grad_norm": 0.07884353160777417, + "learning_rate": 5.879004941874655e-08, + "loss": 0.3951, + "step": 1014 + }, + { + "epoch": 4.9264817341215705, + "grad_norm": 0.07661585400143268, + "learning_rate": 5.16724750533415e-08, + "loss": 0.398, + "step": 1015 + }, + { + "epoch": 4.931332423829013, + "grad_norm": 0.07506936516416932, + "learning_rate": 4.5013716591730815e-08, + "loss": 0.3944, + "step": 1016 + }, + { + "epoch": 4.9361831135364564, + "grad_norm": 0.07625120541429038, + "learning_rate": 3.881385051132114e-08, + "loss": 0.3997, + "step": 1017 + }, + { + "epoch": 4.941033803243899, + "grad_norm": 0.0754548388472603, + "learning_rate": 3.307294801902838e-08, + "loss": 0.3968, + "step": 1018 + }, + { + "epoch": 4.9458844929513415, + "grad_norm": 0.07563871272528049, + "learning_rate": 2.7791075050460636e-08, + "loss": 0.3977, + "step": 1019 + }, + { + "epoch": 4.950735182658784, + "grad_norm": 0.0760975342061979, + "learning_rate": 2.2968292269167637e-08, + "loss": 0.3978, + "step": 1020 + }, + { + "epoch": 4.955585872366227, + "grad_norm": 0.07484229156933196, + "learning_rate": 1.8604655065939116e-08, + "loss": 0.3888, + "step": 1021 + }, + { + "epoch": 4.96043656207367, + "grad_norm": 0.07489129192172529, + "learning_rate": 1.470021355816975e-08, + "loss": 0.3952, + "step": 1022 + }, + { + "epoch": 4.965287251781112, + "grad_norm": 0.07561234415729748, + "learning_rate": 1.1255012589286297e-08, + "loss": 0.3988, + "step": 1023 + }, + { + "epoch": 4.970137941488556, + "grad_norm": 0.07589712959511802, + "learning_rate": 8.269091728232426e-09, + "loss": 0.3858, + "step": 1024 + }, + { + "epoch": 4.974988631195998, + "grad_norm": 0.07684966203710471, + "learning_rate": 5.742485269006892e-09, + "loss": 0.3976, + "step": 1025 + }, + { + "epoch": 4.979839320903441, + "grad_norm": 0.07450707523151534, + "learning_rate": 3.6752222302727238e-09, + "loss": 0.3922, + "step": 1026 + }, + { + "epoch": 4.984690010610883, + "grad_norm": 0.0754634711281639, + "learning_rate": 2.06732635503748e-09, + "loss": 0.3894, + "step": 1027 + }, + { + "epoch": 4.989540700318327, + "grad_norm": 0.07460842756020492, + "learning_rate": 9.188161103557136e-10, + "loss": 0.3893, + "step": 1028 + }, + { + "epoch": 4.994391390025769, + "grad_norm": 0.07411367814575705, + "learning_rate": 2.2970468714245132e-10, + "loss": 0.3934, + "step": 1029 + }, + { + "epoch": 4.999242079733212, + "grad_norm": 0.07533391242414708, + "learning_rate": 0.0, + "loss": 0.3877, + "step": 1030 + }, + { + "epoch": 4.999242079733212, + "step": 1030, + "total_flos": 2.739131934768418e+19, + "train_loss": 0.07882811409755817, + "train_runtime": 48155.7887, + "train_samples_per_second": 10.958, + "train_steps_per_second": 0.021 + } + ], + "logging_steps": 1, + "max_steps": 1030, + "num_input_tokens_seen": 0, + "num_train_epochs": 5, + "save_steps": 500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 2.739131934768418e+19, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..a72a942 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cdd74b8dc9324cdf25abb39f6ea4cc3ababb5e10ad349faedede805a21838c6 +size 7416 diff --git a/training_loss.png b/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..2410f82da300f770aaf575a0fe0d1c0878eeb315 GIT binary patch literal 39178 zcmd?Rc{r7A`!;-;=P9#fC{z;4JPQp}N-2^th0K}fAw-#qP#Gg3u{5mA^OOq7uw@3Y>Lob7B%XS6kN_Z`+@2B2_zg&fC8=mcnT=UShjBCx%fiAPoK|Pj}je zeeb_SMaWeT9z2+?{eb8({2@Em3=@E#r*Cs$577%b|6lp@T|FXketsee%NE-o@5~#c z>bu{WC*l<&U6se}Y3O;CBNj&+5ApF~F#={AOXGP)0$9~@s|tf=j6o^KY*&onc|Og3 zQM@XCEsZTna?DgzRL#b(m)knlZrIz4=9kXN2L}hM#t3{%l)?S{O5UM3;J>waHaw}4 zKV?nx)TwH+a#8GDOz>o?|IU4rgkKj7Bp5zQYQ{JY`mRY?4_eR#?3b~xgX=}d#KcS} z9>>4ul&~;uO;K9k9Ndk{JfCoDVW`?tX`;slS6}y#Ink#%l-G~r=+UDWm3M3heAkRb zZoD5WYgrudo*(`@gFBlbYQ(4c<3{b-d-qQ03bQKjZY?jD*jtV|6*IE2Js_C)m!EFg z{jSbnwldx6G4k+mfy>mD3(v%fj_Ktq+Bn{wB3N0jeL03pTH{UhUi}>?pxOQY&iQ4Q zN54e;wpa8FT|2LZg@*@eXQ|)5Eg*E^SpeOB>GeMU(S}G4DQgy5a*~6G4lP!ZFr>YG z`*y(ZdM<0U%8qP$M#f9R%n6rYm){zdu9kgyBah3N=`Ol=$k=0;>>I3UU|?Xgr!}VP zFG-D0Mwp6zNFy~kNwN_mEd}!$t84a81a7~CMZQ${3u31XqW5-@z zk(#xch|@E!b|n~v9=-Zna^vr@>u*&(JY*lxa{d@|W=sxO52Zi#^70VGgBq;Nqww&> zsjSqIk#MnwN36%h&1y(J2a^@tN8W!GRd;eaInk0Fel<&bn0I%b0!83_K4-S*p;&PwC#*7}?oAZ*1Q1{87F`dI9xgGY`~&UEDkHQgp2n)~9kIa_Gn z{6fmpE1|IKTPFD7n|NCbusFBB;7Q)~5%8kT4s`ZV@)W(cxWoqo) zg$uy~n#SAVinBjS}QgS`KMjj_Ysr zbsQ=;mM1gZ=Lg_-l+@HUL)Afxsk>WeE6P89WPu3d+qZ9DTBkJ=4^Pxru}bdVLI)Ka zPPgCPfyeTTh=pRQ&SWqp7`bu!?QXkotU_7fSzKJi0?zXKvcw2Ty%{7xygZJHIXJK2 zJaK^|@(j0v8|~e@cNdnI)m>a9jeQnRQ}X-p@G>$Et>`uXU70y?`!gdvipy*dYdE{u zs^=_Z97lq&*U_5V+LxWyPhw*3uMK#&+N1^tlm6~4WT@O)3g41nQH(x)`n1Q`le6Co z9ZcXd&n^fV!VY)iZS=}*>Khwn{)X3&JDGL9xn}&bdpTttA{p+AxZF5;xHi-r>Jt`F zAI_d}v(WzglnaM~n{9c87u43%smi_u5JC~066EATMExbMv4aY5Nty@r2dLrADN5cW zP{3quY%b*fbR3r;K|L6Bl z=H2y1m1(8Ml+ALV4W~a-?Gy%iY!IyRDh$&G?{0+aNKC^n`qYF5sSzv=j#IUC7i$7l)% zymGg?1%-r0pt3w@wpf<$vc{*ZEK_3@yF1U-{cjQpg z(8Q+BWTkk0nH(LyH&RFCGSfxp`}fZ&XcGZ12<@Njdc|+mQT|%-5)cylOIz&e=~=YW zb(4vSi6~h+bZ2{WH1?8mPN7M^azM&X*x4xVCpRAv6BCQubcyKd>Utc|Gd7O8q`Xl# z<4MG|`&{qJmHUzVWxn8&p}48X2yBh=?pAHiS4QU>m8#`--unEQzq`aWx3zJlWF}wT z(NWw*{s1`xPsDu1W{VAPtBuw6-xZIcKnm0qs;X4`JSUS2e%c;6dbAqWmWhQWI4zA& zakblgWq={lcQ7e((pef-=IZMUfo)bA`uZF^o?}nE<_8=6CR4t8uh1lIgz3P6NbmV_g5{b-tFzH&X)k+j=cCCKZ+eK0pzFD(4Gp<@ zynmn2&+8KE5AA^tQd3h?_Qmp@eu3Mp!PdB#|C3tYA$qqn8Ev__-=R8EWnOuxFju5L z@Vb4PLnkcaHX9;ZYMi!T4}ey2{!uVHKZwg_&n?mih!U0<;?dLE1q zO3<#S(II7J<8RMSsPAl#Mys%4bya~R^_dCA!V|5jVmyB9W-oPx>pOC;mPZ|su!!J* zf44SURdz*q6|BDVEq2{>cnG;}459ht#fxdz-=*^v$FQ)rjI-hH1Dkxo4m)`t%tLfAYS^xrk29QM;5^qM(Nq}t~(8hLB#N9IVPLxtST_H1Wv0xB6} zgO=Z(@w><;{~9PSE!vn!tVhcQ{qZOkW|`vodSH=R=mI0b$US*$bFRNM#2CkJRN}(q zJn@Z5to%<5fKNtw8ubUXOpt*r4&^KH&s6*?I8^+~Fg`XBeZKkSW|_e-NZGbr zJ+Tef5{qUo{$NHZH>^gbZmj;By@Pcl_2Kp5ViiYj-MXcrsv7Y5%NOef<;{%^Po+lJ z?VZhe;(+c_cU&1=z%K$W6;KN^uHx?-kCjfn)9~tFKQhDh3rqvgX=*Y#RBXKV_&b#q zf=aWY(?fz>V+7|RKrIlQNgjXN&em^jET7iWdURPhZsbF&GV_xsPe!0yu`f?F$Ib`U z-+B_gR_1^580YO2kplUv9YU;Ap=9U(=7y(aT zHpT5f?Zg4kWbdV;yDu7#zp3Hk@{y8`ZpDjU>->3Ce}k{&uoMpZmF`{tyjZyafRuyK zfcT?$l!W6&jfAl|mFT$KPynHGlcC4@z>4sdyN`kjo+l zAI~W+f0IDz!otq(tuzq1QTCTmxg#i`xex8~@?+VvEC}yk9o2>FS1!jop5EJ-1$+K}lf1bMn9muRm5qst9urIB)kkw{{-; zit;ga=g;9qDB6#D?Mp9WjOe;$gFiCQhX4}II2*m{WgKj^WjSD(>MNux90%2oNsSUV zli#EiB5MRsFlNS8?v%i4vc7xwuEyd+QzOK$9w{kl*wd#hi-5r&0y+$XpwmAWGq%Dx z>#0pa%fSaYn2$}=@Q8iIhQ-EC1ecUnpG*72k$(5VIF)7PjWOnpb!X4L8u|%f!$|y1 zdnO2tl%mxh8`yWaU9Z{R?)kok3cdZyzCZM#YCsa4iQwQL@EE0AToaoBt0eNg4g@~Hea3| zRm*4#gK+rLtDUNRd~18VzMkDg#9`UTsse60Qhpw$M2I~Y%D(nmK&8XNpxT-YOgI(S zLB|h1ld<@BpRkx1yL_^?&(>n2@tw{omk}7wmOgE7uF+&(xgmyi`5vd@*Dx@6aZXEX zsizA7Y-+2~wQF%(>)y9--=@sFehiRYJ^B3FPvRkoR>e`)XTgq@hd&zR5jO8Ej?@ze zghfRBp|(k3c-*rY#VK(HW8B?n^&hjNVBmQ=XoFYr(8C!Yhq{tqL7awboNrN>XCV(d zrF-pKQ|~l+)%e#08f;`d!DLl_71}>@jKIS~XQMp&9U{++;_Vr}k7v;@z^6f1Ob$*WamV=R_9fZ)9F`$H==W^B^UgOASJ3_Kdl2uRYQoDd(1Bm4rG zfVvUnjopGlEF~-z<6XGRW;6@ z4d+*X5SE^P5NEE4%aR%NxjJBhH>eLFBGK^hDB7x*hk=5q>X_qCTj>)%>yBoUT;;}v z5GyzBi|c242!_s)lvGrUJzd|u-@Hrpg!g|Sc=s*eVB5EE#B~q>OCr@R=-F|FMgZ{B z9R@3mah?!kD5Xl==S3Zs6|(?R8%J*}4A+JTXpX?t7E>t4P0zG{|ID@5|IO98$){N{ z8J_^+NUxUnbkE0rkn>qDxO{|V1jdS-HM!rOK1!)X0Ke9HEUWL65eKaQ%7`A@WZ~fv zC8y;WS~)PEqo1>_C}LEidxV7=H-DQySpTEd6O2#Vw)^|9&7mjp@j}?==;37dfuk^G zj`voskI=xK!x+C3Rlf6g=Jf5`ueQAB2g+xZWYj3%ISeWjsiJ~BaD8+6H&jM8>JT*; z|LZI{#ePYOn>R!(%2{jU2w!)_L`5I`v~Bp+ma)Gxf(mo*yBDg*+zdYsyT}7FefWV# z0Z=7wClHc=e8@hXEI?&vog^eAqzKZjTwVgj+L_CjFK2wwBf#W`5KE`eZAq?sjR)L^ z))z;+EB#e4_sUY}bQ`uQ3zW39bra2r_aLv&m<&$2+=7|!*~vT9P=Ll}b#!!!rd}r& z_-%XXi^L1{Neo^z=fP7v@p!>zE1jsGt-^9C+>V=>QCy0(TZ>|ZYVBhD3BH2h%y*dUM_4*~ZI96tQDF==YO z#9GBKGcyx$0LZ+Be@=v>3@yOV7m$=Oe?+)NhRGwXU z?KOV0*hx^dcx+#>Ayh^ZTj~9CmAihpwXGlqWqsTQsI;tq*XE;b@{3;&*iE({emiH= z0h1L_P0tiP-?uU?x#CL$#gsBtWM zIY_$fuFmy`!&2}8tA&bjYpYnCRtS{-t2;&+Z9`BDG>naTVBR3F+D_6qb7rJrzr)kD ztGS&^zv_Vm82`q=7f?D^@^xkn@MlIrL4i)HLgdD`<<9XM^PZ1)jn~TOEd6wJnEd`u z9lnq(f6b49g@q-ppnwr}L)K?q{Qdj)Wi6h7y}gtsfcFStBt{cc*~J`PL{=H&7M*gMy#rk6vpyV(hI3eXZu(Fk z?>lz{u|f0wfKPo&Ee9X0=K6{<@RLHDRYov*{ZIQPSUcL(J7sA^;wMhDO|I^4&-=diBX7!~74c zN3A|1g2-=c-RsaU3v~z~lmz?ptBnLJ`}-*mI4%goGa4GfhF!pgxxi-);Cx-tHMD(XQiTW2T#{ zv&xkb(-k|4ych1>yQf@8@V(gB(9pH{o`I6m>d&I&deBhyfWIzhuqceX*MDT}ia&jdR;j%xJPvu}@j<@Ku6&s*^_YY%~u-p7<tx8?yTVa&45DO>#@Anu14Q=s$6NPiq1wD1AkfsTnYkx zFn&>6%WST%7%{nLGOD4%qxn?Ix+g}@*psYPahcY>c$^K5hLrU557b^(K_%-R zyL$<-ABZ&rZe_*Z=GO|Ln=rn?V{%hdld2(tlO(n&nBByO3Ffm9?X23>+1|zV(P){O zk7AKWQ?n+9d?sRTsV0}X$Xfgcm7wq(;=yFs} zErpFnl@-`DAM%F{$~)1DOJS|o$0*>B$l8{^LE>at+#Nopbr3i~0Bm*%0$uUIGB@ZR(` z!GH`EaGUEx@ZJ=0IrQ|aH}Zj;zj*ih#&j+&t$nJ%YsDHT+yd-ckz9D!?G&8?m|qtE z61&TC%ld7}0ux7g<@`D;i_klF_tvr@GX~iyZr3AuAyJx6I+4!*Z+q$jV3Gru6c>XH zxA(KMhIr2vQy>Nv^1!j}H2d(p|E_lsk+_HmEqTz(>XS!U9to8X%}7Uf0`PSF-F;$1 zOt?zPWFJ;6MQNHu2wY3$e_q7d}!r%R+Ye_g7$*sRuzoe{BK7ZkpSEAT#H#|HH z<;gH;({s+>9JdMGM>X@xaEkX_U}dF>eaX~ougxSV5aZ+H#`pk8a=0ASC>cZ11ij-! z8;XRAq^Zp@+f+~B*sYd$=~Ei7Dj`?~G+U^jIrCsEsdMM;g5)^yTzp7G1T9R}gEJ+iZnHHI|6RAPl3%-iU5zsE z$B!$($00URIF1^08;aN3$)0reNo9X^0L{G0%tX)wqUUKLudE}MtB1>XuT-2|1x%%^(hWiDQ=uKFb*H@2 z7PZ|}e_yEwIE!zez7R$&Km1&Px|Ooh{gC-^&6JCmQX{qih2vDrE1}Lao6|CK_IM~^b!`|vSl)58%{!>`}zKkabt6;3NH*b0F33bHhURO=Gz*4CdMZwq`Sw{ zPXIlB!tJ*{uxH(tvk|zX-Y?z=4#-%x_YD>|Z}^@B5DK8Z3~Kd?0kbIadB}+#KatQH;4wC z>jeb`*P)s)va^T6o?>%z7zk&zS*d=HAP_wVLG4R_`<51obY-(Jw*|FN)ghkG;e$cm zI@D66prsO(!g#I^g^`|HHlQi?Fk$8}rKB@m+9b(HPF6|{olGBwH;CN(!__OjFt3Wc z&lw_xPp0368A?roLXl-7pVr20FPj#F>i_y1Ww*2cE@17 zcW~#y?q=m~EvuekAO(*H26_k*dmcY|5(t!<)=sY1*7_n0taYEC90EE!kc5IB1>ZBt zyZd0c)&Zs(csxV*e%D`vl`0Wu4*9JQQ`q*GumbNk!TEIonyUG14;~4KbH$T9*}B58 zDIC{x@lEILlXLD~$ZAJ2#IqCTfYMxQoXS*XH2Ui~?|1t`bHF4X8{-K?n4XajzM*<-dr3(9;Xps5^ zQ?w6|W@xh1qf<3XX?>5j2#`9Em1xxA@`dP-6Y^F{%G>N6LzX z11OkuZpBt_LulAz5VW2L%9Tq>C@q(1@AV1XC4FzsY@^k`jf` z7qHb&Hbrtft;@ESz7{RFDBPRMOt=LT)925hs~UOz4d<7)CK4SQU}lSg`HDtmcT3_- z6gO2?`$K^7BamhY;_k{)n5_c=a{^RjlyCYK zKE-PSJC@vyeWZKL`@@G!)FCxCkEqt4SyzvOz{UbPGrK|F^*_^{=g}Q3xe(!{BLVZEamH_l!-Qzv&J*Xtnf5!VHB?=7g? z$|i@vijj;o0#Gs!^7EfUIC=zx=r=O`n!sa08H<7GWbMViv^Q_G6d@Xsa00O51SrSv z?zX@7!tu6ltF4IdmZ+o+bU*-x%SliKn$u%Agnew%3NXnn0EWtgmcZnU06)uo;=~C=bwc$;6E9Bgn@?Qh zu;U(^30(_-3TeQHiZhpzWcgoTN)-j+Ef{!mSeFqfi*Z?LvI(unT30`Qlw@LLR$g z_^@?#b+0x5T$gvBec#cA81^zfB`!p<^ZNdI!XfLJ2Ff#77S5qN25U-}O)6Sgn2xCM z2FF2us{;!Ecx&;EUZmEwYRW>lUxeEGcT2JGr|q6xfD~xlp27$9;`3l}# zN0_*{gh66}VV4BI^DYCgf@qnmljk}qzRN9%T;9!6*>1AL-?LmsSQI8XDChZl3L`ga zzY~ZFJYY4F+u52_$w*5}8(`dC6%iC9gVnhcYjaH@7qDAbB3&ikwS$n|2wWP_YTs>r zId2Bl4kJ$mxNCx7Fv-G)t9QJ{_ZU>oYF@j>3b&Jyv8I=Ao=2z}`0XRma#5&aYCrL>WcD4O}o4jIw(T3c4ZasOG>#B6fYhe!TQH8- zLzQ%D@a<7oin1IieE>Qx$@zGZV)2l>_oJ2+I~usaDwi&84dutuX!=9uqoc|2J3at8=(1PdF${S+78^p@mIR=4({_Ucg2vi7-Rs6D z=q5NpIt6C(s%1yGn`L8x7w{H?MgV5OGWYh>Td~pxOjdswYlGh;esmLsie==%7ET7N zO!FrfGw(XggGaHsLMZkjvhQUlPkrkzl((#vf!FCAZurlwh-3TUXV;UzN#NF!Qy7Wq zLrJu=KH$UEnpJaj)iSTRPAmIa)}mJ@zktEW%}rWZSlFQSNJj)H?XZ_=ZC3D;-98dN z_!tAx1R73GP5=&JQBe=hWSHgYC>#z(1C^hjGRT|XA=()LBE<{dRGm4n2u^H{vj86 z5C-6%)~W8Hp&>S5R=kijQK8P+C9Qjsm2dIkr!+L|p29>-!k`!ca2uElkmjgigd@XH z1jYyq1L$ppZUAnbcYfP{y)NQl`9ML(h)GDGN!^E*&JAs)3J}eh@3b`0VZbNI1qKWd zF=!e3bXI4wDFTy5bQnB@x;0FWN2`Em`0Z0&|Fjui@|0*l%YvJbRCPMOvuOIN+ zw1Wkv@BrSnWkdPOS2JeE{kmq(pLYutj4lg5&C};PnBG!5>@vKpqK*H8&!UeC(fV2B z^&E|-z=!I;zfF~2G(wG40b&gR0&E1}1JdF!Osr!4peUGp$Xg}+cYG89oS?pdVKi(a zRX{GadTm3|8G-qqXefWy8?L_qP$&cVdMp5DAA zXClnXu(v}_$;D^hyV<1+Xu^a7ym(5P9e_|IF*^cEc^Vg2J?vO@`(*O+_N(|>*sX2v zWh#-KaSj%0Dw0u>6D8jIHtY|>vaen~%KA)R_ETqme;*9VFSe7g=}78$0ZsZygf+nc zW?2T9@!a|I>Z+<3dXh3QMjXGwX3e!qWE=G6wc&2g^YNlm17l`>Wo+v z7*K4x3r-DK6!yMzow@$%)ho$qZXzNg$dtzvQCI*>fk39U=7_l3^%XGzS%St0aoBF) zgAV{fDvNWzvJ7=~|DWG+O-FK_hQ7{b6)ZpHydKJIz?vBNFzj=4Ybyf)SQ#GQKRQqz zGr$MqvAse-G6%55tU!xccX%Sz0s&yal?}M8Lb_bKT@7pt$G)-p2 z^HcH5*C`&V-1&P9k)F1_pXk8qiEgKC;>6M&xO=d@NW+4Kf_DtLB>=HlWZ>?;(`RI4 z#6JA&`<;B#U+HPIW&C{o!*uF0=TTL|PL+}yt(P=3RH4;DoqPQ3nTPSqtPCja=d`sO zfNEX*ab67XcCY2@^OWBBtsQ$Y`3rQWo}O|@*nt5A8V7Jp$jt`!5h}zZLXI#ZpX7C% zaes}V9XI|;AQn^_YnPJwChokthQ@(5NC`BH4#5Nf^7dZJq7m?QqP_KOx(>~ZxG#o- zbn_H_)c~^{(>`YAaUD%)fBKbvN(11|fyKh>p4fj8r&D7xJ}=LZ3(95~Y(~7u zjr(VLJW16k5w(R>shHTlF_9*= zY3#!)1D4`3LiMcKVq+4lFvqVeXR6(QS3>^yVioGQN%D5g3n0|a9QP;(OBgM$a#^)G z%xoVG?9Q{(VQG)Ct1EnuW2hAl2MIwFw`e!B#=d^}Qs6wP{kyN2Il%ix0yu9EN=PsV zl&;!CFJ9UKFv*V0oydO*ih3QuyKrz_a04j0Y{OE?1J^gs2!8J+y?X!T&0`60<6-iT z=$WzI^-%^|ZdpbkI7l(@Z0(2tr~^X~4F&)#zLpOIXWuPI4rEhCp@9asT>xUebu8j= zqXOryU$sfHsQ5)dE- zPD&kO+oC1uA$Xlp$AeBv3O#WVOrSNxjzd60oCZhXEpzk5#YSH5WCyT=7J*tYzT6KA z@sVT4VjbLz4Lv~m2dG1ncRd`W6H}mYmS(|ah6O;q2CqoO0fnxaE#&HC1TOsXW5zyk z34+CY$qu>3p&Nj$YiM#Z6hzQlkkrPFVmIECf?X)E+O$fFU>F3`iiMYeLKb~HMZuvf z=VJOuzbV7R9KS>vs8#ymT7I71G5%|7yUK~bf7>D-8!CABnxzP7;L-()Kw=;J4m2M% zTiZQjI}~6d5HXLTN&|xjN1}{F!}~j59idH(z)W!#UiRhdS5WL9Ap0vQE1$o9t+gxc zf3P`MdTCC57m)oZ7}k&{?S$iyst?Svh&d<#%^p?ho1bh?fdYt#FCeD&b48vJori#n z$j&~3+}+?orhI)d@d1*U;FBmYRQOQSMtuaR-%;@2RR>cs7g)CPppQd$2cE`9kY}b~ zXMt&f6}oHjgfFo?r)JXKG1BBGkgU*$zFA0I5W4yyb@!`X*1~3+nosdI%Nciu`X4t# zr8lJ@sy~2o1!aft#0e((WO`O!p*`W$QNkS}KeRe4Bi80bkbBt*e5 z)G*ba1z{NY>=_5zbC0E_!{auYuU{k2s(z6pKjMmjTtZ+5tYO)DDZuKf<+!-pypVSl zhU$hE<+g>z!J|j1oqKE>yn z+S_CBce7N<6mU<2km^RdrQjK`6Z1dz?KYY9~PoAmw| zgtwrHH>3zG50DcS5oa>CmVxFPf*+hV9?-AklghQ%(7CwT65H24ee^QBAVMpOT3wSwS;~tDm;F zM?kX%o(Pc|ikrVbghfX;LiuWcmz@Ymcv$q(cnus>Bm z&5n(NsU-k#7xs8_OD=h`E7S?tOn73HC-9*AMN$v{B+nqANiI2O^0KOsY>dx0Jy1fwF36G1`9!dJpni5-4xWyVC~PJ-b4b9YTLM6-0Q>8iPV8xCc;3Eg1MR=II{>CB@KO7IwLD~U?7Qr^hc9jYP`M!R2{me*&22;uzy^2udPbVYNHl@WbfBr zUsPIk#pAX1&Yk^xX%_iq`haUmfDN(*9n~VDLR+VvqaaN=twPJSrWo)RCP8cC6u~cO zYAqJ%=u>RH+kfZR=RDuH?(LdzWM~}wjH-UKR*o*BBEVCR^)VlGZfah=NE!I(5%t*k zIKQ}f!NA{|u?DRBK_{u|C0z?BCiY(1cL2a@5 zQjCDc>C^m*irj7rDwYbwc!TB_l^;wo+ginD#=p~CRWP2wU}7y;YQK+3N+$D4(|6Tm z@>q@iLImuMjq+nHxqZ(dHd~m{GEI?WKgLv|NcSL04cv++aoTxIsN9=FVUq};Q`^QZ z^uZELMTW#eMy}Y{IjB$v3ilIzpL#PzVr9XM07UX(01y{4TvU``#MqHX%L&jAEsV?b zG-l=Abg_ySeY{Hr`uIF8D$KEn^bgnC)oT{6Ra5)&Zit|ennZt$)Z)KHo~I)`K6~da z8BG1@%T-u+!`~XFQMxmzhB1Vc+>`c!Y@UaXIK%G3zUPc zN^9IeG)KWPj6=td(?J|5ula)|{GG?*EzmQ0H`nGHfrAVI7Z*7QGDTH_DiRP$S&T{4 z4`7d9oDQW50PjIPD6>)EZQ%#TEu8K6eZVSkuxHG97o=#!^UgCWiLGauHj zgTC$=c;3%q$(m18r=8UH4js(6Oj1UnlmQ@X_I|Rf1)M%+2ZAXQ3IQVc@R;KbpbnOO znu2;}Qdx2Ot5?3_#j3eZRegjNH70TDq*eFt6T?9o_{qaAIxI{TNbFW~;1!S($gS+d z0W^;dA-^6~z2CooljGnck;v_5@S>)j;xgsBjT~h#3S1Mojf=>CoB{LSug+X{@Khih z6;j5iPuDUuCCNF%P{p?k69e8uF78Smrr%HTy=Dc`W3aqo7zY;@H5l3Y`V4WiPv;x(475$)*O(sEyLK%EbqF|`7u05j!r>hpz$7In|MWv?p;?0RRdyeJMm#D% z8ZJ8m{J~bUY9IB06$Cl}+Sc(d?y@N>{*%;Sh_IJu=;riG==y6T^%cA?gd4&}XJ?c$ z4i4HGh5jPxe)2O}bYqu1avzqsw;NmH*r$8aXD?zM*?pJT|NYJf{SIa`d?!&s-$Zam zmmB0|x-&|)deW)!U7M#;m-L>;p)RMd>J}8!#Ji7%L$) z9q~e!a7lrRK-APu`g@Lkoy1fjE!!_%WA+pu>Kl-IVMGN7 z9$zjc|1Lop{BLB0dz}ry-8B`lB}Qda2udr3KrsW~zinD>#JcG{tg#RRALGB;wReq2 z22ue+dt+>yCwhbRb>f^HqA^9Z7ys^6*M^buUnu%Ovml{9z5Oul*sOMUa(AUCT8AyfQ0*3kFkEwjl;TWQC&sLM&B_b+Dkv?ISf* znxRPu0;fkhs+aWVI$LA17}6|HTAdgCch`OBu2(iOCzic2@BmuMxAXz@2?|8yx(vi8 z{&NjtxQ1%x)3IHJBvCmmUU!dVZYws2HPL-!K=fU346`!(SEz{KBlt993~8)z*GN7i zP<_yv8s4sEbO1Y`UA-3}lOaR}$(N7zU5e|k-|Is1DsaCVvs_iG<>c7qyY4j;j(CfA zXbBF$x*vYpDHTAU6;P=iGX304pJuP9MZiZabYMM3qDNTvZQPnMH=>vCwnjeMOVN%Cz^52~ zvgJfaPSKe*IP7^AGz2s!!nBaOxeExhdT?h|MiFRPS;rwvd22ykcNOw@BU zJ8mFI^}@e=&^RE3fs)P+t^frP$U@-A3Anu}fmB9vRqM74%%)EcogIMz2aZ7yH$?MB z?+0D*E&f5?>CEisXAJV&PJI7TjBvKI+x-E92N@rX&djaoucSj{bh!e z%+|fw1`DE{TM0NXY{&kV7UkgymoToX@82&UiPIXJnDDY|ZEi*``Bw83&k0U644^|* z7zU!^X`nFXibm-b;b_X`Bh!}VdDnr8=-qNpW9o3V#*~N(vXlPRS$la6x-_uCAU_Bw zn_qejMcKjFbrzVWzR44;tgI_)DOYkxF-m@e{DO3Hp5v^#Cn1QNevn; zx)hiy=kr|ITRuzB(GJlE%H#L>aS490(`HHN-TNwt>^6bw)mots`XVsB!xlVfx^2BU zvppDpfs)8jLY&+ya$kn=CRNs>V~ZTASR+dyj$AF^9Z8M0b(Ac`reK8A3)L zS~(o#7QJKl#i-u zdcFiT$Iw6I4x{31n3m@QuDx-CN#_uHWa|)|a==`UDfQQXD}V3b$LdsJjB_{=Y%Iax zW+rM69Xoq>hy8LP%AfWN7#2E?@!>wc>HKmU{y0kmmm0ZCOm0nnKX}8Nm~XGTXYYMh zh??5U1#u?{$Ka-Z(j?2hulz`FfL3g&c(uBldk*6;HX_lta80Y3u);gR6YFe3uV`7n z+kd_??s{=;icao*<2=$TgS}eH4a?b}TfU0R{6ddC7Rc#RW&Bq#QDbT_nM_&3^-Vu5 zJgs|)toF$sO5lK}jxe~U#BQ3`sagY+vh&ZqIU*8ZeM|P6to!c>1`M)&sm^HT(HVs` zk+8nA&86xo#rTgwJ_HXg@n-t2>2G`&Nz@P@BZ>x!y-#gh@Tw|i+w0hEKhZm(2cFI2 zQq?8_LS19>KJ*Bk>jbRFW`*d_1rqc8j~QR){&;f3Lq4H^6&vLw9eFE7-Tg}MRECpE z+{V9o1I=@mitSZJ8qMcSHDjzVlI^Lb8kR6Fwpi&>>$;O@+{v35pk$`F|KG4tCy(@2 z8lt{=5sRR8q^N2ajLW+M@p#Z$#Xt%313F6|TxnaI=Fv*%Xmtd~31U!btmIT!wTR)yrK6jzGyT`K^*8CU{*i5(h$zv?VRhgckQ@9#yozP zSo#CiUYNe^w80|J9HOS7A;J)k1cn%T44Pi{+uP3;Pv2A;56^SMXk7@{`+u*04X=kU zSa9ld>$L;N1RwnY`CyPPh%uzFfOy|^+;IQ61V-KwLF^`LwDgD{wnD=d@1=#9yax=t zQNZB%02&98o(Mx?4IFS8l}kMak{=*;I6YDi=M1^}+=1>x>AX>|1NfaM~o-4ovb;O7TRbMW$@Y6=IDLcy{E z9MB@>K8!S zr>mDs!194Cnjzp4{7v9N;5=6VoWZ1mlOU1Gt#B~>9{OsFuD3Vf_;7Xl>2OnVjs;-F zH~Lg$WjR3KSZW3Dq?tHJ&uOgVh*FSh8DTq;&MCA)(R`h88+(Jeeb$+z z*pb4n4&ny#_u$lk?v&q20!{SP>CII_3^GDXUYJUFKe@;>R@vA%mIkL&cf8;+~$nJNkP zKWRrd1T0+Im7E1gfsyjH0rd+PXt5z=2>_;@%auOzOwg$y@?qfIo&v8bibhTjWuJA< z=xz9XQ@p`qLgiNGlzTcWN3IR_)w&aF=z2rMqV`d%7&VMpn-#7qQKOO}>bg#+$g za>!f-&ZXH&=`Fi4je1J`N6~T_J4&| z+Sn$SQ#d1oJB|MCchqyR*Yr_A0>x*^2JtTYug`w1me6}W)TQ%~{Ub`b*;6)t{)Mc0 z0~8BjF-D(t56T--9}uLrun+?M6Me7HN4Lcu5tT^l7*biIIU$p1o+mq4fVx~}-Ze>7 zfJY6=sn$Wwss>+1)XdcNz^Q5YXS3O~Ij2efll+C7yxr9*v0 z;z|j7gr*PdnJUOtKYsi*%LF4fSLAC}tq#B7zs0<%_fO`QC2QxCN4S`p8k1EQ|FL{FxC%h)x-%nKVD&0c(**c?&)l=%Hy-7(7 zC}n)CSFm+Btd|C43`CYJ&{gmc98wJgm#W!7nP;9+ne@e6r|6hZ&@}b)boq{cD^FP* zR+J|BckuxVao{|`B6b`gB%qd9Fi^o;@lH)W%5gPHON8skFk;o#bN<}lj-K|?<`kV} z9iF)i>oi?wAc(c3C~Za*!uLb9F6~aXB=`QPzgs9N>`s5lNqba-|Ws-C|iEDYU`^#^zbr^RQ>pg{o#Gftp=Dj7{`k`cO2$$Ang)j{{S{>{fgNx(tX4 zyo;Cu$)$vCwSOx#`=Mr|3*0Hm0xQN!t(i~O7o*cHJPvP4|MU?3`YqMgd9Mn>G_N`{ znk2660W&*bdMQkQ5WY?N@|C_Wmch$o_DaUI3FkW$qTqJqfi|U2bGX1qOlOTP7_4Nt zf20CH075VQ_&s@K9dk0req)ltWTMmibR9~ya;nli)>fVGl8cIbxYaqpJ!bIcMP3A2 zFE??_jZy1#v#$6?=Jnzx8L8@i+OiF9;-P4Y<;%MEwb2wyFDlc}E2rTZDKBAf3*_Fp z`R6OHoVU&kZj%96mp=)2rFO%{$Q0{#?URgo9)FU{3 zs9{G75BBm6Go}>e=V~oTUPneOyS9PNB%$x}kf($XNVlis!;(at2VS!iF=wXU6Cgd1LJPR?lKI>R5*GjSe_2t&G7(!_HqqG4BH2Q^1vCCR> zb~z8L7ut_JF|n>6n63znyrye!6TgJOYA=A*Q|GR1W7*jQuXT<(-isE;su(t%#jO4n zT{G-=m9-xA>y;={%m=R&{~~V9agD5zTzEMOI6xVhCTa!cpt3%4Z%1=Hn_p; zSXg&ep_NEA+sDQ`N{zPlyKbou`ls$|=hY2OUpwU|-@QQ18<{MEEPOp;@Gu%LAERqW zoTo}Cyw+oQM8uh4>{$n)pLT25fzwg?JMHgdyC+xx;<}2!wI5erpI!0R%v8XPy>� z|5&rc_b&9B4YrpS`2;Jual(W&tq=ReSAJ${W%J#Z6BYn_|H@AX3y`^@??8 zbT)S2(Xrp_ewU)k%H6h@)rR!_IDa^6EuQzPjXjI1-6m)z)pX~nSBs5u9y^*_vtw12 z(gzX_d$V=2`bvk=I9I5I`RBJ*9ZrlIZN`Vn@dN3oL(%qsS^-?4jT7#uc3>hFht>GL114z?L#Br-N=cpxaUG{n0+MCbANEfLUIQv|%+wm2nYO|zx zsMC2J3)jz^JfA-$-J_C&bhTFb-_SpbgD>kXJ`AH1qadCy0?0V1q;vo&bYN@{b!@t6 z428K*^5gmP+5J&0w|a(Tv8qIycK+bUhwm$2A4)kSF02|FURt_Iv*SBX^prpyg3?*p z^%*7$G=87o<}AVuK${m>wH<`76+)H+<+WY-3IebX27^@u$0+d5=^DibLuCw>?YbF?4g-jQdG8c!IlUE$0#yai7vZ*t%u z)?+J;fIBDKh;&IPr63`Vq|zl40|-iYBPFd;5{iPP43bI+44oo^ zAT1yzpfoCiQule!cmH+oy0z9l%XQA;oH@+Qe)oR%6Tg7u)TF{99_f%Eb5$!Ku>VKH z>N8fn6z`HcpE4)TvqT0i?pE@^A`_INR~iWoA1jK3R}iI-BSW8db9Zxar2OV>ZmD4N65t1w^3$khoqe z2b>hB3*?jH6B3kR^qgxXxaIMDo*v(h12Jt3GipDi@@Wi7k-c$ zb8{U-#?;RALWqSN2QzACAn`)rUa}}s6XD9#9@^8cR4Vy|Q$iqnvfsHtb}Incm6GrU zoh~yY-wR|N3YrFhbq`r=7tFEmv0Z`!5y9aJn+}jNBIz`+VnHhEBZ8>9&i8miH`w-5 zi5R~;lfbaVvR^&E&KcwU4{Kc)x#^mJPrPE#(+Jlu_1a$d*(bpdr<%AkkJdSK$A#)) z?V*e+^t_=ETLP|Q8$wC}aMV1Ei_{P-(LfeNT~Pf)fL?*8$oLE7=ML7bPZOX7v_YDH zP?UH8Aii$gvL5}n8=phs^$GrP(v5HNjw*|}CR+7xtm!M7`9TD!y;25RZEeCzPljY^ z0a9r=w-Mdn-Is@~`njEr+LIh3c8{MZg}_`D2CD;mE@85h-s zzvh`=g^S|A3D|l?f8-~{KCMH)1en>yn9;x9hKMe6k zjW&-DvC=+I_|P)`%>_3OMy`p)k^1QF8OR=u6&YfQ`svfAs=Rb5E6&kBkQd{7BD5K> z_Dqhkun7qmSK(d}(@f1Z6tdA1`q)^hwtQ?LaN+Gj_Blf3lH?ulAo-JO>FS~cO?dIZ zL!9I$!obTsA254=@BMtu^-V(S>g5Vq)clnD{^I&(v3X$#@;jTDP?}boc&Ic|4$iLd z{?yLq-@_Psrp(3W&9|Kd^??CbE7sU4Vztq~SFs*@9eaQ|uuAqqqBsm%XgiK-HOTi= zs$LLg{vz#-bIY^J8{(d^j(ry6r&P%wh6?W#sIv8^%z6Igp>}XX=R(C}2aDFbbUMI3 z96D5l_kYx@-?o}poyhh6LRs5iZi2nKRr6OneLYM3B{kgda(nPHePd0ERJCeI@D_1J zLX==*gnTQTo2z|Im^}DYa~t~+9iOeoT!&Hfy=Gu6zc`gqe{SzBCkCDE9rx$*=k4Edlf8 zdi&d4R`su_gmpbddiQ%?`4~-QGd4bfPhmua$B~^`^ChL;0ZsmrJg(%5@55eo}j&9K%_5ZgDQ03)uhFBdPJ#1 zD#10Bi-W?@(<09nZpIgsD>m)A>gJ`$2hC>2l^0?Y7IKp?lsh}&Q04?)VwwL4l60cj=YBN-Z6s;t;+GvM!JBW zAWzxUiw7x{Cy)>gl$~g*n5C_ywe{A%d)B(iCe`V*3JmsQDSdS71!jELN*}@$!pb zfl0KpNCFP($bZ7oLLvWI7{ZoV*>W0AadypEjZ)vF1(tj^@6n@2**hlmb$MtHt%|Di|6@q(k+fk68gJc zbEa%<1MF@}p3xLKnTqMnC(k2z86-DkZsN+W(m~GYlorz(A8#IKz?l~uMYC)|6vG?M zQH{Y3W2roQd~Tz-ot5$YLh-MwN2xhUc7K)w?0jX8Y6W?s|JdAqt5^B6eC9D806Q$0 z=-ES*w#i__1a~njI>FSN~q(&V%hhZPI()oIJ<9!QuB-sDvWtxA3d6z171(G zNNz?tlrLL`yzg9d-CvCG?kv|mp1k*-{E-$;X@LX%&clV>fRk5Wl6hiam;C72b_b$R z2jft5%AJyq3PXplnUXB{>7*nKCPb2KLS4En&GOB@^z$cK+o zMm_T(-mm;Y8V&^w!{wG8Jf)e%|#9`JBHNN`%$Q1#n2XR$h2=Vs=%d~EhhXkD(F z^XqaJ=nGaItSHqNGOBRU=-+AEb{8g4-+XRWkk-kL!ld5`)htaXB~PI0InMO!tu}qh z!TTQn*+{f{%Ort!baT-IZTPf&q9}t{gW#*Zxd$9b#+HK9qJF$Ksx|ZEGl6G&5K{Lg zNqlF-q`}gcKfp9g!9)4p#hvEzmKCNaYux~m49O|kyeu%Rw@#I5! z)-EW(`=-Agv!Waj&wzy3%A2#p{6FU_}g}%nw`+Xzv2hltmi`QnZ8LDl& zH(}@RnvaW|)x+bd3^K#J5Dv*OFvPU)&#-|`XaKPNtL`28A!tS5s{>Nhd4~x^WB{=J zXBCh!j8$DedH77D^=^6>{&tO0g+q8-K0P1vcj41o30i(C0QdB>4~w`*|9Tt5lo$wV-0NeGyu9GO(xHV}(seJhbTqI;>wvEY7SMVlY8fjQ@$BJw+Bo>M) zpxWA>8(f$QV3`p49CfXg<(g*njW64JZfEP*M0(!KO#KVy}ne9Psu(|rxeNzw|umXCTGB5uL^|8hj58Q zwjDXbJ6~z2RB4hwv!*!V!Oge-AY+y7C{$N6wP40@U_;JTtx|(7^7!)5D|%=t;h;D= z3V%wQ=EZh???@t=IX0_gXIZcP6c4SOPJ!GB{&iL;)hHx`AuRa*2RO}QTQkJl+Z*V& zQy6d1FF_a{pzY)6@#1_=0B-f2j~QWa%`O1L)Y&|*ssf^|S1DbnId5ak+2QkiC}Y3# zC)oANHPC_UCgSANn|qjqw3z7sOTEYa^7>O;6i}BA07mTz)OLwA7M)@`(7S7gGj(o8 zy>v{ubg#LLsn$Iw+2oc*72EyA`&H{kByf5l4^RLg7mxrsr!ArvNzYl}!piCi@Pxcw zzf9Wi>d}Z#xty^8ryx}3No*7~p6z{dQ77Xe3_bkagCv5w;0#tb9axUoz$?=R(N7fR zEQBNMZ|RN;C59H;f6KVh_{K3h48}=82sZK>N$=Xa~tdsY}C(iPbOd_;P{F zApbhCC}!E4m^0bfARZ=wGQP*X;gIsZgj0rt{=XWc{EL+cEc+Pfi047S2aqy^z?F*t zW!Q3wZNgfb;Ru;7!iH5^mQ-qTl+^R}t!hTPLiKQ^i$qobN+lAAgx3?@{py`*e4PmD z?qsyBcq|0i5F|3195f}innW9v;_Y%0A{Ahz#R#Kc=5}APD<$LaY{`O8E5EY3KHD9q z;L=Ypmyn~rOWSLF6i|86dIs9H&o8`c8|9R!9asO^|C+aeSS_2>bT3IhRvlu|=W1XX z760$c*OltUMO&o*1Ls{yPmdZA0Rbg&E?(ZE+AZ8#PS|CE$6LiEfu*WMYbh-D9gw=< zqBkqB+t(7IZXa*^L zvk2Go31TJI^c>;M#TQZdI`k%rr3M_m79@{#DAElg-i2pr_D55{yI9+?=Am3_z}0II zePjU4X~w_Zgo@=xxm7`dva#BbiiYR?JwYPJ$eT5X4e#X!KDd@eQmG^9G9>;BQN@`t zc5noVD}5rJJB7(X19>na*f|vQXK&G;RUYQ;3V(c!fxn^(t~CzQ_hn|)A`=si_uj}_ zV&2H6IKN)>uo5WqW29V7&#zzHpwo6XCWUJ<5;j>$&5}mw*$tijX{kxw`}tnm=52ZL z?HY;VdFoNEO&4YKV$<%@)xF?P*>82cn;A4ASW?w)T^wVeAEwwB-{IvVWe^8@q8{@g zm}hVJNF4g(mFZ^ixR^u3{BxNV^M5ihy4)45XM!mp;h&QAO?Icz#Z)VsgFk3_6x!>Q zAF`iKiC*+Raly>PG84gE6G4b;1-I&HQ0S63c2FTo8C&3B4Hb(`a;>j(yf35FpiRDM z76CiVB$jMFiT>|}JF`1PsArcFsv3e&T9Cozsa+&z=Kb4Cz@=zC!alU%qlA)5U3C+e ze`1;NA)mC1U|o!dlWG0a&lIM$*qoFtjz6%BXDJ;r;nG)v@^@g2^G{ZUSQXYn^!q3W zj5VN8!q9MCH~*DHrWp6)%n3yl^Nn(vM(76{684}WOAAcfNsdDQdO)EVJr+N9=mjl> zJOiyNqek~D-$(23`Ou>Lt1Ip>Gd8P5Xx;LC?3vE`UAjo>xoJ#iU=ijGmfG=?jX^8_ z6QK<~0p2L)+BnM5B}fs+*#+8Q^Q9S0To|{S4j5};A=f5ViXMo7s4BcglVI_H;k)z~ zZ>F3JuT&k4*|Y>V_yyng!MJI*cyrPD`>WRh<0N>#$)F}C2(r&BvRWb- zyNMQjG#9tVAd_B>JOqvVgzh@uK zbElZN&-kHXmryy3E#VkxhV<#=9K!@*&X^!NDXax94Dp~X{`yMk0x$7l*OMU;Nou&H zTE66r&4<>KaH4(dt9I|=)MfLlIi?rr+f<3c=*af2t*BNhOTC{SIb35``UB(R28mi* z&!Rq(Su6VFHCW(YW01r@cezU1a!=XH$+qe$=Js9-%Vf5&D#15+_v)>xJ6}33^;H`w z!ASI-E?%)V(#NJ;F{7rt-L@O)b^DAlM`>5{mZwiHrDf!CvRy^TZig2?FNqF2yHICp zSVl| zu3)9d{IjD~M$%PR`X5>rYk9nyWTk)mf?ug<;HLYgEf-hg4q(AP3xFk%{Tx4Wy-HT4 zfC~&_H1k5Gp5IFN%1>7#$ZJuXxIRr0w|7qPc6pC-}LC1D4=|ZJ3C!a>rBB|`} z7k*b{&(#VVP0k4AGSvuv8{H~#>EVrCI<0%I3f(pob*`x$RPGNq&X98Ae=&QU2%Ona z+2={S&F9|AgRVp^3!!4Z-}ME%$d$&(qszc{*ZE?amppX72Om4aOH^l-!p9TMyqxmE zu~ykUgxEuL8aETQs6q}2qjGBaIm71jiCeTTiVph6yxadOGtVWRv0ct_0VqnoBy=e- zbeMDWhuwtZ)5X6pOZr+)DKG=QpC{^oQ$}yw+di4bQUyw&is++FkBA9ZXuH1Ny~}B` z-GA-r7!G%F3~=I%DZ&=%XpAp88N;APIWKv>*!a)$!E5@n-0AFb_9Ya;^qJ8%xjLzs`#! zK2GKed{`&__iM&la5|L=HDe(S4ry8lSU;2S&zz7a|IG4t5h&6EJS_ZCZO)~Xi_jeH zn7U4Tf$#Va*1?P2S7hIK zh!&sF21C~?q2HB)?UtTHw|neQ7-t#HsYhg=*Zyj3u;wLYIeG6D{SXP`w?8kp%ssoGN_s9-{z>eTZ$-0%wJ^*U7O~mIFj`!K zyz2Lhy7|msAulFmk~gjT1INBR_ZH-)(f784CwHa@vnR0RLy~6P(D^w^K7}cV9@lm6 z=zcHh`xMD-(=zRkDvs%_x5N`X8VgC+sTc#sC}o~+o!&_|TJ)$0)|AzyU_m{1Q!R)5 zv)O3&sT%jhmP$P^Dc%eiPX^RfwI7>q^r;1wdmR{g$b*PjKWX zMpwW7*Ym(t^t^Usq*yssv?1&=-+oe0gbNw;&*{#S3VG}oPkT;GRuJ!wv^n`N7%ur?Tm*w;`c(ZJ*7z;`lR*z^3-^Xk$Pq;SgJ2nhd<$EwlIXQ%<5{q zuc;;Ia{{ub_ z&UfX+hXqP$GJuiH??w})rxblqKJ*Dij}S;70ce*HK#{eW&$U)}K1qCtn_3D&f8Rdu z(Ny)aG8-CiBkfsLzR*5}Sir1#i$yb~vx|}B$tae00^P$+ z;zpC%aiWf5jklNtT_}w{XTKAv<(kB(nQQTozAu-b&?F3BB3QP%(NE-cp&p}6Js0vRL1Ic3(tX z@c|%-pdWybf>a7R@~<`|YF*%LUr6`+HmU{P$t9ScZ|E>SG-rURNq*s{FPQbUQPN3P z+(DD0C+jpeU1cfp9#RCL8G)oBf}1+@>C@;T3^hY8lH33Q0Vbv?)V6JQbU_P7zOFX8 zN{`?fvj{Un{+M4i6BB75MB8~ZbcGM)RD`7}8e8bfc*unh9oxmRdm$AQ*Hzt)P8?8I zMM7|BBy`ee<6%Y{Z7=CV=0DLQZHY_t<|6UWiA8nxffCN-Gm1|k4d4$qa* z(0Dh&(!m{Tk--w7^^6V@jA7o%@NbH8u&!Ut%ZPuEptaRFCGXI;uX)7YAldRwgga$^ zp(e*HGbf2IdRb410aGKr3t=_QoE07@Kaan+YehGyH#aT@BuWMrBDL$Ez4molzDX1x zz|X@W{0>!QpbS~seYNNty`)XbUMgv%B&`abXJJ(JsPT;cov#1ho~73RX;vpe=ez2{ zHhqbFYDKGXH4O)a+_6wyBr+N)riMe?*$PjdxwK=g?e}BeWYqOF#^_X1|0h_-yNpM7 zy!k-=UqfV~4QH#w9_BMq9#<+?GH>Q3^T6tHw9kIXwkuIK@#KXGMKjk8sH-tmGCR9H zOIAN|os3Bzeq$!BHHZXe%;Rh65bKpVH8tWTZPXp&P3Zz$0S5wW1kV(6wUc| zjEy;LFo{C{PW!eyXe#APqFp|EY+StwksGFqR0TS`M2ZUKr1zKZ(<~NWgKX(U#^^8uL*l5ZU8tLE0!l+T?=IK|77T#6lNhRAU89WK*aZ`@N`D1SaV@q!FT--3D zk2Dwqeh>Rr{-e+`VkmN>4%bCryYm40Bh49)`-Y5amd{>=@ANlSczfJh<&GDG-5fHC zR8U1ijcGIbD%p8=tMdwnFg0KyIN%nEhwSI35sr5et3FQ92evu9^Q5!)NGz2(p2?DES^NP`>uf;?7GG&taqjJC7YDGqA;2Kz;%Eu_Q>o|$0o5;eRNv|a zqOK(o@B5xeSv}mMQ9D>4Wg3>i|K3of5ihP(Y+`FWr-5oab(Q|^TmDUvmGC@1T)~Mi zs8;Om+7d%xfrrMoO?U2V&Q?*?hXlyepo3xylQ9U&?UOkROw%LSBg@VsQGR)12-Q&E z=xNZV7F^dz^qR1O*dqp^BJ^rA?W1Hc08iU=qog}x$FA`TVpB({lg?4oc2RoD1Z_koKxAAB5%IG_*fKcj&ZGh|x>X5`DRaC@1jzv)}uIOEp!ZOi5c zGlP)v{!eF&$?(#fuO5F+6U_5IR=+2iZ((0ugJv{`^n3Qqy@VYZ-GAX?$o`rT*`vPE z*}>C`;lam4LH>Z}eQilin@)eV6NqH_Kk4;Lw_oU3(*1QJQvc|4@sa(fQYcErs!Sf) zS;ClTNUnoFRvXgu>$z<3Wu#I~W8D4iZT{{=c{d8v_)`8uE+=H%C+^;<;1s>vbXxHn z!83oq$7=GiKFtHFwI7P<)g_kI{F=0I|BT_~kPu81`3>`D&dO67~qw#XNW=+(YdGJ}}U&xMi9EZH<@Yn{G&B^6^Y283^4 z>Kyslo89U4o*Ingx=5iMPoTiwzGS`C(`UX;Grd08G>c1l`&QLy4S~Xjdq7cUzSp@> zosTM>fdeebNXGcUwV1hfk(5S)0{I+7`oZ{K(X$cVBSf4PjoUUsZUSy69+y5a_(5n} ze4wBcNT7^d@!NjcJ%2k1?lgnOT!!ErXZeS_UEbmcp>Q1+c%pO7Wlr zh=y}{JJZPKm}Y?P>MIxRdVPL0gnb*T^yAdl2;TdcR)Mo$b^+vB!Nm*IgTBuv%?o>h-(e> z-3c;2Yp<7o$-Gs$QDjVc`%GizpPwELPFWGz!kjODVp={p%c~`kKEng-l6b-p{7;Xq z9)+(-v#fuHEIA^G!tYLco5A;Hwdz>`_^)xk-vi;+5fkRcbt=MD|M8wfQ*ojyX4Qqq zNd&@DoJ<_T7r6lHT<~2MJV<;fE-m(q3LiKf3LsOVk8|R{L+HR5FDy}y=3ocY(7CA153_d?iH}-{Xr6Y$V#bAs%GGe zmQ8kTFIm+3^>C;6%LVQG%l(kNz<_Urcgve)@S+NwAXo$x%2SE(u91sk!S6@N0l5DS zjyAMHP;HLhyezd&Lr?^J%oWXwo)&XMpMrD3_L}g_jk4GsP%auEfjL^_b!XojmNx>bjizk8>(RAXk2m$Wl*MEzI6?HLlT}bI zK_y*Sq&k1wlNX+%zN0_jS42zP>B}e?{cfKrxD%y7=tF`(zr`2;$sSG+11yx+fl#@Z z$Wv2CZ(GPJnz=xW+Og8~zUg!wT{lud#$|bAS(}g4Y|w7KT%lIDn8=u6r>#aK{GB1@ zVWiieELrgf$|}q0fChb*8e#-`CiT z6>zk;8e0xyF5V07Clr99Pe_K z;`H(EtHmqm&==Ia;@c45**6FR1(<~s^QZ$y>a)4(P~gCf9Jfi)(He`C`KtfeOGnt2j@13P#hI2`zaw>Fk)X$aDZ%xPY z;3Iv@)9LI-5Lp1rY9_dO_qzxeNjMKq1)qh6fTqXagI5;6G9QTM>5c;aS6C`E4B;MO zRK%Q`6~+&H2{@qN3;^Xd*KM|~B$2n-%5dMvis&eZK4r+zB5K6P9@ZOAWgjdB(75O@ z8sy`l^@L!L!)9rNEK@34F%yjk7eXi8>*2|!%AO<(5`t5P6Z4KTTMUlM0CoTnqY)`V z8RdE8#!`0>gJcd05_Clkck3wh6R|O3Fu8$7U%Q2kI+RLq>%x9Ywsz<&StK?3{JhF& zYQcvDt}vRft2x&X(K-Trq)?W->2USW00_98A$>f!uSl0)2LP)$4BqgBIkOu&Q;|pgPsJ?26|9aY zpSCpxzOrH`NuI&U8Hy3U+oaUhrxCyltTF5BmhO# z`KJ8*^3OxZ^sN>1$CQVmRC&7tirG;KHdo_zR63DvGf0l5c)ofzRJ2U(Bc>I-pHB{#cyp}F*A?Ynp5 zH71&kVkL_zrIzErO0VCEnR2#%NLX#1jlEK_ZSAf|rhjW9FX;9E#G?L$Swi%hzyTYy z#A;jstYrR#N0Vuiml~3uA)z;X*Y^^CQ${i`H{3h2p1MNH-53+#ieRl8gZW_~`YA|# z{(Xx+VB*C1zs!EPb%p-X+L?siW^S9I(Wp_S-MwOO{XfKp6XXwfNrM+oWFD@;TDQDp zgK0XX0tnIrU}f#;$N4Z_y5B+Pc0&e3Pl|M(VK#oJPyq%N%EfL6uQdSPB&Z0TFmBkj zJUvBGDn&+UNbLA|=GR$o1_b@Fs<2Sr)QK&@`8T#VAVm?)5kxftlr<2A@SU9MCV4{Pa*ZfjTpPvWX z$<)v7A^<1^xHZ0PbE|u*V~V*(0z842-{=>oz76b(Wvbd#eSH)R=@BM9HDvR|6KCkv z%spD1d6+anHJb=;0TshHTHCgNCO&ZPRWL71gy~SwQEwl7%=?YuI~An+0A9$7bkfVcu5+a$yJ5G)Q?i(%oC$mW zhLC?g7dtXG|5KAy{lAKy;Gn>1I*LKaWFEw`I}q0Ui(Zf+IRZ1W9x{=pa3HEsfM^|z z^;K0FGg?dro)w>QGuqdK^x!@|$pT+Fiw``H@n=H1CCP(jaok+R!Spgmz2Gu-K2Ova!b9?prR)25NdAA<63?oBt>3rwo z6fEH*tsJ4M-(ADZ>DvyLAD1RC&am%WE#{c7B7^o2EuN#AmR1vJ_IO@sB?s(MUg_9% zYcq#v?cAyH2f{E1%GJ*vxh(NCn&Dtcl?F0%>JB;0-@MHoG&ZkJ0}OhHIk{Q}96Awq zU$DOjdGZ z?hg!H8sde3CR%XDGLqt5t(j-Qr8geB%30wcqQ}ffjBH0Ll3^ck3j9I zLhIO`o=fu9ZwS8ZtEMCkqXf~b0;(qk?Jx;%H&|ALTf!dBM{YZ_UXtZ`ZJ610I{9-> zVwB!`a9`FUKw6shXuQ;pBWOR;l5mE)#JJhOP(G&=Y&{TB0z_Djn)&lV{MA*UQiA1h z9)Y%+>S*0%{{y`6NkBqeH*c7_H1m}$ci3vw(%P)pWU)w~dH3s;;MY#ploi%ZB&NR~ z#X!v)Q$PUOLhj63TMRdW2MO9|U+}=u7{-h(A&G|F3|^0eAxj{zmqcwX@554a&lGmT z!Iw(A74w8c?v2w8y>ep#h;W6bu1FIPAo4I~O5LA=bq2`GS92#paX@UI;ERd;Dj%dR$Hhv@)j^b`rcF8@I1>j_6hN4hw65;=salQ{bKHu z1u34iw6uA^t?YdcgFS_?jnm#|F=q5H=ad=c>2Uyk0=%Wl{aLLg!a*fFJBUjY0C(>$ z?G)AljuSApWPZhn25qYjMYa|Wv=&&r83aq8#q!n{e+);3nV|dO?aaIwilY_0Z;3@^p@g;#0M&pywJUs zuwVQoRW{S{wm{|6(`aiMIiumRe>~&+3g6zCvT!fH>zZf8WZ*0ObieaGK2-OWIs2AH zDyk-A-T&1`6Li%Z`hWynJNUtxx>IX_hAq$m7i%}c z>{-pxQQ#jzI1s01ezbieSi4IAQ&QxV{kYjJP-rw)z8L7@{?cBh5>~Uzh+U&>mVUa4`>acd)18hqPWP zZuibEvB=Pp1%@S0%-_8CTdHs}0R#eC6NRg0xu!ySMjE1~pBHEqfwM3i5yT==rsx^H z`MjdUP$+p^mR7`Sw%DqC{meq}xrMHGh(x{0B?fbICAnoN6dRoBSz%RILY>~`H zs;O+E$qVTn(x(yP{gp(as`QlM`~#tn(maxCP~0@Zx z<1B7+Cg=5a)`;#aRBq$qJBL`jJ)Gx~uFPO$w+p0YuJh-KK<%>am2v6U2u{$o)Z?Gb zOG8AsZiiEv{(jJt()1|^XGpiSV?GKEg#=(F>4A|D&4WxDj(i!ICW}tKPME}wSURuZ z0wN2}U*AYonh8=&>DhR96q-UT%exgt)4l9xG|8eTK!0$Q^my`xYXmeX(jvqF+C$p! z0#9e?(x)gm2S~TvJRO&>nfVIUgWiG8CBW;l1Ww7vju2?3LZes(rpJ_-hgnc)z0od{ zvNB7A2c00~@=nqe=F{MO1C2;P1dVo~>n*l^sF_kpzLzxR!WNRkZ-hq=?am=yGo=65 zvDOPxea^xO?LSzHaZms@Xj|~IanB%VWgYAV1aj?H!zoAKC(Lc*ZLJ)D0eZXWbq-oV zOF!$hgQ5cmZa#tK)+M^P-&g9a{6eGbmG>9u!foh8KwSjM<2beg;yoahdWuxh0QGE8 zn17OEbHLl|(54w~^$1|-XzzN!<{F;PeVHY?W_%om3fq3O@n-$ag^xnS8a)`2r&`Rm z`gyw=!cJH}N55TSJyi<{W`J+p-$L?{@dF@x{U93=$so zk5iU>xkqyt4Hpsl2dxzi@-mDxGgmmO`tL;l{E20p{YOdP@#Nkw;%^191uZo9jvw+@ zw!Dtpn`?bL-bhD^I{5o-9^>92M`LpNvaDy>z{cdH2N~|)Z(=+jB4gJ38=?-FsU0Lb zzSCcpF6xZVIez$s_=iN>wDtoVnv=VCY4H!4hb9*9f6JAZy0ER{ zF@SM)F>xSzJ6pm#Y8(D?AZYTnO(+w!OUy9V-amuW=1hpOQG~-CZI7l)UF7Qb`mOp8 zbu6837KlxfmzylT*_;~+HL-Z*s<>xOp}{;OK5XZ5-2K|v#SpKF2cc5EZGQJEE zJ7Zgm#+-7u(Uo6KS|(Ipnv^OjKWlzQM~DwZ=FQ5t70pllk9t@;>Uz5H1+?2y7qPiD zv-)ZU!{|?P3wImkPcq~Ktl8~$ZXA}hw)ot*1?wy9FaLO(G@_t|MCo3mLnggf_dh-b zBwwt|YaC=n%3sb#_LbL|gMJ=2%Jf{8rJveaYL}iqvf4P(je@AwTf1#-=p%E--XUV4 z(5s){9I8)Vyzt9)9X-&!A~{FsjLpeaT8$+*bErKX%>H^0>AI4-T+! zG%uHFrRbFn&qfHQmDa6p*p_bF-MCZ!W`_0YduG$f>qW-j9tIe=js>k&rpwrgz;8}T zK$^TXG$rJCxkTbjhKYs7^GOjtp> z+uPC5+Byl;sSr6;hw8K7zsEoLLSg&U%cdq4kgSaAyR8hG3Sdq;JUTl1SYy07m&8H;sCDM^k9qxp1S`?D3+Nmyg3ze4qgWbyB$!+;D#k; zenbcgncmWK#88rB~c)np`ovzg6MIJ zgWc+Kh@s)*uAUw(FRwQ&GCmrhFf5>?r1S$=zF0dAHb>BY`vmIH4WJ5c4-RC=#spkJ z-c1C!k?F8znxUaBGl8qw;$V2>Pu^z-WMuj-Dkf+kjuFZ{ySIX zwtZxPA>9YXaS=;tNeRvUb`Ibb)6%5a^}0a+vH zNDK7>%N48;!1HLnCucUa!lD5e1)^st6bRcz zTF*dVu(Cls-eMdboa8ByH<{TWnM zon=X>(@pR^2QMWMAQW;1s<)nrNlbsH$o|mXQKi)_${`9y5i3=1@9O?o9#m9J%pxed z`WjZcDFEJ^j8RzC)|Lx2`f*V3IfmBvs?5uUU4fFUk36UEnBV2AqZfpP{xPWoz4D++c}@uo^foUK|)`#x{c- zw&`TOCpY3uM}AfuA9R@zy(#bnFuP?SCy)D^15V}6j~`A~f`5QgI;bhRt&MHkLk$6r zS44i>Umk&@jzBLkHehq;85%BqYH@XSmAn;O>n>Mpf>=U;tA{AKl7MLt{6Qp|Kv6~> zXg?TR|FV6-7x9?kTPKSwziM^gpz1Ew={*N6p2Pn8pJ{u@%@x!u$X`Jw0c}Yoo z`+cHxN$`Y;1mhXlxj|_9obTXUIOJrhu+r4j1dSk^f9=kv@Wvo>d0A3Y(DhAqHDY`q zf3oScl@qO80Uq&PXwi2dgUbhD>M^kQ)yhmt`!_V5w!s0O0sOuD1_si>)O^`@Z_T)9 z066zN;^GE=o1b}s8J?P)%mHGY@BfS!X(1X|@HKuM@6Tz2>qMsDcg5+OZOFlgi_98q z>5y;;_X#JM0MI|~;{io_z0crj5I5$O4sPcCKt-|tRH(@+Tq))K$Zk@jRZAYAt4p$KHmPBSJ}cTt)Z&Z zde+z|69~kouDLmD;M-q+Dt=8+NXW7Rbmz}L6}5?kpiDwanhM^W`poCf1qWQt+1|!U zhI`e$_1FYXb2lt12vvgps=TK(L{R(hpNeR~YYwatQ&Uq5%gR0!4S?A6Z4hIym3-E1 z`}$qk&FZcNk6&L!uO`mAWrA{=1_)-tF?$Clo}6HU=6TaLs=O&G3tISEzc;kcTcw1`SWT##Jo{~_!6ACi#&=|>}1P!)RuVh32P zlIm!|zh^7SaYhRu(WYi$!2;<6+;WI3+^=6gA)vcF*>X=7B&gw!m$x?#3Y0kmHeUCF z6c-IOb-3nZz6IbHz27t6W@!NjN5s0k+ZNH&8X6j!&jG!`V>}su|L`~r7QCNrVSNG+ z*DO%kf*kPc>gp26bF0EhhF~Us=@JeK6qoP1xTtDrk%9v`C^}PtfCy;U;epj=FKnqi zM6VA5_s;IFlAD__NT1$EbiW~K5;CpuS@npIJ2?+Y?b;qZUC5N8;MzwF-%*HN8Va(S zdcRF(kfr+++8ILu(iaDy+?h9g7lnd70)ZO*ak`<4j6wx9vw;X*Y~O9fJ^*o^=7xX* zYFptZ{X`d3zcw6DUQ=!U0{awE6^8(WxQ)a8(+Tj4qSp=s%#csu zLx5ndt1K_?j-%nO0+yTKYUF)LO|hz~vx$&&8i7AD;v)hVz8Og3g0>10wBYK1O95NM z3IbOxM?bV7(`>VSJ@YFIb{M9#6hyG`Q5(~5sUX#aymwaS47BtXxzVt2AW`@lWE;Re zFb`5sL;?_=JH-=nA`pkQJvllI=P7`?b3*e%xKH9!U+*G$)4u#?I!zbSX(Q`X+e+3r| zb$GhK-qXKz>j4;XE`enen250DGl_z~G_UEXRw$z*{~O~mLWKYT literal 0 HcmV?d00001 diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..6c49fc6 --- /dev/null +++ b/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833