From da30fc00744002f946dc9581ef0071060ad58645 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Thu, 25 Jun 2026 16:09:12 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: laion/GLM-4.6-stackoverflow-32eps-65k-fixeps_Qwen3-8B Source: Original Platform --- .gitattributes | 56 +++ README.md | 59 +++ added_tokens.json | 28 ++ chat_template.jinja | 89 ++++ config.json | 68 +++ configuration.json | 1 + generation_config.json | 12 + merges.txt | 3 + model-00001-of-00004.safetensors | 3 + model-00002-of-00004.safetensors | 3 + model-00003-of-00004.safetensors | 3 + model-00004-of-00004.safetensors | 3 + model.safetensors.index.json | 407 +++++++++++++++ run_summary.json | 12 + special_tokens_map.json | 31 ++ tokenizer.json | 3 + tokenizer_config.json | 240 +++++++++ trainer_log.jsonl | 821 +++++++++++++++++++++++++++++++ training_args.bin | 3 + vocab.json | 3 + 20 files changed, 1848 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 chat_template.jinja create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 merges.txt create mode 100644 model-00001-of-00004.safetensors create mode 100644 model-00002-of-00004.safetensors create mode 100644 model-00003-of-00004.safetensors create mode 100644 model-00004-of-00004.safetensors create mode 100644 model.safetensors.index.json create mode 100644 run_summary.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 trainer_log.jsonl create mode 100644 training_args.bin create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 
100644 index 0000000..96d2bf7 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,56 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text + + +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text + +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs 
diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +merges.txt filter=lfs diff=lfs merge=lfs -text +model-00002-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +model-00001-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +model-00003-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text +training_args.bin filter=lfs diff=lfs merge=lfs -text +vocab.json filter=lfs diff=lfs merge=lfs -text +model-00004-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..a1cd8cf --- /dev/null +++ b/README.md @@ -0,0 +1,59 @@ +--- +library_name: transformers +license: apache-2.0 +base_model: Qwen/Qwen3-8B +tags: +- llama-factory +- generated_from_trainer +model-index: +- name: GLM-4_6-stackoverflow-32eps-65k-fixeps + results: [] +--- + + + +# GLM-4_6-stackoverflow-32eps-65k-fixeps + +This model is a fine-tuned version of [Qwen/Qwen3-8B](https://huggingface.co/Qwen/Qwen3-8B) on an unknown dataset. 
+ +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 4e-05 +- train_batch_size: 1 +- eval_batch_size: 8 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 16 +- total_train_batch_size: 16 +- total_eval_batch_size: 128 +- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.98) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 7.0 + +### Training results + + + +### Framework versions + +- Transformers 4.56.0 +- Pytorch 2.9.0+cu128 +- Datasets 4.4.1 +- Tokenizers 0.22.1 diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..b54f913 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,28 @@ +{ + "</think>": 151668, + "</tool_call>": 151658, + "</tool_response>": 151666, + "<think>": 151667, + "<tool_call>": 151657, + "<tool_response>": 151665, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..01be9b3 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,89 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0].role == 'system' %} + {{- messages[0].content + '\n\n' }} + {%- endif %} + {{- "# Tools\n\nYou may call one or more functions to 
assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }} +{%- else %} + {%- if messages[0].role == 'system' %} + {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %} +{%- for message in messages[::-1] %} + {%- set index = (messages|length - 1) - loop.index0 %} + {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %} + {%- set ns.multi_step_tool = false %} + {%- set ns.last_query_index = index %} + {%- endif %} +{%- endfor %} +{%- for message in messages %} + {%- if message.content is string %} + {%- set content = message.content %} + {%- else %} + {%- set content = '' %} + {%- endif %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) %} + {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {%- set reasoning_content = '' %} + {%- if message.reasoning_content is string %} + {%- set reasoning_content = message.reasoning_content %} + {%- else %} + {%- if '</think>' in content %} + {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %} + {%- set content = content.split('</think>')[-1].lstrip('\n') %} + {%- endif %} + {%- endif %} + {%- if loop.index0 > ns.last_query_index %} + {%- if loop.last or (not loop.last and reasoning_content) %} + {{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- else %} 
+ {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- if message.tool_calls %} + {%- for tool_call in message.tool_calls %} + {%- if (loop.first and content) or (not loop.first) %} + {{- '\n' }} + {%- endif %} + {%- if tool_call.function %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {%- if tool_call.arguments is string %} + {{- tool_call.arguments }} + {%- else %} + {{- tool_call.arguments | tojson }} + {%- endif %} + {{- '}\n' }} + {%- endfor %} + {%- endif %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n\n' }} + {{- content }} + {{- '\n' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} + {%- if enable_thinking is defined and enable_thinking is false %} + {{- '\n\n\n\n' }} + {%- endif %} +{%- endif %} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..d04042c --- /dev/null +++ b/config.json @@ -0,0 +1,68 @@ +{ + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "eos_token_id": 151645, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 12288, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + 
"full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 36, + "model_type": "qwen3", + "num_attention_heads": 32, + "num_hidden_layers": 36, + "num_key_value_heads": 8, + "pad_token_id": 151643, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": false, + "transformers_version": "4.56.0", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..eff07c5 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,12 @@ +{ + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "temperature": 0.6, + "top_k": 20, + "top_p": 0.95, + "transformers_version": "4.56.0" +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model-00001-of-00004.safetensors b/model-00001-of-00004.safetensors new file mode 100644 index 0000000..97c89f3 --- /dev/null +++ b/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872677d9be956e6146dfc5c6d6d0b37a1286b2341a4ec7686d809402e88ccdee +size 4902257696 diff --git 
a/model-00002-of-00004.safetensors b/model-00002-of-00004.safetensors new file mode 100644 index 0000000..7b7838d --- /dev/null +++ b/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d884622781e091e874fc70e53b01fd216fde6321e24018d37b2a42e2a499bf29 +size 4915960368 diff --git a/model-00003-of-00004.safetensors b/model-00003-of-00004.safetensors new file mode 100644 index 0000000..cb46a92 --- /dev/null +++ b/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f383d901aa0ef0c9466c5f4afd19056441b0f36b3246a15d162d05f6f5436163 +size 4983068496 diff --git a/model-00004-of-00004.safetensors b/model-00004-of-00004.safetensors new file mode 100644 index 0000000..6e45ba8 --- /dev/null +++ b/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c26c91c92e8211993753971b1d48c73a174e744746898ebeb85e6da5b6bcdd29 +size 1580230264 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..ba886c0 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,407 @@ +{ + "metadata": { + "total_parameters": 308224, + "total_size": 16381470720 + }, + "weight_map": { + "lm_head.weight": "model-00004-of-00004.safetensors", + "model.embed_tokens.weight": "model-00001-of-00004.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.o_proj.weight": 
"model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + 
"model.layers.10.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.down_proj.weight": 
"model-00002-of-00004.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + 
"model.layers.15.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_proj.weight": 
"model-00002-of-00004.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + 
"model.layers.19.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.20.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.input_layernorm.weight": 
"model-00002-of-00004.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.23.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + 
"model.layers.23.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_norm.weight": 
"model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + 
"model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.v_proj.weight": 
"model-00003-of-00004.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.30.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.gate_proj.weight": 
"model-00003-of-00004.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + 
"model.layers.33.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.input_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.down_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.gate_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.up_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.k_norm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.self_attn.o_proj.weight": 
"model-00004-of-00004.safetensors", + "model.layers.35.self_attn.q_norm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.v_proj.weight": 
"model-00001-of-00004.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.gate_proj.weight": 
"model-00001-of-00004.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.norm.weight": "model-00004-of-00004.safetensors" + } +} diff --git a/run_summary.json b/run_summary.json new file mode 100644 index 0000000..a2bec40 --- /dev/null +++ b/run_summary.json @@ -0,0 +1,12 @@ +{ + "agent_name": null, + "training_start": null, + "training_end": null, + "created_by": "DCAgent", + "base_model_name": "Qwen/Qwen3-8B", + "dataset_name": "penfever/GLM-4.6-stackexchange-overflow-sandboxes-32eps-65k", + 
"training_type": "SFT", + "training_parameters": "https://huggingface.co/DCAgent2/GLM-4_6-stackoverflow-32eps-65k-fixeps/blob/main/config.json", + "wandb_link": "https://wandb.ai/dogml/dc-agent/runs/GLM-4.6-stackoverflow-32eps-65k-fixeps_Qwen3-8B", + "traces_location_s3": null +} \ No newline at end of file diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..ac23c0a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..cd71f61 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..e9dc937 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,240 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, 
+ "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + 
"151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151665": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151666": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151667": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151668": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 32768, + "pad_token": "<|endoftext|>", + "padding_side": 
"right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..1a93863 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,821 @@ +{"current_steps": 5, "total_steps": 4102, "loss": 0.7356, "lr": 3.892944038929441e-07, "epoch": 0.008532423208191127, "percentage": 0.12, "elapsed_time": "0:00:34", "remaining_time": "7:50:14"} +{"current_steps": 10, "total_steps": 4102, "loss": 0.7425, "lr": 8.759124087591242e-07, "epoch": 0.017064846416382253, "percentage": 0.24, "elapsed_time": "0:00:59", "remaining_time": "6:43:33"} +{"current_steps": 15, "total_steps": 4102, "loss": 0.6855, "lr": 1.3625304136253043e-06, "epoch": 0.025597269624573378, "percentage": 0.37, "elapsed_time": "0:01:19", "remaining_time": "6:00:38"} +{"current_steps": 20, "total_steps": 4102, "loss": 0.6368, "lr": 1.8491484184914844e-06, "epoch": 0.034129692832764506, "percentage": 0.49, "elapsed_time": "0:01:54", "remaining_time": "6:29:05"} +{"current_steps": 25, "total_steps": 4102, "loss": 0.6536, "lr": 2.3357664233576643e-06, "epoch": 0.042662116040955635, "percentage": 0.61, "elapsed_time": "0:02:18", "remaining_time": "6:16:31"} +{"current_steps": 30, "total_steps": 4102, "loss": 0.6279, "lr": 2.8223844282238443e-06, "epoch": 0.051194539249146756, "percentage": 0.73, "elapsed_time": "0:02:40", "remaining_time": "6:03:41"} +{"current_steps": 35, "total_steps": 4102, "loss": 0.5787, "lr": 3.3090024330900246e-06, "epoch": 0.059726962457337884, "percentage": 0.85, "elapsed_time": "0:03:04", "remaining_time": "5:58:15"} +{"current_steps": 40, "total_steps": 4102, "loss": 0.5466, "lr": 3.7956204379562045e-06, "epoch": 0.06825938566552901, "percentage": 0.98, "elapsed_time": "0:03:30", "remaining_time": "5:56:53"} +{"current_steps": 45, "total_steps": 4102, "loss": 0.5302, "lr": 4.282238442822385e-06, "epoch": 0.07679180887372014, "percentage": 1.1, "elapsed_time": "0:03:56", 
"remaining_time": "5:54:38"} +{"current_steps": 50, "total_steps": 4102, "loss": 0.5127, "lr": 4.768856447688564e-06, "epoch": 0.08532423208191127, "percentage": 1.22, "elapsed_time": "0:04:19", "remaining_time": "5:50:51"} +{"current_steps": 55, "total_steps": 4102, "loss": 0.5237, "lr": 5.255474452554746e-06, "epoch": 0.09385665529010238, "percentage": 1.34, "elapsed_time": "0:04:38", "remaining_time": "5:41:25"} +{"current_steps": 60, "total_steps": 4102, "loss": 0.4872, "lr": 5.742092457420925e-06, "epoch": 0.10238907849829351, "percentage": 1.46, "elapsed_time": "0:05:00", "remaining_time": "5:37:23"} +{"current_steps": 65, "total_steps": 4102, "loss": 0.4914, "lr": 6.2287104622871054e-06, "epoch": 0.11092150170648464, "percentage": 1.58, "elapsed_time": "0:05:21", "remaining_time": "5:33:10"} +{"current_steps": 70, "total_steps": 4102, "loss": 0.4769, "lr": 6.715328467153285e-06, "epoch": 0.11945392491467577, "percentage": 1.71, "elapsed_time": "0:05:43", "remaining_time": "5:29:56"} +{"current_steps": 75, "total_steps": 4102, "loss": 0.4622, "lr": 7.201946472019465e-06, "epoch": 0.12798634812286688, "percentage": 1.83, "elapsed_time": "0:06:05", "remaining_time": "5:26:47"} +{"current_steps": 80, "total_steps": 4102, "loss": 0.4338, "lr": 7.688564476885646e-06, "epoch": 0.13651877133105803, "percentage": 1.95, "elapsed_time": "0:06:28", "remaining_time": "5:25:27"} +{"current_steps": 85, "total_steps": 4102, "loss": 0.4597, "lr": 8.175182481751825e-06, "epoch": 0.14505119453924914, "percentage": 2.07, "elapsed_time": "0:06:50", "remaining_time": "5:23:36"} +{"current_steps": 90, "total_steps": 4102, "loss": 0.4316, "lr": 8.661800486618006e-06, "epoch": 0.15358361774744028, "percentage": 2.19, "elapsed_time": "0:07:11", "remaining_time": "5:20:39"} +{"current_steps": 95, "total_steps": 4102, "loss": 0.4183, "lr": 9.148418491484186e-06, "epoch": 0.1621160409556314, "percentage": 2.32, "elapsed_time": "0:07:31", "remaining_time": "5:17:18"} +{"current_steps": 
100, "total_steps": 4102, "loss": 0.4309, "lr": 9.635036496350367e-06, "epoch": 0.17064846416382254, "percentage": 2.44, "elapsed_time": "0:08:01", "remaining_time": "5:21:05"} +{"current_steps": 105, "total_steps": 4102, "loss": 0.4354, "lr": 1.0121654501216547e-05, "epoch": 0.17918088737201365, "percentage": 2.56, "elapsed_time": "0:08:21", "remaining_time": "5:17:55"} +{"current_steps": 110, "total_steps": 4102, "loss": 0.4227, "lr": 1.0608272506082726e-05, "epoch": 0.18771331058020477, "percentage": 2.68, "elapsed_time": "0:08:44", "remaining_time": "5:17:29"} +{"current_steps": 115, "total_steps": 4102, "loss": 0.4172, "lr": 1.1094890510948906e-05, "epoch": 0.1962457337883959, "percentage": 2.8, "elapsed_time": "0:09:08", "remaining_time": "5:17:00"} +{"current_steps": 120, "total_steps": 4102, "loss": 0.4352, "lr": 1.1581508515815085e-05, "epoch": 0.20477815699658702, "percentage": 2.93, "elapsed_time": "0:09:32", "remaining_time": "5:16:28"} +{"current_steps": 125, "total_steps": 4102, "loss": 0.4305, "lr": 1.2068126520681266e-05, "epoch": 0.21331058020477817, "percentage": 3.05, "elapsed_time": "0:09:55", "remaining_time": "5:15:58"} +{"current_steps": 130, "total_steps": 4102, "loss": 0.3958, "lr": 1.2554744525547446e-05, "epoch": 0.22184300341296928, "percentage": 3.17, "elapsed_time": "0:10:19", "remaining_time": "5:15:41"} +{"current_steps": 135, "total_steps": 4102, "loss": 0.4074, "lr": 1.3041362530413625e-05, "epoch": 0.23037542662116042, "percentage": 3.29, "elapsed_time": "0:10:46", "remaining_time": "5:16:40"} +{"current_steps": 140, "total_steps": 4102, "loss": 0.3898, "lr": 1.3527980535279805e-05, "epoch": 0.23890784982935154, "percentage": 3.41, "elapsed_time": "0:11:08", "remaining_time": "5:15:06"} +{"current_steps": 145, "total_steps": 4102, "loss": 0.3859, "lr": 1.4014598540145988e-05, "epoch": 0.24744027303754265, "percentage": 3.53, "elapsed_time": "0:11:29", "remaining_time": "5:13:46"} +{"current_steps": 150, "total_steps": 4102, 
"loss": 0.3916, "lr": 1.4501216545012167e-05, "epoch": 0.25597269624573377, "percentage": 3.66, "elapsed_time": "0:11:53", "remaining_time": "5:13:26"} +{"current_steps": 155, "total_steps": 4102, "loss": 0.3796, "lr": 1.4987834549878347e-05, "epoch": 0.2645051194539249, "percentage": 3.78, "elapsed_time": "0:12:15", "remaining_time": "5:11:59"} +{"current_steps": 160, "total_steps": 4102, "loss": 0.392, "lr": 1.5474452554744528e-05, "epoch": 0.27303754266211605, "percentage": 3.9, "elapsed_time": "0:12:38", "remaining_time": "5:11:21"} +{"current_steps": 165, "total_steps": 4102, "loss": 0.3866, "lr": 1.5961070559610707e-05, "epoch": 0.2815699658703072, "percentage": 4.02, "elapsed_time": "0:13:02", "remaining_time": "5:11:11"} +{"current_steps": 170, "total_steps": 4102, "loss": 0.3851, "lr": 1.6447688564476887e-05, "epoch": 0.2901023890784983, "percentage": 4.14, "elapsed_time": "0:13:30", "remaining_time": "5:12:27"} +{"current_steps": 175, "total_steps": 4102, "loss": 0.383, "lr": 1.6934306569343066e-05, "epoch": 0.2986348122866894, "percentage": 4.27, "elapsed_time": "0:13:55", "remaining_time": "5:12:31"} +{"current_steps": 180, "total_steps": 4102, "loss": 0.3717, "lr": 1.742092457420925e-05, "epoch": 0.30716723549488056, "percentage": 4.39, "elapsed_time": "0:14:19", "remaining_time": "5:12:08"} +{"current_steps": 185, "total_steps": 4102, "loss": 0.3776, "lr": 1.790754257907543e-05, "epoch": 0.31569965870307165, "percentage": 4.51, "elapsed_time": "0:14:42", "remaining_time": "5:11:18"} +{"current_steps": 190, "total_steps": 4102, "loss": 0.3836, "lr": 1.8394160583941608e-05, "epoch": 0.3242320819112628, "percentage": 4.63, "elapsed_time": "0:15:08", "remaining_time": "5:11:43"} +{"current_steps": 195, "total_steps": 4102, "loss": 0.3655, "lr": 1.8880778588807788e-05, "epoch": 0.33276450511945393, "percentage": 4.75, "elapsed_time": "0:15:30", "remaining_time": "5:10:50"} +{"current_steps": 200, "total_steps": 4102, "loss": 0.3746, "lr": 
1.9367396593673967e-05, "epoch": 0.3412969283276451, "percentage": 4.88, "elapsed_time": "0:15:59", "remaining_time": "5:11:53"} +{"current_steps": 205, "total_steps": 4102, "loss": 0.3718, "lr": 1.9854014598540147e-05, "epoch": 0.34982935153583616, "percentage": 5.0, "elapsed_time": "0:17:20", "remaining_time": "5:29:37"} +{"current_steps": 210, "total_steps": 4102, "loss": 0.3785, "lr": 2.034063260340633e-05, "epoch": 0.3583617747440273, "percentage": 5.12, "elapsed_time": "0:17:41", "remaining_time": "5:27:51"} +{"current_steps": 215, "total_steps": 4102, "loss": 0.3862, "lr": 2.082725060827251e-05, "epoch": 0.36689419795221845, "percentage": 5.24, "elapsed_time": "0:18:00", "remaining_time": "5:25:41"} +{"current_steps": 220, "total_steps": 4102, "loss": 0.3769, "lr": 2.131386861313869e-05, "epoch": 0.37542662116040953, "percentage": 5.36, "elapsed_time": "0:18:25", "remaining_time": "5:25:12"} +{"current_steps": 225, "total_steps": 4102, "loss": 0.3848, "lr": 2.1800486618004868e-05, "epoch": 0.3839590443686007, "percentage": 5.49, "elapsed_time": "0:18:46", "remaining_time": "5:23:34"} +{"current_steps": 230, "total_steps": 4102, "loss": 0.359, "lr": 2.2287104622871048e-05, "epoch": 0.3924914675767918, "percentage": 5.61, "elapsed_time": "0:19:07", "remaining_time": "5:21:57"} +{"current_steps": 235, "total_steps": 4102, "loss": 0.3654, "lr": 2.2773722627737227e-05, "epoch": 0.40102389078498296, "percentage": 5.73, "elapsed_time": "0:19:27", "remaining_time": "5:20:14"} +{"current_steps": 240, "total_steps": 4102, "loss": 0.3585, "lr": 2.3260340632603407e-05, "epoch": 0.40955631399317405, "percentage": 5.85, "elapsed_time": "0:19:51", "remaining_time": "5:19:34"} +{"current_steps": 245, "total_steps": 4102, "loss": 0.3486, "lr": 2.374695863746959e-05, "epoch": 0.4180887372013652, "percentage": 5.97, "elapsed_time": "0:20:13", "remaining_time": "5:18:31"} +{"current_steps": 250, "total_steps": 4102, "loss": 0.3739, "lr": 2.423357664233577e-05, "epoch": 
0.42662116040955633, "percentage": 6.09, "elapsed_time": "0:20:44", "remaining_time": "5:19:33"} +{"current_steps": 255, "total_steps": 4102, "loss": 0.3659, "lr": 2.472019464720195e-05, "epoch": 0.4351535836177474, "percentage": 6.22, "elapsed_time": "0:21:07", "remaining_time": "5:18:34"} +{"current_steps": 260, "total_steps": 4102, "loss": 0.366, "lr": 2.5206812652068128e-05, "epoch": 0.44368600682593856, "percentage": 6.34, "elapsed_time": "0:21:25", "remaining_time": "5:16:40"} +{"current_steps": 265, "total_steps": 4102, "loss": 0.3789, "lr": 2.5693430656934308e-05, "epoch": 0.4522184300341297, "percentage": 6.46, "elapsed_time": "0:21:45", "remaining_time": "5:15:09"} +{"current_steps": 270, "total_steps": 4102, "loss": 0.3588, "lr": 2.6180048661800487e-05, "epoch": 0.46075085324232085, "percentage": 6.58, "elapsed_time": "0:22:04", "remaining_time": "5:13:12"} +{"current_steps": 275, "total_steps": 4102, "loss": 0.3663, "lr": 2.6666666666666667e-05, "epoch": 0.46928327645051193, "percentage": 6.7, "elapsed_time": "0:22:27", "remaining_time": "5:12:27"} +{"current_steps": 280, "total_steps": 4102, "loss": 0.3572, "lr": 2.7153284671532846e-05, "epoch": 0.4778156996587031, "percentage": 6.83, "elapsed_time": "0:22:50", "remaining_time": "5:11:52"} +{"current_steps": 285, "total_steps": 4102, "loss": 0.3509, "lr": 2.7639902676399032e-05, "epoch": 0.4863481228668942, "percentage": 6.95, "elapsed_time": "0:23:16", "remaining_time": "5:11:38"} +{"current_steps": 290, "total_steps": 4102, "loss": 0.3713, "lr": 2.8126520681265212e-05, "epoch": 0.4948805460750853, "percentage": 7.07, "elapsed_time": "0:23:36", "remaining_time": "5:10:26"} +{"current_steps": 295, "total_steps": 4102, "loss": 0.347, "lr": 2.861313868613139e-05, "epoch": 0.5034129692832765, "percentage": 7.19, "elapsed_time": "0:24:00", "remaining_time": "5:09:48"} +{"current_steps": 300, "total_steps": 4102, "loss": 0.3588, "lr": 2.909975669099757e-05, "epoch": 0.5119453924914675, "percentage": 7.31, 
"elapsed_time": "0:24:22", "remaining_time": "5:08:56"} +{"current_steps": 305, "total_steps": 4102, "loss": 0.3631, "lr": 2.958637469586375e-05, "epoch": 0.5204778156996587, "percentage": 7.44, "elapsed_time": "0:24:48", "remaining_time": "5:08:56"} +{"current_steps": 310, "total_steps": 4102, "loss": 0.3514, "lr": 3.007299270072993e-05, "epoch": 0.5290102389078498, "percentage": 7.56, "elapsed_time": "0:25:10", "remaining_time": "5:07:54"} +{"current_steps": 315, "total_steps": 4102, "loss": 0.3544, "lr": 3.055961070559611e-05, "epoch": 0.537542662116041, "percentage": 7.68, "elapsed_time": "0:25:31", "remaining_time": "5:06:47"} +{"current_steps": 320, "total_steps": 4102, "loss": 0.3535, "lr": 3.104622871046229e-05, "epoch": 0.5460750853242321, "percentage": 7.8, "elapsed_time": "0:25:50", "remaining_time": "5:05:30"} +{"current_steps": 325, "total_steps": 4102, "loss": 0.3587, "lr": 3.153284671532847e-05, "epoch": 0.5546075085324232, "percentage": 7.92, "elapsed_time": "0:26:11", "remaining_time": "5:04:20"} +{"current_steps": 330, "total_steps": 4102, "loss": 0.3552, "lr": 3.201946472019465e-05, "epoch": 0.5631399317406144, "percentage": 8.04, "elapsed_time": "0:26:33", "remaining_time": "5:03:32"} +{"current_steps": 335, "total_steps": 4102, "loss": 0.3476, "lr": 3.250608272506083e-05, "epoch": 0.5716723549488054, "percentage": 8.17, "elapsed_time": "0:27:01", "remaining_time": "5:03:49"} +{"current_steps": 340, "total_steps": 4102, "loss": 0.3442, "lr": 3.299270072992701e-05, "epoch": 0.5802047781569966, "percentage": 8.29, "elapsed_time": "0:27:27", "remaining_time": "5:03:49"} +{"current_steps": 345, "total_steps": 4102, "loss": 0.3513, "lr": 3.3479318734793186e-05, "epoch": 0.5887372013651877, "percentage": 8.41, "elapsed_time": "0:27:53", "remaining_time": "5:03:41"} +{"current_steps": 350, "total_steps": 4102, "loss": 0.3482, "lr": 3.396593673965937e-05, "epoch": 0.5972696245733788, "percentage": 8.53, "elapsed_time": "0:28:18", "remaining_time": 
"5:03:29"} +{"current_steps": 355, "total_steps": 4102, "loss": 0.3462, "lr": 3.4452554744525545e-05, "epoch": 0.60580204778157, "percentage": 8.65, "elapsed_time": "0:28:39", "remaining_time": "5:02:30"} +{"current_steps": 360, "total_steps": 4102, "loss": 0.3543, "lr": 3.4939172749391735e-05, "epoch": 0.6143344709897611, "percentage": 8.78, "elapsed_time": "0:29:00", "remaining_time": "5:01:34"} +{"current_steps": 365, "total_steps": 4102, "loss": 0.3555, "lr": 3.542579075425791e-05, "epoch": 0.6228668941979523, "percentage": 8.9, "elapsed_time": "0:29:22", "remaining_time": "5:00:45"} +{"current_steps": 370, "total_steps": 4102, "loss": 0.358, "lr": 3.5912408759124094e-05, "epoch": 0.6313993174061433, "percentage": 9.02, "elapsed_time": "0:29:46", "remaining_time": "5:00:23"} +{"current_steps": 375, "total_steps": 4102, "loss": 0.3547, "lr": 3.639902676399027e-05, "epoch": 0.6399317406143344, "percentage": 9.14, "elapsed_time": "0:30:13", "remaining_time": "5:00:24"} +{"current_steps": 380, "total_steps": 4102, "loss": 0.3568, "lr": 3.688564476885645e-05, "epoch": 0.6484641638225256, "percentage": 9.26, "elapsed_time": "0:30:39", "remaining_time": "5:00:19"} +{"current_steps": 385, "total_steps": 4102, "loss": 0.3467, "lr": 3.737226277372263e-05, "epoch": 0.6569965870307167, "percentage": 9.39, "elapsed_time": "0:31:02", "remaining_time": "4:59:42"} +{"current_steps": 390, "total_steps": 4102, "loss": 0.3599, "lr": 3.785888077858881e-05, "epoch": 0.6655290102389079, "percentage": 9.51, "elapsed_time": "0:31:24", "remaining_time": "4:59:01"} +{"current_steps": 395, "total_steps": 4102, "loss": 0.3478, "lr": 3.8345498783454995e-05, "epoch": 0.674061433447099, "percentage": 9.63, "elapsed_time": "0:31:44", "remaining_time": "4:57:57"} +{"current_steps": 400, "total_steps": 4102, "loss": 0.3466, "lr": 3.883211678832117e-05, "epoch": 0.6825938566552902, "percentage": 9.75, "elapsed_time": "0:32:05", "remaining_time": "4:56:59"} +{"current_steps": 405, "total_steps": 
4102, "loss": 0.3418, "lr": 3.9318734793187354e-05, "epoch": 0.6911262798634812, "percentage": 9.87, "elapsed_time": "0:33:28", "remaining_time": "5:05:31"} +{"current_steps": 410, "total_steps": 4102, "loss": 0.3466, "lr": 3.980535279805353e-05, "epoch": 0.6996587030716723, "percentage": 10.0, "elapsed_time": "0:33:51", "remaining_time": "5:04:50"} +{"current_steps": 415, "total_steps": 4102, "loss": 0.3322, "lr": 3.999993479904927e-05, "epoch": 0.7081911262798635, "percentage": 10.12, "elapsed_time": "0:34:11", "remaining_time": "5:03:43"} +{"current_steps": 420, "total_steps": 4102, "loss": 0.3455, "lr": 3.999953635033432e-05, "epoch": 0.7167235494880546, "percentage": 10.24, "elapsed_time": "0:34:33", "remaining_time": "5:02:57"} +{"current_steps": 425, "total_steps": 4102, "loss": 0.3248, "lr": 3.999877568286252e-05, "epoch": 0.7252559726962458, "percentage": 10.36, "elapsed_time": "0:34:54", "remaining_time": "5:01:59"} +{"current_steps": 430, "total_steps": 4102, "loss": 0.3436, "lr": 3.999765281041059e-05, "epoch": 0.7337883959044369, "percentage": 10.48, "elapsed_time": "0:35:17", "remaining_time": "5:01:19"} +{"current_steps": 435, "total_steps": 4102, "loss": 0.3317, "lr": 3.999616775331529e-05, "epoch": 0.742320819112628, "percentage": 10.6, "elapsed_time": "0:35:47", "remaining_time": "5:01:43"} +{"current_steps": 440, "total_steps": 4102, "loss": 0.3522, "lr": 3.9994320538473e-05, "epoch": 0.7508532423208191, "percentage": 10.73, "elapsed_time": "0:36:12", "remaining_time": "5:01:19"} +{"current_steps": 445, "total_steps": 4102, "loss": 0.3622, "lr": 3.99921111993393e-05, "epoch": 0.7593856655290102, "percentage": 10.85, "elapsed_time": "0:36:32", "remaining_time": "5:00:14"} +{"current_steps": 450, "total_steps": 4102, "loss": 0.3295, "lr": 3.998953977592832e-05, "epoch": 0.7679180887372014, "percentage": 10.97, "elapsed_time": "0:36:57", "remaining_time": "4:59:56"} +{"current_steps": 455, "total_steps": 4102, "loss": 0.3407, "lr": 
3.998660631481203e-05, "epoch": 0.7764505119453925, "percentage": 11.09, "elapsed_time": "0:37:24", "remaining_time": "4:59:52"} +{"current_steps": 460, "total_steps": 4102, "loss": 0.3335, "lr": 3.998331086911939e-05, "epoch": 0.7849829351535836, "percentage": 11.21, "elapsed_time": "0:37:49", "remaining_time": "4:59:24"} +{"current_steps": 465, "total_steps": 4102, "loss": 0.3436, "lr": 3.9979653498535394e-05, "epoch": 0.7935153583617748, "percentage": 11.34, "elapsed_time": "0:38:09", "remaining_time": "4:58:27"} +{"current_steps": 470, "total_steps": 4102, "loss": 0.3535, "lr": 3.9975634269299994e-05, "epoch": 0.8020477815699659, "percentage": 11.46, "elapsed_time": "0:38:34", "remaining_time": "4:58:05"} +{"current_steps": 475, "total_steps": 4102, "loss": 0.3437, "lr": 3.997125325420689e-05, "epoch": 0.810580204778157, "percentage": 11.58, "elapsed_time": "0:38:59", "remaining_time": "4:57:47"} +{"current_steps": 480, "total_steps": 4102, "loss": 0.346, "lr": 3.9966510532602206e-05, "epoch": 0.8191126279863481, "percentage": 11.7, "elapsed_time": "0:39:20", "remaining_time": "4:56:53"} +{"current_steps": 485, "total_steps": 4102, "loss": 0.3599, "lr": 3.996140619038308e-05, "epoch": 0.8276450511945392, "percentage": 11.82, "elapsed_time": "0:39:41", "remaining_time": "4:55:57"} +{"current_steps": 490, "total_steps": 4102, "loss": 0.3407, "lr": 3.995594031999607e-05, "epoch": 0.8361774744027304, "percentage": 11.95, "elapsed_time": "0:40:03", "remaining_time": "4:55:14"} +{"current_steps": 495, "total_steps": 4102, "loss": 0.3471, "lr": 3.9950113020435515e-05, "epoch": 0.8447098976109215, "percentage": 12.07, "elapsed_time": "0:40:24", "remaining_time": "4:54:28"} +{"current_steps": 500, "total_steps": 4102, "loss": 0.3188, "lr": 3.9943924397241716e-05, "epoch": 0.8532423208191127, "percentage": 12.19, "elapsed_time": "0:40:54", "remaining_time": "4:54:42"} +{"current_steps": 505, "total_steps": 4102, "loss": 0.3482, "lr": 3.993737456249905e-05, "epoch": 
0.8617747440273038, "percentage": 12.31, "elapsed_time": "0:41:19", "remaining_time": "4:54:24"} +{"current_steps": 510, "total_steps": 4102, "loss": 0.3421, "lr": 3.9930463634833906e-05, "epoch": 0.8703071672354948, "percentage": 12.43, "elapsed_time": "0:41:42", "remaining_time": "4:53:48"} +{"current_steps": 515, "total_steps": 4102, "loss": 0.3256, "lr": 3.9923191739412586e-05, "epoch": 0.878839590443686, "percentage": 12.55, "elapsed_time": "0:42:12", "remaining_time": "4:53:57"} +{"current_steps": 520, "total_steps": 4102, "loss": 0.3391, "lr": 3.991555900793897e-05, "epoch": 0.8873720136518771, "percentage": 12.68, "elapsed_time": "0:42:33", "remaining_time": "4:53:06"} +{"current_steps": 525, "total_steps": 4102, "loss": 0.3636, "lr": 3.990756557865219e-05, "epoch": 0.8959044368600683, "percentage": 12.8, "elapsed_time": "0:42:56", "remaining_time": "4:52:34"} +{"current_steps": 530, "total_steps": 4102, "loss": 0.3392, "lr": 3.989921159632412e-05, "epoch": 0.9044368600682594, "percentage": 12.92, "elapsed_time": "0:43:22", "remaining_time": "4:52:16"} +{"current_steps": 535, "total_steps": 4102, "loss": 0.3386, "lr": 3.9890497212256704e-05, "epoch": 0.9129692832764505, "percentage": 13.04, "elapsed_time": "0:43:48", "remaining_time": "4:52:02"} +{"current_steps": 540, "total_steps": 4102, "loss": 0.344, "lr": 3.9881422584279276e-05, "epoch": 0.9215017064846417, "percentage": 13.16, "elapsed_time": "0:44:10", "remaining_time": "4:51:21"} +{"current_steps": 545, "total_steps": 4102, "loss": 0.3305, "lr": 3.987198787674566e-05, "epoch": 0.9300341296928327, "percentage": 13.29, "elapsed_time": "0:44:33", "remaining_time": "4:50:50"} +{"current_steps": 550, "total_steps": 4102, "loss": 0.3322, "lr": 3.9862193260531234e-05, "epoch": 0.9385665529010239, "percentage": 13.41, "elapsed_time": "0:44:58", "remaining_time": "4:50:28"} +{"current_steps": 555, "total_steps": 4102, "loss": 0.3325, "lr": 3.98520389130298e-05, "epoch": 0.947098976109215, "percentage": 
13.53, "elapsed_time": "0:45:18", "remaining_time": "4:49:32"} +{"current_steps": 560, "total_steps": 4102, "loss": 0.3179, "lr": 3.9841525018150354e-05, "epoch": 0.9556313993174061, "percentage": 13.65, "elapsed_time": "0:45:37", "remaining_time": "4:48:35"} +{"current_steps": 565, "total_steps": 4102, "loss": 0.3264, "lr": 3.983065176631383e-05, "epoch": 0.9641638225255973, "percentage": 13.77, "elapsed_time": "0:46:02", "remaining_time": "4:48:14"} +{"current_steps": 570, "total_steps": 4102, "loss": 0.3233, "lr": 3.981941935444956e-05, "epoch": 0.9726962457337884, "percentage": 13.9, "elapsed_time": "0:46:24", "remaining_time": "4:47:34"} +{"current_steps": 575, "total_steps": 4102, "loss": 0.341, "lr": 3.9807827985991795e-05, "epoch": 0.9812286689419796, "percentage": 14.02, "elapsed_time": "0:46:45", "remaining_time": "4:46:49"} +{"current_steps": 580, "total_steps": 4102, "loss": 0.3343, "lr": 3.979587787087594e-05, "epoch": 0.9897610921501706, "percentage": 14.14, "elapsed_time": "0:47:06", "remaining_time": "4:46:02"} +{"current_steps": 585, "total_steps": 4102, "loss": 0.3457, "lr": 3.978356922553482e-05, "epoch": 0.9982935153583617, "percentage": 14.26, "elapsed_time": "0:47:28", "remaining_time": "4:45:27"} +{"current_steps": 590, "total_steps": 4102, "loss": 0.31, "lr": 3.977090227289469e-05, "epoch": 1.006825938566553, "percentage": 14.38, "elapsed_time": "0:47:49", "remaining_time": "4:44:38"} +{"current_steps": 595, "total_steps": 4102, "loss": 0.33, "lr": 3.9757877242371286e-05, "epoch": 1.015358361774744, "percentage": 14.51, "elapsed_time": "0:48:13", "remaining_time": "4:44:13"} +{"current_steps": 600, "total_steps": 4102, "loss": 0.3054, "lr": 3.974449436986557e-05, "epoch": 1.023890784982935, "percentage": 14.63, "elapsed_time": "0:48:35", "remaining_time": "4:43:38"} +{"current_steps": 605, "total_steps": 4102, "loss": 0.3152, "lr": 3.973075389775956e-05, "epoch": 1.0324232081911262, "percentage": 14.75, "elapsed_time": "0:49:56", 
"remaining_time": "4:48:39"} +{"current_steps": 610, "total_steps": 4102, "loss": 0.3099, "lr": 3.971665607491184e-05, "epoch": 1.0409556313993173, "percentage": 14.87, "elapsed_time": "0:50:18", "remaining_time": "4:47:56"} +{"current_steps": 615, "total_steps": 4102, "loss": 0.3271, "lr": 3.9702201156653136e-05, "epoch": 1.0494880546075085, "percentage": 14.99, "elapsed_time": "0:50:39", "remaining_time": "4:47:11"} +{"current_steps": 620, "total_steps": 4102, "loss": 0.3153, "lr": 3.9687389404781635e-05, "epoch": 1.0580204778156996, "percentage": 15.11, "elapsed_time": "0:51:05", "remaining_time": "4:46:54"} +{"current_steps": 625, "total_steps": 4102, "loss": 0.3151, "lr": 3.967222108755827e-05, "epoch": 1.0665529010238908, "percentage": 15.24, "elapsed_time": "0:51:25", "remaining_time": "4:46:07"} +{"current_steps": 630, "total_steps": 4102, "loss": 0.3072, "lr": 3.9656696479701875e-05, "epoch": 1.075085324232082, "percentage": 15.36, "elapsed_time": "0:51:57", "remaining_time": "4:46:22"} +{"current_steps": 635, "total_steps": 4102, "loss": 0.3073, "lr": 3.964081586238417e-05, "epoch": 1.083617747440273, "percentage": 15.48, "elapsed_time": "0:52:19", "remaining_time": "4:45:39"} +{"current_steps": 640, "total_steps": 4102, "loss": 0.3055, "lr": 3.962457952322468e-05, "epoch": 1.0921501706484642, "percentage": 15.6, "elapsed_time": "0:52:40", "remaining_time": "4:44:56"} +{"current_steps": 645, "total_steps": 4102, "loss": 0.3148, "lr": 3.9607987756285566e-05, "epoch": 1.1006825938566553, "percentage": 15.72, "elapsed_time": "0:53:05", "remaining_time": "4:44:35"} +{"current_steps": 650, "total_steps": 4102, "loss": 0.2944, "lr": 3.959104086206626e-05, "epoch": 1.1092150170648465, "percentage": 15.85, "elapsed_time": "0:53:29", "remaining_time": "4:44:06"} +{"current_steps": 655, "total_steps": 4102, "loss": 0.3025, "lr": 3.957373914749802e-05, "epoch": 1.1177474402730376, "percentage": 15.97, "elapsed_time": "0:53:58", "remaining_time": "4:44:02"} 
+{"current_steps": 660, "total_steps": 4102, "loss": 0.2982, "lr": 3.955608292593838e-05, "epoch": 1.1262798634812285, "percentage": 16.09, "elapsed_time": "0:54:20", "remaining_time": "4:43:22"} +{"current_steps": 665, "total_steps": 4102, "loss": 0.3188, "lr": 3.9538072517165483e-05, "epoch": 1.13481228668942, "percentage": 16.21, "elapsed_time": "0:54:46", "remaining_time": "4:43:05"} +{"current_steps": 670, "total_steps": 4102, "loss": 0.3111, "lr": 3.95197082473723e-05, "epoch": 1.1433447098976108, "percentage": 16.33, "elapsed_time": "0:55:07", "remaining_time": "4:42:22"} +{"current_steps": 675, "total_steps": 4102, "loss": 0.3166, "lr": 3.950099044916068e-05, "epoch": 1.151877133105802, "percentage": 16.46, "elapsed_time": "0:55:30", "remaining_time": "4:41:50"} +{"current_steps": 680, "total_steps": 4102, "loss": 0.2934, "lr": 3.948191946153537e-05, "epoch": 1.1604095563139931, "percentage": 16.58, "elapsed_time": "0:55:50", "remaining_time": "4:41:02"} +{"current_steps": 685, "total_steps": 4102, "loss": 0.3093, "lr": 3.946249562989783e-05, "epoch": 1.1689419795221843, "percentage": 16.7, "elapsed_time": "0:56:17", "remaining_time": "4:40:45"} +{"current_steps": 690, "total_steps": 4102, "loss": 0.3134, "lr": 3.9442719306040044e-05, "epoch": 1.1774744027303754, "percentage": 16.82, "elapsed_time": "0:56:39", "remaining_time": "4:40:11"} +{"current_steps": 695, "total_steps": 4102, "loss": 0.3191, "lr": 3.942259084813807e-05, "epoch": 1.1860068259385665, "percentage": 16.94, "elapsed_time": "0:57:04", "remaining_time": "4:39:47"} +{"current_steps": 700, "total_steps": 4102, "loss": 0.3087, "lr": 3.940211062074563e-05, "epoch": 1.1945392491467577, "percentage": 17.06, "elapsed_time": "0:57:27", "remaining_time": "4:39:15"} +{"current_steps": 705, "total_steps": 4102, "loss": 0.3118, "lr": 3.938127899478743e-05, "epoch": 1.2030716723549488, "percentage": 17.19, "elapsed_time": "0:57:47", "remaining_time": "4:38:29"} +{"current_steps": 710, "total_steps": 
4102, "loss": 0.3057, "lr": 3.936009634755251e-05, "epoch": 1.21160409556314, "percentage": 17.31, "elapsed_time": "0:58:08", "remaining_time": "4:37:48"} +{"current_steps": 715, "total_steps": 4102, "loss": 0.2925, "lr": 3.933856306268736e-05, "epoch": 1.2201365187713311, "percentage": 17.43, "elapsed_time": "0:58:40", "remaining_time": "4:37:57"} +{"current_steps": 720, "total_steps": 4102, "loss": 0.332, "lr": 3.9316679530189016e-05, "epoch": 1.2286689419795223, "percentage": 17.55, "elapsed_time": "0:59:02", "remaining_time": "4:37:20"} +{"current_steps": 725, "total_steps": 4102, "loss": 0.3019, "lr": 3.9294446146397956e-05, "epoch": 1.2372013651877134, "percentage": 17.67, "elapsed_time": "0:59:31", "remaining_time": "4:37:15"} +{"current_steps": 730, "total_steps": 4102, "loss": 0.319, "lr": 3.927186331399095e-05, "epoch": 1.2457337883959045, "percentage": 17.8, "elapsed_time": "0:59:52", "remaining_time": "4:36:32"} +{"current_steps": 735, "total_steps": 4102, "loss": 0.3161, "lr": 3.924893144197375e-05, "epoch": 1.2542662116040955, "percentage": 17.92, "elapsed_time": "1:00:13", "remaining_time": "4:35:52"} +{"current_steps": 740, "total_steps": 4102, "loss": 0.3235, "lr": 3.922565094567371e-05, "epoch": 1.2627986348122868, "percentage": 18.04, "elapsed_time": "1:00:41", "remaining_time": "4:35:44"} +{"current_steps": 745, "total_steps": 4102, "loss": 0.3053, "lr": 3.9202022246732195e-05, "epoch": 1.2713310580204777, "percentage": 18.16, "elapsed_time": "1:01:08", "remaining_time": "4:35:32"} +{"current_steps": 750, "total_steps": 4102, "loss": 0.3129, "lr": 3.9178045773097054e-05, "epoch": 1.2798634812286689, "percentage": 18.28, "elapsed_time": "1:01:34", "remaining_time": "4:35:13"} +{"current_steps": 755, "total_steps": 4102, "loss": 0.3081, "lr": 3.9153721959014764e-05, "epoch": 1.28839590443686, "percentage": 18.41, "elapsed_time": "1:01:58", "remaining_time": "4:34:44"} +{"current_steps": 760, "total_steps": 4102, "loss": 0.3171, "lr": 
3.9129051245022614e-05, "epoch": 1.2969283276450512, "percentage": 18.53, "elapsed_time": "1:02:20", "remaining_time": "4:34:08"} +{"current_steps": 765, "total_steps": 4102, "loss": 0.3176, "lr": 3.910403407794075e-05, "epoch": 1.3054607508532423, "percentage": 18.65, "elapsed_time": "1:02:42", "remaining_time": "4:33:32"} +{"current_steps": 770, "total_steps": 4102, "loss": 0.3159, "lr": 3.907867091086402e-05, "epoch": 1.3139931740614335, "percentage": 18.77, "elapsed_time": "1:03:03", "remaining_time": "4:32:52"} +{"current_steps": 775, "total_steps": 4102, "loss": 0.3044, "lr": 3.905296220315382e-05, "epoch": 1.3225255972696246, "percentage": 18.89, "elapsed_time": "1:03:28", "remaining_time": "4:32:27"} +{"current_steps": 780, "total_steps": 4102, "loss": 0.3029, "lr": 3.902690842042975e-05, "epoch": 1.3310580204778157, "percentage": 19.02, "elapsed_time": "1:03:50", "remaining_time": "4:31:54"} +{"current_steps": 785, "total_steps": 4102, "loss": 0.3101, "lr": 3.900051003456119e-05, "epoch": 1.3395904436860069, "percentage": 19.14, "elapsed_time": "1:04:14", "remaining_time": "4:31:28"} +{"current_steps": 790, "total_steps": 4102, "loss": 0.3155, "lr": 3.8973767523658745e-05, "epoch": 1.348122866894198, "percentage": 19.26, "elapsed_time": "1:04:35", "remaining_time": "4:30:46"} +{"current_steps": 795, "total_steps": 4102, "loss": 0.3174, "lr": 3.8946681372065604e-05, "epoch": 1.3566552901023892, "percentage": 19.38, "elapsed_time": "1:04:57", "remaining_time": "4:30:10"} +{"current_steps": 800, "total_steps": 4102, "loss": 0.3047, "lr": 3.8919252070348736e-05, "epoch": 1.36518771331058, "percentage": 19.5, "elapsed_time": "1:05:19", "remaining_time": "4:29:36"} +{"current_steps": 805, "total_steps": 4102, "loss": 0.3045, "lr": 3.889148011529005e-05, "epoch": 1.3737201365187715, "percentage": 19.62, "elapsed_time": "1:06:39", "remaining_time": "4:33:00"} +{"current_steps": 810, "total_steps": 4102, "loss": 0.3076, "lr": 3.886336600987735e-05, "epoch": 
1.3822525597269624, "percentage": 19.75, "elapsed_time": "1:07:03", "remaining_time": "4:32:33"} +{"current_steps": 815, "total_steps": 4102, "loss": 0.2982, "lr": 3.8834910263295256e-05, "epoch": 1.3907849829351535, "percentage": 19.87, "elapsed_time": "1:07:26", "remaining_time": "4:32:01"} +{"current_steps": 820, "total_steps": 4102, "loss": 0.3021, "lr": 3.880611339091598e-05, "epoch": 1.3993174061433447, "percentage": 19.99, "elapsed_time": "1:07:50", "remaining_time": "4:31:30"} +{"current_steps": 825, "total_steps": 4102, "loss": 0.3096, "lr": 3.877697591428996e-05, "epoch": 1.4078498293515358, "percentage": 20.11, "elapsed_time": "1:08:10", "remaining_time": "4:30:46"} +{"current_steps": 830, "total_steps": 4102, "loss": 0.2996, "lr": 3.8747498361136484e-05, "epoch": 1.416382252559727, "percentage": 20.23, "elapsed_time": "1:08:31", "remaining_time": "4:30:06"} +{"current_steps": 835, "total_steps": 4102, "loss": 0.31, "lr": 3.8717681265334045e-05, "epoch": 1.424914675767918, "percentage": 20.36, "elapsed_time": "1:08:53", "remaining_time": "4:29:31"} +{"current_steps": 840, "total_steps": 4102, "loss": 0.3136, "lr": 3.868752516691073e-05, "epoch": 1.4334470989761092, "percentage": 20.48, "elapsed_time": "1:09:16", "remaining_time": "4:28:59"} +{"current_steps": 845, "total_steps": 4102, "loss": 0.2986, "lr": 3.865703061203443e-05, "epoch": 1.4419795221843004, "percentage": 20.6, "elapsed_time": "1:09:35", "remaining_time": "4:28:14"} +{"current_steps": 850, "total_steps": 4102, "loss": 0.3053, "lr": 3.8626198153002943e-05, "epoch": 1.4505119453924915, "percentage": 20.72, "elapsed_time": "1:09:59", "remaining_time": "4:27:48"} +{"current_steps": 855, "total_steps": 4102, "loss": 0.3051, "lr": 3.859502834823395e-05, "epoch": 1.4590443686006827, "percentage": 20.84, "elapsed_time": "1:10:19", "remaining_time": "4:27:05"} +{"current_steps": 860, "total_steps": 4102, "loss": 0.2978, "lr": 3.8563521762254946e-05, "epoch": 1.4675767918088738, "percentage": 
20.97, "elapsed_time": "1:10:41", "remaining_time": "4:26:27"} +{"current_steps": 865, "total_steps": 4102, "loss": 0.3035, "lr": 3.853167896569296e-05, "epoch": 1.4761092150170647, "percentage": 21.09, "elapsed_time": "1:11:06", "remaining_time": "4:26:06"} +{"current_steps": 870, "total_steps": 4102, "loss": 0.3066, "lr": 3.8499500535264303e-05, "epoch": 1.484641638225256, "percentage": 21.21, "elapsed_time": "1:11:27", "remaining_time": "4:25:27"} +{"current_steps": 875, "total_steps": 4102, "loss": 0.3197, "lr": 3.8466987053764014e-05, "epoch": 1.493174061433447, "percentage": 21.33, "elapsed_time": "1:11:48", "remaining_time": "4:24:48"} +{"current_steps": 880, "total_steps": 4102, "loss": 0.3043, "lr": 3.8434139110055396e-05, "epoch": 1.5017064846416384, "percentage": 21.45, "elapsed_time": "1:12:09", "remaining_time": "4:24:10"} +{"current_steps": 885, "total_steps": 4102, "loss": 0.3089, "lr": 3.84009572990593e-05, "epoch": 1.5102389078498293, "percentage": 21.57, "elapsed_time": "1:12:31", "remaining_time": "4:23:37"} +{"current_steps": 890, "total_steps": 4102, "loss": 0.2955, "lr": 3.836744222174339e-05, "epoch": 1.5187713310580204, "percentage": 21.7, "elapsed_time": "1:12:55", "remaining_time": "4:23:12"} +{"current_steps": 895, "total_steps": 4102, "loss": 0.2963, "lr": 3.833359448511121e-05, "epoch": 1.5273037542662116, "percentage": 21.82, "elapsed_time": "1:13:16", "remaining_time": "4:22:35"} +{"current_steps": 900, "total_steps": 4102, "loss": 0.3039, "lr": 3.829941470219123e-05, "epoch": 1.5358361774744027, "percentage": 21.94, "elapsed_time": "1:13:39", "remaining_time": "4:22:02"} +{"current_steps": 905, "total_steps": 4102, "loss": 0.2993, "lr": 3.8264903492025706e-05, "epoch": 1.5443686006825939, "percentage": 22.06, "elapsed_time": "1:14:03", "remaining_time": "4:21:35"} +{"current_steps": 910, "total_steps": 4102, "loss": 0.3206, "lr": 3.823006147965953e-05, "epoch": 1.552901023890785, "percentage": 22.18, "elapsed_time": "1:14:26", 
"remaining_time": "4:21:06"} +{"current_steps": 915, "total_steps": 4102, "loss": 0.3093, "lr": 3.819488929612886e-05, "epoch": 1.5614334470989761, "percentage": 22.31, "elapsed_time": "1:14:47", "remaining_time": "4:20:30"} +{"current_steps": 920, "total_steps": 4102, "loss": 0.2967, "lr": 3.815938757844966e-05, "epoch": 1.5699658703071673, "percentage": 22.43, "elapsed_time": "1:15:10", "remaining_time": "4:19:58"} +{"current_steps": 925, "total_steps": 4102, "loss": 0.2885, "lr": 3.812355696960627e-05, "epoch": 1.5784982935153584, "percentage": 22.55, "elapsed_time": "1:15:40", "remaining_time": "4:19:55"} +{"current_steps": 930, "total_steps": 4102, "loss": 0.3256, "lr": 3.808739811853965e-05, "epoch": 1.5870307167235493, "percentage": 22.67, "elapsed_time": "1:16:01", "remaining_time": "4:19:18"} +{"current_steps": 935, "total_steps": 4102, "loss": 0.3053, "lr": 3.8050911680135685e-05, "epoch": 1.5955631399317407, "percentage": 22.79, "elapsed_time": "1:16:21", "remaining_time": "4:18:39"} +{"current_steps": 940, "total_steps": 4102, "loss": 0.2935, "lr": 3.801409831521332e-05, "epoch": 1.6040955631399316, "percentage": 22.92, "elapsed_time": "1:16:41", "remaining_time": "4:17:59"} +{"current_steps": 945, "total_steps": 4102, "loss": 0.3119, "lr": 3.797695869051256e-05, "epoch": 1.612627986348123, "percentage": 23.04, "elapsed_time": "1:17:06", "remaining_time": "4:17:37"} +{"current_steps": 950, "total_steps": 4102, "loss": 0.2988, "lr": 3.7939493478682455e-05, "epoch": 1.621160409556314, "percentage": 23.16, "elapsed_time": "1:17:28", "remaining_time": "4:17:02"} +{"current_steps": 955, "total_steps": 4102, "loss": 0.2875, "lr": 3.790170335826884e-05, "epoch": 1.6296928327645053, "percentage": 23.28, "elapsed_time": "1:17:49", "remaining_time": "4:16:28"} +{"current_steps": 960, "total_steps": 4102, "loss": 0.3148, "lr": 3.786358901370212e-05, "epoch": 1.6382252559726962, "percentage": 23.4, "elapsed_time": "1:18:11", "remaining_time": "4:15:55"} 
+{"current_steps": 965, "total_steps": 4102, "loss": 0.3051, "lr": 3.782515113528481e-05, "epoch": 1.6467576791808873, "percentage": 23.53, "elapsed_time": "1:18:37", "remaining_time": "4:15:34"} +{"current_steps": 970, "total_steps": 4102, "loss": 0.3099, "lr": 3.778639041917907e-05, "epoch": 1.6552901023890785, "percentage": 23.65, "elapsed_time": "1:19:02", "remaining_time": "4:15:12"} +{"current_steps": 975, "total_steps": 4102, "loss": 0.3127, "lr": 3.774730756739411e-05, "epoch": 1.6638225255972696, "percentage": 23.77, "elapsed_time": "1:19:22", "remaining_time": "4:14:33"} +{"current_steps": 980, "total_steps": 4102, "loss": 0.2972, "lr": 3.7707903287773433e-05, "epoch": 1.6723549488054608, "percentage": 23.89, "elapsed_time": "1:19:44", "remaining_time": "4:14:01"} +{"current_steps": 985, "total_steps": 4102, "loss": 0.3031, "lr": 3.766817829398204e-05, "epoch": 1.680887372013652, "percentage": 24.01, "elapsed_time": "1:20:10", "remaining_time": "4:13:41"} +{"current_steps": 990, "total_steps": 4102, "loss": 0.2945, "lr": 3.7628133305493515e-05, "epoch": 1.689419795221843, "percentage": 24.13, "elapsed_time": "1:20:38", "remaining_time": "4:13:28"} +{"current_steps": 995, "total_steps": 4102, "loss": 0.3116, "lr": 3.758776904757695e-05, "epoch": 1.697952218430034, "percentage": 24.26, "elapsed_time": "1:20:58", "remaining_time": "4:12:50"} +{"current_steps": 1000, "total_steps": 4102, "loss": 0.2948, "lr": 3.7547086251283864e-05, "epoch": 1.7064846416382253, "percentage": 24.38, "elapsed_time": "1:21:21", "remaining_time": "4:12:22"} +{"current_steps": 1005, "total_steps": 4102, "loss": 0.2968, "lr": 3.750608565343495e-05, "epoch": 1.7150170648464163, "percentage": 24.5, "elapsed_time": "1:22:44", "remaining_time": "4:14:59"} +{"current_steps": 1010, "total_steps": 4102, "loss": 0.301, "lr": 3.7464767996606684e-05, "epoch": 1.7235494880546076, "percentage": 24.62, "elapsed_time": "1:23:05", "remaining_time": "4:14:22"} +{"current_steps": 1015, 
"total_steps": 4102, "loss": 0.3062, "lr": 3.7423134029117934e-05, "epoch": 1.7320819112627985, "percentage": 24.74, "elapsed_time": "1:23:34", "remaining_time": "4:14:12"} +{"current_steps": 1020, "total_steps": 4102, "loss": 0.2971, "lr": 3.738118450501638e-05, "epoch": 1.74061433447099, "percentage": 24.87, "elapsed_time": "1:23:57", "remaining_time": "4:13:42"} +{"current_steps": 1025, "total_steps": 4102, "loss": 0.3081, "lr": 3.733892018406486e-05, "epoch": 1.7491467576791808, "percentage": 24.99, "elapsed_time": "1:24:22", "remaining_time": "4:13:18"} +{"current_steps": 1030, "total_steps": 4102, "loss": 0.2926, "lr": 3.72963418317276e-05, "epoch": 1.757679180887372, "percentage": 25.11, "elapsed_time": "1:24:44", "remaining_time": "4:12:45"} +{"current_steps": 1035, "total_steps": 4102, "loss": 0.306, "lr": 3.725345021915637e-05, "epoch": 1.766211604095563, "percentage": 25.23, "elapsed_time": "1:25:05", "remaining_time": "4:12:08"} +{"current_steps": 1040, "total_steps": 4102, "loss": 0.3141, "lr": 3.7210246123176525e-05, "epoch": 1.7747440273037542, "percentage": 25.35, "elapsed_time": "1:25:24", "remaining_time": "4:11:26"} +{"current_steps": 1045, "total_steps": 4102, "loss": 0.2957, "lr": 3.716673032627289e-05, "epoch": 1.7832764505119454, "percentage": 25.48, "elapsed_time": "1:25:46", "remaining_time": "4:10:54"} +{"current_steps": 1050, "total_steps": 4102, "loss": 0.3035, "lr": 3.712290361657562e-05, "epoch": 1.7918088737201365, "percentage": 25.6, "elapsed_time": "1:26:07", "remaining_time": "4:10:19"} +{"current_steps": 1055, "total_steps": 4102, "loss": 0.321, "lr": 3.7078766787845946e-05, "epoch": 1.8003412969283277, "percentage": 25.72, "elapsed_time": "1:26:26", "remaining_time": "4:09:40"} +{"current_steps": 1060, "total_steps": 4102, "loss": 0.3072, "lr": 3.703432063946176e-05, "epoch": 1.8088737201365188, "percentage": 25.84, "elapsed_time": "1:26:46", "remaining_time": "4:09:03"} +{"current_steps": 1065, "total_steps": 4102, "loss": 
0.2867, "lr": 3.698956597640314e-05, "epoch": 1.81740614334471, "percentage": 25.96, "elapsed_time": "1:27:05", "remaining_time": "4:08:21"} +{"current_steps": 1070, "total_steps": 4102, "loss": 0.3182, "lr": 3.694450360923782e-05, "epoch": 1.8259385665529009, "percentage": 26.08, "elapsed_time": "1:27:27", "remaining_time": "4:07:49"} +{"current_steps": 1075, "total_steps": 4102, "loss": 0.2998, "lr": 3.6899134354106433e-05, "epoch": 1.8344709897610922, "percentage": 26.21, "elapsed_time": "1:27:49", "remaining_time": "4:07:18"} +{"current_steps": 1080, "total_steps": 4102, "loss": 0.3003, "lr": 3.6853459032707794e-05, "epoch": 1.8430034129692832, "percentage": 26.33, "elapsed_time": "1:28:17", "remaining_time": "4:07:03"} +{"current_steps": 1085, "total_steps": 4102, "loss": 0.3043, "lr": 3.6807478472283985e-05, "epoch": 1.8515358361774745, "percentage": 26.45, "elapsed_time": "1:28:37", "remaining_time": "4:06:26"} +{"current_steps": 1090, "total_steps": 4102, "loss": 0.2947, "lr": 3.676119350560539e-05, "epoch": 1.8600682593856654, "percentage": 26.57, "elapsed_time": "1:28:57", "remaining_time": "4:05:47"} +{"current_steps": 1095, "total_steps": 4102, "loss": 0.3101, "lr": 3.671460497095558e-05, "epoch": 1.8686006825938568, "percentage": 26.69, "elapsed_time": "1:29:18", "remaining_time": "4:05:13"} +{"current_steps": 1100, "total_steps": 4102, "loss": 0.3115, "lr": 3.6667713712116195e-05, "epoch": 1.8771331058020477, "percentage": 26.82, "elapsed_time": "1:29:39", "remaining_time": "4:04:40"} +{"current_steps": 1105, "total_steps": 4102, "loss": 0.3046, "lr": 3.662052057835158e-05, "epoch": 1.8856655290102389, "percentage": 26.94, "elapsed_time": "1:30:00", "remaining_time": "4:04:06"} +{"current_steps": 1110, "total_steps": 4102, "loss": 0.3061, "lr": 3.657302642439347e-05, "epoch": 1.89419795221843, "percentage": 27.06, "elapsed_time": "1:30:22", "remaining_time": "4:03:37"} +{"current_steps": 1115, "total_steps": 4102, "loss": 0.3005, "lr": 
3.652523211042548e-05, "epoch": 1.9027303754266212, "percentage": 27.18, "elapsed_time": "1:30:56", "remaining_time": "4:03:36"} +{"current_steps": 1120, "total_steps": 4102, "loss": 0.3004, "lr": 3.647713850206751e-05, "epoch": 1.9112627986348123, "percentage": 27.3, "elapsed_time": "1:31:18", "remaining_time": "4:03:05"} +{"current_steps": 1125, "total_steps": 4102, "loss": 0.3017, "lr": 3.6428746470360125e-05, "epoch": 1.9197952218430034, "percentage": 27.43, "elapsed_time": "1:31:47", "remaining_time": "4:02:53"} +{"current_steps": 1130, "total_steps": 4102, "loss": 0.3022, "lr": 3.638005689174871e-05, "epoch": 1.9283276450511946, "percentage": 27.55, "elapsed_time": "1:32:08", "remaining_time": "4:02:20"} +{"current_steps": 1135, "total_steps": 4102, "loss": 0.3071, "lr": 3.633107064806764e-05, "epoch": 1.9368600682593855, "percentage": 27.67, "elapsed_time": "1:32:31", "remaining_time": "4:01:50"} +{"current_steps": 1140, "total_steps": 4102, "loss": 0.3005, "lr": 3.6281788626524294e-05, "epoch": 1.9453924914675769, "percentage": 27.79, "elapsed_time": "1:32:57", "remaining_time": "4:01:33"} +{"current_steps": 1145, "total_steps": 4102, "loss": 0.301, "lr": 3.6232211719683e-05, "epoch": 1.9539249146757678, "percentage": 27.91, "elapsed_time": "1:33:18", "remaining_time": "4:00:57"} +{"current_steps": 1150, "total_steps": 4102, "loss": 0.2964, "lr": 3.618234082544885e-05, "epoch": 1.9624573378839592, "percentage": 28.04, "elapsed_time": "1:33:38", "remaining_time": "4:00:22"} +{"current_steps": 1155, "total_steps": 4102, "loss": 0.2953, "lr": 3.613217684705145e-05, "epoch": 1.97098976109215, "percentage": 28.16, "elapsed_time": "1:34:01", "remaining_time": "3:59:53"} +{"current_steps": 1160, "total_steps": 4102, "loss": 0.3132, "lr": 3.608172069302855e-05, "epoch": 1.9795221843003414, "percentage": 28.28, "elapsed_time": "1:34:21", "remaining_time": "3:59:19"} +{"current_steps": 1165, "total_steps": 4102, "loss": 0.307, "lr": 3.603097327720962e-05, "epoch": 
1.9880546075085324, "percentage": 28.4, "elapsed_time": "1:34:51", "remaining_time": "3:59:08"} +{"current_steps": 1170, "total_steps": 4102, "loss": 0.3048, "lr": 3.597993551869924e-05, "epoch": 1.9965870307167235, "percentage": 28.52, "elapsed_time": "1:35:16", "remaining_time": "3:58:45"} +{"current_steps": 1175, "total_steps": 4102, "loss": 0.2658, "lr": 3.592860834186052e-05, "epoch": 2.0051194539249146, "percentage": 28.64, "elapsed_time": "1:35:41", "remaining_time": "3:58:22"} +{"current_steps": 1180, "total_steps": 4102, "loss": 0.2643, "lr": 3.5876992676298326e-05, "epoch": 2.013651877133106, "percentage": 28.77, "elapsed_time": "1:36:06", "remaining_time": "3:58:00"} +{"current_steps": 1185, "total_steps": 4102, "loss": 0.2653, "lr": 3.5825089456842436e-05, "epoch": 2.022184300341297, "percentage": 28.89, "elapsed_time": "1:36:28", "remaining_time": "3:57:30"} +{"current_steps": 1190, "total_steps": 4102, "loss": 0.2654, "lr": 3.577289962353062e-05, "epoch": 2.030716723549488, "percentage": 29.01, "elapsed_time": "1:36:55", "remaining_time": "3:57:10"} +{"current_steps": 1195, "total_steps": 4102, "loss": 0.2745, "lr": 3.572042412159162e-05, "epoch": 2.039249146757679, "percentage": 29.13, "elapsed_time": "1:37:15", "remaining_time": "3:56:35"} +{"current_steps": 1200, "total_steps": 4102, "loss": 0.2692, "lr": 3.5667663901428024e-05, "epoch": 2.04778156996587, "percentage": 29.25, "elapsed_time": "1:37:37", "remaining_time": "3:56:04"} +{"current_steps": 1205, "total_steps": 4102, "loss": 0.2808, "lr": 3.5614619918599054e-05, "epoch": 2.0563139931740615, "percentage": 29.38, "elapsed_time": "1:38:57", "remaining_time": "3:57:54"} +{"current_steps": 1210, "total_steps": 4102, "loss": 0.2669, "lr": 3.556129313380325e-05, "epoch": 2.0648464163822524, "percentage": 29.5, "elapsed_time": "1:39:23", "remaining_time": "3:57:32"} +{"current_steps": 1215, "total_steps": 4102, "loss": 0.2772, "lr": 3.550768451286109e-05, "epoch": 2.073378839590444, "percentage": 
29.62, "elapsed_time": "1:39:46", "remaining_time": "3:57:03"} +{"current_steps": 1220, "total_steps": 4102, "loss": 0.257, "lr": 3.545379502669749e-05, "epoch": 2.0819112627986347, "percentage": 29.74, "elapsed_time": "1:40:08", "remaining_time": "3:56:33"} +{"current_steps": 1225, "total_steps": 4102, "loss": 0.2702, "lr": 3.539962565132421e-05, "epoch": 2.090443686006826, "percentage": 29.86, "elapsed_time": "1:40:28", "remaining_time": "3:55:59"} +{"current_steps": 1230, "total_steps": 4102, "loss": 0.2805, "lr": 3.534517736782217e-05, "epoch": 2.098976109215017, "percentage": 29.99, "elapsed_time": "1:40:52", "remaining_time": "3:55:33"} +{"current_steps": 1235, "total_steps": 4102, "loss": 0.2611, "lr": 3.529045116232373e-05, "epoch": 2.1075085324232083, "percentage": 30.11, "elapsed_time": "1:41:17", "remaining_time": "3:55:09"} +{"current_steps": 1240, "total_steps": 4102, "loss": 0.2768, "lr": 3.523544802599476e-05, "epoch": 2.1160409556313993, "percentage": 30.23, "elapsed_time": "1:41:38", "remaining_time": "3:54:35"} +{"current_steps": 1245, "total_steps": 4102, "loss": 0.2734, "lr": 3.5180168955016744e-05, "epoch": 2.1245733788395906, "percentage": 30.35, "elapsed_time": "1:42:03", "remaining_time": "3:54:12"} +{"current_steps": 1250, "total_steps": 4102, "loss": 0.2701, "lr": 3.51246149505687e-05, "epoch": 2.1331058020477816, "percentage": 30.47, "elapsed_time": "1:42:27", "remaining_time": "3:53:46"} +{"current_steps": 1255, "total_steps": 4102, "loss": 0.2633, "lr": 3.506878701880909e-05, "epoch": 2.1416382252559725, "percentage": 30.59, "elapsed_time": "1:42:48", "remaining_time": "3:53:14"} +{"current_steps": 1260, "total_steps": 4102, "loss": 0.2737, "lr": 3.501268617085754e-05, "epoch": 2.150170648464164, "percentage": 30.72, "elapsed_time": "1:43:17", "remaining_time": "3:52:58"} +{"current_steps": 1265, "total_steps": 4102, "loss": 0.2726, "lr": 3.495631342277659e-05, "epoch": 2.1587030716723548, "percentage": 30.84, "elapsed_time": "1:43:40", 
"remaining_time": "3:52:30"} +{"current_steps": 1270, "total_steps": 4102, "loss": 0.2652, "lr": 3.4899669795553235e-05, "epoch": 2.167235494880546, "percentage": 30.96, "elapsed_time": "1:44:06", "remaining_time": "3:52:08"} +{"current_steps": 1275, "total_steps": 4102, "loss": 0.2713, "lr": 3.484275631508047e-05, "epoch": 2.175767918088737, "percentage": 31.08, "elapsed_time": "1:44:28", "remaining_time": "3:51:39"} +{"current_steps": 1280, "total_steps": 4102, "loss": 0.2866, "lr": 3.478557401213871e-05, "epoch": 2.1843003412969284, "percentage": 31.2, "elapsed_time": "1:44:49", "remaining_time": "3:51:06"} +{"current_steps": 1285, "total_steps": 4102, "loss": 0.2661, "lr": 3.472812392237708e-05, "epoch": 2.1928327645051193, "percentage": 31.33, "elapsed_time": "1:45:11", "remaining_time": "3:50:36"} +{"current_steps": 1290, "total_steps": 4102, "loss": 0.2677, "lr": 3.467040708629472e-05, "epoch": 2.2013651877133107, "percentage": 31.45, "elapsed_time": "1:45:32", "remaining_time": "3:50:02"} +{"current_steps": 1295, "total_steps": 4102, "loss": 0.277, "lr": 3.461242454922189e-05, "epoch": 2.2098976109215016, "percentage": 31.57, "elapsed_time": "1:45:55", "remaining_time": "3:49:36"} +{"current_steps": 1300, "total_steps": 4102, "loss": 0.262, "lr": 3.4554177361301056e-05, "epoch": 2.218430034129693, "percentage": 31.69, "elapsed_time": "1:46:14", "remaining_time": "3:49:00"} +{"current_steps": 1305, "total_steps": 4102, "loss": 0.2733, "lr": 3.449566657746788e-05, "epoch": 2.226962457337884, "percentage": 31.81, "elapsed_time": "1:46:37", "remaining_time": "3:48:32"} +{"current_steps": 1310, "total_steps": 4102, "loss": 0.2711, "lr": 3.443689325743209e-05, "epoch": 2.2354948805460753, "percentage": 31.94, "elapsed_time": "1:47:01", "remaining_time": "3:48:06"} +{"current_steps": 1315, "total_steps": 4102, "loss": 0.2734, "lr": 3.437785846565833e-05, "epoch": 2.244027303754266, "percentage": 32.06, "elapsed_time": "1:47:24", "remaining_time": "3:47:38"} 
+{"current_steps": 1320, "total_steps": 4102, "loss": 0.2565, "lr": 3.43185632713468e-05, "epoch": 2.252559726962457, "percentage": 32.18, "elapsed_time": "1:47:45", "remaining_time": "3:47:06"} +{"current_steps": 1325, "total_steps": 4102, "loss": 0.2522, "lr": 3.425900874841399e-05, "epoch": 2.2610921501706485, "percentage": 32.3, "elapsed_time": "1:48:05", "remaining_time": "3:46:32"} +{"current_steps": 1330, "total_steps": 4102, "loss": 0.2752, "lr": 3.419919597547318e-05, "epoch": 2.26962457337884, "percentage": 32.42, "elapsed_time": "1:48:25", "remaining_time": "3:45:58"} +{"current_steps": 1335, "total_steps": 4102, "loss": 0.2631, "lr": 3.413912603581487e-05, "epoch": 2.2781569965870307, "percentage": 32.55, "elapsed_time": "1:48:45", "remaining_time": "3:45:25"} +{"current_steps": 1340, "total_steps": 4102, "loss": 0.2796, "lr": 3.4078800017387245e-05, "epoch": 2.2866894197952217, "percentage": 32.67, "elapsed_time": "1:49:10", "remaining_time": "3:45:01"} +{"current_steps": 1345, "total_steps": 4102, "loss": 0.26, "lr": 3.401821901277639e-05, "epoch": 2.295221843003413, "percentage": 32.79, "elapsed_time": "1:49:34", "remaining_time": "3:44:37"} +{"current_steps": 1350, "total_steps": 4102, "loss": 0.2666, "lr": 3.395738411918657e-05, "epoch": 2.303754266211604, "percentage": 32.91, "elapsed_time": "1:49:57", "remaining_time": "3:44:08"} +{"current_steps": 1355, "total_steps": 4102, "loss": 0.2695, "lr": 3.389629643842029e-05, "epoch": 2.3122866894197953, "percentage": 33.03, "elapsed_time": "1:50:22", "remaining_time": "3:43:46"} +{"current_steps": 1360, "total_steps": 4102, "loss": 0.2707, "lr": 3.383495707685838e-05, "epoch": 2.3208191126279862, "percentage": 33.15, "elapsed_time": "1:50:43", "remaining_time": "3:43:15"} +{"current_steps": 1365, "total_steps": 4102, "loss": 0.2703, "lr": 3.3773367145439976e-05, "epoch": 2.3293515358361776, "percentage": 33.28, "elapsed_time": "1:51:03", "remaining_time": "3:42:41"} +{"current_steps": 1370, 
"total_steps": 4102, "loss": 0.2702, "lr": 3.371152775964235e-05, "epoch": 2.3378839590443685, "percentage": 33.4, "elapsed_time": "1:51:34", "remaining_time": "3:42:29"} +{"current_steps": 1375, "total_steps": 4102, "loss": 0.2681, "lr": 3.364944003946073e-05, "epoch": 2.34641638225256, "percentage": 33.52, "elapsed_time": "1:51:52", "remaining_time": "3:41:52"} +{"current_steps": 1380, "total_steps": 4102, "loss": 0.2628, "lr": 3.358710510938804e-05, "epoch": 2.354948805460751, "percentage": 33.64, "elapsed_time": "1:52:12", "remaining_time": "3:41:19"} +{"current_steps": 1385, "total_steps": 4102, "loss": 0.2722, "lr": 3.3524524098394484e-05, "epoch": 2.363481228668942, "percentage": 33.76, "elapsed_time": "1:52:33", "remaining_time": "3:40:47"} +{"current_steps": 1390, "total_steps": 4102, "loss": 0.2622, "lr": 3.346169813990715e-05, "epoch": 2.372013651877133, "percentage": 33.89, "elapsed_time": "1:53:01", "remaining_time": "3:40:31"} +{"current_steps": 1395, "total_steps": 4102, "loss": 0.2683, "lr": 3.339862837178944e-05, "epoch": 2.3805460750853245, "percentage": 34.01, "elapsed_time": "1:53:29", "remaining_time": "3:40:14"} +{"current_steps": 1400, "total_steps": 4102, "loss": 0.2719, "lr": 3.333531593632047e-05, "epoch": 2.3890784982935154, "percentage": 34.13, "elapsed_time": "1:53:51", "remaining_time": "3:39:44"} +{"current_steps": 1405, "total_steps": 4102, "loss": 0.2685, "lr": 3.327176198017444e-05, "epoch": 2.3976109215017063, "percentage": 34.25, "elapsed_time": "1:55:15", "remaining_time": "3:41:14"} +{"current_steps": 1410, "total_steps": 4102, "loss": 0.2807, "lr": 3.320796765439975e-05, "epoch": 2.4061433447098977, "percentage": 34.37, "elapsed_time": "1:55:34", "remaining_time": "3:40:39"} +{"current_steps": 1415, "total_steps": 4102, "loss": 0.2707, "lr": 3.314393411439828e-05, "epoch": 2.4146757679180886, "percentage": 34.5, "elapsed_time": "1:55:54", "remaining_time": "3:40:06"} +{"current_steps": 1420, "total_steps": 4102, "loss": 
0.2803, "lr": 3.3079662519904355e-05, "epoch": 2.42320819112628, "percentage": 34.62, "elapsed_time": "1:56:12", "remaining_time": "3:39:28"} +{"current_steps": 1425, "total_steps": 4102, "loss": 0.2616, "lr": 3.301515403496383e-05, "epoch": 2.431740614334471, "percentage": 34.74, "elapsed_time": "1:56:38", "remaining_time": "3:39:06"} +{"current_steps": 1430, "total_steps": 4102, "loss": 0.2636, "lr": 3.295040982791295e-05, "epoch": 2.4402730375426622, "percentage": 34.86, "elapsed_time": "1:57:04", "remaining_time": "3:38:45"} +{"current_steps": 1435, "total_steps": 4102, "loss": 0.2626, "lr": 3.288543107135719e-05, "epoch": 2.448805460750853, "percentage": 34.98, "elapsed_time": "1:57:28", "remaining_time": "3:38:19"} +{"current_steps": 1440, "total_steps": 4102, "loss": 0.2684, "lr": 3.282021894215008e-05, "epoch": 2.4573378839590445, "percentage": 35.1, "elapsed_time": "1:57:50", "remaining_time": "3:37:50"} +{"current_steps": 1445, "total_steps": 4102, "loss": 0.263, "lr": 3.27547746213718e-05, "epoch": 2.4658703071672354, "percentage": 35.23, "elapsed_time": "1:58:09", "remaining_time": "3:37:16"} +{"current_steps": 1450, "total_steps": 4102, "loss": 0.2748, "lr": 3.268909929430786e-05, "epoch": 2.474402730375427, "percentage": 35.35, "elapsed_time": "1:58:29", "remaining_time": "3:36:42"} +{"current_steps": 1455, "total_steps": 4102, "loss": 0.2736, "lr": 3.26231941504276e-05, "epoch": 2.4829351535836177, "percentage": 35.47, "elapsed_time": "1:58:50", "remaining_time": "3:36:12"} +{"current_steps": 1460, "total_steps": 4102, "loss": 0.2724, "lr": 3.2557060383362664e-05, "epoch": 2.491467576791809, "percentage": 35.59, "elapsed_time": "1:59:14", "remaining_time": "3:35:46"} +{"current_steps": 1465, "total_steps": 4102, "loss": 0.2792, "lr": 3.249069919088536e-05, "epoch": 2.5, "percentage": 35.71, "elapsed_time": "1:59:35", "remaining_time": "3:35:15"} +{"current_steps": 1470, "total_steps": 4102, "loss": 0.271, "lr": 3.242411177488697e-05, "epoch": 
2.508532423208191, "percentage": 35.84, "elapsed_time": "2:00:01", "remaining_time": "3:34:54"} +{"current_steps": 1475, "total_steps": 4102, "loss": 0.2711, "lr": 3.235729934135601e-05, "epoch": 2.5170648464163823, "percentage": 35.96, "elapsed_time": "2:00:23", "remaining_time": "3:34:24"} +{"current_steps": 1480, "total_steps": 4102, "loss": 0.2645, "lr": 3.229026310035638e-05, "epoch": 2.5255972696245736, "percentage": 36.08, "elapsed_time": "2:00:42", "remaining_time": "3:33:51"} +{"current_steps": 1485, "total_steps": 4102, "loss": 0.2745, "lr": 3.2223004266005395e-05, "epoch": 2.5341296928327646, "percentage": 36.2, "elapsed_time": "2:01:04", "remaining_time": "3:33:21"} +{"current_steps": 1490, "total_steps": 4102, "loss": 0.2718, "lr": 3.215552405645188e-05, "epoch": 2.5426621160409555, "percentage": 36.32, "elapsed_time": "2:01:24", "remaining_time": "3:32:49"} +{"current_steps": 1495, "total_steps": 4102, "loss": 0.271, "lr": 3.208782369385404e-05, "epoch": 2.551194539249147, "percentage": 36.45, "elapsed_time": "2:01:47", "remaining_time": "3:32:22"} +{"current_steps": 1500, "total_steps": 4102, "loss": 0.2672, "lr": 3.201990440435737e-05, "epoch": 2.5597269624573378, "percentage": 36.57, "elapsed_time": "2:02:08", "remaining_time": "3:31:51"} +{"current_steps": 1505, "total_steps": 4102, "loss": 0.2744, "lr": 3.19517674180724e-05, "epoch": 2.568259385665529, "percentage": 36.69, "elapsed_time": "2:02:27", "remaining_time": "3:31:19"} +{"current_steps": 1510, "total_steps": 4102, "loss": 0.2621, "lr": 3.188341396905248e-05, "epoch": 2.57679180887372, "percentage": 36.81, "elapsed_time": "2:02:50", "remaining_time": "3:30:51"} +{"current_steps": 1515, "total_steps": 4102, "loss": 0.2776, "lr": 3.1814845295271364e-05, "epoch": 2.5853242320819114, "percentage": 36.93, "elapsed_time": "2:03:09", "remaining_time": "3:30:18"} +{"current_steps": 1520, "total_steps": 4102, "loss": 0.2687, "lr": 3.174606263860083e-05, "epoch": 2.5938566552901023, "percentage": 
37.06, "elapsed_time": "2:03:28", "remaining_time": "3:29:44"} +{"current_steps": 1525, "total_steps": 4102, "loss": 0.2736, "lr": 3.167706724478818e-05, "epoch": 2.6023890784982937, "percentage": 37.18, "elapsed_time": "2:03:50", "remaining_time": "3:29:15"} +{"current_steps": 1530, "total_steps": 4102, "loss": 0.2775, "lr": 3.1607860363433686e-05, "epoch": 2.6109215017064846, "percentage": 37.3, "elapsed_time": "2:04:15", "remaining_time": "3:28:52"} +{"current_steps": 1535, "total_steps": 4102, "loss": 0.2631, "lr": 3.1538443247967906e-05, "epoch": 2.6194539249146755, "percentage": 37.42, "elapsed_time": "2:04:35", "remaining_time": "3:28:20"} +{"current_steps": 1540, "total_steps": 4102, "loss": 0.2743, "lr": 3.146881715562906e-05, "epoch": 2.627986348122867, "percentage": 37.54, "elapsed_time": "2:04:56", "remaining_time": "3:27:51"} +{"current_steps": 1545, "total_steps": 4102, "loss": 0.2568, "lr": 3.139898334744023e-05, "epoch": 2.6365187713310583, "percentage": 37.66, "elapsed_time": "2:05:17", "remaining_time": "3:27:21"} +{"current_steps": 1550, "total_steps": 4102, "loss": 0.2768, "lr": 3.1328943088186465e-05, "epoch": 2.645051194539249, "percentage": 37.79, "elapsed_time": "2:05:37", "remaining_time": "3:26:49"} +{"current_steps": 1555, "total_steps": 4102, "loss": 0.2587, "lr": 3.1258697646391975e-05, "epoch": 2.65358361774744, "percentage": 37.91, "elapsed_time": "2:06:05", "remaining_time": "3:26:31"} +{"current_steps": 1560, "total_steps": 4102, "loss": 0.2688, "lr": 3.118824829429708e-05, "epoch": 2.6621160409556315, "percentage": 38.03, "elapsed_time": "2:06:25", "remaining_time": "3:26:00"} +{"current_steps": 1565, "total_steps": 4102, "loss": 0.2731, "lr": 3.111759630783519e-05, "epoch": 2.6706484641638224, "percentage": 38.15, "elapsed_time": "2:06:45", "remaining_time": "3:25:29"} +{"current_steps": 1570, "total_steps": 4102, "loss": 0.259, "lr": 3.104674296660972e-05, "epoch": 2.6791808873720138, "percentage": 38.27, "elapsed_time": 
"2:07:10", "remaining_time": "3:25:05"} +{"current_steps": 1575, "total_steps": 4102, "loss": 0.2754, "lr": 3.097568955387086e-05, "epoch": 2.6877133105802047, "percentage": 38.4, "elapsed_time": "2:07:36", "remaining_time": "3:24:44"} +{"current_steps": 1580, "total_steps": 4102, "loss": 0.2749, "lr": 3.0904437356492386e-05, "epoch": 2.696245733788396, "percentage": 38.52, "elapsed_time": "2:07:58", "remaining_time": "3:24:16"} +{"current_steps": 1585, "total_steps": 4102, "loss": 0.2755, "lr": 3.083298766494834e-05, "epoch": 2.704778156996587, "percentage": 38.64, "elapsed_time": "2:08:24", "remaining_time": "3:23:54"} +{"current_steps": 1590, "total_steps": 4102, "loss": 0.2709, "lr": 3.076134177328965e-05, "epoch": 2.7133105802047783, "percentage": 38.76, "elapsed_time": "2:08:44", "remaining_time": "3:23:22"} +{"current_steps": 1595, "total_steps": 4102, "loss": 0.2779, "lr": 3.068950097912067e-05, "epoch": 2.7218430034129693, "percentage": 38.88, "elapsed_time": "2:09:01", "remaining_time": "3:22:48"} +{"current_steps": 1600, "total_steps": 4102, "loss": 0.2649, "lr": 3.061746658357573e-05, "epoch": 2.73037542662116, "percentage": 39.01, "elapsed_time": "2:09:18", "remaining_time": "3:22:12"} +{"current_steps": 1605, "total_steps": 4102, "loss": 0.272, "lr": 3.054523989129555e-05, "epoch": 2.7389078498293515, "percentage": 39.13, "elapsed_time": "2:10:36", "remaining_time": "3:23:12"} +{"current_steps": 1610, "total_steps": 4102, "loss": 0.2697, "lr": 3.047282221040356e-05, "epoch": 2.747440273037543, "percentage": 39.25, "elapsed_time": "2:10:59", "remaining_time": "3:22:45"} +{"current_steps": 1615, "total_steps": 4102, "loss": 0.274, "lr": 3.0400214852482306e-05, "epoch": 2.755972696245734, "percentage": 39.37, "elapsed_time": "2:11:18", "remaining_time": "3:22:13"} +{"current_steps": 1620, "total_steps": 4102, "loss": 0.2565, "lr": 3.0327419132549613e-05, "epoch": 2.7645051194539247, "percentage": 39.49, "elapsed_time": "2:11:41", "remaining_time": 
"3:21:46"} +{"current_steps": 1625, "total_steps": 4102, "loss": 0.2698, "lr": 3.0254436369034804e-05, "epoch": 2.773037542662116, "percentage": 39.61, "elapsed_time": "2:12:06", "remaining_time": "3:21:22"} +{"current_steps": 1630, "total_steps": 4102, "loss": 0.2716, "lr": 3.0181267883754812e-05, "epoch": 2.781569965870307, "percentage": 39.74, "elapsed_time": "2:12:28", "remaining_time": "3:20:54"} +{"current_steps": 1635, "total_steps": 4102, "loss": 0.2711, "lr": 3.0107915001890254e-05, "epoch": 2.7901023890784984, "percentage": 39.86, "elapsed_time": "2:12:51", "remaining_time": "3:20:28"} +{"current_steps": 1640, "total_steps": 4102, "loss": 0.266, "lr": 3.0034379051961413e-05, "epoch": 2.7986348122866893, "percentage": 39.98, "elapsed_time": "2:13:16", "remaining_time": "3:20:04"} +{"current_steps": 1645, "total_steps": 4102, "loss": 0.2681, "lr": 2.9960661365804168e-05, "epoch": 2.8071672354948807, "percentage": 40.1, "elapsed_time": "2:13:44", "remaining_time": "3:19:45"} +{"current_steps": 1650, "total_steps": 4102, "loss": 0.2791, "lr": 2.988676327854592e-05, "epoch": 2.8156996587030716, "percentage": 40.22, "elapsed_time": "2:14:11", "remaining_time": "3:19:24"} +{"current_steps": 1655, "total_steps": 4102, "loss": 0.2684, "lr": 2.981268612858135e-05, "epoch": 2.824232081911263, "percentage": 40.35, "elapsed_time": "2:14:33", "remaining_time": "3:18:56"} +{"current_steps": 1660, "total_steps": 4102, "loss": 0.2661, "lr": 2.973843125754823e-05, "epoch": 2.832764505119454, "percentage": 40.47, "elapsed_time": "2:14:55", "remaining_time": "3:18:29"} +{"current_steps": 1665, "total_steps": 4102, "loss": 0.2605, "lr": 2.9664000010303078e-05, "epoch": 2.841296928327645, "percentage": 40.59, "elapsed_time": "2:15:22", "remaining_time": "3:18:09"} +{"current_steps": 1670, "total_steps": 4102, "loss": 0.2633, "lr": 2.9589393734896843e-05, "epoch": 2.849829351535836, "percentage": 40.71, "elapsed_time": "2:15:50", "remaining_time": "3:17:50"} +{"current_steps": 
1675, "total_steps": 4102, "loss": 0.278, "lr": 2.9514613782550473e-05, "epoch": 2.8583617747440275, "percentage": 40.83, "elapsed_time": "2:16:13", "remaining_time": "3:17:23"} +{"current_steps": 1680, "total_steps": 4102, "loss": 0.2662, "lr": 2.9439661507630425e-05, "epoch": 2.8668941979522184, "percentage": 40.96, "elapsed_time": "2:16:35", "remaining_time": "3:16:55"} +{"current_steps": 1685, "total_steps": 4102, "loss": 0.274, "lr": 2.9364538267624163e-05, "epoch": 2.8754266211604094, "percentage": 41.08, "elapsed_time": "2:16:55", "remaining_time": "3:16:24"} +{"current_steps": 1690, "total_steps": 4102, "loss": 0.2664, "lr": 2.9289245423115563e-05, "epoch": 2.8839590443686007, "percentage": 41.2, "elapsed_time": "2:17:17", "remaining_time": "3:15:56"} +{"current_steps": 1695, "total_steps": 4102, "loss": 0.2634, "lr": 2.9213784337760257e-05, "epoch": 2.8924914675767917, "percentage": 41.32, "elapsed_time": "2:17:44", "remaining_time": "3:15:36"} +{"current_steps": 1700, "total_steps": 4102, "loss": 0.2694, "lr": 2.9138156378260968e-05, "epoch": 2.901023890784983, "percentage": 41.44, "elapsed_time": "2:18:06", "remaining_time": "3:15:08"} +{"current_steps": 1705, "total_steps": 4102, "loss": 0.2545, "lr": 2.9062362914342706e-05, "epoch": 2.909556313993174, "percentage": 41.57, "elapsed_time": "2:18:29", "remaining_time": "3:14:41"} +{"current_steps": 1710, "total_steps": 4102, "loss": 0.2629, "lr": 2.8986405318728023e-05, "epoch": 2.9180887372013653, "percentage": 41.69, "elapsed_time": "2:18:55", "remaining_time": "3:14:20"} +{"current_steps": 1715, "total_steps": 4102, "loss": 0.2673, "lr": 2.89102849671121e-05, "epoch": 2.926621160409556, "percentage": 41.81, "elapsed_time": "2:19:17", "remaining_time": "3:13:52"} +{"current_steps": 1720, "total_steps": 4102, "loss": 0.276, "lr": 2.883400323813785e-05, "epoch": 2.9351535836177476, "percentage": 41.93, "elapsed_time": "2:19:38", "remaining_time": "3:13:23"} +{"current_steps": 1725, "total_steps": 4102, 
"loss": 0.2672, "lr": 2.8757561513370952e-05, "epoch": 2.9436860068259385, "percentage": 42.05, "elapsed_time": "2:19:58", "remaining_time": "3:12:53"} +{"current_steps": 1730, "total_steps": 4102, "loss": 0.2551, "lr": 2.868096117727484e-05, "epoch": 2.9522184300341294, "percentage": 42.17, "elapsed_time": "2:20:21", "remaining_time": "3:12:27"} +{"current_steps": 1735, "total_steps": 4102, "loss": 0.2542, "lr": 2.8604203617185584e-05, "epoch": 2.960750853242321, "percentage": 42.3, "elapsed_time": "2:20:53", "remaining_time": "3:12:13"} +{"current_steps": 1740, "total_steps": 4102, "loss": 0.2741, "lr": 2.8527290223286823e-05, "epoch": 2.969283276450512, "percentage": 42.42, "elapsed_time": "2:21:17", "remaining_time": "3:11:47"} +{"current_steps": 1745, "total_steps": 4102, "loss": 0.2576, "lr": 2.8450222388584544e-05, "epoch": 2.977815699658703, "percentage": 42.54, "elapsed_time": "2:21:41", "remaining_time": "3:11:22"} +{"current_steps": 1750, "total_steps": 4102, "loss": 0.2712, "lr": 2.8373001508881867e-05, "epoch": 2.986348122866894, "percentage": 42.66, "elapsed_time": "2:22:03", "remaining_time": "3:10:55"} +{"current_steps": 1755, "total_steps": 4102, "loss": 0.266, "lr": 2.8295628982753762e-05, "epoch": 2.9948805460750854, "percentage": 42.78, "elapsed_time": "2:22:25", "remaining_time": "3:10:28"} +{"current_steps": 1760, "total_steps": 4102, "loss": 0.2448, "lr": 2.8218106211521735e-05, "epoch": 3.0034129692832763, "percentage": 42.91, "elapsed_time": "2:22:51", "remaining_time": "3:10:05"} +{"current_steps": 1765, "total_steps": 4102, "loss": 0.2387, "lr": 2.8140434599228436e-05, "epoch": 3.0119453924914676, "percentage": 43.03, "elapsed_time": "2:23:12", "remaining_time": "3:09:37"} +{"current_steps": 1770, "total_steps": 4102, "loss": 0.2409, "lr": 2.806261555261219e-05, "epoch": 3.0204778156996586, "percentage": 43.15, "elapsed_time": "2:23:29", "remaining_time": "3:09:03"} +{"current_steps": 1775, "total_steps": 4102, "loss": 0.2198, "lr": 
2.7984650481081615e-05, "epoch": 3.02901023890785, "percentage": 43.27, "elapsed_time": "2:23:56", "remaining_time": "3:08:42"} +{"current_steps": 1780, "total_steps": 4102, "loss": 0.2325, "lr": 2.7906540796689995e-05, "epoch": 3.037542662116041, "percentage": 43.39, "elapsed_time": "2:24:18", "remaining_time": "3:08:15"} +{"current_steps": 1785, "total_steps": 4102, "loss": 0.2415, "lr": 2.7828287914109768e-05, "epoch": 3.046075085324232, "percentage": 43.52, "elapsed_time": "2:24:42", "remaining_time": "3:07:50"} +{"current_steps": 1790, "total_steps": 4102, "loss": 0.2402, "lr": 2.774989325060689e-05, "epoch": 3.054607508532423, "percentage": 43.64, "elapsed_time": "2:25:05", "remaining_time": "3:07:23"} +{"current_steps": 1795, "total_steps": 4102, "loss": 0.2452, "lr": 2.767135822601514e-05, "epoch": 3.0631399317406145, "percentage": 43.76, "elapsed_time": "2:25:30", "remaining_time": "3:07:01"} +{"current_steps": 1800, "total_steps": 4102, "loss": 0.2357, "lr": 2.759268426271045e-05, "epoch": 3.0716723549488054, "percentage": 43.88, "elapsed_time": "2:25:52", "remaining_time": "3:06:33"} +{"current_steps": 1805, "total_steps": 4102, "loss": 0.2338, "lr": 2.751387278558511e-05, "epoch": 3.080204778156997, "percentage": 44.0, "elapsed_time": "2:27:20", "remaining_time": "3:07:29"} +{"current_steps": 1810, "total_steps": 4102, "loss": 0.2295, "lr": 2.7434925222021968e-05, "epoch": 3.0887372013651877, "percentage": 44.12, "elapsed_time": "2:27:41", "remaining_time": "3:07:01"} +{"current_steps": 1815, "total_steps": 4102, "loss": 0.242, "lr": 2.7355843001868603e-05, "epoch": 3.0972696245733786, "percentage": 44.25, "elapsed_time": "2:28:02", "remaining_time": "3:06:32"} +{"current_steps": 1820, "total_steps": 4102, "loss": 0.2363, "lr": 2.7276627557411376e-05, "epoch": 3.10580204778157, "percentage": 44.37, "elapsed_time": "2:28:24", "remaining_time": "3:06:04"} +{"current_steps": 1825, "total_steps": 4102, "loss": 0.2289, "lr": 2.7197280323349545e-05, "epoch": 
3.114334470989761, "percentage": 44.49, "elapsed_time": "2:28:44", "remaining_time": "3:05:34"} +{"current_steps": 1830, "total_steps": 4102, "loss": 0.2416, "lr": 2.711780273676925e-05, "epoch": 3.1228668941979523, "percentage": 44.61, "elapsed_time": "2:29:04", "remaining_time": "3:05:04"} +{"current_steps": 1835, "total_steps": 4102, "loss": 0.2379, "lr": 2.7038196237117492e-05, "epoch": 3.131399317406143, "percentage": 44.73, "elapsed_time": "2:29:32", "remaining_time": "3:04:44"} +{"current_steps": 1840, "total_steps": 4102, "loss": 0.2364, "lr": 2.695846226617606e-05, "epoch": 3.1399317406143346, "percentage": 44.86, "elapsed_time": "2:29:53", "remaining_time": "3:04:15"} +{"current_steps": 1845, "total_steps": 4102, "loss": 0.2428, "lr": 2.687860226803542e-05, "epoch": 3.1484641638225255, "percentage": 44.98, "elapsed_time": "2:30:16", "remaining_time": "3:03:49"} +{"current_steps": 1850, "total_steps": 4102, "loss": 0.2431, "lr": 2.6798617689068578e-05, "epoch": 3.156996587030717, "percentage": 45.1, "elapsed_time": "2:30:40", "remaining_time": "3:03:24"} +{"current_steps": 1855, "total_steps": 4102, "loss": 0.2422, "lr": 2.6718509977904833e-05, "epoch": 3.1655290102389078, "percentage": 45.22, "elapsed_time": "2:31:00", "remaining_time": "3:02:55"} +{"current_steps": 1860, "total_steps": 4102, "loss": 0.2427, "lr": 2.6638280585403617e-05, "epoch": 3.174061433447099, "percentage": 45.34, "elapsed_time": "2:31:24", "remaining_time": "3:02:29"} +{"current_steps": 1865, "total_steps": 4102, "loss": 0.2335, "lr": 2.6557930964628148e-05, "epoch": 3.18259385665529, "percentage": 45.47, "elapsed_time": "2:31:44", "remaining_time": "3:02:01"} +{"current_steps": 1870, "total_steps": 4102, "loss": 0.231, "lr": 2.6477462570819153e-05, "epoch": 3.1911262798634814, "percentage": 45.59, "elapsed_time": "2:32:12", "remaining_time": "3:01:40"} +{"current_steps": 1875, "total_steps": 4102, "loss": 0.2346, "lr": 2.639687686136849e-05, "epoch": 3.1996587030716723, 
"percentage": 45.71, "elapsed_time": "2:32:32", "remaining_time": "3:01:10"} +{"current_steps": 1880, "total_steps": 4102, "loss": 0.225, "lr": 2.631617529579277e-05, "epoch": 3.2081911262798632, "percentage": 45.83, "elapsed_time": "2:32:52", "remaining_time": "3:00:40"} +{"current_steps": 1885, "total_steps": 4102, "loss": 0.2505, "lr": 2.6235359335706924e-05, "epoch": 3.2167235494880546, "percentage": 45.95, "elapsed_time": "2:33:15", "remaining_time": "3:00:14"} +{"current_steps": 1890, "total_steps": 4102, "loss": 0.245, "lr": 2.6154430444797702e-05, "epoch": 3.2252559726962455, "percentage": 46.08, "elapsed_time": "2:33:38", "remaining_time": "2:59:49"} +{"current_steps": 1895, "total_steps": 4102, "loss": 0.2441, "lr": 2.6073390088797208e-05, "epoch": 3.233788395904437, "percentage": 46.2, "elapsed_time": "2:34:00", "remaining_time": "2:59:22"} +{"current_steps": 1900, "total_steps": 4102, "loss": 0.2405, "lr": 2.5992239735456314e-05, "epoch": 3.242320819112628, "percentage": 46.32, "elapsed_time": "2:34:20", "remaining_time": "2:58:52"} +{"current_steps": 1905, "total_steps": 4102, "loss": 0.2389, "lr": 2.5910980854518088e-05, "epoch": 3.250853242320819, "percentage": 46.44, "elapsed_time": "2:34:42", "remaining_time": "2:58:25"} +{"current_steps": 1910, "total_steps": 4102, "loss": 0.2352, "lr": 2.5829614917691195e-05, "epoch": 3.25938566552901, "percentage": 46.56, "elapsed_time": "2:35:03", "remaining_time": "2:57:57"} +{"current_steps": 1915, "total_steps": 4102, "loss": 0.2364, "lr": 2.5748143398623232e-05, "epoch": 3.2679180887372015, "percentage": 46.68, "elapsed_time": "2:35:23", "remaining_time": "2:57:27"} +{"current_steps": 1920, "total_steps": 4102, "loss": 0.2353, "lr": 2.5666567772874012e-05, "epoch": 3.2764505119453924, "percentage": 46.81, "elapsed_time": "2:35:50", "remaining_time": "2:57:06"} +{"current_steps": 1925, "total_steps": 4102, "loss": 0.2441, "lr": 2.558488951788888e-05, "epoch": 3.2849829351535837, "percentage": 46.93, 
"elapsed_time": "2:36:16", "remaining_time": "2:56:44"} +{"current_steps": 1930, "total_steps": 4102, "loss": 0.2606, "lr": 2.5503110112971925e-05, "epoch": 3.2935153583617747, "percentage": 47.05, "elapsed_time": "2:36:38", "remaining_time": "2:56:16"} +{"current_steps": 1935, "total_steps": 4102, "loss": 0.245, "lr": 2.5421231039259203e-05, "epoch": 3.302047781569966, "percentage": 47.17, "elapsed_time": "2:37:05", "remaining_time": "2:55:55"} +{"current_steps": 1940, "total_steps": 4102, "loss": 0.2301, "lr": 2.5339253779691918e-05, "epoch": 3.310580204778157, "percentage": 47.29, "elapsed_time": "2:37:25", "remaining_time": "2:55:25"} +{"current_steps": 1945, "total_steps": 4102, "loss": 0.2522, "lr": 2.5257179818989518e-05, "epoch": 3.319112627986348, "percentage": 47.42, "elapsed_time": "2:37:44", "remaining_time": "2:54:56"} +{"current_steps": 1950, "total_steps": 4102, "loss": 0.2464, "lr": 2.5175010643622887e-05, "epoch": 3.3276450511945392, "percentage": 47.54, "elapsed_time": "2:38:07", "remaining_time": "2:54:30"} +{"current_steps": 1955, "total_steps": 4102, "loss": 0.2407, "lr": 2.5092747741787338e-05, "epoch": 3.3361774744027306, "percentage": 47.66, "elapsed_time": "2:38:27", "remaining_time": "2:54:01"} +{"current_steps": 1960, "total_steps": 4102, "loss": 0.2303, "lr": 2.5010392603375722e-05, "epoch": 3.3447098976109215, "percentage": 47.78, "elapsed_time": "2:38:48", "remaining_time": "2:53:33"} +{"current_steps": 1965, "total_steps": 4102, "loss": 0.2333, "lr": 2.4927946719951406e-05, "epoch": 3.3532423208191124, "percentage": 47.9, "elapsed_time": "2:39:11", "remaining_time": "2:53:07"} +{"current_steps": 1970, "total_steps": 4102, "loss": 0.2266, "lr": 2.484541158472127e-05, "epoch": 3.361774744027304, "percentage": 48.03, "elapsed_time": "2:39:33", "remaining_time": "2:52:40"} +{"current_steps": 1975, "total_steps": 4102, "loss": 0.232, "lr": 2.476278869250869e-05, "epoch": 3.3703071672354947, "percentage": 48.15, "elapsed_time": "2:39:54", 
"remaining_time": "2:52:13"} +{"current_steps": 1980, "total_steps": 4102, "loss": 0.2486, "lr": 2.46800795397264e-05, "epoch": 3.378839590443686, "percentage": 48.27, "elapsed_time": "2:40:23", "remaining_time": "2:51:54"} +{"current_steps": 1985, "total_steps": 4102, "loss": 0.2378, "lr": 2.459728562434946e-05, "epoch": 3.387372013651877, "percentage": 48.39, "elapsed_time": "2:40:44", "remaining_time": "2:51:25"} +{"current_steps": 1990, "total_steps": 4102, "loss": 0.2448, "lr": 2.4514408445888097e-05, "epoch": 3.3959044368600684, "percentage": 48.51, "elapsed_time": "2:41:05", "remaining_time": "2:50:57"} +{"current_steps": 1995, "total_steps": 4102, "loss": 0.2358, "lr": 2.4431449505360516e-05, "epoch": 3.4044368600682593, "percentage": 48.63, "elapsed_time": "2:41:26", "remaining_time": "2:50:30"} +{"current_steps": 2000, "total_steps": 4102, "loss": 0.2451, "lr": 2.4348410305265788e-05, "epoch": 3.4129692832764507, "percentage": 48.76, "elapsed_time": "2:41:46", "remaining_time": "2:50:01"} +{"current_steps": 2005, "total_steps": 4102, "loss": 0.2378, "lr": 2.426529234955655e-05, "epoch": 3.4215017064846416, "percentage": 48.88, "elapsed_time": "2:43:07", "remaining_time": "2:50:36"} +{"current_steps": 2010, "total_steps": 4102, "loss": 0.2399, "lr": 2.4182097143611843e-05, "epoch": 3.430034129692833, "percentage": 49.0, "elapsed_time": "2:43:31", "remaining_time": "2:50:12"} +{"current_steps": 2015, "total_steps": 4102, "loss": 0.2443, "lr": 2.4098826194209793e-05, "epoch": 3.438566552901024, "percentage": 49.12, "elapsed_time": "2:43:51", "remaining_time": "2:49:42"} +{"current_steps": 2020, "total_steps": 4102, "loss": 0.2439, "lr": 2.4015481009500358e-05, "epoch": 3.4470989761092152, "percentage": 49.24, "elapsed_time": "2:44:14", "remaining_time": "2:49:17"} +{"current_steps": 2025, "total_steps": 4102, "loss": 0.2325, "lr": 2.3932063098977985e-05, "epoch": 3.455631399317406, "percentage": 49.37, "elapsed_time": "2:44:35", "remaining_time": "2:48:48"} 
+{"current_steps": 2030, "total_steps": 4102, "loss": 0.2453, "lr": 2.384857397345429e-05, "epoch": 3.464163822525597, "percentage": 49.49, "elapsed_time": "2:44:58", "remaining_time": "2:48:23"} +{"current_steps": 2035, "total_steps": 4102, "loss": 0.2511, "lr": 2.3765015145030694e-05, "epoch": 3.4726962457337884, "percentage": 49.61, "elapsed_time": "2:45:20", "remaining_time": "2:47:56"} +{"current_steps": 2040, "total_steps": 4102, "loss": 0.2445, "lr": 2.3681388127071033e-05, "epoch": 3.4812286689419794, "percentage": 49.73, "elapsed_time": "2:45:42", "remaining_time": "2:47:29"} +{"current_steps": 2045, "total_steps": 4102, "loss": 0.2372, "lr": 2.3597694434174137e-05, "epoch": 3.4897610921501707, "percentage": 49.85, "elapsed_time": "2:46:05", "remaining_time": "2:47:03"} +{"current_steps": 2050, "total_steps": 4102, "loss": 0.2297, "lr": 2.351393558214642e-05, "epoch": 3.4982935153583616, "percentage": 49.98, "elapsed_time": "2:46:25", "remaining_time": "2:46:35"} +{"current_steps": 2055, "total_steps": 4102, "loss": 0.2453, "lr": 2.3430113087974407e-05, "epoch": 3.506825938566553, "percentage": 50.1, "elapsed_time": "2:46:44", "remaining_time": "2:46:05"} +{"current_steps": 2060, "total_steps": 4102, "loss": 0.2385, "lr": 2.334622846979728e-05, "epoch": 3.515358361774744, "percentage": 50.22, "elapsed_time": "2:47:05", "remaining_time": "2:45:38"} +{"current_steps": 2065, "total_steps": 4102, "loss": 0.2439, "lr": 2.3262283246879353e-05, "epoch": 3.5238907849829353, "percentage": 50.34, "elapsed_time": "2:47:26", "remaining_time": "2:45:10"} +{"current_steps": 2070, "total_steps": 4102, "loss": 0.2462, "lr": 2.3178278939582604e-05, "epoch": 3.532423208191126, "percentage": 50.46, "elapsed_time": "2:47:45", "remaining_time": "2:44:40"} +{"current_steps": 2075, "total_steps": 4102, "loss": 0.256, "lr": 2.309421706933908e-05, "epoch": 3.5409556313993176, "percentage": 50.59, "elapsed_time": "2:48:06", "remaining_time": "2:44:12"} +{"current_steps": 2080, 
"total_steps": 4102, "loss": 0.2457, "lr": 2.301009915862338e-05, "epoch": 3.5494880546075085, "percentage": 50.71, "elapsed_time": "2:48:32", "remaining_time": "2:43:50"} +{"current_steps": 2085, "total_steps": 4102, "loss": 0.2467, "lr": 2.292592673092509e-05, "epoch": 3.5580204778157, "percentage": 50.83, "elapsed_time": "2:48:53", "remaining_time": "2:43:22"} +{"current_steps": 2090, "total_steps": 4102, "loss": 0.2344, "lr": 2.2841701310721143e-05, "epoch": 3.5665529010238908, "percentage": 50.95, "elapsed_time": "2:49:19", "remaining_time": "2:42:59"} +{"current_steps": 2095, "total_steps": 4102, "loss": 0.2385, "lr": 2.2757424423448253e-05, "epoch": 3.5750853242320817, "percentage": 51.07, "elapsed_time": "2:49:47", "remaining_time": "2:42:39"} +{"current_steps": 2100, "total_steps": 4102, "loss": 0.239, "lr": 2.267309759547528e-05, "epoch": 3.583617747440273, "percentage": 51.19, "elapsed_time": "2:50:10", "remaining_time": "2:42:13"} +{"current_steps": 2105, "total_steps": 4102, "loss": 0.237, "lr": 2.258872235407556e-05, "epoch": 3.5921501706484644, "percentage": 51.32, "elapsed_time": "2:50:38", "remaining_time": "2:41:53"} +{"current_steps": 2110, "total_steps": 4102, "loss": 0.2456, "lr": 2.250430022739928e-05, "epoch": 3.6006825938566553, "percentage": 51.44, "elapsed_time": "2:51:02", "remaining_time": "2:41:28"} +{"current_steps": 2115, "total_steps": 4102, "loss": 0.2342, "lr": 2.2419832744445774e-05, "epoch": 3.6092150170648463, "percentage": 51.56, "elapsed_time": "2:51:21", "remaining_time": "2:40:59"} +{"current_steps": 2120, "total_steps": 4102, "loss": 0.2327, "lr": 2.2335321435035834e-05, "epoch": 3.6177474402730376, "percentage": 51.68, "elapsed_time": "2:51:41", "remaining_time": "2:40:31"} +{"current_steps": 2125, "total_steps": 4102, "loss": 0.2489, "lr": 2.225076782978403e-05, "epoch": 3.6262798634812285, "percentage": 51.8, "elapsed_time": "2:52:05", "remaining_time": "2:40:06"} +{"current_steps": 2130, "total_steps": 4102, "loss": 
0.232, "lr": 2.2166173460070927e-05, "epoch": 3.63481228668942, "percentage": 51.93, "elapsed_time": "2:52:30", "remaining_time": "2:39:42"} +{"current_steps": 2135, "total_steps": 4102, "loss": 0.2362, "lr": 2.208153985801544e-05, "epoch": 3.643344709897611, "percentage": 52.05, "elapsed_time": "2:52:50", "remaining_time": "2:39:14"} +{"current_steps": 2140, "total_steps": 4102, "loss": 0.2387, "lr": 2.1996868556446994e-05, "epoch": 3.651877133105802, "percentage": 52.17, "elapsed_time": "2:53:17", "remaining_time": "2:38:52"} +{"current_steps": 2145, "total_steps": 4102, "loss": 0.2436, "lr": 2.191216108887783e-05, "epoch": 3.660409556313993, "percentage": 52.29, "elapsed_time": "2:53:38", "remaining_time": "2:38:25"} +{"current_steps": 2150, "total_steps": 4102, "loss": 0.2419, "lr": 2.1827418989475188e-05, "epoch": 3.6689419795221845, "percentage": 52.41, "elapsed_time": "2:53:56", "remaining_time": "2:37:55"} +{"current_steps": 2155, "total_steps": 4102, "loss": 0.2451, "lr": 2.174264379303354e-05, "epoch": 3.6774744027303754, "percentage": 52.54, "elapsed_time": "2:54:17", "remaining_time": "2:37:27"} +{"current_steps": 2160, "total_steps": 4102, "loss": 0.2424, "lr": 2.1657837034946807e-05, "epoch": 3.6860068259385663, "percentage": 52.66, "elapsed_time": "2:54:40", "remaining_time": "2:37:02"} +{"current_steps": 2165, "total_steps": 4102, "loss": 0.2332, "lr": 2.1573000251180504e-05, "epoch": 3.6945392491467577, "percentage": 52.78, "elapsed_time": "2:55:02", "remaining_time": "2:36:36"} +{"current_steps": 2170, "total_steps": 4102, "loss": 0.2238, "lr": 2.1488134978243977e-05, "epoch": 3.703071672354949, "percentage": 52.9, "elapsed_time": "2:55:23", "remaining_time": "2:36:09"} +{"current_steps": 2175, "total_steps": 4102, "loss": 0.2411, "lr": 2.140324275316254e-05, "epoch": 3.71160409556314, "percentage": 53.02, "elapsed_time": "2:55:47", "remaining_time": "2:35:45"} +{"current_steps": 2180, "total_steps": 4102, "loss": 0.2278, "lr": 
2.1318325113449645e-05, "epoch": 3.720136518771331, "percentage": 53.14, "elapsed_time": "2:56:12", "remaining_time": "2:35:21"} +{"current_steps": 2185, "total_steps": 4102, "loss": 0.2352, "lr": 2.1233383597079053e-05, "epoch": 3.7286689419795223, "percentage": 53.27, "elapsed_time": "2:56:36", "remaining_time": "2:34:57"} +{"current_steps": 2190, "total_steps": 4102, "loss": 0.2526, "lr": 2.1148419742456932e-05, "epoch": 3.737201365187713, "percentage": 53.39, "elapsed_time": "2:56:57", "remaining_time": "2:34:29"} +{"current_steps": 2195, "total_steps": 4102, "loss": 0.2434, "lr": 2.1063435088394066e-05, "epoch": 3.7457337883959045, "percentage": 53.51, "elapsed_time": "2:57:23", "remaining_time": "2:34:06"} +{"current_steps": 2200, "total_steps": 4102, "loss": 0.2402, "lr": 2.097843117407791e-05, "epoch": 3.7542662116040955, "percentage": 53.63, "elapsed_time": "2:57:43", "remaining_time": "2:33:38"} +{"current_steps": 2205, "total_steps": 4102, "loss": 0.2365, "lr": 2.0893409539044765e-05, "epoch": 3.762798634812287, "percentage": 53.75, "elapsed_time": "2:59:00", "remaining_time": "2:34:00"} +{"current_steps": 2210, "total_steps": 4102, "loss": 0.2479, "lr": 2.0808371723151885e-05, "epoch": 3.7713310580204777, "percentage": 53.88, "elapsed_time": "2:59:22", "remaining_time": "2:33:33"} +{"current_steps": 2215, "total_steps": 4102, "loss": 0.2433, "lr": 2.0723319266549556e-05, "epoch": 3.779863481228669, "percentage": 54.0, "elapsed_time": "2:59:42", "remaining_time": "2:33:05"} +{"current_steps": 2220, "total_steps": 4102, "loss": 0.2217, "lr": 2.0638253709653256e-05, "epoch": 3.78839590443686, "percentage": 54.12, "elapsed_time": "3:00:04", "remaining_time": "2:32:39"} +{"current_steps": 2225, "total_steps": 4102, "loss": 0.2458, "lr": 2.055317659311572e-05, "epoch": 3.796928327645051, "percentage": 54.24, "elapsed_time": "3:00:23", "remaining_time": "2:32:11"} +{"current_steps": 2230, "total_steps": 4102, "loss": 0.2461, "lr": 2.0468089457799022e-05, 
"epoch": 3.8054607508532423, "percentage": 54.36, "elapsed_time": "3:00:47", "remaining_time": "2:31:46"} +{"current_steps": 2235, "total_steps": 4102, "loss": 0.2318, "lr": 2.0382993844746713e-05, "epoch": 3.8139931740614337, "percentage": 54.49, "elapsed_time": "3:01:11", "remaining_time": "2:31:21"} +{"current_steps": 2240, "total_steps": 4102, "loss": 0.2383, "lr": 2.0297891295155884e-05, "epoch": 3.8225255972696246, "percentage": 54.61, "elapsed_time": "3:01:39", "remaining_time": "2:30:59"} +{"current_steps": 2245, "total_steps": 4102, "loss": 0.2447, "lr": 2.021278335034925e-05, "epoch": 3.8310580204778155, "percentage": 54.73, "elapsed_time": "3:01:57", "remaining_time": "2:30:30"} +{"current_steps": 2250, "total_steps": 4102, "loss": 0.2314, "lr": 2.012767155174724e-05, "epoch": 3.839590443686007, "percentage": 54.85, "elapsed_time": "3:02:19", "remaining_time": "2:30:04"} +{"current_steps": 2255, "total_steps": 4102, "loss": 0.2418, "lr": 2.0042557440840092e-05, "epoch": 3.848122866894198, "percentage": 54.97, "elapsed_time": "3:02:40", "remaining_time": "2:29:37"} +{"current_steps": 2260, "total_steps": 4102, "loss": 0.2419, "lr": 1.9957442559159918e-05, "epoch": 3.856655290102389, "percentage": 55.1, "elapsed_time": "3:03:06", "remaining_time": "2:29:14"} +{"current_steps": 2265, "total_steps": 4102, "loss": 0.2425, "lr": 1.9872328448252762e-05, "epoch": 3.86518771331058, "percentage": 55.22, "elapsed_time": "3:03:26", "remaining_time": "2:28:46"} +{"current_steps": 2270, "total_steps": 4102, "loss": 0.2365, "lr": 1.9787216649650757e-05, "epoch": 3.8737201365187715, "percentage": 55.34, "elapsed_time": "3:03:47", "remaining_time": "2:28:19"} +{"current_steps": 2275, "total_steps": 4102, "loss": 0.2316, "lr": 1.970210870484412e-05, "epoch": 3.8822525597269624, "percentage": 55.46, "elapsed_time": "3:04:05", "remaining_time": "2:27:50"} +{"current_steps": 2280, "total_steps": 4102, "loss": 0.2488, "lr": 1.961700615525329e-05, "epoch": 3.8907849829351537, 
"percentage": 55.58, "elapsed_time": "3:04:28", "remaining_time": "2:27:24"} +{"current_steps": 2285, "total_steps": 4102, "loss": 0.235, "lr": 1.953191054220099e-05, "epoch": 3.8993174061433447, "percentage": 55.7, "elapsed_time": "3:04:53", "remaining_time": "2:27:01"} +{"current_steps": 2290, "total_steps": 4102, "loss": 0.2338, "lr": 1.9446823406884288e-05, "epoch": 3.9078498293515356, "percentage": 55.83, "elapsed_time": "3:05:17", "remaining_time": "2:26:37"} +{"current_steps": 2295, "total_steps": 4102, "loss": 0.24, "lr": 1.9361746290346747e-05, "epoch": 3.916382252559727, "percentage": 55.95, "elapsed_time": "3:05:40", "remaining_time": "2:26:11"} +{"current_steps": 2300, "total_steps": 4102, "loss": 0.2361, "lr": 1.9276680733450447e-05, "epoch": 3.9249146757679183, "percentage": 56.07, "elapsed_time": "3:06:05", "remaining_time": "2:25:47"} +{"current_steps": 2305, "total_steps": 4102, "loss": 0.2371, "lr": 1.9191628276848125e-05, "epoch": 3.9334470989761092, "percentage": 56.19, "elapsed_time": "3:06:28", "remaining_time": "2:25:22"} +{"current_steps": 2310, "total_steps": 4102, "loss": 0.2393, "lr": 1.9106590460955242e-05, "epoch": 3.9419795221843, "percentage": 56.31, "elapsed_time": "3:06:50", "remaining_time": "2:24:56"} +{"current_steps": 2315, "total_steps": 4102, "loss": 0.241, "lr": 1.9021568825922098e-05, "epoch": 3.9505119453924915, "percentage": 56.44, "elapsed_time": "3:07:16", "remaining_time": "2:24:33"} +{"current_steps": 2320, "total_steps": 4102, "loss": 0.2415, "lr": 1.893656491160594e-05, "epoch": 3.9590443686006824, "percentage": 56.56, "elapsed_time": "3:07:36", "remaining_time": "2:24:06"} +{"current_steps": 2325, "total_steps": 4102, "loss": 0.2436, "lr": 1.8851580257543067e-05, "epoch": 3.967576791808874, "percentage": 56.68, "elapsed_time": "3:07:56", "remaining_time": "2:23:38"} +{"current_steps": 2330, "total_steps": 4102, "loss": 0.2282, "lr": 1.8766616402920957e-05, "epoch": 3.9761092150170647, "percentage": 56.8, 
"elapsed_time": "3:08:23", "remaining_time": "2:23:16"} +{"current_steps": 2335, "total_steps": 4102, "loss": 0.2401, "lr": 1.868167488655036e-05, "epoch": 3.984641638225256, "percentage": 56.92, "elapsed_time": "3:08:43", "remaining_time": "2:22:48"} +{"current_steps": 2340, "total_steps": 4102, "loss": 0.2253, "lr": 1.8596757246837466e-05, "epoch": 3.993174061433447, "percentage": 57.05, "elapsed_time": "3:09:08", "remaining_time": "2:22:25"} +{"current_steps": 2345, "total_steps": 4102, "loss": 0.2309, "lr": 1.851186502175603e-05, "epoch": 4.001706484641638, "percentage": 57.17, "elapsed_time": "3:09:27", "remaining_time": "2:21:56"} +{"current_steps": 2350, "total_steps": 4102, "loss": 0.2082, "lr": 1.84269997488195e-05, "epoch": 4.010238907849829, "percentage": 57.29, "elapsed_time": "3:09:51", "remaining_time": "2:21:32"} +{"current_steps": 2355, "total_steps": 4102, "loss": 0.2124, "lr": 1.8342162965053204e-05, "epoch": 4.01877133105802, "percentage": 57.41, "elapsed_time": "3:10:16", "remaining_time": "2:21:09"} +{"current_steps": 2360, "total_steps": 4102, "loss": 0.214, "lr": 1.8257356206966465e-05, "epoch": 4.027303754266212, "percentage": 57.53, "elapsed_time": "3:10:36", "remaining_time": "2:20:41"} +{"current_steps": 2365, "total_steps": 4102, "loss": 0.2111, "lr": 1.8172581010524815e-05, "epoch": 4.035836177474403, "percentage": 57.65, "elapsed_time": "3:11:02", "remaining_time": "2:20:19"} +{"current_steps": 2370, "total_steps": 4102, "loss": 0.2099, "lr": 1.8087838911122174e-05, "epoch": 4.044368600682594, "percentage": 57.78, "elapsed_time": "3:11:30", "remaining_time": "2:19:57"} +{"current_steps": 2375, "total_steps": 4102, "loss": 0.2009, "lr": 1.8003131443553016e-05, "epoch": 4.052901023890785, "percentage": 57.9, "elapsed_time": "3:11:53", "remaining_time": "2:19:32"} +{"current_steps": 2380, "total_steps": 4102, "loss": 0.2273, "lr": 1.7918460141984567e-05, "epoch": 4.061433447098976, "percentage": 58.02, "elapsed_time": "3:12:18", 
"remaining_time": "2:19:08"} +{"current_steps": 2385, "total_steps": 4102, "loss": 0.2023, "lr": 1.7833826539929077e-05, "epoch": 4.0699658703071675, "percentage": 58.14, "elapsed_time": "3:12:44", "remaining_time": "2:18:45"} +{"current_steps": 2390, "total_steps": 4102, "loss": 0.2167, "lr": 1.7749232170215977e-05, "epoch": 4.078498293515358, "percentage": 58.26, "elapsed_time": "3:13:02", "remaining_time": "2:18:16"} +{"current_steps": 2395, "total_steps": 4102, "loss": 0.213, "lr": 1.7664678564964166e-05, "epoch": 4.087030716723549, "percentage": 58.39, "elapsed_time": "3:13:27", "remaining_time": "2:17:53"} +{"current_steps": 2400, "total_steps": 4102, "loss": 0.2081, "lr": 1.7580167255554236e-05, "epoch": 4.09556313993174, "percentage": 58.51, "elapsed_time": "3:13:51", "remaining_time": "2:17:29"} +{"current_steps": 2405, "total_steps": 4102, "loss": 0.2047, "lr": 1.7495699772600723e-05, "epoch": 4.104095563139932, "percentage": 58.63, "elapsed_time": "3:15:11", "remaining_time": "2:17:43"} +{"current_steps": 2410, "total_steps": 4102, "loss": 0.2221, "lr": 1.7411277645924446e-05, "epoch": 4.112627986348123, "percentage": 58.75, "elapsed_time": "3:15:31", "remaining_time": "2:17:16"} +{"current_steps": 2415, "total_steps": 4102, "loss": 0.2128, "lr": 1.7326902404524725e-05, "epoch": 4.121160409556314, "percentage": 58.87, "elapsed_time": "3:15:57", "remaining_time": "2:16:52"} +{"current_steps": 2420, "total_steps": 4102, "loss": 0.2009, "lr": 1.7242575576551754e-05, "epoch": 4.129692832764505, "percentage": 59.0, "elapsed_time": "3:16:19", "remaining_time": "2:16:27"} +{"current_steps": 2425, "total_steps": 4102, "loss": 0.2162, "lr": 1.7158298689278867e-05, "epoch": 4.138225255972697, "percentage": 59.12, "elapsed_time": "3:16:45", "remaining_time": "2:16:03"} +{"current_steps": 2430, "total_steps": 4102, "loss": 0.2199, "lr": 1.7074073269074916e-05, "epoch": 4.146757679180888, "percentage": 59.24, "elapsed_time": "3:17:11", "remaining_time": "2:15:41"} 
+{"current_steps": 2435, "total_steps": 4102, "loss": 0.2109, "lr": 1.6989900841376622e-05, "epoch": 4.1552901023890785, "percentage": 59.36, "elapsed_time": "3:17:30", "remaining_time": "2:15:13"} +{"current_steps": 2440, "total_steps": 4102, "loss": 0.2145, "lr": 1.6905782930660924e-05, "epoch": 4.163822525597269, "percentage": 59.48, "elapsed_time": "3:17:50", "remaining_time": "2:14:45"} +{"current_steps": 2445, "total_steps": 4102, "loss": 0.2115, "lr": 1.6821721060417403e-05, "epoch": 4.172354948805461, "percentage": 59.61, "elapsed_time": "3:18:14", "remaining_time": "2:14:20"} +{"current_steps": 2450, "total_steps": 4102, "loss": 0.2131, "lr": 1.673771675312065e-05, "epoch": 4.180887372013652, "percentage": 59.73, "elapsed_time": "3:18:31", "remaining_time": "2:13:51"} +{"current_steps": 2455, "total_steps": 4102, "loss": 0.216, "lr": 1.6653771530202727e-05, "epoch": 4.189419795221843, "percentage": 59.85, "elapsed_time": "3:18:50", "remaining_time": "2:13:23"} +{"current_steps": 2460, "total_steps": 4102, "loss": 0.2184, "lr": 1.65698869120256e-05, "epoch": 4.197952218430034, "percentage": 59.97, "elapsed_time": "3:19:14", "remaining_time": "2:12:59"} +{"current_steps": 2465, "total_steps": 4102, "loss": 0.2091, "lr": 1.6486064417853583e-05, "epoch": 4.206484641638225, "percentage": 60.09, "elapsed_time": "3:19:34", "remaining_time": "2:12:32"} +{"current_steps": 2470, "total_steps": 4102, "loss": 0.2131, "lr": 1.640230556582587e-05, "epoch": 4.215017064846417, "percentage": 60.21, "elapsed_time": "3:19:59", "remaining_time": "2:12:08"} +{"current_steps": 2475, "total_steps": 4102, "loss": 0.2124, "lr": 1.631861187292897e-05, "epoch": 4.223549488054608, "percentage": 60.34, "elapsed_time": "3:20:23", "remaining_time": "2:11:44"} +{"current_steps": 2480, "total_steps": 4102, "loss": 0.2198, "lr": 1.623498485496931e-05, "epoch": 4.2320819112627985, "percentage": 60.46, "elapsed_time": "3:20:46", "remaining_time": "2:11:18"} +{"current_steps": 2485, 
"total_steps": 4102, "loss": 0.212, "lr": 1.6151426026545715e-05, "epoch": 4.2406143344709895, "percentage": 60.58, "elapsed_time": "3:21:10", "remaining_time": "2:10:54"} +{"current_steps": 2490, "total_steps": 4102, "loss": 0.2142, "lr": 1.606793690102203e-05, "epoch": 4.249146757679181, "percentage": 60.7, "elapsed_time": "3:21:33", "remaining_time": "2:10:29"} +{"current_steps": 2495, "total_steps": 4102, "loss": 0.2089, "lr": 1.5984518990499656e-05, "epoch": 4.257679180887372, "percentage": 60.82, "elapsed_time": "3:21:58", "remaining_time": "2:10:05"} +{"current_steps": 2500, "total_steps": 4102, "loss": 0.2165, "lr": 1.5901173805790214e-05, "epoch": 4.266211604095563, "percentage": 60.95, "elapsed_time": "3:22:30", "remaining_time": "2:09:45"} +{"current_steps": 2505, "total_steps": 4102, "loss": 0.2216, "lr": 1.5817902856388164e-05, "epoch": 4.274744027303754, "percentage": 61.07, "elapsed_time": "3:22:51", "remaining_time": "2:09:19"} +{"current_steps": 2510, "total_steps": 4102, "loss": 0.2211, "lr": 1.573470765044345e-05, "epoch": 4.283276450511945, "percentage": 61.19, "elapsed_time": "3:23:14", "remaining_time": "2:08:54"} +{"current_steps": 2515, "total_steps": 4102, "loss": 0.2079, "lr": 1.565158969473422e-05, "epoch": 4.291808873720137, "percentage": 61.31, "elapsed_time": "3:23:37", "remaining_time": "2:08:29"} +{"current_steps": 2520, "total_steps": 4102, "loss": 0.2099, "lr": 1.5568550494639488e-05, "epoch": 4.300341296928328, "percentage": 61.43, "elapsed_time": "3:23:58", "remaining_time": "2:08:03"} +{"current_steps": 2525, "total_steps": 4102, "loss": 0.2169, "lr": 1.548559155411191e-05, "epoch": 4.308873720136519, "percentage": 61.56, "elapsed_time": "3:24:24", "remaining_time": "2:07:40"} +{"current_steps": 2530, "total_steps": 4102, "loss": 0.2107, "lr": 1.5402714375650546e-05, "epoch": 4.3174061433447095, "percentage": 61.68, "elapsed_time": "3:24:47", "remaining_time": "2:07:15"} +{"current_steps": 2535, "total_steps": 4102, "loss": 
0.2172, "lr": 1.5319920460273604e-05, "epoch": 4.325938566552901, "percentage": 61.8, "elapsed_time": "3:25:05", "remaining_time": "2:06:46"} +{"current_steps": 2540, "total_steps": 4102, "loss": 0.2182, "lr": 1.5237211307491322e-05, "epoch": 4.334470989761092, "percentage": 61.92, "elapsed_time": "3:25:27", "remaining_time": "2:06:21"} +{"current_steps": 2545, "total_steps": 4102, "loss": 0.2062, "lr": 1.5154588415278735e-05, "epoch": 4.343003412969283, "percentage": 62.04, "elapsed_time": "3:25:50", "remaining_time": "2:05:55"} +{"current_steps": 2550, "total_steps": 4102, "loss": 0.2296, "lr": 1.50720532800486e-05, "epoch": 4.351535836177474, "percentage": 62.16, "elapsed_time": "3:26:12", "remaining_time": "2:05:30"} +{"current_steps": 2555, "total_steps": 4102, "loss": 0.2163, "lr": 1.498960739662428e-05, "epoch": 4.360068259385666, "percentage": 62.29, "elapsed_time": "3:26:32", "remaining_time": "2:05:03"} +{"current_steps": 2560, "total_steps": 4102, "loss": 0.2113, "lr": 1.490725225821267e-05, "epoch": 4.368600682593857, "percentage": 62.41, "elapsed_time": "3:26:53", "remaining_time": "2:04:37"} +{"current_steps": 2565, "total_steps": 4102, "loss": 0.2284, "lr": 1.482498935637712e-05, "epoch": 4.377133105802048, "percentage": 62.53, "elapsed_time": "3:27:16", "remaining_time": "2:04:12"} +{"current_steps": 2570, "total_steps": 4102, "loss": 0.2192, "lr": 1.4742820181010489e-05, "epoch": 4.385665529010239, "percentage": 62.65, "elapsed_time": "3:27:36", "remaining_time": "2:03:45"} +{"current_steps": 2575, "total_steps": 4102, "loss": 0.2265, "lr": 1.466074622030809e-05, "epoch": 4.3941979522184305, "percentage": 62.77, "elapsed_time": "3:27:58", "remaining_time": "2:03:19"} +{"current_steps": 2580, "total_steps": 4102, "loss": 0.2182, "lr": 1.4578768960740797e-05, "epoch": 4.402730375426621, "percentage": 62.9, "elapsed_time": "3:28:15", "remaining_time": "2:02:51"} +{"current_steps": 2585, "total_steps": 4102, "loss": 0.2082, "lr": 
1.4496889887028083e-05, "epoch": 4.411262798634812, "percentage": 63.02, "elapsed_time": "3:28:34", "remaining_time": "2:02:24"} +{"current_steps": 2590, "total_steps": 4102, "loss": 0.2105, "lr": 1.4415110482111126e-05, "epoch": 4.419795221843003, "percentage": 63.14, "elapsed_time": "3:28:54", "remaining_time": "2:01:57"} +{"current_steps": 2595, "total_steps": 4102, "loss": 0.2231, "lr": 1.4333432227125994e-05, "epoch": 4.428327645051194, "percentage": 63.26, "elapsed_time": "3:29:18", "remaining_time": "2:01:32"} +{"current_steps": 2600, "total_steps": 4102, "loss": 0.2218, "lr": 1.425185660137677e-05, "epoch": 4.436860068259386, "percentage": 63.38, "elapsed_time": "3:29:38", "remaining_time": "2:01:06"} +{"current_steps": 2605, "total_steps": 4102, "loss": 0.2227, "lr": 1.4170385082308803e-05, "epoch": 4.445392491467577, "percentage": 63.51, "elapsed_time": "3:30:54", "remaining_time": "2:01:11"} +{"current_steps": 2610, "total_steps": 4102, "loss": 0.2105, "lr": 1.408901914548192e-05, "epoch": 4.453924914675768, "percentage": 63.63, "elapsed_time": "3:31:18", "remaining_time": "2:00:47"} +{"current_steps": 2615, "total_steps": 4102, "loss": 0.2087, "lr": 1.4007760264543694e-05, "epoch": 4.462457337883959, "percentage": 63.75, "elapsed_time": "3:31:41", "remaining_time": "2:00:22"} +{"current_steps": 2620, "total_steps": 4102, "loss": 0.2116, "lr": 1.3926609911202796e-05, "epoch": 4.4709897610921505, "percentage": 63.87, "elapsed_time": "3:32:10", "remaining_time": "2:00:01"} +{"current_steps": 2625, "total_steps": 4102, "loss": 0.2135, "lr": 1.3845569555202296e-05, "epoch": 4.479522184300341, "percentage": 63.99, "elapsed_time": "3:32:29", "remaining_time": "1:59:33"} +{"current_steps": 2630, "total_steps": 4102, "loss": 0.2151, "lr": 1.3764640664293083e-05, "epoch": 4.488054607508532, "percentage": 64.12, "elapsed_time": "3:32:50", "remaining_time": "1:59:07"} +{"current_steps": 2635, "total_steps": 4102, "loss": 0.2152, "lr": 1.3683824704207234e-05, 
"epoch": 4.496587030716723, "percentage": 64.24, "elapsed_time": "3:33:10", "remaining_time": "1:58:41"} +{"current_steps": 2640, "total_steps": 4102, "loss": 0.2189, "lr": 1.3603123138631516e-05, "epoch": 4.505119453924914, "percentage": 64.36, "elapsed_time": "3:33:32", "remaining_time": "1:58:15"} +{"current_steps": 2645, "total_steps": 4102, "loss": 0.214, "lr": 1.3522537429180853e-05, "epoch": 4.513651877133106, "percentage": 64.48, "elapsed_time": "3:33:52", "remaining_time": "1:57:48"} +{"current_steps": 2650, "total_steps": 4102, "loss": 0.22, "lr": 1.3442069035371852e-05, "epoch": 4.522184300341297, "percentage": 64.6, "elapsed_time": "3:34:17", "remaining_time": "1:57:24"} +{"current_steps": 2655, "total_steps": 4102, "loss": 0.2142, "lr": 1.3361719414596386e-05, "epoch": 4.530716723549488, "percentage": 64.72, "elapsed_time": "3:34:43", "remaining_time": "1:57:01"} +{"current_steps": 2660, "total_steps": 4102, "loss": 0.2193, "lr": 1.3281490022095169e-05, "epoch": 4.53924914675768, "percentage": 64.85, "elapsed_time": "3:35:02", "remaining_time": "1:56:34"} +{"current_steps": 2665, "total_steps": 4102, "loss": 0.234, "lr": 1.3201382310931427e-05, "epoch": 4.547781569965871, "percentage": 64.97, "elapsed_time": "3:35:21", "remaining_time": "1:56:07"} +{"current_steps": 2670, "total_steps": 4102, "loss": 0.2151, "lr": 1.312139773196458e-05, "epoch": 4.5563139931740615, "percentage": 65.09, "elapsed_time": "3:35:39", "remaining_time": "1:55:39"} +{"current_steps": 2675, "total_steps": 4102, "loss": 0.2205, "lr": 1.304153773382394e-05, "epoch": 4.564846416382252, "percentage": 65.21, "elapsed_time": "3:36:00", "remaining_time": "1:55:13"} +{"current_steps": 2680, "total_steps": 4102, "loss": 0.217, "lr": 1.2961803762882514e-05, "epoch": 4.573378839590443, "percentage": 65.33, "elapsed_time": "3:36:26", "remaining_time": "1:54:50"} +{"current_steps": 2685, "total_steps": 4102, "loss": 0.2119, "lr": 1.2882197263230754e-05, "epoch": 4.581911262798635, 
"percentage": 65.46, "elapsed_time": "3:36:46", "remaining_time": "1:54:24"} +{"current_steps": 2690, "total_steps": 4102, "loss": 0.2076, "lr": 1.280271967665046e-05, "epoch": 4.590443686006826, "percentage": 65.58, "elapsed_time": "3:37:10", "remaining_time": "1:53:59"} +{"current_steps": 2695, "total_steps": 4102, "loss": 0.2182, "lr": 1.272337244258863e-05, "epoch": 4.598976109215017, "percentage": 65.7, "elapsed_time": "3:37:30", "remaining_time": "1:53:33"} +{"current_steps": 2700, "total_steps": 4102, "loss": 0.2129, "lr": 1.2644156998131407e-05, "epoch": 4.607508532423208, "percentage": 65.82, "elapsed_time": "3:37:53", "remaining_time": "1:53:08"} +{"current_steps": 2705, "total_steps": 4102, "loss": 0.22, "lr": 1.2565074777978037e-05, "epoch": 4.6160409556314, "percentage": 65.94, "elapsed_time": "3:38:12", "remaining_time": "1:52:41"} +{"current_steps": 2710, "total_steps": 4102, "loss": 0.2102, "lr": 1.2486127214414898e-05, "epoch": 4.624573378839591, "percentage": 66.07, "elapsed_time": "3:38:34", "remaining_time": "1:52:16"} +{"current_steps": 2715, "total_steps": 4102, "loss": 0.2063, "lr": 1.2407315737289558e-05, "epoch": 4.6331058020477816, "percentage": 66.19, "elapsed_time": "3:38:55", "remaining_time": "1:51:50"} +{"current_steps": 2720, "total_steps": 4102, "loss": 0.228, "lr": 1.2328641773984864e-05, "epoch": 4.6416382252559725, "percentage": 66.31, "elapsed_time": "3:39:16", "remaining_time": "1:51:24"} +{"current_steps": 2725, "total_steps": 4102, "loss": 0.2203, "lr": 1.225010674939312e-05, "epoch": 4.650170648464163, "percentage": 66.43, "elapsed_time": "3:39:37", "remaining_time": "1:50:58"} +{"current_steps": 2730, "total_steps": 4102, "loss": 0.2152, "lr": 1.2171712085890237e-05, "epoch": 4.658703071672355, "percentage": 66.55, "elapsed_time": "3:39:57", "remaining_time": "1:50:32"} +{"current_steps": 2735, "total_steps": 4102, "loss": 0.2211, "lr": 1.2093459203310008e-05, "epoch": 4.667235494880546, "percentage": 66.67, "elapsed_time": 
"3:40:18", "remaining_time": "1:50:06"} +{"current_steps": 2740, "total_steps": 4102, "loss": 0.2211, "lr": 1.2015349518918391e-05, "epoch": 4.675767918088737, "percentage": 66.8, "elapsed_time": "3:40:36", "remaining_time": "1:49:39"} +{"current_steps": 2745, "total_steps": 4102, "loss": 0.2155, "lr": 1.1937384447387817e-05, "epoch": 4.684300341296928, "percentage": 66.92, "elapsed_time": "3:40:59", "remaining_time": "1:49:15"} +{"current_steps": 2750, "total_steps": 4102, "loss": 0.2141, "lr": 1.1859565400771577e-05, "epoch": 4.69283276450512, "percentage": 67.04, "elapsed_time": "3:41:22", "remaining_time": "1:48:50"} +{"current_steps": 2755, "total_steps": 4102, "loss": 0.2079, "lr": 1.1781893788478268e-05, "epoch": 4.701365187713311, "percentage": 67.16, "elapsed_time": "3:41:42", "remaining_time": "1:48:24"} +{"current_steps": 2760, "total_steps": 4102, "loss": 0.2074, "lr": 1.1704371017246241e-05, "epoch": 4.709897610921502, "percentage": 67.28, "elapsed_time": "3:42:03", "remaining_time": "1:47:58"} +{"current_steps": 2765, "total_steps": 4102, "loss": 0.2117, "lr": 1.1626998491118138e-05, "epoch": 4.7184300341296925, "percentage": 67.41, "elapsed_time": "3:42:26", "remaining_time": "1:47:33"} +{"current_steps": 2770, "total_steps": 4102, "loss": 0.2113, "lr": 1.1549777611415469e-05, "epoch": 4.726962457337884, "percentage": 67.53, "elapsed_time": "3:42:50", "remaining_time": "1:47:09"} +{"current_steps": 2775, "total_steps": 4102, "loss": 0.2087, "lr": 1.147270977671319e-05, "epoch": 4.735494880546075, "percentage": 67.65, "elapsed_time": "3:43:14", "remaining_time": "1:46:45"} +{"current_steps": 2780, "total_steps": 4102, "loss": 0.212, "lr": 1.1395796382814419e-05, "epoch": 4.744027303754266, "percentage": 67.77, "elapsed_time": "3:43:39", "remaining_time": "1:46:21"} +{"current_steps": 2785, "total_steps": 4102, "loss": 0.2069, "lr": 1.1319038822725165e-05, "epoch": 4.752559726962457, "percentage": 67.89, "elapsed_time": "3:44:00", "remaining_time": 
"1:45:55"} +{"current_steps": 2790, "total_steps": 4102, "loss": 0.2086, "lr": 1.1242438486629048e-05, "epoch": 4.761092150170649, "percentage": 68.02, "elapsed_time": "3:44:19", "remaining_time": "1:45:29"} +{"current_steps": 2795, "total_steps": 4102, "loss": 0.2102, "lr": 1.1165996761862155e-05, "epoch": 4.76962457337884, "percentage": 68.14, "elapsed_time": "3:44:41", "remaining_time": "1:45:04"} +{"current_steps": 2800, "total_steps": 4102, "loss": 0.226, "lr": 1.1089715032887905e-05, "epoch": 4.778156996587031, "percentage": 68.26, "elapsed_time": "3:45:00", "remaining_time": "1:44:37"} +{"current_steps": 2805, "total_steps": 4102, "loss": 0.2075, "lr": 1.101359468127198e-05, "epoch": 4.786689419795222, "percentage": 68.38, "elapsed_time": "3:46:23", "remaining_time": "1:44:40"} +{"current_steps": 2810, "total_steps": 4102, "loss": 0.218, "lr": 1.0937637085657297e-05, "epoch": 4.795221843003413, "percentage": 68.5, "elapsed_time": "3:46:42", "remaining_time": "1:44:14"} +{"current_steps": 2815, "total_steps": 4102, "loss": 0.2144, "lr": 1.0861843621739042e-05, "epoch": 4.803754266211604, "percentage": 68.63, "elapsed_time": "3:47:01", "remaining_time": "1:43:47"} +{"current_steps": 2820, "total_steps": 4102, "loss": 0.2161, "lr": 1.078621566223975e-05, "epoch": 4.812286689419795, "percentage": 68.75, "elapsed_time": "3:47:23", "remaining_time": "1:43:22"} +{"current_steps": 2825, "total_steps": 4102, "loss": 0.2149, "lr": 1.0710754576884445e-05, "epoch": 4.820819112627986, "percentage": 68.87, "elapsed_time": "3:47:44", "remaining_time": "1:42:56"} +{"current_steps": 2830, "total_steps": 4102, "loss": 0.2125, "lr": 1.0635461732375838e-05, "epoch": 4.829351535836177, "percentage": 68.99, "elapsed_time": "3:48:12", "remaining_time": "1:42:34"} +{"current_steps": 2835, "total_steps": 4102, "loss": 0.2131, "lr": 1.056033849236958e-05, "epoch": 4.837883959044369, "percentage": 69.11, "elapsed_time": "3:48:40", "remaining_time": "1:42:11"} +{"current_steps": 2840, 
"total_steps": 4102, "loss": 0.2176, "lr": 1.0485386217449537e-05, "epoch": 4.84641638225256, "percentage": 69.23, "elapsed_time": "3:48:58", "remaining_time": "1:41:44"} +{"current_steps": 2845, "total_steps": 4102, "loss": 0.2217, "lr": 1.0410606265103159e-05, "epoch": 4.854948805460751, "percentage": 69.36, "elapsed_time": "3:49:18", "remaining_time": "1:41:18"} +{"current_steps": 2850, "total_steps": 4102, "loss": 0.2137, "lr": 1.0335999989696926e-05, "epoch": 4.863481228668942, "percentage": 69.48, "elapsed_time": "3:49:40", "remaining_time": "1:40:53"} +{"current_steps": 2855, "total_steps": 4102, "loss": 0.2125, "lr": 1.0261568742451776e-05, "epoch": 4.872013651877133, "percentage": 69.6, "elapsed_time": "3:50:03", "remaining_time": "1:40:28"} +{"current_steps": 2860, "total_steps": 4102, "loss": 0.2084, "lr": 1.0187313871418652e-05, "epoch": 4.8805460750853245, "percentage": 69.72, "elapsed_time": "3:50:24", "remaining_time": "1:40:03"} +{"current_steps": 2865, "total_steps": 4102, "loss": 0.222, "lr": 1.0113236721454087e-05, "epoch": 4.889078498293515, "percentage": 69.84, "elapsed_time": "3:50:52", "remaining_time": "1:39:41"} +{"current_steps": 2870, "total_steps": 4102, "loss": 0.2095, "lr": 1.0039338634195837e-05, "epoch": 4.897610921501706, "percentage": 69.97, "elapsed_time": "3:51:11", "remaining_time": "1:39:14"} +{"current_steps": 2875, "total_steps": 4102, "loss": 0.2204, "lr": 9.965620948038597e-06, "epoch": 4.906143344709898, "percentage": 70.09, "elapsed_time": "3:51:32", "remaining_time": "1:38:49"} +{"current_steps": 2880, "total_steps": 4102, "loss": 0.2035, "lr": 9.892084998109746e-06, "epoch": 4.914675767918089, "percentage": 70.21, "elapsed_time": "3:51:57", "remaining_time": "1:38:25"} +{"current_steps": 2885, "total_steps": 4102, "loss": 0.2268, "lr": 9.818732116245193e-06, "epoch": 4.92320819112628, "percentage": 70.33, "elapsed_time": "3:52:20", "remaining_time": "1:38:00"} +{"current_steps": 2890, "total_steps": 4102, "loss": 
0.2097, "lr": 9.745563630965204e-06, "epoch": 4.931740614334471, "percentage": 70.45, "elapsed_time": "3:52:41", "remaining_time": "1:37:35"} +{"current_steps": 2895, "total_steps": 4102, "loss": 0.2104, "lr": 9.672580867450397e-06, "epoch": 4.940273037542662, "percentage": 70.58, "elapsed_time": "3:53:06", "remaining_time": "1:37:11"} +{"current_steps": 2900, "total_steps": 4102, "loss": 0.2252, "lr": 9.599785147517694e-06, "epoch": 4.948805460750854, "percentage": 70.7, "elapsed_time": "3:53:30", "remaining_time": "1:36:47"} +{"current_steps": 2905, "total_steps": 4102, "loss": 0.2212, "lr": 9.527177789596442e-06, "epoch": 4.9573378839590445, "percentage": 70.82, "elapsed_time": "3:53:47", "remaining_time": "1:36:19"} +{"current_steps": 2910, "total_steps": 4102, "loss": 0.2081, "lr": 9.454760108704467e-06, "epoch": 4.965870307167235, "percentage": 70.94, "elapsed_time": "3:54:08", "remaining_time": "1:35:54"} +{"current_steps": 2915, "total_steps": 4102, "loss": 0.2181, "lr": 9.382533416424269e-06, "epoch": 4.974402730375426, "percentage": 71.06, "elapsed_time": "3:54:29", "remaining_time": "1:35:29"} +{"current_steps": 2920, "total_steps": 4102, "loss": 0.2116, "lr": 9.310499020879336e-06, "epoch": 4.982935153583618, "percentage": 71.18, "elapsed_time": "3:54:51", "remaining_time": "1:35:04"} +{"current_steps": 2925, "total_steps": 4102, "loss": 0.2236, "lr": 9.238658226710359e-06, "epoch": 4.991467576791809, "percentage": 71.31, "elapsed_time": "3:55:13", "remaining_time": "1:34:39"} +{"current_steps": 2930, "total_steps": 4102, "loss": 0.2182, "lr": 9.167012335051663e-06, "epoch": 5.0, "percentage": 71.43, "elapsed_time": "3:55:36", "remaining_time": "1:34:14"} +{"current_steps": 2935, "total_steps": 4102, "loss": 0.2025, "lr": 9.09556264350762e-06, "epoch": 5.008532423208191, "percentage": 71.55, "elapsed_time": "3:55:55", "remaining_time": "1:33:48"} +{"current_steps": 2940, "total_steps": 4102, "loss": 0.195, "lr": 9.024310446129151e-06, "epoch": 
5.017064846416382, "percentage": 71.67, "elapsed_time": "3:56:14", "remaining_time": "1:33:22"} +{"current_steps": 2945, "total_steps": 4102, "loss": 0.1949, "lr": 8.953257033390293e-06, "epoch": 5.025597269624574, "percentage": 71.79, "elapsed_time": "3:56:38", "remaining_time": "1:32:58"} +{"current_steps": 2950, "total_steps": 4102, "loss": 0.1827, "lr": 8.882403692164807e-06, "epoch": 5.034129692832765, "percentage": 71.92, "elapsed_time": "3:57:04", "remaining_time": "1:32:34"} +{"current_steps": 2955, "total_steps": 4102, "loss": 0.1896, "lr": 8.811751705702927e-06, "epoch": 5.0426621160409555, "percentage": 72.04, "elapsed_time": "3:57:26", "remaining_time": "1:32:09"} +{"current_steps": 2960, "total_steps": 4102, "loss": 0.1965, "lr": 8.741302353608032e-06, "epoch": 5.051194539249146, "percentage": 72.16, "elapsed_time": "3:57:46", "remaining_time": "1:31:43"} +{"current_steps": 2965, "total_steps": 4102, "loss": 0.193, "lr": 8.671056911813536e-06, "epoch": 5.059726962457338, "percentage": 72.28, "elapsed_time": "3:58:07", "remaining_time": "1:31:18"} +{"current_steps": 2970, "total_steps": 4102, "loss": 0.1959, "lr": 8.601016652559775e-06, "epoch": 5.068259385665529, "percentage": 72.4, "elapsed_time": "3:58:35", "remaining_time": "1:30:56"} +{"current_steps": 2975, "total_steps": 4102, "loss": 0.1945, "lr": 8.531182844370936e-06, "epoch": 5.07679180887372, "percentage": 72.53, "elapsed_time": "3:59:03", "remaining_time": "1:30:33"} +{"current_steps": 2980, "total_steps": 4102, "loss": 0.1914, "lr": 8.461556752032097e-06, "epoch": 5.085324232081911, "percentage": 72.65, "elapsed_time": "3:59:27", "remaining_time": "1:30:09"} +{"current_steps": 2985, "total_steps": 4102, "loss": 0.1867, "lr": 8.392139636566321e-06, "epoch": 5.093856655290103, "percentage": 72.77, "elapsed_time": "3:59:54", "remaining_time": "1:29:46"} +{"current_steps": 2990, "total_steps": 4102, "loss": 0.2061, "lr": 8.322932755211818e-06, "epoch": 5.102389078498294, "percentage": 72.89, 
"elapsed_time": "4:00:12", "remaining_time": "1:29:20"} +{"current_steps": 2995, "total_steps": 4102, "loss": 0.1875, "lr": 8.253937361399174e-06, "epoch": 5.110921501706485, "percentage": 73.01, "elapsed_time": "4:00:40", "remaining_time": "1:28:57"} +{"current_steps": 3000, "total_steps": 4102, "loss": 0.1975, "lr": 8.185154704728637e-06, "epoch": 5.1194539249146755, "percentage": 73.14, "elapsed_time": "4:01:02", "remaining_time": "1:28:32"} +{"current_steps": 3005, "total_steps": 4102, "loss": 0.1934, "lr": 8.116586030947529e-06, "epoch": 5.1279863481228665, "percentage": 73.26, "elapsed_time": "4:02:20", "remaining_time": "1:28:28"} +{"current_steps": 3010, "total_steps": 4102, "loss": 0.1945, "lr": 8.048232581927604e-06, "epoch": 5.136518771331058, "percentage": 73.38, "elapsed_time": "4:02:47", "remaining_time": "1:28:05"} +{"current_steps": 3015, "total_steps": 4102, "loss": 0.1978, "lr": 7.980095595642635e-06, "epoch": 5.145051194539249, "percentage": 73.5, "elapsed_time": "4:03:06", "remaining_time": "1:27:38"} +{"current_steps": 3020, "total_steps": 4102, "loss": 0.1967, "lr": 7.91217630614596e-06, "epoch": 5.15358361774744, "percentage": 73.62, "elapsed_time": "4:03:29", "remaining_time": "1:27:14"} +{"current_steps": 3025, "total_steps": 4102, "loss": 0.1953, "lr": 7.84447594354813e-06, "epoch": 5.162116040955631, "percentage": 73.74, "elapsed_time": "4:03:54", "remaining_time": "1:26:50"} +{"current_steps": 3030, "total_steps": 4102, "loss": 0.1923, "lr": 7.776995733994608e-06, "epoch": 5.170648464163823, "percentage": 73.87, "elapsed_time": "4:04:15", "remaining_time": "1:26:24"} +{"current_steps": 3035, "total_steps": 4102, "loss": 0.2023, "lr": 7.709736899643627e-06, "epoch": 5.179180887372014, "percentage": 73.99, "elapsed_time": "4:04:38", "remaining_time": "1:26:00"} +{"current_steps": 3040, "total_steps": 4102, "loss": 0.1965, "lr": 7.642700658643991e-06, "epoch": 5.187713310580205, "percentage": 74.11, "elapsed_time": "4:05:00", 
"remaining_time": "1:25:35"} +{"current_steps": 3045, "total_steps": 4102, "loss": 0.2055, "lr": 7.575888225113037e-06, "epoch": 5.196245733788396, "percentage": 74.23, "elapsed_time": "4:05:23", "remaining_time": "1:25:10"} +{"current_steps": 3050, "total_steps": 4102, "loss": 0.1899, "lr": 7.50930080911465e-06, "epoch": 5.204778156996587, "percentage": 74.35, "elapsed_time": "4:05:48", "remaining_time": "1:24:46"} +{"current_steps": 3055, "total_steps": 4102, "loss": 0.2004, "lr": 7.442939616637339e-06, "epoch": 5.213310580204778, "percentage": 74.48, "elapsed_time": "4:06:07", "remaining_time": "1:24:21"} +{"current_steps": 3060, "total_steps": 4102, "loss": 0.2039, "lr": 7.376805849572402e-06, "epoch": 5.221843003412969, "percentage": 74.6, "elapsed_time": "4:06:30", "remaining_time": "1:23:56"} +{"current_steps": 3065, "total_steps": 4102, "loss": 0.2058, "lr": 7.310900705692137e-06, "epoch": 5.23037542662116, "percentage": 74.72, "elapsed_time": "4:06:50", "remaining_time": "1:23:30"} +{"current_steps": 3070, "total_steps": 4102, "loss": 0.2015, "lr": 7.245225378628207e-06, "epoch": 5.238907849829351, "percentage": 74.84, "elapsed_time": "4:07:10", "remaining_time": "1:23:05"} +{"current_steps": 3075, "total_steps": 4102, "loss": 0.193, "lr": 7.17978105784993e-06, "epoch": 5.247440273037543, "percentage": 74.96, "elapsed_time": "4:07:30", "remaining_time": "1:22:39"} +{"current_steps": 3080, "total_steps": 4102, "loss": 0.1982, "lr": 7.114568928642815e-06, "epoch": 5.255972696245734, "percentage": 75.09, "elapsed_time": "4:07:55", "remaining_time": "1:22:16"} +{"current_steps": 3085, "total_steps": 4102, "loss": 0.2024, "lr": 7.049590172087058e-06, "epoch": 5.264505119453925, "percentage": 75.21, "elapsed_time": "4:08:17", "remaining_time": "1:21:51"} +{"current_steps": 3090, "total_steps": 4102, "loss": 0.1965, "lr": 6.984845965036174e-06, "epoch": 5.273037542662116, "percentage": 75.33, "elapsed_time": "4:08:34", "remaining_time": "1:21:24"} 
+{"current_steps": 3095, "total_steps": 4102, "loss": 0.1931, "lr": 6.920337480095654e-06, "epoch": 5.2815699658703075, "percentage": 75.45, "elapsed_time": "4:08:55", "remaining_time": "1:20:59"} +{"current_steps": 3100, "total_steps": 4102, "loss": 0.1989, "lr": 6.8560658856017255e-06, "epoch": 5.290102389078498, "percentage": 75.57, "elapsed_time": "4:09:16", "remaining_time": "1:20:34"} +{"current_steps": 3105, "total_steps": 4102, "loss": 0.1959, "lr": 6.79203234560025e-06, "epoch": 5.298634812286689, "percentage": 75.69, "elapsed_time": "4:09:38", "remaining_time": "1:20:09"} +{"current_steps": 3110, "total_steps": 4102, "loss": 0.198, "lr": 6.728238019825566e-06, "epoch": 5.30716723549488, "percentage": 75.82, "elapsed_time": "4:09:56", "remaining_time": "1:19:43"} +{"current_steps": 3115, "total_steps": 4102, "loss": 0.1938, "lr": 6.664684063679527e-06, "epoch": 5.315699658703072, "percentage": 75.94, "elapsed_time": "4:10:18", "remaining_time": "1:19:18"} +{"current_steps": 3120, "total_steps": 4102, "loss": 0.1874, "lr": 6.601371628210569e-06, "epoch": 5.324232081911263, "percentage": 76.06, "elapsed_time": "4:10:43", "remaining_time": "1:18:54"} +{"current_steps": 3125, "total_steps": 4102, "loss": 0.1976, "lr": 6.538301860092857e-06, "epoch": 5.332764505119454, "percentage": 76.18, "elapsed_time": "4:11:06", "remaining_time": "1:18:30"} +{"current_steps": 3130, "total_steps": 4102, "loss": 0.2037, "lr": 6.475475901605522e-06, "epoch": 5.341296928327645, "percentage": 76.3, "elapsed_time": "4:11:28", "remaining_time": "1:18:05"} +{"current_steps": 3135, "total_steps": 4102, "loss": 0.1955, "lr": 6.412894890611963e-06, "epoch": 5.349829351535837, "percentage": 76.43, "elapsed_time": "4:11:51", "remaining_time": "1:17:41"} +{"current_steps": 3140, "total_steps": 4102, "loss": 0.2042, "lr": 6.350559960539277e-06, "epoch": 5.3583617747440275, "percentage": 76.55, "elapsed_time": "4:12:15", "remaining_time": "1:17:17"} +{"current_steps": 3145, "total_steps": 
4102, "loss": 0.1985, "lr": 6.288472240357664e-06, "epoch": 5.3668941979522184, "percentage": 76.67, "elapsed_time": "4:12:43", "remaining_time": "1:16:54"} +{"current_steps": 3150, "total_steps": 4102, "loss": 0.2019, "lr": 6.226632854560028e-06, "epoch": 5.375426621160409, "percentage": 76.79, "elapsed_time": "4:13:03", "remaining_time": "1:16:28"} +{"current_steps": 3155, "total_steps": 4102, "loss": 0.1938, "lr": 6.165042923141622e-06, "epoch": 5.3839590443686, "percentage": 76.91, "elapsed_time": "4:13:24", "remaining_time": "1:16:03"} +{"current_steps": 3160, "total_steps": 4102, "loss": 0.2071, "lr": 6.103703561579717e-06, "epoch": 5.392491467576792, "percentage": 77.04, "elapsed_time": "4:13:44", "remaining_time": "1:15:38"} +{"current_steps": 3165, "total_steps": 4102, "loss": 0.1963, "lr": 6.042615880813434e-06, "epoch": 5.401023890784983, "percentage": 77.16, "elapsed_time": "4:14:10", "remaining_time": "1:15:14"} +{"current_steps": 3170, "total_steps": 4102, "loss": 0.1996, "lr": 5.981780987223609e-06, "epoch": 5.409556313993174, "percentage": 77.28, "elapsed_time": "4:14:30", "remaining_time": "1:14:49"} +{"current_steps": 3175, "total_steps": 4102, "loss": 0.2065, "lr": 5.92119998261276e-06, "epoch": 5.418088737201365, "percentage": 77.4, "elapsed_time": "4:14:53", "remaining_time": "1:14:25"} +{"current_steps": 3180, "total_steps": 4102, "loss": 0.2115, "lr": 5.860873964185136e-06, "epoch": 5.426621160409557, "percentage": 77.52, "elapsed_time": "4:15:13", "remaining_time": "1:14:00"} +{"current_steps": 3185, "total_steps": 4102, "loss": 0.1967, "lr": 5.800804024526825e-06, "epoch": 5.435153583617748, "percentage": 77.65, "elapsed_time": "4:15:32", "remaining_time": "1:13:34"} +{"current_steps": 3190, "total_steps": 4102, "loss": 0.1938, "lr": 5.740991251586014e-06, "epoch": 5.4436860068259385, "percentage": 77.77, "elapsed_time": "4:15:56", "remaining_time": "1:13:10"} +{"current_steps": 3195, "total_steps": 4102, "loss": 0.1887, "lr": 
5.681436728653209e-06, "epoch": 5.452218430034129, "percentage": 77.89, "elapsed_time": "4:16:20", "remaining_time": "1:12:46"} +{"current_steps": 3200, "total_steps": 4102, "loss": 0.1897, "lr": 5.622141534341676e-06, "epoch": 5.460750853242321, "percentage": 78.01, "elapsed_time": "4:16:38", "remaining_time": "1:12:20"} +{"current_steps": 3205, "total_steps": 4102, "loss": 0.1984, "lr": 5.563106742567908e-06, "epoch": 5.469283276450512, "percentage": 78.13, "elapsed_time": "4:18:00", "remaining_time": "1:12:12"} +{"current_steps": 3210, "total_steps": 4102, "loss": 0.1988, "lr": 5.504333422532128e-06, "epoch": 5.477815699658703, "percentage": 78.25, "elapsed_time": "4:18:24", "remaining_time": "1:11:48"} +{"current_steps": 3215, "total_steps": 4102, "loss": 0.2071, "lr": 5.445822638698948e-06, "epoch": 5.486348122866894, "percentage": 78.38, "elapsed_time": "4:18:42", "remaining_time": "1:11:22"} +{"current_steps": 3220, "total_steps": 4102, "loss": 0.205, "lr": 5.387575450778115e-06, "epoch": 5.494880546075085, "percentage": 78.5, "elapsed_time": "4:19:02", "remaining_time": "1:10:57"} +{"current_steps": 3225, "total_steps": 4102, "loss": 0.2033, "lr": 5.329592913705286e-06, "epoch": 5.503412969283277, "percentage": 78.62, "elapsed_time": "4:19:20", "remaining_time": "1:10:31"} +{"current_steps": 3230, "total_steps": 4102, "loss": 0.1967, "lr": 5.2718760776229265e-06, "epoch": 5.511945392491468, "percentage": 78.74, "elapsed_time": "4:19:44", "remaining_time": "1:10:07"} +{"current_steps": 3235, "total_steps": 4102, "loss": 0.1914, "lr": 5.2144259878613e-06, "epoch": 5.520477815699659, "percentage": 78.86, "elapsed_time": "4:20:10", "remaining_time": "1:09:43"} +{"current_steps": 3240, "total_steps": 4102, "loss": 0.2041, "lr": 5.157243684919535e-06, "epoch": 5.5290102389078495, "percentage": 78.99, "elapsed_time": "4:20:30", "remaining_time": "1:09:18"} +{"current_steps": 3245, "total_steps": 4102, "loss": 0.2073, "lr": 5.100330204446773e-06, "epoch": 
5.537542662116041, "percentage": 79.11, "elapsed_time": "4:20:49", "remaining_time": "1:08:53"} +{"current_steps": 3250, "total_steps": 4102, "loss": 0.1985, "lr": 5.043686577223412e-06, "epoch": 5.546075085324232, "percentage": 79.23, "elapsed_time": "4:21:14", "remaining_time": "1:08:29"} +{"current_steps": 3255, "total_steps": 4102, "loss": 0.1895, "lr": 4.98731382914246e-06, "epoch": 5.554607508532423, "percentage": 79.35, "elapsed_time": "4:21:40", "remaining_time": "1:08:05"} +{"current_steps": 3260, "total_steps": 4102, "loss": 0.1968, "lr": 4.93121298119092e-06, "epoch": 5.563139931740614, "percentage": 79.47, "elapsed_time": "4:22:03", "remaining_time": "1:07:41"} +{"current_steps": 3265, "total_steps": 4102, "loss": 0.19, "lr": 4.8753850494313e-06, "epoch": 5.571672354948806, "percentage": 79.6, "elapsed_time": "4:22:29", "remaining_time": "1:07:17"} +{"current_steps": 3270, "total_steps": 4102, "loss": 0.2046, "lr": 4.819831044983261e-06, "epoch": 5.580204778156997, "percentage": 79.72, "elapsed_time": "4:22:54", "remaining_time": "1:06:53"} +{"current_steps": 3275, "total_steps": 4102, "loss": 0.19, "lr": 4.764551974005243e-06, "epoch": 5.588737201365188, "percentage": 79.84, "elapsed_time": "4:23:14", "remaining_time": "1:06:28"} +{"current_steps": 3280, "total_steps": 4102, "loss": 0.2013, "lr": 4.709548837676279e-06, "epoch": 5.597269624573379, "percentage": 79.96, "elapsed_time": "4:23:35", "remaining_time": "1:06:03"} +{"current_steps": 3285, "total_steps": 4102, "loss": 0.2052, "lr": 4.654822632177829e-06, "epoch": 5.6058020477815695, "percentage": 80.08, "elapsed_time": "4:23:55", "remaining_time": "1:05:38"} +{"current_steps": 3290, "total_steps": 4102, "loss": 0.2046, "lr": 4.600374348675796e-06, "epoch": 5.614334470989761, "percentage": 80.2, "elapsed_time": "4:24:21", "remaining_time": "1:05:14"} +{"current_steps": 3295, "total_steps": 4102, "loss": 0.1928, "lr": 4.546204973302513e-06, "epoch": 5.622866894197952, "percentage": 80.33, 
"elapsed_time": "4:24:41", "remaining_time": "1:04:49"} +{"current_steps": 3300, "total_steps": 4102, "loss": 0.2076, "lr": 4.492315487138914e-06, "epoch": 5.631399317406143, "percentage": 80.45, "elapsed_time": "4:25:10", "remaining_time": "1:04:26"} +{"current_steps": 3305, "total_steps": 4102, "loss": 0.1949, "lr": 4.438706866196758e-06, "epoch": 5.639931740614334, "percentage": 80.57, "elapsed_time": "4:25:32", "remaining_time": "1:04:02"} +{"current_steps": 3310, "total_steps": 4102, "loss": 0.2045, "lr": 4.385380081400956e-06, "epoch": 5.648464163822526, "percentage": 80.69, "elapsed_time": "4:25:53", "remaining_time": "1:03:37"} +{"current_steps": 3315, "total_steps": 4102, "loss": 0.1979, "lr": 4.3323360985719856e-06, "epoch": 5.656996587030717, "percentage": 80.81, "elapsed_time": "4:26:14", "remaining_time": "1:03:12"} +{"current_steps": 3320, "total_steps": 4102, "loss": 0.2044, "lr": 4.279575878408384e-06, "epoch": 5.665529010238908, "percentage": 80.94, "elapsed_time": "4:26:37", "remaining_time": "1:02:48"} +{"current_steps": 3325, "total_steps": 4102, "loss": 0.1971, "lr": 4.227100376469384e-06, "epoch": 5.674061433447099, "percentage": 81.06, "elapsed_time": "4:27:04", "remaining_time": "1:02:24"} +{"current_steps": 3330, "total_steps": 4102, "loss": 0.1999, "lr": 4.1749105431575755e-06, "epoch": 5.6825938566552905, "percentage": 81.18, "elapsed_time": "4:27:24", "remaining_time": "1:01:59"} +{"current_steps": 3335, "total_steps": 4102, "loss": 0.198, "lr": 4.123007323701678e-06, "epoch": 5.691126279863481, "percentage": 81.3, "elapsed_time": "4:27:50", "remaining_time": "1:01:36"} +{"current_steps": 3340, "total_steps": 4102, "loss": 0.202, "lr": 4.071391658139483e-06, "epoch": 5.699658703071672, "percentage": 81.42, "elapsed_time": "4:28:14", "remaining_time": "1:01:11"} +{"current_steps": 3345, "total_steps": 4102, "loss": 0.2028, "lr": 4.020064481300765e-06, "epoch": 5.708191126279863, "percentage": 81.55, "elapsed_time": "4:28:34", 
"remaining_time": "1:00:46"} +{"current_steps": 3350, "total_steps": 4102, "loss": 0.1962, "lr": 3.96902672279039e-06, "epoch": 5.716723549488055, "percentage": 81.67, "elapsed_time": "4:28:57", "remaining_time": "1:00:22"} +{"current_steps": 3355, "total_steps": 4102, "loss": 0.1917, "lr": 3.918279306971453e-06, "epoch": 5.725255972696246, "percentage": 81.79, "elapsed_time": "4:29:25", "remaining_time": "0:59:59"} +{"current_steps": 3360, "total_steps": 4102, "loss": 0.2033, "lr": 3.8678231529485555e-06, "epoch": 5.733788395904437, "percentage": 81.91, "elapsed_time": "4:29:44", "remaining_time": "0:59:34"} +{"current_steps": 3365, "total_steps": 4102, "loss": 0.211, "lr": 3.817659174551156e-06, "epoch": 5.742320819112628, "percentage": 82.03, "elapsed_time": "4:30:06", "remaining_time": "0:59:09"} +{"current_steps": 3370, "total_steps": 4102, "loss": 0.2029, "lr": 3.7677882803170017e-06, "epoch": 5.750853242320819, "percentage": 82.16, "elapsed_time": "4:30:27", "remaining_time": "0:58:44"} +{"current_steps": 3375, "total_steps": 4102, "loss": 0.1982, "lr": 3.718211373475715e-06, "epoch": 5.7593856655290105, "percentage": 82.28, "elapsed_time": "4:30:48", "remaining_time": "0:58:19"} +{"current_steps": 3380, "total_steps": 4102, "loss": 0.1948, "lr": 3.668929351932373e-06, "epoch": 5.7679180887372015, "percentage": 82.4, "elapsed_time": "4:31:15", "remaining_time": "0:57:56"} +{"current_steps": 3385, "total_steps": 4102, "loss": 0.1949, "lr": 3.619943108251296e-06, "epoch": 5.776450511945392, "percentage": 82.52, "elapsed_time": "4:31:35", "remaining_time": "0:57:31"} +{"current_steps": 3390, "total_steps": 4102, "loss": 0.2009, "lr": 3.57125352963988e-06, "epoch": 5.784982935153583, "percentage": 82.64, "elapsed_time": "4:31:59", "remaining_time": "0:57:07"} +{"current_steps": 3395, "total_steps": 4102, "loss": 0.1937, "lr": 3.522861497932495e-06, "epoch": 5.793515358361775, "percentage": 82.76, "elapsed_time": "4:32:21", "remaining_time": "0:56:43"} 
+{"current_steps": 3400, "total_steps": 4102, "loss": 0.1919, "lr": 3.4747678895745264e-06, "epoch": 5.802047781569966, "percentage": 82.89, "elapsed_time": "4:32:41", "remaining_time": "0:56:18"} +{"current_steps": 3405, "total_steps": 4102, "loss": 0.2036, "lr": 3.4269735756065314e-06, "epoch": 5.810580204778157, "percentage": 83.01, "elapsed_time": "4:34:00", "remaining_time": "0:56:05"} +{"current_steps": 3410, "total_steps": 4102, "loss": 0.1977, "lr": 3.3794794216484217e-06, "epoch": 5.819112627986348, "percentage": 83.13, "elapsed_time": "4:34:19", "remaining_time": "0:55:40"} +{"current_steps": 3415, "total_steps": 4102, "loss": 0.1893, "lr": 3.3322862878838104e-06, "epoch": 5.827645051194539, "percentage": 83.25, "elapsed_time": "4:34:38", "remaining_time": "0:55:15"} +{"current_steps": 3420, "total_steps": 4102, "loss": 0.1953, "lr": 3.2853950290444226e-06, "epoch": 5.836177474402731, "percentage": 83.37, "elapsed_time": "4:35:01", "remaining_time": "0:54:50"} +{"current_steps": 3425, "total_steps": 4102, "loss": 0.1903, "lr": 3.238806494394622e-06, "epoch": 5.8447098976109215, "percentage": 83.5, "elapsed_time": "4:35:24", "remaining_time": "0:54:26"} +{"current_steps": 3430, "total_steps": 4102, "loss": 0.1835, "lr": 3.1925215277160217e-06, "epoch": 5.853242320819112, "percentage": 83.62, "elapsed_time": "4:35:50", "remaining_time": "0:54:02"} +{"current_steps": 3435, "total_steps": 4102, "loss": 0.2072, "lr": 3.146540967292211e-06, "epoch": 5.861774744027304, "percentage": 83.74, "elapsed_time": "4:36:13", "remaining_time": "0:53:38"} +{"current_steps": 3440, "total_steps": 4102, "loss": 0.2072, "lr": 3.1008656458935715e-06, "epoch": 5.870307167235495, "percentage": 83.86, "elapsed_time": "4:36:32", "remaining_time": "0:53:13"} +{"current_steps": 3445, "total_steps": 4102, "loss": 0.1987, "lr": 3.055496390762189e-06, "epoch": 5.878839590443686, "percentage": 83.98, "elapsed_time": "4:36:54", "remaining_time": "0:52:48"} +{"current_steps": 3450, 
"total_steps": 4102, "loss": 0.1913, "lr": 3.010434023596858e-06, "epoch": 5.887372013651877, "percentage": 84.11, "elapsed_time": "4:37:18", "remaining_time": "0:52:24"} +{"current_steps": 3455, "total_steps": 4102, "loss": 0.1991, "lr": 2.965679360538245e-06, "epoch": 5.895904436860068, "percentage": 84.23, "elapsed_time": "4:37:36", "remaining_time": "0:51:59"} +{"current_steps": 3460, "total_steps": 4102, "loss": 0.192, "lr": 2.9212332121540552e-06, "epoch": 5.90443686006826, "percentage": 84.35, "elapsed_time": "4:37:58", "remaining_time": "0:51:34"} +{"current_steps": 3465, "total_steps": 4102, "loss": 0.2013, "lr": 2.8770963834243826e-06, "epoch": 5.912969283276451, "percentage": 84.47, "elapsed_time": "4:38:17", "remaining_time": "0:51:09"} +{"current_steps": 3470, "total_steps": 4102, "loss": 0.204, "lr": 2.8332696737271194e-06, "epoch": 5.921501706484642, "percentage": 84.59, "elapsed_time": "4:38:39", "remaining_time": "0:50:45"} +{"current_steps": 3475, "total_steps": 4102, "loss": 0.1965, "lr": 2.78975387682348e-06, "epoch": 5.9300341296928325, "percentage": 84.71, "elapsed_time": "4:39:05", "remaining_time": "0:50:21"} +{"current_steps": 3480, "total_steps": 4102, "loss": 0.1876, "lr": 2.7465497808436326e-06, "epoch": 5.938566552901024, "percentage": 84.84, "elapsed_time": "4:39:26", "remaining_time": "0:49:56"} +{"current_steps": 3485, "total_steps": 4102, "loss": 0.2035, "lr": 2.703658168272405e-06, "epoch": 5.947098976109215, "percentage": 84.96, "elapsed_time": "4:39:48", "remaining_time": "0:49:32"} +{"current_steps": 3490, "total_steps": 4102, "loss": 0.195, "lr": 2.66107981593515e-06, "epoch": 5.955631399317406, "percentage": 85.08, "elapsed_time": "4:40:07", "remaining_time": "0:49:07"} +{"current_steps": 3495, "total_steps": 4102, "loss": 0.1996, "lr": 2.6188154949836262e-06, "epoch": 5.964163822525597, "percentage": 85.2, "elapsed_time": "4:40:28", "remaining_time": "0:48:42"} +{"current_steps": 3500, "total_steps": 4102, "loss": 0.2037, 
"lr": 2.576865970882072e-06, "epoch": 5.972696245733788, "percentage": 85.32, "elapsed_time": "4:40:47", "remaining_time": "0:48:17"} +{"current_steps": 3505, "total_steps": 4102, "loss": 0.1965, "lr": 2.5352320033933198e-06, "epoch": 5.98122866894198, "percentage": 85.45, "elapsed_time": "4:41:08", "remaining_time": "0:47:53"} +{"current_steps": 3510, "total_steps": 4102, "loss": 0.1958, "lr": 2.493914346565054e-06, "epoch": 5.989761092150171, "percentage": 85.57, "elapsed_time": "4:41:28", "remaining_time": "0:47:28"} +{"current_steps": 3515, "total_steps": 4102, "loss": 0.2043, "lr": 2.452913748716139e-06, "epoch": 5.998293515358362, "percentage": 85.69, "elapsed_time": "4:41:50", "remaining_time": "0:47:04"} +{"current_steps": 3520, "total_steps": 4102, "loss": 0.1882, "lr": 2.4122309524230557e-06, "epoch": 6.006825938566553, "percentage": 85.81, "elapsed_time": "4:42:11", "remaining_time": "0:46:39"} +{"current_steps": 3525, "total_steps": 4102, "loss": 0.1823, "lr": 2.371866694506495e-06, "epoch": 6.015358361774744, "percentage": 85.93, "elapsed_time": "4:42:30", "remaining_time": "0:46:14"} +{"current_steps": 3530, "total_steps": 4102, "loss": 0.1994, "lr": 2.3318217060179626e-06, "epoch": 6.023890784982935, "percentage": 86.06, "elapsed_time": "4:42:53", "remaining_time": "0:45:50"} +{"current_steps": 3535, "total_steps": 4102, "loss": 0.182, "lr": 2.2920967122265724e-06, "epoch": 6.032423208191126, "percentage": 86.18, "elapsed_time": "4:43:12", "remaining_time": "0:45:25"} +{"current_steps": 3540, "total_steps": 4102, "loss": 0.1896, "lr": 2.2526924326058963e-06, "epoch": 6.040955631399317, "percentage": 86.3, "elapsed_time": "4:43:32", "remaining_time": "0:45:00"} +{"current_steps": 3545, "total_steps": 4102, "loss": 0.192, "lr": 2.2136095808209366e-06, "epoch": 6.049488054607509, "percentage": 86.42, "elapsed_time": "4:43:54", "remaining_time": "0:44:36"} +{"current_steps": 3550, "total_steps": 4102, "loss": 0.1981, "lr": 2.1748488647152043e-06, 
"epoch": 6.0580204778157, "percentage": 86.54, "elapsed_time": "4:44:13", "remaining_time": "0:44:11"} +{"current_steps": 3555, "total_steps": 4102, "loss": 0.186, "lr": 2.1364109862978878e-06, "epoch": 6.066552901023891, "percentage": 86.67, "elapsed_time": "4:44:38", "remaining_time": "0:43:47"} +{"current_steps": 3560, "total_steps": 4102, "loss": 0.1871, "lr": 2.0982966417311655e-06, "epoch": 6.075085324232082, "percentage": 86.79, "elapsed_time": "4:44:59", "remaining_time": "0:43:23"} +{"current_steps": 3565, "total_steps": 4102, "loss": 0.1867, "lr": 2.0605065213175533e-06, "epoch": 6.083617747440273, "percentage": 86.91, "elapsed_time": "4:45:21", "remaining_time": "0:42:59"} +{"current_steps": 3570, "total_steps": 4102, "loss": 0.1934, "lr": 2.0230413094874414e-06, "epoch": 6.092150170648464, "percentage": 87.03, "elapsed_time": "4:45:47", "remaining_time": "0:42:35"} +{"current_steps": 3575, "total_steps": 4102, "loss": 0.1813, "lr": 1.9859016847866887e-06, "epoch": 6.100682593856655, "percentage": 87.15, "elapsed_time": "4:46:11", "remaining_time": "0:42:11"} +{"current_steps": 3580, "total_steps": 4102, "loss": 0.1871, "lr": 1.9490883198643207e-06, "epoch": 6.109215017064846, "percentage": 87.27, "elapsed_time": "4:46:39", "remaining_time": "0:41:47"} +{"current_steps": 3585, "total_steps": 4102, "loss": 0.183, "lr": 1.9126018814603565e-06, "epoch": 6.117747440273037, "percentage": 87.4, "elapsed_time": "4:46:58", "remaining_time": "0:41:23"} +{"current_steps": 3590, "total_steps": 4102, "loss": 0.1837, "lr": 1.8764430303937354e-06, "epoch": 6.126279863481229, "percentage": 87.52, "elapsed_time": "4:47:22", "remaining_time": "0:40:59"} +{"current_steps": 3595, "total_steps": 4102, "loss": 0.1989, "lr": 1.840612421550343e-06, "epoch": 6.13481228668942, "percentage": 87.64, "elapsed_time": "4:47:39", "remaining_time": "0:40:34"} +{"current_steps": 3600, "total_steps": 4102, "loss": 0.1846, "lr": 1.8051107038711535e-06, "epoch": 6.143344709897611, 
"percentage": 87.76, "elapsed_time": "4:47:57", "remaining_time": "0:40:09"} +{"current_steps": 3605, "total_steps": 4102, "loss": 0.175, "lr": 1.769938520340473e-06, "epoch": 6.151877133105802, "percentage": 87.88, "elapsed_time": "4:49:20", "remaining_time": "0:39:53"} +{"current_steps": 3610, "total_steps": 4102, "loss": 0.2001, "lr": 1.735096507974301e-06, "epoch": 6.160409556313994, "percentage": 88.01, "elapsed_time": "4:49:43", "remaining_time": "0:39:29"} +{"current_steps": 3615, "total_steps": 4102, "loss": 0.1924, "lr": 1.7005852978087833e-06, "epoch": 6.1689419795221845, "percentage": 88.13, "elapsed_time": "4:50:07", "remaining_time": "0:39:05"} +{"current_steps": 3620, "total_steps": 4102, "loss": 0.1938, "lr": 1.6664055148887937e-06, "epoch": 6.177474402730375, "percentage": 88.25, "elapsed_time": "4:50:28", "remaining_time": "0:38:40"} +{"current_steps": 3625, "total_steps": 4102, "loss": 0.199, "lr": 1.6325577782566093e-06, "epoch": 6.186006825938566, "percentage": 88.37, "elapsed_time": "4:50:53", "remaining_time": "0:38:16"} +{"current_steps": 3630, "total_steps": 4102, "loss": 0.1899, "lr": 1.5990427009407006e-06, "epoch": 6.194539249146757, "percentage": 88.49, "elapsed_time": "4:51:19", "remaining_time": "0:37:52"} +{"current_steps": 3635, "total_steps": 4102, "loss": 0.1926, "lr": 1.5658608899446059e-06, "epoch": 6.203071672354949, "percentage": 88.62, "elapsed_time": "4:51:40", "remaining_time": "0:37:28"} +{"current_steps": 3640, "total_steps": 4102, "loss": 0.1894, "lr": 1.5330129462359899e-06, "epoch": 6.21160409556314, "percentage": 88.74, "elapsed_time": "4:51:59", "remaining_time": "0:37:03"} +{"current_steps": 3645, "total_steps": 4102, "loss": 0.1942, "lr": 1.5004994647357007e-06, "epoch": 6.220136518771331, "percentage": 88.86, "elapsed_time": "4:52:16", "remaining_time": "0:36:38"} +{"current_steps": 3650, "total_steps": 4102, "loss": 0.1913, "lr": 1.4683210343070387e-06, "epoch": 6.228668941979522, "percentage": 88.98, 
"elapsed_time": "4:52:47", "remaining_time": "0:36:15"} +{"current_steps": 3655, "total_steps": 4102, "loss": 0.1949, "lr": 1.4364782377450625e-06, "epoch": 6.237201365187714, "percentage": 89.1, "elapsed_time": "4:53:06", "remaining_time": "0:35:50"} +{"current_steps": 3660, "total_steps": 4102, "loss": 0.1826, "lr": 1.404971651766054e-06, "epoch": 6.2457337883959045, "percentage": 89.22, "elapsed_time": "4:53:25", "remaining_time": "0:35:26"} +{"current_steps": 3665, "total_steps": 4102, "loss": 0.1903, "lr": 1.3738018469970626e-06, "epoch": 6.2542662116040955, "percentage": 89.35, "elapsed_time": "4:53:49", "remaining_time": "0:35:02"} +{"current_steps": 3670, "total_steps": 4102, "loss": 0.1981, "lr": 1.342969387965567e-06, "epoch": 6.262798634812286, "percentage": 89.47, "elapsed_time": "4:54:13", "remaining_time": "0:34:37"} +{"current_steps": 3675, "total_steps": 4102, "loss": 0.1942, "lr": 1.3124748330892722e-06, "epoch": 6.271331058020478, "percentage": 89.59, "elapsed_time": "4:54:39", "remaining_time": "0:34:14"} +{"current_steps": 3680, "total_steps": 4102, "loss": 0.1843, "lr": 1.2823187346659616e-06, "epoch": 6.279863481228669, "percentage": 89.71, "elapsed_time": "4:55:03", "remaining_time": "0:33:50"} +{"current_steps": 3685, "total_steps": 4102, "loss": 0.1835, "lr": 1.2525016388635193e-06, "epoch": 6.28839590443686, "percentage": 89.83, "elapsed_time": "4:55:30", "remaining_time": "0:33:26"} +{"current_steps": 3690, "total_steps": 4102, "loss": 0.1884, "lr": 1.2230240857100385e-06, "epoch": 6.296928327645051, "percentage": 89.96, "elapsed_time": "4:55:53", "remaining_time": "0:33:02"} +{"current_steps": 3695, "total_steps": 4102, "loss": 0.1868, "lr": 1.1938866090840273e-06, "epoch": 6.305460750853243, "percentage": 90.08, "elapsed_time": "4:56:18", "remaining_time": "0:32:38"} +{"current_steps": 3700, "total_steps": 4102, "loss": 0.1863, "lr": 1.1650897367047497e-06, "epoch": 6.313993174061434, "percentage": 90.2, "elapsed_time": "4:56:45", 
"remaining_time": "0:32:14"} +{"current_steps": 3705, "total_steps": 4102, "loss": 0.1967, "lr": 1.136633990122653e-06, "epoch": 6.322525597269625, "percentage": 90.32, "elapsed_time": "4:57:05", "remaining_time": "0:31:50"} +{"current_steps": 3710, "total_steps": 4102, "loss": 0.196, "lr": 1.1085198847099531e-06, "epoch": 6.3310580204778155, "percentage": 90.44, "elapsed_time": "4:57:25", "remaining_time": "0:31:25"} +{"current_steps": 3715, "total_steps": 4102, "loss": 0.1989, "lr": 1.0807479296512646e-06, "epoch": 6.339590443686006, "percentage": 90.57, "elapsed_time": "4:57:47", "remaining_time": "0:31:01"} +{"current_steps": 3720, "total_steps": 4102, "loss": 0.196, "lr": 1.0533186279344032e-06, "epoch": 6.348122866894198, "percentage": 90.69, "elapsed_time": "4:58:14", "remaining_time": "0:30:37"} +{"current_steps": 3725, "total_steps": 4102, "loss": 0.1945, "lr": 1.0262324763412601e-06, "epoch": 6.356655290102389, "percentage": 90.81, "elapsed_time": "4:58:37", "remaining_time": "0:30:13"} +{"current_steps": 3730, "total_steps": 4102, "loss": 0.1937, "lr": 9.99489965438818e-07, "epoch": 6.36518771331058, "percentage": 90.93, "elapsed_time": "4:58:57", "remaining_time": "0:29:48"} +{"current_steps": 3735, "total_steps": 4102, "loss": 0.1873, "lr": 9.730915795702555e-07, "epoch": 6.373720136518771, "percentage": 91.05, "elapsed_time": "4:59:18", "remaining_time": "0:29:24"} +{"current_steps": 3740, "total_steps": 4102, "loss": 0.1968, "lr": 9.470377968461841e-07, "epoch": 6.382252559726963, "percentage": 91.18, "elapsed_time": "4:59:38", "remaining_time": "0:29:00"} +{"current_steps": 3745, "total_steps": 4102, "loss": 0.1826, "lr": 9.213290891359849e-07, "epoch": 6.390784982935154, "percentage": 91.3, "elapsed_time": "5:00:02", "remaining_time": "0:28:36"} +{"current_steps": 3750, "total_steps": 4102, "loss": 0.1925, "lr": 8.959659220592564e-07, "epoch": 6.399317406143345, "percentage": 91.42, "elapsed_time": "5:00:22", "remaining_time": "0:28:11"} 
+{"current_steps": 3755, "total_steps": 4102, "loss": 0.1964, "lr": 8.709487549773854e-07, "epoch": 6.407849829351536, "percentage": 91.54, "elapsed_time": "5:00:42", "remaining_time": "0:27:47"} +{"current_steps": 3760, "total_steps": 4102, "loss": 0.1843, "lr": 8.462780409852423e-07, "epoch": 6.4163822525597265, "percentage": 91.66, "elapsed_time": "5:01:07", "remaining_time": "0:27:23"} +{"current_steps": 3765, "total_steps": 4102, "loss": 0.1879, "lr": 8.219542269029501e-07, "epoch": 6.424914675767918, "percentage": 91.78, "elapsed_time": "5:01:30", "remaining_time": "0:26:59"} +{"current_steps": 3770, "total_steps": 4102, "loss": 0.1799, "lr": 7.979777532678046e-07, "epoch": 6.433447098976109, "percentage": 91.91, "elapsed_time": "5:01:49", "remaining_time": "0:26:34"} +{"current_steps": 3775, "total_steps": 4102, "loss": 0.1895, "lr": 7.743490543262977e-07, "epoch": 6.4419795221843, "percentage": 92.03, "elapsed_time": "5:02:15", "remaining_time": "0:26:10"} +{"current_steps": 3780, "total_steps": 4102, "loss": 0.1794, "lr": 7.510685580262489e-07, "epoch": 6.450511945392491, "percentage": 92.15, "elapsed_time": "5:02:34", "remaining_time": "0:25:46"} +{"current_steps": 3785, "total_steps": 4102, "loss": 0.1891, "lr": 7.281366860090555e-07, "epoch": 6.459044368600683, "percentage": 92.27, "elapsed_time": "5:02:55", "remaining_time": "0:25:22"} +{"current_steps": 3790, "total_steps": 4102, "loss": 0.1862, "lr": 7.055538536020501e-07, "epoch": 6.467576791808874, "percentage": 92.39, "elapsed_time": "5:03:21", "remaining_time": "0:24:58"} +{"current_steps": 3795, "total_steps": 4102, "loss": 0.1861, "lr": 6.833204698109908e-07, "epoch": 6.476109215017065, "percentage": 92.52, "elapsed_time": "5:03:45", "remaining_time": "0:24:34"} +{"current_steps": 3800, "total_steps": 4102, "loss": 0.1944, "lr": 6.614369373126473e-07, "epoch": 6.484641638225256, "percentage": 92.64, "elapsed_time": "5:04:02", "remaining_time": "0:24:09"} +{"current_steps": 3805, "total_steps": 
4102, "loss": 0.1927, "lr": 6.399036524474978e-07, "epoch": 6.493174061433447, "percentage": 92.76, "elapsed_time": "5:05:27", "remaining_time": "0:23:50"} +{"current_steps": 3810, "total_steps": 4102, "loss": 0.1913, "lr": 6.187210052125747e-07, "epoch": 6.501706484641638, "percentage": 92.88, "elapsed_time": "5:05:49", "remaining_time": "0:23:26"} +{"current_steps": 3815, "total_steps": 4102, "loss": 0.1905, "lr": 5.978893792543772e-07, "epoch": 6.510238907849829, "percentage": 93.0, "elapsed_time": "5:06:10", "remaining_time": "0:23:01"} +{"current_steps": 3820, "total_steps": 4102, "loss": 0.1937, "lr": 5.774091518619296e-07, "epoch": 6.51877133105802, "percentage": 93.13, "elapsed_time": "5:06:29", "remaining_time": "0:22:37"} +{"current_steps": 3825, "total_steps": 4102, "loss": 0.1786, "lr": 5.572806939599606e-07, "epoch": 6.527303754266212, "percentage": 93.25, "elapsed_time": "5:06:50", "remaining_time": "0:22:13"} +{"current_steps": 3830, "total_steps": 4102, "loss": 0.1893, "lr": 5.375043701021731e-07, "epoch": 6.535836177474403, "percentage": 93.37, "elapsed_time": "5:07:08", "remaining_time": "0:21:48"} +{"current_steps": 3835, "total_steps": 4102, "loss": 0.186, "lr": 5.180805384646381e-07, "epoch": 6.544368600682594, "percentage": 93.49, "elapsed_time": "5:07:29", "remaining_time": "0:21:24"} +{"current_steps": 3840, "total_steps": 4102, "loss": 0.1954, "lr": 4.990095508393222e-07, "epoch": 6.552901023890785, "percentage": 93.61, "elapsed_time": "5:07:49", "remaining_time": "0:21:00"} +{"current_steps": 3845, "total_steps": 4102, "loss": 0.1934, "lr": 4.802917526277017e-07, "epoch": 6.561433447098976, "percentage": 93.73, "elapsed_time": "5:08:07", "remaining_time": "0:20:35"} +{"current_steps": 3850, "total_steps": 4102, "loss": 0.1889, "lr": 4.619274828345188e-07, "epoch": 6.5699658703071675, "percentage": 93.86, "elapsed_time": "5:08:28", "remaining_time": "0:20:11"} +{"current_steps": 3855, "total_steps": 4102, "loss": 0.1857, "lr": 
4.439170740616261e-07, "epoch": 6.578498293515358, "percentage": 93.98, "elapsed_time": "5:08:48", "remaining_time": "0:19:47"} +{"current_steps": 3860, "total_steps": 4102, "loss": 0.1863, "lr": 4.2626085250198733e-07, "epoch": 6.587030716723549, "percentage": 94.1, "elapsed_time": "5:09:07", "remaining_time": "0:19:22"} +{"current_steps": 3865, "total_steps": 4102, "loss": 0.1991, "lr": 4.089591379337443e-07, "epoch": 6.59556313993174, "percentage": 94.22, "elapsed_time": "5:09:32", "remaining_time": "0:18:58"} +{"current_steps": 3870, "total_steps": 4102, "loss": 0.1825, "lr": 3.920122437144325e-07, "epoch": 6.604095563139932, "percentage": 94.34, "elapsed_time": "5:09:53", "remaining_time": "0:18:34"} +{"current_steps": 3875, "total_steps": 4102, "loss": 0.1836, "lr": 3.7542047677532334e-07, "epoch": 6.612627986348123, "percentage": 94.47, "elapsed_time": "5:10:16", "remaining_time": "0:18:10"} +{"current_steps": 3880, "total_steps": 4102, "loss": 0.1892, "lr": 3.5918413761584006e-07, "epoch": 6.621160409556314, "percentage": 94.59, "elapsed_time": "5:10:43", "remaining_time": "0:17:46"} +{"current_steps": 3885, "total_steps": 4102, "loss": 0.188, "lr": 3.433035202981283e-07, "epoch": 6.629692832764505, "percentage": 94.71, "elapsed_time": "5:11:06", "remaining_time": "0:17:22"} +{"current_steps": 3890, "total_steps": 4102, "loss": 0.1925, "lr": 3.2777891244172965e-07, "epoch": 6.638225255972696, "percentage": 94.83, "elapsed_time": "5:11:36", "remaining_time": "0:16:58"} +{"current_steps": 3895, "total_steps": 4102, "loss": 0.2037, "lr": 3.1261059521837e-07, "epoch": 6.646757679180888, "percentage": 94.95, "elapsed_time": "5:12:00", "remaining_time": "0:16:34"} +{"current_steps": 3900, "total_steps": 4102, "loss": 0.183, "lr": 2.9779884334686816e-07, "epoch": 6.6552901023890785, "percentage": 95.08, "elapsed_time": "5:12:21", "remaining_time": "0:16:10"} +{"current_steps": 3905, "total_steps": 4102, "loss": 0.1946, "lr": 2.8334392508815976e-07, "epoch": 
6.663822525597269, "percentage": 95.2, "elapsed_time": "5:12:40", "remaining_time": "0:15:46"} +{"current_steps": 3910, "total_steps": 4102, "loss": 0.1951, "lr": 2.6924610224044354e-07, "epoch": 6.672354948805461, "percentage": 95.32, "elapsed_time": "5:13:01", "remaining_time": "0:15:22"} +{"current_steps": 3915, "total_steps": 4102, "loss": 0.1906, "lr": 2.5550563013442944e-07, "epoch": 6.680887372013652, "percentage": 95.44, "elapsed_time": "5:13:21", "remaining_time": "0:14:58"} +{"current_steps": 3920, "total_steps": 4102, "loss": 0.1911, "lr": 2.4212275762871994e-07, "epoch": 6.689419795221843, "percentage": 95.56, "elapsed_time": "5:13:46", "remaining_time": "0:14:34"} +{"current_steps": 3925, "total_steps": 4102, "loss": 0.1958, "lr": 2.2909772710531186e-07, "epoch": 6.697952218430034, "percentage": 95.69, "elapsed_time": "5:14:06", "remaining_time": "0:14:09"} +{"current_steps": 3930, "total_steps": 4102, "loss": 0.1855, "lr": 2.1643077446518834e-07, "epoch": 6.706484641638225, "percentage": 95.81, "elapsed_time": "5:14:24", "remaining_time": "0:13:45"} +{"current_steps": 3935, "total_steps": 4102, "loss": 0.1953, "lr": 2.0412212912406248e-07, "epoch": 6.715017064846417, "percentage": 95.93, "elapsed_time": "5:14:46", "remaining_time": "0:13:21"} +{"current_steps": 3940, "total_steps": 4102, "loss": 0.1827, "lr": 1.921720140082095e-07, "epoch": 6.723549488054608, "percentage": 96.05, "elapsed_time": "5:15:13", "remaining_time": "0:12:57"} +{"current_steps": 3945, "total_steps": 4102, "loss": 0.192, "lr": 1.8058064555044108e-07, "epoch": 6.7320819112627985, "percentage": 96.17, "elapsed_time": "5:15:32", "remaining_time": "0:12:33"} +{"current_steps": 3950, "total_steps": 4102, "loss": 0.1852, "lr": 1.6934823368617735e-07, "epoch": 6.7406143344709895, "percentage": 96.29, "elapsed_time": "5:15:53", "remaining_time": "0:12:09"} +{"current_steps": 3955, "total_steps": 4102, "loss": 0.1878, "lr": 1.5847498184965005e-07, "epoch": 6.749146757679181, 
"percentage": 96.42, "elapsed_time": "5:16:15", "remaining_time": "0:11:45"} +{"current_steps": 3960, "total_steps": 4102, "loss": 0.1825, "lr": 1.479610869702075e-07, "epoch": 6.757679180887372, "percentage": 96.54, "elapsed_time": "5:16:38", "remaining_time": "0:11:21"} +{"current_steps": 3965, "total_steps": 4102, "loss": 0.1966, "lr": 1.3780673946876433e-07, "epoch": 6.766211604095563, "percentage": 96.66, "elapsed_time": "5:16:59", "remaining_time": "0:10:57"} +{"current_steps": 3970, "total_steps": 4102, "loss": 0.1919, "lr": 1.2801212325433966e-07, "epoch": 6.774744027303754, "percentage": 96.78, "elapsed_time": "5:17:20", "remaining_time": "0:10:33"} +{"current_steps": 3975, "total_steps": 4102, "loss": 0.1888, "lr": 1.185774157207309e-07, "epoch": 6.783276450511945, "percentage": 96.9, "elapsed_time": "5:17:47", "remaining_time": "0:10:09"} +{"current_steps": 3980, "total_steps": 4102, "loss": 0.185, "lr": 1.0950278774330304e-07, "epoch": 6.791808873720137, "percentage": 97.03, "elapsed_time": "5:18:07", "remaining_time": "0:09:45"} +{"current_steps": 3985, "total_steps": 4102, "loss": 0.1896, "lr": 1.007884036758866e-07, "epoch": 6.800341296928328, "percentage": 97.15, "elapsed_time": "5:18:27", "remaining_time": "0:09:21"} +{"current_steps": 3990, "total_steps": 4102, "loss": 0.192, "lr": 9.2434421347809e-08, "epoch": 6.808873720136519, "percentage": 97.27, "elapsed_time": "5:18:54", "remaining_time": "0:08:57"} +{"current_steps": 3995, "total_steps": 4102, "loss": 0.1879, "lr": 8.444099206103229e-08, "epoch": 6.8174061433447095, "percentage": 97.39, "elapsed_time": "5:19:17", "remaining_time": "0:08:33"} +{"current_steps": 4000, "total_steps": 4102, "loss": 0.1933, "lr": 7.680826058741764e-08, "epoch": 6.825938566552901, "percentage": 97.51, "elapsed_time": "5:19:37", "remaining_time": "0:08:09"} +{"current_steps": 4005, "total_steps": 4102, "loss": 0.1877, "lr": 6.953636516609185e-08, "epoch": 6.834470989761092, "percentage": 97.64, "elapsed_time": 
"5:20:56", "remaining_time": "0:07:46"} +{"current_steps": 4010, "total_steps": 4102, "loss": 0.201, "lr": 6.262543750095384e-08, "epoch": 6.843003412969283, "percentage": 97.76, "elapsed_time": "5:21:19", "remaining_time": "0:07:22"} +{"current_steps": 4015, "total_steps": 4102, "loss": 0.1879, "lr": 5.6075602758285385e-08, "epoch": 6.851535836177474, "percentage": 97.88, "elapsed_time": "5:21:43", "remaining_time": "0:06:58"} +{"current_steps": 4020, "total_steps": 4102, "loss": 0.1785, "lr": 4.988697956449073e-08, "epoch": 6.860068259385666, "percentage": 98.0, "elapsed_time": "5:22:04", "remaining_time": "0:06:34"} +{"current_steps": 4025, "total_steps": 4102, "loss": 0.1932, "lr": 4.40596800039339e-08, "epoch": 6.868600682593857, "percentage": 98.12, "elapsed_time": "5:22:31", "remaining_time": "0:06:10"} +{"current_steps": 4030, "total_steps": 4102, "loss": 0.1806, "lr": 3.859380961692472e-08, "epoch": 6.877133105802048, "percentage": 98.24, "elapsed_time": "5:22:52", "remaining_time": "0:05:46"} +{"current_steps": 4035, "total_steps": 4102, "loss": 0.1913, "lr": 3.3489467397795904e-08, "epoch": 6.885665529010239, "percentage": 98.37, "elapsed_time": "5:23:14", "remaining_time": "0:05:22"} +{"current_steps": 4040, "total_steps": 4102, "loss": 0.1878, "lr": 2.8746745793113428e-08, "epoch": 6.8941979522184305, "percentage": 98.49, "elapsed_time": "5:23:32", "remaining_time": "0:04:57"} +{"current_steps": 4045, "total_steps": 4102, "loss": 0.202, "lr": 2.4365730700008917e-08, "epoch": 6.902730375426621, "percentage": 98.61, "elapsed_time": "5:23:54", "remaining_time": "0:04:33"} +{"current_steps": 4050, "total_steps": 4102, "loss": 0.1902, "lr": 2.0346501464609814e-08, "epoch": 6.911262798634812, "percentage": 98.73, "elapsed_time": "5:24:14", "remaining_time": "0:04:09"} +{"current_steps": 4055, "total_steps": 4102, "loss": 0.1881, "lr": 1.6689130880616076e-08, "epoch": 6.919795221843003, "percentage": 98.85, "elapsed_time": "5:24:37", "remaining_time": 
"0:03:45"} +{"current_steps": 4060, "total_steps": 4102, "loss": 0.1837, "lr": 1.339368518797679e-08, "epoch": 6.928327645051194, "percentage": 98.98, "elapsed_time": "5:24:59", "remaining_time": "0:03:21"} +{"current_steps": 4065, "total_steps": 4102, "loss": 0.1905, "lr": 1.0460224071684456e-08, "epoch": 6.936860068259386, "percentage": 99.1, "elapsed_time": "5:25:19", "remaining_time": "0:02:57"} +{"current_steps": 4070, "total_steps": 4102, "loss": 0.196, "lr": 7.888800660702523e-09, "epoch": 6.945392491467577, "percentage": 99.22, "elapsed_time": "5:25:42", "remaining_time": "0:02:33"} +{"current_steps": 4075, "total_steps": 4102, "loss": 0.187, "lr": 5.679461527003938e-09, "epoch": 6.953924914675768, "percentage": 99.34, "elapsed_time": "5:26:05", "remaining_time": "0:02:09"} +{"current_steps": 4080, "total_steps": 4102, "loss": 0.193, "lr": 3.8322466847162674e-09, "epoch": 6.962457337883959, "percentage": 99.46, "elapsed_time": "5:26:30", "remaining_time": "0:01:45"} +{"current_steps": 4085, "total_steps": 4102, "loss": 0.1887, "lr": 2.347189589408938e-09, "epoch": 6.9709897610921505, "percentage": 99.59, "elapsed_time": "5:26:53", "remaining_time": "0:01:21"} +{"current_steps": 4090, "total_steps": 4102, "loss": 0.1792, "lr": 1.2243171374826113e-09, "epoch": 6.979522184300341, "percentage": 99.71, "elapsed_time": "5:27:15", "remaining_time": "0:00:57"} +{"current_steps": 4095, "total_steps": 4102, "loss": 0.1844, "lr": 4.6364966568290817e-10, "epoch": 6.988054607508532, "percentage": 99.83, "elapsed_time": "5:27:36", "remaining_time": "0:00:33"} +{"current_steps": 4100, "total_steps": 4102, "loss": 0.1794, "lr": 6.520095073181409e-11, "epoch": 6.996587030716723, "percentage": 99.95, "elapsed_time": "5:27:59", "remaining_time": "0:00:09"} +{"current_steps": 4102, "total_steps": 4102, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "5:29:04", "remaining_time": "0:00:00"} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 
0000000..685ce0b --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0af9c4c35bc0c82e6ea9c3ab76fda48a2862fa13ee471c8861fb9e33f54fb4b9 +size 8593 diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..6c49fc6 --- /dev/null +++ b/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833