From ffc93dde84f4bcf8e58cc60a195bbc4cca2c0ceb Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Sat, 20 Jun 2026 17:15:30 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: baban/QwenTranslate_Bengali_English Source: Original Platform --- .gitattributes | 36 + README.md | 63 + chat_template.jinja | 54 + config.json | 66 + generation_config.json | 14 + model-00001-of-00002.safetensors | 3 + model-00002-of-00002.safetensors | 3 + model.safetensors.index.json | 442 +++++ special_tokens_map.json | 31 + tokenizer.json | 3 + tokenizer_config.json | 208 +++ trainer_log.jsonl | 2892 ++++++++++++++++++++++++++++++ 12 files changed, 3815 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 chat_template.jinja create mode 100644 config.json create mode 100644 generation_config.json create mode 100644 model-00001-of-00002.safetensors create mode 100644 model-00002-of-00002.safetensors create mode 100644 model.safetensors.index.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 trainer_log.jsonl diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..1d223c7 --- /dev/null +++ b/README.md @@ -0,0 +1,63 @@ +--- +library_name: transformers +license: other +base_model: Qwen/Qwen2.5-3B-Instruct +tags: +- llama-factory +- full +- generated_from_trainer +model-index: +- name: MT_Bengali_En + results: [] +--- + + + +# MT_Bengali_En + +This model is a fine-tuned version of [Qwen/Qwen2.5-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-3B-Instruct) on the MT_Bengali_En dataset. +It achieves the following results on the evaluation set: +- Loss: 1.0118 +- Num Input Tokens Seen: 6787789376 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 5e-05 +- train_batch_size: 8 +- eval_batch_size: 16 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 8 +- gradient_accumulation_steps: 16 +- total_train_batch_size: 1024 +- total_eval_batch_size: 128 +- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: inverse_sqrt +- num_epochs: 3.0 + +### Training results + + + +### Framework versions + +- Transformers 4.55.0 +- Pytorch 2.5.1+cu124 +- Datasets 3.6.0 +- Tokenizers 0.21.1 diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..bdf7919 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,54 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0]['role'] == 'system' %} + {{- messages[0]['content'] }} + {%- else %} + {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' }} + {%- endif %} + {{- "\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within XML tags:\n" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n\n\nFor each function call, return a json object with function name and arguments within XML tags:\n\n{\"name\": , \"arguments\": }\n<|im_end|>\n" }} +{%- else %} + {%- if messages[0]['role'] == 'system' %} + {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }} + {%- else %} + {{- '<|im_start|>system\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- for message in messages %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) or (message.role == "assistant" and not message.tool_calls) %} + {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {{- '<|im_start|>' + message.role }} + {%- if message.content %} + {{- '\n' + message.content }} + {%- endif %} + {%- for tool_call in message.tool_calls %} + {%- if tool_call.function is defined %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '\n\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {{- tool_call.arguments | tojson }} + {{- '}\n' }} + {%- endfor %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n\n' }} + {{- message.content }} + {{- '\n' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} +{%- endif %} diff --git a/config.json b/config.json new file mode 100644 index 0000000..a302053 --- /dev/null +++ b/config.json @@ -0,0 +1,66 @@ +{ + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "bos_token_id": 151643, + "eos_token_id": 151645, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 11008, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 32768, + "max_window_layers": 70, + "model_type": "qwen2", + "num_attention_heads": 16, + "num_hidden_layers": 36, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": null, + "tie_word_embeddings": true, + "torch_dtype": "bfloat16", + "transformers_version": "4.55.0", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..0147d6e --- /dev/null +++ b/generation_config.json @@ -0,0 +1,14 @@ +{ + "bos_token_id": 151643, + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "repetition_penalty": 1.05, + "temperature": 0.7, + "top_k": 20, + "top_p": 0.8, + "transformers_version": "4.55.0" +} diff --git a/model-00001-of-00002.safetensors b/model-00001-of-00002.safetensors new file mode 100644 index 0000000..aa97786 --- /dev/null +++ b/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaffbeccc5b127de9f231a730305d904f9099338409a9d22b8165a4f33ba4609 +size 4957560304 diff --git a/model-00002-of-00002.safetensors b/model-00002-of-00002.safetensors new file mode 100644 index 0000000..c2c1a70 --- /dev/null +++ b/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e476971e0680a1dc746fbc29497e406e5b7cb1d2242859cbf50a35cd16b79bd +size 1214366696 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..d3896a7 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,442 @@ +{ + "metadata": { + "total_parameters": 3085938688, + "total_size": 6171877376 + }, + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-00002.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.29.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.30.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.norm.weight": "model-00002-of-00002.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..ac23c0a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..51ebb3b --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..fb44f02 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,208 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 131072, + "pad_token": "<|endoftext|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..1f4c9b6 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,2892 @@ +{"current_steps": 10, "total_steps": 25209, "loss": 2.1404, "lr": 4.9977515176118345e-05, "epoch": 0.001190060023652443, "percentage": 0.04, "elapsed_time": "0:02:20", "remaining_time": "4 days, 2:08:21", "throughput": 19308.9, "total_tokens": 2707200} +{"current_steps": 20, "total_steps": 25209, "loss": 1.6354, "lr": 4.9952567580506e-05, "epoch": 0.002380120047304886, "percentage": 0.08, "elapsed_time": "0:04:38", "remaining_time": "4 days, 1:20:52", "throughput": 19461.84, "total_tokens": 5415424} +{"current_steps": 30, "total_steps": 25209, "loss": 1.5277, "lr": 4.992765730738634e-05, "epoch": 0.003570180070957329, "percentage": 0.12, "elapsed_time": "0:06:40", "remaining_time": "3 days, 21:27:01", "throughput": 20253.51, "total_tokens": 8118336} +{"current_steps": 40, "total_steps": 25209, "loss": 1.4936, "lr": 4.9902784263792476e-05, "epoch": 0.004760240094609772, "percentage": 0.16, "elapsed_time": "0:09:22", "remaining_time": "4 days, 2:14:06", "throughput": 19103.94, "total_tokens": 10737088} +{"current_steps": 50, "total_steps": 25209, "loss": 1.4672, "lr": 4.987794835708133e-05, "epoch": 0.005950300118262215, "percentage": 0.2, "elapsed_time": "0:12:54", "remaining_time": "4 days, 12:15:05", "throughput": 17426.78, "total_tokens": 13496768} +{"current_steps": 60, "total_steps": 25209, "loss": 1.4594, "lr": 4.985314949493234e-05, "epoch": 0.007140360141914658, "percentage": 0.24, "elapsed_time": "0:16:52", "remaining_time": "4 days, 21:53:06", "throughput": 15966.6, "total_tokens": 16166080} +{"current_steps": 70, "total_steps": 25209, "loss": 1.4229, "lr": 4.982838758534584e-05, "epoch": 0.008330420165567102, "percentage": 0.28, "elapsed_time": "0:20:59", "remaining_time": "5 days, 5:36:53", "throughput": 14962.62, "total_tokens": 18840896} +{"current_steps": 80, "total_steps": 25209, "loss": 1.4298, "lr": 4.980366253664179e-05, "epoch": 0.009520480189219544, "percentage": 0.32, "elapsed_time": "0:24:45", "remaining_time": "5 days, 9:38:29", "throughput": 14515.31, "total_tokens": 21566912} +{"current_steps": 90, "total_steps": 25209, "loss": 1.4151, "lr": 4.977897425745825e-05, "epoch": 0.010710540212871987, "percentage": 0.36, "elapsed_time": "0:27:33", "remaining_time": "5 days, 8:09:49", "throughput": 14697.35, "total_tokens": 24296704} +{"current_steps": 100, "total_steps": 25209, "loss": 1.4092, "lr": 4.975432265674997e-05, "epoch": 0.01190060023652443, "percentage": 0.4, "elapsed_time": "0:30:03", "remaining_time": "5 days, 5:47:36", "throughput": 14961.03, "total_tokens": 26983168} +{"current_steps": 110, "total_steps": 25209, "loss": 1.409, "lr": 4.972970764378705e-05, "epoch": 0.013090660260176872, "percentage": 0.44, "elapsed_time": "0:32:44", "remaining_time": "5 days, 4:29:14", "throughput": 15120.94, "total_tokens": 29699072} +{"current_steps": 120, "total_steps": 25209, "loss": 1.3884, "lr": 4.970512912815344e-05, "epoch": 0.014280720283829316, "percentage": 0.48, "elapsed_time": "0:36:08", "remaining_time": "5 days, 5:55:43", "throughput": 14953.58, "total_tokens": 32424320} +{"current_steps": 130, "total_steps": 25209, "loss": 1.389, "lr": 4.968058701974564e-05, "epoch": 0.015470780307481759, "percentage": 0.52, "elapsed_time": "0:38:56", "remaining_time": "5 days, 5:12:24", "throughput": 15025.91, "total_tokens": 35107904} +{"current_steps": 140, "total_steps": 25209, "loss": 1.3676, "lr": 4.96560812287712e-05, "epoch": 0.016660840331134203, "percentage": 0.56, "elapsed_time": "0:42:08", "remaining_time": "5 days, 5:46:05", "throughput": 14947.87, "total_tokens": 37795840} +{"current_steps": 150, "total_steps": 25209, "loss": 1.3653, "lr": 4.963161166574748e-05, "epoch": 0.017850900354786644, "percentage": 0.6, "elapsed_time": "0:44:41", "remaining_time": "5 days, 4:25:04", "throughput": 15114.21, "total_tokens": 40522688} +{"current_steps": 160, "total_steps": 25209, "loss": 1.3442, "lr": 4.960717824150013e-05, "epoch": 0.019040960378439088, "percentage": 0.63, "elapsed_time": "0:46:56", "remaining_time": "5 days, 2:30:16", "throughput": 15324.2, "total_tokens": 43168064} +{"current_steps": 170, "total_steps": 25209, "loss": 1.3558, "lr": 4.9582780867161893e-05, "epoch": 0.02023102040209153, "percentage": 0.67, "elapsed_time": "0:49:03", "remaining_time": "5 days, 0:25:27", "throughput": 15571.52, "total_tokens": 45833088} +{"current_steps": 180, "total_steps": 25209, "loss": 1.3478, "lr": 4.955841945417105e-05, "epoch": 0.021421080425743973, "percentage": 0.71, "elapsed_time": "0:50:59", "remaining_time": "4 days, 22:10:29", "throughput": 15863.86, "total_tokens": 48536192} +{"current_steps": 190, "total_steps": 25209, "loss": 1.3666, "lr": 4.953409391427024e-05, "epoch": 0.022611140449396418, "percentage": 0.75, "elapsed_time": "0:52:50", "remaining_time": "4 days, 19:59:07", "throughput": 16148.8, "total_tokens": 51207040} +{"current_steps": 200, "total_steps": 25209, "loss": 1.3498, "lr": 4.950980415950502e-05, "epoch": 0.02380120047304886, "percentage": 0.79, "elapsed_time": "0:55:09", "remaining_time": "4 days, 18:57:56", "throughput": 16296.52, "total_tokens": 53938624} +{"current_steps": 210, "total_steps": 25209, "loss": 1.3402, "lr": 4.9485550102222575e-05, "epoch": 0.024991260496701303, "percentage": 0.83, "elapsed_time": "0:57:08", "remaining_time": "4 days, 17:22:01", "throughput": 16512.51, "total_tokens": 56610816} +{"current_steps": 220, "total_steps": 25209, "loss": 1.3426, "lr": 4.946133165507037e-05, "epoch": 0.026181320520353744, "percentage": 0.87, "elapsed_time": "0:59:00", "remaining_time": "4 days, 15:42:00", "throughput": 16748.13, "total_tokens": 59291968} +{"current_steps": 230, "total_steps": 25209, "loss": 1.3299, "lr": 4.943714873099483e-05, "epoch": 0.027371380544006188, "percentage": 0.91, "elapsed_time": "1:01:28", "remaining_time": "4 days, 15:17:20", "throughput": 16795.43, "total_tokens": 61958208} +{"current_steps": 240, "total_steps": 25209, "loss": 1.3235, "lr": 4.9413001243240024e-05, "epoch": 0.028561440567658632, "percentage": 0.95, "elapsed_time": "1:03:24", "remaining_time": "4 days, 13:56:13", "throughput": 16985.06, "total_tokens": 64613568} +{"current_steps": 250, "total_steps": 25209, "loss": 1.3247, "lr": 4.938888910534637e-05, "epoch": 0.029751500591311073, "percentage": 0.99, "elapsed_time": "1:05:21", "remaining_time": "4 days, 12:45:22", "throughput": 17159.33, "total_tokens": 67293056} +{"current_steps": 260, "total_steps": 25209, "loss": 1.332, "lr": 4.936481223114932e-05, "epoch": 0.030941560614963518, "percentage": 1.03, "elapsed_time": "1:07:07", "remaining_time": "4 days, 11:20:42", "throughput": 17364.75, "total_tokens": 69931584} +{"current_steps": 270, "total_steps": 25209, "loss": 1.3217, "lr": 4.934077053477808e-05, "epoch": 0.03213162063861596, "percentage": 1.07, "elapsed_time": "1:09:29", "remaining_time": "4 days, 10:59:09", "throughput": 17425.07, "total_tokens": 72658880} +{"current_steps": 280, "total_steps": 25209, "loss": 1.3219, "lr": 4.931676393065431e-05, "epoch": 0.033321680662268406, "percentage": 1.11, "elapsed_time": "1:11:29", "remaining_time": "4 days, 10:04:28", "throughput": 17566.63, "total_tokens": 75345216} +{"current_steps": 290, "total_steps": 25209, "loss": 1.3066, "lr": 4.929279233349088e-05, "epoch": 0.03451174068592085, "percentage": 1.15, "elapsed_time": "1:13:10", "remaining_time": "4 days, 8:47:02", "throughput": 17770.78, "total_tokens": 78013824} +{"current_steps": 300, "total_steps": 25209, "loss": 1.3024, "lr": 4.926885565829051e-05, "epoch": 0.03570180070957329, "percentage": 1.19, "elapsed_time": "1:14:59", "remaining_time": "4 days, 7:46:30", "throughput": 17934.03, "total_tokens": 80693568} +{"current_steps": 310, "total_steps": 25209, "loss": 1.3134, "lr": 4.924495382034461e-05, "epoch": 0.03689186073322573, "percentage": 1.23, "elapsed_time": "1:16:41", "remaining_time": "4 days, 6:40:12", "throughput": 18111.98, "total_tokens": 83347456} +{"current_steps": 320, "total_steps": 25209, "loss": 1.3147, "lr": 4.9221086735231975e-05, "epoch": 0.038081920756878176, "percentage": 1.27, "elapsed_time": "1:18:20", "remaining_time": "4 days, 5:33:06", "throughput": 18298.15, "total_tokens": 86008320} +{"current_steps": 330, "total_steps": 25209, "loss": 1.3037, "lr": 4.919725431881751e-05, "epoch": 0.03927198078053062, "percentage": 1.31, "elapsed_time": "1:20:03", "remaining_time": "4 days, 4:35:43", "throughput": 18468.48, "total_tokens": 88714048} +{"current_steps": 340, "total_steps": 25209, "loss": 1.3147, "lr": 4.917345648725101e-05, "epoch": 0.04046204080418306, "percentage": 1.35, "elapsed_time": "1:21:54", "remaining_time": "4 days, 3:51:32", "throughput": 18596.3, "total_tokens": 91398144} +{"current_steps": 350, "total_steps": 25209, "loss": 1.3002, "lr": 4.914969315696596e-05, "epoch": 0.041652100827835506, "percentage": 1.39, "elapsed_time": "1:23:40", "remaining_time": "4 days, 3:02:39", "throughput": 18742.17, "total_tokens": 94088512} +{"current_steps": 360, "total_steps": 25209, "loss": 1.2967, "lr": 4.912596424467818e-05, "epoch": 0.04284216085148795, "percentage": 1.43, "elapsed_time": "1:25:20", "remaining_time": "4 days, 2:10:13", "throughput": 18888.14, "total_tokens": 96708736} +{"current_steps": 370, "total_steps": 25209, "loss": 1.2946, "lr": 4.910226966738475e-05, "epoch": 0.04403222087514039, "percentage": 1.47, "elapsed_time": "1:27:12", "remaining_time": "4 days, 1:34:39", "throughput": 18988.97, "total_tokens": 99362240} +{"current_steps": 380, "total_steps": 25209, "loss": 1.2795, "lr": 4.9078609342362666e-05, "epoch": 0.045222280898792835, "percentage": 1.51, "elapsed_time": "1:29:24", "remaining_time": "4 days, 1:21:42", "throughput": 19014.46, "total_tokens": 101999872} +{"current_steps": 390, "total_steps": 25209, "loss": 1.2741, "lr": 4.905498318716775e-05, "epoch": 0.046412340922445276, "percentage": 1.55, "elapsed_time": "1:31:20", "remaining_time": "4 days, 0:53:14", "throughput": 19102.93, "total_tokens": 104700800} +{"current_steps": 400, "total_steps": 25209, "loss": 1.2832, "lr": 4.9031391119633295e-05, "epoch": 0.04760240094609772, "percentage": 1.59, "elapsed_time": "1:33:10", "remaining_time": "4 days, 0:18:35", "throughput": 19213.12, "total_tokens": 107404288} +{"current_steps": 410, "total_steps": 25209, "loss": 1.2827, "lr": 4.9007833057869e-05, "epoch": 0.048792460969750165, "percentage": 1.63, "elapsed_time": "1:35:21", "remaining_time": "4 days, 0:07:43", "throughput": 19250.71, "total_tokens": 110141888} +{"current_steps": 420, "total_steps": 25209, "loss": 1.2848, "lr": 4.898430892025967e-05, "epoch": 0.049982520993402606, "percentage": 1.67, "elapsed_time": "1:37:12", "remaining_time": "3 days, 23:37:40", "throughput": 19336.05, "total_tokens": 112783488} +{"current_steps": 430, "total_steps": 25209, "loss": 1.2701, "lr": 4.896081862546415e-05, "epoch": 0.05117258101705505, "percentage": 1.71, "elapsed_time": "1:38:59", "remaining_time": "3 days, 23:04:36", "throughput": 19438.58, "total_tokens": 115458560} +{"current_steps": 440, "total_steps": 25209, "loss": 1.2673, "lr": 4.8937362092414e-05, "epoch": 0.05236264104070749, "percentage": 1.75, "elapsed_time": "1:40:47", "remaining_time": "3 days, 22:34:00", "throughput": 19546.08, "total_tokens": 118207424} +{"current_steps": 450, "total_steps": 25209, "loss": 1.2733, "lr": 4.891393924031244e-05, "epoch": 0.053552701064359935, "percentage": 1.79, "elapsed_time": "1:42:28", "remaining_time": "3 days, 21:57:54", "throughput": 19659.25, "total_tokens": 120869376} +{"current_steps": 460, "total_steps": 25209, "loss": 1.2754, "lr": 4.8890549988633095e-05, "epoch": 0.054742761088012376, "percentage": 1.82, "elapsed_time": "1:44:14", "remaining_time": "3 days, 21:28:31", "throughput": 19766.82, "total_tokens": 123633792} +{"current_steps": 470, "total_steps": 25209, "loss": 1.2828, "lr": 4.8867194257118907e-05, "epoch": 0.05593282111166482, "percentage": 1.86, "elapsed_time": "1:46:01", "remaining_time": "3 days, 21:00:46", "throughput": 19863.33, "total_tokens": 126360960} +{"current_steps": 480, "total_steps": 25209, "loss": 1.2854, "lr": 4.884387196578093e-05, "epoch": 0.057122881135317265, "percentage": 1.9, "elapsed_time": "1:47:49", "remaining_time": "3 days, 20:34:49", "throughput": 19955.96, "total_tokens": 129100928} +{"current_steps": 490, "total_steps": 25209, "loss": 1.2637, "lr": 4.882058303489718e-05, "epoch": 0.058312941158969706, "percentage": 1.94, "elapsed_time": "1:49:31", "remaining_time": "3 days, 20:05:04", "throughput": 20048.67, "total_tokens": 131747008} +{"current_steps": 500, "total_steps": 25209, "loss": 1.2833, "lr": 4.8797327385011496e-05, "epoch": 0.059503001182622146, "percentage": 1.98, "elapsed_time": "1:51:13", "remaining_time": "3 days, 19:36:22", "throughput": 20143.62, "total_tokens": 134425024} +{"current_steps": 510, "total_steps": 25209, "loss": 1.258, "lr": 4.8774104936932425e-05, "epoch": 0.060693061206274594, "percentage": 2.02, "elapsed_time": "1:52:58", "remaining_time": "3 days, 19:11:14", "throughput": 20227.73, "total_tokens": 137111872} +{"current_steps": 520, "total_steps": 25209, "loss": 1.2528, "lr": 4.8750915611732076e-05, "epoch": 0.061883121229927035, "percentage": 2.06, "elapsed_time": "1:54:58", "remaining_time": "3 days, 18:59:01", "throughput": 20260.13, "total_tokens": 139768192} +{"current_steps": 530, "total_steps": 25209, "loss": 1.2644, "lr": 4.8727759330744986e-05, "epoch": 0.06307318125357948, "percentage": 2.1, "elapsed_time": "1:56:39", "remaining_time": "3 days, 18:32:14", "throughput": 20353.2, "total_tokens": 142466112} +{"current_steps": 540, "total_steps": 25209, "loss": 1.2447, "lr": 4.870463601556696e-05, "epoch": 0.06426324127723192, "percentage": 2.14, "elapsed_time": "1:58:26", "remaining_time": "3 days, 18:10:54", "throughput": 20428.13, "total_tokens": 145175168} +{"current_steps": 550, "total_steps": 25209, "loss": 1.2552, "lr": 4.8681545588054075e-05, "epoch": 0.06545330130088436, "percentage": 2.18, "elapsed_time": "2:00:11", "remaining_time": "3 days, 17:48:35", "throughput": 20507.06, "total_tokens": 147882752} +{"current_steps": 560, "total_steps": 25209, "loss": 1.2636, "lr": 4.8658487970321404e-05, "epoch": 0.06664336132453681, "percentage": 2.22, "elapsed_time": "2:02:25", "remaining_time": "3 days, 17:48:29", "throughput": 20504.38, "total_tokens": 150609792} +{"current_steps": 570, "total_steps": 25209, "loss": 1.2541, "lr": 4.863546308474209e-05, "epoch": 0.06783342134818925, "percentage": 2.26, "elapsed_time": "2:04:22", "remaining_time": "3 days, 17:35:57", "throughput": 20539.1, "total_tokens": 153264064} +{"current_steps": 580, "total_steps": 25209, "loss": 1.2615, "lr": 4.86124708539461e-05, "epoch": 0.0690234813718417, "percentage": 2.3, "elapsed_time": "2:06:35", "remaining_time": "3 days, 17:35:39", "throughput": 20529.87, "total_tokens": 155937408} +{"current_steps": 590, "total_steps": 25209, "loss": 1.2394, "lr": 4.8589511200819216e-05, "epoch": 0.07021354139549414, "percentage": 2.34, "elapsed_time": "2:08:32", "remaining_time": "3 days, 17:23:26", "throughput": 20580.36, "total_tokens": 158719296} +{"current_steps": 600, "total_steps": 25209, "loss": 1.2519, "lr": 4.8566584048501926e-05, "epoch": 0.07140360141914658, "percentage": 2.38, "elapsed_time": "2:10:31", "remaining_time": "3 days, 17:13:27", "throughput": 20609.17, "total_tokens": 161399808} +{"current_steps": 610, "total_steps": 25209, "loss": 1.2452, "lr": 4.854368932038835e-05, "epoch": 0.07259366144279902, "percentage": 2.42, "elapsed_time": "2:12:21", "remaining_time": "3 days, 16:57:17", "throughput": 20659.04, "total_tokens": 164056896} +{"current_steps": 620, "total_steps": 25209, "loss": 1.2544, "lr": 4.8520826940125144e-05, "epoch": 0.07378372146645146, "percentage": 2.46, "elapsed_time": "2:14:04", "remaining_time": "3 days, 16:37:35", "throughput": 20725.82, "total_tokens": 166736000} +{"current_steps": 630, "total_steps": 25209, "loss": 1.257, "lr": 4.849799683161046e-05, "epoch": 0.0749737814901039, "percentage": 2.5, "elapsed_time": "2:15:48", "remaining_time": "3 days, 16:18:13", "throughput": 20792.51, "total_tokens": 169419904} +{"current_steps": 640, "total_steps": 25209, "loss": 1.2523, "lr": 4.8475198918992835e-05, "epoch": 0.07616384151375635, "percentage": 2.54, "elapsed_time": "2:17:29", "remaining_time": "3 days, 15:57:52", "throughput": 20864.06, "total_tokens": 172108288} +{"current_steps": 650, "total_steps": 25209, "loss": 1.2509, "lr": 4.845243312667023e-05, "epoch": 0.07735390153740879, "percentage": 2.58, "elapsed_time": "2:19:11", "remaining_time": "3 days, 15:39:11", "throughput": 20934.45, "total_tokens": 174837248} +{"current_steps": 660, "total_steps": 25209, "loss": 1.2281, "lr": 4.842969937928884e-05, "epoch": 0.07854396156106123, "percentage": 2.62, "elapsed_time": "2:21:24", "remaining_time": "3 days, 15:40:03", "throughput": 20919.13, "total_tokens": 177498816} +{"current_steps": 670, "total_steps": 25209, "loss": 1.2531, "lr": 4.840699760174217e-05, "epoch": 0.07973402158471368, "percentage": 2.66, "elapsed_time": "2:23:26", "remaining_time": "3 days, 15:33:28", "throughput": 20938.06, "total_tokens": 180198912} +{"current_steps": 680, "total_steps": 25209, "loss": 1.2404, "lr": 4.8384327719169906e-05, "epoch": 0.08092408160836612, "percentage": 2.7, "elapsed_time": "2:25:17", "remaining_time": "3 days, 15:21:07", "throughput": 20977.8, "total_tokens": 182879232} +{"current_steps": 690, "total_steps": 25209, "loss": 1.2403, "lr": 4.836168965695694e-05, "epoch": 0.08211414163201856, "percentage": 2.74, "elapsed_time": "2:27:04", "remaining_time": "3 days, 15:06:33", "throughput": 21031.45, "total_tokens": 185601920} +{"current_steps": 700, "total_steps": 25209, "loss": 1.2448, "lr": 4.8339083340732304e-05, "epoch": 0.08330420165567101, "percentage": 2.78, "elapsed_time": "2:29:13", "remaining_time": "3 days, 15:04:47", "throughput": 21037.97, "total_tokens": 188363584} +{"current_steps": 710, "total_steps": 25209, "loss": 1.2433, "lr": 4.8316508696368154e-05, "epoch": 0.08449426167932345, "percentage": 2.82, "elapsed_time": "2:31:03", "remaining_time": "3 days, 14:52:35", "throughput": 21075.23, "total_tokens": 191023552} +{"current_steps": 720, "total_steps": 25209, "loss": 1.2402, "lr": 4.8293965649978714e-05, "epoch": 0.0856843217029759, "percentage": 2.86, "elapsed_time": "2:32:48", "remaining_time": "3 days, 14:37:20", "throughput": 21127.84, "total_tokens": 193708672} +{"current_steps": 730, "total_steps": 25209, "loss": 1.2321, "lr": 4.8271454127919364e-05, "epoch": 0.08687438172662834, "percentage": 2.9, "elapsed_time": "2:34:34", "remaining_time": "3 days, 14:23:04", "throughput": 21175.98, "total_tokens": 196386176} +{"current_steps": 740, "total_steps": 25209, "loss": 1.2304, "lr": 4.824897405678549e-05, "epoch": 0.08806444175028078, "percentage": 2.94, "elapsed_time": "2:36:39", "remaining_time": "3 days, 14:20:01", "throughput": 21185.5, "total_tokens": 199130048} +{"current_steps": 750, "total_steps": 25209, "loss": 1.2402, "lr": 4.8226525363411576e-05, "epoch": 0.08925450177393322, "percentage": 2.98, "elapsed_time": "2:39:00", "remaining_time": "3 days, 14:25:48", "throughput": 21155.11, "total_tokens": 201839552} +{"current_steps": 760, "total_steps": 25209, "loss": 1.2387, "lr": 4.820410797487017e-05, "epoch": 0.09044456179758567, "percentage": 3.01, "elapsed_time": "2:41:07", "remaining_time": "3 days, 14:23:25", "throughput": 21153.71, "total_tokens": 204506752} +{"current_steps": 770, "total_steps": 25209, "loss": 1.2357, "lr": 4.818172181847091e-05, "epoch": 0.0916346218212381, "percentage": 3.05, "elapsed_time": "2:43:37", "remaining_time": "3 days, 14:33:13", "throughput": 21104.51, "total_tokens": 207190912} +{"current_steps": 780, "total_steps": 25209, "loss": 1.2402, "lr": 4.81593668217595e-05, "epoch": 0.09282468184489055, "percentage": 3.09, "elapsed_time": "2:46:23", "remaining_time": "3 days, 14:51:01", "throughput": 21024.87, "total_tokens": 209892160} +{"current_steps": 790, "total_steps": 25209, "loss": 1.249, "lr": 4.813704291251675e-05, "epoch": 0.094014741868543, "percentage": 3.13, "elapsed_time": "2:49:01", "remaining_time": "3 days, 15:04:37", "throughput": 20956.0, "total_tokens": 212526848} +{"current_steps": 800, "total_steps": 25209, "loss": 1.2344, "lr": 4.811475001875759e-05, "epoch": 0.09520480189219543, "percentage": 3.17, "elapsed_time": "2:51:32", "remaining_time": "3 days, 15:13:49", "throughput": 20917.42, "total_tokens": 215287232} +{"current_steps": 810, "total_steps": 25209, "loss": 1.2377, "lr": 4.8092488068730105e-05, "epoch": 0.09639486191584788, "percentage": 3.21, "elapsed_time": "2:54:14", "remaining_time": "3 days, 15:28:31", "throughput": 20849.02, "total_tokens": 217965312} +{"current_steps": 820, "total_steps": 25209, "loss": 1.2413, "lr": 4.807025699091452e-05, "epoch": 0.09758492193950033, "percentage": 3.25, "elapsed_time": "2:56:53", "remaining_time": "3 days, 15:41:10", "throughput": 20789.15, "total_tokens": 220642944} +{"current_steps": 830, "total_steps": 25209, "loss": 1.2223, "lr": 4.8048056714022325e-05, "epoch": 0.09877498196315276, "percentage": 3.29, "elapsed_time": "2:58:59", "remaining_time": "3 days, 15:37:36", "throughput": 20801.25, "total_tokens": 223403776} +{"current_steps": 840, "total_steps": 25209, "loss": 1.2175, "lr": 4.802588716699519e-05, "epoch": 0.09996504198680521, "percentage": 3.33, "elapsed_time": "3:01:10", "remaining_time": "3 days, 15:35:57", "throughput": 20795.93, "total_tokens": 226059776} +{"current_steps": 850, "total_steps": 25209, "loss": 1.2293, "lr": 4.8003748279004156e-05, "epoch": 0.10115510201045766, "percentage": 3.37, "elapsed_time": "3:03:28", "remaining_time": "3 days, 15:37:50", "throughput": 20781.62, "total_tokens": 228769600} +{"current_steps": 860, "total_steps": 25209, "loss": 1.2172, "lr": 4.798163997944854e-05, "epoch": 0.1023451620341101, "percentage": 3.41, "elapsed_time": "3:05:59", "remaining_time": "3 days, 15:46:06", "throughput": 20743.15, "total_tokens": 231490368} +{"current_steps": 870, "total_steps": 25209, "loss": 1.2415, "lr": 4.79595621979551e-05, "epoch": 0.10353522205776254, "percentage": 3.45, "elapsed_time": "3:08:39", "remaining_time": "3 days, 15:58:00", "throughput": 20688.16, "total_tokens": 234185216} +{"current_steps": 880, "total_steps": 25209, "loss": 1.2304, "lr": 4.793751486437702e-05, "epoch": 0.10472528208141497, "percentage": 3.49, "elapsed_time": "3:11:16", "remaining_time": "3 days, 16:08:12", "throughput": 20638.0, "total_tokens": 236856640} +{"current_steps": 890, "total_steps": 25209, "loss": 1.2324, "lr": 4.7915497908793064e-05, "epoch": 0.10591534210506742, "percentage": 3.53, "elapsed_time": "3:14:29", "remaining_time": "3 days, 16:34:12", "throughput": 20527.76, "total_tokens": 239538432} +{"current_steps": 900, "total_steps": 25209, "loss": 1.2297, "lr": 4.7893511261506516e-05, "epoch": 0.10710540212871987, "percentage": 3.57, "elapsed_time": "3:17:55", "remaining_time": "3 days, 17:05:50", "throughput": 20400.39, "total_tokens": 242259392} +{"current_steps": 910, "total_steps": 25209, "loss": 1.2155, "lr": 4.787155485304435e-05, "epoch": 0.1082954621523723, "percentage": 3.61, "elapsed_time": "3:21:21", "remaining_time": "3 days, 17:36:36", "throughput": 20271.41, "total_tokens": 244904512} +{"current_steps": 920, "total_steps": 25209, "loss": 1.2081, "lr": 4.784962861415629e-05, "epoch": 0.10948552217602475, "percentage": 3.65, "elapsed_time": "3:24:49", "remaining_time": "3 days, 18:07:40", "throughput": 20148.81, "total_tokens": 247622336} +{"current_steps": 930, "total_steps": 25209, "loss": 1.2383, "lr": 4.7827732475813884e-05, "epoch": 0.1106755821996772, "percentage": 3.69, "elapsed_time": "3:28:01", "remaining_time": "3 days, 18:31:00", "throughput": 20055.01, "total_tokens": 250326464} +{"current_steps": 940, "total_steps": 25209, "loss": 1.2264, "lr": 4.7805866369209576e-05, "epoch": 0.11186564222332963, "percentage": 3.73, "elapsed_time": "3:31:04", "remaining_time": "3 days, 18:49:42", "throughput": 19977.78, "total_tokens": 253016064} +{"current_steps": 950, "total_steps": 25209, "loss": 1.2071, "lr": 4.778403022575583e-05, "epoch": 0.11305570224698208, "percentage": 3.77, "elapsed_time": "3:33:31", "remaining_time": "3 days, 18:52:40", "throughput": 19959.68, "total_tokens": 255719936} +{"current_steps": 960, "total_steps": 25209, "loss": 1.2158, "lr": 4.7762223977084195e-05, "epoch": 0.11424576227063453, "percentage": 3.81, "elapsed_time": "3:36:17", "remaining_time": "3 days, 19:03:34", "throughput": 19911.59, "total_tokens": 258411008} +{"current_steps": 970, "total_steps": 25209, "loss": 1.2208, "lr": 4.774044755504444e-05, "epoch": 0.11543582229428696, "percentage": 3.85, "elapsed_time": "3:39:07", "remaining_time": "3 days, 19:15:47", "throughput": 19858.35, "total_tokens": 261094720} +{"current_steps": 980, "total_steps": 25209, "loss": 1.2128, "lr": 4.7718700891703616e-05, "epoch": 0.11662588231793941, "percentage": 3.89, "elapsed_time": "3:41:26", "remaining_time": "3 days, 19:14:36", "throughput": 19856.72, "total_tokens": 263816448} +{"current_steps": 990, "total_steps": 25209, "loss": 1.2118, "lr": 4.7696983919345215e-05, "epoch": 0.11781594234159186, "percentage": 3.93, "elapsed_time": "3:43:40", "remaining_time": "3 days, 19:12:02", "throughput": 19857.24, "total_tokens": 266501184} +{"current_steps": 1000, "total_steps": 25209, "loss": 1.2184, "lr": 4.7675296570468216e-05, "epoch": 0.11900600236524429, "percentage": 3.97, "elapsed_time": "3:46:16", "remaining_time": "3 days, 19:17:59", "throughput": 19826.84, "total_tokens": 269184384} +{"current_steps": 1010, "total_steps": 25209, "loss": 1.1995, "lr": 4.76536387777863e-05, "epoch": 0.12019606238889674, "percentage": 4.01, "elapsed_time": "3:48:47", "remaining_time": "3 days, 19:21:44", "throughput": 19805.47, "total_tokens": 271881024} +{"current_steps": 1020, "total_steps": 25209, "loss": 1.2155, "lr": 4.7632010474226915e-05, "epoch": 0.12138612241254919, "percentage": 4.05, "elapsed_time": "3:51:10", "remaining_time": "3 days, 19:22:13", "throughput": 19794.51, "total_tokens": 274558784} +{"current_steps": 1030, "total_steps": 25209, "loss": 1.2257, "lr": 4.761041159293035e-05, "epoch": 0.12257618243620162, "percentage": 4.09, "elapsed_time": "3:53:32", "remaining_time": "3 days, 19:22:30", "throughput": 19784.2, "total_tokens": 277235136} +{"current_steps": 1040, "total_steps": 25209, "loss": 1.2195, "lr": 4.7588842067249e-05, "epoch": 0.12376624245985407, "percentage": 4.13, "elapsed_time": "3:56:18", "remaining_time": "3 days, 19:31:35", "throughput": 19743.54, "total_tokens": 279930112} +{"current_steps": 1050, "total_steps": 25209, "loss": 1.205, "lr": 4.756730183074637e-05, "epoch": 0.12495630248350652, "percentage": 4.17, "elapsed_time": "3:59:13", "remaining_time": "3 days, 19:44:03", "throughput": 19693.44, "total_tokens": 282661184} +{"current_steps": 1060, "total_steps": 25209, "loss": 1.2123, "lr": 4.7545790817196314e-05, "epoch": 0.12614636250715897, "percentage": 4.2, "elapsed_time": "4:01:37", "remaining_time": "3 days, 19:44:51", "throughput": 19683.79, "total_tokens": 285372672} +{"current_steps": 1070, "total_steps": 25209, "loss": 1.1999, "lr": 4.752430896058212e-05, "epoch": 0.1273364225308114, "percentage": 4.24, "elapsed_time": "4:04:03", "remaining_time": "3 days, 19:45:53", "throughput": 19669.3, "total_tokens": 288026112} +{"current_steps": 1080, "total_steps": 25209, "loss": 1.2189, "lr": 4.750285619509567e-05, "epoch": 0.12852648255446383, "percentage": 4.28, "elapsed_time": "4:06:08", "remaining_time": "3 days, 19:39:19", "throughput": 19683.83, "total_tokens": 290706624} +{"current_steps": 1090, "total_steps": 25209, "loss": 1.2033, "lr": 4.7481432455136644e-05, "epoch": 0.1297165425781163, "percentage": 4.32, "elapsed_time": "4:08:04", "remaining_time": "3 days, 19:29:25", "throughput": 19712.21, "total_tokens": 293413632} +{"current_steps": 1100, "total_steps": 25209, "loss": 1.2036, "lr": 4.7460037675311584e-05, "epoch": 0.13090660260176873, "percentage": 4.36, "elapsed_time": "4:10:16", "remaining_time": "3 days, 19:25:13", "throughput": 19719.76, "total_tokens": 296115328} +{"current_steps": 1110, "total_steps": 25209, "loss": 1.2033, "lr": 4.7438671790433126e-05, "epoch": 0.13209666262542116, "percentage": 4.4, "elapsed_time": "4:13:07", "remaining_time": "3 days, 19:35:32", "throughput": 19675.14, "total_tokens": 298816256} +{"current_steps": 1120, "total_steps": 25209, "loss": 1.2055, "lr": 4.741733473551915e-05, "epoch": 0.13328672264907362, "percentage": 4.44, "elapsed_time": "4:16:00", "remaining_time": "3 days, 19:46:06", "throughput": 19628.39, "total_tokens": 301494912} +{"current_steps": 1130, "total_steps": 25209, "loss": 1.212, "lr": 4.7396026445791966e-05, "epoch": 0.13447678267272606, "percentage": 4.48, "elapsed_time": "4:18:49", "remaining_time": "3 days, 19:55:25", "throughput": 19589.8, "total_tokens": 304228288} +{"current_steps": 1140, "total_steps": 25209, "loss": 1.1981, "lr": 4.737474685667742e-05, "epoch": 0.1356668426963785, "percentage": 4.52, "elapsed_time": "4:21:54", "remaining_time": "3 days, 20:09:33", "throughput": 19530.12, "total_tokens": 306897152} +{"current_steps": 1150, "total_steps": 25209, "loss": 1.1957, "lr": 4.7353495903804165e-05, "epoch": 0.13685690272003095, "percentage": 4.56, "elapsed_time": "4:25:16", "remaining_time": "3 days, 20:29:52", "throughput": 19446.81, "total_tokens": 309529856} +{"current_steps": 1160, "total_steps": 25209, "loss": 1.2066, "lr": 4.733227352300277e-05, "epoch": 0.1380469627436834, "percentage": 4.6, "elapsed_time": "4:27:39", "remaining_time": "3 days, 20:29:10", "throughput": 19443.38, "total_tokens": 312256832} +{"current_steps": 1170, "total_steps": 25209, "loss": 1.2032, "lr": 4.731107965030496e-05, "epoch": 0.13923702276733582, "percentage": 4.64, "elapsed_time": "4:29:53", "remaining_time": "3 days, 20:25:08", "throughput": 19449.97, "total_tokens": 314957888} +{"current_steps": 1180, "total_steps": 25209, "loss": 1.1999, "lr": 4.728991422194278e-05, "epoch": 0.14042708279098828, "percentage": 4.68, "elapsed_time": "4:32:15", "remaining_time": "3 days, 20:24:01", "throughput": 19447.77, "total_tokens": 317681792} +{"current_steps": 1190, "total_steps": 25209, "loss": 1.1939, "lr": 4.726877717434773e-05, "epoch": 0.14161714281464072, "percentage": 4.72, "elapsed_time": "4:34:41", "remaining_time": "3 days, 20:24:28", "throughput": 19439.34, "total_tokens": 320394560} +{"current_steps": 1200, "total_steps": 25209, "loss": 1.1999, "lr": 4.724766844415013e-05, "epoch": 0.14280720283829315, "percentage": 4.76, "elapsed_time": "4:36:35", "remaining_time": "3 days, 20:14:01", "throughput": 19466.97, "total_tokens": 323071168} +{"current_steps": 1210, "total_steps": 25209, "loss": 1.1839, "lr": 4.722658796817813e-05, "epoch": 0.1439972628619456, "percentage": 4.8, "elapsed_time": "4:39:06", "remaining_time": "3 days, 20:15:39", "throughput": 19449.92, "total_tokens": 325709568} +{"current_steps": 1220, "total_steps": 25209, "loss": 1.2091, "lr": 4.7205535683457044e-05, "epoch": 0.14518732288559805, "percentage": 4.84, "elapsed_time": "4:41:15", "remaining_time": "3 days, 20:10:25", "throughput": 19457.22, "total_tokens": 328350784} +{"current_steps": 1230, "total_steps": 25209, "loss": 1.1931, "lr": 4.7184511527208484e-05, "epoch": 0.14637738290925048, "percentage": 4.88, "elapsed_time": "4:43:14", "remaining_time": "3 days, 20:01:52", "throughput": 19477.33, "total_tokens": 331010240} +{"current_steps": 1240, "total_steps": 25209, "loss": 1.1997, "lr": 4.7163515436849644e-05, "epoch": 0.14756744293290291, "percentage": 4.92, "elapsed_time": "4:45:04", "remaining_time": "3 days, 19:50:35", "throughput": 19509.01, "total_tokens": 333700416} +{"current_steps": 1250, "total_steps": 25209, "loss": 1.1878, "lr": 4.714254734999245e-05, "epoch": 0.14875750295655538, "percentage": 4.96, "elapsed_time": "4:46:55", "remaining_time": "3 days, 19:39:41", "throughput": 19539.37, "total_tokens": 336388288} +{"current_steps": 1260, "total_steps": 25209, "loss": 1.1951, "lr": 4.712160720444284e-05, "epoch": 0.1499475629802078, "percentage": 5.0, "elapsed_time": "4:49:38", "remaining_time": "3 days, 19:45:12", "throughput": 19508.72, "total_tokens": 339029632} +{"current_steps": 1270, "total_steps": 25209, "loss": 1.183, "lr": 4.710069493819992e-05, "epoch": 0.15113762300386024, "percentage": 5.04, "elapsed_time": "4:52:05", "remaining_time": "3 days, 19:45:43", "throughput": 19496.37, "total_tokens": 341678016} +{"current_steps": 1280, "total_steps": 25209, "loss": 1.1993, "lr": 4.70798104894553e-05, "epoch": 0.1523276830275127, "percentage": 5.08, "elapsed_time": "4:54:33", "remaining_time": "3 days, 19:46:40", "throughput": 19485.36, "total_tokens": 344376896} +{"current_steps": 1290, "total_steps": 25209, "loss": 1.183, "lr": 4.705895379659219e-05, "epoch": 0.15351774305116514, "percentage": 5.12, "elapsed_time": "4:57:12", "remaining_time": "3 days, 19:50:55", "throughput": 19461.5, "total_tokens": 347055808} +{"current_steps": 1300, "total_steps": 25209, "loss": 1.1917, "lr": 4.7038124798184766e-05, "epoch": 0.15470780307481757, "percentage": 5.16, "elapsed_time": "4:59:50", "remaining_time": "3 days, 19:54:32", "throughput": 19442.82, "total_tokens": 349785472} +{"current_steps": 1310, "total_steps": 25209, "loss": 1.1899, "lr": 4.7017323432997304e-05, "epoch": 0.15589786309847004, "percentage": 5.2, "elapsed_time": "5:02:24", "remaining_time": "3 days, 19:56:56", "throughput": 19428.49, "total_tokens": 352516864} +{"current_steps": 1320, "total_steps": 25209, "loss": 1.1886, "lr": 4.6996549639983506e-05, "epoch": 0.15708792312212247, "percentage": 5.24, "elapsed_time": "5:04:47", "remaining_time": "3 days, 19:56:08", "throughput": 19426.47, "total_tokens": 355268352} +{"current_steps": 1330, "total_steps": 25209, "loss": 1.1766, "lr": 4.697580335828569e-05, "epoch": 0.1582779831457749, "percentage": 5.28, "elapsed_time": "5:07:27", "remaining_time": "3 days, 20:00:02", "throughput": 19402.04, "total_tokens": 357912640} +{"current_steps": 1340, "total_steps": 25209, "loss": 1.1993, "lr": 4.6955084527234076e-05, "epoch": 0.15946804316942736, "percentage": 5.32, "elapsed_time": "5:09:48", "remaining_time": "3 days, 19:58:35", "throughput": 19397.99, "total_tokens": 360584384} +{"current_steps": 1350, "total_steps": 25209, "loss": 1.187, "lr": 4.6934393086346034e-05, "epoch": 0.1606581031930798, "percentage": 5.36, "elapsed_time": "5:11:58", "remaining_time": "3 days, 19:53:40", "throughput": 19406.44, "total_tokens": 363262336} +{"current_steps": 1360, "total_steps": 25209, "loss": 1.2021, "lr": 4.6913728975325324e-05, "epoch": 0.16184816321673223, "percentage": 5.39, "elapsed_time": "5:14:15", "remaining_time": "3 days, 19:50:44", "throughput": 19410.17, "total_tokens": 365981568} +{"current_steps": 1370, "total_steps": 25209, "loss": 1.1987, "lr": 4.6893092134061393e-05, "epoch": 0.1630382232403847, "percentage": 5.43, "elapsed_time": "5:16:28", "remaining_time": "3 days, 19:46:47", "throughput": 19415.67, "total_tokens": 368667776} +{"current_steps": 1380, "total_steps": 25209, "loss": 1.1968, "lr": 4.687248250262859e-05, "epoch": 0.16422828326403713, "percentage": 5.47, "elapsed_time": "5:19:02", "remaining_time": "3 days, 19:48:58", "throughput": 19400.28, "total_tokens": 371366848} +{"current_steps": 1390, "total_steps": 25209, "loss": 1.1699, "lr": 4.685190002128548e-05, "epoch": 0.16541834328768956, "percentage": 5.51, "elapsed_time": "5:20:53", "remaining_time": "3 days, 19:38:50", "throughput": 19428.09, "total_tokens": 374061760} +{"current_steps": 1400, "total_steps": 25209, "loss": 1.2012, "lr": 4.6831344630474114e-05, "epoch": 0.16660840331134202, "percentage": 5.55, "elapsed_time": "5:23:00", "remaining_time": "3 days, 19:33:09", "throughput": 19441.35, "total_tokens": 376778624} +{"current_steps": 1410, "total_steps": 25209, "loss": 1.1895, "lr": 4.6810816270819276e-05, "epoch": 0.16779846333499446, "percentage": 5.59, "elapsed_time": "5:25:23", "remaining_time": "3 days, 19:32:05", "throughput": 19437.97, "total_tokens": 379490496} +{"current_steps": 1420, "total_steps": 25209, "loss": 1.1752, "lr": 4.679031488312777e-05, "epoch": 0.1689885233586469, "percentage": 5.63, "elapsed_time": "5:27:06", "remaining_time": "3 days, 19:19:59", "throughput": 19471.89, "total_tokens": 382164992} +{"current_steps": 1430, "total_steps": 25209, "loss": 1.1915, "lr": 4.6769840408387717e-05, "epoch": 0.17017858338229935, "percentage": 5.67, "elapsed_time": "5:28:48", "remaining_time": "3 days, 19:07:45", "throughput": 19508.63, "total_tokens": 384883648} +{"current_steps": 1440, "total_steps": 25209, "loss": 1.186, "lr": 4.674939278776787e-05, "epoch": 0.1713686434059518, "percentage": 5.71, "elapsed_time": "5:30:33", "remaining_time": "3 days, 18:56:13", "throughput": 19543.74, "total_tokens": 387616896} +{"current_steps": 1450, "total_steps": 25209, "loss": 1.1898, "lr": 4.672897196261683e-05, "epoch": 0.17255870342960422, "percentage": 5.75, "elapsed_time": "5:32:45", "remaining_time": "3 days, 18:52:28", "throughput": 19549.72, "total_tokens": 390324608} +{"current_steps": 1460, "total_steps": 25209, "loss": 1.1831, "lr": 4.670857787446238e-05, "epoch": 0.17374876345325668, "percentage": 5.79, "elapsed_time": "5:34:59", "remaining_time": "3 days, 18:49:11", "throughput": 19552.45, "total_tokens": 393000000} +{"current_steps": 1470, "total_steps": 25209, "loss": 1.184, "lr": 4.668821046501082e-05, "epoch": 0.17493882347690912, "percentage": 5.83, "elapsed_time": "5:36:47", "remaining_time": "3 days, 18:38:57", "throughput": 19579.92, "total_tokens": 395669504} +{"current_steps": 1480, "total_steps": 25209, "loss": 1.1721, "lr": 4.6667869676146194e-05, "epoch": 0.17612888350056155, "percentage": 5.87, "elapsed_time": "5:39:11", "remaining_time": "3 days, 18:38:16", "throughput": 19573.53, "total_tokens": 398348992} +{"current_steps": 1490, "total_steps": 25209, "loss": 1.1841, "lr": 4.6647555449929645e-05, "epoch": 0.177318943524214, "percentage": 5.91, "elapsed_time": "5:41:38", "remaining_time": "3 days, 18:38:26", "throughput": 19564.87, "total_tokens": 401044160} +{"current_steps": 1500, "total_steps": 25209, "loss": 1.167, "lr": 4.662726772859869e-05, "epoch": 0.17850900354786645, "percentage": 5.95, "elapsed_time": "5:44:04", "remaining_time": "3 days, 18:38:28", "throughput": 19555.98, "total_tokens": 403725760} +{"current_steps": 1510, "total_steps": 25209, "loss": 1.1715, "lr": 4.660700645456655e-05, "epoch": 0.17969906357151888, "percentage": 5.99, "elapsed_time": "5:46:14", "remaining_time": "3 days, 18:34:03", "throughput": 19564.91, "total_tokens": 406443200} +{"current_steps": 1520, "total_steps": 25209, "loss": 1.1822, "lr": 4.658677157042149e-05, "epoch": 0.18088912359517134, "percentage": 6.03, "elapsed_time": "5:48:43", "remaining_time": "3 days, 18:34:53", "throughput": 19554.18, "total_tokens": 409145920} +{"current_steps": 1530, "total_steps": 25209, "loss": 1.1847, "lr": 4.656656301892605e-05, "epoch": 0.18207918361882378, "percentage": 6.07, "elapsed_time": "5:50:47", "remaining_time": "3 days, 18:28:59", "throughput": 19564.95, "total_tokens": 411791744} +{"current_steps": 1540, "total_steps": 25209, "loss": 1.1854, "lr": 4.6546380743016465e-05, "epoch": 0.1832692436424762, "percentage": 6.11, "elapsed_time": "5:53:36", "remaining_time": "3 days, 18:34:41", "throughput": 19536.23, "total_tokens": 414484352} +{"current_steps": 1550, "total_steps": 25209, "loss": 1.1853, "lr": 4.652622468580193e-05, "epoch": 0.18445930366612867, "percentage": 6.15, "elapsed_time": "5:56:10", "remaining_time": "3 days, 18:36:35", "throughput": 19521.18, "total_tokens": 417176448} +{"current_steps": 1560, "total_steps": 25209, "loss": 1.1756, "lr": 4.650609479056392e-05, "epoch": 0.1856493636897811, "percentage": 6.19, "elapsed_time": "5:58:17", "remaining_time": "3 days, 18:31:39", "throughput": 19529.83, "total_tokens": 419850176} +{"current_steps": 1570, "total_steps": 25209, "loss": 1.1807, "lr": 4.648599100075556e-05, "epoch": 0.18683942371343354, "percentage": 6.23, "elapsed_time": "6:00:25", "remaining_time": "3 days, 18:26:52", "throughput": 19538.79, "total_tokens": 422540800} +{"current_steps": 1580, "total_steps": 25209, "loss": 1.1919, "lr": 4.6465913260000945e-05, "epoch": 0.188029483737086, "percentage": 6.27, "elapsed_time": "6:03:03", "remaining_time": "3 days, 18:29:27", "throughput": 19518.8, "total_tokens": 425180288} +{"current_steps": 1590, "total_steps": 25209, "loss": 1.1889, "lr": 4.644586151209444e-05, "epoch": 0.18921954376073843, "percentage": 6.31, "elapsed_time": "6:05:23", "remaining_time": "3 days, 18:27:42", "throughput": 19516.77, "total_tokens": 427869120} +{"current_steps": 1600, "total_steps": 25209, "loss": 1.1807, "lr": 4.6425835701000084e-05, "epoch": 0.19040960378439087, "percentage": 6.35, "elapsed_time": "6:07:33", "remaining_time": "3 days, 18:23:29", "throughput": 19522.21, "total_tokens": 430528256} +{"current_steps": 1610, "total_steps": 25209, "loss": 1.18, "lr": 4.640583577085084e-05, "epoch": 0.19159966380804333, "percentage": 6.39, "elapsed_time": "6:09:35", "remaining_time": "3 days, 18:17:28", "throughput": 19537.67, "total_tokens": 433264640} +{"current_steps": 1620, "total_steps": 25209, "loss": 1.151, "lr": 4.638586166594806e-05, "epoch": 0.19278972383169576, "percentage": 6.43, "elapsed_time": "6:11:17", "remaining_time": "3 days, 18:06:21", "throughput": 19569.65, "total_tokens": 435957376} +{"current_steps": 1630, "total_steps": 25209, "loss": 1.1677, "lr": 4.6365913330760726e-05, "epoch": 0.1939797838553482, "percentage": 6.47, "elapsed_time": "6:12:52", "remaining_time": "3 days, 17:53:47", "throughput": 19604.34, "total_tokens": 438590656} +{"current_steps": 10, "total_steps": 25209, "loss": 2.0652, "lr": 4.9977515176118345e-05, "epoch": 0.001190060023652443, "percentage": 0.04, "elapsed_time": "0:03:21", "remaining_time": "5 days, 21:15:41", "throughput": 13414.59, "total_tokens": 2707200} +{"current_steps": 20, "total_steps": 25209, "loss": 1.602, "lr": 4.9952567580506e-05, "epoch": 0.002380120047304886, "percentage": 0.08, "elapsed_time": "0:06:53", "remaining_time": "6 days, 0:48:09", "throughput": 13083.82, "total_tokens": 5415424} +{"current_steps": 30, "total_steps": 25209, "loss": 1.5147, "lr": 4.992765730738634e-05, "epoch": 0.003570180070957329, "percentage": 0.12, "elapsed_time": "0:10:08", "remaining_time": "5 days, 21:55:58", "throughput": 13335.18, "total_tokens": 8118336} +{"current_steps": 40, "total_steps": 25209, "loss": 1.4835, "lr": 4.9902784263792476e-05, "epoch": 0.004760240094609772, "percentage": 0.16, "elapsed_time": "0:13:50", "remaining_time": "6 days, 1:14:26", "throughput": 12921.16, "total_tokens": 10737088} +{"current_steps": 50, "total_steps": 25209, "loss": 1.4622, "lr": 4.987794835708133e-05, "epoch": 0.005950300118262215, "percentage": 0.2, "elapsed_time": "0:17:12", "remaining_time": "6 days, 0:20:55", "throughput": 13068.85, "total_tokens": 13496768} +{"current_steps": 60, "total_steps": 25209, "loss": 1.4554, "lr": 4.985314949493234e-05, "epoch": 0.007140360141914658, "percentage": 0.24, "elapsed_time": "0:20:14", "remaining_time": "5 days, 21:25:10", "throughput": 13309.51, "total_tokens": 16166080} +{"current_steps": 70, "total_steps": 25209, "loss": 1.4199, "lr": 4.982838758534584e-05, "epoch": 0.008330420165567102, "percentage": 0.28, "elapsed_time": "0:23:02", "remaining_time": "5 days, 17:55:36", "throughput": 13627.01, "total_tokens": 18840896} +{"current_steps": 80, "total_steps": 25209, "loss": 1.428, "lr": 4.980366253664179e-05, "epoch": 0.009520480189219544, "percentage": 0.32, "elapsed_time": "0:27:01", "remaining_time": "5 days, 21:26:36", "throughput": 13304.17, "total_tokens": 21566912} +{"current_steps": 90, "total_steps": 25209, "loss": 1.4135, "lr": 4.977897425745825e-05, "epoch": 0.010710540212871987, "percentage": 0.36, "elapsed_time": "0:30:30", "remaining_time": "5 days, 21:56:18", "throughput": 13271.02, "total_tokens": 24296704} +{"current_steps": 100, "total_steps": 25209, "loss": 1.4077, "lr": 4.975432265674997e-05, "epoch": 0.01190060023652443, "percentage": 0.4, "elapsed_time": "0:33:54", "remaining_time": "5 days, 21:53:41", "throughput": 13263.34, "total_tokens": 26983168} +{"current_steps": 110, "total_steps": 25209, "loss": 1.4078, "lr": 4.972970764378705e-05, "epoch": 0.013090660260176872, "percentage": 0.44, "elapsed_time": "0:37:08", "remaining_time": "5 days, 21:14:34", "throughput": 13327.17, "total_tokens": 29699072} +{"current_steps": 120, "total_steps": 25209, "loss": 1.3878, "lr": 4.970512912815344e-05, "epoch": 0.014280720283829316, "percentage": 0.48, "elapsed_time": "0:39:58", "remaining_time": "5 days, 19:18:41", "throughput": 13517.1, "total_tokens": 32424320} +{"current_steps": 130, "total_steps": 25209, "loss": 1.3889, "lr": 4.968058701974564e-05, "epoch": 0.015470780307481759, "percentage": 0.52, "elapsed_time": "0:43:03", "remaining_time": "5 days, 18:27:08", "throughput": 13588.42, "total_tokens": 35107904} +{"current_steps": 140, "total_steps": 25209, "loss": 1.3669, "lr": 4.96560812287712e-05, "epoch": 0.016660840331134203, "percentage": 0.56, "elapsed_time": "0:46:17", "remaining_time": "5 days, 18:08:58", "throughput": 13608.2, "total_tokens": 37795840} +{"current_steps": 150, "total_steps": 25209, "loss": 1.3646, "lr": 4.963161166574748e-05, "epoch": 0.017850900354786644, "percentage": 0.6, "elapsed_time": "0:49:42", "remaining_time": "5 days, 18:24:20", "throughput": 13586.72, "total_tokens": 40522688} +{"current_steps": 160, "total_steps": 25209, "loss": 1.3437, "lr": 4.960717824150013e-05, "epoch": 0.019040960378439088, "percentage": 0.63, "elapsed_time": "0:53:12", "remaining_time": "5 days, 18:49:32", "throughput": 13522.6, "total_tokens": 43168064} +{"current_steps": 170, "total_steps": 25209, "loss": 1.3561, "lr": 4.9582780867161893e-05, "epoch": 0.02023102040209153, "percentage": 0.67, "elapsed_time": "0:56:38", "remaining_time": "5 days, 19:01:26", "throughput": 13488.21, "total_tokens": 45833088} +{"current_steps": 180, "total_steps": 25209, "loss": 1.3485, "lr": 4.955841945417105e-05, "epoch": 0.021421080425743973, "percentage": 0.71, "elapsed_time": "0:59:40", "remaining_time": "5 days, 18:17:10", "throughput": 13556.73, "total_tokens": 48536192} +{"current_steps": 190, "total_steps": 25209, "loss": 1.3665, "lr": 4.953409391427024e-05, "epoch": 0.022611140449396418, "percentage": 0.75, "elapsed_time": "1:02:41", "remaining_time": "5 days, 17:36:00", "throughput": 13612.09, "total_tokens": 51207040} +{"current_steps": 200, "total_steps": 25209, "loss": 1.3505, "lr": 4.950980415950502e-05, "epoch": 0.02380120047304886, "percentage": 0.79, "elapsed_time": "1:05:41", "remaining_time": "5 days, 16:54:34", "throughput": 13684.54, "total_tokens": 53938624} +{"current_steps": 210, "total_steps": 25209, "loss": 1.3406, "lr": 4.9485550102222575e-05, "epoch": 0.024991260496701303, "percentage": 0.83, "elapsed_time": "1:08:48", "remaining_time": "5 days, 16:32:05", "throughput": 13710.6, "total_tokens": 56610816} +{"current_steps": 220, "total_steps": 25209, "loss": 1.3435, "lr": 4.946133165507037e-05, "epoch": 0.026181320520353744, "percentage": 0.87, "elapsed_time": "1:11:46", "remaining_time": "5 days, 15:53:09", "throughput": 13767.19, "total_tokens": 59291968} +{"current_steps": 230, "total_steps": 25209, "loss": 1.3313, "lr": 4.943714873099483e-05, "epoch": 0.027371380544006188, "percentage": 0.91, "elapsed_time": "1:15:42", "remaining_time": "5 days, 17:02:52", "throughput": 13638.64, "total_tokens": 61958208} +{"current_steps": 240, "total_steps": 25209, "loss": 1.3246, "lr": 4.9413001243240024e-05, "epoch": 0.028561440567658632, "percentage": 0.95, "elapsed_time": "1:19:31", "remaining_time": "5 days, 17:53:09", "throughput": 13542.25, "total_tokens": 64613568} +{"current_steps": 250, "total_steps": 25209, "loss": 1.3253, "lr": 4.938888910534637e-05, "epoch": 0.029751500591311073, "percentage": 0.99, "elapsed_time": "1:23:25", "remaining_time": "5 days, 18:48:13", "throughput": 13444.79, "total_tokens": 67293056} +{"current_steps": 260, "total_steps": 25209, "loss": 1.3321, "lr": 4.936481223114932e-05, "epoch": 0.030941560614963518, "percentage": 1.03, "elapsed_time": "1:26:45", "remaining_time": "5 days, 18:45:46", "throughput": 13433.14, "total_tokens": 69931584} +{"current_steps": 270, "total_steps": 25209, "loss": 1.3219, "lr": 4.934077053477808e-05, "epoch": 0.03213162063861596, "percentage": 1.07, "elapsed_time": "1:30:08", "remaining_time": "5 days, 18:46:31", "throughput": 13433.5, "total_tokens": 72658880} +{"current_steps": 280, "total_steps": 25209, "loss": 1.3215, "lr": 4.931676393065431e-05, "epoch": 0.033321680662268406, "percentage": 1.11, "elapsed_time": "1:33:23", "remaining_time": "5 days, 18:34:30", "throughput": 13446.67, "total_tokens": 75345216} +{"current_steps": 290, "total_steps": 25209, "loss": 1.3072, "lr": 4.929279233349088e-05, "epoch": 0.03451174068592085, "percentage": 1.15, "elapsed_time": "1:36:40", "remaining_time": "5 days, 18:26:35", "throughput": 13450.25, "total_tokens": 78013824} +{"current_steps": 300, "total_steps": 25209, "loss": 1.3029, "lr": 4.926885565829051e-05, "epoch": 0.03570180070957329, "percentage": 1.19, "elapsed_time": "1:40:35", "remaining_time": "5 days, 19:11:38", "throughput": 13370.61, "total_tokens": 80693568} +{"current_steps": 310, "total_steps": 25209, "loss": 1.3148, "lr": 4.924495382034461e-05, "epoch": 0.03689186073322573, "percentage": 1.23, "elapsed_time": "1:44:17", "remaining_time": "5 days, 19:36:54", "throughput": 13319.17, "total_tokens": 83347456} +{"current_steps": 320, "total_steps": 25209, "loss": 1.3143, "lr": 4.9221086735231975e-05, "epoch": 0.038081920756878176, "percentage": 1.27, "elapsed_time": "1:47:08", "remaining_time": "5 days, 18:53:25", "throughput": 13378.98, "total_tokens": 86008320} +{"current_steps": 330, "total_steps": 25209, "loss": 1.3046, "lr": 4.919725431881751e-05, "epoch": 0.03927198078053062, "percentage": 1.31, "elapsed_time": "1:49:58", "remaining_time": "5 days, 18:10:31", "throughput": 13445.53, "total_tokens": 88714048} +{"current_steps": 340, "total_steps": 25209, "loss": 1.3153, "lr": 4.917345648725101e-05, "epoch": 0.04046204080418306, "percentage": 1.35, "elapsed_time": "1:52:36", "remaining_time": "5 days, 17:16:58", "throughput": 13526.89, "total_tokens": 91398144} +{"current_steps": 350, "total_steps": 25209, "loss": 1.3008, "lr": 4.914969315696596e-05, "epoch": 0.041652100827835506, "percentage": 1.39, "elapsed_time": "1:55:02", "remaining_time": "5 days, 16:10:34", "throughput": 13631.63, "total_tokens": 94088512} +{"current_steps": 360, "total_steps": 25209, "loss": 1.2974, "lr": 4.912596424467818e-05, "epoch": 0.04284216085148795, "percentage": 1.43, "elapsed_time": "1:57:08", "remaining_time": "5 days, 14:46:07", "throughput": 13758.78, "total_tokens": 96708736} +{"current_steps": 370, "total_steps": 25209, "loss": 1.2954, "lr": 4.910226966738475e-05, "epoch": 0.04403222087514039, "percentage": 1.47, "elapsed_time": "1:59:11", "remaining_time": "5 days, 13:21:08", "throughput": 13894.73, "total_tokens": 99362240} +{"current_steps": 380, "total_steps": 25209, "loss": 1.2807, "lr": 4.9078609342362666e-05, "epoch": 0.045222280898792835, "percentage": 1.51, "elapsed_time": "2:01:10", "remaining_time": "5 days, 11:57:03", "throughput": 14030.08, "total_tokens": 101999872} +{"current_steps": 390, "total_steps": 25209, "loss": 1.2741, "lr": 4.905498318716775e-05, "epoch": 0.046412340922445276, "percentage": 1.55, "elapsed_time": "2:03:41", "remaining_time": "5 days, 11:11:06", "throughput": 14108.56, "total_tokens": 104700800} +{"current_steps": 400, "total_steps": 25209, "loss": 1.2834, "lr": 4.9031391119633295e-05, "epoch": 0.04760240094609772, "percentage": 1.59, "elapsed_time": "2:06:30", "remaining_time": "5 days, 10:46:19", "throughput": 14149.9, "total_tokens": 107404288} +{"current_steps": 410, "total_steps": 25209, "loss": 1.2837, "lr": 4.9007833057869e-05, "epoch": 0.048792460969750165, "percentage": 1.63, "elapsed_time": "2:09:29", "remaining_time": "5 days, 10:31:52", "throughput": 14177.06, "total_tokens": 110141888} +{"current_steps": 420, "total_steps": 25209, "loss": 1.2854, "lr": 4.898430892025967e-05, "epoch": 0.049982520993402606, "percentage": 1.67, "elapsed_time": "2:12:32", "remaining_time": "5 days, 10:23:09", "throughput": 14181.48, "total_tokens": 112783488} +{"current_steps": 430, "total_steps": 25209, "loss": 1.2708, "lr": 4.896081862546415e-05, "epoch": 0.05117258101705505, "percentage": 1.71, "elapsed_time": "2:15:27", "remaining_time": "5 days, 10:05:23", "throughput": 14206.78, "total_tokens": 115458560} +{"current_steps": 440, "total_steps": 25209, "loss": 1.2677, "lr": 4.8937362092414e-05, "epoch": 0.05236264104070749, "percentage": 1.75, "elapsed_time": "2:17:58", "remaining_time": "5 days, 9:26:35", "throughput": 14279.71, "total_tokens": 118207424} +{"current_steps": 450, "total_steps": 25209, "loss": 1.2742, "lr": 4.891393924031244e-05, "epoch": 0.053552701064359935, "percentage": 1.79, "elapsed_time": "2:20:04", "remaining_time": "5 days, 8:26:39", "throughput": 14382.02, "total_tokens": 120869376} +{"current_steps": 460, "total_steps": 25209, "loss": 1.2757, "lr": 4.8890549988633095e-05, "epoch": 0.054742761088012376, "percentage": 1.82, "elapsed_time": "2:22:26", "remaining_time": "5 days, 7:43:45", "throughput": 14465.85, "total_tokens": 123633792} +{"current_steps": 470, "total_steps": 25209, "loss": 1.2829, "lr": 4.8867194257118907e-05, "epoch": 0.05593282111166482, "percentage": 1.86, "elapsed_time": "2:24:46", "remaining_time": "5 days, 7:00:41", "throughput": 14546.27, "total_tokens": 126360960} +{"current_steps": 480, "total_steps": 25209, "loss": 1.2856, "lr": 4.884387196578093e-05, "epoch": 0.057122881135317265, "percentage": 1.9, "elapsed_time": "2:27:29", "remaining_time": "5 days, 6:38:42", "throughput": 14588.28, "total_tokens": 129100928} +{"current_steps": 490, "total_steps": 25209, "loss": 1.2636, "lr": 4.882058303489718e-05, "epoch": 0.058312941158969706, "percentage": 1.94, "elapsed_time": "2:29:37", "remaining_time": "5 days, 5:47:43", "throughput": 14676.03, "total_tokens": 131747008} +{"current_steps": 500, "total_steps": 25209, "loss": 1.2842, "lr": 4.8797327385011496e-05, "epoch": 0.059503001182622146, "percentage": 1.98, "elapsed_time": "2:31:56", "remaining_time": "5 days, 5:08:40", "throughput": 14745.2, "total_tokens": 134425024} +{"current_steps": 510, "total_steps": 25209, "loss": 1.2585, "lr": 4.8774104936932425e-05, "epoch": 0.060693061206274594, "percentage": 2.02, "elapsed_time": "2:34:03", "remaining_time": "5 days, 4:20:56", "throughput": 14833.36, "total_tokens": 137111872} +{"current_steps": 520, "total_steps": 25209, "loss": 1.2537, "lr": 4.8750915611732076e-05, "epoch": 0.061883121229927035, "percentage": 2.06, "elapsed_time": "2:35:50", "remaining_time": "5 days, 3:18:50", "throughput": 14948.35, "total_tokens": 139768192} +{"current_steps": 530, "total_steps": 25209, "loss": 1.2655, "lr": 4.8727759330744986e-05, "epoch": 0.06307318125357948, "percentage": 2.1, "elapsed_time": "2:37:46", "remaining_time": "5 days, 2:26:27", "throughput": 15049.92, "total_tokens": 142466112} +{"current_steps": 540, "total_steps": 25209, "loss": 1.2459, "lr": 4.870463601556696e-05, "epoch": 0.06426324127723192, "percentage": 2.14, "elapsed_time": "2:39:48", "remaining_time": "5 days, 1:40:38", "throughput": 15140.4, "total_tokens": 145175168} +{"current_steps": 550, "total_steps": 25209, "loss": 1.2559, "lr": 4.8681545588054075e-05, "epoch": 0.06545330130088436, "percentage": 2.18, "elapsed_time": "2:41:31", "remaining_time": "5 days, 0:41:40", "throughput": 15259.5, "total_tokens": 147882752} +{"current_steps": 560, "total_steps": 25209, "loss": 1.2644, "lr": 4.8658487970321404e-05, "epoch": 0.06664336132453681, "percentage": 2.22, "elapsed_time": "2:43:22", "remaining_time": "4 days, 23:50:56", "throughput": 15364.83, "total_tokens": 150609792} +{"current_steps": 570, "total_steps": 25209, "loss": 1.2551, "lr": 4.863546308474209e-05, "epoch": 0.06783342134818925, "percentage": 2.26, "elapsed_time": "2:45:10", "remaining_time": "4 days, 22:59:45", "throughput": 15465.12, "total_tokens": 153264064} +{"current_steps": 580, "total_steps": 25209, "loss": 1.2615, "lr": 4.86124708539461e-05, "epoch": 0.0690234813718417, "percentage": 2.3, "elapsed_time": "2:47:03", "remaining_time": "4 days, 22:13:58", "throughput": 15557.09, "total_tokens": 155937408} +{"current_steps": 590, "total_steps": 25209, "loss": 1.2401, "lr": 4.8589511200819216e-05, "epoch": 0.07021354139549414, "percentage": 2.34, "elapsed_time": "2:49:09", "remaining_time": "4 days, 21:38:08", "throughput": 15638.91, "total_tokens": 158719296} +{"current_steps": 600, "total_steps": 25209, "loss": 1.2524, "lr": 4.8566584048501926e-05, "epoch": 0.07140360141914658, "percentage": 2.38, "elapsed_time": "2:50:55", "remaining_time": "4 days, 20:50:40", "throughput": 15737.47, "total_tokens": 161399808} +{"current_steps": 610, "total_steps": 25209, "loss": 1.2452, "lr": 4.854368932038835e-05, "epoch": 0.07259366144279902, "percentage": 2.42, "elapsed_time": "2:52:32", "remaining_time": "4 days, 19:58:14", "throughput": 15846.43, "total_tokens": 164056896} +{"current_steps": 620, "total_steps": 25209, "loss": 1.2546, "lr": 4.8520826940125144e-05, "epoch": 0.07378372146645146, "percentage": 2.46, "elapsed_time": "2:54:15", "remaining_time": "4 days, 19:11:19", "throughput": 15946.53, "total_tokens": 166736000} +{"current_steps": 630, "total_steps": 25209, "loss": 1.2575, "lr": 4.849799683161046e-05, "epoch": 0.0749737814901039, "percentage": 2.5, "elapsed_time": "2:55:56", "remaining_time": "4 days, 18:24:19", "throughput": 16048.67, "total_tokens": 169419904} +{"current_steps": 640, "total_steps": 25209, "loss": 1.2534, "lr": 4.8475198918992835e-05, "epoch": 0.07616384151375635, "percentage": 2.54, "elapsed_time": "2:57:36", "remaining_time": "4 days, 17:37:59", "throughput": 16151.09, "total_tokens": 172108288} +{"current_steps": 650, "total_steps": 25209, "loss": 1.2515, "lr": 4.845243312667023e-05, "epoch": 0.07735390153740879, "percentage": 2.58, "elapsed_time": "2:59:18", "remaining_time": "4 days, 16:54:36", "throughput": 16251.58, "total_tokens": 174837248} +{"current_steps": 660, "total_steps": 25209, "loss": 1.2279, "lr": 4.842969937928884e-05, "epoch": 0.07854396156106123, "percentage": 2.62, "elapsed_time": "3:00:57", "remaining_time": "4 days, 16:10:53", "throughput": 16347.88, "total_tokens": 177498816} +{"current_steps": 670, "total_steps": 25209, "loss": 1.2544, "lr": 4.840699760174217e-05, "epoch": 0.07973402158471368, "percentage": 2.66, "elapsed_time": "3:02:40", "remaining_time": "4 days, 15:30:32", "throughput": 16440.75, "total_tokens": 180198912} +{"current_steps": 680, "total_steps": 25209, "loss": 1.2412, "lr": 4.8384327719169906e-05, "epoch": 0.08092408160836612, "percentage": 2.7, "elapsed_time": "3:04:23", "remaining_time": "4 days, 14:51:38", "throughput": 16529.33, "total_tokens": 182879232} +{"current_steps": 690, "total_steps": 25209, "loss": 1.241, "lr": 4.836168965695694e-05, "epoch": 0.08211414163201856, "percentage": 2.74, "elapsed_time": "3:06:16", "remaining_time": "4 days, 14:19:10", "throughput": 16606.6, "total_tokens": 185601920} +{"current_steps": 700, "total_steps": 25209, "loss": 1.2461, "lr": 4.8339083340732304e-05, "epoch": 0.08330420165567101, "percentage": 2.78, "elapsed_time": "3:08:05", "remaining_time": "4 days, 13:45:32", "throughput": 16690.99, "total_tokens": 188363584} +{"current_steps": 710, "total_steps": 25209, "loss": 1.2439, "lr": 4.8316508696368154e-05, "epoch": 0.08449426167932345, "percentage": 2.82, "elapsed_time": "3:10:03", "remaining_time": "4 days, 13:18:14", "throughput": 16750.9, "total_tokens": 191023552} +{"current_steps": 720, "total_steps": 25209, "loss": 1.241, "lr": 4.8293965649978714e-05, "epoch": 0.0856843217029759, "percentage": 2.86, "elapsed_time": "3:11:47", "remaining_time": "4 days, 12:43:14", "throughput": 16833.45, "total_tokens": 193708672} +{"current_steps": 730, "total_steps": 25209, "loss": 1.2328, "lr": 4.8271454127919364e-05, "epoch": 0.08687438172662834, "percentage": 2.9, "elapsed_time": "3:13:37", "remaining_time": "4 days, 12:13:02", "throughput": 16903.71, "total_tokens": 196386176} +{"current_steps": 740, "total_steps": 25209, "loss": 1.2311, "lr": 4.824897405678549e-05, "epoch": 0.08806444175028078, "percentage": 2.94, "elapsed_time": "3:15:22", "remaining_time": "4 days, 11:40:19", "throughput": 16986.94, "total_tokens": 199130048} +{"current_steps": 750, "total_steps": 25209, "loss": 1.2398, "lr": 4.8226525363411576e-05, "epoch": 0.08925450177393322, "percentage": 2.98, "elapsed_time": "3:17:05", "remaining_time": "4 days, 11:07:20", "throughput": 17068.73, "total_tokens": 201839552} +{"current_steps": 760, "total_steps": 25209, "loss": 1.2395, "lr": 4.820410797487017e-05, "epoch": 0.09044456179758567, "percentage": 3.01, "elapsed_time": "3:18:44", "remaining_time": "4 days, 10:33:34", "throughput": 17149.85, "total_tokens": 204506752} +{"current_steps": 770, "total_steps": 25209, "loss": 1.2362, "lr": 4.818172181847091e-05, "epoch": 0.0916346218212381, "percentage": 3.05, "elapsed_time": "3:20:23", "remaining_time": "4 days, 10:00:27", "throughput": 17231.54, "total_tokens": 207190912} +{"current_steps": 780, "total_steps": 25209, "loss": 1.241, "lr": 4.81593668217595e-05, "epoch": 0.09282468184489055, "percentage": 3.09, "elapsed_time": "3:22:06", "remaining_time": "4 days, 9:29:42", "throughput": 17309.04, "total_tokens": 209892160} +{"current_steps": 790, "total_steps": 25209, "loss": 1.2491, "lr": 4.813704291251675e-05, "epoch": 0.094014741868543, "percentage": 3.13, "elapsed_time": "3:23:44", "remaining_time": "4 days, 8:57:29", "throughput": 17385.82, "total_tokens": 212526848} +{"current_steps": 800, "total_steps": 25209, "loss": 1.2349, "lr": 4.811475001875759e-05, "epoch": 0.09520480189219543, "percentage": 3.17, "elapsed_time": "3:25:27", "remaining_time": "4 days, 8:28:40", "throughput": 17464.33, "total_tokens": 215287232} +{"current_steps": 810, "total_steps": 25209, "loss": 1.2382, "lr": 4.8092488068730105e-05, "epoch": 0.09639486191584788, "percentage": 3.21, "elapsed_time": "3:27:07", "remaining_time": "4 days, 7:58:53", "throughput": 17539.45, "total_tokens": 217965312} +{"current_steps": 820, "total_steps": 25209, "loss": 1.2417, "lr": 4.807025699091452e-05, "epoch": 0.09758492193950033, "percentage": 3.25, "elapsed_time": "3:28:47", "remaining_time": "4 days, 7:30:02", "throughput": 17612.64, "total_tokens": 220642944} +{"current_steps": 830, "total_steps": 25209, "loss": 1.223, "lr": 4.8048056714022325e-05, "epoch": 0.09877498196315276, "percentage": 3.29, "elapsed_time": "3:30:32", "remaining_time": "4 days, 7:04:12", "throughput": 17684.48, "total_tokens": 223403776} +{"current_steps": 840, "total_steps": 25209, "loss": 1.2178, "lr": 4.802588716699519e-05, "epoch": 0.09996504198680521, "percentage": 3.33, "elapsed_time": "3:32:11", "remaining_time": "4 days, 6:35:50", "throughput": 17755.93, "total_tokens": 226059776} +{"current_steps": 850, "total_steps": 25209, "loss": 1.229, "lr": 4.8003748279004156e-05, "epoch": 0.10115510201045766, "percentage": 3.37, "elapsed_time": "3:33:50", "remaining_time": "4 days, 6:08:19", "throughput": 17829.75, "total_tokens": 228769600} +{"current_steps": 860, "total_steps": 25209, "loss": 1.2174, "lr": 4.798163997944854e-05, "epoch": 0.1023451620341101, "percentage": 3.41, "elapsed_time": "3:35:31", "remaining_time": "4 days, 5:42:14", "throughput": 17900.91, "total_tokens": 231490368} +{"current_steps": 870, "total_steps": 25209, "loss": 1.2418, "lr": 4.79595621979551e-05, "epoch": 0.10353522205776254, "percentage": 3.45, "elapsed_time": "3:37:14", "remaining_time": "4 days, 5:17:29", "throughput": 17966.65, "total_tokens": 234185216} +{"current_steps": 880, "total_steps": 25209, "loss": 1.2307, "lr": 4.793751486437702e-05, "epoch": 0.10472528208141497, "percentage": 3.49, "elapsed_time": "3:38:57", "remaining_time": "4 days, 4:53:16", "throughput": 18029.56, "total_tokens": 236856640} +{"current_steps": 890, "total_steps": 25209, "loss": 1.2329, "lr": 4.7915497908793064e-05, "epoch": 0.10591534210506742, "percentage": 3.53, "elapsed_time": "3:40:46", "remaining_time": "4 days, 4:32:36", "throughput": 18083.15, "total_tokens": 239538432} +{"current_steps": 900, "total_steps": 25209, "loss": 1.2306, "lr": 4.7893511261506516e-05, "epoch": 0.10710540212871987, "percentage": 3.57, "elapsed_time": "3:42:38", "remaining_time": "4 days, 4:13:33", "throughput": 18135.2, "total_tokens": 242259392} +{"current_steps": 910, "total_steps": 25209, "loss": 1.2152, "lr": 4.787155485304435e-05, "epoch": 0.1082954621523723, "percentage": 3.61, "elapsed_time": "3:44:18", "remaining_time": "4 days, 3:49:27", "throughput": 18197.22, "total_tokens": 244904512} +{"current_steps": 920, "total_steps": 25209, "loss": 1.2087, "lr": 4.784962861415629e-05, "epoch": 0.10948552217602475, "percentage": 3.65, "elapsed_time": "3:46:12", "remaining_time": "4 days, 3:32:16", "throughput": 18244.02, "total_tokens": 247622336} +{"current_steps": 930, "total_steps": 25209, "loss": 1.2384, "lr": 4.7827732475813884e-05, "epoch": 0.1106755821996772, "percentage": 3.69, "elapsed_time": "3:47:54", "remaining_time": "4 days, 3:09:57", "throughput": 18305.83, "total_tokens": 250326464} +{"current_steps": 940, "total_steps": 25209, "loss": 1.227, "lr": 4.7805866369209576e-05, "epoch": 0.11186564222332963, "percentage": 3.73, "elapsed_time": "3:49:41", "remaining_time": "4 days, 2:49:59", "throughput": 18359.73, "total_tokens": 253016064} +{"current_steps": 950, "total_steps": 25209, "loss": 1.2073, "lr": 4.778403022575583e-05, "epoch": 0.11305570224698208, "percentage": 3.77, "elapsed_time": "3:51:23", "remaining_time": "4 days, 2:28:39", "throughput": 18419.35, "total_tokens": 255719936} +{"current_steps": 960, "total_steps": 25209, "loss": 1.2168, "lr": 4.7762223977084195e-05, "epoch": 0.11424576227063453, "percentage": 3.81, "elapsed_time": "3:53:06", "remaining_time": "4 days, 2:08:21", "throughput": 18475.14, "total_tokens": 258411008} +{"current_steps": 970, "total_steps": 25209, "loss": 1.2214, "lr": 4.774044755504444e-05, "epoch": 0.11543582229428696, "percentage": 3.85, "elapsed_time": "3:54:44", "remaining_time": "4 days, 1:45:53", "throughput": 18537.7, "total_tokens": 261094720} +{"current_steps": 980, "total_steps": 25209, "loss": 1.2132, "lr": 4.7718700891703616e-05, "epoch": 0.11662588231793941, "percentage": 3.89, "elapsed_time": "3:56:27", "remaining_time": "4 days, 1:26:12", "throughput": 18594.55, "total_tokens": 263816448} +{"current_steps": 990, "total_steps": 25209, "loss": 1.2124, "lr": 4.7696983919345215e-05, "epoch": 0.11781594234159186, "percentage": 3.93, "elapsed_time": "3:58:05", "remaining_time": "4 days, 1:04:41", "throughput": 18655.04, "total_tokens": 266501184} +{"current_steps": 1000, "total_steps": 25209, "loss": 1.2187, "lr": 4.7675296570468216e-05, "epoch": 0.11900600236524429, "percentage": 3.97, "elapsed_time": "3:59:44", "remaining_time": "4 days, 0:43:46", "throughput": 18713.9, "total_tokens": 269184384} +{"current_steps": 1010, "total_steps": 25209, "loss": 1.2, "lr": 4.76536387777863e-05, "epoch": 0.12019606238889674, "percentage": 4.01, "elapsed_time": "4:01:29", "remaining_time": "4 days, 0:26:05", "throughput": 18763.72, "total_tokens": 271881024} +{"current_steps": 1020, "total_steps": 25209, "loss": 1.2158, "lr": 4.7632010474226915e-05, "epoch": 0.12138612241254919, "percentage": 4.05, "elapsed_time": "4:03:19", "remaining_time": "4 days, 0:10:30", "throughput": 18805.6, "total_tokens": 274558784} +{"current_steps": 1030, "total_steps": 25209, "loss": 1.2259, "lr": 4.761041159293035e-05, "epoch": 0.12257618243620162, "percentage": 4.09, "elapsed_time": "4:05:10", "remaining_time": "3 days, 23:55:26", "throughput": 18846.02, "total_tokens": 277235136} +{"current_steps": 1040, "total_steps": 25209, "loss": 1.2202, "lr": 4.7588842067249e-05, "epoch": 0.12376624245985407, "percentage": 4.13, "elapsed_time": "4:06:57", "remaining_time": "3 days, 23:39:19", "throughput": 18891.34, "total_tokens": 279930112} +{"current_steps": 1050, "total_steps": 25209, "loss": 1.2052, "lr": 4.756730183074637e-05, "epoch": 0.12495630248350652, "percentage": 4.17, "elapsed_time": "4:08:42", "remaining_time": "3 days, 23:22:21", "throughput": 18942.15, "total_tokens": 282661184} +{"current_steps": 1060, "total_steps": 25209, "loss": 1.2124, "lr": 4.7545790817196314e-05, "epoch": 0.12614636250715897, "percentage": 4.2, "elapsed_time": "4:10:22", "remaining_time": "3 days, 23:03:54", "throughput": 18996.86, "total_tokens": 285372672} +{"current_steps": 1070, "total_steps": 25209, "loss": 1.2007, "lr": 4.752430896058212e-05, "epoch": 0.1273364225308114, "percentage": 4.24, "elapsed_time": "4:12:01", "remaining_time": "3 days, 22:45:33", "throughput": 19047.73, "total_tokens": 288026112} +{"current_steps": 1080, "total_steps": 25209, "loss": 1.2192, "lr": 4.750285619509567e-05, "epoch": 0.12852648255446383, "percentage": 4.28, "elapsed_time": "4:13:42", "remaining_time": "3 days, 22:28:18", "throughput": 19097.02, "total_tokens": 290706624} +{"current_steps": 1090, "total_steps": 25209, "loss": 1.2042, "lr": 4.7481432455136644e-05, "epoch": 0.1297165425781163, "percentage": 4.32, "elapsed_time": "4:15:27", "remaining_time": "3 days, 22:12:34", "throughput": 19143.22, "total_tokens": 293413632} +{"current_steps": 1100, "total_steps": 25209, "loss": 1.2042, "lr": 4.7460037675311584e-05, "epoch": 0.13090660260176873, "percentage": 4.36, "elapsed_time": "4:17:11", "remaining_time": "3 days, 21:57:05", "throughput": 19188.52, "total_tokens": 296115328} +{"current_steps": 1110, "total_steps": 25209, "loss": 1.2045, "lr": 4.7438671790433126e-05, "epoch": 0.13209666262542116, "percentage": 4.4, "elapsed_time": "4:18:57", "remaining_time": "3 days, 21:42:20", "throughput": 19231.44, "total_tokens": 298816256} +{"current_steps": 1120, "total_steps": 25209, "loss": 1.2063, "lr": 4.741733473551915e-05, "epoch": 0.13328672264907362, "percentage": 4.44, "elapsed_time": "4:20:36", "remaining_time": "3 days, 21:25:09", "throughput": 19281.56, "total_tokens": 301494912} +{"current_steps": 1130, "total_steps": 25209, "loss": 1.2123, "lr": 4.7396026445791966e-05, "epoch": 0.13447678267272606, "percentage": 4.48, "elapsed_time": "4:22:17", "remaining_time": "3 days, 21:09:07", "throughput": 19331.46, "total_tokens": 304228288} +{"current_steps": 1140, "total_steps": 25209, "loss": 1.1986, "lr": 4.737474685667742e-05, "epoch": 0.1356668426963785, "percentage": 4.52, "elapsed_time": "4:23:57", "remaining_time": "3 days, 20:53:06", "throughput": 19377.49, "total_tokens": 306897152} +{"current_steps": 1150, "total_steps": 25209, "loss": 1.1963, "lr": 4.7353495903804165e-05, "epoch": 0.13685690272003095, "percentage": 4.56, "elapsed_time": "4:25:35", "remaining_time": "3 days, 20:36:29", "throughput": 19423.61, "total_tokens": 309529856} +{"current_steps": 1160, "total_steps": 25209, "loss": 1.2066, "lr": 4.733227352300277e-05, "epoch": 0.1380469627436834, "percentage": 4.6, "elapsed_time": "4:27:17", "remaining_time": "3 days, 20:21:34", "throughput": 19470.04, "total_tokens": 312256832} +{"current_steps": 1170, "total_steps": 25209, "loss": 1.2043, "lr": 4.731107965030496e-05, "epoch": 0.13923702276733582, "percentage": 4.64, "elapsed_time": "4:28:55", "remaining_time": "3 days, 20:05:23", "throughput": 19519.47, "total_tokens": 314957888} +{"current_steps": 1180, "total_steps": 25209, "loss": 1.2, "lr": 4.728991422194278e-05, "epoch": 0.14042708279098828, "percentage": 4.68, "elapsed_time": "4:30:35", "remaining_time": "3 days, 19:50:08", "throughput": 19567.36, "total_tokens": 317681792} +{"current_steps": 1190, "total_steps": 25209, "loss": 1.1946, "lr": 4.726877717434773e-05, "epoch": 0.14161714281464072, "percentage": 4.72, "elapsed_time": "4:32:15", "remaining_time": "3 days, 19:35:20", "throughput": 19613.16, "total_tokens": 320394560} +{"current_steps": 1200, "total_steps": 25209, "loss": 1.201, "lr": 4.724766844415013e-05, "epoch": 0.14280720283829315, "percentage": 4.76, "elapsed_time": "4:33:54", "remaining_time": "3 days, 19:20:06", "throughput": 19658.52, "total_tokens": 323071168} +{"current_steps": 1210, "total_steps": 25209, "loss": 1.1836, "lr": 4.722658796817813e-05, "epoch": 0.1439972628619456, "percentage": 4.8, "elapsed_time": "4:35:40", "remaining_time": "3 days, 19:07:37", "throughput": 19691.94, "total_tokens": 325709568} +{"current_steps": 1220, "total_steps": 25209, "loss": 1.2091, "lr": 4.7205535683457044e-05, "epoch": 0.14518732288559805, "percentage": 4.84, "elapsed_time": "4:37:18", "remaining_time": "3 days, 18:52:40", "throughput": 19734.65, "total_tokens": 328350784} +{"current_steps": 1230, "total_steps": 25209, "loss": 1.1932, "lr": 4.7184511527208484e-05, "epoch": 0.14637738290925048, "percentage": 4.88, "elapsed_time": "4:39:02", "remaining_time": "3 days, 18:39:51", "throughput": 19771.01, "total_tokens": 331010240} +{"current_steps": 1240, "total_steps": 25209, "loss": 1.2002, "lr": 4.7163515436849644e-05, "epoch": 0.14756744293290291, "percentage": 4.92, "elapsed_time": "4:40:53", "remaining_time": "3 days, 18:29:31", "throughput": 19800.29, "total_tokens": 333700416} +{"current_steps": 1250, "total_steps": 25209, "loss": 1.188, "lr": 4.714254734999245e-05, "epoch": 0.14875750295655538, "percentage": 4.96, "elapsed_time": "4:42:31", "remaining_time": "3 days, 18:15:11", "throughput": 19844.22, "total_tokens": 336388288} +{"current_steps": 1260, "total_steps": 25209, "loss": 1.1961, "lr": 4.712160720444284e-05, "epoch": 0.1499475629802078, "percentage": 5.0, "elapsed_time": "4:44:10", "remaining_time": "3 days, 18:01:20", "throughput": 19883.87, "total_tokens": 339029632} +{"current_steps": 1270, "total_steps": 25209, "loss": 1.183, "lr": 4.710069493819992e-05, "epoch": 0.15113762300386024, "percentage": 5.04, "elapsed_time": "4:45:47", "remaining_time": "3 days, 17:46:59", "throughput": 19926.08, "total_tokens": 341678016} +{"current_steps": 1280, "total_steps": 25209, "loss": 1.1996, "lr": 4.70798104894553e-05, "epoch": 0.1523276830275127, "percentage": 5.08, "elapsed_time": "4:47:26", "remaining_time": "3 days, 17:33:26", "throughput": 19968.46, "total_tokens": 344376896} +{"current_steps": 1290, "total_steps": 25209, "loss": 1.1832, "lr": 4.705895379659219e-05, "epoch": 0.15351774305116514, "percentage": 5.12, "elapsed_time": "4:49:02", "remaining_time": "3 days, 17:19:15", "throughput": 20012.26, "total_tokens": 347055808} +{"current_steps": 1300, "total_steps": 25209, "loss": 1.1919, "lr": 4.7038124798184766e-05, "epoch": 0.15470780307481757, "percentage": 5.16, "elapsed_time": "4:50:44", "remaining_time": "3 days, 17:07:04", "throughput": 20051.77, "total_tokens": 349785472} +{"current_steps": 1310, "total_steps": 25209, "loss": 1.1908, "lr": 4.7017323432997304e-05, "epoch": 0.15589786309847004, "percentage": 5.2, "elapsed_time": "4:52:27", "remaining_time": "3 days, 16:55:29", "throughput": 20089.2, "total_tokens": 352516864} +{"current_steps": 1320, "total_steps": 25209, "loss": 1.1891, "lr": 4.6996549639983506e-05, "epoch": 0.15708792312212247, "percentage": 5.24, "elapsed_time": "4:54:14", "remaining_time": "3 days, 16:45:05", "throughput": 20123.42, "total_tokens": 355268352} +{"current_steps": 1330, "total_steps": 25209, "loss": 1.1767, "lr": 4.697580335828569e-05, "epoch": 0.1582779831457749, "percentage": 5.28, "elapsed_time": "4:55:53", "remaining_time": "3 days, 16:32:35", "throughput": 20159.68, "total_tokens": 357912640} +{"current_steps": 1340, "total_steps": 25209, "loss": 1.1998, "lr": 4.6955084527234076e-05, "epoch": 0.15946804316942736, "percentage": 5.32, "elapsed_time": "4:57:33", "remaining_time": "3 days, 16:20:14", "throughput": 20197.12, "total_tokens": 360584384} +{"current_steps": 1350, "total_steps": 25209, "loss": 1.1872, "lr": 4.6934393086346034e-05, "epoch": 0.1606581031930798, "percentage": 5.36, "elapsed_time": "4:59:11", "remaining_time": "3 days, 16:07:37", "throughput": 20236.13, "total_tokens": 363262336} +{"current_steps": 1360, "total_steps": 25209, "loss": 1.2024, "lr": 4.6913728975325324e-05, "epoch": 0.16184816321673223, "percentage": 5.39, "elapsed_time": "5:00:53", "remaining_time": "3 days, 15:56:29", "throughput": 20271.86, "total_tokens": 365981568} +{"current_steps": 1370, "total_steps": 25209, "loss": 1.199, "lr": 4.6893092134061393e-05, "epoch": 0.1630382232403847, "percentage": 5.43, "elapsed_time": "5:02:30", "remaining_time": "3 days, 15:43:45", "throughput": 20312.15, "total_tokens": 368667776} +{"current_steps": 1380, "total_steps": 25209, "loss": 1.1972, "lr": 4.687248250262859e-05, "epoch": 0.16422828326403713, "percentage": 5.47, "elapsed_time": "5:04:12", "remaining_time": "3 days, 15:32:58", "throughput": 20345.73, "total_tokens": 371366848} +{"current_steps": 1390, "total_steps": 25209, "loss": 1.1698, "lr": 4.685190002128548e-05, "epoch": 0.16541834328768956, "percentage": 5.51, "elapsed_time": "5:05:51", "remaining_time": "3 days, 15:21:17", "throughput": 20382.72, "total_tokens": 374061760} +{"current_steps": 1400, "total_steps": 25209, "loss": 1.2014, "lr": 4.6831344630474114e-05, "epoch": 0.16660840331134202, "percentage": 5.55, "elapsed_time": "5:07:33", "remaining_time": "3 days, 15:10:34", "throughput": 20417.32, "total_tokens": 376778624} +{"current_steps": 1410, "total_steps": 25209, "loss": 1.1904, "lr": 4.6810816270819276e-05, "epoch": 0.16779846333499446, "percentage": 5.59, "elapsed_time": "5:09:14", "remaining_time": "3 days, 14:59:35", "throughput": 20452.83, "total_tokens": 379490496} +{"current_steps": 1420, "total_steps": 25209, "loss": 1.1751, "lr": 4.679031488312777e-05, "epoch": 0.1689885233586469, "percentage": 5.63, "elapsed_time": "5:10:51", "remaining_time": "3 days, 14:47:46", "throughput": 20489.67, "total_tokens": 382164992} +{"current_steps": 1430, "total_steps": 25209, "loss": 1.1917, "lr": 4.6769840408387717e-05, "epoch": 0.17017858338229935, "percentage": 5.67, "elapsed_time": "5:12:32", "remaining_time": "3 days, 14:37:07", "throughput": 20524.51, "total_tokens": 384883648} +{"current_steps": 1440, "total_steps": 25209, "loss": 1.1861, "lr": 4.674939278776787e-05, "epoch": 0.1713686434059518, "percentage": 5.71, "elapsed_time": "5:14:14", "remaining_time": "3 days, 14:26:50", "throughput": 20558.76, "total_tokens": 387616896} +{"current_steps": 1450, "total_steps": 25209, "loss": 1.1898, "lr": 4.672897196261683e-05, "epoch": 0.17255870342960422, "percentage": 5.75, "elapsed_time": "5:15:53", "remaining_time": "3 days, 14:16:00", "throughput": 20593.98, "total_tokens": 390324608} +{"current_steps": 1460, "total_steps": 25209, "loss": 1.1835, "lr": 4.670857787446238e-05, "epoch": 0.17374876345325668, "percentage": 5.79, "elapsed_time": "5:17:29", "remaining_time": "3 days, 14:04:28", "throughput": 20630.39, "total_tokens": 393000000} +{"current_steps": 1470, "total_steps": 25209, "loss": 1.1839, "lr": 4.668821046501082e-05, "epoch": 0.17493882347690912, "percentage": 5.83, "elapsed_time": "5:19:07", "remaining_time": "3 days, 13:53:39", "throughput": 20663.81, "total_tokens": 395669504} +{"current_steps": 1480, "total_steps": 25209, "loss": 1.1729, "lr": 4.6667869676146194e-05, "epoch": 0.17612888350056155, "percentage": 5.87, "elapsed_time": "5:20:49", "remaining_time": "3 days, 13:43:44", "throughput": 20694.34, "total_tokens": 398348992} +{"current_steps": 1490, "total_steps": 25209, "loss": 1.1846, "lr": 4.6647555449929645e-05, "epoch": 0.177318943524214, "percentage": 5.91, "elapsed_time": "5:22:30", "remaining_time": "3 days, 13:33:50", "throughput": 20725.66, "total_tokens": 401044160} +{"current_steps": 1500, "total_steps": 25209, "loss": 1.1673, "lr": 4.662726772859869e-05, "epoch": 0.17850900354786645, "percentage": 5.95, "elapsed_time": "5:24:09", "remaining_time": "3 days, 13:23:40", "throughput": 20757.56, "total_tokens": 403725760} +{"current_steps": 1510, "total_steps": 25209, "loss": 1.1719, "lr": 4.660700645456655e-05, "epoch": 0.17969906357151888, "percentage": 5.99, "elapsed_time": "5:25:53", "remaining_time": "3 days, 13:14:40", "throughput": 20786.6, "total_tokens": 406443200} +{"current_steps": 1520, "total_steps": 25209, "loss": 1.1833, "lr": 4.658677157042149e-05, "epoch": 0.18088912359517134, "percentage": 6.03, "elapsed_time": "5:27:33", "remaining_time": "3 days, 13:05:03", "throughput": 20817.55, "total_tokens": 409145920} +{"current_steps": 1530, "total_steps": 25209, "loss": 1.1855, "lr": 4.656656301892605e-05, "epoch": 0.18207918361882378, "percentage": 6.07, "elapsed_time": "5:29:09", "remaining_time": "3 days, 12:54:06", "throughput": 20851.15, "total_tokens": 411791744} +{"current_steps": 1540, "total_steps": 25209, "loss": 1.1859, "lr": 4.6546380743016465e-05, "epoch": 0.1832692436424762, "percentage": 6.11, "elapsed_time": "5:30:47", "remaining_time": "3 days, 12:44:06", "throughput": 20883.38, "total_tokens": 414484352} +{"current_steps": 1550, "total_steps": 25209, "loss": 1.1855, "lr": 4.652622468580193e-05, "epoch": 0.18445930366612867, "percentage": 6.15, "elapsed_time": "5:32:28", "remaining_time": "3 days, 12:34:51", "throughput": 20912.68, "total_tokens": 417176448} +{"current_steps": 1560, "total_steps": 25209, "loss": 1.1756, "lr": 4.650609479056392e-05, "epoch": 0.1856493636897811, "percentage": 6.19, "elapsed_time": "5:34:16", "remaining_time": "3 days, 12:27:23", "throughput": 20933.71, "total_tokens": 419850176} +{"current_steps": 1570, "total_steps": 25209, "loss": 1.1809, "lr": 4.648599100075556e-05, "epoch": 0.18683942371343354, "percentage": 6.23, "elapsed_time": "5:36:37", "remaining_time": "3 days, 12:28:20", "throughput": 20920.92, "total_tokens": 422540800} +{"current_steps": 1580, "total_steps": 25209, "loss": 1.1918, "lr": 4.6465913260000945e-05, "epoch": 0.188029483737086, "percentage": 6.27, "elapsed_time": "5:38:35", "remaining_time": "3 days, 12:23:36", "throughput": 20929.1, "total_tokens": 425180288} +{"current_steps": 1590, "total_steps": 25209, "loss": 1.1892, "lr": 4.644586151209444e-05, "epoch": 0.18921954376073843, "percentage": 6.31, "elapsed_time": "5:40:35", "remaining_time": "3 days, 12:19:22", "throughput": 20937.61, "total_tokens": 427869120} +{"current_steps": 1600, "total_steps": 25209, "loss": 1.1807, "lr": 4.6425835701000084e-05, "epoch": 0.19040960378439087, "percentage": 6.35, "elapsed_time": "5:42:33", "remaining_time": "3 days, 12:14:37", "throughput": 20946.85, "total_tokens": 430528256} +{"current_steps": 1610, "total_steps": 25209, "loss": 1.1801, "lr": 4.640583577085084e-05, "epoch": 0.19159966380804333, "percentage": 6.39, "elapsed_time": "5:44:27", "remaining_time": "3 days, 12:09:03", "throughput": 20963.26, "total_tokens": 433264640} +{"current_steps": 1620, "total_steps": 25209, "loss": 1.1514, "lr": 4.638586166594806e-05, "epoch": 0.19278972383169576, "percentage": 6.43, "elapsed_time": "5:46:22", "remaining_time": "3 days, 12:03:40", "throughput": 20976.87, "total_tokens": 435957376} +{"current_steps": 1630, "total_steps": 25209, "loss": 1.1686, "lr": 4.6365913330760726e-05, "epoch": 0.1939797838553482, "percentage": 6.47, "elapsed_time": "5:48:05", "remaining_time": "3 days, 11:55:16", "throughput": 21000.16, "total_tokens": 438590656} +{"current_steps": 1640, "total_steps": 25209, "loss": 1.1659, "lr": 4.6345990709924855e-05, "epoch": 0.19516984387900066, "percentage": 6.51, "elapsed_time": "5:49:52", "remaining_time": "3 days, 11:48:12", "throughput": 21020.93, "total_tokens": 441284992} +{"current_steps": 1650, "total_steps": 25209, "loss": 1.176, "lr": 4.632609374824284e-05, "epoch": 0.1963599039026531, "percentage": 6.55, "elapsed_time": "5:51:40", "remaining_time": "3 days, 11:41:20", "throughput": 21040.05, "total_tokens": 443961536} +{"current_steps": 1660, "total_steps": 25209, "loss": 1.1616, "lr": 4.630622239068285e-05, "epoch": 0.19754996392630553, "percentage": 6.58, "elapsed_time": "5:53:36", "remaining_time": "3 days, 11:36:14", "throughput": 21053.13, "total_tokens": 446665152} +{"current_steps": 1670, "total_steps": 25209, "loss": 1.1795, "lr": 4.628637658237808e-05, "epoch": 0.198740023949958, "percentage": 6.62, "elapsed_time": "5:55:35", "remaining_time": "3 days, 11:32:11", "throughput": 21059.39, "total_tokens": 449317248} +{"current_steps": 1680, "total_steps": 25209, "loss": 1.1622, "lr": 4.626655626862625e-05, "epoch": 0.19993008397361042, "percentage": 6.66, "elapsed_time": "5:57:50", "remaining_time": "3 days, 11:31:42", "throughput": 21053.86, "total_tokens": 452037568} +{"current_steps": 1690, "total_steps": 25209, "loss": 1.1802, "lr": 4.624676139488888e-05, "epoch": 0.20112014399726286, "percentage": 6.7, "elapsed_time": "6:00:21", "remaining_time": "3 days, 11:34:57", "throughput": 21033.38, "total_tokens": 454773248} +{"current_steps": 1700, "total_steps": 25209, "loss": 1.1732, "lr": 4.6226991906790686e-05, "epoch": 0.20231020402091532, "percentage": 6.74, "elapsed_time": "6:02:48", "remaining_time": "3 days, 11:37:09", "throughput": 21020.14, "total_tokens": 457571456} +{"current_steps": 1710, "total_steps": 25209, "loss": 1.1669, "lr": 4.620724775011897e-05, "epoch": 0.20350026404456775, "percentage": 6.78, "elapsed_time": "6:05:40", "remaining_time": "3 days, 11:45:04", "throughput": 20979.51, "total_tokens": 460295232} +{"current_steps": 1720, "total_steps": 25209, "loss": 1.1738, "lr": 4.618752887082297e-05, "epoch": 0.2046903240682202, "percentage": 6.82, "elapsed_time": "6:09:49", "remaining_time": "3 days, 12:10:27", "throughput": 20864.71, "total_tokens": 462975552} +{"current_steps": 1730, "total_steps": 25209, "loss": 1.1691, "lr": 4.616783521501325e-05, "epoch": 0.20588038409187262, "percentage": 6.86, "elapsed_time": "6:12:54", "remaining_time": "3 days, 12:20:53", "throughput": 20816.41, "total_tokens": 465746944} +{"current_steps": 1740, "total_steps": 25209, "loss": 1.1743, "lr": 4.614816672896108e-05, "epoch": 0.20707044411552508, "percentage": 6.9, "elapsed_time": "6:15:37", "remaining_time": "3 days, 12:26:27", "throughput": 20786.45, "total_tokens": 468479040} +{"current_steps": 1750, "total_steps": 25209, "loss": 1.1732, "lr": 4.612852335909782e-05, "epoch": 0.20826050413917752, "percentage": 6.94, "elapsed_time": "6:18:19", "remaining_time": "3 days, 12:31:33", "throughput": 20759.42, "total_tokens": 471233472} +{"current_steps": 1760, "total_steps": 25209, "loss": 1.176, "lr": 4.6108905052014323e-05, "epoch": 0.20945056416282995, "percentage": 6.98, "elapsed_time": "6:20:51", "remaining_time": "3 days, 12:34:16", "throughput": 20741.24, "total_tokens": 473966912} +{"current_steps": 1770, "total_steps": 25209, "loss": 1.1565, "lr": 4.608931175446027e-05, "epoch": 0.2106406241864824, "percentage": 7.02, "elapsed_time": "6:23:12", "remaining_time": "3 days, 12:34:40", "throughput": 20728.7, "total_tokens": 476612928} +{"current_steps": 1780, "total_steps": 25209, "loss": 1.1658, "lr": 4.606974341334367e-05, "epoch": 0.21183068421013485, "percentage": 7.06, "elapsed_time": "6:25:51", "remaining_time": "3 days, 12:38:50", "throughput": 20703.12, "total_tokens": 479311616} +{"current_steps": 1790, "total_steps": 25209, "loss": 1.1709, "lr": 4.605019997573011e-05, "epoch": 0.21302074423378728, "percentage": 7.1, "elapsed_time": "6:28:29", "remaining_time": "3 days, 12:42:43", "throughput": 20676.76, "total_tokens": 481963968} +{"current_steps": 1800, "total_steps": 25209, "loss": 1.1588, "lr": 4.603068138884229e-05, "epoch": 0.21421080425743974, "percentage": 7.14, "elapsed_time": "6:30:44", "remaining_time": "3 days, 12:41:40", "throughput": 20670.55, "total_tokens": 484618368} +{"current_steps": 1810, "total_steps": 25209, "loss": 1.1787, "lr": 4.6011187600059345e-05, "epoch": 0.21540086428109217, "percentage": 7.18, "elapsed_time": "6:33:06", "remaining_time": "3 days, 12:41:59", "throughput": 20660.42, "total_tokens": 487309632} +{"current_steps": 1820, "total_steps": 25209, "loss": 1.1723, "lr": 4.599171855691629e-05, "epoch": 0.2165909243047446, "percentage": 7.22, "elapsed_time": "6:35:13", "remaining_time": "3 days, 12:39:10", "throughput": 20663.36, "total_tokens": 490010624} +{"current_steps": 1830, "total_steps": 25209, "loss": 1.1569, "lr": 4.597227420710335e-05, "epoch": 0.21778098432839707, "percentage": 7.26, "elapsed_time": "6:37:25", "remaining_time": "3 days, 12:37:20", "throughput": 20662.76, "total_tokens": 492720704} +{"current_steps": 1840, "total_steps": 25209, "loss": 1.1665, "lr": 4.595285449846551e-05, "epoch": 0.2189710443520495, "percentage": 7.3, "elapsed_time": "6:39:29", "remaining_time": "3 days, 12:33:42", "throughput": 20667.52, "total_tokens": 495385216} +{"current_steps": 1850, "total_steps": 25209, "loss": 1.1695, "lr": 4.593345937900178e-05, "epoch": 0.22016110437570194, "percentage": 7.34, "elapsed_time": "6:42:15", "remaining_time": "3 days, 12:39:04", "throughput": 20635.52, "total_tokens": 498045760} +{"current_steps": 1860, "total_steps": 25209, "loss": 1.1508, "lr": 4.591408879686472e-05, "epoch": 0.2213511643993544, "percentage": 7.38, "elapsed_time": "6:44:39", "remaining_time": "3 days, 12:39:45", "throughput": 20622.06, "total_tokens": 500693248} +{"current_steps": 1870, "total_steps": 25209, "loss": 1.176, "lr": 4.5894742700359775e-05, "epoch": 0.22254122442300683, "percentage": 7.42, "elapsed_time": "6:47:45", "remaining_time": "3 days, 12:49:08", "throughput": 20574.19, "total_tokens": 503359744} +{"current_steps": 1880, "total_steps": 25209, "loss": 1.1753, "lr": 4.587542103794477e-05, "epoch": 0.22373128444665927, "percentage": 7.46, "elapsed_time": "6:51:27", "remaining_time": "3 days, 13:05:43", "throughput": 20499.57, "total_tokens": 506075392} +{"current_steps": 1890, "total_steps": 25209, "loss": 1.171, "lr": 4.5856123758229247e-05, "epoch": 0.22492134447031173, "percentage": 7.5, "elapsed_time": "6:54:44", "remaining_time": "3 days, 13:17:07", "throughput": 20446.06, "total_tokens": 508790336} +{"current_steps": 1900, "total_steps": 25209, "loss": 1.1504, "lr": 4.5836850809973993e-05, "epoch": 0.22611140449396416, "percentage": 7.54, "elapsed_time": "6:57:56", "remaining_time": "3 days, 13:27:13", "throughput": 20398.68, "total_tokens": 511522752} +{"current_steps": 1910, "total_steps": 25209, "loss": 1.1526, "lr": 4.5817602142090385e-05, "epoch": 0.2273014645176166, "percentage": 7.58, "elapsed_time": "7:00:56", "remaining_time": "3 days, 13:34:44", "throughput": 20361.56, "total_tokens": 514252928} +{"current_steps": 1920, "total_steps": 25209, "loss": 1.1596, "lr": 4.579837770363989e-05, "epoch": 0.22849152454126906, "percentage": 7.62, "elapsed_time": "7:03:50", "remaining_time": "3 days, 13:41:05", "throughput": 20324.63, "total_tokens": 516868352} +{"current_steps": 1930, "total_steps": 25209, "loss": 1.1803, "lr": 4.57791774438334e-05, "epoch": 0.2296815845649215, "percentage": 7.66, "elapsed_time": "7:06:49", "remaining_time": "3 days, 13:48:10", "throughput": 20289.3, "total_tokens": 519594240} +{"current_steps": 1940, "total_steps": 25209, "loss": 1.1743, "lr": 4.576000131203078e-05, "epoch": 0.23087164458857393, "percentage": 7.7, "elapsed_time": "7:09:38", "remaining_time": "3 days, 13:53:10", "throughput": 20260.89, "total_tokens": 522286848} +{"current_steps": 1950, "total_steps": 25209, "loss": 1.1503, "lr": 4.574084925774023e-05, "epoch": 0.2320617046122264, "percentage": 7.74, "elapsed_time": "7:13:02", "remaining_time": "3 days, 14:05:16", "throughput": 20204.09, "total_tokens": 524961856} +{"current_steps": 1960, "total_steps": 25209, "loss": 1.151, "lr": 4.5721721230617795e-05, "epoch": 0.23325176463587882, "percentage": 7.78, "elapsed_time": "7:16:14", "remaining_time": "3 days, 14:14:32", "throughput": 20159.2, "total_tokens": 527653056} +{"current_steps": 1970, "total_steps": 25209, "loss": 1.1743, "lr": 4.57026171804667e-05, "epoch": 0.23444182465953126, "percentage": 7.81, "elapsed_time": "7:19:19", "remaining_time": "3 days, 14:22:29", "throughput": 20120.15, "total_tokens": 530358400} +{"current_steps": 1980, "total_steps": 25209, "loss": 1.172, "lr": 4.568353705723692e-05, "epoch": 0.23563188468318372, "percentage": 7.85, "elapsed_time": "7:22:50", "remaining_time": "3 days, 14:35:19", "throughput": 20061.98, "total_tokens": 533056128} +{"current_steps": 1990, "total_steps": 25209, "loss": 1.1579, "lr": 4.566448081102455e-05, "epoch": 0.23682194470683615, "percentage": 7.89, "elapsed_time": "7:25:56", "remaining_time": "3 days, 14:43:16", "throughput": 20021.47, "total_tokens": 535714304} +{"current_steps": 2000, "total_steps": 25209, "loss": 1.1619, "lr": 4.564544839207128e-05, "epoch": 0.23801200473048859, "percentage": 7.93, "elapsed_time": "7:29:31", "remaining_time": "3 days, 14:56:26", "throughput": 19964.75, "total_tokens": 538471040} +{"current_steps": 2010, "total_steps": 25209, "loss": 1.1698, "lr": 4.562643975076387e-05, "epoch": 0.23920206475414105, "percentage": 7.97, "elapsed_time": "7:32:53", "remaining_time": "3 days, 15:07:15", "throughput": 19914.66, "total_tokens": 541159552} +{"current_steps": 2020, "total_steps": 25209, "loss": 1.1626, "lr": 4.560745483763357e-05, "epoch": 0.24039212477779348, "percentage": 8.01, "elapsed_time": "7:36:37", "remaining_time": "3 days, 15:21:49", "throughput": 19852.16, "total_tokens": 543890048} +{"current_steps": 2030, "total_steps": 25209, "loss": 1.1668, "lr": 4.5588493603355595e-05, "epoch": 0.24158218480144592, "percentage": 8.05, "elapsed_time": "7:40:01", "remaining_time": "3 days, 15:32:38", "throughput": 19801.91, "total_tokens": 546558784} +{"current_steps": 10, "total_steps": 25209, "loss": 2.0927, "lr": 4.9977515176118345e-05, "epoch": 0.001190060023652443, "percentage": 0.04, "elapsed_time": "0:01:59", "remaining_time": "3 days, 11:35:51", "throughput": 22667.63, "total_tokens": 2707200} +{"current_steps": 20, "total_steps": 25209, "loss": 1.6142, "lr": 4.9952567580506e-05, "epoch": 0.002380120047304886, "percentage": 0.08, "elapsed_time": "0:03:46", "remaining_time": "3 days, 7:15:51", "throughput": 23901.96, "total_tokens": 5415424} +{"current_steps": 30, "total_steps": 25209, "loss": 1.5206, "lr": 4.992765730738634e-05, "epoch": 0.003570180070957329, "percentage": 0.12, "elapsed_time": "0:05:45", "remaining_time": "3 days, 8:27:47", "throughput": 23522.58, "total_tokens": 8118336} +{"current_steps": 40, "total_steps": 25209, "loss": 1.4884, "lr": 4.9902784263792476e-05, "epoch": 0.004760240094609772, "percentage": 0.16, "elapsed_time": "0:07:45", "remaining_time": "3 days, 9:20:29", "throughput": 23071.58, "total_tokens": 10737088} +{"current_steps": 50, "total_steps": 25209, "loss": 1.4643, "lr": 4.987794835708133e-05, "epoch": 0.005950300118262215, "percentage": 0.2, "elapsed_time": "0:09:34", "remaining_time": "3 days, 8:14:43", "throughput": 23508.78, "total_tokens": 13496768} +{"current_steps": 60, "total_steps": 25209, "loss": 1.4581, "lr": 4.985314949493234e-05, "epoch": 0.007140360141914658, "percentage": 0.24, "elapsed_time": "0:11:25", "remaining_time": "3 days, 7:48:00", "throughput": 23586.76, "total_tokens": 16166080} +{"current_steps": 70, "total_steps": 25209, "loss": 1.4212, "lr": 4.982838758534584e-05, "epoch": 0.008330420165567102, "percentage": 0.28, "elapsed_time": "0:13:17", "remaining_time": "3 days, 7:34:31", "throughput": 23619.43, "total_tokens": 18840896} +{"current_steps": 80, "total_steps": 25209, "loss": 1.4288, "lr": 4.980366253664179e-05, "epoch": 0.009520480189219544, "percentage": 0.32, "elapsed_time": "0:15:07", "remaining_time": "3 days, 7:10:56", "throughput": 23765.21, "total_tokens": 21566912} +{"current_steps": 90, "total_steps": 25209, "loss": 1.4148, "lr": 4.977897425745825e-05, "epoch": 0.010710540212871987, "percentage": 0.36, "elapsed_time": "0:16:58", "remaining_time": "3 days, 6:56:00", "throughput": 23863.98, "total_tokens": 24296704} +{"current_steps": 100, "total_steps": 25209, "loss": 1.4088, "lr": 4.975432265674997e-05, "epoch": 0.01190060023652443, "percentage": 0.4, "elapsed_time": "0:18:50", "remaining_time": "3 days, 6:53:01", "throughput": 23857.93, "total_tokens": 26983168} +{"current_steps": 110, "total_steps": 25209, "loss": 1.4087, "lr": 4.972970764378705e-05, "epoch": 0.013090660260176872, "percentage": 0.44, "elapsed_time": "0:20:50", "remaining_time": "3 days, 7:17:14", "throughput": 23741.09, "total_tokens": 29699072} +{"current_steps": 120, "total_steps": 25209, "loss": 1.3879, "lr": 4.970512912815344e-05, "epoch": 0.014280720283829316, "percentage": 0.48, "elapsed_time": "0:23:02", "remaining_time": "3 days, 8:16:44", "throughput": 23456.76, "total_tokens": 32424320} +{"current_steps": 130, "total_steps": 25209, "loss": 1.39, "lr": 4.968058701974564e-05, "epoch": 0.015470780307481759, "percentage": 0.52, "elapsed_time": "0:24:56", "remaining_time": "3 days, 8:10:45", "throughput": 23464.27, "total_tokens": 35107904} +{"current_steps": 140, "total_steps": 25209, "loss": 1.3674, "lr": 4.96560812287712e-05, "epoch": 0.016660840331134203, "percentage": 0.56, "elapsed_time": "0:26:42", "remaining_time": "3 days, 7:41:31", "throughput": 23590.37, "total_tokens": 37795840} +{"current_steps": 150, "total_steps": 25209, "loss": 1.3658, "lr": 4.963161166574748e-05, "epoch": 0.017850900354786644, "percentage": 0.6, "elapsed_time": "0:28:26", "remaining_time": "3 days, 7:12:22", "throughput": 23741.49, "total_tokens": 40522688} +{"current_steps": 160, "total_steps": 25209, "loss": 1.3445, "lr": 4.960717824150013e-05, "epoch": 0.019040960378439088, "percentage": 0.63, "elapsed_time": "0:30:09", "remaining_time": "3 days, 6:42:09", "throughput": 23852.94, "total_tokens": 43168064} +{"current_steps": 170, "total_steps": 25209, "loss": 1.3566, "lr": 4.9582780867161893e-05, "epoch": 0.02023102040209153, "percentage": 0.67, "elapsed_time": "0:31:59", "remaining_time": "3 days, 6:32:37", "throughput": 23874.44, "total_tokens": 45833088} +{"current_steps": 180, "total_steps": 25209, "loss": 1.3484, "lr": 4.955841945417105e-05, "epoch": 0.021421080425743973, "percentage": 0.71, "elapsed_time": "0:33:50", "remaining_time": "3 days, 6:25:14", "throughput": 23905.79, "total_tokens": 48536192} +{"current_steps": 190, "total_steps": 25209, "loss": 1.367, "lr": 4.953409391427024e-05, "epoch": 0.022611140449396418, "percentage": 0.75, "elapsed_time": "0:35:47", "remaining_time": "3 days, 6:32:59", "throughput": 23845.04, "total_tokens": 51207040} +{"current_steps": 200, "total_steps": 25209, "loss": 1.3502, "lr": 4.950980415950502e-05, "epoch": 0.02380120047304886, "percentage": 0.79, "elapsed_time": "0:37:48", "remaining_time": "3 days, 6:48:39", "throughput": 23772.64, "total_tokens": 53938624} +{"current_steps": 210, "total_steps": 25209, "loss": 1.3404, "lr": 4.9485550102222575e-05, "epoch": 0.024991260496701303, "percentage": 0.83, "elapsed_time": "0:39:32", "remaining_time": "3 days, 6:26:35", "throughput": 23864.09, "total_tokens": 56610816} +{"current_steps": 220, "total_steps": 25209, "loss": 1.3432, "lr": 4.946133165507037e-05, "epoch": 0.026181320520353744, "percentage": 0.87, "elapsed_time": "0:41:12", "remaining_time": "3 days, 6:00:23", "throughput": 23982.21, "total_tokens": 59291968} +{"current_steps": 230, "total_steps": 25209, "loss": 1.3309, "lr": 4.943714873099483e-05, "epoch": 0.027371380544006188, "percentage": 0.91, "elapsed_time": "0:42:56", "remaining_time": "3 days, 5:43:10", "throughput": 24049.87, "total_tokens": 61958208} +{"current_steps": 240, "total_steps": 25209, "loss": 1.3245, "lr": 4.9413001243240024e-05, "epoch": 0.028561440567658632, "percentage": 0.95, "elapsed_time": "0:44:39", "remaining_time": "3 days, 5:27:00", "throughput": 24109.58, "total_tokens": 64613568} +{"current_steps": 250, "total_steps": 25209, "loss": 1.3253, "lr": 4.938888910534637e-05, "epoch": 0.029751500591311073, "percentage": 0.99, "elapsed_time": "0:46:24", "remaining_time": "3 days, 5:13:19", "throughput": 24166.44, "total_tokens": 67293056} +{"current_steps": 260, "total_steps": 25209, "loss": 1.3321, "lr": 4.936481223114932e-05, "epoch": 0.030941560614963518, "percentage": 1.03, "elapsed_time": "0:48:07", "remaining_time": "3 days, 4:57:42", "throughput": 24220.05, "total_tokens": 69931584} +{"current_steps": 270, "total_steps": 25209, "loss": 1.3223, "lr": 4.934077053477808e-05, "epoch": 0.03213162063861596, "percentage": 1.07, "elapsed_time": "0:49:52", "remaining_time": "3 days, 4:47:04", "throughput": 24278.81, "total_tokens": 72658880} +{"current_steps": 280, "total_steps": 25209, "loss": 1.322, "lr": 4.931676393065431e-05, "epoch": 0.033321680662268406, "percentage": 1.11, "elapsed_time": "0:51:35", "remaining_time": "3 days, 4:32:40", "throughput": 24343.68, "total_tokens": 75345216} +{"current_steps": 290, "total_steps": 25209, "loss": 1.3075, "lr": 4.929279233349088e-05, "epoch": 0.03451174068592085, "percentage": 1.15, "elapsed_time": "0:53:16", "remaining_time": "3 days, 4:17:53", "throughput": 24405.49, "total_tokens": 78013824} +{"current_steps": 300, "total_steps": 25209, "loss": 1.3031, "lr": 4.926885565829051e-05, "epoch": 0.03570180070957329, "percentage": 1.19, "elapsed_time": "0:54:59", "remaining_time": "3 days, 4:06:21", "throughput": 24454.19, "total_tokens": 80693568} +{"current_steps": 310, "total_steps": 25209, "loss": 1.3152, "lr": 4.924495382034461e-05, "epoch": 0.03689186073322573, "percentage": 1.23, "elapsed_time": "0:56:39", "remaining_time": "3 days, 3:51:10", "throughput": 24515.3, "total_tokens": 83347456} +{"current_steps": 320, "total_steps": 25209, "loss": 1.3146, "lr": 4.9221086735231975e-05, "epoch": 0.038081920756878176, "percentage": 1.27, "elapsed_time": "0:58:20", "remaining_time": "3 days, 3:37:57", "throughput": 24568.94, "total_tokens": 86008320} +{"current_steps": 330, "total_steps": 25209, "loss": 1.3044, "lr": 4.919725431881751e-05, "epoch": 0.03927198078053062, "percentage": 1.31, "elapsed_time": "1:00:03", "remaining_time": "3 days, 3:28:07", "throughput": 24617.38, "total_tokens": 88714048} +{"current_steps": 340, "total_steps": 25209, "loss": 1.3155, "lr": 4.917345648725101e-05, "epoch": 0.04046204080418306, "percentage": 1.35, "elapsed_time": "1:01:47", "remaining_time": "3 days, 3:20:06", "throughput": 24649.98, "total_tokens": 91398144} +{"current_steps": 350, "total_steps": 25209, "loss": 1.3006, "lr": 4.914969315696596e-05, "epoch": 0.041652100827835506, "percentage": 1.39, "elapsed_time": "1:03:28", "remaining_time": "3 days, 3:08:24", "throughput": 24704.64, "total_tokens": 94088512} +{"current_steps": 360, "total_steps": 25209, "loss": 1.2977, "lr": 4.912596424467818e-05, "epoch": 0.04284216085148795, "percentage": 1.43, "elapsed_time": "1:05:10", "remaining_time": "3 days, 2:59:08", "throughput": 24728.15, "total_tokens": 96708736} +{"current_steps": 370, "total_steps": 25209, "loss": 1.2956, "lr": 4.910226966738475e-05, "epoch": 0.04403222087514039, "percentage": 1.47, "elapsed_time": "1:06:49", "remaining_time": "3 days, 2:45:40", "throughput": 24784.17, "total_tokens": 99362240} +{"current_steps": 380, "total_steps": 25209, "loss": 1.2805, "lr": 4.9078609342362666e-05, "epoch": 0.045222280898792835, "percentage": 1.51, "elapsed_time": "1:08:26", "remaining_time": "3 days, 2:31:47", "throughput": 24839.45, "total_tokens": 101999872} +{"current_steps": 390, "total_steps": 25209, "loss": 1.2738, "lr": 4.905498318716775e-05, "epoch": 0.046412340922445276, "percentage": 1.55, "elapsed_time": "1:10:13", "remaining_time": "3 days, 2:29:09", "throughput": 24848.1, "total_tokens": 104700800} +{"current_steps": 400, "total_steps": 25209, "loss": 1.2836, "lr": 4.9031391119633295e-05, "epoch": 0.04760240094609772, "percentage": 1.59, "elapsed_time": "1:12:09", "remaining_time": "3 days, 2:35:25", "throughput": 24807.66, "total_tokens": 107404288} +{"current_steps": 410, "total_steps": 25209, "loss": 1.2835, "lr": 4.9007833057869e-05, "epoch": 0.048792460969750165, "percentage": 1.63, "elapsed_time": "1:14:06", "remaining_time": "3 days, 2:42:33", "throughput": 24770.01, "total_tokens": 110141888} +{"current_steps": 420, "total_steps": 25209, "loss": 1.285, "lr": 4.898430892025967e-05, "epoch": 0.049982520993402606, "percentage": 1.67, "elapsed_time": "1:15:50", "remaining_time": "3 days, 2:36:33", "throughput": 24783.34, "total_tokens": 112783488} +{"current_steps": 430, "total_steps": 25209, "loss": 1.271, "lr": 4.896081862546415e-05, "epoch": 0.05117258101705505, "percentage": 1.71, "elapsed_time": "1:17:41", "remaining_time": "3 days, 2:37:05", "throughput": 24768.23, "total_tokens": 115458560} +{"current_steps": 440, "total_steps": 25209, "loss": 1.2678, "lr": 4.8937362092414e-05, "epoch": 0.05236264104070749, "percentage": 1.75, "elapsed_time": "1:19:35", "remaining_time": "3 days, 2:40:08", "throughput": 24754.67, "total_tokens": 118207424} +{"current_steps": 450, "total_steps": 25209, "loss": 1.2746, "lr": 4.891393924031244e-05, "epoch": 0.053552701064359935, "percentage": 1.79, "elapsed_time": "1:21:15", "remaining_time": "3 days, 2:30:56", "throughput": 24790.59, "total_tokens": 120869376} +{"current_steps": 460, "total_steps": 25209, "loss": 1.2756, "lr": 4.8890549988633095e-05, "epoch": 0.054742761088012376, "percentage": 1.82, "elapsed_time": "1:23:01", "remaining_time": "3 days, 2:26:56", "throughput": 24818.49, "total_tokens": 123633792} +{"current_steps": 470, "total_steps": 25209, "loss": 1.2832, "lr": 4.8867194257118907e-05, "epoch": 0.05593282111166482, "percentage": 1.86, "elapsed_time": "1:24:48", "remaining_time": "3 days, 2:23:40", "throughput": 24834.42, "total_tokens": 126360960} +{"current_steps": 480, "total_steps": 25209, "loss": 1.2855, "lr": 4.884387196578093e-05, "epoch": 0.057122881135317265, "percentage": 1.9, "elapsed_time": "1:26:31", "remaining_time": "3 days, 2:17:56", "throughput": 24866.19, "total_tokens": 129100928} +{"current_steps": 490, "total_steps": 25209, "loss": 1.2642, "lr": 4.882058303489718e-05, "epoch": 0.058312941158969706, "percentage": 1.94, "elapsed_time": "1:28:14", "remaining_time": "3 days, 2:11:19", "throughput": 24884.89, "total_tokens": 131747008} +{"current_steps": 500, "total_steps": 25209, "loss": 1.2833, "lr": 4.8797327385011496e-05, "epoch": 0.059503001182622146, "percentage": 1.98, "elapsed_time": "1:30:00", "remaining_time": "3 days, 2:07:59", "throughput": 24891.48, "total_tokens": 134425024} +{"current_steps": 510, "total_steps": 25209, "loss": 1.2583, "lr": 4.8774104936932425e-05, "epoch": 0.060693061206274594, "percentage": 2.02, "elapsed_time": "1:31:45", "remaining_time": "3 days, 2:03:36", "throughput": 24905.65, "total_tokens": 137111872} +{"current_steps": 520, "total_steps": 25209, "loss": 1.2534, "lr": 4.8750915611732076e-05, "epoch": 0.061883121229927035, "percentage": 2.06, "elapsed_time": "1:33:25", "remaining_time": "3 days, 1:55:20", "throughput": 24936.17, "total_tokens": 139768192} +{"current_steps": 530, "total_steps": 25209, "loss": 1.2653, "lr": 4.8727759330744986e-05, "epoch": 0.06307318125357948, "percentage": 2.1, "elapsed_time": "1:35:07", "remaining_time": "3 days, 1:49:04", "throughput": 24963.09, "total_tokens": 142466112} +{"current_steps": 540, "total_steps": 25209, "loss": 1.2463, "lr": 4.870463601556696e-05, "epoch": 0.06426324127723192, "percentage": 2.14, "elapsed_time": "1:36:50", "remaining_time": "3 days, 1:43:42", "throughput": 24986.92, "total_tokens": 145175168} +{"current_steps": 550, "total_steps": 25209, "loss": 1.2556, "lr": 4.8681545588054075e-05, "epoch": 0.06545330130088436, "percentage": 2.18, "elapsed_time": "1:38:38", "remaining_time": "3 days, 1:42:30", "throughput": 24986.82, "total_tokens": 147882752} +{"current_steps": 560, "total_steps": 25209, "loss": 1.2645, "lr": 4.8658487970321404e-05, "epoch": 0.06664336132453681, "percentage": 2.22, "elapsed_time": "1:40:25", "remaining_time": "3 days, 1:40:27", "throughput": 24994.59, "total_tokens": 150609792} +{"current_steps": 570, "total_steps": 25209, "loss": 1.2546, "lr": 4.863546308474209e-05, "epoch": 0.06783342134818925, "percentage": 2.26, "elapsed_time": "1:42:06", "remaining_time": "3 days, 1:33:36", "throughput": 25017.5, "total_tokens": 153264064} +{"current_steps": 580, "total_steps": 25209, "loss": 1.2614, "lr": 4.86124708539461e-05, "epoch": 0.0690234813718417, "percentage": 2.3, "elapsed_time": "1:43:49", "remaining_time": "3 days, 1:28:35", "throughput": 25033.3, "total_tokens": 155937408} +{"current_steps": 590, "total_steps": 25209, "loss": 1.2398, "lr": 4.8589511200819216e-05, "epoch": 0.07021354139549414, "percentage": 2.34, "elapsed_time": "1:46:00", "remaining_time": "3 days, 1:43:33", "throughput": 24953.18, "total_tokens": 158719296} +{"current_steps": 600, "total_steps": 25209, "loss": 1.2523, "lr": 4.8566584048501926e-05, "epoch": 0.07140360141914658, "percentage": 2.38, "elapsed_time": "1:47:46", "remaining_time": "3 days, 1:40:43", "throughput": 24957.49, "total_tokens": 161399808} +{"current_steps": 610, "total_steps": 25209, "loss": 1.2454, "lr": 4.854368932038835e-05, "epoch": 0.07259366144279902, "percentage": 2.42, "elapsed_time": "1:49:27", "remaining_time": "3 days, 1:33:56", "throughput": 24980.72, "total_tokens": 164056896} +{"current_steps": 620, "total_steps": 25209, "loss": 1.2546, "lr": 4.8520826940125144e-05, "epoch": 0.07378372146645146, "percentage": 2.46, "elapsed_time": "1:51:08", "remaining_time": "3 days, 1:27:40", "throughput": 25004.47, "total_tokens": 166736000} +{"current_steps": 630, "total_steps": 25209, "loss": 1.2574, "lr": 4.849799683161046e-05, "epoch": 0.0749737814901039, "percentage": 2.5, "elapsed_time": "1:52:48", "remaining_time": "3 days, 1:21:13", "throughput": 25030.14, "total_tokens": 169419904} +{"current_steps": 640, "total_steps": 25209, "loss": 1.2527, "lr": 4.8475198918992835e-05, "epoch": 0.07616384151375635, "percentage": 2.54, "elapsed_time": "1:54:29", "remaining_time": "3 days, 1:15:24", "throughput": 25052.93, "total_tokens": 172108288} +{"current_steps": 650, "total_steps": 25209, "loss": 1.2509, "lr": 4.845243312667023e-05, "epoch": 0.07735390153740879, "percentage": 2.58, "elapsed_time": "1:56:13", "remaining_time": "3 days, 1:11:29", "throughput": 25070.79, "total_tokens": 174837248} +{"current_steps": 660, "total_steps": 25209, "loss": 1.2283, "lr": 4.842969937928884e-05, "epoch": 0.07854396156106123, "percentage": 2.62, "elapsed_time": "1:57:55", "remaining_time": "3 days, 1:06:25", "throughput": 25085.56, "total_tokens": 177498816} +{"current_steps": 670, "total_steps": 25209, "loss": 1.2535, "lr": 4.840699760174217e-05, "epoch": 0.07973402158471368, "percentage": 2.66, "elapsed_time": "1:59:38", "remaining_time": "3 days, 1:01:37", "throughput": 25104.3, "total_tokens": 180198912} +{"current_steps": 680, "total_steps": 25209, "loss": 1.2401, "lr": 4.8384327719169906e-05, "epoch": 0.08092408160836612, "percentage": 2.7, "elapsed_time": "2:01:24", "remaining_time": "3 days, 0:59:40", "throughput": 25103.92, "total_tokens": 182879232} +{"current_steps": 690, "total_steps": 25209, "loss": 1.2405, "lr": 4.836168965695694e-05, "epoch": 0.08211414163201856, "percentage": 2.74, "elapsed_time": "2:03:09", "remaining_time": "3 days, 0:56:24", "throughput": 25116.98, "total_tokens": 185601920} +{"current_steps": 700, "total_steps": 25209, "loss": 1.2456, "lr": 4.8339083340732304e-05, "epoch": 0.08330420165567101, "percentage": 2.78, "elapsed_time": "2:04:55", "remaining_time": "3 days, 0:54:07", "throughput": 25129.42, "total_tokens": 188363584} +{"current_steps": 710, "total_steps": 25209, "loss": 1.2435, "lr": 4.8316508696368154e-05, "epoch": 0.08449426167932345, "percentage": 2.82, "elapsed_time": "2:06:35", "remaining_time": "3 days, 0:47:53", "throughput": 25150.95, "total_tokens": 191023552} +{"current_steps": 720, "total_steps": 25209, "loss": 1.2405, "lr": 4.8293965649978714e-05, "epoch": 0.0856843217029759, "percentage": 2.86, "elapsed_time": "2:08:17", "remaining_time": "3 days, 0:43:21", "throughput": 25166.12, "total_tokens": 193708672} +{"current_steps": 730, "total_steps": 25209, "loss": 1.2324, "lr": 4.8271454127919364e-05, "epoch": 0.08687438172662834, "percentage": 2.9, "elapsed_time": "2:10:00", "remaining_time": "3 days, 0:39:33", "throughput": 25176.06, "total_tokens": 196386176} +{"current_steps": 740, "total_steps": 25209, "loss": 1.2316, "lr": 4.824897405678549e-05, "epoch": 0.08806444175028078, "percentage": 2.94, "elapsed_time": "2:11:46", "remaining_time": "3 days, 0:37:09", "throughput": 25186.46, "total_tokens": 199130048} +{"current_steps": 750, "total_steps": 25209, "loss": 1.2403, "lr": 4.8226525363411576e-05, "epoch": 0.08925450177393322, "percentage": 2.98, "elapsed_time": "2:13:29", "remaining_time": "3 days, 0:33:14", "throughput": 25201.07, "total_tokens": 201839552} +{"current_steps": 760, "total_steps": 25209, "loss": 1.2393, "lr": 4.820410797487017e-05, "epoch": 0.09044456179758567, "percentage": 3.01, "elapsed_time": "2:15:15", "remaining_time": "3 days, 0:30:58", "throughput": 25200.95, "total_tokens": 204506752} +{"current_steps": 770, "total_steps": 25209, "loss": 1.2358, "lr": 4.818172181847091e-05, "epoch": 0.0916346218212381, "percentage": 3.05, "elapsed_time": "2:16:56", "remaining_time": "3 days, 0:26:23", "throughput": 25216.42, "total_tokens": 207190912} +{"current_steps": 780, "total_steps": 25209, "loss": 1.2406, "lr": 4.81593668217595e-05, "epoch": 0.09282468184489055, "percentage": 3.09, "elapsed_time": "2:18:39", "remaining_time": "3 days, 0:22:29", "throughput": 25230.01, "total_tokens": 209892160} +{"current_steps": 790, "total_steps": 25209, "loss": 1.2495, "lr": 4.813704291251675e-05, "epoch": 0.094014741868543, "percentage": 3.13, "elapsed_time": "2:20:17", "remaining_time": "3 days, 0:16:33", "throughput": 25247.49, "total_tokens": 212526848} +{"current_steps": 800, "total_steps": 25209, "loss": 1.234, "lr": 4.811475001875759e-05, "epoch": 0.09520480189219543, "percentage": 3.17, "elapsed_time": "2:22:02", "remaining_time": "3 days, 0:13:42", "throughput": 25261.94, "total_tokens": 215287232} +{"current_steps": 810, "total_steps": 25209, "loss": 1.2381, "lr": 4.8092488068730105e-05, "epoch": 0.09639486191584788, "percentage": 3.21, "elapsed_time": "2:23:43", "remaining_time": "3 days, 0:09:15", "throughput": 25276.1, "total_tokens": 217965312} +{"current_steps": 820, "total_steps": 25209, "loss": 1.2415, "lr": 4.807025699091452e-05, "epoch": 0.09758492193950033, "percentage": 3.25, "elapsed_time": "2:25:24", "remaining_time": "3 days, 0:05:01", "throughput": 25288.91, "total_tokens": 220642944} +{"current_steps": 830, "total_steps": 25209, "loss": 1.2229, "lr": 4.8048056714022325e-05, "epoch": 0.09877498196315276, "percentage": 3.29, "elapsed_time": "2:27:10", "remaining_time": "3 days, 0:02:50", "throughput": 25299.21, "total_tokens": 223403776} +{"current_steps": 840, "total_steps": 25209, "loss": 1.2176, "lr": 4.802588716699519e-05, "epoch": 0.09996504198680521, "percentage": 3.33, "elapsed_time": "2:28:56", "remaining_time": "3 days, 0:00:47", "throughput": 25296.91, "total_tokens": 226059776} +{"current_steps": 850, "total_steps": 25209, "loss": 1.229, "lr": 4.8003748279004156e-05, "epoch": 0.10115510201045766, "percentage": 3.37, "elapsed_time": "2:30:47", "remaining_time": "3 days, 0:01:08", "throughput": 25286.55, "total_tokens": 228769600} +{"current_steps": 860, "total_steps": 25209, "loss": 1.217, "lr": 4.798163997944854e-05, "epoch": 0.1023451620341101, "percentage": 3.41, "elapsed_time": "2:32:29", "remaining_time": "2 days, 23:57:36", "throughput": 25300.07, "total_tokens": 231490368} +{"current_steps": 870, "total_steps": 25209, "loss": 1.2411, "lr": 4.79595621979551e-05, "epoch": 0.10353522205776254, "percentage": 3.45, "elapsed_time": "2:34:19", "remaining_time": "2 days, 23:57:13", "throughput": 25292.23, "total_tokens": 234185216} +{"current_steps": 880, "total_steps": 25209, "loss": 1.2307, "lr": 4.793751486437702e-05, "epoch": 0.10472528208141497, "percentage": 3.49, "elapsed_time": "2:35:59", "remaining_time": "2 days, 23:52:27", "throughput": 25307.57, "total_tokens": 236856640} +{"current_steps": 890, "total_steps": 25209, "loss": 1.2331, "lr": 4.7915497908793064e-05, "epoch": 0.10591534210506742, "percentage": 3.53, "elapsed_time": "2:37:38", "remaining_time": "2 days, 23:47:25", "throughput": 25325.77, "total_tokens": 239538432} +{"current_steps": 900, "total_steps": 25209, "loss": 1.2303, "lr": 4.7893511261506516e-05, "epoch": 0.10710540212871987, "percentage": 3.57, "elapsed_time": "2:39:21", "remaining_time": "2 days, 23:44:07", "throughput": 25337.86, "total_tokens": 242259392} +{"current_steps": 910, "total_steps": 25209, "loss": 1.2154, "lr": 4.787155485304435e-05, "epoch": 0.1082954621523723, "percentage": 3.61, "elapsed_time": "2:40:59", "remaining_time": "2 days, 23:38:50", "throughput": 25353.68, "total_tokens": 244904512} +{"current_steps": 920, "total_steps": 25209, "loss": 1.2087, "lr": 4.784962861415629e-05, "epoch": 0.10948552217602475, "percentage": 3.65, "elapsed_time": "2:42:45", "remaining_time": "2 days, 23:37:07", "throughput": 25356.08, "total_tokens": 247622336} +{"current_steps": 930, "total_steps": 25209, "loss": 1.2386, "lr": 4.7827732475813884e-05, "epoch": 0.1106755821996772, "percentage": 3.69, "elapsed_time": "2:44:44", "remaining_time": "2 days, 23:40:50", "throughput": 25325.04, "total_tokens": 250326464} +{"current_steps": 940, "total_steps": 25209, "loss": 1.2269, "lr": 4.7805866369209576e-05, "epoch": 0.11186564222332963, "percentage": 3.73, "elapsed_time": "2:46:44", "remaining_time": "2 days, 23:44:57", "throughput": 25290.19, "total_tokens": 253016064} +{"current_steps": 950, "total_steps": 25209, "loss": 1.2074, "lr": 4.778403022575583e-05, "epoch": 0.11305570224698208, "percentage": 3.77, "elapsed_time": "2:48:34", "remaining_time": "2 days, 23:44:49", "throughput": 25281.77, "total_tokens": 255719936} +{"current_steps": 960, "total_steps": 25209, "loss": 1.2163, "lr": 4.7762223977084195e-05, "epoch": 0.11424576227063453, "percentage": 3.81, "elapsed_time": "2:50:19", "remaining_time": "2 days, 23:42:14", "throughput": 25286.46, "total_tokens": 258411008} +{"current_steps": 970, "total_steps": 25209, "loss": 1.2216, "lr": 4.774044755504444e-05, "epoch": 0.11543582229428696, "percentage": 3.85, "elapsed_time": "2:51:58", "remaining_time": "2 days, 23:37:22", "throughput": 25303.85, "total_tokens": 261094720} +{"current_steps": 980, "total_steps": 25209, "loss": 1.2126, "lr": 4.7718700891703616e-05, "epoch": 0.11662588231793941, "percentage": 3.89, "elapsed_time": "2:53:42", "remaining_time": "2 days, 23:34:39", "throughput": 25312.31, "total_tokens": 263816448} +{"current_steps": 990, "total_steps": 25209, "loss": 1.2117, "lr": 4.7696983919345215e-05, "epoch": 0.11781594234159186, "percentage": 3.93, "elapsed_time": "2:55:24", "remaining_time": "2 days, 23:31:07", "throughput": 25322.03, "total_tokens": 266501184} +{"current_steps": 1000, "total_steps": 25209, "loss": 1.2188, "lr": 4.7675296570468216e-05, "epoch": 0.11900600236524429, "percentage": 3.97, "elapsed_time": "2:57:10", "remaining_time": "2 days, 23:29:18", "throughput": 25321.39, "total_tokens": 269184384} +{"current_steps": 1010, "total_steps": 25209, "loss": 1.2, "lr": 4.76536387777863e-05, "epoch": 0.12019606238889674, "percentage": 4.01, "elapsed_time": "2:59:02", "remaining_time": "2 days, 23:29:35", "throughput": 25309.77, "total_tokens": 271881024} +{"current_steps": 1020, "total_steps": 25209, "loss": 1.2159, "lr": 4.7632010474226915e-05, "epoch": 0.12138612241254919, "percentage": 4.05, "elapsed_time": "3:00:55", "remaining_time": "2 days, 23:30:40", "throughput": 25291.56, "total_tokens": 274558784} +{"current_steps": 1030, "total_steps": 25209, "loss": 1.2264, "lr": 4.761041159293035e-05, "epoch": 0.12257618243620162, "percentage": 4.09, "elapsed_time": "3:02:40", "remaining_time": "2 days, 23:28:19", "throughput": 25293.57, "total_tokens": 277235136} +{"current_steps": 1040, "total_steps": 25209, "loss": 1.22, "lr": 4.7588842067249e-05, "epoch": 0.12376624245985407, "percentage": 4.13, "elapsed_time": "3:04:24", "remaining_time": "2 days, 23:25:39", "throughput": 25299.13, "total_tokens": 279930112} +{"current_steps": 1050, "total_steps": 25209, "loss": 1.2054, "lr": 4.756730183074637e-05, "epoch": 0.12495630248350652, "percentage": 4.17, "elapsed_time": "3:06:38", "remaining_time": "2 days, 23:34:23", "throughput": 25240.83, "total_tokens": 282661184} +{"current_steps": 1060, "total_steps": 25209, "loss": 1.2124, "lr": 4.7545790817196314e-05, "epoch": 0.12614636250715897, "percentage": 4.2, "elapsed_time": "3:08:39", "remaining_time": "2 days, 23:38:05", "throughput": 25210.37, "total_tokens": 285372672} +{"current_steps": 1070, "total_steps": 25209, "loss": 1.2004, "lr": 4.752430896058212e-05, "epoch": 0.1273364225308114, "percentage": 4.24, "elapsed_time": "3:11:21", "remaining_time": "2 days, 23:56:57", "throughput": 25086.36, "total_tokens": 288026112} +{"current_steps": 1080, "total_steps": 25209, "loss": 1.2193, "lr": 4.750285619509567e-05, "epoch": 0.12852648255446383, "percentage": 4.28, "elapsed_time": "3:13:12", "remaining_time": "2 days, 23:56:31", "throughput": 25077.52, "total_tokens": 290706624} +{"current_steps": 1090, "total_steps": 25209, "loss": 1.2035, "lr": 4.7481432455136644e-05, "epoch": 0.1297165425781163, "percentage": 4.32, "elapsed_time": "3:14:57", "remaining_time": "2 days, 23:53:55", "throughput": 25083.52, "total_tokens": 293413632} +{"current_steps": 1100, "total_steps": 25209, "loss": 1.2043, "lr": 4.7460037675311584e-05, "epoch": 0.13090660260176873, "percentage": 4.36, "elapsed_time": "3:16:42", "remaining_time": "2 days, 23:51:12", "throughput": 25089.81, "total_tokens": 296115328} +{"current_steps": 1110, "total_steps": 25209, "loss": 1.2043, "lr": 4.7438671790433126e-05, "epoch": 0.13209666262542116, "percentage": 4.4, "elapsed_time": "3:18:28", "remaining_time": "2 days, 23:49:06", "throughput": 25092.35, "total_tokens": 298816256} +{"current_steps": 1120, "total_steps": 25209, "loss": 1.2057, "lr": 4.741733473551915e-05, "epoch": 0.13328672264907362, "percentage": 4.44, "elapsed_time": "3:20:09", "remaining_time": "2 days, 23:45:08", "throughput": 25103.97, "total_tokens": 301494912} +{"current_steps": 1130, "total_steps": 25209, "loss": 1.2124, "lr": 4.7396026445791966e-05, "epoch": 0.13447678267272606, "percentage": 4.48, "elapsed_time": "3:21:54", "remaining_time": "2 days, 23:42:25", "throughput": 25112.81, "total_tokens": 304228288} +{"current_steps": 1140, "total_steps": 25209, "loss": 1.199, "lr": 4.737474685667742e-05, "epoch": 0.1356668426963785, "percentage": 4.52, "elapsed_time": "3:23:38", "remaining_time": "2 days, 23:39:22", "throughput": 25118.27, "total_tokens": 306897152} +{"current_steps": 1150, "total_steps": 25209, "loss": 1.196, "lr": 4.7353495903804165e-05, "epoch": 0.13685690272003095, "percentage": 4.56, "elapsed_time": "3:25:18", "remaining_time": "2 days, 23:35:21", "throughput": 25126.49, "total_tokens": 309529856} +{"current_steps": 1160, "total_steps": 25209, "loss": 1.2067, "lr": 4.733227352300277e-05, "epoch": 0.1380469627436834, "percentage": 4.6, "elapsed_time": "3:27:03", "remaining_time": "2 days, 23:32:50", "throughput": 25133.56, "total_tokens": 312256832} +{"current_steps": 1170, "total_steps": 25209, "loss": 1.2035, "lr": 4.731107965030496e-05, "epoch": 0.13923702276733582, "percentage": 4.64, "elapsed_time": "3:28:46", "remaining_time": "2 days, 23:29:40", "throughput": 25142.43, "total_tokens": 314957888} +{"current_steps": 1180, "total_steps": 25209, "loss": 1.2002, "lr": 4.728991422194278e-05, "epoch": 0.14042708279098828, "percentage": 4.68, "elapsed_time": "3:30:46", "remaining_time": "2 days, 23:31:58", "throughput": 25121.08, "total_tokens": 317681792} +{"current_steps": 1190, "total_steps": 25209, "loss": 1.1942, "lr": 4.726877717434773e-05, "epoch": 0.14161714281464072, "percentage": 4.72, "elapsed_time": "3:32:35", "remaining_time": "2 days, 23:31:03", "throughput": 25117.55, "total_tokens": 320394560} +{"current_steps": 1200, "total_steps": 25209, "loss": 1.2003, "lr": 4.724766844415013e-05, "epoch": 0.14280720283829315, "percentage": 4.76, "elapsed_time": "3:34:37", "remaining_time": "2 days, 23:33:59", "throughput": 25088.77, "total_tokens": 323071168} +{"current_steps": 1210, "total_steps": 25209, "loss": 1.1837, "lr": 4.722658796817813e-05, "epoch": 0.1439972628619456, "percentage": 4.8, "elapsed_time": "3:36:17", "remaining_time": "2 days, 23:29:50", "throughput": 25098.38, "total_tokens": 325709568} +{"current_steps": 1220, "total_steps": 25209, "loss": 1.2096, "lr": 4.7205535683457044e-05, "epoch": 0.14518732288559805, "percentage": 4.84, "elapsed_time": "3:37:54", "remaining_time": "2 days, 23:24:49", "throughput": 25113.4, "total_tokens": 328350784} +{"current_steps": 1230, "total_steps": 25209, "loss": 1.1928, "lr": 4.7184511527208484e-05, "epoch": 0.14637738290925048, "percentage": 4.88, "elapsed_time": "3:39:35", "remaining_time": "2 days, 23:20:52", "throughput": 25123.7, "total_tokens": 331010240} +{"current_steps": 1240, "total_steps": 25209, "loss": 1.2004, "lr": 4.7163515436849644e-05, "epoch": 0.14756744293290291, "percentage": 4.92, "elapsed_time": "3:41:20", "remaining_time": "2 days, 23:18:29", "throughput": 25127.13, "total_tokens": 333700416} +{"current_steps": 1250, "total_steps": 25209, "loss": 1.1879, "lr": 4.714254734999245e-05, "epoch": 0.14875750295655538, "percentage": 4.96, "elapsed_time": "3:43:03", "remaining_time": "2 days, 23:15:21", "throughput": 25134.8, "total_tokens": 336388288} +{"current_steps": 1260, "total_steps": 25209, "loss": 1.1957, "lr": 4.712160720444284e-05, "epoch": 0.1499475629802078, "percentage": 5.0, "elapsed_time": "3:44:44", "remaining_time": "2 days, 23:11:44", "throughput": 25141.91, "total_tokens": 339029632} +{"current_steps": 1270, "total_steps": 25209, "loss": 1.1836, "lr": 4.710069493819992e-05, "epoch": 0.15113762300386024, "percentage": 5.04, "elapsed_time": "3:46:25", "remaining_time": "2 days, 23:08:03", "throughput": 25150.01, "total_tokens": 341678016} +{"current_steps": 1280, "total_steps": 25209, "loss": 1.1992, "lr": 4.70798104894553e-05, "epoch": 0.1523276830275127, "percentage": 5.08, "elapsed_time": "3:48:06", "remaining_time": "2 days, 23:04:31", "throughput": 25160.95, "total_tokens": 344376896} +{"current_steps": 1290, "total_steps": 25209, "loss": 1.1829, "lr": 4.705895379659219e-05, "epoch": 0.15351774305116514, "percentage": 5.12, "elapsed_time": "3:49:48", "remaining_time": "2 days, 23:00:59", "throughput": 25170.45, "total_tokens": 347055808} +{"current_steps": 1300, "total_steps": 25209, "loss": 1.1915, "lr": 4.7038124798184766e-05, "epoch": 0.15470780307481757, "percentage": 5.16, "elapsed_time": "3:51:35", "remaining_time": "2 days, 22:59:22", "throughput": 25172.31, "total_tokens": 349785472} +{"current_steps": 1310, "total_steps": 25209, "loss": 1.1908, "lr": 4.7017323432997304e-05, "epoch": 0.15589786309847004, "percentage": 5.2, "elapsed_time": "3:53:30", "remaining_time": "2 days, 22:59:51", "throughput": 25161.77, "total_tokens": 352516864} +{"current_steps": 1320, "total_steps": 25209, "loss": 1.1885, "lr": 4.6996549639983506e-05, "epoch": 0.15708792312212247, "percentage": 5.24, "elapsed_time": "3:55:18", "remaining_time": "2 days, 22:58:36", "throughput": 25162.91, "total_tokens": 355268352} +{"current_steps": 1330, "total_steps": 25209, "loss": 1.1769, "lr": 4.697580335828569e-05, "epoch": 0.1582779831457749, "percentage": 5.28, "elapsed_time": "3:57:00", "remaining_time": "2 days, 22:55:16", "throughput": 25168.76, "total_tokens": 357912640} +{"current_steps": 1340, "total_steps": 25209, "loss": 1.1994, "lr": 4.6955084527234076e-05, "epoch": 0.15946804316942736, "percentage": 5.32, "elapsed_time": "3:58:44", "remaining_time": "2 days, 22:52:32", "throughput": 25173.07, "total_tokens": 360584384} +{"current_steps": 1350, "total_steps": 25209, "loss": 1.1871, "lr": 4.6934393086346034e-05, "epoch": 0.1606581031930798, "percentage": 5.36, "elapsed_time": "4:00:25", "remaining_time": "2 days, 22:48:58", "throughput": 25182.74, "total_tokens": 363262336} +{"current_steps": 1360, "total_steps": 25209, "loss": 1.2027, "lr": 4.6913728975325324e-05, "epoch": 0.16184816321673223, "percentage": 5.39, "elapsed_time": "4:02:18", "remaining_time": "2 days, 22:49:10", "throughput": 25173.0, "total_tokens": 365981568} +{"current_steps": 1370, "total_steps": 25209, "loss": 1.1992, "lr": 4.6893092134061393e-05, "epoch": 0.1630382232403847, "percentage": 5.43, "elapsed_time": "4:04:06", "remaining_time": "2 days, 22:47:40", "throughput": 25170.94, "total_tokens": 368667776} +{"current_steps": 1380, "total_steps": 25209, "loss": 1.1966, "lr": 4.687248250262859e-05, "epoch": 0.16422828326403713, "percentage": 5.47, "elapsed_time": "4:05:52", "remaining_time": "2 days, 22:45:31", "throughput": 25173.69, "total_tokens": 371366848} +{"current_steps": 1390, "total_steps": 25209, "loss": 1.17, "lr": 4.685190002128548e-05, "epoch": 0.16541834328768956, "percentage": 5.51, "elapsed_time": "4:07:36", "remaining_time": "2 days, 22:42:58", "throughput": 25178.5, "total_tokens": 374061760} +{"current_steps": 1400, "total_steps": 25209, "loss": 1.2015, "lr": 4.6831344630474114e-05, "epoch": 0.16660840331134202, "percentage": 5.55, "elapsed_time": "4:09:21", "remaining_time": "2 days, 22:40:34", "throughput": 25183.88, "total_tokens": 376778624} +{"current_steps": 1410, "total_steps": 25209, "loss": 1.1904, "lr": 4.6810816270819276e-05, "epoch": 0.16779846333499446, "percentage": 5.59, "elapsed_time": "4:11:03", "remaining_time": "2 days, 22:37:32", "throughput": 25192.68, "total_tokens": 379490496} +{"current_steps": 1420, "total_steps": 25209, "loss": 1.1755, "lr": 4.679031488312777e-05, "epoch": 0.1689885233586469, "percentage": 5.63, "elapsed_time": "4:12:43", "remaining_time": "2 days, 22:33:49", "throughput": 25203.1, "total_tokens": 382164992} +{"current_steps": 1430, "total_steps": 25209, "loss": 1.1919, "lr": 4.6769840408387717e-05, "epoch": 0.17017858338229935, "percentage": 5.67, "elapsed_time": "4:14:25", "remaining_time": "2 days, 22:30:37", "throughput": 25213.39, "total_tokens": 384883648} +{"current_steps": 1440, "total_steps": 25209, "loss": 1.1863, "lr": 4.674939278776787e-05, "epoch": 0.1713686434059518, "percentage": 5.71, "elapsed_time": "4:16:10", "remaining_time": "2 days, 22:28:26", "throughput": 25218.52, "total_tokens": 387616896} +{"current_steps": 1450, "total_steps": 25209, "loss": 1.1899, "lr": 4.672897196261683e-05, "epoch": 0.17255870342960422, "percentage": 5.75, "elapsed_time": "4:17:51", "remaining_time": "2 days, 22:25:08", "throughput": 25228.62, "total_tokens": 390324608} +{"current_steps": 1460, "total_steps": 25209, "loss": 1.1836, "lr": 4.670857787446238e-05, "epoch": 0.17374876345325668, "percentage": 5.79, "elapsed_time": "4:19:29", "remaining_time": "2 days, 22:20:52", "throughput": 25242.46, "total_tokens": 393000000} +{"current_steps": 1470, "total_steps": 25209, "loss": 1.1844, "lr": 4.668821046501082e-05, "epoch": 0.17493882347690912, "percentage": 5.83, "elapsed_time": "4:21:09", "remaining_time": "2 days, 22:17:27", "throughput": 25250.83, "total_tokens": 395669504} +{"current_steps": 1480, "total_steps": 25209, "loss": 1.173, "lr": 4.6667869676146194e-05, "epoch": 0.17612888350056155, "percentage": 5.87, "elapsed_time": "4:22:52", "remaining_time": "2 days, 22:14:48", "throughput": 25255.28, "total_tokens": 398348992} +{"current_steps": 1490, "total_steps": 25209, "loss": 1.1844, "lr": 4.6647555449929645e-05, "epoch": 0.177318943524214, "percentage": 5.91, "elapsed_time": "4:24:35", "remaining_time": "2 days, 22:12:06", "throughput": 25261.08, "total_tokens": 401044160} +{"current_steps": 1500, "total_steps": 25209, "loss": 1.1671, "lr": 4.662726772859869e-05, "epoch": 0.17850900354786645, "percentage": 5.95, "elapsed_time": "4:26:17", "remaining_time": "2 days, 22:08:53", "throughput": 25269.09, "total_tokens": 403725760} +{"current_steps": 1510, "total_steps": 25209, "loss": 1.1724, "lr": 4.660700645456655e-05, "epoch": 0.17969906357151888, "percentage": 5.99, "elapsed_time": "4:28:02", "remaining_time": "2 days, 22:06:54", "throughput": 25271.9, "total_tokens": 406443200} +{"current_steps": 1520, "total_steps": 25209, "loss": 1.1826, "lr": 4.658677157042149e-05, "epoch": 0.18088912359517134, "percentage": 6.03, "elapsed_time": "4:29:45", "remaining_time": "2 days, 22:04:08", "throughput": 25278.57, "total_tokens": 409145920} +{"current_steps": 1530, "total_steps": 25209, "loss": 1.185, "lr": 4.656656301892605e-05, "epoch": 0.18207918361882378, "percentage": 6.07, "elapsed_time": "4:31:22", "remaining_time": "2 days, 22:00:00", "throughput": 25289.91, "total_tokens": 411791744} +{"current_steps": 1540, "total_steps": 25209, "loss": 1.1857, "lr": 4.6546380743016465e-05, "epoch": 0.1832692436424762, "percentage": 6.11, "elapsed_time": "4:33:04", "remaining_time": "2 days, 21:57:08", "throughput": 25296.63, "total_tokens": 414484352} +{"current_steps": 1550, "total_steps": 25209, "loss": 1.1855, "lr": 4.652622468580193e-05, "epoch": 0.18445930366612867, "percentage": 6.15, "elapsed_time": "4:34:46", "remaining_time": "2 days, 21:54:11", "throughput": 25303.71, "total_tokens": 417176448} +{"current_steps": 1560, "total_steps": 25209, "loss": 1.176, "lr": 4.650609479056392e-05, "epoch": 0.1856493636897811, "percentage": 6.19, "elapsed_time": "4:36:26", "remaining_time": "2 days, 21:50:50", "throughput": 25312.18, "total_tokens": 419850176} +{"current_steps": 1570, "total_steps": 25209, "loss": 1.1807, "lr": 4.648599100075556e-05, "epoch": 0.18683942371343354, "percentage": 6.23, "elapsed_time": "4:38:10", "remaining_time": "2 days, 21:48:16", "throughput": 25316.99, "total_tokens": 422540800} +{"current_steps": 1580, "total_steps": 25209, "loss": 1.192, "lr": 4.6465913260000945e-05, "epoch": 0.188029483737086, "percentage": 6.27, "elapsed_time": "4:39:49", "remaining_time": "2 days, 21:44:41", "throughput": 25324.84, "total_tokens": 425180288} +{"current_steps": 1590, "total_steps": 25209, "loss": 1.1891, "lr": 4.644586151209444e-05, "epoch": 0.18921954376073843, "percentage": 6.31, "elapsed_time": "4:41:36", "remaining_time": "2 days, 21:43:06", "throughput": 25323.56, "total_tokens": 427869120} +{"current_steps": 1600, "total_steps": 25209, "loss": 1.1808, "lr": 4.6425835701000084e-05, "epoch": 0.19040960378439087, "percentage": 6.35, "elapsed_time": "4:43:17", "remaining_time": "2 days, 21:40:08", "throughput": 25328.9, "total_tokens": 430528256} +{"current_steps": 1610, "total_steps": 25209, "loss": 1.1798, "lr": 4.640583577085084e-05, "epoch": 0.19159966380804333, "percentage": 6.39, "elapsed_time": "4:45:03", "remaining_time": "2 days, 21:38:12", "throughput": 25332.55, "total_tokens": 433264640} +{"current_steps": 1620, "total_steps": 25209, "loss": 1.1511, "lr": 4.638586166594806e-05, "epoch": 0.19278972383169576, "percentage": 6.43, "elapsed_time": "4:46:46", "remaining_time": "2 days, 21:35:42", "throughput": 25337.07, "total_tokens": 435957376} +{"current_steps": 1630, "total_steps": 25209, "loss": 1.1677, "lr": 4.6365913330760726e-05, "epoch": 0.1939797838553482, "percentage": 6.47, "elapsed_time": "4:48:23", "remaining_time": "2 days, 21:31:41", "throughput": 25347.44, "total_tokens": 438590656} +{"current_steps": 1640, "total_steps": 25209, "loss": 1.1659, "lr": 4.6345990709924855e-05, "epoch": 0.19516984387900066, "percentage": 6.51, "elapsed_time": "4:50:02", "remaining_time": "2 days, 21:28:10", "throughput": 25358.22, "total_tokens": 441284992} +{"current_steps": 1650, "total_steps": 25209, "loss": 1.1758, "lr": 4.632609374824284e-05, "epoch": 0.1963599039026531, "percentage": 6.55, "elapsed_time": "4:51:40", "remaining_time": "2 days, 21:24:32", "throughput": 25368.83, "total_tokens": 443961536} +{"current_steps": 1660, "total_steps": 25209, "loss": 1.1614, "lr": 4.630622239068285e-05, "epoch": 0.19754996392630553, "percentage": 6.58, "elapsed_time": "4:53:23", "remaining_time": "2 days, 21:21:59", "throughput": 25374.3, "total_tokens": 446665152} +{"current_steps": 1670, "total_steps": 25209, "loss": 1.1794, "lr": 4.628637658237808e-05, "epoch": 0.198740023949958, "percentage": 6.62, "elapsed_time": "4:55:05", "remaining_time": "2 days, 21:19:16", "throughput": 25377.95, "total_tokens": 449317248} +{"current_steps": 1680, "total_steps": 25209, "loss": 1.1617, "lr": 4.626655626862625e-05, "epoch": 0.19993008397361042, "percentage": 6.66, "elapsed_time": "4:56:46", "remaining_time": "2 days, 21:16:25", "throughput": 25386.19, "total_tokens": 452037568} +{"current_steps": 1690, "total_steps": 25209, "loss": 1.1804, "lr": 4.624676139488888e-05, "epoch": 0.20112014399726286, "percentage": 6.7, "elapsed_time": "4:58:30", "remaining_time": "2 days, 21:14:16", "throughput": 25391.03, "total_tokens": 454773248} +{"current_steps": 1700, "total_steps": 25209, "loss": 1.1735, "lr": 4.6226991906790686e-05, "epoch": 0.20231020402091532, "percentage": 6.74, "elapsed_time": "5:00:21", "remaining_time": "2 days, 21:13:33", "throughput": 25390.59, "total_tokens": 457571456} +{"current_steps": 1710, "total_steps": 25209, "loss": 1.1664, "lr": 4.620724775011897e-05, "epoch": 0.20350026404456775, "percentage": 6.78, "elapsed_time": "5:02:06", "remaining_time": "2 days, 21:11:36", "throughput": 25393.43, "total_tokens": 460295232} +{"current_steps": 1720, "total_steps": 25209, "loss": 1.1734, "lr": 4.618752887082297e-05, "epoch": 0.2046903240682202, "percentage": 6.82, "elapsed_time": "5:03:49", "remaining_time": "2 days, 21:09:02", "throughput": 25397.7, "total_tokens": 462975552} +{"current_steps": 1730, "total_steps": 25209, "loss": 1.1691, "lr": 4.616783521501325e-05, "epoch": 0.20588038409187262, "percentage": 6.86, "elapsed_time": "5:05:36", "remaining_time": "2 days, 21:07:32", "throughput": 25400.47, "total_tokens": 465746944} +{"current_steps": 1740, "total_steps": 25209, "loss": 1.1746, "lr": 4.614816672896108e-05, "epoch": 0.20707044411552508, "percentage": 6.9, "elapsed_time": "5:07:20", "remaining_time": "2 days, 21:05:26", "throughput": 25404.67, "total_tokens": 468479040} +{"current_steps": 1750, "total_steps": 25209, "loss": 1.1733, "lr": 4.612852335909782e-05, "epoch": 0.20826050413917752, "percentage": 6.94, "elapsed_time": "5:09:19", "remaining_time": "2 days, 21:06:37", "throughput": 25389.93, "total_tokens": 471233472} +{"current_steps": 1760, "total_steps": 25209, "loss": 1.1752, "lr": 4.6108905052014323e-05, "epoch": 0.20945056416282995, "percentage": 6.98, "elapsed_time": "5:11:15", "remaining_time": "2 days, 21:06:52", "throughput": 25379.73, "total_tokens": 473966912} +{"current_steps": 1770, "total_steps": 25209, "loss": 1.1564, "lr": 4.608931175446027e-05, "epoch": 0.2106406241864824, "percentage": 7.02, "elapsed_time": "5:13:01", "remaining_time": "2 days, 21:05:15", "throughput": 25376.33, "total_tokens": 476612928} +{"current_steps": 1780, "total_steps": 25209, "loss": 1.1655, "lr": 4.606974341334367e-05, "epoch": 0.21183068421013485, "percentage": 7.06, "elapsed_time": "5:14:44", "remaining_time": "2 days, 21:02:48", "throughput": 25380.85, "total_tokens": 479311616} +{"current_steps": 1790, "total_steps": 25209, "loss": 1.1709, "lr": 4.605019997573011e-05, "epoch": 0.21302074423378728, "percentage": 7.1, "elapsed_time": "5:16:23", "remaining_time": "2 days, 20:59:27", "throughput": 25388.36, "total_tokens": 481963968} +{"current_steps": 1800, "total_steps": 25209, "loss": 1.1587, "lr": 4.603068138884229e-05, "epoch": 0.21421080425743974, "percentage": 7.14, "elapsed_time": "5:18:02", "remaining_time": "2 days, 20:56:11", "throughput": 25395.6, "total_tokens": 484618368} +{"current_steps": 1810, "total_steps": 25209, "loss": 1.179, "lr": 4.6011187600059345e-05, "epoch": 0.21540086428109217, "percentage": 7.18, "elapsed_time": "5:19:44", "remaining_time": "2 days, 20:53:24", "throughput": 25401.8, "total_tokens": 487309632} +{"current_steps": 1820, "total_steps": 25209, "loss": 1.1721, "lr": 4.599171855691629e-05, "epoch": 0.2165909243047446, "percentage": 7.22, "elapsed_time": "5:21:27", "remaining_time": "2 days, 20:51:03", "throughput": 25405.84, "total_tokens": 490010624} +{"current_steps": 1830, "total_steps": 25209, "loss": 1.1563, "lr": 4.597227420710335e-05, "epoch": 0.21778098432839707, "percentage": 7.26, "elapsed_time": "5:23:06", "remaining_time": "2 days, 20:47:56", "throughput": 25415.02, "total_tokens": 492720704} +{"current_steps": 1840, "total_steps": 25209, "loss": 1.1666, "lr": 4.595285449846551e-05, "epoch": 0.2189710443520495, "percentage": 7.3, "elapsed_time": "5:24:50", "remaining_time": "2 days, 20:45:40", "throughput": 25416.71, "total_tokens": 495385216} +{"current_steps": 1850, "total_steps": 25209, "loss": 1.1698, "lr": 4.593345937900178e-05, "epoch": 0.22016110437570194, "percentage": 7.34, "elapsed_time": "5:26:31", "remaining_time": "2 days, 20:42:55", "throughput": 25421.15, "total_tokens": 498045760} +{"current_steps": 1860, "total_steps": 25209, "loss": 1.151, "lr": 4.591408879686472e-05, "epoch": 0.2213511643993544, "percentage": 7.38, "elapsed_time": "5:28:06", "remaining_time": "2 days, 20:38:43", "throughput": 25433.86, "total_tokens": 500693248} +{"current_steps": 1870, "total_steps": 25209, "loss": 1.1756, "lr": 4.5894742700359775e-05, "epoch": 0.22254122442300683, "percentage": 7.42, "elapsed_time": "5:29:46", "remaining_time": "2 days, 20:35:51", "throughput": 25439.49, "total_tokens": 503359744} +{"current_steps": 1880, "total_steps": 25209, "loss": 1.1755, "lr": 4.587542103794477e-05, "epoch": 0.22373128444665927, "percentage": 7.46, "elapsed_time": "5:31:25", "remaining_time": "2 days, 20:32:41", "throughput": 25449.28, "total_tokens": 506075392} +{"current_steps": 1890, "total_steps": 25209, "loss": 1.1714, "lr": 4.5856123758229247e-05, "epoch": 0.22492134447031173, "percentage": 7.5, "elapsed_time": "5:33:07", "remaining_time": "2 days, 20:30:05", "throughput": 25455.6, "total_tokens": 508790336} +{"current_steps": 1900, "total_steps": 25209, "loss": 1.15, "lr": 4.5836850809973993e-05, "epoch": 0.22611140449396416, "percentage": 7.54, "elapsed_time": "5:34:51", "remaining_time": "2 days, 20:27:57", "throughput": 25459.96, "total_tokens": 511522752} +{"current_steps": 1910, "total_steps": 25209, "loss": 1.1523, "lr": 4.5817602142090385e-05, "epoch": 0.2273014645176166, "percentage": 7.58, "elapsed_time": "5:36:31", "remaining_time": "2 days, 20:25:02", "throughput": 25469.01, "total_tokens": 514252928} +{"current_steps": 1920, "total_steps": 25209, "loss": 1.1595, "lr": 4.579837770363989e-05, "epoch": 0.22849152454126906, "percentage": 7.62, "elapsed_time": "5:38:08", "remaining_time": "2 days, 20:21:36", "throughput": 25475.55, "total_tokens": 516868352} +{"current_steps": 1930, "total_steps": 25209, "loss": 1.1801, "lr": 4.57791774438334e-05, "epoch": 0.2296815845649215, "percentage": 7.66, "elapsed_time": "5:39:51", "remaining_time": "2 days, 20:19:14", "throughput": 25481.03, "total_tokens": 519594240} +{"current_steps": 1940, "total_steps": 25209, "loss": 1.1739, "lr": 4.576000131203078e-05, "epoch": 0.23087164458857393, "percentage": 7.7, "elapsed_time": "5:41:32", "remaining_time": "2 days, 20:16:36", "throughput": 25486.43, "total_tokens": 522286848} +{"current_steps": 1950, "total_steps": 25209, "loss": 1.1504, "lr": 4.574084925774023e-05, "epoch": 0.2320617046122264, "percentage": 7.74, "elapsed_time": "5:43:14", "remaining_time": "2 days, 20:14:04", "throughput": 25490.41, "total_tokens": 524961856} +{"current_steps": 1960, "total_steps": 25209, "loss": 1.1505, "lr": 4.5721721230617795e-05, "epoch": 0.23325176463587882, "percentage": 7.78, "elapsed_time": "5:44:55", "remaining_time": "2 days, 20:11:24", "throughput": 25496.01, "total_tokens": 527653056} +{"current_steps": 1970, "total_steps": 25209, "loss": 1.174, "lr": 4.57026171804667e-05, "epoch": 0.23444182465953126, "percentage": 7.81, "elapsed_time": "5:46:37", "remaining_time": "2 days, 20:08:59", "throughput": 25500.73, "total_tokens": 530358400} +{"current_steps": 1980, "total_steps": 25209, "loss": 1.172, "lr": 4.568353705723692e-05, "epoch": 0.23563188468318372, "percentage": 7.85, "elapsed_time": "5:48:20", "remaining_time": "2 days, 20:06:37", "throughput": 25504.85, "total_tokens": 533056128} +{"current_steps": 1990, "total_steps": 25209, "loss": 1.1578, "lr": 4.566448081102455e-05, "epoch": 0.23682194470683615, "percentage": 7.89, "elapsed_time": "5:50:00", "remaining_time": "2 days, 20:03:45", "throughput": 25510.07, "total_tokens": 535714304} +{"current_steps": 2000, "total_steps": 25209, "loss": 1.1622, "lr": 4.564544839207128e-05, "epoch": 0.23801200473048859, "percentage": 7.93, "elapsed_time": "5:51:48", "remaining_time": "2 days, 20:02:33", "throughput": 25509.73, "total_tokens": 538471040} +{"current_steps": 2010, "total_steps": 25209, "loss": 1.1696, "lr": 4.562643975076387e-05, "epoch": 0.23920206475414105, "percentage": 7.97, "elapsed_time": "5:53:32", "remaining_time": "2 days, 20:00:27", "throughput": 25511.66, "total_tokens": 541159552} +{"current_steps": 2020, "total_steps": 25209, "loss": 1.1631, "lr": 4.560745483763357e-05, "epoch": 0.24039212477779348, "percentage": 8.01, "elapsed_time": "5:55:10", "remaining_time": "2 days, 19:57:15", "throughput": 25522.47, "total_tokens": 543890048} +{"current_steps": 2030, "total_steps": 25209, "loss": 1.1669, "lr": 4.5588493603355595e-05, "epoch": 0.24158218480144592, "percentage": 8.05, "elapsed_time": "5:56:49", "remaining_time": "2 days, 19:54:22", "throughput": 25528.36, "total_tokens": 546558784} +{"current_steps": 2040, "total_steps": 25209, "loss": 1.1729, "lr": 4.556955599874859e-05, "epoch": 0.24277224482509838, "percentage": 8.09, "elapsed_time": "5:58:33", "remaining_time": "2 days, 19:52:18", "throughput": 25532.38, "total_tokens": 549295936} +{"current_steps": 2050, "total_steps": 25209, "loss": 1.1593, "lr": 4.555064197477409e-05, "epoch": 0.2439623048487508, "percentage": 8.13, "elapsed_time": "6:00:14", "remaining_time": "2 days, 19:49:36", "throughput": 25537.03, "total_tokens": 551960704} +{"current_steps": 2060, "total_steps": 25209, "loss": 1.1654, "lr": 4.5531751482536e-05, "epoch": 0.24515236487240324, "percentage": 8.17, "elapsed_time": "6:01:53", "remaining_time": "2 days, 19:46:47", "throughput": 25544.09, "total_tokens": 554661888} +{"current_steps": 2070, "total_steps": 25209, "loss": 1.1828, "lr": 4.5512884473280024e-05, "epoch": 0.2463424248960557, "percentage": 8.21, "elapsed_time": "6:03:34", "remaining_time": "2 days, 19:44:10", "throughput": 25548.35, "total_tokens": 557329536} +{"current_steps": 2080, "total_steps": 25209, "loss": 1.1678, "lr": 4.549404089839322e-05, "epoch": 0.24753248491970814, "percentage": 8.25, "elapsed_time": "6:05:14", "remaining_time": "2 days, 19:41:24", "throughput": 25553.61, "total_tokens": 559998080} +{"current_steps": 2090, "total_steps": 25209, "loss": 1.1458, "lr": 4.547522070940335e-05, "epoch": 0.24872254494336057, "percentage": 8.29, "elapsed_time": "6:06:56", "remaining_time": "2 days, 19:38:58", "throughput": 25558.15, "total_tokens": 562696000} +{"current_steps": 2100, "total_steps": 25209, "loss": 1.1384, "lr": 4.545642385797848e-05, "epoch": 0.24991260496701304, "percentage": 8.33, "elapsed_time": "6:08:42", "remaining_time": "2 days, 19:37:26", "throughput": 25555.06, "total_tokens": 565351616} +{"current_steps": 2110, "total_steps": 25209, "loss": 1.1542, "lr": 4.543765029592637e-05, "epoch": 0.25110266499066547, "percentage": 8.37, "elapsed_time": "6:10:24", "remaining_time": "2 days, 19:35:04", "throughput": 25558.07, "total_tokens": 568024384} +{"current_steps": 2120, "total_steps": 25209, "loss": 1.1411, "lr": 4.541889997519403e-05, "epoch": 0.25229272501431793, "percentage": 8.41, "elapsed_time": "6:12:07", "remaining_time": "2 days, 19:32:55", "throughput": 25561.16, "total_tokens": 570729344} +{"current_steps": 2130, "total_steps": 25209, "loss": 1.1514, "lr": 4.5400172847867095e-05, "epoch": 0.25348278503797034, "percentage": 8.45, "elapsed_time": "6:13:50", "remaining_time": "2 days, 19:30:34", "throughput": 25564.86, "total_tokens": 573421248} +{"current_steps": 2140, "total_steps": 25209, "loss": 1.1493, "lr": 4.5381468866169466e-05, "epoch": 0.2546728450616228, "percentage": 8.49, "elapsed_time": "6:15:27", "remaining_time": "2 days, 19:27:25", "throughput": 25572.11, "total_tokens": 576078400} +{"current_steps": 2150, "total_steps": 25209, "loss": 1.1596, "lr": 4.5362787982462616e-05, "epoch": 0.25586290508527526, "percentage": 8.53, "elapsed_time": "6:17:07", "remaining_time": "2 days, 19:24:46", "throughput": 25576.06, "total_tokens": 578732416} +{"current_steps": 2160, "total_steps": 25209, "loss": 1.1515, "lr": 4.5344130149245275e-05, "epoch": 0.25705296510892767, "percentage": 8.57, "elapsed_time": "6:18:50", "remaining_time": "2 days, 19:22:36", "throughput": 25579.26, "total_tokens": 581436672} +{"current_steps": 2170, "total_steps": 25209, "loss": 1.156, "lr": 4.5325495319152715e-05, "epoch": 0.25824302513258013, "percentage": 8.61, "elapsed_time": "6:20:28", "remaining_time": "2 days, 19:19:28", "throughput": 25586.38, "total_tokens": 584092288} +{"current_steps": 2180, "total_steps": 25209, "loss": 1.1542, "lr": 4.530688344495644e-05, "epoch": 0.2594330851562326, "percentage": 8.65, "elapsed_time": "6:22:17", "remaining_time": "2 days, 19:18:26", "throughput": 25582.52, "total_tokens": 586800128} +{"current_steps": 2190, "total_steps": 25209, "loss": 1.147, "lr": 4.528829447956357e-05, "epoch": 0.260623145179885, "percentage": 8.69, "elapsed_time": "6:23:58", "remaining_time": "2 days, 19:16:01", "throughput": 25585.62, "total_tokens": 589465088} +{"current_steps": 2200, "total_steps": 25209, "loss": 1.1521, "lr": 4.526972837601633e-05, "epoch": 0.26181320520353746, "percentage": 8.73, "elapsed_time": "6:25:37", "remaining_time": "2 days, 19:13:02", "throughput": 25592.55, "total_tokens": 592136192} +{"current_steps": 2210, "total_steps": 25209, "loss": 1.1588, "lr": 4.525118508749165e-05, "epoch": 0.2630032652271899, "percentage": 8.77, "elapsed_time": "6:27:16", "remaining_time": "2 days, 19:10:17", "throughput": 25597.15, "total_tokens": 594789376} +{"current_steps": 2220, "total_steps": 25209, "loss": 1.1489, "lr": 4.5232664567300546e-05, "epoch": 0.2641933252508423, "percentage": 8.81, "elapsed_time": "6:28:55", "remaining_time": "2 days, 19:07:24", "throughput": 25604.46, "total_tokens": 597482880} +{"current_steps": 2230, "total_steps": 25209, "loss": 1.1627, "lr": 4.521416676888773e-05, "epoch": 0.2653833852744948, "percentage": 8.85, "elapsed_time": "6:30:37", "remaining_time": "2 days, 19:05:12", "throughput": 25609.48, "total_tokens": 600223808} +{"current_steps": 2240, "total_steps": 25209, "loss": 1.1477, "lr": 4.519569164583107e-05, "epoch": 0.26657344529814725, "percentage": 8.89, "elapsed_time": "6:32:16", "remaining_time": "2 days, 19:02:21", "throughput": 25615.26, "total_tokens": 602889216} +{"current_steps": 2250, "total_steps": 25209, "loss": 1.1421, "lr": 4.517723915184109e-05, "epoch": 0.26776350532179966, "percentage": 8.93, "elapsed_time": "6:34:00", "remaining_time": "2 days, 19:00:30", "throughput": 25616.5, "total_tokens": 605594176} +{"current_steps": 2260, "total_steps": 25209, "loss": 1.1611, "lr": 4.5158809240760506e-05, "epoch": 0.2689535653454521, "percentage": 8.97, "elapsed_time": "6:35:38", "remaining_time": "2 days, 18:57:30", "throughput": 25622.89, "total_tokens": 608247296} +{"current_steps": 2270, "total_steps": 25209, "loss": 1.1597, "lr": 4.514040186656375e-05, "epoch": 0.2701436253691046, "percentage": 9.0, "elapsed_time": "6:37:23", "remaining_time": "2 days, 18:55:41", "throughput": 25625.09, "total_tokens": 610981504} +{"current_steps": 2280, "total_steps": 25209, "loss": 1.1568, "lr": 4.512201698335644e-05, "epoch": 0.271333685392757, "percentage": 9.04, "elapsed_time": "6:39:04", "remaining_time": "2 days, 18:53:19", "throughput": 25628.59, "total_tokens": 613662720} +{"current_steps": 2290, "total_steps": 25209, "loss": 1.1431, "lr": 4.510365454537496e-05, "epoch": 0.27252374541640945, "percentage": 9.08, "elapsed_time": "6:40:44", "remaining_time": "2 days, 18:50:43", "throughput": 25634.62, "total_tokens": 616370176} +{"current_steps": 2300, "total_steps": 25209, "loss": 1.1595, "lr": 4.5085314506985945e-05, "epoch": 0.2737138054400619, "percentage": 9.12, "elapsed_time": "6:42:23", "remaining_time": "2 days, 18:47:59", "throughput": 25639.71, "total_tokens": 619030848} +{"current_steps": 2310, "total_steps": 25209, "loss": 1.1551, "lr": 4.50669968226858e-05, "epoch": 0.2749038654637143, "percentage": 9.16, "elapsed_time": "6:44:06", "remaining_time": "2 days, 18:45:50", "throughput": 25643.19, "total_tokens": 621745152} +{"current_steps": 2320, "total_steps": 25209, "loss": 1.1573, "lr": 4.504870144710027e-05, "epoch": 0.2760939254873668, "percentage": 9.2, "elapsed_time": "6:45:48", "remaining_time": "2 days, 18:43:43", "throughput": 25644.87, "total_tokens": 624421184} +{"current_steps": 2330, "total_steps": 25209, "loss": 1.1422, "lr": 4.5030428334983884e-05, "epoch": 0.27728398551101924, "percentage": 9.24, "elapsed_time": "6:47:29", "remaining_time": "2 days, 18:41:18", "throughput": 25649.91, "total_tokens": 627129920} +{"current_steps": 2340, "total_steps": 25209, "loss": 1.156, "lr": 4.501217744121959e-05, "epoch": 0.27847404553467164, "percentage": 9.28, "elapsed_time": "6:49:11", "remaining_time": "2 days, 18:39:01", "throughput": 25652.37, "total_tokens": 629797824} +{"current_steps": 2350, "total_steps": 25209, "loss": 1.1522, "lr": 4.499394872081821e-05, "epoch": 0.2796641055583241, "percentage": 9.32, "elapsed_time": "6:50:50", "remaining_time": "2 days, 18:36:25", "throughput": 25658.2, "total_tokens": 632497664} +{"current_steps": 2360, "total_steps": 25209, "loss": 1.1449, "lr": 4.4975742128918e-05, "epoch": 0.28085416558197657, "percentage": 9.36, "elapsed_time": "6:52:27", "remaining_time": "2 days, 18:33:24", "throughput": 25665.27, "total_tokens": 635163840} +{"current_steps": 2370, "total_steps": 25209, "loss": 1.1537, "lr": 4.495755762078418e-05, "epoch": 0.282044225605629, "percentage": 9.4, "elapsed_time": "6:54:09", "remaining_time": "2 days, 18:31:10", "throughput": 25669.23, "total_tokens": 637876544} +{"current_steps": 2380, "total_steps": 25209, "loss": 1.1468, "lr": 4.49393951518085e-05, "epoch": 0.28323428562928143, "percentage": 9.44, "elapsed_time": "6:55:46", "remaining_time": "2 days, 18:28:03", "throughput": 25676.22, "total_tokens": 640522496} +{"current_steps": 2390, "total_steps": 25209, "loss": 1.1612, "lr": 4.4921254677508716e-05, "epoch": 0.2844243456529339, "percentage": 9.48, "elapsed_time": "6:57:25", "remaining_time": "2 days, 18:25:27", "throughput": 25680.9, "total_tokens": 643191744} +{"current_steps": 2400, "total_steps": 25209, "loss": 1.1354, "lr": 4.490313615352821e-05, "epoch": 0.2856144056765863, "percentage": 9.52, "elapsed_time": "6:59:03", "remaining_time": "2 days, 18:22:41", "throughput": 25687.77, "total_tokens": 645892288} +{"current_steps": 2410, "total_steps": 25209, "loss": 1.1439, "lr": 4.48850395356355e-05, "epoch": 0.28680446570023876, "percentage": 9.56, "elapsed_time": "7:00:42", "remaining_time": "2 days, 18:19:56", "throughput": 25694.92, "total_tokens": 648599488} +{"current_steps": 2420, "total_steps": 25209, "loss": 1.135, "lr": 4.486696477972375e-05, "epoch": 0.2879945257238912, "percentage": 9.6, "elapsed_time": "7:02:20", "remaining_time": "2 days, 18:17:11", "throughput": 25701.56, "total_tokens": 651295808} +{"current_steps": 2430, "total_steps": 25209, "loss": 1.1231, "lr": 4.484891184181041e-05, "epoch": 0.28918458574754363, "percentage": 9.64, "elapsed_time": "7:03:55", "remaining_time": "2 days, 18:13:52", "throughput": 25709.93, "total_tokens": 653940928} +{"current_steps": 2440, "total_steps": 25209, "loss": 1.133, "lr": 4.483088067803662e-05, "epoch": 0.2903746457711961, "percentage": 9.68, "elapsed_time": "7:05:34", "remaining_time": "2 days, 18:11:12", "throughput": 25716.43, "total_tokens": 656645888} +{"current_steps": 2450, "total_steps": 25209, "loss": 1.1349, "lr": 4.481287124466697e-05, "epoch": 0.2915647057948485, "percentage": 9.72, "elapsed_time": "7:07:16", "remaining_time": "2 days, 18:09:09", "throughput": 25718.16, "total_tokens": 659330432} +{"current_steps": 2460, "total_steps": 25209, "loss": 1.1369, "lr": 4.479488349808885e-05, "epoch": 0.29275476581850096, "percentage": 9.76, "elapsed_time": "7:08:57", "remaining_time": "2 days, 18:06:47", "throughput": 25722.23, "total_tokens": 662021888} +{"current_steps": 2470, "total_steps": 25209, "loss": 1.1382, "lr": 4.4776917394812114e-05, "epoch": 0.2939448258421534, "percentage": 9.8, "elapsed_time": "7:10:34", "remaining_time": "2 days, 18:03:53", "throughput": 25727.98, "total_tokens": 664666304} +{"current_steps": 2480, "total_steps": 25209, "loss": 1.1369, "lr": 4.475897289146862e-05, "epoch": 0.29513488586580583, "percentage": 9.84, "elapsed_time": "7:12:11", "remaining_time": "2 days, 18:01:03", "throughput": 25733.42, "total_tokens": 667316672} +{"current_steps": 2490, "total_steps": 25209, "loss": 1.1345, "lr": 4.4741049944811806e-05, "epoch": 0.2963249458894583, "percentage": 9.88, "elapsed_time": "7:13:52", "remaining_time": "2 days, 17:58:41", "throughput": 25737.61, "total_tokens": 670009728} +{"current_steps": 2500, "total_steps": 25209, "loss": 1.131, "lr": 4.472314851171621e-05, "epoch": 0.29751500591311075, "percentage": 9.92, "elapsed_time": "7:15:28", "remaining_time": "2 days, 17:55:40", "throughput": 25744.24, "total_tokens": 672657728} +{"current_steps": 2510, "total_steps": 25209, "loss": 1.1519, "lr": 4.4705268549177084e-05, "epoch": 0.29870506593676316, "percentage": 9.96, "elapsed_time": "7:17:08", "remaining_time": "2 days, 17:53:16", "throughput": 25748.77, "total_tokens": 675353728} +{"current_steps": 2520, "total_steps": 25209, "loss": 1.1473, "lr": 4.468741001430989e-05, "epoch": 0.2998951259604156, "percentage": 10.0, "elapsed_time": "7:18:46", "remaining_time": "2 days, 17:50:35", "throughput": 25754.22, "total_tokens": 678027136} +{"current_steps": 2530, "total_steps": 25209, "loss": 1.1307, "lr": 4.466957286434997e-05, "epoch": 0.3010851859840681, "percentage": 10.04, "elapsed_time": "7:20:28", "remaining_time": "2 days, 17:48:25", "throughput": 25758.29, "total_tokens": 680751936} +{"current_steps": 2540, "total_steps": 25209, "loss": 1.1343, "lr": 4.4651757056652e-05, "epoch": 0.3022752460077205, "percentage": 10.08, "elapsed_time": "7:22:10", "remaining_time": "2 days, 17:46:21", "throughput": 25761.32, "total_tokens": 683466304} +{"current_steps": 2550, "total_steps": 25209, "loss": 1.1482, "lr": 4.463396254868968e-05, "epoch": 0.30346530603137295, "percentage": 10.12, "elapsed_time": "7:23:52", "remaining_time": "2 days, 17:44:13", "throughput": 25763.95, "total_tokens": 686158144} +{"current_steps": 2560, "total_steps": 25209, "loss": 1.1424, "lr": 4.461618929805519e-05, "epoch": 0.3046553660550254, "percentage": 10.16, "elapsed_time": "7:25:31", "remaining_time": "2 days, 17:41:41", "throughput": 25769.52, "total_tokens": 688860096} +{"current_steps": 2570, "total_steps": 25209, "loss": 1.1255, "lr": 4.459843726245888e-05, "epoch": 0.3058454260786778, "percentage": 10.19, "elapsed_time": "7:27:11", "remaining_time": "2 days, 17:39:21", "throughput": 25774.09, "total_tokens": 691570048} +{"current_steps": 2580, "total_steps": 25209, "loss": 1.1363, "lr": 4.458070639972875e-05, "epoch": 0.3070354861023303, "percentage": 10.23, "elapsed_time": "7:28:53", "remaining_time": "2 days, 17:37:11", "throughput": 25777.57, "total_tokens": 694278976} +{"current_steps": 2590, "total_steps": 25209, "loss": 1.1321, "lr": 4.456299666781007e-05, "epoch": 0.30822554612598274, "percentage": 10.27, "elapsed_time": "7:30:30", "remaining_time": "2 days, 17:34:20", "throughput": 25782.3, "total_tokens": 696900544} +{"current_steps": 2600, "total_steps": 25209, "loss": 1.1397, "lr": 4.4545308024764984e-05, "epoch": 0.30941560614963515, "percentage": 10.31, "elapsed_time": "7:32:07", "remaining_time": "2 days, 17:31:32", "throughput": 25787.72, "total_tokens": 699550208} +{"current_steps": 2610, "total_steps": 25209, "loss": 1.1267, "lr": 4.452764042877207e-05, "epoch": 0.3106056661732876, "percentage": 10.35, "elapsed_time": "7:33:47", "remaining_time": "2 days, 17:29:15", "throughput": 25790.74, "total_tokens": 702225344} +{"current_steps": 2620, "total_steps": 25209, "loss": 1.1356, "lr": 4.45099938381259e-05, "epoch": 0.31179572619694007, "percentage": 10.39, "elapsed_time": "7:35:28", "remaining_time": "2 days, 17:27:03", "throughput": 25793.48, "total_tokens": 704907200} +{"current_steps": 2630, "total_steps": 25209, "loss": 1.15, "lr": 4.449236821123667e-05, "epoch": 0.3129857862205925, "percentage": 10.43, "elapsed_time": "7:37:20", "remaining_time": "2 days, 17:26:19", "throughput": 25787.13, "total_tokens": 707606400} +{"current_steps": 2640, "total_steps": 25209, "loss": 1.1331, "lr": 4.447476350662976e-05, "epoch": 0.31417584624424494, "percentage": 10.47, "elapsed_time": "7:39:03", "remaining_time": "2 days, 17:24:27", "throughput": 25787.78, "total_tokens": 710292160} +{"current_steps": 2650, "total_steps": 25209, "loss": 1.1283, "lr": 4.4457179682945346e-05, "epoch": 0.3153659062678974, "percentage": 10.51, "elapsed_time": "7:40:41", "remaining_time": "2 days, 17:21:50", "throughput": 25793.19, "total_tokens": 712972800} +{"current_steps": 2660, "total_steps": 25209, "loss": 1.1302, "lr": 4.443961669893798e-05, "epoch": 0.3165559662915498, "percentage": 10.55, "elapsed_time": "7:42:19", "remaining_time": "2 days, 17:19:13", "throughput": 25799.46, "total_tokens": 715675392} +{"current_steps": 2670, "total_steps": 25209, "loss": 1.1385, "lr": 4.4422074513476155e-05, "epoch": 0.31774602631520227, "percentage": 10.59, "elapsed_time": "7:44:01", "remaining_time": "2 days, 17:17:08", "throughput": 25802.56, "total_tokens": 718389056} +{"current_steps": 2680, "total_steps": 25209, "loss": 1.1324, "lr": 4.4404553085541955e-05, "epoch": 0.31893608633885473, "percentage": 10.63, "elapsed_time": "7:45:42", "remaining_time": "2 days, 17:14:54", "throughput": 25806.4, "total_tokens": 721095488} +{"current_steps": 2690, "total_steps": 25209, "loss": 1.1385, "lr": 4.438705237423063e-05, "epoch": 0.32012614636250714, "percentage": 10.67, "elapsed_time": "7:47:22", "remaining_time": "2 days, 17:12:31", "throughput": 25810.38, "total_tokens": 723779776} +{"current_steps": 2700, "total_steps": 25209, "loss": 1.1402, "lr": 4.436957233875017e-05, "epoch": 0.3213162063861596, "percentage": 10.71, "elapsed_time": "7:49:01", "remaining_time": "2 days, 17:10:04", "throughput": 25815.41, "total_tokens": 726478720} +{"current_steps": 2710, "total_steps": 25209, "loss": 1.1339, "lr": 4.4352112938420956e-05, "epoch": 0.32250626640981206, "percentage": 10.75, "elapsed_time": "7:50:42", "remaining_time": "2 days, 17:07:51", "throughput": 25818.92, "total_tokens": 729179648} +{"current_steps": 2720, "total_steps": 25209, "loss": 1.1285, "lr": 4.433467413267529e-05, "epoch": 0.32369632643346447, "percentage": 10.79, "elapsed_time": "7:52:27", "remaining_time": "2 days, 17:06:15", "throughput": 25818.56, "total_tokens": 731886592} +{"current_steps": 2730, "total_steps": 25209, "loss": 1.1281, "lr": 4.431725588105708e-05, "epoch": 0.3248863864571169, "percentage": 10.83, "elapsed_time": "7:54:10", "remaining_time": "2 days, 17:04:22", "throughput": 25821.84, "total_tokens": 734642816} +{"current_steps": 2740, "total_steps": 25209, "loss": 1.1346, "lr": 4.4299858143221377e-05, "epoch": 0.3260764464807694, "percentage": 10.87, "elapsed_time": "7:55:53", "remaining_time": "2 days, 17:02:27", "throughput": 25824.08, "total_tokens": 737361984} +{"current_steps": 2750, "total_steps": 25209, "loss": 1.139, "lr": 4.4282480878934065e-05, "epoch": 0.3272665065044218, "percentage": 10.91, "elapsed_time": "7:57:35", "remaining_time": "2 days, 17:00:28", "throughput": 25827.37, "total_tokens": 740100288} +{"current_steps": 2760, "total_steps": 25209, "loss": 1.1464, "lr": 4.4265124048071346e-05, "epoch": 0.32845656652807426, "percentage": 10.95, "elapsed_time": "7:59:15", "remaining_time": "2 days, 16:58:10", "throughput": 25830.72, "total_tokens": 742782976} +{"current_steps": 2770, "total_steps": 25209, "loss": 1.1398, "lr": 4.4247787610619477e-05, "epoch": 0.3296466265517267, "percentage": 10.99, "elapsed_time": "8:00:59", "remaining_time": "2 days, 16:56:24", "throughput": 25832.32, "total_tokens": 745511872} +{"current_steps": 2780, "total_steps": 25209, "loss": 1.1298, "lr": 4.42304715266743e-05, "epoch": 0.3308366865753791, "percentage": 11.03, "elapsed_time": "8:02:32", "remaining_time": "2 days, 16:53:09", "throughput": 25841.01, "total_tokens": 748166208} +{"current_steps": 2790, "total_steps": 25209, "loss": 1.1371, "lr": 4.421317575644092e-05, "epoch": 0.3320267465990316, "percentage": 11.07, "elapsed_time": "8:04:13", "remaining_time": "2 days, 16:50:59", "throughput": 25844.68, "total_tokens": 750880384} +{"current_steps": 2800, "total_steps": 25209, "loss": 1.1452, "lr": 4.419590026023325e-05, "epoch": 0.33321680662268405, "percentage": 11.11, "elapsed_time": "8:06:03", "remaining_time": "2 days, 16:50:01", "throughput": 25837.65, "total_tokens": 753516288} +{"current_steps": 2810, "total_steps": 25209, "loss": 1.1176, "lr": 4.417864499847368e-05, "epoch": 0.33440686664633645, "percentage": 11.15, "elapsed_time": "8:07:42", "remaining_time": "2 days, 16:47:37", "throughput": 25842.38, "total_tokens": 756217216} +{"current_steps": 2820, "total_steps": 25209, "loss": 1.1343, "lr": 4.4161409931692676e-05, "epoch": 0.3355969266699889, "percentage": 11.19, "elapsed_time": "8:09:27", "remaining_time": "2 days, 16:45:57", "throughput": 25843.34, "total_tokens": 758948672} +{"current_steps": 2830, "total_steps": 25209, "loss": 1.1303, "lr": 4.414419502052841e-05, "epoch": 0.3367869866936414, "percentage": 11.23, "elapsed_time": "8:11:00", "remaining_time": "2 days, 16:42:43", "throughput": 25852.51, "total_tokens": 761617984} +{"current_steps": 2840, "total_steps": 25209, "loss": 1.1401, "lr": 4.412700022572637e-05, "epoch": 0.3379770467172938, "percentage": 11.27, "elapsed_time": "8:12:39", "remaining_time": "2 days, 16:40:23", "throughput": 25856.71, "total_tokens": 764312768} +{"current_steps": 2850, "total_steps": 25209, "loss": 1.1245, "lr": 4.410982550813902e-05, "epoch": 0.33916710674094624, "percentage": 11.31, "elapsed_time": "8:14:23", "remaining_time": "2 days, 16:38:34", "throughput": 25859.09, "total_tokens": 767061120} +{"current_steps": 2860, "total_steps": 25209, "loss": 1.1314, "lr": 4.409267082872535e-05, "epoch": 0.3403571667645987, "percentage": 11.35, "elapsed_time": "8:16:02", "remaining_time": "2 days, 16:36:16", "throughput": 25864.18, "total_tokens": 769790016} +{"current_steps": 2870, "total_steps": 25209, "loss": 1.1283, "lr": 4.407553614855059e-05, "epoch": 0.3415472267882511, "percentage": 11.38, "elapsed_time": "8:17:45", "remaining_time": "2 days, 16:34:21", "throughput": 25867.52, "total_tokens": 772544640} +{"current_steps": 2880, "total_steps": 25209, "loss": 1.1381, "lr": 4.405842142878579e-05, "epoch": 0.3427372868119036, "percentage": 11.42, "elapsed_time": "8:19:20", "remaining_time": "2 days, 16:31:28", "throughput": 25873.8, "total_tokens": 775194048} +{"current_steps": 2890, "total_steps": 25209, "loss": 1.1127, "lr": 4.404132663070745e-05, "epoch": 0.34392734683555604, "percentage": 11.46, "elapsed_time": "8:20:58", "remaining_time": "2 days, 16:29:00", "throughput": 25878.14, "total_tokens": 777869120} +{"current_steps": 2900, "total_steps": 25209, "loss": 1.1231, "lr": 4.402425171569716e-05, "epoch": 0.34511740685920844, "percentage": 11.5, "elapsed_time": "8:22:40", "remaining_time": "2 days, 16:26:53", "throughput": 25882.0, "total_tokens": 780602048} +{"current_steps": 2910, "total_steps": 25209, "loss": 1.1382, "lr": 4.400719664524127e-05, "epoch": 0.3463074668828609, "percentage": 11.54, "elapsed_time": "8:24:21", "remaining_time": "2 days, 16:24:51", "throughput": 25884.89, "total_tokens": 783320448} +{"current_steps": 2920, "total_steps": 25209, "loss": 1.1345, "lr": 4.399016138093044e-05, "epoch": 0.34749752690651337, "percentage": 11.58, "elapsed_time": "8:26:01", "remaining_time": "2 days, 16:22:35", "throughput": 25888.17, "total_tokens": 786002432} +{"current_steps": 2930, "total_steps": 25209, "loss": 1.1202, "lr": 4.397314588445937e-05, "epoch": 0.34868758693016577, "percentage": 11.62, "elapsed_time": "8:27:37", "remaining_time": "2 days, 16:19:53", "throughput": 25893.88, "total_tokens": 788669824} +{"current_steps": 2940, "total_steps": 25209, "loss": 1.124, "lr": 4.395615011762637e-05, "epoch": 0.34987764695381823, "percentage": 11.66, "elapsed_time": "8:29:13", "remaining_time": "2 days, 16:17:08", "throughput": 25899.67, "total_tokens": 791331264} +{"current_steps": 2950, "total_steps": 25209, "loss": 1.1271, "lr": 4.3939174042333057e-05, "epoch": 0.3510677069774707, "percentage": 11.7, "elapsed_time": "8:30:54", "remaining_time": "2 days, 16:15:02", "throughput": 25901.68, "total_tokens": 794008256} +{"current_steps": 2960, "total_steps": 25209, "loss": 1.1249, "lr": 4.3922217620583904e-05, "epoch": 0.3522577670011231, "percentage": 11.74, "elapsed_time": "8:32:32", "remaining_time": "2 days, 16:12:36", "throughput": 25905.82, "total_tokens": 796681600} +{"current_steps": 2970, "total_steps": 25209, "loss": 1.1348, "lr": 4.3905280814486025e-05, "epoch": 0.35344782702477556, "percentage": 11.78, "elapsed_time": "8:34:12", "remaining_time": "2 days, 16:10:23", "throughput": 25909.56, "total_tokens": 799387648} +{"current_steps": 2980, "total_steps": 25209, "loss": 1.1188, "lr": 4.388836358624867e-05, "epoch": 0.354637887048428, "percentage": 11.82, "elapsed_time": "8:35:51", "remaining_time": "2 days, 16:07:58", "throughput": 25914.38, "total_tokens": 802087168} +{"current_steps": 2990, "total_steps": 25209, "loss": 1.1433, "lr": 4.3871465898182976e-05, "epoch": 0.35582794707208043, "percentage": 11.86, "elapsed_time": "8:37:28", "remaining_time": "2 days, 16:05:26", "throughput": 25919.31, "total_tokens": 804762944} +{"current_steps": 3000, "total_steps": 25209, "loss": 1.1235, "lr": 4.385458771270156e-05, "epoch": 0.3570180070957329, "percentage": 11.9, "elapsed_time": "8:39:06", "remaining_time": "2 days, 16:02:57", "throughput": 25923.94, "total_tokens": 807438720} +{"current_steps": 3010, "total_steps": 25209, "loss": 1.1194, "lr": 4.3837728992318205e-05, "epoch": 0.35820806711938535, "percentage": 11.94, "elapsed_time": "8:40:43", "remaining_time": "2 days, 16:00:21", "throughput": 25928.8, "total_tokens": 810099136} +{"current_steps": 3020, "total_steps": 25209, "loss": 1.1257, "lr": 4.382088969964746e-05, "epoch": 0.35939812714303776, "percentage": 11.98, "elapsed_time": "8:42:20", "remaining_time": "2 days, 15:57:46", "throughput": 25934.07, "total_tokens": 812776192} +{"current_steps": 3030, "total_steps": 25209, "loss": 1.1182, "lr": 4.380406979740436e-05, "epoch": 0.3605881871666902, "percentage": 12.02, "elapsed_time": "8:43:59", "remaining_time": "2 days, 15:55:33", "throughput": 25937.43, "total_tokens": 815467456} +{"current_steps": 3040, "total_steps": 25209, "loss": 1.1219, "lr": 4.3787269248403994e-05, "epoch": 0.3617782471903427, "percentage": 12.06, "elapsed_time": "8:45:37", "remaining_time": "2 days, 15:53:06", "throughput": 25942.12, "total_tokens": 818156032} +{"current_steps": 3050, "total_steps": 25209, "loss": 1.1245, "lr": 4.377048801556126e-05, "epoch": 0.3629683072139951, "percentage": 12.1, "elapsed_time": "8:47:15", "remaining_time": "2 days, 15:50:41", "throughput": 25946.67, "total_tokens": 820842688} +{"current_steps": 3060, "total_steps": 25209, "loss": 1.1442, "lr": 4.3753726061890446e-05, "epoch": 0.36415836723764755, "percentage": 12.14, "elapsed_time": "8:48:56", "remaining_time": "2 days, 15:48:39", "throughput": 25948.96, "total_tokens": 823539008} +{"current_steps": 3070, "total_steps": 25209, "loss": 1.1279, "lr": 4.373698335050488e-05, "epoch": 0.3653484272613, "percentage": 12.18, "elapsed_time": "8:50:33", "remaining_time": "2 days, 15:46:03", "throughput": 25954.07, "total_tokens": 826206848} +{"current_steps": 3080, "total_steps": 25209, "loss": 1.1336, "lr": 4.372025984461667e-05, "epoch": 0.3665384872849524, "percentage": 12.22, "elapsed_time": "8:52:08", "remaining_time": "2 days, 15:43:16", "throughput": 25959.87, "total_tokens": 828853760} +{"current_steps": 3090, "total_steps": 25209, "loss": 1.132, "lr": 4.370355550753629e-05, "epoch": 0.3677285473086049, "percentage": 12.26, "elapsed_time": "8:53:48", "remaining_time": "2 days, 15:41:05", "throughput": 25962.93, "total_tokens": 831543680} +{"current_steps": 3100, "total_steps": 25209, "loss": 1.1244, "lr": 4.368687030267226e-05, "epoch": 0.36891860733225734, "percentage": 12.3, "elapsed_time": "8:55:25", "remaining_time": "2 days, 15:38:35", "throughput": 25966.71, "total_tokens": 834187776} +{"current_steps": 3110, "total_steps": 25209, "loss": 1.1243, "lr": 4.367020419353081e-05, "epoch": 0.37010866735590975, "percentage": 12.34, "elapsed_time": "8:57:01", "remaining_time": "2 days, 15:35:56", "throughput": 25971.6, "total_tokens": 836834240} +{"current_steps": 3120, "total_steps": 25209, "loss": 1.1367, "lr": 4.365355714371558e-05, "epoch": 0.3712987273795622, "percentage": 12.38, "elapsed_time": "8:58:37", "remaining_time": "2 days, 15:33:21", "throughput": 25975.91, "total_tokens": 839477376} +{"current_steps": 3130, "total_steps": 25209, "loss": 1.1191, "lr": 4.3636929116927235e-05, "epoch": 0.37248878740321467, "percentage": 12.42, "elapsed_time": "9:00:12", "remaining_time": "2 days, 15:30:35", "throughput": 25981.89, "total_tokens": 842129280} +{"current_steps": 3140, "total_steps": 25209, "loss": 1.1326, "lr": 4.362032007696314e-05, "epoch": 0.3736788474268671, "percentage": 12.46, "elapsed_time": "9:01:48", "remaining_time": "2 days, 15:28:02", "throughput": 25987.27, "total_tokens": 844812224} +{"current_steps": 3150, "total_steps": 25209, "loss": 1.1335, "lr": 4.360372998771707e-05, "epoch": 0.37486890745051954, "percentage": 12.5, "elapsed_time": "9:03:28", "remaining_time": "2 days, 15:25:50", "throughput": 25989.45, "total_tokens": 847469568} +{"current_steps": 3160, "total_steps": 25209, "loss": 1.1129, "lr": 4.358715881317884e-05, "epoch": 0.376058967474172, "percentage": 12.54, "elapsed_time": "9:05:11", "remaining_time": "2 days, 15:24:04", "throughput": 25991.69, "total_tokens": 850225024} +{"current_steps": 3170, "total_steps": 25209, "loss": 1.1394, "lr": 4.357060651743399e-05, "epoch": 0.3772490274978244, "percentage": 12.57, "elapsed_time": "9:06:49", "remaining_time": "2 days, 15:21:43", "throughput": 25996.13, "total_tokens": 852920576} +{"current_steps": 3180, "total_steps": 25209, "loss": 1.1304, "lr": 4.3554073064663454e-05, "epoch": 0.37843908752147687, "percentage": 12.61, "elapsed_time": "9:08:25", "remaining_time": "2 days, 15:19:05", "throughput": 26002.57, "total_tokens": 855618048} +{"current_steps": 3190, "total_steps": 25209, "loss": 1.1176, "lr": 4.353755841914325e-05, "epoch": 0.37962914754512933, "percentage": 12.65, "elapsed_time": "9:10:03", "remaining_time": "2 days, 15:16:47", "throughput": 26007.94, "total_tokens": 858355904} +{"current_steps": 3200, "total_steps": 25209, "loss": 1.1219, "lr": 4.3521062545244116e-05, "epoch": 0.38081920756878174, "percentage": 12.69, "elapsed_time": "9:11:40", "remaining_time": "2 days, 15:14:21", "throughput": 26012.27, "total_tokens": 861027392} +{"current_steps": 3210, "total_steps": 25209, "loss": 1.1273, "lr": 4.350458540743126e-05, "epoch": 0.3820092675924342, "percentage": 12.73, "elapsed_time": "9:13:15", "remaining_time": "2 days, 15:11:36", "throughput": 26017.04, "total_tokens": 863645440} +{"current_steps": 3220, "total_steps": 25209, "loss": 1.111, "lr": 4.3488126970263955e-05, "epoch": 0.38319932761608666, "percentage": 12.77, "elapsed_time": "9:14:52", "remaining_time": "2 days, 15:09:10", "throughput": 26022.43, "total_tokens": 866350528} +{"current_steps": 3230, "total_steps": 25209, "loss": 1.1202, "lr": 4.347168719839527e-05, "epoch": 0.38438938763973907, "percentage": 12.81, "elapsed_time": "9:16:28", "remaining_time": "2 days, 15:06:35", "throughput": 26027.77, "total_tokens": 869024960} +{"current_steps": 3240, "total_steps": 25209, "loss": 1.1432, "lr": 4.345526605657173e-05, "epoch": 0.38557944766339153, "percentage": 12.85, "elapsed_time": "9:18:06", "remaining_time": "2 days, 15:04:20", "throughput": 26031.15, "total_tokens": 871704704} +{"current_steps": 3250, "total_steps": 25209, "loss": 1.1305, "lr": 4.343886350963304e-05, "epoch": 0.386769507687044, "percentage": 12.89, "elapsed_time": "9:19:46", "remaining_time": "2 days, 15:02:14", "throughput": 26035.45, "total_tokens": 874451200} +{"current_steps": 3260, "total_steps": 25209, "loss": 1.1283, "lr": 4.3422479522511697e-05, "epoch": 0.3879595677106964, "percentage": 12.93, "elapsed_time": "9:21:24", "remaining_time": "2 days, 14:59:48", "throughput": 26038.96, "total_tokens": 877097792} +{"current_steps": 3270, "total_steps": 25209, "loss": 1.1179, "lr": 4.340611406023272e-05, "epoch": 0.38914962773434886, "percentage": 12.97, "elapsed_time": "9:22:59", "remaining_time": "2 days, 14:57:15", "throughput": 26043.93, "total_tokens": 879761856} +{"current_steps": 3280, "total_steps": 25209, "loss": 1.1208, "lr": 4.338976708791336e-05, "epoch": 0.3903396877580013, "percentage": 13.01, "elapsed_time": "9:24:41", "remaining_time": "2 days, 14:55:20", "throughput": 26046.51, "total_tokens": 882496000} +{"current_steps": 3290, "total_steps": 25209, "loss": 1.1305, "lr": 4.337343857076272e-05, "epoch": 0.3915297477816537, "percentage": 13.05, "elapsed_time": "9:26:19", "remaining_time": "2 days, 14:53:03", "throughput": 26050.34, "total_tokens": 885184192} +{"current_steps": 3300, "total_steps": 25209, "loss": 1.1283, "lr": 4.33571284740815e-05, "epoch": 0.3927198078053062, "percentage": 13.09, "elapsed_time": "9:28:01", "remaining_time": "2 days, 14:51:11", "throughput": 26052.83, "total_tokens": 887924480} +{"current_steps": 3310, "total_steps": 25209, "loss": 1.1258, "lr": 4.3340836763261675e-05, "epoch": 0.39390986782895865, "percentage": 13.13, "elapsed_time": "9:29:41", "remaining_time": "2 days, 14:49:05", "throughput": 26055.5, "total_tokens": 890615680} +{"current_steps": 3320, "total_steps": 25209, "loss": 1.1131, "lr": 4.332456340378618e-05, "epoch": 0.39509992785261105, "percentage": 13.17, "elapsed_time": "9:31:16", "remaining_time": "2 days, 14:46:26", "throughput": 26060.7, "total_tokens": 893265024} +{"current_steps": 3330, "total_steps": 25209, "loss": 1.1305, "lr": 4.3308308361228586e-05, "epoch": 0.3962899878762635, "percentage": 13.21, "elapsed_time": "9:32:51", "remaining_time": "2 days, 14:43:50", "throughput": 26067.01, "total_tokens": 895964160} +{"current_steps": 3340, "total_steps": 25209, "loss": 1.1144, "lr": 4.329207160125282e-05, "epoch": 0.397480047899916, "percentage": 13.25, "elapsed_time": "9:34:31", "remaining_time": "2 days, 14:41:48", "throughput": 26069.77, "total_tokens": 898676800} +{"current_steps": 3350, "total_steps": 25209, "loss": 1.1155, "lr": 4.327585308961287e-05, "epoch": 0.3986701079235684, "percentage": 13.29, "elapsed_time": "9:36:12", "remaining_time": "2 days, 14:39:45", "throughput": 26072.74, "total_tokens": 901387200} +{"current_steps": 3360, "total_steps": 25209, "loss": 1.1069, "lr": 4.325965279215243e-05, "epoch": 0.39986016794722085, "percentage": 13.33, "elapsed_time": "9:37:49", "remaining_time": "2 days, 14:37:22", "throughput": 26077.36, "total_tokens": 904081280} +{"current_steps": 3370, "total_steps": 25209, "loss": 1.1153, "lr": 4.3243470674804686e-05, "epoch": 0.4010502279708733, "percentage": 13.37, "elapsed_time": "9:39:27", "remaining_time": "2 days, 14:35:06", "throughput": 26081.41, "total_tokens": 906781248} +{"current_steps": 3380, "total_steps": 25209, "loss": 1.1135, "lr": 4.3227306703591904e-05, "epoch": 0.4022402879945257, "percentage": 13.41, "elapsed_time": "9:41:05", "remaining_time": "2 days, 14:32:51", "throughput": 26084.53, "total_tokens": 909451136} +{"current_steps": 3390, "total_steps": 25209, "loss": 1.1242, "lr": 4.32111608446252e-05, "epoch": 0.4034303480181782, "percentage": 13.45, "elapsed_time": "9:42:42", "remaining_time": "2 days, 14:30:30", "throughput": 26088.81, "total_tokens": 912138752} +{"current_steps": 3400, "total_steps": 25209, "loss": 1.1128, "lr": 4.319503306410426e-05, "epoch": 0.40462040804183064, "percentage": 13.49, "elapsed_time": "9:44:24", "remaining_time": "2 days, 14:28:35", "throughput": 26091.78, "total_tokens": 914882432} +{"current_steps": 3410, "total_steps": 25209, "loss": 1.1129, "lr": 4.317892332831699e-05, "epoch": 0.40581046806548304, "percentage": 13.53, "elapsed_time": "9:46:00", "remaining_time": "2 days, 14:26:12", "throughput": 26095.0, "total_tokens": 917525056} +{"current_steps": 3420, "total_steps": 25209, "loss": 1.1098, "lr": 4.316283160363922e-05, "epoch": 0.4070005280891355, "percentage": 13.57, "elapsed_time": "9:47:39", "remaining_time": "2 days, 14:24:02", "throughput": 26097.62, "total_tokens": 920198400} +{"current_steps": 3430, "total_steps": 25209, "loss": 1.1119, "lr": 4.314675785653447e-05, "epoch": 0.4081905881127879, "percentage": 13.61, "elapsed_time": "9:49:18", "remaining_time": "2 days, 14:21:51", "throughput": 26100.61, "total_tokens": 922878656} +{"current_steps": 3440, "total_steps": 25209, "loss": 1.1163, "lr": 4.3130702053553606e-05, "epoch": 0.4093806481364404, "percentage": 13.65, "elapsed_time": "9:50:55", "remaining_time": "2 days, 14:19:27", "throughput": 26104.59, "total_tokens": 925542976} +{"current_steps": 3450, "total_steps": 25209, "loss": 1.113, "lr": 4.3114664161334546e-05, "epoch": 0.41057070816009283, "percentage": 13.69, "elapsed_time": "9:52:28", "remaining_time": "2 days, 14:16:40", "throughput": 26111.42, "total_tokens": 928212928} +{"current_steps": 3460, "total_steps": 25209, "loss": 1.1126, "lr": 4.3098644146601984e-05, "epoch": 0.41176076818374524, "percentage": 13.73, "elapsed_time": "9:54:10", "remaining_time": "2 days, 14:14:54", "throughput": 26113.75, "total_tokens": 930974144} +{"current_steps": 3470, "total_steps": 25209, "loss": 1.1018, "lr": 4.30826419761671e-05, "epoch": 0.4129508282073977, "percentage": 13.76, "elapsed_time": "9:55:49", "remaining_time": "2 days, 14:12:42", "throughput": 26116.4, "total_tokens": 933636352} +{"current_steps": 3480, "total_steps": 25209, "loss": 1.1057, "lr": 4.30666576169273e-05, "epoch": 0.41414088823105016, "percentage": 13.8, "elapsed_time": "9:57:26", "remaining_time": "2 days, 14:10:26", "throughput": 26120.02, "total_tokens": 936319296} +{"current_steps": 3490, "total_steps": 25209, "loss": 1.1204, "lr": 4.305069103586585e-05, "epoch": 0.41533094825470257, "percentage": 13.84, "elapsed_time": "9:59:05", "remaining_time": "2 days, 14:08:19", "throughput": 26122.45, "total_tokens": 938997312} +{"current_steps": 3500, "total_steps": 25209, "loss": 1.1185, "lr": 4.303474220005164e-05, "epoch": 0.41652100827835503, "percentage": 13.88, "elapsed_time": "10:00:43", "remaining_time": "2 days, 14:06:00", "throughput": 26126.49, "total_tokens": 941682304} +{"current_steps": 3510, "total_steps": 25209, "loss": 1.1214, "lr": 4.3018811076638944e-05, "epoch": 0.4177110683020075, "percentage": 13.92, "elapsed_time": "10:02:32", "remaining_time": "2 days, 14:04:53", "throughput": 26123.48, "total_tokens": 944416768} +{"current_steps": 3520, "total_steps": 25209, "loss": 1.1186, "lr": 4.300289763286704e-05, "epoch": 0.4189011283256599, "percentage": 13.96, "elapsed_time": "10:04:07", "remaining_time": "2 days, 14:02:21", "throughput": 26128.61, "total_tokens": 947085056} +{"current_steps": 3530, "total_steps": 25209, "loss": 1.1059, "lr": 4.298700183606e-05, "epoch": 0.42009118834931236, "percentage": 14.0, "elapsed_time": "10:05:41", "remaining_time": "2 days, 13:59:45", "throughput": 26134.65, "total_tokens": 949769728} +{"current_steps": 3540, "total_steps": 25209, "loss": 1.1062, "lr": 4.297112365362637e-05, "epoch": 0.4212812483729648, "percentage": 14.04, "elapsed_time": "10:07:19", "remaining_time": "2 days, 13:57:35", "throughput": 26137.36, "total_tokens": 952442176} +{"current_steps": 3550, "total_steps": 25209, "loss": 1.1069, "lr": 4.295526305305891e-05, "epoch": 0.42247130839661723, "percentage": 14.08, "elapsed_time": "10:08:54", "remaining_time": "2 days, 13:55:01", "throughput": 26142.12, "total_tokens": 955088896} +{"current_steps": 3560, "total_steps": 25209, "loss": 1.1224, "lr": 4.293942000193429e-05, "epoch": 0.4236613684202697, "percentage": 14.12, "elapsed_time": "10:10:31", "remaining_time": "2 days, 13:52:42", "throughput": 26145.89, "total_tokens": 957761536} +{"current_steps": 3570, "total_steps": 25209, "loss": 1.1167, "lr": 4.2923594467912866e-05, "epoch": 0.42485142844392215, "percentage": 14.16, "elapsed_time": "10:12:12", "remaining_time": "2 days, 13:50:48", "throughput": 26146.58, "total_tokens": 960431744} +{"current_steps": 3580, "total_steps": 25209, "loss": 1.1189, "lr": 4.290778641873832e-05, "epoch": 0.42604148846757456, "percentage": 14.2, "elapsed_time": "10:13:48", "remaining_time": "2 days, 13:48:25", "throughput": 26151.05, "total_tokens": 963110784} +{"current_steps": 3590, "total_steps": 25209, "loss": 1.1115, "lr": 4.2891995822237455e-05, "epoch": 0.427231548491227, "percentage": 14.24, "elapsed_time": "10:15:32", "remaining_time": "2 days, 13:46:47", "throughput": 26151.55, "total_tokens": 965842688} +{"current_steps": 3600, "total_steps": 25209, "loss": 1.1148, "lr": 4.28762226463199e-05, "epoch": 0.4284216085148795, "percentage": 14.28, "elapsed_time": "10:17:12", "remaining_time": "2 days, 13:44:48", "throughput": 26154.41, "total_tokens": 968568768} +{"current_steps": 3610, "total_steps": 25209, "loss": 1.1032, "lr": 4.286046685897781e-05, "epoch": 0.4296116685385319, "percentage": 14.32, "elapsed_time": "10:18:49", "remaining_time": "2 days, 13:42:32", "throughput": 26158.56, "total_tokens": 971264704} +{"current_steps": 3620, "total_steps": 25209, "loss": 1.1144, "lr": 4.284472842828562e-05, "epoch": 0.43080172856218435, "percentage": 14.36, "elapsed_time": "10:20:29", "remaining_time": "2 days, 13:40:30", "throughput": 26160.66, "total_tokens": 973951808} +{"current_steps": 3630, "total_steps": 25209, "loss": 1.1146, "lr": 4.282900732239977e-05, "epoch": 0.4319917885858368, "percentage": 14.4, "elapsed_time": "10:22:07", "remaining_time": "2 days, 13:38:16", "throughput": 26164.28, "total_tokens": 976638208} +{"current_steps": 3640, "total_steps": 25209, "loss": 1.1126, "lr": 4.281330350955845e-05, "epoch": 0.4331818486094892, "percentage": 14.44, "elapsed_time": "10:23:49", "remaining_time": "2 days, 13:36:29", "throughput": 26165.86, "total_tokens": 979371264} +{"current_steps": 3650, "total_steps": 25209, "loss": 1.1086, "lr": 4.279761695808125e-05, "epoch": 0.4343719086331417, "percentage": 14.48, "elapsed_time": "10:25:26", "remaining_time": "2 days, 13:34:10", "throughput": 26169.94, "total_tokens": 982056448} +{"current_steps": 3660, "total_steps": 25209, "loss": 1.1006, "lr": 4.278194763636904e-05, "epoch": 0.43556196865679414, "percentage": 14.52, "elapsed_time": "10:27:09", "remaining_time": "2 days, 13:32:31", "throughput": 26170.77, "total_tokens": 984791296} +{"current_steps": 3670, "total_steps": 25209, "loss": 1.0997, "lr": 4.276629551290354e-05, "epoch": 0.43675202868044655, "percentage": 14.56, "elapsed_time": "10:28:44", "remaining_time": "2 days, 13:30:05", "throughput": 26175.1, "total_tokens": 987453568} +{"current_steps": 3680, "total_steps": 25209, "loss": 1.1096, "lr": 4.2750660556247175e-05, "epoch": 0.437942088704099, "percentage": 14.6, "elapsed_time": "10:30:21", "remaining_time": "2 days, 13:27:44", "throughput": 26179.41, "total_tokens": 990136704} +{"current_steps": 3690, "total_steps": 25209, "loss": 1.1152, "lr": 4.273504273504274e-05, "epoch": 0.43913214872775147, "percentage": 14.64, "elapsed_time": "10:32:01", "remaining_time": "2 days, 13:25:49", "throughput": 26180.83, "total_tokens": 992825280} +{"current_steps": 3700, "total_steps": 25209, "loss": 1.1158, "lr": 4.271944201801317e-05, "epoch": 0.4403222087514039, "percentage": 14.68, "elapsed_time": "10:33:41", "remaining_time": "2 days, 13:23:46", "throughput": 26183.1, "total_tokens": 995512640} +{"current_steps": 3710, "total_steps": 25209, "loss": 1.1098, "lr": 4.270385837396127e-05, "epoch": 0.44151226877505634, "percentage": 14.72, "elapsed_time": "10:35:18", "remaining_time": "2 days, 13:21:32", "throughput": 26186.21, "total_tokens": 998180032} +{"current_steps": 3720, "total_steps": 25209, "loss": 1.1026, "lr": 4.268829177176945e-05, "epoch": 0.4427023287987088, "percentage": 14.76, "elapsed_time": "10:36:55", "remaining_time": "2 days, 13:19:14", "throughput": 26190.64, "total_tokens": 1000882688} +{"current_steps": 3730, "total_steps": 25209, "loss": 1.1122, "lr": 4.2672742180399455e-05, "epoch": 0.4438923888223612, "percentage": 14.8, "elapsed_time": "10:38:31", "remaining_time": "2 days, 13:16:53", "throughput": 26195.25, "total_tokens": 1003575232} +{"current_steps": 3740, "total_steps": 25209, "loss": 1.1237, "lr": 4.265720956889213e-05, "epoch": 0.44508244884601367, "percentage": 14.84, "elapsed_time": "10:40:12", "remaining_time": "2 days, 13:15:01", "throughput": 26197.6, "total_tokens": 1006314560} +{"current_steps": 3750, "total_steps": 25209, "loss": 1.1062, "lr": 4.2641693906367113e-05, "epoch": 0.44627250886966613, "percentage": 14.88, "elapsed_time": "10:41:52", "remaining_time": "2 days, 13:13:06", "throughput": 26199.25, "total_tokens": 1009009664} +{"current_steps": 3760, "total_steps": 25209, "loss": 1.1129, "lr": 4.2626195162022646e-05, "epoch": 0.44746256889331854, "percentage": 14.92, "elapsed_time": "10:43:31", "remaining_time": "2 days, 13:11:01", "throughput": 26201.76, "total_tokens": 1011693376} +{"current_steps": 3770, "total_steps": 25209, "loss": 1.116, "lr": 4.2610713305135255e-05, "epoch": 0.448652628916971, "percentage": 14.95, "elapsed_time": "10:45:08", "remaining_time": "2 days, 13:08:42", "throughput": 26205.42, "total_tokens": 1014362048} +{"current_steps": 3780, "total_steps": 25209, "loss": 1.0934, "lr": 4.2595248305059546e-05, "epoch": 0.44984268894062346, "percentage": 14.99, "elapsed_time": "10:46:43", "remaining_time": "2 days, 13:06:20", "throughput": 26209.13, "total_tokens": 1017011072} +{"current_steps": 3790, "total_steps": 25209, "loss": 1.1174, "lr": 4.2579800131227916e-05, "epoch": 0.45103274896427586, "percentage": 15.03, "elapsed_time": "10:48:20", "remaining_time": "2 days, 13:04:03", "throughput": 26212.64, "total_tokens": 1019681664} +{"current_steps": 3800, "total_steps": 25209, "loss": 1.1094, "lr": 4.256436875315028e-05, "epoch": 0.4522228089879283, "percentage": 15.07, "elapsed_time": "10:49:54", "remaining_time": "2 days, 13:01:33", "throughput": 26217.29, "total_tokens": 1022331776} +{"current_steps": 3810, "total_steps": 25209, "loss": 1.1091, "lr": 4.2548954140413895e-05, "epoch": 0.4534128690115808, "percentage": 15.11, "elapsed_time": "10:51:40", "remaining_time": "2 days, 13:00:09", "throughput": 26216.6, "total_tokens": 1025082304} +{"current_steps": 3820, "total_steps": 25209, "loss": 1.1041, "lr": 4.253355626268302e-05, "epoch": 0.4546029290352332, "percentage": 15.15, "elapsed_time": "10:53:21", "remaining_time": "2 days, 12:58:19", "throughput": 26217.23, "total_tokens": 1027763520} +{"current_steps": 3830, "total_steps": 25209, "loss": 1.1239, "lr": 4.2518175089698716e-05, "epoch": 0.45579298905888566, "percentage": 15.19, "elapsed_time": "10:55:02", "remaining_time": "2 days, 12:56:23", "throughput": 26218.24, "total_tokens": 1030431744} +{"current_steps": 3840, "total_steps": 25209, "loss": 1.11, "lr": 4.25028105912786e-05, "epoch": 0.4569830490825381, "percentage": 15.23, "elapsed_time": "10:56:40", "remaining_time": "2 days, 12:54:17", "throughput": 26222.1, "total_tokens": 1033161344} +{"current_steps": 3850, "total_steps": 25209, "loss": 1.1121, "lr": 4.2487462737316565e-05, "epoch": 0.4581731091061905, "percentage": 15.27, "elapsed_time": "10:58:15", "remaining_time": "2 days, 12:51:52", "throughput": 26226.54, "total_tokens": 1035830336} +{"current_steps": 3860, "total_steps": 25209, "loss": 1.1191, "lr": 4.2472131497782555e-05, "epoch": 0.459363169129843, "percentage": 15.31, "elapsed_time": "10:59:52", "remaining_time": "2 days, 12:49:40", "throughput": 26229.55, "total_tokens": 1038500352} +{"current_steps": 3870, "total_steps": 25209, "loss": 1.1082, "lr": 4.245681684272231e-05, "epoch": 0.46055322915349545, "percentage": 15.35, "elapsed_time": "11:01:27", "remaining_time": "2 days, 12:47:16", "throughput": 26234.18, "total_tokens": 1041173696} +{"current_steps": 3880, "total_steps": 25209, "loss": 1.1115, "lr": 4.244151874225712e-05, "epoch": 0.46174328917714785, "percentage": 15.39, "elapsed_time": "11:03:04", "remaining_time": "2 days, 12:45:01", "throughput": 26237.26, "total_tokens": 1043833408} +{"current_steps": 3890, "total_steps": 25209, "loss": 1.1078, "lr": 4.2426237166583596e-05, "epoch": 0.4629333492008003, "percentage": 15.43, "elapsed_time": "11:04:42", "remaining_time": "2 days, 12:42:52", "throughput": 26240.54, "total_tokens": 1046528704} +{"current_steps": 3900, "total_steps": 25209, "loss": 1.115, "lr": 4.241097208597339e-05, "epoch": 0.4641234092244528, "percentage": 15.47, "elapsed_time": "11:06:21", "remaining_time": "2 days, 12:40:50", "throughput": 26243.91, "total_tokens": 1049259520} +{"current_steps": 3910, "total_steps": 25209, "loss": 1.1197, "lr": 4.2395723470773005e-05, "epoch": 0.4653134692481052, "percentage": 15.51, "elapsed_time": "11:08:02", "remaining_time": "2 days, 12:38:59", "throughput": 26244.95, "total_tokens": 1051950976} +{"current_steps": 3920, "total_steps": 25209, "loss": 1.1116, "lr": 4.238049129140347e-05, "epoch": 0.46650352927175764, "percentage": 15.55, "elapsed_time": "11:09:35", "remaining_time": "2 days, 12:36:30", "throughput": 26249.75, "total_tokens": 1054607360} +{"current_steps": 3930, "total_steps": 25209, "loss": 1.0917, "lr": 4.236527551836022e-05, "epoch": 0.4676935892954101, "percentage": 15.59, "elapsed_time": "11:11:15", "remaining_time": "2 days, 12:34:32", "throughput": 26252.15, "total_tokens": 1057321088} +{"current_steps": 3940, "total_steps": 25209, "loss": 1.1054, "lr": 4.235007612221274e-05, "epoch": 0.4688836493190625, "percentage": 15.63, "elapsed_time": "11:12:53", "remaining_time": "2 days, 12:32:23", "throughput": 26255.06, "total_tokens": 1060002048} +{"current_steps": 3950, "total_steps": 25209, "loss": 1.1235, "lr": 4.2334893073604386e-05, "epoch": 0.470073709342715, "percentage": 15.67, "elapsed_time": "11:14:31", "remaining_time": "2 days, 12:30:18", "throughput": 26257.36, "total_tokens": 1062675136} +{"current_steps": 3960, "total_steps": 25209, "loss": 1.1157, "lr": 4.231972634325214e-05, "epoch": 0.47126376936636744, "percentage": 15.71, "elapsed_time": "11:16:07", "remaining_time": "2 days, 12:28:00", "throughput": 26261.3, "total_tokens": 1065351296} +{"current_steps": 3970, "total_steps": 25209, "loss": 1.115, "lr": 4.230457590194635e-05, "epoch": 0.47245382939001984, "percentage": 15.75, "elapsed_time": "11:17:48", "remaining_time": "2 days, 12:26:08", "throughput": 26262.61, "total_tokens": 1068049344} +{"current_steps": 3980, "total_steps": 25209, "loss": 1.1135, "lr": 4.228944172055053e-05, "epoch": 0.4736438894136723, "percentage": 15.79, "elapsed_time": "11:19:31", "remaining_time": "2 days, 12:24:33", "throughput": 26263.12, "total_tokens": 1070796160} +{"current_steps": 3990, "total_steps": 25209, "loss": 1.1062, "lr": 4.22743237700011e-05, "epoch": 0.47483394943732476, "percentage": 15.83, "elapsed_time": "11:21:12", "remaining_time": "2 days, 12:22:43", "throughput": 26264.36, "total_tokens": 1073497344} +{"current_steps": 4000, "total_steps": 25209, "loss": 1.1067, "lr": 4.225922202130716e-05, "epoch": 0.47602400946097717, "percentage": 15.87, "elapsed_time": "11:22:56", "remaining_time": "2 days, 12:21:09", "throughput": 26264.79, "total_tokens": 1076250112} +{"current_steps": 4010, "total_steps": 25209, "loss": 1.1036, "lr": 4.224413644555024e-05, "epoch": 0.47721406948462963, "percentage": 15.91, "elapsed_time": "11:24:31", "remaining_time": "2 days, 12:18:47", "throughput": 26269.25, "total_tokens": 1078928000} +{"current_steps": 4020, "total_steps": 25209, "loss": 1.0939, "lr": 4.222906701388411e-05, "epoch": 0.4784041295082821, "percentage": 15.95, "elapsed_time": "11:26:09", "remaining_time": "2 days, 12:16:41", "throughput": 26271.9, "total_tokens": 1081607232} +{"current_steps": 4030, "total_steps": 25209, "loss": 1.1158, "lr": 4.2214013697534466e-05, "epoch": 0.4795941895319345, "percentage": 15.99, "elapsed_time": "11:27:46", "remaining_time": "2 days, 12:14:30", "throughput": 26274.87, "total_tokens": 1084275776} +{"current_steps": 4040, "total_steps": 25209, "loss": 1.1155, "lr": 4.219897646779882e-05, "epoch": 0.48078424955558696, "percentage": 16.03, "elapsed_time": "11:29:25", "remaining_time": "2 days, 12:12:30", "throughput": 26277.72, "total_tokens": 1086996224} +{"current_steps": 4050, "total_steps": 25209, "loss": 1.1058, "lr": 4.2183955296046145e-05, "epoch": 0.4819743095792394, "percentage": 16.07, "elapsed_time": "11:31:02", "remaining_time": "2 days, 12:10:16", "throughput": 26282.11, "total_tokens": 1089711936} +{"current_steps": 4060, "total_steps": 25209, "loss": 1.1112, "lr": 4.2168950153716746e-05, "epoch": 0.48316436960289183, "percentage": 16.11, "elapsed_time": "11:32:41", "remaining_time": "2 days, 12:08:17", "throughput": 26283.8, "total_tokens": 1092386816} +{"current_steps": 4070, "total_steps": 25209, "loss": 1.105, "lr": 4.215396101232197e-05, "epoch": 0.4843544296265443, "percentage": 16.15, "elapsed_time": "11:34:15", "remaining_time": "2 days, 12:05:53", "throughput": 26287.75, "total_tokens": 1095033920} +{"current_steps": 4080, "total_steps": 25209, "loss": 1.1065, "lr": 4.213898784344398e-05, "epoch": 0.48554448965019675, "percentage": 16.18, "elapsed_time": "11:35:55", "remaining_time": "2 days, 12:03:59", "throughput": 26289.52, "total_tokens": 1097740992} +{"current_steps": 4090, "total_steps": 25209, "loss": 1.0991, "lr": 4.21240306187356e-05, "epoch": 0.48673454967384916, "percentage": 16.22, "elapsed_time": "11:37:34", "remaining_time": "2 days, 12:01:57", "throughput": 26291.8, "total_tokens": 1100422080} +{"current_steps": 4100, "total_steps": 25209, "loss": 1.099, "lr": 4.2109089309919967e-05, "epoch": 0.4879246096975016, "percentage": 16.26, "elapsed_time": "11:39:13", "remaining_time": "2 days, 11:59:59", "throughput": 26293.86, "total_tokens": 1103119296} +{"current_steps": 4110, "total_steps": 25209, "loss": 1.1025, "lr": 4.2094163888790445e-05, "epoch": 0.4891146697211541, "percentage": 16.3, "elapsed_time": "11:40:57", "remaining_time": "2 days, 11:58:26", "throughput": 26294.53, "total_tokens": 1105890240} +{"current_steps": 4120, "total_steps": 25209, "loss": 1.099, "lr": 4.2079254327210294e-05, "epoch": 0.4903047297448065, "percentage": 16.34, "elapsed_time": "11:42:33", "remaining_time": "2 days, 11:56:12", "throughput": 26298.34, "total_tokens": 1108578560} +{"current_steps": 4130, "total_steps": 25209, "loss": 1.0988, "lr": 4.206436059711249e-05, "epoch": 0.49149478976845895, "percentage": 16.38, "elapsed_time": "11:44:08", "remaining_time": "2 days, 11:53:51", "throughput": 26301.8, "total_tokens": 1111214656} +{"current_steps": 4140, "total_steps": 25209, "loss": 1.1024, "lr": 4.20494826704995e-05, "epoch": 0.4926848497921114, "percentage": 16.42, "elapsed_time": "11:45:47", "remaining_time": "2 days, 11:51:52", "throughput": 26304.91, "total_tokens": 1113947776} +{"current_steps": 4150, "total_steps": 25209, "loss": 1.1049, "lr": 4.203462051944307e-05, "epoch": 0.4938749098157638, "percentage": 16.46, "elapsed_time": "11:47:28", "remaining_time": "2 days, 11:50:04", "throughput": 26305.88, "total_tokens": 1116650752} +{"current_steps": 4160, "total_steps": 25209, "loss": 1.1056, "lr": 4.201977411608398e-05, "epoch": 0.4950649698394163, "percentage": 16.5, "elapsed_time": "11:49:05", "remaining_time": "2 days, 11:47:54", "throughput": 26309.06, "total_tokens": 1119336128} +{"current_steps": 4170, "total_steps": 25209, "loss": 1.1067, "lr": 4.200494343263185e-05, "epoch": 0.49625502986306874, "percentage": 16.54, "elapsed_time": "11:50:44", "remaining_time": "2 days, 11:45:53", "throughput": 26312.25, "total_tokens": 1122064512} +{"current_steps": 4180, "total_steps": 25209, "loss": 1.0989, "lr": 4.1990128441364914e-05, "epoch": 0.49744508988672115, "percentage": 16.58, "elapsed_time": "11:52:22", "remaining_time": "2 days, 11:43:53", "throughput": 26314.89, "total_tokens": 1124772096} +{"current_steps": 4190, "total_steps": 25209, "loss": 1.1007, "lr": 4.197532911462977e-05, "epoch": 0.4986351499103736, "percentage": 16.62, "elapsed_time": "11:54:00", "remaining_time": "2 days, 11:41:46", "throughput": 26318.23, "total_tokens": 1127477952} +{"current_steps": 4200, "total_steps": 25209, "loss": 1.1186, "lr": 4.196054542484125e-05, "epoch": 0.49982520993402607, "percentage": 16.66, "elapsed_time": "11:55:31", "remaining_time": "2 days, 11:39:09", "throughput": 26323.85, "total_tokens": 1130124992} +{"current_steps": 4210, "total_steps": 25209, "loss": 1.1022, "lr": 4.1945777344482084e-05, "epoch": 0.5010152699576785, "percentage": 16.7, "elapsed_time": "11:57:12", "remaining_time": "2 days, 11:37:20", "throughput": 26325.87, "total_tokens": 1132862464} +{"current_steps": 4220, "total_steps": 25209, "loss": 1.0943, "lr": 4.19310248461028e-05, "epoch": 0.5022053299813309, "percentage": 16.74, "elapsed_time": "11:58:53", "remaining_time": "2 days, 11:35:31", "throughput": 26327.07, "total_tokens": 1135573504} +{"current_steps": 4230, "total_steps": 25209, "loss": 1.0868, "lr": 4.1916287902321405e-05, "epoch": 0.5033953900049833, "percentage": 16.78, "elapsed_time": "12:00:29", "remaining_time": "2 days, 11:33:22", "throughput": 26330.49, "total_tokens": 1138266944} +{"current_steps": 4240, "total_steps": 25209, "loss": 1.0991, "lr": 4.190156648582328e-05, "epoch": 0.5045854500286359, "percentage": 16.82, "elapsed_time": "12:02:09", "remaining_time": "2 days, 11:31:26", "throughput": 26332.58, "total_tokens": 1140977856} +{"current_steps": 4250, "total_steps": 25209, "loss": 1.1032, "lr": 4.188686056936087e-05, "epoch": 0.5057755100522883, "percentage": 16.86, "elapsed_time": "12:03:47", "remaining_time": "2 days, 11:29:25", "throughput": 26335.63, "total_tokens": 1143698368} +{"current_steps": 4260, "total_steps": 25209, "loss": 1.1, "lr": 4.187217012575352e-05, "epoch": 0.5069655700759407, "percentage": 16.9, "elapsed_time": "12:05:27", "remaining_time": "2 days, 11:27:31", "throughput": 26337.01, "total_tokens": 1146383744} +{"current_steps": 4270, "total_steps": 25209, "loss": 1.1134, "lr": 4.185749512788727e-05, "epoch": 0.5081556300995932, "percentage": 16.94, "elapsed_time": "12:07:08", "remaining_time": "2 days, 11:25:45", "throughput": 26338.37, "total_tokens": 1149116672} +{"current_steps": 4280, "total_steps": 25209, "loss": 1.1005, "lr": 4.184283554871462e-05, "epoch": 0.5093456901232456, "percentage": 16.98, "elapsed_time": "12:08:47", "remaining_time": "2 days, 11:23:45", "throughput": 26341.12, "total_tokens": 1151832192} +{"current_steps": 4290, "total_steps": 25209, "loss": 1.0979, "lr": 4.1828191361254344e-05, "epoch": 0.510535750146898, "percentage": 17.02, "elapsed_time": "12:10:21", "remaining_time": "2 days, 11:21:21", "throughput": 26346.33, "total_tokens": 1154526272} +{"current_steps": 4300, "total_steps": 25209, "loss": 1.1043, "lr": 4.181356253859127e-05, "epoch": 0.5117258101705505, "percentage": 17.06, "elapsed_time": "12:11:54", "remaining_time": "2 days, 11:18:54", "throughput": 26351.35, "total_tokens": 1157196224} +{"current_steps": 4310, "total_steps": 25209, "loss": 1.1008, "lr": 4.179894905387606e-05, "epoch": 0.5129158701942029, "percentage": 17.1, "elapsed_time": "12:13:33", "remaining_time": "2 days, 11:16:58", "throughput": 26353.17, "total_tokens": 1159887744} +{"current_steps": 4320, "total_steps": 25209, "loss": 1.0987, "lr": 4.178435088032502e-05, "epoch": 0.5141059302178553, "percentage": 17.14, "elapsed_time": "12:15:10", "remaining_time": "2 days, 11:14:54", "throughput": 26356.14, "total_tokens": 1162590912} +{"current_steps": 4330, "total_steps": 25209, "loss": 1.0861, "lr": 4.176976799121989e-05, "epoch": 0.5152959902415079, "percentage": 17.18, "elapsed_time": "12:16:47", "remaining_time": "2 days, 11:12:47", "throughput": 26359.51, "total_tokens": 1165295744} +{"current_steps": 4340, "total_steps": 25209, "loss": 1.0832, "lr": 4.1755200359907657e-05, "epoch": 0.5164860502651603, "percentage": 17.22, "elapsed_time": "12:18:25", "remaining_time": "2 days, 11:10:44", "throughput": 26362.08, "total_tokens": 1167985408} +{"current_steps": 4350, "total_steps": 25209, "loss": 1.0996, "lr": 4.174064795980028e-05, "epoch": 0.5176761102888127, "percentage": 17.26, "elapsed_time": "12:20:02", "remaining_time": "2 days, 11:08:37", "throughput": 26365.6, "total_tokens": 1170698432} +{"current_steps": 4360, "total_steps": 25209, "loss": 1.1061, "lr": 4.17261107643746e-05, "epoch": 0.5188661703124652, "percentage": 17.3, "elapsed_time": "12:21:37", "remaining_time": "2 days, 11:06:22", "throughput": 26368.58, "total_tokens": 1173338624} +{"current_steps": 4370, "total_steps": 25209, "loss": 1.1005, "lr": 4.171158874717204e-05, "epoch": 0.5200562303361176, "percentage": 17.34, "elapsed_time": "12:23:11", "remaining_time": "2 days, 11:04:00", "throughput": 26373.08, "total_tokens": 1176010432} +{"current_steps": 4380, "total_steps": 25209, "loss": 1.0779, "lr": 4.169708188179844e-05, "epoch": 0.52124629035977, "percentage": 17.37, "elapsed_time": "12:24:46", "remaining_time": "2 days, 11:01:45", "throughput": 26375.74, "total_tokens": 1178638208} +{"current_steps": 4390, "total_steps": 25209, "loss": 1.1132, "lr": 4.1682590141923846e-05, "epoch": 0.5224363503834225, "percentage": 17.41, "elapsed_time": "12:26:24", "remaining_time": "2 days, 10:59:45", "throughput": 26378.3, "total_tokens": 1181345600} +{"current_steps": 4400, "total_steps": 25209, "loss": 1.0866, "lr": 4.1668113501282335e-05, "epoch": 0.5236264104070749, "percentage": 17.45, "elapsed_time": "12:28:00", "remaining_time": "2 days, 10:57:34", "throughput": 26381.29, "total_tokens": 1184009728} +{"current_steps": 4410, "total_steps": 25209, "loss": 1.0962, "lr": 4.165365193367178e-05, "epoch": 0.5248164704307273, "percentage": 17.49, "elapsed_time": "12:29:37", "remaining_time": "2 days, 10:55:28", "throughput": 26383.47, "total_tokens": 1186659584} +{"current_steps": 4420, "total_steps": 25209, "loss": 1.1007, "lr": 4.163920541295369e-05, "epoch": 0.5260065304543798, "percentage": 17.53, "elapsed_time": "12:31:15", "remaining_time": "2 days, 10:53:29", "throughput": 26385.61, "total_tokens": 1189355968} +{"current_steps": 4430, "total_steps": 25209, "loss": 1.0936, "lr": 4.1624773913052946e-05, "epoch": 0.5271965904780322, "percentage": 17.57, "elapsed_time": "12:32:53", "remaining_time": "2 days, 10:51:27", "throughput": 26388.08, "total_tokens": 1192042368} +{"current_steps": 4440, "total_steps": 25209, "loss": 1.0914, "lr": 4.161035740795769e-05, "epoch": 0.5283866505016847, "percentage": 17.61, "elapsed_time": "12:34:31", "remaining_time": "2 days, 10:49:24", "throughput": 26390.77, "total_tokens": 1194737152} +{"current_steps": 4450, "total_steps": 25209, "loss": 1.1014, "lr": 4.1595955871719055e-05, "epoch": 0.5295767105253372, "percentage": 17.65, "elapsed_time": "12:36:08", "remaining_time": "2 days, 10:47:19", "throughput": 26393.42, "total_tokens": 1197419200} +{"current_steps": 4460, "total_steps": 25209, "loss": 1.1142, "lr": 4.158156927845101e-05, "epoch": 0.5307667705489896, "percentage": 17.69, "elapsed_time": "12:37:43", "remaining_time": "2 days, 10:45:09", "throughput": 26396.82, "total_tokens": 1200104960} +{"current_steps": 4470, "total_steps": 25209, "loss": 1.1062, "lr": 4.156719760233016e-05, "epoch": 0.531956830572642, "percentage": 17.73, "elapsed_time": "12:39:22", "remaining_time": "2 days, 10:43:11", "throughput": 26399.28, "total_tokens": 1202817216} +{"current_steps": 4480, "total_steps": 25209, "loss": 1.081, "lr": 4.155284081759552e-05, "epoch": 0.5331468905962945, "percentage": 17.77, "elapsed_time": "12:40:59", "remaining_time": "2 days, 10:41:04", "throughput": 26402.13, "total_tokens": 1205496384} +{"current_steps": 4490, "total_steps": 25209, "loss": 1.0913, "lr": 4.1538498898548356e-05, "epoch": 0.5343369506199469, "percentage": 17.81, "elapsed_time": "12:42:40", "remaining_time": "2 days, 10:39:21", "throughput": 26404.26, "total_tokens": 1208278016} +{"current_steps": 4500, "total_steps": 25209, "loss": 1.103, "lr": 4.1524171819552e-05, "epoch": 0.5355270106435993, "percentage": 17.85, "elapsed_time": "12:44:16", "remaining_time": "2 days, 10:37:13", "throughput": 26407.29, "total_tokens": 1210958528} +{"current_steps": 4510, "total_steps": 25209, "loss": 1.1052, "lr": 4.15098595550316e-05, "epoch": 0.5367170706672518, "percentage": 17.89, "elapsed_time": "12:45:58", "remaining_time": "2 days, 10:35:30", "throughput": 26408.58, "total_tokens": 1213701440} +{"current_steps": 4520, "total_steps": 25209, "loss": 1.1181, "lr": 4.1495562079474e-05, "epoch": 0.5379071306909042, "percentage": 17.93, "elapsed_time": "12:47:35", "remaining_time": "2 days, 10:33:27", "throughput": 26411.81, "total_tokens": 1216420864} +{"current_steps": 4530, "total_steps": 25209, "loss": 1.1089, "lr": 4.148127936742749e-05, "epoch": 0.5390971907145566, "percentage": 17.97, "elapsed_time": "12:49:20", "remaining_time": "2 days, 10:31:56", "throughput": 26411.91, "total_tokens": 1219178816} +{"current_steps": 4540, "total_steps": 25209, "loss": 1.1026, "lr": 4.146701139350166e-05, "epoch": 0.5402872507382092, "percentage": 18.01, "elapsed_time": "12:50:56", "remaining_time": "2 days, 10:29:50", "throughput": 26415.28, "total_tokens": 1221886720} +{"current_steps": 4550, "total_steps": 25209, "loss": 1.0966, "lr": 4.1452758132367196e-05, "epoch": 0.5414773107618616, "percentage": 18.05, "elapsed_time": "12:52:32", "remaining_time": "2 days, 10:27:41", "throughput": 26418.7, "total_tokens": 1224576832} +{"current_steps": 4560, "total_steps": 25209, "loss": 1.1033, "lr": 4.1438519558755656e-05, "epoch": 0.542667370785514, "percentage": 18.09, "elapsed_time": "12:54:10", "remaining_time": "2 days, 10:25:40", "throughput": 26420.8, "total_tokens": 1227256448} +{"current_steps": 4570, "total_steps": 25209, "loss": 1.0704, "lr": 4.1424295647459336e-05, "epoch": 0.5438574308091665, "percentage": 18.13, "elapsed_time": "12:55:49", "remaining_time": "2 days, 10:23:48", "throughput": 26422.92, "total_tokens": 1229984768} +{"current_steps": 4580, "total_steps": 25209, "loss": 1.0976, "lr": 4.141008637333106e-05, "epoch": 0.5450474908328189, "percentage": 18.17, "elapsed_time": "12:57:30", "remaining_time": "2 days, 10:22:02", "throughput": 26424.47, "total_tokens": 1232726400} +{"current_steps": 4590, "total_steps": 25209, "loss": 1.0859, "lr": 4.1395891711283974e-05, "epoch": 0.5462375508564713, "percentage": 18.21, "elapsed_time": "12:59:07", "remaining_time": "2 days, 10:19:56", "throughput": 26426.68, "total_tokens": 1235379072} +{"current_steps": 4600, "total_steps": 25209, "loss": 1.0864, "lr": 4.1381711636291395e-05, "epoch": 0.5474276108801238, "percentage": 18.25, "elapsed_time": "13:00:45", "remaining_time": "2 days, 10:17:57", "throughput": 26428.69, "total_tokens": 1238062848} +{"current_steps": 4610, "total_steps": 25209, "loss": 1.0876, "lr": 4.1367546123386604e-05, "epoch": 0.5486176709037762, "percentage": 18.29, "elapsed_time": "13:02:22", "remaining_time": "2 days, 10:15:53", "throughput": 26431.41, "total_tokens": 1240748864} +{"current_steps": 4620, "total_steps": 25209, "loss": 1.0988, "lr": 4.1353395147662673e-05, "epoch": 0.5498077309274286, "percentage": 18.33, "elapsed_time": "13:03:59", "remaining_time": "2 days, 10:13:52", "throughput": 26434.26, "total_tokens": 1243464896} +{"current_steps": 4630, "total_steps": 25209, "loss": 1.0909, "lr": 4.133925868427225e-05, "epoch": 0.5509977909510811, "percentage": 18.37, "elapsed_time": "13:05:38", "remaining_time": "2 days, 10:11:58", "throughput": 26435.67, "total_tokens": 1246149504} +{"current_steps": 4640, "total_steps": 25209, "loss": 1.1009, "lr": 4.132513670842744e-05, "epoch": 0.5521878509747336, "percentage": 18.41, "elapsed_time": "13:07:14", "remaining_time": "2 days, 10:09:47", "throughput": 26438.98, "total_tokens": 1248818944} +{"current_steps": 4650, "total_steps": 25209, "loss": 1.0865, "lr": 4.1311029195399534e-05, "epoch": 0.553377910998386, "percentage": 18.45, "elapsed_time": "13:08:50", "remaining_time": "2 days, 10:07:41", "throughput": 26441.63, "total_tokens": 1251491328} +{"current_steps": 4660, "total_steps": 25209, "loss": 1.0849, "lr": 4.129693612051892e-05, "epoch": 0.5545679710220385, "percentage": 18.49, "elapsed_time": "13:10:24", "remaining_time": "2 days, 10:05:25", "throughput": 26445.27, "total_tokens": 1254150464} +{"current_steps": 4670, "total_steps": 25209, "loss": 1.0889, "lr": 4.1282857459174826e-05, "epoch": 0.5557580310456909, "percentage": 18.53, "elapsed_time": "13:11:59", "remaining_time": "2 days, 10:03:13", "throughput": 26448.21, "total_tokens": 1256801728} +{"current_steps": 4680, "total_steps": 25209, "loss": 1.0928, "lr": 4.1268793186815184e-05, "epoch": 0.5569480910693433, "percentage": 18.56, "elapsed_time": "13:13:33", "remaining_time": "2 days, 10:00:57", "throughput": 26452.31, "total_tokens": 1259478400} +{"current_steps": 4690, "total_steps": 25209, "loss": 1.0926, "lr": 4.1254743278946456e-05, "epoch": 0.5581381510929958, "percentage": 18.6, "elapsed_time": "13:15:09", "remaining_time": "2 days, 9:58:51", "throughput": 26454.82, "total_tokens": 1262146048} +{"current_steps": 4700, "total_steps": 25209, "loss": 1.0981, "lr": 4.1240707711133394e-05, "epoch": 0.5593282111166482, "percentage": 18.64, "elapsed_time": "13:16:51", "remaining_time": "2 days, 9:57:11", "throughput": 26455.44, "total_tokens": 1264879104} +{"current_steps": 4710, "total_steps": 25209, "loss": 1.1003, "lr": 4.122668645899893e-05, "epoch": 0.5605182711403006, "percentage": 18.68, "elapsed_time": "13:18:27", "remaining_time": "2 days, 9:55:04", "throughput": 26458.45, "total_tokens": 1267556928} +{"current_steps": 4720, "total_steps": 25209, "loss": 1.0923, "lr": 4.1212679498223975e-05, "epoch": 0.5617083311639531, "percentage": 18.72, "elapsed_time": "13:20:04", "remaining_time": "2 days, 9:53:04", "throughput": 26460.54, "total_tokens": 1270237824} +{"current_steps": 4730, "total_steps": 25209, "loss": 1.0932, "lr": 4.1198686804547215e-05, "epoch": 0.5628983911876055, "percentage": 18.76, "elapsed_time": "13:21:44", "remaining_time": "2 days, 9:51:11", "throughput": 26462.76, "total_tokens": 1272965568} +{"current_steps": 4740, "total_steps": 25209, "loss": 1.1016, "lr": 4.118470835376499e-05, "epoch": 0.564088451211258, "percentage": 18.8, "elapsed_time": "13:23:18", "remaining_time": "2 days, 9:48:57", "throughput": 26466.42, "total_tokens": 1275635456} +{"current_steps": 4750, "total_steps": 25209, "loss": 1.095, "lr": 4.117074412173107e-05, "epoch": 0.5652785112349105, "percentage": 18.84, "elapsed_time": "13:24:54", "remaining_time": "2 days, 9:46:53", "throughput": 26469.66, "total_tokens": 1278348224} +{"current_steps": 4760, "total_steps": 25209, "loss": 1.0964, "lr": 4.115679408435648e-05, "epoch": 0.5664685712585629, "percentage": 18.88, "elapsed_time": "13:26:27", "remaining_time": "2 days, 9:44:34", "throughput": 26473.7, "total_tokens": 1281001664} +{"current_steps": 4770, "total_steps": 25209, "loss": 1.0912, "lr": 4.114285821760937e-05, "epoch": 0.5676586312822153, "percentage": 18.92, "elapsed_time": "13:28:05", "remaining_time": "2 days, 9:42:36", "throughput": 26476.06, "total_tokens": 1283709440} +{"current_steps": 4780, "total_steps": 25209, "loss": 1.0691, "lr": 4.11289364975148e-05, "epoch": 0.5688486913058678, "percentage": 18.96, "elapsed_time": "13:29:42", "remaining_time": "2 days, 9:40:35", "throughput": 26479.04, "total_tokens": 1286423424} +{"current_steps": 4790, "total_steps": 25209, "loss": 1.0994, "lr": 4.111502890015456e-05, "epoch": 0.5700387513295202, "percentage": 19.0, "elapsed_time": "13:31:25", "remaining_time": "2 days, 9:38:56", "throughput": 26479.68, "total_tokens": 1289164672} +{"current_steps": 4800, "total_steps": 25209, "loss": 1.0866, "lr": 4.1101135401667056e-05, "epoch": 0.5712288113531726, "percentage": 19.04, "elapsed_time": "13:32:56", "remaining_time": "2 days, 9:36:33", "throughput": 26484.16, "total_tokens": 1291816896} +{"current_steps": 4810, "total_steps": 25209, "loss": 1.0947, "lr": 4.108725597824708e-05, "epoch": 0.5724188713768251, "percentage": 19.08, "elapsed_time": "13:34:37", "remaining_time": "2 days, 9:34:47", "throughput": 26484.85, "total_tokens": 1294515648} +{"current_steps": 4820, "total_steps": 25209, "loss": 1.1016, "lr": 4.107339060614564e-05, "epoch": 0.5736089314004775, "percentage": 19.12, "elapsed_time": "13:36:15", "remaining_time": "2 days, 9:32:50", "throughput": 26487.17, "total_tokens": 1297224064} +{"current_steps": 4830, "total_steps": 25209, "loss": 1.0851, "lr": 4.1059539261669825e-05, "epoch": 0.5747989914241299, "percentage": 19.16, "elapsed_time": "13:37:56", "remaining_time": "2 days, 9:31:07", "throughput": 26487.73, "total_tokens": 1299934336} +{"current_steps": 4840, "total_steps": 25209, "loss": 1.1048, "lr": 4.104570192118262e-05, "epoch": 0.5759890514477825, "percentage": 19.2, "elapsed_time": "13:39:34", "remaining_time": "2 days, 9:29:11", "throughput": 26489.17, "total_tokens": 1302602880} +{"current_steps": 4850, "total_steps": 25209, "loss": 1.0982, "lr": 4.1031878561102714e-05, "epoch": 0.5771791114714349, "percentage": 19.24, "elapsed_time": "13:41:14", "remaining_time": "2 days, 9:27:21", "throughput": 26490.69, "total_tokens": 1305317312} +{"current_steps": 4860, "total_steps": 25209, "loss": 1.0846, "lr": 4.1018069157904385e-05, "epoch": 0.5783691714950873, "percentage": 19.28, "elapsed_time": "13:42:53", "remaining_time": "2 days, 9:25:28", "throughput": 26492.6, "total_tokens": 1308031168} +{"current_steps": 4870, "total_steps": 25209, "loss": 1.097, "lr": 4.100427368811727e-05, "epoch": 0.5795592315187398, "percentage": 19.32, "elapsed_time": "13:44:32", "remaining_time": "2 days, 9:23:35", "throughput": 26495.12, "total_tokens": 1310772352} +{"current_steps": 4880, "total_steps": 25209, "loss": 1.084, "lr": 4.099049212832622e-05, "epoch": 0.5807492915423922, "percentage": 19.36, "elapsed_time": "13:46:07", "remaining_time": "2 days, 9:21:27", "throughput": 26498.07, "total_tokens": 1313448000} +{"current_steps": 4890, "total_steps": 25209, "loss": 1.078, "lr": 4.0976724455171155e-05, "epoch": 0.5819393515660446, "percentage": 19.4, "elapsed_time": "13:47:45", "remaining_time": "2 days, 9:19:31", "throughput": 26500.97, "total_tokens": 1316190592} +{"current_steps": 4900, "total_steps": 25209, "loss": 1.0967, "lr": 4.096297064534688e-05, "epoch": 0.583129411589697, "percentage": 19.44, "elapsed_time": "13:49:24", "remaining_time": "2 days, 9:17:37", "throughput": 26502.68, "total_tokens": 1318885696} +{"current_steps": 4910, "total_steps": 25209, "loss": 1.0984, "lr": 4.0949230675602904e-05, "epoch": 0.5843194716133495, "percentage": 19.48, "elapsed_time": "13:50:59", "remaining_time": "2 days, 9:15:30", "throughput": 26504.83, "total_tokens": 1321524288} +{"current_steps": 4920, "total_steps": 25209, "loss": 1.0724, "lr": 4.09355045227433e-05, "epoch": 0.5855095316370019, "percentage": 19.52, "elapsed_time": "13:52:37", "remaining_time": "2 days, 9:13:33", "throughput": 26506.85, "total_tokens": 1324211200} +{"current_steps": 4930, "total_steps": 25209, "loss": 1.0991, "lr": 4.092179216362654e-05, "epoch": 0.5866995916606543, "percentage": 19.56, "elapsed_time": "13:54:06", "remaining_time": "2 days, 9:11:02", "throughput": 26511.69, "total_tokens": 1326827904} +{"current_steps": 4940, "total_steps": 25209, "loss": 1.0936, "lr": 4.090809357516532e-05, "epoch": 0.5878896516843068, "percentage": 19.6, "elapsed_time": "13:55:40", "remaining_time": "2 days, 9:08:49", "throughput": 26514.76, "total_tokens": 1329472320} +{"current_steps": 4950, "total_steps": 25209, "loss": 1.0802, "lr": 4.089440873432638e-05, "epoch": 0.5890797117079593, "percentage": 19.64, "elapsed_time": "13:57:19", "remaining_time": "2 days, 9:06:55", "throughput": 26516.72, "total_tokens": 1332176512} +{"current_steps": 4960, "total_steps": 25209, "loss": 1.0858, "lr": 4.088073761813037e-05, "epoch": 0.5902697717316117, "percentage": 19.68, "elapsed_time": "13:58:50", "remaining_time": "2 days, 9:04:32", "throughput": 26520.46, "total_tokens": 1334788928} +{"current_steps": 4970, "total_steps": 25209, "loss": 1.1029, "lr": 4.086708020365172e-05, "epoch": 0.5914598317552642, "percentage": 19.72, "elapsed_time": "14:00:28", "remaining_time": "2 days, 9:02:36", "throughput": 26522.42, "total_tokens": 1337484928} +{"current_steps": 4980, "total_steps": 25209, "loss": 1.085, "lr": 4.0853436468018354e-05, "epoch": 0.5926498917789166, "percentage": 19.75, "elapsed_time": "14:02:05", "remaining_time": "2 days, 9:00:35", "throughput": 26525.66, "total_tokens": 1340212544} +{"current_steps": 4990, "total_steps": 25209, "loss": 1.0904, "lr": 4.0839806388411686e-05, "epoch": 0.593839951802569, "percentage": 19.79, "elapsed_time": "14:03:42", "remaining_time": "2 days, 8:58:36", "throughput": 26527.99, "total_tokens": 1342904320} +{"current_steps": 5000, "total_steps": 25209, "loss": 1.0972, "lr": 4.0826189942066346e-05, "epoch": 0.5950300118262215, "percentage": 19.83, "elapsed_time": "14:05:19", "remaining_time": "2 days, 8:56:38", "throughput": 26530.5, "total_tokens": 1345616192} +{"current_steps": 5000, "total_steps": 25209, "eval_loss": 1.0117703676223755, "epoch": 0.5950300118262215, "percentage": 19.83, "elapsed_time": "14:05:21", "remaining_time": "2 days, 8:56:46", "throughput": 26529.45, "total_tokens": 1345616192} +{"current_steps": 5010, "total_steps": 25209, "loss": 1.0796, "lr": 4.081258710627008e-05, "epoch": 0.5962200718498739, "percentage": 19.87, "elapsed_time": "14:07:31", "remaining_time": "2 days, 8:56:59", "throughput": 26515.62, "total_tokens": 1348357440} +{"current_steps": 5020, "total_steps": 25209, "loss": 1.0865, "lr": 4.0798997858363557e-05, "epoch": 0.5974101318735263, "percentage": 19.91, "elapsed_time": "14:09:11", "remaining_time": "2 days, 8:55:12", "throughput": 26516.49, "total_tokens": 1351055808} +{"current_steps": 5030, "total_steps": 25209, "loss": 1.0922, "lr": 4.078542217574024e-05, "epoch": 0.5986001918971788, "percentage": 19.95, "elapsed_time": "14:10:51", "remaining_time": "2 days, 8:53:23", "throughput": 26517.5, "total_tokens": 1353750464} +{"current_steps": 5040, "total_steps": 25209, "loss": 1.0786, "lr": 4.0771860035846196e-05, "epoch": 0.5997902519208312, "percentage": 19.99, "elapsed_time": "14:12:24", "remaining_time": "2 days, 8:51:10", "throughput": 26520.42, "total_tokens": 1356381120} +{"current_steps": 5050, "total_steps": 25209, "loss": 1.077, "lr": 4.0758311416179965e-05, "epoch": 0.6009803119444836, "percentage": 20.03, "elapsed_time": "14:13:59", "remaining_time": "2 days, 8:49:02", "throughput": 26523.95, "total_tokens": 1359080640} +{"current_steps": 5060, "total_steps": 25209, "loss": 1.0805, "lr": 4.0744776294292386e-05, "epoch": 0.6021703719681362, "percentage": 20.07, "elapsed_time": "14:15:38", "remaining_time": "2 days, 8:47:11", "throughput": 26525.8, "total_tokens": 1361798144} +{"current_steps": 5070, "total_steps": 25209, "loss": 1.078, "lr": 4.073125464778646e-05, "epoch": 0.6033604319917886, "percentage": 20.11, "elapsed_time": "14:17:18", "remaining_time": "2 days, 8:45:24", "throughput": 26527.23, "total_tokens": 1364529152} +{"current_steps": 5080, "total_steps": 25209, "loss": 1.0895, "lr": 4.071774645431717e-05, "epoch": 0.604550492015441, "percentage": 20.15, "elapsed_time": "14:18:51", "remaining_time": "2 days, 8:43:08", "throughput": 26530.84, "total_tokens": 1367174400} +{"current_steps": 5090, "total_steps": 25209, "loss": 1.0829, "lr": 4.070425169159135e-05, "epoch": 0.6057405520390935, "percentage": 20.19, "elapsed_time": "14:20:33", "remaining_time": "2 days, 8:41:27", "throughput": 26532.72, "total_tokens": 1369967168} +{"current_steps": 5100, "total_steps": 25209, "loss": 1.1017, "lr": 4.069077033736751e-05, "epoch": 0.6069306120627459, "percentage": 20.23, "elapsed_time": "14:22:03", "remaining_time": "2 days, 8:39:04", "throughput": 26537.31, "total_tokens": 1372615296} +{"current_steps": 5110, "total_steps": 25209, "loss": 1.0888, "lr": 4.06773023694557e-05, "epoch": 0.6081206720863983, "percentage": 20.27, "elapsed_time": "14:23:44", "remaining_time": "2 days, 8:37:20", "throughput": 26538.23, "total_tokens": 1375339392} +{"current_steps": 5120, "total_steps": 25209, "loss": 1.0866, "lr": 4.066384776571732e-05, "epoch": 0.6093107321100508, "percentage": 20.31, "elapsed_time": "14:25:19", "remaining_time": "2 days, 8:35:13", "throughput": 26541.13, "total_tokens": 1378007744} +{"current_steps": 5130, "total_steps": 25209, "loss": 1.099, "lr": 4.065040650406504e-05, "epoch": 0.6105007921337032, "percentage": 20.35, "elapsed_time": "14:26:55", "remaining_time": "2 days, 8:33:09", "throughput": 26544.24, "total_tokens": 1380703296} +{"current_steps": 5140, "total_steps": 25209, "loss": 1.0862, "lr": 4.0636978562462576e-05, "epoch": 0.6116908521573556, "percentage": 20.39, "elapsed_time": "14:28:33", "remaining_time": "2 days, 8:31:14", "throughput": 26546.06, "total_tokens": 1383399808} +{"current_steps": 5150, "total_steps": 25209, "loss": 1.096, "lr": 4.062356391892456e-05, "epoch": 0.6128809121810082, "percentage": 20.43, "elapsed_time": "14:30:03", "remaining_time": "2 days, 8:28:50", "throughput": 26550.44, "total_tokens": 1386027456} +{"current_steps": 5160, "total_steps": 25209, "loss": 1.0958, "lr": 4.0610162551516395e-05, "epoch": 0.6140709722046606, "percentage": 20.47, "elapsed_time": "14:31:43", "remaining_time": "2 days, 8:27:03", "throughput": 26551.55, "total_tokens": 1388736704} +{"current_steps": 5170, "total_steps": 25209, "loss": 1.1023, "lr": 4.059677443835412e-05, "epoch": 0.615261032228313, "percentage": 20.51, "elapsed_time": "14:33:22", "remaining_time": "2 days, 8:25:11", "throughput": 26553.91, "total_tokens": 1391480960} +{"current_steps": 5180, "total_steps": 25209, "loss": 1.0899, "lr": 4.058339955760423e-05, "epoch": 0.6164510922519655, "percentage": 20.55, "elapsed_time": "14:34:56", "remaining_time": "2 days, 8:23:04", "throughput": 26556.86, "total_tokens": 1394154496} +{"current_steps": 5190, "total_steps": 25209, "loss": 1.0896, "lr": 4.0570037887483535e-05, "epoch": 0.6176411522756179, "percentage": 20.59, "elapsed_time": "14:36:32", "remaining_time": "2 days, 8:21:01", "throughput": 26559.45, "total_tokens": 1396833600} +{"current_steps": 5200, "total_steps": 25209, "loss": 1.0744, "lr": 4.0556689406259025e-05, "epoch": 0.6188312122992703, "percentage": 20.63, "elapsed_time": "14:38:11", "remaining_time": "2 days, 8:19:12", "throughput": 26560.51, "total_tokens": 1399526080} +{"current_steps": 5210, "total_steps": 25209, "loss": 1.0794, "lr": 4.054335409224771e-05, "epoch": 0.6200212723229228, "percentage": 20.67, "elapsed_time": "14:39:50", "remaining_time": "2 days, 8:17:22", "throughput": 26561.33, "total_tokens": 1402196096} +{"current_steps": 5220, "total_steps": 25209, "loss": 1.0815, "lr": 4.053003192381646e-05, "epoch": 0.6212113323465752, "percentage": 20.71, "elapsed_time": "14:41:34", "remaining_time": "2 days, 8:15:49", "throughput": 26561.84, "total_tokens": 1404972096} +{"current_steps": 5230, "total_steps": 25209, "loss": 1.087, "lr": 4.051672287938189e-05, "epoch": 0.6224013923702276, "percentage": 20.75, "elapsed_time": "14:43:10", "remaining_time": "2 days, 8:13:47", "throughput": 26563.72, "total_tokens": 1407624448} +{"current_steps": 5240, "total_steps": 25209, "loss": 1.0764, "lr": 4.050342693741019e-05, "epoch": 0.6235914523938801, "percentage": 20.79, "elapsed_time": "14:44:47", "remaining_time": "2 days, 8:11:49", "throughput": 26566.46, "total_tokens": 1410342720} +{"current_steps": 5250, "total_steps": 25209, "loss": 1.0846, "lr": 4.049014407641699e-05, "epoch": 0.6247815124175325, "percentage": 20.83, "elapsed_time": "14:46:25", "remaining_time": "2 days, 8:09:54", "throughput": 26567.83, "total_tokens": 1413015680} +{"current_steps": 5260, "total_steps": 25209, "loss": 1.0683, "lr": 4.047687427496717e-05, "epoch": 0.625971572441185, "percentage": 20.87, "elapsed_time": "14:48:05", "remaining_time": "2 days, 8:08:09", "throughput": 26568.99, "total_tokens": 1415736448} +{"current_steps": 5270, "total_steps": 25209, "loss": 1.0801, "lr": 4.046361751167479e-05, "epoch": 0.6271616324648375, "percentage": 20.91, "elapsed_time": "14:49:44", "remaining_time": "2 days, 8:06:19", "throughput": 26570.51, "total_tokens": 1418452352} +{"current_steps": 5280, "total_steps": 25209, "loss": 1.0794, "lr": 4.045037376520292e-05, "epoch": 0.6283516924884899, "percentage": 20.94, "elapsed_time": "14:51:24", "remaining_time": "2 days, 8:04:32", "throughput": 26572.25, "total_tokens": 1421198080} +{"current_steps": 5290, "total_steps": 25209, "loss": 1.0893, "lr": 4.043714301426344e-05, "epoch": 0.6295417525121423, "percentage": 20.98, "elapsed_time": "14:52:59", "remaining_time": "2 days, 8:02:29", "throughput": 26574.82, "total_tokens": 1423874176} +{"current_steps": 5300, "total_steps": 25209, "loss": 1.0923, "lr": 4.042392523761696e-05, "epoch": 0.6307318125357948, "percentage": 21.02, "elapsed_time": "14:54:36", "remaining_time": "2 days, 8:00:30", "throughput": 26576.95, "total_tokens": 1426555776} +{"current_steps": 5310, "total_steps": 25209, "loss": 1.0883, "lr": 4.041072041407267e-05, "epoch": 0.6319218725594472, "percentage": 21.06, "elapsed_time": "14:56:16", "remaining_time": "2 days, 7:58:43", "throughput": 26577.67, "total_tokens": 1429244672} +{"current_steps": 5320, "total_steps": 25209, "loss": 1.0822, "lr": 4.039752852248815e-05, "epoch": 0.6331119325830996, "percentage": 21.1, "elapsed_time": "14:57:54", "remaining_time": "2 days, 7:56:50", "throughput": 26579.44, "total_tokens": 1431945984} +{"current_steps": 5330, "total_steps": 25209, "loss": 1.0998, "lr": 4.0384349541769286e-05, "epoch": 0.6343019926067521, "percentage": 21.14, "elapsed_time": "14:59:30", "remaining_time": "2 days, 7:54:52", "throughput": 26581.7, "total_tokens": 1434640512} +{"current_steps": 5340, "total_steps": 25209, "loss": 1.0835, "lr": 4.037118345087011e-05, "epoch": 0.6354920526304045, "percentage": 21.18, "elapsed_time": "15:01:09", "remaining_time": "2 days, 7:53:00", "throughput": 26583.68, "total_tokens": 1437359552} +{"current_steps": 5350, "total_steps": 25209, "loss": 1.0861, "lr": 4.0358030228792636e-05, "epoch": 0.6366821126540569, "percentage": 21.22, "elapsed_time": "15:02:42", "remaining_time": "2 days, 7:50:49", "throughput": 26586.64, "total_tokens": 1440002752} +{"current_steps": 5360, "total_steps": 25209, "loss": 1.0878, "lr": 4.034488985458673e-05, "epoch": 0.6378721726777095, "percentage": 21.26, "elapsed_time": "15:04:21", "remaining_time": "2 days, 7:49:00", "throughput": 26588.33, "total_tokens": 1442726912} +{"current_steps": 5370, "total_steps": 25209, "loss": 1.0835, "lr": 4.033176230735001e-05, "epoch": 0.6390622327013619, "percentage": 21.3, "elapsed_time": "15:06:01", "remaining_time": "2 days, 7:47:12", "throughput": 26589.66, "total_tokens": 1445441408} +{"current_steps": 5380, "total_steps": 25209, "loss": 1.0905, "lr": 4.0318647566227626e-05, "epoch": 0.6402522927250143, "percentage": 21.34, "elapsed_time": "15:07:37", "remaining_time": "2 days, 7:45:12", "throughput": 26592.17, "total_tokens": 1448138880} +{"current_steps": 5390, "total_steps": 25209, "loss": 1.0917, "lr": 4.0305545610412205e-05, "epoch": 0.6414423527486668, "percentage": 21.38, "elapsed_time": "15:09:13", "remaining_time": "2 days, 7:43:13", "throughput": 26594.66, "total_tokens": 1450835328} +{"current_steps": 5400, "total_steps": 25209, "loss": 1.0846, "lr": 4.029245641914365e-05, "epoch": 0.6426324127723192, "percentage": 21.42, "elapsed_time": "15:10:50", "remaining_time": "2 days, 7:41:17", "throughput": 26596.25, "total_tokens": 1453505664} +{"current_steps": 5410, "total_steps": 25209, "loss": 1.0935, "lr": 4.027937997170904e-05, "epoch": 0.6438224727959716, "percentage": 21.46, "elapsed_time": "15:12:23", "remaining_time": "2 days, 7:39:05", "throughput": 26599.7, "total_tokens": 1456163392} +{"current_steps": 5420, "total_steps": 25209, "loss": 1.0865, "lr": 4.026631624744247e-05, "epoch": 0.6450125328196241, "percentage": 21.5, "elapsed_time": "15:13:58", "remaining_time": "2 days, 7:37:02", "throughput": 26602.21, "total_tokens": 1458837568} +{"current_steps": 5430, "total_steps": 25209, "loss": 1.0879, "lr": 4.025326522572493e-05, "epoch": 0.6462025928432765, "percentage": 21.54, "elapsed_time": "15:15:36", "remaining_time": "2 days, 7:35:07", "throughput": 26604.45, "total_tokens": 1461546368} +{"current_steps": 5440, "total_steps": 25209, "loss": 1.0958, "lr": 4.024022688598415e-05, "epoch": 0.6473926528669289, "percentage": 21.58, "elapsed_time": "15:17:10", "remaining_time": "2 days, 7:33:02", "throughput": 26607.43, "total_tokens": 1464226176} +{"current_steps": 5450, "total_steps": 25209, "loss": 1.0919, "lr": 4.0227201207694494e-05, "epoch": 0.6485827128905814, "percentage": 21.62, "elapsed_time": "15:18:48", "remaining_time": "2 days, 7:31:07", "throughput": 26609.61, "total_tokens": 1466936768} +{"current_steps": 5460, "total_steps": 25209, "loss": 1.0804, "lr": 4.021418817037677e-05, "epoch": 0.6497727729142339, "percentage": 21.66, "elapsed_time": "15:20:24", "remaining_time": "2 days, 7:29:09", "throughput": 26611.42, "total_tokens": 1469608064} +{"current_steps": 5470, "total_steps": 25209, "loss": 1.068, "lr": 4.0201187753598174e-05, "epoch": 0.6509628329378863, "percentage": 21.7, "elapsed_time": "15:21:58", "remaining_time": "2 days, 7:27:03", "throughput": 26613.44, "total_tokens": 1472226880} +{"current_steps": 5480, "total_steps": 25209, "loss": 1.0864, "lr": 4.018819993697208e-05, "epoch": 0.6521528929615388, "percentage": 21.74, "elapsed_time": "15:23:37", "remaining_time": "2 days, 7:25:11", "throughput": 26614.96, "total_tokens": 1474921984} +{"current_steps": 5490, "total_steps": 25209, "loss": 1.0757, "lr": 4.017522470015793e-05, "epoch": 0.6533429529851912, "percentage": 21.78, "elapsed_time": "15:25:12", "remaining_time": "2 days, 7:23:11", "throughput": 26617.3, "total_tokens": 1477602496} +{"current_steps": 5500, "total_steps": 25209, "loss": 1.0656, "lr": 4.0162262022861144e-05, "epoch": 0.6545330130088436, "percentage": 21.82, "elapsed_time": "15:26:50", "remaining_time": "2 days, 7:21:18", "throughput": 26619.61, "total_tokens": 1480339584} +{"current_steps": 5510, "total_steps": 25209, "loss": 1.1008, "lr": 4.0149311884832906e-05, "epoch": 0.6557230730324961, "percentage": 21.86, "elapsed_time": "15:28:25", "remaining_time": "2 days, 7:19:14", "throughput": 26622.13, "total_tokens": 1482998976} +{"current_steps": 5520, "total_steps": 25209, "loss": 1.0789, "lr": 4.0136374265870116e-05, "epoch": 0.6569131330561485, "percentage": 21.9, "elapsed_time": "15:30:06", "remaining_time": "2 days, 7:17:33", "throughput": 26623.47, "total_tokens": 1485762752} +{"current_steps": 5530, "total_steps": 25209, "loss": 1.0839, "lr": 4.0123449145815174e-05, "epoch": 0.6581031930798009, "percentage": 21.94, "elapsed_time": "15:31:45", "remaining_time": "2 days, 7:15:45", "throughput": 26624.1, "total_tokens": 1488438400} +{"current_steps": 5540, "total_steps": 25209, "loss": 1.077, "lr": 4.011053650455592e-05, "epoch": 0.6592932531034534, "percentage": 21.98, "elapsed_time": "15:33:22", "remaining_time": "2 days, 7:13:49", "throughput": 26626.47, "total_tokens": 1491153856} +{"current_steps": 5550, "total_steps": 25209, "loss": 1.0763, "lr": 4.0097636322025466e-05, "epoch": 0.6604833131271058, "percentage": 22.02, "elapsed_time": "15:35:02", "remaining_time": "2 days, 7:12:04", "throughput": 26627.42, "total_tokens": 1493864832} +{"current_steps": 5560, "total_steps": 25209, "loss": 1.0885, "lr": 4.008474857820206e-05, "epoch": 0.6616733731507582, "percentage": 22.06, "elapsed_time": "15:36:40", "remaining_time": "2 days, 7:10:11", "throughput": 26629.45, "total_tokens": 1496583488} +{"current_steps": 5570, "total_steps": 25209, "loss": 1.0848, "lr": 4.007187325310899e-05, "epoch": 0.6628634331744108, "percentage": 22.1, "elapsed_time": "15:38:18", "remaining_time": "2 days, 7:08:19", "throughput": 26630.68, "total_tokens": 1499260032} +{"current_steps": 5580, "total_steps": 25209, "loss": 1.087, "lr": 4.00590103268144e-05, "epoch": 0.6640534931980632, "percentage": 22.13, "elapsed_time": "15:39:57", "remaining_time": "2 days, 7:06:32", "throughput": 26631.62, "total_tokens": 1501960768} +{"current_steps": 5590, "total_steps": 25209, "loss": 1.0707, "lr": 4.004615977943124e-05, "epoch": 0.6652435532217156, "percentage": 22.17, "elapsed_time": "15:41:36", "remaining_time": "2 days, 7:04:44", "throughput": 26632.18, "total_tokens": 1504634048} +{"current_steps": 5600, "total_steps": 25209, "loss": 1.0768, "lr": 4.0033321591117025e-05, "epoch": 0.6664336132453681, "percentage": 22.21, "elapsed_time": "15:43:09", "remaining_time": "2 days, 7:02:34", "throughput": 26635.99, "total_tokens": 1507322624} +{"current_steps": 5610, "total_steps": 25209, "loss": 1.0847, "lr": 4.002049574207381e-05, "epoch": 0.6676236732690205, "percentage": 22.25, "elapsed_time": "15:44:49", "remaining_time": "2 days, 7:00:49", "throughput": 26637.0, "total_tokens": 1510038592} +{"current_steps": 5620, "total_steps": 25209, "loss": 1.0739, "lr": 4.000768221254803e-05, "epoch": 0.6688137332926729, "percentage": 22.29, "elapsed_time": "15:46:27", "remaining_time": "2 days, 6:58:58", "throughput": 26638.41, "total_tokens": 1512735936} +{"current_steps": 5630, "total_steps": 25209, "loss": 1.0782, "lr": 3.999488098283034e-05, "epoch": 0.6700037933163254, "percentage": 22.33, "elapsed_time": "15:48:05", "remaining_time": "2 days, 6:57:04", "throughput": 26640.1, "total_tokens": 1515426752} +{"current_steps": 5640, "total_steps": 25209, "loss": 1.0777, "lr": 3.9982092033255506e-05, "epoch": 0.6711938533399778, "percentage": 22.37, "elapsed_time": "15:49:41", "remaining_time": "2 days, 6:55:07", "throughput": 26642.52, "total_tokens": 1518130688} +{"current_steps": 5650, "total_steps": 25209, "loss": 1.0834, "lr": 3.996931534420232e-05, "epoch": 0.6723839133636302, "percentage": 22.41, "elapsed_time": "15:51:19", "remaining_time": "2 days, 6:53:15", "throughput": 26644.03, "total_tokens": 1520820736} +{"current_steps": 5660, "total_steps": 25209, "loss": 1.0724, "lr": 3.995655089609339e-05, "epoch": 0.6735739733872828, "percentage": 22.45, "elapsed_time": "15:52:55", "remaining_time": "2 days, 6:51:16", "throughput": 26646.0, "total_tokens": 1523490176} +{"current_steps": 5670, "total_steps": 25209, "loss": 1.0659, "lr": 3.994379866939511e-05, "epoch": 0.6747640334109352, "percentage": 22.49, "elapsed_time": "15:54:33", "remaining_time": "2 days, 6:49:27", "throughput": 26647.22, "total_tokens": 1526188608} +{"current_steps": 5680, "total_steps": 25209, "loss": 1.0781, "lr": 3.993105864461745e-05, "epoch": 0.6759540934345876, "percentage": 22.53, "elapsed_time": "15:56:10", "remaining_time": "2 days, 6:47:33", "throughput": 26648.26, "total_tokens": 1528836544} +{"current_steps": 5690, "total_steps": 25209, "loss": 1.0646, "lr": 3.9918330802313866e-05, "epoch": 0.6771441534582401, "percentage": 22.57, "elapsed_time": "15:57:52", "remaining_time": "2 days, 6:45:55", "throughput": 26648.31, "total_tokens": 1531555840} +{"current_steps": 5700, "total_steps": 25209, "loss": 1.0658, "lr": 3.9905615123081206e-05, "epoch": 0.6783342134818925, "percentage": 22.61, "elapsed_time": "15:59:31", "remaining_time": "2 days, 6:44:05", "throughput": 26649.46, "total_tokens": 1534243712} +{"current_steps": 5710, "total_steps": 25209, "loss": 1.0709, "lr": 3.989291158755953e-05, "epoch": 0.6795242735055449, "percentage": 22.65, "elapsed_time": "16:01:04", "remaining_time": "2 days, 6:41:56", "throughput": 26652.55, "total_tokens": 1536897920} +{"current_steps": 5720, "total_steps": 25209, "loss": 1.0932, "lr": 3.988022017643201e-05, "epoch": 0.6807143335291974, "percentage": 22.69, "elapsed_time": "16:02:37", "remaining_time": "2 days, 6:39:50", "throughput": 26654.97, "total_tokens": 1539529344} +{"current_steps": 5730, "total_steps": 25209, "loss": 1.0745, "lr": 3.9867540870424826e-05, "epoch": 0.6819043935528498, "percentage": 22.73, "elapsed_time": "16:04:13", "remaining_time": "2 days, 6:37:50", "throughput": 26657.54, "total_tokens": 1542220160} +{"current_steps": 5740, "total_steps": 25209, "loss": 1.0853, "lr": 3.985487365030702e-05, "epoch": 0.6830944535765022, "percentage": 22.77, "elapsed_time": "16:05:52", "remaining_time": "2 days, 6:36:03", "throughput": 26658.74, "total_tokens": 1544937408} +{"current_steps": 5750, "total_steps": 25209, "loss": 1.0841, "lr": 3.984221849689036e-05, "epoch": 0.6842845136001547, "percentage": 22.81, "elapsed_time": "16:07:23", "remaining_time": "2 days, 6:33:50", "throughput": 26661.83, "total_tokens": 1547552320} +{"current_steps": 5760, "total_steps": 25209, "loss": 1.0692, "lr": 3.982957539102927e-05, "epoch": 0.6854745736238071, "percentage": 22.85, "elapsed_time": "16:09:00", "remaining_time": "2 days, 6:31:54", "throughput": 26663.72, "total_tokens": 1550236096} +{"current_steps": 5770, "total_steps": 25209, "loss": 1.0868, "lr": 3.981694431362065e-05, "epoch": 0.6866646336474596, "percentage": 22.89, "elapsed_time": "16:10:32", "remaining_time": "2 days, 6:29:42", "throughput": 26667.0, "total_tokens": 1552875392} +{"current_steps": 5780, "total_steps": 25209, "loss": 1.0728, "lr": 3.9804325245603786e-05, "epoch": 0.6878546936711121, "percentage": 22.93, "elapsed_time": "16:12:08", "remaining_time": "2 days, 6:27:46", "throughput": 26668.49, "total_tokens": 1555531712} +{"current_steps": 5790, "total_steps": 25209, "loss": 1.079, "lr": 3.9791718167960226e-05, "epoch": 0.6890447536947645, "percentage": 22.97, "elapsed_time": "16:13:39", "remaining_time": "2 days, 6:25:32", "throughput": 26671.86, "total_tokens": 1558155008} +{"current_steps": 5800, "total_steps": 25209, "loss": 1.0687, "lr": 3.9779123061713665e-05, "epoch": 0.6902348137184169, "percentage": 23.01, "elapsed_time": "16:15:15", "remaining_time": "2 days, 6:23:35", "throughput": 26673.45, "total_tokens": 1560817088} +{"current_steps": 5810, "total_steps": 25209, "loss": 1.084, "lr": 3.976653990792979e-05, "epoch": 0.6914248737420694, "percentage": 23.05, "elapsed_time": "16:16:47", "remaining_time": "2 days, 6:21:23", "throughput": 26676.72, "total_tokens": 1563446912} +{"current_steps": 5820, "total_steps": 25209, "loss": 1.0817, "lr": 3.9753968687716206e-05, "epoch": 0.6926149337657218, "percentage": 23.09, "elapsed_time": "16:18:24", "remaining_time": "2 days, 6:19:29", "throughput": 26677.9, "total_tokens": 1566103808} +{"current_steps": 5830, "total_steps": 25209, "loss": 1.094, "lr": 3.974140938222232e-05, "epoch": 0.6938049937893742, "percentage": 23.13, "elapsed_time": "16:19:59", "remaining_time": "2 days, 6:17:30", "throughput": 26680.18, "total_tokens": 1568785664} +{"current_steps": 5840, "total_steps": 25209, "loss": 1.0765, "lr": 3.972886197263915e-05, "epoch": 0.6949950538130267, "percentage": 23.17, "elapsed_time": "16:21:34", "remaining_time": "2 days, 6:15:29", "throughput": 26682.91, "total_tokens": 1571474240} +{"current_steps": 5850, "total_steps": 25209, "loss": 1.073, "lr": 3.97163264401993e-05, "epoch": 0.6961851138366791, "percentage": 23.21, "elapsed_time": "16:23:14", "remaining_time": "2 days, 6:13:45", "throughput": 26684.06, "total_tokens": 1574203264} +{"current_steps": 5860, "total_steps": 25209, "loss": 1.0813, "lr": 3.970380276617677e-05, "epoch": 0.6973751738603315, "percentage": 23.25, "elapsed_time": "16:24:50", "remaining_time": "2 days, 6:11:50", "throughput": 26686.16, "total_tokens": 1576910080} +{"current_steps": 5870, "total_steps": 25209, "loss": 1.0712, "lr": 3.96912909318869e-05, "epoch": 0.6985652338839841, "percentage": 23.29, "elapsed_time": "16:26:25", "remaining_time": "2 days, 6:09:48", "throughput": 26688.68, "total_tokens": 1579571008} +{"current_steps": 5880, "total_steps": 25209, "loss": 1.0853, "lr": 3.96787909186862e-05, "epoch": 0.6997552939076365, "percentage": 23.33, "elapsed_time": "16:28:02", "remaining_time": "2 days, 6:07:55", "throughput": 26690.2, "total_tokens": 1582258496} +{"current_steps": 5890, "total_steps": 25209, "loss": 1.071, "lr": 3.9666302707972244e-05, "epoch": 0.7009453539312889, "percentage": 23.36, "elapsed_time": "16:29:35", "remaining_time": "2 days, 6:05:50", "throughput": 26693.13, "total_tokens": 1584928640} +{"current_steps": 5900, "total_steps": 25209, "loss": 1.0749, "lr": 3.965382628118358e-05, "epoch": 0.7021354139549414, "percentage": 23.4, "elapsed_time": "16:31:13", "remaining_time": "2 days, 6:04:01", "throughput": 26694.58, "total_tokens": 1587632320} +{"current_steps": 5910, "total_steps": 25209, "loss": 1.0961, "lr": 3.964136161979959e-05, "epoch": 0.7033254739785938, "percentage": 23.44, "elapsed_time": "16:32:52", "remaining_time": "2 days, 6:02:12", "throughput": 26695.77, "total_tokens": 1590327744} +{"current_steps": 5920, "total_steps": 25209, "loss": 1.0655, "lr": 3.9628908705340406e-05, "epoch": 0.7045155340022462, "percentage": 23.48, "elapsed_time": "16:34:28", "remaining_time": "2 days, 6:00:16", "throughput": 26697.84, "total_tokens": 1593019584} +{"current_steps": 5930, "total_steps": 25209, "loss": 1.0905, "lr": 3.961646751936673e-05, "epoch": 0.7057055940258987, "percentage": 23.52, "elapsed_time": "16:36:02", "remaining_time": "2 days, 5:58:15", "throughput": 26700.71, "total_tokens": 1595712896} +{"current_steps": 5940, "total_steps": 25209, "loss": 1.0817, "lr": 3.960403804347979e-05, "epoch": 0.7068956540495511, "percentage": 23.56, "elapsed_time": "16:37:35", "remaining_time": "2 days, 5:56:08", "throughput": 26703.7, "total_tokens": 1598374144} +{"current_steps": 5950, "total_steps": 25209, "loss": 1.0708, "lr": 3.959162025932119e-05, "epoch": 0.7080857140732035, "percentage": 23.6, "elapsed_time": "16:39:14", "remaining_time": "2 days, 5:54:20", "throughput": 26705.03, "total_tokens": 1601084096} +{"current_steps": 5960, "total_steps": 25209, "loss": 1.0818, "lr": 3.95792141485728e-05, "epoch": 0.709275774096856, "percentage": 23.64, "elapsed_time": "16:40:52", "remaining_time": "2 days, 5:52:32", "throughput": 26706.45, "total_tokens": 1603800000} +{"current_steps": 5970, "total_steps": 25209, "loss": 1.0799, "lr": 3.956681969295664e-05, "epoch": 0.7104658341205085, "percentage": 23.68, "elapsed_time": "16:42:29", "remaining_time": "2 days, 5:50:37", "throughput": 26708.56, "total_tokens": 1606495808} +{"current_steps": 5980, "total_steps": 25209, "loss": 1.0878, "lr": 3.955443687423479e-05, "epoch": 0.7116558941441609, "percentage": 23.72, "elapsed_time": "16:44:07", "remaining_time": "2 days, 5:48:48", "throughput": 26709.87, "total_tokens": 1609200192} +{"current_steps": 5990, "total_steps": 25209, "loss": 1.0801, "lr": 3.954206567420924e-05, "epoch": 0.7128459541678134, "percentage": 23.76, "elapsed_time": "16:45:43", "remaining_time": "2 days, 5:46:52", "throughput": 26712.48, "total_tokens": 1611921088} +{"current_steps": 6000, "total_steps": 25209, "loss": 1.0812, "lr": 3.952970607472179e-05, "epoch": 0.7140360141914658, "percentage": 23.8, "elapsed_time": "16:47:20", "remaining_time": "2 days, 5:45:00", "throughput": 26713.99, "total_tokens": 1614610112} +{"current_steps": 6010, "total_steps": 25209, "loss": 1.0747, "lr": 3.951735805765399e-05, "epoch": 0.7152260742151182, "percentage": 23.84, "elapsed_time": "16:49:01", "remaining_time": "2 days, 5:43:20", "throughput": 26714.98, "total_tokens": 1617366080} +{"current_steps": 6020, "total_steps": 25209, "loss": 1.0683, "lr": 3.950502160492692e-05, "epoch": 0.7164161342387707, "percentage": 23.88, "elapsed_time": "16:50:38", "remaining_time": "2 days, 5:41:28", "throughput": 26715.92, "total_tokens": 1620018432} +{"current_steps": 6030, "total_steps": 25209, "loss": 1.077, "lr": 3.9492696698501205e-05, "epoch": 0.7176061942624231, "percentage": 23.92, "elapsed_time": "16:52:15", "remaining_time": "2 days, 5:39:36", "throughput": 26717.91, "total_tokens": 1622738304} +{"current_steps": 6040, "total_steps": 25209, "loss": 1.0813, "lr": 3.9480383320376784e-05, "epoch": 0.7187962542860755, "percentage": 23.96, "elapsed_time": "16:53:48", "remaining_time": "2 days, 5:37:31", "throughput": 26720.9, "total_tokens": 1625401984} +{"current_steps": 6050, "total_steps": 25209, "loss": 1.084, "lr": 3.94680814525929e-05, "epoch": 0.719986314309728, "percentage": 24.0, "elapsed_time": "16:55:27", "remaining_time": "2 days, 5:35:44", "throughput": 26722.12, "total_tokens": 1628120640} +{"current_steps": 6060, "total_steps": 25209, "loss": 1.0855, "lr": 3.945579107722792e-05, "epoch": 0.7211763743333804, "percentage": 24.04, "elapsed_time": "16:57:04", "remaining_time": "2 days, 5:33:51", "throughput": 26723.52, "total_tokens": 1630792448} +{"current_steps": 6070, "total_steps": 25209, "loss": 1.069, "lr": 3.9443512176399276e-05, "epoch": 0.7223664343570328, "percentage": 24.08, "elapsed_time": "16:58:42", "remaining_time": "2 days, 5:32:03", "throughput": 26724.52, "total_tokens": 1633479296} +{"current_steps": 6080, "total_steps": 25209, "loss": 1.0789, "lr": 3.9431244732263307e-05, "epoch": 0.7235564943806854, "percentage": 24.12, "elapsed_time": "17:00:22", "remaining_time": "2 days, 5:30:20", "throughput": 26725.32, "total_tokens": 1636200832} +{"current_steps": 6090, "total_steps": 25209, "loss": 1.0854, "lr": 3.941898872701519e-05, "epoch": 0.7247465544043378, "percentage": 24.16, "elapsed_time": "17:02:03", "remaining_time": "2 days, 5:28:38", "throughput": 26726.56, "total_tokens": 1638959872} +{"current_steps": 6100, "total_steps": 25209, "loss": 1.073, "lr": 3.940674414288882e-05, "epoch": 0.7259366144279902, "percentage": 24.2, "elapsed_time": "17:03:39", "remaining_time": "2 days, 5:26:42", "throughput": 26728.27, "total_tokens": 1641626304} +{"current_steps": 6110, "total_steps": 25209, "loss": 1.0805, "lr": 3.939451096215668e-05, "epoch": 0.7271266744516427, "percentage": 24.24, "elapsed_time": "17:05:12", "remaining_time": "2 days, 5:24:39", "throughput": 26731.14, "total_tokens": 1644298240} +{"current_steps": 6120, "total_steps": 25209, "loss": 1.0652, "lr": 3.938228916712978e-05, "epoch": 0.7283167344752951, "percentage": 24.28, "elapsed_time": "17:06:49", "remaining_time": "2 days, 5:22:46", "throughput": 26732.63, "total_tokens": 1646976256} +{"current_steps": 6130, "total_steps": 25209, "loss": 1.0813, "lr": 3.937007874015748e-05, "epoch": 0.7295067944989475, "percentage": 24.32, "elapsed_time": "17:08:30", "remaining_time": "2 days, 5:21:08", "throughput": 26732.71, "total_tokens": 1649693504} +{"current_steps": 6140, "total_steps": 25209, "loss": 1.0691, "lr": 3.935787966362748e-05, "epoch": 0.7306968545226, "percentage": 24.36, "elapsed_time": "17:10:06", "remaining_time": "2 days, 5:19:11", "throughput": 26734.85, "total_tokens": 1652376320} +{"current_steps": 6150, "total_steps": 25209, "loss": 1.0829, "lr": 3.9345691919965595e-05, "epoch": 0.7318869145462524, "percentage": 24.4, "elapsed_time": "17:11:45", "remaining_time": "2 days, 5:17:25", "throughput": 26735.88, "total_tokens": 1655085056} +{"current_steps": 6160, "total_steps": 25209, "loss": 1.0582, "lr": 3.9333515491635764e-05, "epoch": 0.7330769745699048, "percentage": 24.44, "elapsed_time": "17:13:18", "remaining_time": "2 days, 5:15:23", "throughput": 26738.37, "total_tokens": 1657746240} +{"current_steps": 6170, "total_steps": 25209, "loss": 1.0834, "lr": 3.932135036113987e-05, "epoch": 0.7342670345935574, "percentage": 24.48, "elapsed_time": "17:14:53", "remaining_time": "2 days, 5:13:24", "throughput": 26740.63, "total_tokens": 1660425984} +{"current_steps": 6180, "total_steps": 25209, "loss": 1.0711, "lr": 3.930919651101764e-05, "epoch": 0.7354570946172098, "percentage": 24.52, "elapsed_time": "17:16:30", "remaining_time": "2 days, 5:11:32", "throughput": 26741.66, "total_tokens": 1663080704} +{"current_steps": 6190, "total_steps": 25209, "loss": 1.0836, "lr": 3.9297053923846576e-05, "epoch": 0.7366471546408622, "percentage": 24.55, "elapsed_time": "17:18:08", "remaining_time": "2 days, 5:09:42", "throughput": 26742.61, "total_tokens": 1665749952} +{"current_steps": 6200, "total_steps": 25209, "loss": 1.0769, "lr": 3.928492258224183e-05, "epoch": 0.7378372146645147, "percentage": 24.59, "elapsed_time": "17:19:40", "remaining_time": "2 days, 5:07:37", "throughput": 26745.48, "total_tokens": 1668408128} +{"current_steps": 6210, "total_steps": 25209, "loss": 1.0641, "lr": 3.927280246885609e-05, "epoch": 0.7390272746881671, "percentage": 24.63, "elapsed_time": "17:21:16", "remaining_time": "2 days, 5:05:41", "throughput": 26747.38, "total_tokens": 1671083008} +{"current_steps": 6220, "total_steps": 25209, "loss": 1.0776, "lr": 3.9260693566379486e-05, "epoch": 0.7402173347118195, "percentage": 24.67, "elapsed_time": "17:22:57", "remaining_time": "2 days, 5:04:02", "throughput": 26747.23, "total_tokens": 1673773632} +{"current_steps": 6230, "total_steps": 25209, "loss": 1.0671, "lr": 3.924859585753948e-05, "epoch": 0.741407394735472, "percentage": 24.71, "elapsed_time": "17:24:35", "remaining_time": "2 days, 5:02:13", "throughput": 26748.42, "total_tokens": 1676463360} +{"current_steps": 6240, "total_steps": 25209, "loss": 1.0665, "lr": 3.923650932510079e-05, "epoch": 0.7425974547591244, "percentage": 24.75, "elapsed_time": "17:26:11", "remaining_time": "2 days, 5:00:19", "throughput": 26750.1, "total_tokens": 1679145088} +{"current_steps": 6250, "total_steps": 25209, "loss": 1.0612, "lr": 3.9224433951865215e-05, "epoch": 0.7437875147827768, "percentage": 24.79, "elapsed_time": "17:27:47", "remaining_time": "2 days, 4:58:24", "throughput": 26752.17, "total_tokens": 1681839232} +{"current_steps": 6260, "total_steps": 25209, "loss": 1.0691, "lr": 3.921236972067165e-05, "epoch": 0.7449775748064293, "percentage": 24.83, "elapsed_time": "17:29:23", "remaining_time": "2 days, 4:56:31", "throughput": 26753.8, "total_tokens": 1684523136} +{"current_steps": 6270, "total_steps": 25209, "loss": 1.091, "lr": 3.920031661439585e-05, "epoch": 0.7461676348300817, "percentage": 24.87, "elapsed_time": "17:30:59", "remaining_time": "2 days, 4:54:36", "throughput": 26756.46, "total_tokens": 1687250240} +{"current_steps": 6280, "total_steps": 25209, "loss": 1.0817, "lr": 3.918827461595045e-05, "epoch": 0.7473576948537342, "percentage": 24.91, "elapsed_time": "17:32:37", "remaining_time": "2 days, 4:52:47", "throughput": 26757.85, "total_tokens": 1689954432} +{"current_steps": 6290, "total_steps": 25209, "loss": 1.094, "lr": 3.9176243708284746e-05, "epoch": 0.7485477548773867, "percentage": 24.95, "elapsed_time": "17:34:14", "remaining_time": "2 days, 4:50:56", "throughput": 26758.86, "total_tokens": 1692623040} +{"current_steps": 6300, "total_steps": 25209, "loss": 1.0793, "lr": 3.9164223874384715e-05, "epoch": 0.7497378149010391, "percentage": 24.99, "elapsed_time": "17:35:50", "remaining_time": "2 days, 4:49:01", "throughput": 26760.71, "total_tokens": 1695299648} +{"current_steps": 6310, "total_steps": 25209, "loss": 1.0658, "lr": 3.91522150972728e-05, "epoch": 0.7509278749246915, "percentage": 25.03, "elapsed_time": "17:37:28", "remaining_time": "2 days, 4:47:12", "throughput": 26762.37, "total_tokens": 1698020608} +{"current_steps": 6320, "total_steps": 25209, "loss": 1.0735, "lr": 3.9140217360007896e-05, "epoch": 0.752117934948344, "percentage": 25.07, "elapsed_time": "17:39:03", "remaining_time": "2 days, 4:45:17", "throughput": 26764.22, "total_tokens": 1700703232} +{"current_steps": 6330, "total_steps": 25209, "loss": 1.0642, "lr": 3.912823064568521e-05, "epoch": 0.7533079949719964, "percentage": 25.11, "elapsed_time": "17:40:38", "remaining_time": "2 days, 4:43:20", "throughput": 26765.84, "total_tokens": 1703347392} +{"current_steps": 6340, "total_steps": 25209, "loss": 1.0941, "lr": 3.9116254937436155e-05, "epoch": 0.7544980549956488, "percentage": 25.15, "elapsed_time": "17:42:18", "remaining_time": "2 days, 4:41:38", "throughput": 26766.26, "total_tokens": 1706049152} +{"current_steps": 6350, "total_steps": 25209, "loss": 1.0712, "lr": 3.910429021842825e-05, "epoch": 0.7556881150193013, "percentage": 25.19, "elapsed_time": "17:43:52", "remaining_time": "2 days, 4:39:37", "throughput": 26768.85, "total_tokens": 1708721088} +{"current_steps": 6360, "total_steps": 25209, "loss": 1.0805, "lr": 3.9092336471865084e-05, "epoch": 0.7568781750429537, "percentage": 25.23, "elapsed_time": "17:45:34", "remaining_time": "2 days, 4:38:00", "throughput": 26769.57, "total_tokens": 1711488704} +{"current_steps": 6370, "total_steps": 25209, "loss": 1.0758, "lr": 3.908039368098611e-05, "epoch": 0.7580682350666061, "percentage": 25.27, "elapsed_time": "17:47:12", "remaining_time": "2 days, 4:36:14", "throughput": 26770.72, "total_tokens": 1714206976} +{"current_steps": 6380, "total_steps": 25209, "loss": 1.0741, "lr": 3.9068461829066633e-05, "epoch": 0.7592582950902587, "percentage": 25.31, "elapsed_time": "17:48:51", "remaining_time": "2 days, 4:34:29", "throughput": 26771.68, "total_tokens": 1716918528} +{"current_steps": 6390, "total_steps": 25209, "loss": 1.0797, "lr": 3.9056540899417656e-05, "epoch": 0.7604483551139111, "percentage": 25.35, "elapsed_time": "17:50:24", "remaining_time": "2 days, 4:32:24", "throughput": 26774.5, "total_tokens": 1719570560} +{"current_steps": 6400, "total_steps": 25209, "loss": 1.067, "lr": 3.904463087538585e-05, "epoch": 0.7616384151375635, "percentage": 25.39, "elapsed_time": "17:52:06", "remaining_time": "2 days, 4:30:48", "throughput": 26774.78, "total_tokens": 1722319680} +{"current_steps": 6410, "total_steps": 25209, "loss": 1.0708, "lr": 3.903273174035336e-05, "epoch": 0.762828475161216, "percentage": 25.43, "elapsed_time": "17:53:42", "remaining_time": "2 days, 4:28:56", "throughput": 26776.33, "total_tokens": 1725004032} +{"current_steps": 6420, "total_steps": 25209, "loss": 1.0673, "lr": 3.902084347773779e-05, "epoch": 0.7640185351848684, "percentage": 25.47, "elapsed_time": "17:55:24", "remaining_time": "2 days, 4:27:20", "throughput": 26775.94, "total_tokens": 1727711296} +{"current_steps": 6430, "total_steps": 25209, "loss": 1.0572, "lr": 3.900896607099207e-05, "epoch": 0.7652085952085208, "percentage": 25.51, "elapsed_time": "17:57:04", "remaining_time": "2 days, 4:25:36", "throughput": 26776.61, "total_tokens": 1730414656} +{"current_steps": 6440, "total_steps": 25209, "loss": 1.0602, "lr": 3.899709950360437e-05, "epoch": 0.7663986552321733, "percentage": 25.55, "elapsed_time": "17:58:43", "remaining_time": "2 days, 4:23:51", "throughput": 26777.54, "total_tokens": 1733123904} +{"current_steps": 6450, "total_steps": 25209, "loss": 1.0717, "lr": 3.8985243759097997e-05, "epoch": 0.7675887152558257, "percentage": 25.59, "elapsed_time": "18:00:20", "remaining_time": "2 days, 4:22:01", "throughput": 26778.71, "total_tokens": 1735805888} +{"current_steps": 6460, "total_steps": 25209, "loss": 1.0794, "lr": 3.897339882103129e-05, "epoch": 0.7687787752794781, "percentage": 25.63, "elapsed_time": "18:02:01", "remaining_time": "2 days, 4:20:23", "throughput": 26779.67, "total_tokens": 1738584576} +{"current_steps": 6470, "total_steps": 25209, "loss": 1.0646, "lr": 3.8961564672997544e-05, "epoch": 0.7699688353031306, "percentage": 25.67, "elapsed_time": "18:03:40", "remaining_time": "2 days, 4:18:39", "throughput": 26780.45, "total_tokens": 1741291072} +{"current_steps": 6480, "total_steps": 25209, "loss": 1.0699, "lr": 3.8949741298624924e-05, "epoch": 0.7711588953267831, "percentage": 25.71, "elapsed_time": "18:05:20", "remaining_time": "2 days, 4:16:54", "throughput": 26781.52, "total_tokens": 1744012864} +{"current_steps": 6490, "total_steps": 25209, "loss": 1.0793, "lr": 3.8937928681576305e-05, "epoch": 0.7723489553504355, "percentage": 25.74, "elapsed_time": "18:06:56", "remaining_time": "2 days, 4:15:04", "throughput": 26782.83, "total_tokens": 1746695616} +{"current_steps": 6500, "total_steps": 25209, "loss": 1.0714, "lr": 3.8926126805549276e-05, "epoch": 0.773539015374088, "percentage": 25.78, "elapsed_time": "18:08:33", "remaining_time": "2 days, 4:13:11", "throughput": 26784.33, "total_tokens": 1749368640} +{"current_steps": 6510, "total_steps": 25209, "loss": 1.0602, "lr": 3.891433565427596e-05, "epoch": 0.7747290753977404, "percentage": 25.82, "elapsed_time": "18:10:05", "remaining_time": "2 days, 4:11:08", "throughput": 26787.27, "total_tokens": 1752041792} +{"current_steps": 6520, "total_steps": 25209, "loss": 1.0819, "lr": 3.8902555211522964e-05, "epoch": 0.7759191354213928, "percentage": 25.86, "elapsed_time": "18:11:47", "remaining_time": "2 days, 4:09:32", "throughput": 26787.59, "total_tokens": 1754794240} +{"current_steps": 6530, "total_steps": 25209, "loss": 1.0703, "lr": 3.889078546109127e-05, "epoch": 0.7771091954450453, "percentage": 25.9, "elapsed_time": "18:13:21", "remaining_time": "2 days, 4:07:31", "throughput": 26790.09, "total_tokens": 1757465728} +{"current_steps": 6540, "total_steps": 25209, "loss": 1.0625, "lr": 3.887902638681616e-05, "epoch": 0.7782992554686977, "percentage": 25.94, "elapsed_time": "18:15:01", "remaining_time": "2 days, 4:05:51", "throughput": 26791.2, "total_tokens": 1760234176} +{"current_steps": 6550, "total_steps": 25209, "loss": 1.0704, "lr": 3.886727797256707e-05, "epoch": 0.7794893154923501, "percentage": 25.98, "elapsed_time": "18:16:39", "remaining_time": "2 days, 4:04:01", "throughput": 26792.78, "total_tokens": 1762940480} +{"current_steps": 6560, "total_steps": 25209, "loss": 1.0579, "lr": 3.88555402022476e-05, "epoch": 0.7806793755160026, "percentage": 26.02, "elapsed_time": "18:18:15", "remaining_time": "2 days, 4:02:09", "throughput": 26794.91, "total_tokens": 1765658112} +{"current_steps": 6570, "total_steps": 25209, "loss": 1.0629, "lr": 3.884381305979528e-05, "epoch": 0.781869435539655, "percentage": 26.06, "elapsed_time": "18:19:45", "remaining_time": "2 days, 3:59:59", "throughput": 26797.75, "total_tokens": 1768258688} +{"current_steps": 6580, "total_steps": 25209, "loss": 1.0851, "lr": 3.883209652918163e-05, "epoch": 0.7830594955633075, "percentage": 26.1, "elapsed_time": "18:21:17", "remaining_time": "2 days, 3:57:54", "throughput": 26800.31, "total_tokens": 1770887104} +{"current_steps": 6590, "total_steps": 25209, "loss": 1.0714, "lr": 3.8820390594411935e-05, "epoch": 0.78424955558696, "percentage": 26.14, "elapsed_time": "18:22:55", "remaining_time": "2 days, 3:56:08", "throughput": 26800.94, "total_tokens": 1773570048} +{"current_steps": 6600, "total_steps": 25209, "loss": 1.0641, "lr": 3.880869523952524e-05, "epoch": 0.7854396156106124, "percentage": 26.18, "elapsed_time": "18:24:29", "remaining_time": "2 days, 3:54:09", "throughput": 26803.04, "total_tokens": 1776221824} +{"current_steps": 6610, "total_steps": 25209, "loss": 1.0544, "lr": 3.879701044859422e-05, "epoch": 0.7866296756342648, "percentage": 26.22, "elapsed_time": "18:26:07", "remaining_time": "2 days, 3:52:22", "throughput": 26804.53, "total_tokens": 1778951360} +{"current_steps": 6620, "total_steps": 25209, "loss": 1.0655, "lr": 3.87853362057251e-05, "epoch": 0.7878197356579173, "percentage": 26.26, "elapsed_time": "18:27:43", "remaining_time": "2 days, 3:50:30", "throughput": 26806.09, "total_tokens": 1781633344} +{"current_steps": 6630, "total_steps": 25209, "loss": 1.0634, "lr": 3.8773672495057576e-05, "epoch": 0.7890097956815697, "percentage": 26.3, "elapsed_time": "18:29:17", "remaining_time": "2 days, 3:48:31", "throughput": 26808.04, "total_tokens": 1784275584} +{"current_steps": 6640, "total_steps": 25209, "loss": 1.0653, "lr": 3.8762019300764674e-05, "epoch": 0.7901998557052221, "percentage": 26.34, "elapsed_time": "18:30:50", "remaining_time": "2 days, 3:46:30", "throughput": 26811.17, "total_tokens": 1786982592} +{"current_steps": 6650, "total_steps": 25209, "loss": 1.0773, "lr": 3.875037660705273e-05, "epoch": 0.7913899157288746, "percentage": 26.38, "elapsed_time": "18:32:29", "remaining_time": "2 days, 3:44:45", "throughput": 26812.53, "total_tokens": 1789714560} +{"current_steps": 6660, "total_steps": 25209, "loss": 1.0743, "lr": 3.873874439816127e-05, "epoch": 0.792579975752527, "percentage": 26.42, "elapsed_time": "18:34:05", "remaining_time": "2 days, 3:42:54", "throughput": 26814.02, "total_tokens": 1792399744} +{"current_steps": 6670, "total_steps": 25209, "loss": 1.076, "lr": 3.872712265836289e-05, "epoch": 0.7937700357761794, "percentage": 26.46, "elapsed_time": "18:35:43", "remaining_time": "2 days, 3:41:05", "throughput": 26815.06, "total_tokens": 1795085184} +{"current_steps": 6680, "total_steps": 25209, "loss": 1.0569, "lr": 3.8715511371963225e-05, "epoch": 0.794960095799832, "percentage": 26.5, "elapsed_time": "18:37:16", "remaining_time": "2 days, 3:39:05", "throughput": 26817.32, "total_tokens": 1797737984} +{"current_steps": 6690, "total_steps": 25209, "loss": 1.0663, "lr": 3.87039105233008e-05, "epoch": 0.7961501558234844, "percentage": 26.54, "elapsed_time": "18:38:56", "remaining_time": "2 days, 3:37:23", "throughput": 26817.99, "total_tokens": 1800456768} +{"current_steps": 6700, "total_steps": 25209, "loss": 1.0505, "lr": 3.8692320096746975e-05, "epoch": 0.7973402158471368, "percentage": 26.58, "elapsed_time": "18:40:30", "remaining_time": "2 days, 3:35:27", "throughput": 26820.6, "total_tokens": 1803173568} +{"current_steps": 6710, "total_steps": 25209, "loss": 1.0758, "lr": 3.868074007670589e-05, "epoch": 0.7985302758707893, "percentage": 26.62, "elapsed_time": "18:42:04", "remaining_time": "2 days, 3:33:29", "throughput": 26822.67, "total_tokens": 1805824768} +{"current_steps": 6720, "total_steps": 25209, "loss": 1.0638, "lr": 3.866917044761428e-05, "epoch": 0.7997203358944417, "percentage": 26.66, "elapsed_time": "18:43:41", "remaining_time": "2 days, 3:31:40", "throughput": 26823.92, "total_tokens": 1808522112} +{"current_steps": 6730, "total_steps": 25209, "loss": 1.0716, "lr": 3.8657611193941486e-05, "epoch": 0.8009103959180941, "percentage": 26.7, "elapsed_time": "18:45:25", "remaining_time": "2 days, 3:30:08", "throughput": 26823.4, "total_tokens": 1811255680} +{"current_steps": 6740, "total_steps": 25209, "loss": 1.0794, "lr": 3.8646062300189315e-05, "epoch": 0.8021004559417466, "percentage": 26.74, "elapsed_time": "18:47:07", "remaining_time": "2 days, 3:28:32", "throughput": 26823.83, "total_tokens": 1814019072} +{"current_steps": 6750, "total_steps": 25209, "loss": 1.0656, "lr": 3.8634523750891984e-05, "epoch": 0.803290515965399, "percentage": 26.78, "elapsed_time": "18:48:44", "remaining_time": "2 days, 3:26:43", "throughput": 26825.16, "total_tokens": 1816719616} +{"current_steps": 6760, "total_steps": 25209, "loss": 1.061, "lr": 3.862299553061597e-05, "epoch": 0.8044805759890514, "percentage": 26.82, "elapsed_time": "18:50:22", "remaining_time": "2 days, 3:24:56", "throughput": 26826.31, "total_tokens": 1819417216} +{"current_steps": 6770, "total_steps": 25209, "loss": 1.0779, "lr": 3.861147762396e-05, "epoch": 0.805670636012704, "percentage": 26.86, "elapsed_time": "18:51:57", "remaining_time": "2 days, 3:23:02", "throughput": 26827.94, "total_tokens": 1822083200} +{"current_steps": 6780, "total_steps": 25209, "loss": 1.087, "lr": 3.859997001555494e-05, "epoch": 0.8068606960363564, "percentage": 26.9, "elapsed_time": "18:53:32", "remaining_time": "2 days, 3:21:07", "throughput": 26829.43, "total_tokens": 1824740288} +{"current_steps": 6790, "total_steps": 25209, "loss": 1.0796, "lr": 3.8588472690063676e-05, "epoch": 0.8080507560600088, "percentage": 26.93, "elapsed_time": "18:55:13", "remaining_time": "2 days, 3:19:28", "throughput": 26830.36, "total_tokens": 1827500160} +{"current_steps": 6800, "total_steps": 25209, "loss": 1.0638, "lr": 3.857698563218106e-05, "epoch": 0.8092408160836613, "percentage": 26.97, "elapsed_time": "18:56:47", "remaining_time": "2 days, 3:17:31", "throughput": 26833.34, "total_tokens": 1830228672} +{"current_steps": 6810, "total_steps": 25209, "loss": 1.0649, "lr": 3.8565508826633836e-05, "epoch": 0.8104308761073137, "percentage": 27.01, "elapsed_time": "18:58:29", "remaining_time": "2 days, 3:15:54", "throughput": 26833.58, "total_tokens": 1832978304} +{"current_steps": 6820, "total_steps": 25209, "loss": 1.0604, "lr": 3.855404225818049e-05, "epoch": 0.8116209361309661, "percentage": 27.05, "elapsed_time": "19:00:04", "remaining_time": "2 days, 3:14:01", "throughput": 26835.08, "total_tokens": 1835644160} +{"current_steps": 6830, "total_steps": 25209, "loss": 1.062, "lr": 3.8542585911611286e-05, "epoch": 0.8128109961546186, "percentage": 27.09, "elapsed_time": "19:01:35", "remaining_time": "2 days, 3:11:56", "throughput": 26837.51, "total_tokens": 1838256256} +{"current_steps": 6840, "total_steps": 25209, "loss": 1.0763, "lr": 3.853113977174803e-05, "epoch": 0.814001056178271, "percentage": 27.13, "elapsed_time": "19:03:10", "remaining_time": "2 days, 3:10:00", "throughput": 26839.56, "total_tokens": 1840932160} +{"current_steps": 6850, "total_steps": 25209, "loss": 1.0592, "lr": 3.851970382344411e-05, "epoch": 0.8151911162019234, "percentage": 27.17, "elapsed_time": "19:04:46", "remaining_time": "2 days, 3:08:08", "throughput": 26840.94, "total_tokens": 1843599232} +{"current_steps": 6860, "total_steps": 25209, "loss": 1.0664, "lr": 3.850827805158433e-05, "epoch": 0.8163811762255758, "percentage": 27.21, "elapsed_time": "19:06:16", "remaining_time": "2 days, 3:06:01", "throughput": 26843.39, "total_tokens": 1846189120} +{"current_steps": 6870, "total_steps": 25209, "loss": 1.0686, "lr": 3.8496862441084896e-05, "epoch": 0.8175712362492283, "percentage": 27.25, "elapsed_time": "19:07:54", "remaining_time": "2 days, 3:04:17", "throughput": 26843.93, "total_tokens": 1848875392} +{"current_steps": 6880, "total_steps": 25209, "loss": 1.0815, "lr": 3.848545697689328e-05, "epoch": 0.8187612962728807, "percentage": 27.29, "elapsed_time": "19:09:31", "remaining_time": "2 days, 3:02:26", "throughput": 26845.86, "total_tokens": 1851591552} +{"current_steps": 6890, "total_steps": 25209, "loss": 1.0625, "lr": 3.8474061643988136e-05, "epoch": 0.8199513562965332, "percentage": 27.33, "elapsed_time": "19:11:06", "remaining_time": "2 days, 3:00:33", "throughput": 26847.16, "total_tokens": 1854249152} +{"current_steps": 6900, "total_steps": 25209, "loss": 1.0828, "lr": 3.846267642737925e-05, "epoch": 0.8211414163201857, "percentage": 27.37, "elapsed_time": "19:12:45", "remaining_time": "2 days, 2:58:49", "throughput": 26848.41, "total_tokens": 1856986688} +{"current_steps": 6910, "total_steps": 25209, "loss": 1.0748, "lr": 3.8451301312107455e-05, "epoch": 0.8223314763438381, "percentage": 27.41, "elapsed_time": "19:14:26", "remaining_time": "2 days, 2:57:12", "throughput": 26848.42, "total_tokens": 1859708736} +{"current_steps": 6920, "total_steps": 25209, "loss": 1.0835, "lr": 3.843993628324451e-05, "epoch": 0.8235215363674905, "percentage": 27.45, "elapsed_time": "19:16:09", "remaining_time": "2 days, 2:55:37", "throughput": 26848.49, "total_tokens": 1862463424} +{"current_steps": 6930, "total_steps": 25209, "loss": 1.0691, "lr": 3.8428581325893034e-05, "epoch": 0.824711596391143, "percentage": 27.49, "elapsed_time": "19:17:51", "remaining_time": "2 days, 2:54:01", "throughput": 26848.39, "total_tokens": 1865193216} +{"current_steps": 6940, "total_steps": 25209, "loss": 1.0641, "lr": 3.8417236425186484e-05, "epoch": 0.8259016564147954, "percentage": 27.53, "elapsed_time": "19:19:25", "remaining_time": "2 days, 2:52:05", "throughput": 26850.64, "total_tokens": 1867878976} +{"current_steps": 6950, "total_steps": 25209, "loss": 1.0675, "lr": 3.840590156628895e-05, "epoch": 0.8270917164384478, "percentage": 27.57, "elapsed_time": "19:20:58", "remaining_time": "2 days, 2:50:05", "throughput": 26853.59, "total_tokens": 1870570112} +{"current_steps": 6960, "total_steps": 25209, "loss": 1.0763, "lr": 3.8394576734395205e-05, "epoch": 0.8282817764621003, "percentage": 27.61, "elapsed_time": "19:22:35", "remaining_time": "2 days, 2:48:17", "throughput": 26855.22, "total_tokens": 1873299072} +{"current_steps": 6970, "total_steps": 25209, "loss": 1.0783, "lr": 3.838326191473054e-05, "epoch": 0.8294718364857527, "percentage": 27.65, "elapsed_time": "19:24:08", "remaining_time": "2 days, 2:46:19", "throughput": 26857.48, "total_tokens": 1875961024} +{"current_steps": 6980, "total_steps": 25209, "loss": 1.0649, "lr": 3.837195709255069e-05, "epoch": 0.8306618965094051, "percentage": 27.69, "elapsed_time": "19:25:41", "remaining_time": "2 days, 2:44:20", "throughput": 26860.3, "total_tokens": 1878657920} +{"current_steps": 6990, "total_steps": 25209, "loss": 1.0727, "lr": 3.8360662253141796e-05, "epoch": 0.8318519565330577, "percentage": 27.73, "elapsed_time": "19:27:22", "remaining_time": "2 days, 2:42:41", "throughput": 26860.25, "total_tokens": 1881363904} +{"current_steps": 7000, "total_steps": 25209, "loss": 1.0676, "lr": 3.834937738182029e-05, "epoch": 0.8330420165567101, "percentage": 27.77, "elapsed_time": "19:28:59", "remaining_time": "2 days, 2:40:53", "throughput": 26861.83, "total_tokens": 1884081920} +{"current_steps": 7010, "total_steps": 25209, "loss": 1.0714, "lr": 3.833810246393281e-05, "epoch": 0.8342320765803625, "percentage": 27.81, "elapsed_time": "19:30:33", "remaining_time": "2 days, 2:38:57", "throughput": 26863.58, "total_tokens": 1886729728} +{"current_steps": 7020, "total_steps": 25209, "loss": 1.0564, "lr": 3.832683748485616e-05, "epoch": 0.835422136604015, "percentage": 27.85, "elapsed_time": "19:32:11", "remaining_time": "2 days, 2:37:10", "throughput": 26864.49, "total_tokens": 1889416128} +{"current_steps": 7030, "total_steps": 25209, "loss": 1.0685, "lr": 3.8315582429997184e-05, "epoch": 0.8366121966276674, "percentage": 27.89, "elapsed_time": "19:33:41", "remaining_time": "2 days, 2:35:02", "throughput": 26867.56, "total_tokens": 1892041088} +{"current_steps": 7040, "total_steps": 25209, "loss": 1.0616, "lr": 3.830433728479272e-05, "epoch": 0.8378022566513198, "percentage": 27.93, "elapsed_time": "19:35:20", "remaining_time": "2 days, 2:33:20", "throughput": 26868.45, "total_tokens": 1894766144} +{"current_steps": 7050, "total_steps": 25209, "loss": 1.062, "lr": 3.829310203470948e-05, "epoch": 0.8389923166749723, "percentage": 27.97, "elapsed_time": "19:36:56", "remaining_time": "2 days, 2:31:30", "throughput": 26869.63, "total_tokens": 1897442112} +{"current_steps": 7060, "total_steps": 25209, "loss": 1.0779, "lr": 3.828187666524403e-05, "epoch": 0.8401823766986247, "percentage": 28.01, "elapsed_time": "19:38:33", "remaining_time": "2 days, 2:29:42", "throughput": 26870.82, "total_tokens": 1900134912} +{"current_steps": 7070, "total_steps": 25209, "loss": 1.0627, "lr": 3.827066116192266e-05, "epoch": 0.8413724367222771, "percentage": 28.05, "elapsed_time": "19:40:13", "remaining_time": "2 days, 2:28:01", "throughput": 26871.68, "total_tokens": 1902881920} +{"current_steps": 7080, "total_steps": 25209, "loss": 1.0534, "lr": 3.825945551030135e-05, "epoch": 0.8425624967459296, "percentage": 28.09, "elapsed_time": "19:41:50", "remaining_time": "2 days, 2:26:13", "throughput": 26873.23, "total_tokens": 1905599168} +{"current_steps": 7090, "total_steps": 25209, "loss": 1.0538, "lr": 3.824825969596561e-05, "epoch": 0.843752556769582, "percentage": 28.12, "elapsed_time": "19:43:28", "remaining_time": "2 days, 2:24:27", "throughput": 26874.43, "total_tokens": 1908319488} +{"current_steps": 7100, "total_steps": 25209, "loss": 1.0725, "lr": 3.823707370453054e-05, "epoch": 0.8449426167932345, "percentage": 28.16, "elapsed_time": "19:45:08", "remaining_time": "2 days, 2:22:46", "throughput": 26874.78, "total_tokens": 1911025024} +{"current_steps": 7110, "total_steps": 25209, "loss": 1.0694, "lr": 3.8225897521640614e-05, "epoch": 0.846132676816887, "percentage": 28.2, "elapsed_time": "19:46:40", "remaining_time": "2 days, 2:20:46", "throughput": 26877.0, "total_tokens": 1913663552} +{"current_steps": 7120, "total_steps": 25209, "loss": 1.0648, "lr": 3.8214731132969675e-05, "epoch": 0.8473227368405394, "percentage": 28.24, "elapsed_time": "19:48:18", "remaining_time": "2 days, 2:19:00", "throughput": 26878.03, "total_tokens": 1916370944} +{"current_steps": 7130, "total_steps": 25209, "loss": 1.0507, "lr": 3.820357452422084e-05, "epoch": 0.8485127968641918, "percentage": 28.28, "elapsed_time": "19:49:59", "remaining_time": "2 days, 2:17:21", "throughput": 26878.39, "total_tokens": 1919097152} +{"current_steps": 7140, "total_steps": 25209, "loss": 1.0553, "lr": 3.8192427681126445e-05, "epoch": 0.8497028568878443, "percentage": 28.32, "elapsed_time": "19:51:36", "remaining_time": "2 days, 2:15:34", "throughput": 26879.88, "total_tokens": 1921818496} +{"current_steps": 7150, "total_steps": 25209, "loss": 1.0571, "lr": 3.818129058944793e-05, "epoch": 0.8508929169114967, "percentage": 28.36, "elapsed_time": "19:53:15", "remaining_time": "2 days, 2:13:51", "throughput": 26880.14, "total_tokens": 1924505216} +{"current_steps": 7160, "total_steps": 25209, "loss": 1.0734, "lr": 3.817016323497578e-05, "epoch": 0.8520829769351491, "percentage": 28.4, "elapsed_time": "19:54:54", "remaining_time": "2 days, 2:12:07", "throughput": 26880.4, "total_tokens": 1927170432} +{"current_steps": 7170, "total_steps": 25209, "loss": 1.0677, "lr": 3.8159045603529455e-05, "epoch": 0.8532730369588016, "percentage": 28.44, "elapsed_time": "19:56:34", "remaining_time": "2 days, 2:10:27", "throughput": 26880.89, "total_tokens": 1929897344} +{"current_steps": 7180, "total_steps": 25209, "loss": 1.0604, "lr": 3.8147937680957334e-05, "epoch": 0.854463096982454, "percentage": 28.48, "elapsed_time": "19:58:06", "remaining_time": "2 days, 2:08:27", "throughput": 26883.7, "total_tokens": 1932573952} +{"current_steps": 7190, "total_steps": 25209, "loss": 1.0656, "lr": 3.813683945313658e-05, "epoch": 0.8556531570061064, "percentage": 28.52, "elapsed_time": "19:59:43", "remaining_time": "2 days, 2:06:38", "throughput": 26884.87, "total_tokens": 1935258368} +{"current_steps": 7200, "total_steps": 25209, "loss": 1.0661, "lr": 3.812575090597313e-05, "epoch": 0.856843217029759, "percentage": 28.56, "elapsed_time": "20:01:19", "remaining_time": "2 days, 2:04:49", "throughput": 26886.53, "total_tokens": 1937971328} +{"current_steps": 7210, "total_steps": 25209, "loss": 1.069, "lr": 3.811467202540156e-05, "epoch": 0.8580332770534114, "percentage": 28.6, "elapsed_time": "20:02:58", "remaining_time": "2 days, 2:03:07", "throughput": 26887.4, "total_tokens": 1940704256} +{"current_steps": 7220, "total_steps": 25209, "loss": 1.0586, "lr": 3.810360279738507e-05, "epoch": 0.8592233370770638, "percentage": 28.64, "elapsed_time": "20:04:37", "remaining_time": "2 days, 2:01:22", "throughput": 26888.28, "total_tokens": 1943409728} +{"current_steps": 7230, "total_steps": 25209, "loss": 1.0554, "lr": 3.809254320791535e-05, "epoch": 0.8604133971007163, "percentage": 28.68, "elapsed_time": "20:06:15", "remaining_time": "2 days, 1:59:38", "throughput": 26889.03, "total_tokens": 1946115456} +{"current_steps": 7240, "total_steps": 25209, "loss": 1.0548, "lr": 3.808149324301256e-05, "epoch": 0.8616034571243687, "percentage": 28.72, "elapsed_time": "20:07:49", "remaining_time": "2 days, 1:57:42", "throughput": 26890.55, "total_tokens": 1948743936} +{"current_steps": 7250, "total_steps": 25209, "loss": 1.0586, "lr": 3.807045288872522e-05, "epoch": 0.8627935171480211, "percentage": 28.76, "elapsed_time": "20:09:29", "remaining_time": "2 days, 1:56:02", "throughput": 26890.78, "total_tokens": 1951452608} +{"current_steps": 7260, "total_steps": 25209, "loss": 1.0597, "lr": 3.805942213113015e-05, "epoch": 0.8639835771716736, "percentage": 28.8, "elapsed_time": "20:11:04", "remaining_time": "2 days, 1:54:10", "throughput": 26892.72, "total_tokens": 1954152448} +{"current_steps": 7270, "total_steps": 25209, "loss": 1.0564, "lr": 3.8048400956332385e-05, "epoch": 0.865173637195326, "percentage": 28.84, "elapsed_time": "20:12:43", "remaining_time": "2 days, 1:52:26", "throughput": 26893.29, "total_tokens": 1956849152} +{"current_steps": 7280, "total_steps": 25209, "loss": 1.0579, "lr": 3.803738935046512e-05, "epoch": 0.8663636972189784, "percentage": 28.88, "elapsed_time": "20:14:18", "remaining_time": "2 days, 1:50:33", "throughput": 26894.99, "total_tokens": 1959517952} +{"current_steps": 7290, "total_steps": 25209, "loss": 1.0742, "lr": 3.802638729968962e-05, "epoch": 0.867553757242631, "percentage": 28.92, "elapsed_time": "20:15:58", "remaining_time": "2 days, 1:48:53", "throughput": 26895.34, "total_tokens": 1962241152} +{"current_steps": 7300, "total_steps": 25209, "loss": 1.0548, "lr": 3.8015394790195145e-05, "epoch": 0.8687438172662834, "percentage": 28.96, "elapsed_time": "20:17:31", "remaining_time": "2 days, 1:46:56", "throughput": 26897.54, "total_tokens": 1964906560} +{"current_steps": 7310, "total_steps": 25209, "loss": 1.0728, "lr": 3.800441180819891e-05, "epoch": 0.8699338772899358, "percentage": 29.0, "elapsed_time": "20:19:10", "remaining_time": "2 days, 1:45:12", "throughput": 26898.57, "total_tokens": 1967633984} +{"current_steps": 7320, "total_steps": 25209, "loss": 1.0647, "lr": 3.7993438339945965e-05, "epoch": 0.8711239373135883, "percentage": 29.04, "elapsed_time": "20:20:48", "remaining_time": "2 days, 1:43:28", "throughput": 26899.57, "total_tokens": 1970348160} +{"current_steps": 7330, "total_steps": 25209, "loss": 1.0509, "lr": 3.798247437170914e-05, "epoch": 0.8723139973372407, "percentage": 29.08, "elapsed_time": "20:22:25", "remaining_time": "2 days, 1:41:39", "throughput": 26900.62, "total_tokens": 1973026688} +{"current_steps": 7340, "total_steps": 25209, "loss": 1.067, "lr": 3.797151988978901e-05, "epoch": 0.8735040573608931, "percentage": 29.12, "elapsed_time": "20:24:02", "remaining_time": "2 days, 1:39:54", "throughput": 26901.46, "total_tokens": 1975718784} +{"current_steps": 7350, "total_steps": 25209, "loss": 1.0511, "lr": 3.796057488051377e-05, "epoch": 0.8746941173845456, "percentage": 29.16, "elapsed_time": "20:25:35", "remaining_time": "2 days, 1:37:56", "throughput": 26903.34, "total_tokens": 1978357056} +{"current_steps": 7360, "total_steps": 25209, "loss": 1.0615, "lr": 3.794963933023918e-05, "epoch": 0.875884177408198, "percentage": 29.2, "elapsed_time": "20:27:08", "remaining_time": "2 days, 1:35:59", "throughput": 26905.53, "total_tokens": 1981017856} +{"current_steps": 7370, "total_steps": 25209, "loss": 1.061, "lr": 3.79387132253485e-05, "epoch": 0.8770742374318504, "percentage": 29.24, "elapsed_time": "20:28:43", "remaining_time": "2 days, 1:34:07", "throughput": 26906.84, "total_tokens": 1983671040} +{"current_steps": 7380, "total_steps": 25209, "loss": 1.081, "lr": 3.792779655225243e-05, "epoch": 0.8782642974555029, "percentage": 29.28, "elapsed_time": "20:30:19", "remaining_time": "2 days, 1:32:17", "throughput": 26908.17, "total_tokens": 1986357248} +{"current_steps": 7390, "total_steps": 25209, "loss": 1.0585, "lr": 3.791688929738902e-05, "epoch": 0.8794543574791553, "percentage": 29.31, "elapsed_time": "20:31:58", "remaining_time": "2 days, 1:30:34", "throughput": 26909.03, "total_tokens": 1989071744} +{"current_steps": 7400, "total_steps": 25209, "loss": 1.0471, "lr": 3.79059914472236e-05, "epoch": 0.8806444175028078, "percentage": 29.35, "elapsed_time": "20:33:37", "remaining_time": "2 days, 1:28:52", "throughput": 26908.98, "total_tokens": 1991743232} +{"current_steps": 7410, "total_steps": 25209, "loss": 1.0668, "lr": 3.7895102988248716e-05, "epoch": 0.8818344775264603, "percentage": 29.39, "elapsed_time": "20:35:17", "remaining_time": "2 days, 1:27:12", "throughput": 26909.49, "total_tokens": 1994469568} +{"current_steps": 7420, "total_steps": 25209, "loss": 1.0678, "lr": 3.7884223906984064e-05, "epoch": 0.8830245375501127, "percentage": 29.43, "elapsed_time": "20:36:55", "remaining_time": "2 days, 1:25:27", "throughput": 26910.49, "total_tokens": 1997180352} +{"current_steps": 7430, "total_steps": 25209, "loss": 1.0678, "lr": 3.787335418997641e-05, "epoch": 0.8842145975737651, "percentage": 29.47, "elapsed_time": "20:38:37", "remaining_time": "2 days, 1:23:51", "throughput": 26910.35, "total_tokens": 1999905280} +{"current_steps": 7440, "total_steps": 25209, "loss": 1.0542, "lr": 3.786249382379952e-05, "epoch": 0.8854046575974176, "percentage": 29.51, "elapsed_time": "20:40:13", "remaining_time": "2 days, 1:22:03", "throughput": 26911.32, "total_tokens": 2002575104} +{"current_steps": 7450, "total_steps": 25209, "loss": 1.0606, "lr": 3.785164279505411e-05, "epoch": 0.88659471762107, "percentage": 29.55, "elapsed_time": "20:41:51", "remaining_time": "2 days, 1:20:16", "throughput": 26912.84, "total_tokens": 2005310272} +{"current_steps": 7460, "total_steps": 25209, "loss": 1.0606, "lr": 3.7840801090367744e-05, "epoch": 0.8877847776447224, "percentage": 29.59, "elapsed_time": "20:43:26", "remaining_time": "2 days, 1:18:25", "throughput": 26914.29, "total_tokens": 2007979008} +{"current_steps": 7470, "total_steps": 25209, "loss": 1.0597, "lr": 3.782996869639479e-05, "epoch": 0.8889748376683749, "percentage": 29.63, "elapsed_time": "20:45:02", "remaining_time": "2 days, 1:16:36", "throughput": 26915.13, "total_tokens": 2010630848} +{"current_steps": 7480, "total_steps": 25209, "loss": 1.0733, "lr": 3.7819145599816354e-05, "epoch": 0.8901648976920273, "percentage": 29.67, "elapsed_time": "20:46:37", "remaining_time": "2 days, 1:14:44", "throughput": 26917.25, "total_tokens": 2013342784} +{"current_steps": 7490, "total_steps": 25209, "loss": 1.0548, "lr": 3.780833178734018e-05, "epoch": 0.8913549577156797, "percentage": 29.71, "elapsed_time": "20:48:20", "remaining_time": "2 days, 1:13:10", "throughput": 26917.06, "total_tokens": 2016094656} +{"current_steps": 7500, "total_steps": 25209, "loss": 1.0501, "lr": 3.77975272457006e-05, "epoch": 0.8925450177393323, "percentage": 29.75, "elapsed_time": "20:49:55", "remaining_time": "2 days, 1:11:20", "throughput": 26918.75, "total_tokens": 2018795840} +{"current_steps": 7510, "total_steps": 25209, "loss": 1.06, "lr": 3.778673196165851e-05, "epoch": 0.8937350777629847, "percentage": 29.79, "elapsed_time": "20:51:30", "remaining_time": "2 days, 1:09:27", "throughput": 26920.71, "total_tokens": 2021493440} +{"current_steps": 7520, "total_steps": 25209, "loss": 1.0655, "lr": 3.7775945922001186e-05, "epoch": 0.8949251377866371, "percentage": 29.83, "elapsed_time": "20:53:10", "remaining_time": "2 days, 1:07:47", "throughput": 26921.56, "total_tokens": 2024241920} +{"current_steps": 7530, "total_steps": 25209, "loss": 1.0589, "lr": 3.776516911354236e-05, "epoch": 0.8961151978102896, "percentage": 29.87, "elapsed_time": "20:54:45", "remaining_time": "2 days, 1:05:55", "throughput": 26923.71, "total_tokens": 2026961088} +{"current_steps": 7540, "total_steps": 25209, "loss": 1.0516, "lr": 3.775440152312205e-05, "epoch": 0.897305257833942, "percentage": 29.91, "elapsed_time": "20:56:19", "remaining_time": "2 days, 1:04:02", "throughput": 26925.51, "total_tokens": 2029632704} +{"current_steps": 7550, "total_steps": 25209, "loss": 1.0591, "lr": 3.774364313760652e-05, "epoch": 0.8984953178575944, "percentage": 29.95, "elapsed_time": "20:58:00", "remaining_time": "2 days, 1:02:24", "throughput": 26925.44, "total_tokens": 2032344576} +{"current_steps": 7560, "total_steps": 25209, "loss": 1.065, "lr": 3.7732893943888224e-05, "epoch": 0.8996853778812469, "percentage": 29.99, "elapsed_time": "20:59:37", "remaining_time": "2 days, 1:00:38", "throughput": 26926.83, "total_tokens": 2035072896} +{"current_steps": 7570, "total_steps": 25209, "loss": 1.0612, "lr": 3.772215392888574e-05, "epoch": 0.9008754379048993, "percentage": 30.03, "elapsed_time": "21:01:15", "remaining_time": "2 days, 0:58:52", "throughput": 26928.11, "total_tokens": 2037797056} +{"current_steps": 7580, "total_steps": 25209, "loss": 1.0614, "lr": 3.771142307954368e-05, "epoch": 0.9020654979285517, "percentage": 30.07, "elapsed_time": "21:02:53", "remaining_time": "2 days, 0:57:07", "throughput": 26929.32, "total_tokens": 2040517568} +{"current_steps": 7590, "total_steps": 25209, "loss": 1.0641, "lr": 3.770070138283264e-05, "epoch": 0.9032555579522042, "percentage": 30.11, "elapsed_time": "21:04:32", "remaining_time": "2 days, 0:55:25", "throughput": 26930.33, "total_tokens": 2043263744} +{"current_steps": 7600, "total_steps": 25209, "loss": 1.0663, "lr": 3.768998882574915e-05, "epoch": 0.9044456179758567, "percentage": 30.15, "elapsed_time": "21:06:09", "remaining_time": "2 days, 0:53:40", "throughput": 26931.1, "total_tokens": 2045950400} +{"current_steps": 7610, "total_steps": 25209, "loss": 1.0634, "lr": 3.767928539531557e-05, "epoch": 0.9056356779995091, "percentage": 30.19, "elapsed_time": "21:07:42", "remaining_time": "2 days, 0:51:43", "throughput": 26933.33, "total_tokens": 2048624000} +{"current_steps": 7620, "total_steps": 25209, "loss": 1.0607, "lr": 3.7668591078580055e-05, "epoch": 0.9068257380231616, "percentage": 30.23, "elapsed_time": "21:09:18", "remaining_time": "2 days, 0:49:54", "throughput": 26934.63, "total_tokens": 2051303616} +{"current_steps": 7630, "total_steps": 25209, "loss": 1.0662, "lr": 3.765790586261647e-05, "epoch": 0.908015798046814, "percentage": 30.27, "elapsed_time": "21:10:56", "remaining_time": "2 days, 0:48:10", "throughput": 26935.02, "total_tokens": 2053978624} +{"current_steps": 7640, "total_steps": 25209, "loss": 1.0668, "lr": 3.7647229734524326e-05, "epoch": 0.9092058580704664, "percentage": 30.31, "elapsed_time": "21:12:34", "remaining_time": "2 days, 0:46:25", "throughput": 26935.82, "total_tokens": 2056666752} +{"current_steps": 7650, "total_steps": 25209, "loss": 1.0624, "lr": 3.7636562681428744e-05, "epoch": 0.9103959180941189, "percentage": 30.35, "elapsed_time": "21:14:12", "remaining_time": "2 days, 0:44:40", "throughput": 26936.52, "total_tokens": 2059356224} +{"current_steps": 7660, "total_steps": 25209, "loss": 1.0613, "lr": 3.7625904690480346e-05, "epoch": 0.9115859781177713, "percentage": 30.39, "elapsed_time": "21:15:45", "remaining_time": "2 days, 0:42:44", "throughput": 26938.39, "total_tokens": 2062003904} +{"current_steps": 7670, "total_steps": 25209, "loss": 1.0628, "lr": 3.7615255748855224e-05, "epoch": 0.9127760381414237, "percentage": 30.43, "elapsed_time": "21:17:21", "remaining_time": "2 days, 0:40:55", "throughput": 26939.8, "total_tokens": 2064701248} +{"current_steps": 7680, "total_steps": 25209, "loss": 1.0675, "lr": 3.7604615843754845e-05, "epoch": 0.9139660981650762, "percentage": 30.47, "elapsed_time": "21:18:59", "remaining_time": "2 days, 0:39:11", "throughput": 26940.38, "total_tokens": 2067385472} +{"current_steps": 7690, "total_steps": 25209, "loss": 1.0645, "lr": 3.759398496240601e-05, "epoch": 0.9151561581887286, "percentage": 30.5, "elapsed_time": "21:20:35", "remaining_time": "2 days, 0:37:23", "throughput": 26941.88, "total_tokens": 2070093952} +{"current_steps": 7700, "total_steps": 25209, "loss": 1.0388, "lr": 3.7583363092060815e-05, "epoch": 0.916346218212381, "percentage": 30.54, "elapsed_time": "21:22:13", "remaining_time": "2 days, 0:35:39", "throughput": 26943.16, "total_tokens": 2072840704} +{"current_steps": 7710, "total_steps": 25209, "loss": 1.073, "lr": 3.757275021999649e-05, "epoch": 0.9175362782360336, "percentage": 30.58, "elapsed_time": "21:23:47", "remaining_time": "2 days, 0:33:45", "throughput": 26945.03, "total_tokens": 2075514368} +{"current_steps": 7720, "total_steps": 25209, "loss": 1.0693, "lr": 3.7562146333515445e-05, "epoch": 0.918726338259686, "percentage": 30.62, "elapsed_time": "21:25:27", "remaining_time": "2 days, 0:32:06", "throughput": 26945.58, "total_tokens": 2078248512} +{"current_steps": 7730, "total_steps": 25209, "loss": 1.057, "lr": 3.7551551419945167e-05, "epoch": 0.9199163982833384, "percentage": 30.66, "elapsed_time": "21:27:06", "remaining_time": "2 days, 0:30:23", "throughput": 26946.28, "total_tokens": 2080961856} +{"current_steps": 7740, "total_steps": 25209, "loss": 1.0451, "lr": 3.7540965466638104e-05, "epoch": 0.9211064583069909, "percentage": 30.7, "elapsed_time": "21:28:44", "remaining_time": "2 days, 0:28:39", "throughput": 26947.42, "total_tokens": 2083691456} +{"current_steps": 7750, "total_steps": 25209, "loss": 1.0679, "lr": 3.753038846097172e-05, "epoch": 0.9222965183306433, "percentage": 30.74, "elapsed_time": "21:30:24", "remaining_time": "2 days, 0:26:59", "throughput": 26947.54, "total_tokens": 2086391360} +{"current_steps": 7760, "total_steps": 25209, "loss": 1.0585, "lr": 3.751982039034827e-05, "epoch": 0.9234865783542957, "percentage": 30.78, "elapsed_time": "21:32:00", "remaining_time": "2 days, 0:25:10", "throughput": 26948.53, "total_tokens": 2089051264} +{"current_steps": 7770, "total_steps": 25209, "loss": 1.0536, "lr": 3.75092612421949e-05, "epoch": 0.9246766383779482, "percentage": 30.82, "elapsed_time": "21:33:38", "remaining_time": "2 days, 0:23:26", "throughput": 26949.33, "total_tokens": 2091758656} +{"current_steps": 7780, "total_steps": 25209, "loss": 1.0568, "lr": 3.7498711003963475e-05, "epoch": 0.9258666984016006, "percentage": 30.86, "elapsed_time": "21:35:10", "remaining_time": "2 days, 0:21:30", "throughput": 26951.61, "total_tokens": 2094431360} +{"current_steps": 7790, "total_steps": 25209, "loss": 1.0631, "lr": 3.748816966313058e-05, "epoch": 0.927056758425253, "percentage": 30.9, "elapsed_time": "21:36:48", "remaining_time": "2 days, 0:19:46", "throughput": 26952.21, "total_tokens": 2097121728} +{"current_steps": 7800, "total_steps": 25209, "loss": 1.0641, "lr": 3.7477637207197374e-05, "epoch": 0.9282468184489056, "percentage": 30.94, "elapsed_time": "21:38:20", "remaining_time": "2 days, 0:17:48", "throughput": 26954.61, "total_tokens": 2099789952} +{"current_steps": 7810, "total_steps": 25209, "loss": 1.0577, "lr": 3.7467113623689666e-05, "epoch": 0.929436878472558, "percentage": 30.98, "elapsed_time": "21:39:59", "remaining_time": "2 days, 0:16:06", "throughput": 26955.25, "total_tokens": 2102505536} +{"current_steps": 7820, "total_steps": 25209, "loss": 1.0697, "lr": 3.745659890015768e-05, "epoch": 0.9306269384962104, "percentage": 31.02, "elapsed_time": "21:41:38", "remaining_time": "2 days, 0:14:23", "throughput": 26955.95, "total_tokens": 2105210752} +{"current_steps": 7830, "total_steps": 25209, "loss": 1.0648, "lr": 3.744609302417615e-05, "epoch": 0.9318169985198629, "percentage": 31.06, "elapsed_time": "21:43:13", "remaining_time": "2 days, 0:12:32", "throughput": 26957.12, "total_tokens": 2107861120} +{"current_steps": 7840, "total_steps": 25209, "loss": 1.061, "lr": 3.7435595983344175e-05, "epoch": 0.9330070585435153, "percentage": 31.1, "elapsed_time": "21:44:49", "remaining_time": "2 days, 0:10:45", "throughput": 26957.95, "total_tokens": 2110529408} +{"current_steps": 7850, "total_steps": 25209, "loss": 1.0551, "lr": 3.7425107765285155e-05, "epoch": 0.9341971185671677, "percentage": 31.14, "elapsed_time": "21:46:28", "remaining_time": "2 days, 0:09:04", "throughput": 26958.51, "total_tokens": 2113247936} +{"current_steps": 7860, "total_steps": 25209, "loss": 1.0616, "lr": 3.741462835764676e-05, "epoch": 0.9353871785908202, "percentage": 31.18, "elapsed_time": "21:48:03", "remaining_time": "2 days, 0:07:12", "throughput": 26960.16, "total_tokens": 2115927680} +{"current_steps": 7870, "total_steps": 25209, "loss": 1.0533, "lr": 3.740415774810088e-05, "epoch": 0.9365772386144726, "percentage": 31.22, "elapsed_time": "21:49:39", "remaining_time": "2 days, 0:05:24", "throughput": 26961.69, "total_tokens": 2118640128} +{"current_steps": 7880, "total_steps": 25209, "loss": 1.0596, "lr": 3.739369592434351e-05, "epoch": 0.937767298638125, "percentage": 31.26, "elapsed_time": "21:51:16", "remaining_time": "2 days, 0:03:39", "throughput": 26962.81, "total_tokens": 2121347392} +{"current_steps": 7890, "total_steps": 25209, "loss": 1.0587, "lr": 3.738324287409473e-05, "epoch": 0.9389573586617775, "percentage": 31.3, "elapsed_time": "21:52:54", "remaining_time": "2 days, 0:01:55", "throughput": 26964.02, "total_tokens": 2124083648} +{"current_steps": 7900, "total_steps": 25209, "loss": 1.0584, "lr": 3.7372798585098644e-05, "epoch": 0.94014741868543, "percentage": 31.34, "elapsed_time": "21:54:28", "remaining_time": "2 days, 0:00:02", "throughput": 26965.65, "total_tokens": 2126744128} +{"current_steps": 7910, "total_steps": 25209, "loss": 1.0386, "lr": 3.736236304512331e-05, "epoch": 0.9413374787090824, "percentage": 31.38, "elapsed_time": "21:56:01", "remaining_time": "1 day, 23:58:07", "throughput": 26967.48, "total_tokens": 2129393728} +{"current_steps": 7920, "total_steps": 25209, "loss": 1.055, "lr": 3.735193624196067e-05, "epoch": 0.9425275387327349, "percentage": 31.42, "elapsed_time": "21:57:36", "remaining_time": "1 day, 23:56:17", "throughput": 26968.87, "total_tokens": 2132069568} +{"current_steps": 7930, "total_steps": 25209, "loss": 1.0483, "lr": 3.7341518163426514e-05, "epoch": 0.9437175987563873, "percentage": 31.46, "elapsed_time": "21:59:17", "remaining_time": "1 day, 23:54:40", "throughput": 26969.16, "total_tokens": 2134818752} +{"current_steps": 7940, "total_steps": 25209, "loss": 1.0622, "lr": 3.73311087973604e-05, "epoch": 0.9449076587800397, "percentage": 31.5, "elapsed_time": "22:00:56", "remaining_time": "1 day, 23:52:58", "throughput": 26969.01, "total_tokens": 2137475392} +{"current_steps": 7950, "total_steps": 25209, "loss": 1.0695, "lr": 3.732070813162561e-05, "epoch": 0.9460977188036922, "percentage": 31.54, "elapsed_time": "22:02:38", "remaining_time": "1 day, 23:51:22", "throughput": 26969.06, "total_tokens": 2140218048} +{"current_steps": 7960, "total_steps": 25209, "loss": 1.0608, "lr": 3.731031615410908e-05, "epoch": 0.9472877788273446, "percentage": 31.58, "elapsed_time": "22:04:09", "remaining_time": "1 day, 23:49:23", "throughput": 26971.51, "total_tokens": 2142871104} +{"current_steps": 7970, "total_steps": 25209, "loss": 1.0674, "lr": 3.729993285272132e-05, "epoch": 0.948477838850997, "percentage": 31.62, "elapsed_time": "22:05:48", "remaining_time": "1 day, 23:47:42", "throughput": 26972.28, "total_tokens": 2145610688} +{"current_steps": 7980, "total_steps": 25209, "loss": 1.06, "lr": 3.7289558215396414e-05, "epoch": 0.9496678988746495, "percentage": 31.66, "elapsed_time": "22:07:27", "remaining_time": "1 day, 23:46:00", "throughput": 26972.87, "total_tokens": 2148322176} +{"current_steps": 7990, "total_steps": 25209, "loss": 1.0559, "lr": 3.727919223009191e-05, "epoch": 0.9508579588983019, "percentage": 31.7, "elapsed_time": "22:09:07", "remaining_time": "1 day, 23:44:20", "throughput": 26973.65, "total_tokens": 2151070272} +{"current_steps": 8000, "total_steps": 25209, "loss": 1.0538, "lr": 3.726883488478877e-05, "epoch": 0.9520480189219543, "percentage": 31.73, "elapsed_time": "22:10:44", "remaining_time": "1 day, 23:42:34", "throughput": 26974.45, "total_tokens": 2153749312} +{"current_steps": 8010, "total_steps": 25209, "loss": 1.0615, "lr": 3.7258486167491323e-05, "epoch": 0.9532380789456069, "percentage": 31.77, "elapsed_time": "22:12:26", "remaining_time": "1 day, 23:41:00", "throughput": 26974.06, "total_tokens": 2156476736} +{"current_steps": 8020, "total_steps": 25209, "loss": 1.0451, "lr": 3.724814606622721e-05, "epoch": 0.9544281389692593, "percentage": 31.81, "elapsed_time": "22:14:04", "remaining_time": "1 day, 23:39:15", "throughput": 26974.9, "total_tokens": 2159182976} +{"current_steps": 8030, "total_steps": 25209, "loss": 1.0618, "lr": 3.7237814569047294e-05, "epoch": 0.9556181989929117, "percentage": 31.85, "elapsed_time": "22:15:40", "remaining_time": "1 day, 23:37:28", "throughput": 26975.83, "total_tokens": 2161853632} +{"current_steps": 8040, "total_steps": 25209, "loss": 1.055, "lr": 3.7227491664025656e-05, "epoch": 0.9568082590165642, "percentage": 31.89, "elapsed_time": "22:17:20", "remaining_time": "1 day, 23:35:48", "throughput": 26976.02, "total_tokens": 2164562048} +{"current_steps": 8050, "total_steps": 25209, "loss": 1.0472, "lr": 3.721717733925948e-05, "epoch": 0.9579983190402166, "percentage": 31.93, "elapsed_time": "22:18:56", "remaining_time": "1 day, 23:34:02", "throughput": 26977.0, "total_tokens": 2167245440} +{"current_steps": 8060, "total_steps": 25209, "loss": 1.0622, "lr": 3.720687158286904e-05, "epoch": 0.959188379063869, "percentage": 31.97, "elapsed_time": "22:20:32", "remaining_time": "1 day, 23:32:13", "throughput": 26978.57, "total_tokens": 2169955840} +{"current_steps": 8070, "total_steps": 25209, "loss": 1.0477, "lr": 3.719657438299762e-05, "epoch": 0.9603784390875215, "percentage": 32.01, "elapsed_time": "22:22:07", "remaining_time": "1 day, 23:30:23", "throughput": 26980.04, "total_tokens": 2172628224} +{"current_steps": 8080, "total_steps": 25209, "loss": 1.0508, "lr": 3.7186285727811446e-05, "epoch": 0.9615684991111739, "percentage": 32.05, "elapsed_time": "22:23:44", "remaining_time": "1 day, 23:28:38", "throughput": 26981.42, "total_tokens": 2175374976} +{"current_steps": 8090, "total_steps": 25209, "loss": 1.0533, "lr": 3.717600560549967e-05, "epoch": 0.9627585591348263, "percentage": 32.09, "elapsed_time": "22:25:18", "remaining_time": "1 day, 23:26:46", "throughput": 26982.73, "total_tokens": 2178011904} +{"current_steps": 8100, "total_steps": 25209, "loss": 1.0464, "lr": 3.716573400427426e-05, "epoch": 0.9639486191584788, "percentage": 32.13, "elapsed_time": "22:26:54", "remaining_time": "1 day, 23:24:59", "throughput": 26983.74, "total_tokens": 2180688128} +{"current_steps": 8110, "total_steps": 25209, "loss": 1.0554, "lr": 3.7155470912370004e-05, "epoch": 0.9651386791821313, "percentage": 32.17, "elapsed_time": "22:28:35", "remaining_time": "1 day, 23:23:21", "throughput": 26983.96, "total_tokens": 2183427328} +{"current_steps": 8120, "total_steps": 25209, "loss": 1.0543, "lr": 3.714521631804439e-05, "epoch": 0.9663287392057837, "percentage": 32.21, "elapsed_time": "22:30:11", "remaining_time": "1 day, 23:21:33", "throughput": 26984.94, "total_tokens": 2186099072} +{"current_steps": 8130, "total_steps": 25209, "loss": 1.0561, "lr": 3.713497020957759e-05, "epoch": 0.9675187992294362, "percentage": 32.25, "elapsed_time": "22:31:50", "remaining_time": "1 day, 23:19:51", "throughput": 26985.71, "total_tokens": 2188823232} +{"current_steps": 8140, "total_steps": 25209, "loss": 1.0589, "lr": 3.712473257527238e-05, "epoch": 0.9687088592530886, "percentage": 32.29, "elapsed_time": "22:33:28", "remaining_time": "1 day, 23:18:07", "throughput": 26986.89, "total_tokens": 2191554176} +{"current_steps": 8150, "total_steps": 25209, "loss": 1.0592, "lr": 3.711450340345412e-05, "epoch": 0.969898919276741, "percentage": 32.33, "elapsed_time": "22:35:04", "remaining_time": "1 day, 23:16:20", "throughput": 26988.08, "total_tokens": 2194250880} +{"current_steps": 8160, "total_steps": 25209, "loss": 1.0484, "lr": 3.710428268247067e-05, "epoch": 0.9710889793003935, "percentage": 32.37, "elapsed_time": "22:36:37", "remaining_time": "1 day, 23:14:27", "throughput": 26988.99, "total_tokens": 2196849344} +{"current_steps": 8170, "total_steps": 25209, "loss": 1.0574, "lr": 3.709407040069233e-05, "epoch": 0.9722790393240459, "percentage": 32.41, "elapsed_time": "22:38:14", "remaining_time": "1 day, 23:12:40", "throughput": 26989.73, "total_tokens": 2199508352} +{"current_steps": 8180, "total_steps": 25209, "loss": 1.0579, "lr": 3.708386654651179e-05, "epoch": 0.9734690993476983, "percentage": 32.45, "elapsed_time": "22:39:52", "remaining_time": "1 day, 23:10:58", "throughput": 26990.55, "total_tokens": 2202234368} +{"current_steps": 8190, "total_steps": 25209, "loss": 1.038, "lr": 3.707367110834409e-05, "epoch": 0.9746591593713508, "percentage": 32.49, "elapsed_time": "22:41:30", "remaining_time": "1 day, 23:09:14", "throughput": 26991.59, "total_tokens": 2204949760} +{"current_steps": 8200, "total_steps": 25209, "loss": 1.0389, "lr": 3.7063484074626555e-05, "epoch": 0.9758492193950032, "percentage": 32.53, "elapsed_time": "22:43:07", "remaining_time": "1 day, 23:07:28", "throughput": 26993.01, "total_tokens": 2207677568} +{"current_steps": 8210, "total_steps": 25209, "loss": 1.0418, "lr": 3.7053305433818725e-05, "epoch": 0.9770392794186556, "percentage": 32.57, "elapsed_time": "22:44:45", "remaining_time": "1 day, 23:05:45", "throughput": 26993.4, "total_tokens": 2210363648} +{"current_steps": 8220, "total_steps": 25209, "loss": 1.0448, "lr": 3.704313517440232e-05, "epoch": 0.9782293394423082, "percentage": 32.61, "elapsed_time": "22:46:16", "remaining_time": "1 day, 23:03:48", "throughput": 26995.48, "total_tokens": 2213003264} +{"current_steps": 8230, "total_steps": 25209, "loss": 1.0588, "lr": 3.703297328488118e-05, "epoch": 0.9794193994659606, "percentage": 32.65, "elapsed_time": "22:47:55", "remaining_time": "1 day, 23:02:07", "throughput": 26995.87, "total_tokens": 2215704448} +{"current_steps": 8240, "total_steps": 25209, "loss": 1.0573, "lr": 3.70228197537812e-05, "epoch": 0.980609459489613, "percentage": 32.69, "elapsed_time": "22:49:35", "remaining_time": "1 day, 23:00:26", "throughput": 26996.63, "total_tokens": 2218448320} +{"current_steps": 8250, "total_steps": 25209, "loss": 1.05, "lr": 3.7012674569650305e-05, "epoch": 0.9817995195132655, "percentage": 32.73, "elapsed_time": "22:51:12", "remaining_time": "1 day, 22:58:41", "throughput": 26997.45, "total_tokens": 2221139712} +{"current_steps": 8260, "total_steps": 25209, "loss": 1.0722, "lr": 3.700253772105835e-05, "epoch": 0.9829895795369179, "percentage": 32.77, "elapsed_time": "22:52:47", "remaining_time": "1 day, 22:56:52", "throughput": 26998.83, "total_tokens": 2223822656} +{"current_steps": 8270, "total_steps": 25209, "loss": 1.0431, "lr": 3.699240919659711e-05, "epoch": 0.9841796395605703, "percentage": 32.81, "elapsed_time": "22:54:20", "remaining_time": "1 day, 22:54:58", "throughput": 27000.64, "total_tokens": 2226476608} +{"current_steps": 8280, "total_steps": 25209, "loss": 1.0578, "lr": 3.698228898488019e-05, "epoch": 0.9853696995842228, "percentage": 32.85, "elapsed_time": "22:56:00", "remaining_time": "1 day, 22:53:20", "throughput": 27000.57, "total_tokens": 2229180544} +{"current_steps": 8290, "total_steps": 25209, "loss": 1.0516, "lr": 3.6972177074543e-05, "epoch": 0.9865597596078752, "percentage": 32.89, "elapsed_time": "22:57:38", "remaining_time": "1 day, 22:51:36", "throughput": 27001.41, "total_tokens": 2231893888} +{"current_steps": 8300, "total_steps": 25209, "loss": 1.0534, "lr": 3.69620734542427e-05, "epoch": 0.9877498196315276, "percentage": 32.92, "elapsed_time": "22:59:11", "remaining_time": "1 day, 22:49:42", "throughput": 27003.41, "total_tokens": 2234561024} +{"current_steps": 8310, "total_steps": 25209, "loss": 1.0609, "lr": 3.695197811265811e-05, "epoch": 0.9889398796551802, "percentage": 32.96, "elapsed_time": "23:00:44", "remaining_time": "1 day, 22:47:49", "throughput": 27004.91, "total_tokens": 2237202432} +{"current_steps": 8320, "total_steps": 25209, "loss": 1.0497, "lr": 3.6941891038489694e-05, "epoch": 0.9901299396788326, "percentage": 33.0, "elapsed_time": "23:02:18", "remaining_time": "1 day, 22:45:59", "throughput": 27006.0, "total_tokens": 2239835392} +{"current_steps": 8330, "total_steps": 25209, "loss": 1.0525, "lr": 3.693181222045952e-05, "epoch": 0.991319999702485, "percentage": 33.04, "elapsed_time": "23:03:54", "remaining_time": "1 day, 22:44:12", "throughput": 27006.61, "total_tokens": 2242481536} +{"current_steps": 8340, "total_steps": 25209, "loss": 1.0582, "lr": 3.692174164731113e-05, "epoch": 0.9925100597261375, "percentage": 33.08, "elapsed_time": "23:05:29", "remaining_time": "1 day, 22:42:22", "throughput": 27007.62, "total_tokens": 2245125824} +{"current_steps": 8350, "total_steps": 25209, "loss": 1.0474, "lr": 3.6911679307809595e-05, "epoch": 0.9937001197497899, "percentage": 33.12, "elapsed_time": "23:07:10", "remaining_time": "1 day, 22:40:44", "throughput": 27007.62, "total_tokens": 2247845312} +{"current_steps": 8360, "total_steps": 25209, "loss": 1.0513, "lr": 3.690162519074137e-05, "epoch": 0.9948901797734423, "percentage": 33.16, "elapsed_time": "23:08:49", "remaining_time": "1 day, 22:39:04", "throughput": 27008.29, "total_tokens": 2250586240} +{"current_steps": 8370, "total_steps": 25209, "loss": 1.0451, "lr": 3.689157928491431e-05, "epoch": 0.9960802397970948, "percentage": 33.2, "elapsed_time": "23:10:27", "remaining_time": "1 day, 22:37:21", "throughput": 27008.41, "total_tokens": 2253235008} +{"current_steps": 8380, "total_steps": 25209, "loss": 1.0407, "lr": 3.6881541579157566e-05, "epoch": 0.9972702998207472, "percentage": 33.24, "elapsed_time": "23:12:04", "remaining_time": "1 day, 22:35:37", "throughput": 27009.32, "total_tokens": 2255950912} +{"current_steps": 8390, "total_steps": 25209, "loss": 1.0678, "lr": 3.687151206232154e-05, "epoch": 0.9984603598443996, "percentage": 33.28, "elapsed_time": "23:13:46", "remaining_time": "1 day, 22:34:01", "throughput": 27009.42, "total_tokens": 2258703296} +{"current_steps": 8400, "total_steps": 25209, "loss": 1.0525, "lr": 3.686149072327788e-05, "epoch": 0.9996504198680521, "percentage": 33.32, "elapsed_time": "23:15:27", "remaining_time": "1 day, 22:32:23", "throughput": 27009.56, "total_tokens": 2261430912} +{"current_steps": 8410, "total_steps": 25209, "loss": 0.9998, "lr": 3.685147755091937e-05, "epoch": 1.0008330420165568, "percentage": 33.36, "elapsed_time": "23:17:06", "remaining_time": "1 day, 22:30:44", "throughput": 27009.86, "total_tokens": 2264154944} +{"current_steps": 8420, "total_steps": 25209, "loss": 0.9789, "lr": 3.684147253415992e-05, "epoch": 1.002023102040209, "percentage": 33.4, "elapsed_time": "23:18:44", "remaining_time": "1 day, 22:29:00", "throughput": 27011.06, "total_tokens": 2266883520} +{"current_steps": 8430, "total_steps": 25209, "loss": 0.9697, "lr": 3.683147566193448e-05, "epoch": 1.0032131620638616, "percentage": 33.44, "elapsed_time": "23:20:23", "remaining_time": "1 day, 22:27:20", "throughput": 27011.7, "total_tokens": 2269624640} +{"current_steps": 8440, "total_steps": 25209, "loss": 0.9798, "lr": 3.6821486923199025e-05, "epoch": 1.004403222087514, "percentage": 33.48, "elapsed_time": "23:21:56", "remaining_time": "1 day, 22:25:27", "throughput": 27013.46, "total_tokens": 2272284160} +{"current_steps": 8450, "total_steps": 25209, "loss": 0.9891, "lr": 3.681150630693046e-05, "epoch": 1.0055932821111664, "percentage": 33.52, "elapsed_time": "23:23:33", "remaining_time": "1 day, 22:23:42", "throughput": 27014.45, "total_tokens": 2274989504} +{"current_steps": 8460, "total_steps": 25209, "loss": 0.9767, "lr": 3.6801533802126615e-05, "epoch": 1.006783342134819, "percentage": 33.56, "elapsed_time": "23:25:19", "remaining_time": "1 day, 22:22:14", "throughput": 27013.5, "total_tokens": 2277760192} +{"current_steps": 8470, "total_steps": 25209, "loss": 0.9761, "lr": 3.679156939780617e-05, "epoch": 1.0079734021584714, "percentage": 33.6, "elapsed_time": "23:26:56", "remaining_time": "1 day, 22:20:30", "throughput": 27013.81, "total_tokens": 2280424320} +{"current_steps": 8480, "total_steps": 25209, "loss": 0.9739, "lr": 3.6781613083008594e-05, "epoch": 1.0091634621821237, "percentage": 33.64, "elapsed_time": "23:28:40", "remaining_time": "1 day, 22:18:58", "throughput": 27013.07, "total_tokens": 2283155904} +{"current_steps": 8490, "total_steps": 25209, "loss": 0.9726, "lr": 3.677166484679412e-05, "epoch": 1.0103535222057762, "percentage": 33.68, "elapsed_time": "23:30:15", "remaining_time": "1 day, 22:17:09", "throughput": 27014.11, "total_tokens": 2285812544} +{"current_steps": 8500, "total_steps": 25209, "loss": 0.972, "lr": 3.676172467824368e-05, "epoch": 1.0115435822294288, "percentage": 33.72, "elapsed_time": "23:31:48", "remaining_time": "1 day, 22:15:17", "throughput": 27015.03, "total_tokens": 2288412608} +{"current_steps": 8510, "total_steps": 25209, "loss": 0.9791, "lr": 3.675179256645885e-05, "epoch": 1.012733642253081, "percentage": 33.76, "elapsed_time": "23:33:27", "remaining_time": "1 day, 22:13:35", "throughput": 27015.68, "total_tokens": 2291124160} +{"current_steps": 8520, "total_steps": 25209, "loss": 0.99, "lr": 3.674186850056181e-05, "epoch": 1.0139237022767336, "percentage": 33.8, "elapsed_time": "23:35:02", "remaining_time": "1 day, 22:11:46", "throughput": 27017.26, "total_tokens": 2293823552} +{"current_steps": 8530, "total_steps": 25209, "loss": 0.9945, "lr": 3.67319524696953e-05, "epoch": 1.015113762300386, "percentage": 33.84, "elapsed_time": "23:36:37", "remaining_time": "1 day, 22:09:58", "throughput": 27018.78, "total_tokens": 2296522176} +{"current_steps": 8540, "total_steps": 25209, "loss": 0.9706, "lr": 3.6722044463022536e-05, "epoch": 1.0163038223240384, "percentage": 33.88, "elapsed_time": "23:38:16", "remaining_time": "1 day, 22:08:17", "throughput": 27019.26, "total_tokens": 2299237632} +{"current_steps": 8550, "total_steps": 25209, "loss": 0.9901, "lr": 3.6712144469727214e-05, "epoch": 1.017493882347691, "percentage": 33.92, "elapsed_time": "23:39:54", "remaining_time": "1 day, 22:06:34", "throughput": 27020.01, "total_tokens": 2301948416} +{"current_steps": 8560, "total_steps": 25209, "loss": 0.9805, "lr": 3.67022524790134e-05, "epoch": 1.0186839423713434, "percentage": 33.96, "elapsed_time": "23:41:30", "remaining_time": "1 day, 22:04:48", "throughput": 27020.73, "total_tokens": 2304613440} +{"current_steps": 8570, "total_steps": 25209, "loss": 0.9846, "lr": 3.6692368480105546e-05, "epoch": 1.0198740023949957, "percentage": 34.0, "elapsed_time": "23:43:06", "remaining_time": "1 day, 22:03:00", "throughput": 27021.77, "total_tokens": 2307281472} +{"current_steps": 8580, "total_steps": 25209, "loss": 0.9478, "lr": 3.6682492462248374e-05, "epoch": 1.0210640624186482, "percentage": 34.04, "elapsed_time": "23:44:43", "remaining_time": "1 day, 22:01:16", "throughput": 27022.58, "total_tokens": 2309982976} +{"current_steps": 8590, "total_steps": 25209, "loss": 0.9783, "lr": 3.667262441470689e-05, "epoch": 1.0222541224423007, "percentage": 34.08, "elapsed_time": "23:46:18", "remaining_time": "1 day, 21:59:28", "throughput": 27023.77, "total_tokens": 2312659328} +{"current_steps": 8600, "total_steps": 25209, "loss": 0.9753, "lr": 3.6662764326766255e-05, "epoch": 1.023444182465953, "percentage": 34.11, "elapsed_time": "23:47:53", "remaining_time": "1 day, 21:57:40", "throughput": 27025.34, "total_tokens": 2315367232} +{"current_steps": 8610, "total_steps": 25209, "loss": 0.9812, "lr": 3.665291218773185e-05, "epoch": 1.0246342424896056, "percentage": 34.15, "elapsed_time": "23:49:30", "remaining_time": "1 day, 21:55:55", "throughput": 27026.31, "total_tokens": 2318073344} +{"current_steps": 8620, "total_steps": 25209, "loss": 0.9807, "lr": 3.664306798692912e-05, "epoch": 1.025824302513258, "percentage": 34.19, "elapsed_time": "23:51:11", "remaining_time": "1 day, 21:54:18", "throughput": 27026.76, "total_tokens": 2320840064} +{"current_steps": 8630, "total_steps": 25209, "loss": 0.9679, "lr": 3.6633231713703576e-05, "epoch": 1.0270143625369104, "percentage": 34.23, "elapsed_time": "23:52:50", "remaining_time": "1 day, 21:52:37", "throughput": 27027.06, "total_tokens": 2323532480} +{"current_steps": 8640, "total_steps": 25209, "loss": 0.9869, "lr": 3.6623403357420745e-05, "epoch": 1.0282044225605629, "percentage": 34.27, "elapsed_time": "23:54:28", "remaining_time": "1 day, 21:50:54", "throughput": 27027.73, "total_tokens": 2326235904} +{"current_steps": 8650, "total_steps": 25209, "loss": 0.9793, "lr": 3.661358290746611e-05, "epoch": 1.0293944825842154, "percentage": 34.31, "elapsed_time": "23:56:09", "remaining_time": "1 day, 21:49:16", "throughput": 27027.69, "total_tokens": 2328955200} +{"current_steps": 8660, "total_steps": 25209, "loss": 0.9665, "lr": 3.6603770353245056e-05, "epoch": 1.0305845426078677, "percentage": 34.35, "elapsed_time": "23:57:44", "remaining_time": "1 day, 21:47:28", "throughput": 27028.92, "total_tokens": 2331628416} +{"current_steps": 8670, "total_steps": 25209, "loss": 0.9813, "lr": 3.659396568418286e-05, "epoch": 1.0317746026315202, "percentage": 34.39, "elapsed_time": "23:59:21", "remaining_time": "1 day, 21:45:44", "throughput": 27029.71, "total_tokens": 2334330624} +{"current_steps": 8680, "total_steps": 25209, "loss": 0.9733, "lr": 3.658416888972459e-05, "epoch": 1.0329646626551727, "percentage": 34.43, "elapsed_time": "1 day, 0:00:58", "remaining_time": "1 day, 21:43:59", "throughput": 27030.39, "total_tokens": 2337005568} +{"current_steps": 8690, "total_steps": 25209, "loss": 0.9798, "lr": 3.6574379959335106e-05, "epoch": 1.034154722678825, "percentage": 34.47, "elapsed_time": "1 day, 0:02:31", "remaining_time": "1 day, 21:42:07", "throughput": 27032.51, "total_tokens": 2339704256} +{"current_steps": 8700, "total_steps": 25209, "loss": 0.9841, "lr": 3.6564598882498976e-05, "epoch": 1.0353447827024775, "percentage": 34.51, "elapsed_time": "1 day, 0:04:10", "remaining_time": "1 day, 21:40:27", "throughput": 27032.39, "total_tokens": 2342380288} +{"current_steps": 8710, "total_steps": 25209, "loss": 0.9899, "lr": 3.655482564872043e-05, "epoch": 1.03653484272613, "percentage": 34.55, "elapsed_time": "1 day, 0:05:51", "remaining_time": "1 day, 21:38:49", "throughput": 27032.44, "total_tokens": 2345100288} +{"current_steps": 8720, "total_steps": 25209, "loss": 0.9738, "lr": 3.654506024752336e-05, "epoch": 1.0377249027497824, "percentage": 34.59, "elapsed_time": "1 day, 0:07:27", "remaining_time": "1 day, 21:37:03", "throughput": 27033.51, "total_tokens": 2347787840} +{"current_steps": 8730, "total_steps": 25209, "loss": 0.9861, "lr": 3.653530266845121e-05, "epoch": 1.0389149627734349, "percentage": 34.63, "elapsed_time": "1 day, 0:09:07", "remaining_time": "1 day, 21:35:23", "throughput": 27033.68, "total_tokens": 2350498944} +{"current_steps": 8740, "total_steps": 25209, "loss": 0.9705, "lr": 3.652555290106696e-05, "epoch": 1.0401050227970874, "percentage": 34.67, "elapsed_time": "1 day, 0:10:45", "remaining_time": "1 day, 21:33:42", "throughput": 27033.75, "total_tokens": 2353173760} +{"current_steps": 8750, "total_steps": 25209, "loss": 0.9681, "lr": 3.6515810934953084e-05, "epoch": 1.0412950828207397, "percentage": 34.71, "elapsed_time": "1 day, 0:12:22", "remaining_time": "1 day, 21:31:57", "throughput": 27034.57, "total_tokens": 2355862912} +{"current_steps": 8760, "total_steps": 25209, "loss": 0.9814, "lr": 3.650607675971151e-05, "epoch": 1.0424851428443922, "percentage": 34.75, "elapsed_time": "1 day, 0:14:00", "remaining_time": "1 day, 21:30:15", "throughput": 27034.82, "total_tokens": 2358542912} +{"current_steps": 8770, "total_steps": 25209, "loss": 0.9695, "lr": 3.649635036496351e-05, "epoch": 1.0436752028680447, "percentage": 34.79, "elapsed_time": "1 day, 0:15:52", "remaining_time": "1 day, 21:28:58", "throughput": 27031.65, "total_tokens": 2361287104} +{"current_steps": 8780, "total_steps": 25209, "loss": 0.9844, "lr": 3.6486631740349746e-05, "epoch": 1.044865262891697, "percentage": 34.83, "elapsed_time": "1 day, 0:17:27", "remaining_time": "1 day, 21:27:10", "throughput": 27033.25, "total_tokens": 2363986816} +{"current_steps": 8790, "total_steps": 25209, "loss": 0.994, "lr": 3.647692087553018e-05, "epoch": 1.0460553229153495, "percentage": 34.87, "elapsed_time": "1 day, 0:19:06", "remaining_time": "1 day, 21:25:29", "throughput": 27033.95, "total_tokens": 2366720000} +{"current_steps": 8800, "total_steps": 25209, "loss": 0.9887, "lr": 3.6467217760184005e-05, "epoch": 1.047245382939002, "percentage": 34.91, "elapsed_time": "1 day, 0:20:41", "remaining_time": "1 day, 21:23:42", "throughput": 27035.32, "total_tokens": 2369425152} +{"current_steps": 8810, "total_steps": 25209, "loss": 0.9787, "lr": 3.6457522384009625e-05, "epoch": 1.0484354429626543, "percentage": 34.95, "elapsed_time": "1 day, 0:22:33", "remaining_time": "1 day, 21:22:24", "throughput": 27031.52, "total_tokens": 2372099968} +{"current_steps": 8820, "total_steps": 25209, "loss": 0.9795, "lr": 3.644783473672462e-05, "epoch": 1.0496255029863069, "percentage": 34.99, "elapsed_time": "1 day, 0:24:27", "remaining_time": "1 day, 21:21:12", "throughput": 27026.56, "total_tokens": 2374760896} +{"current_steps": 8830, "total_steps": 25209, "loss": 0.9737, "lr": 3.643815480806568e-05, "epoch": 1.0508155630099594, "percentage": 35.03, "elapsed_time": "1 day, 0:26:23", "remaining_time": "1 day, 21:20:03", "throughput": 27021.87, "total_tokens": 2377481728} +{"current_steps": 8840, "total_steps": 25209, "loss": 0.9749, "lr": 3.6428482587788555e-05, "epoch": 1.0520056230336117, "percentage": 35.07, "elapsed_time": "1 day, 0:28:12", "remaining_time": "1 day, 21:18:40", "throughput": 27019.01, "total_tokens": 2380169024} +{"current_steps": 8850, "total_steps": 25209, "loss": 0.9737, "lr": 3.641881806566803e-05, "epoch": 1.0531956830572642, "percentage": 35.11, "elapsed_time": "1 day, 0:30:03", "remaining_time": "1 day, 21:17:21", "throughput": 27015.61, "total_tokens": 2382867840} +{"current_steps": 8860, "total_steps": 25209, "loss": 0.9701, "lr": 3.640916123149788e-05, "epoch": 1.0543857430809167, "percentage": 35.15, "elapsed_time": "1 day, 0:31:49", "remaining_time": "1 day, 21:15:53", "throughput": 27013.38, "total_tokens": 2385534144} +{"current_steps": 8870, "total_steps": 25209, "loss": 0.9779, "lr": 3.639951207509079e-05, "epoch": 1.055575803104569, "percentage": 35.19, "elapsed_time": "1 day, 0:33:34", "remaining_time": "1 day, 21:14:23", "throughput": 27011.92, "total_tokens": 2388238272} +{"current_steps": 8880, "total_steps": 25209, "loss": 0.9887, "lr": 3.6389870586278333e-05, "epoch": 1.0567658631282215, "percentage": 35.23, "elapsed_time": "1 day, 0:35:20", "remaining_time": "1 day, 21:12:56", "throughput": 27009.89, "total_tokens": 2390929536} +{"current_steps": 8890, "total_steps": 25209, "loss": 0.9711, "lr": 3.6380236754910965e-05, "epoch": 1.057955923151874, "percentage": 35.27, "elapsed_time": "1 day, 0:37:04", "remaining_time": "1 day, 21:11:24", "throughput": 27008.32, "total_tokens": 2393608640} +{"current_steps": 8900, "total_steps": 25209, "loss": 0.9742, "lr": 3.6370610570857897e-05, "epoch": 1.0591459831755263, "percentage": 35.3, "elapsed_time": "1 day, 0:38:56", "remaining_time": "1 day, 21:10:08", "throughput": 27004.33, "total_tokens": 2396282688} +{"current_steps": 8910, "total_steps": 25209, "loss": 0.9798, "lr": 3.6360992024007114e-05, "epoch": 1.0603360431991788, "percentage": 35.34, "elapsed_time": "1 day, 0:40:38", "remaining_time": "1 day, 21:08:31", "throughput": 27003.6, "total_tokens": 2398961536} +{"current_steps": 8920, "total_steps": 25209, "loss": 0.9756, "lr": 3.6351381104265304e-05, "epoch": 1.0615261032228314, "percentage": 35.38, "elapsed_time": "1 day, 0:42:22", "remaining_time": "1 day, 21:06:59", "throughput": 27002.54, "total_tokens": 2401662720} +{"current_steps": 8930, "total_steps": 25209, "loss": 0.9841, "lr": 3.634177780155783e-05, "epoch": 1.0627161632464837, "percentage": 35.42, "elapsed_time": "1 day, 0:44:13", "remaining_time": "1 day, 21:05:40", "throughput": 26999.1, "total_tokens": 2404356800} +{"current_steps": 8940, "total_steps": 25209, "loss": 0.9773, "lr": 3.633218210582867e-05, "epoch": 1.0639062232701362, "percentage": 35.46, "elapsed_time": "1 day, 0:46:09", "remaining_time": "1 day, 21:04:29", "throughput": 26994.08, "total_tokens": 2407036352} +{"current_steps": 8950, "total_steps": 25209, "loss": 0.9674, "lr": 3.6322594007040376e-05, "epoch": 1.0650962832937887, "percentage": 35.5, "elapsed_time": "1 day, 0:48:06", "remaining_time": "1 day, 21:03:22", "throughput": 26989.71, "total_tokens": 2409819136} +{"current_steps": 8960, "total_steps": 25209, "loss": 0.9742, "lr": 3.631301349517403e-05, "epoch": 1.066286343317441, "percentage": 35.54, "elapsed_time": "1 day, 0:49:57", "remaining_time": "1 day, 21:02:02", "throughput": 26985.9, "total_tokens": 2412472128} +{"current_steps": 8970, "total_steps": 25209, "loss": 0.9792, "lr": 3.6303440560229216e-05, "epoch": 1.0674764033410935, "percentage": 35.58, "elapsed_time": "1 day, 0:51:38", "remaining_time": "1 day, 21:00:24", "throughput": 26985.67, "total_tokens": 2415172800} +{"current_steps": 8980, "total_steps": 25209, "loss": 0.9745, "lr": 3.629387519222395e-05, "epoch": 1.068666463364746, "percentage": 35.62, "elapsed_time": "1 day, 0:53:21", "remaining_time": "1 day, 20:58:50", "throughput": 26984.53, "total_tokens": 2417845888} +{"current_steps": 8990, "total_steps": 25209, "loss": 0.9732, "lr": 3.628431738119464e-05, "epoch": 1.0698565233883983, "percentage": 35.66, "elapsed_time": "1 day, 0:55:13", "remaining_time": "1 day, 20:57:33", "throughput": 26980.99, "total_tokens": 2420558080} +{"current_steps": 9000, "total_steps": 25209, "loss": 0.9783, "lr": 3.62747671171961e-05, "epoch": 1.0710465834120508, "percentage": 35.7, "elapsed_time": "1 day, 0:57:00", "remaining_time": "1 day, 20:56:06", "throughput": 26978.3, "total_tokens": 2423197376} +{"current_steps": 9010, "total_steps": 25209, "loss": 0.9733, "lr": 3.626522439030138e-05, "epoch": 1.0722366434357034, "percentage": 35.74, "elapsed_time": "1 day, 0:58:40", "remaining_time": "1 day, 20:54:27", "throughput": 26977.97, "total_tokens": 2425871168} +{"current_steps": 9020, "total_steps": 25209, "loss": 0.9825, "lr": 3.6255689190601863e-05, "epoch": 1.0734267034593556, "percentage": 35.78, "elapsed_time": "1 day, 1:00:30", "remaining_time": "1 day, 20:53:05", "throughput": 26974.13, "total_tokens": 2428489024} +{"current_steps": 9030, "total_steps": 25209, "loss": 0.9747, "lr": 3.624616150820714e-05, "epoch": 1.0746167634830082, "percentage": 35.82, "elapsed_time": "1 day, 1:02:10", "remaining_time": "1 day, 20:51:25", "throughput": 26973.74, "total_tokens": 2431144320} +{"current_steps": 9040, "total_steps": 25209, "loss": 0.9736, "lr": 3.623664133324499e-05, "epoch": 1.0758068235066607, "percentage": 35.86, "elapsed_time": "1 day, 1:03:51", "remaining_time": "1 day, 20:49:48", "throughput": 26973.29, "total_tokens": 2433832256} +{"current_steps": 9050, "total_steps": 25209, "loss": 0.978, "lr": 3.622712865586131e-05, "epoch": 1.076996883530313, "percentage": 35.9, "elapsed_time": "1 day, 1:05:32", "remaining_time": "1 day, 20:48:10", "throughput": 26973.05, "total_tokens": 2436530368} +{"current_steps": 9060, "total_steps": 25209, "loss": 0.9719, "lr": 3.621762346622014e-05, "epoch": 1.0781869435539655, "percentage": 35.94, "elapsed_time": "1 day, 1:07:13", "remaining_time": "1 day, 20:46:32", "throughput": 26972.44, "total_tokens": 2439200896} +{"current_steps": 9070, "total_steps": 25209, "loss": 0.9854, "lr": 3.620812575450352e-05, "epoch": 1.079377003577618, "percentage": 35.98, "elapsed_time": "1 day, 1:09:06", "remaining_time": "1 day, 20:45:16", "throughput": 26968.0, "total_tokens": 2441857664} +{"current_steps": 9080, "total_steps": 25209, "loss": 0.9708, "lr": 3.6198635510911556e-05, "epoch": 1.0805670636012703, "percentage": 36.02, "elapsed_time": "1 day, 1:11:06", "remaining_time": "1 day, 20:44:13", "throughput": 26961.29, "total_tokens": 2444497856} +{"current_steps": 9090, "total_steps": 25209, "loss": 0.9774, "lr": 3.618915272566228e-05, "epoch": 1.0817571236249228, "percentage": 36.06, "elapsed_time": "1 day, 1:12:53", "remaining_time": "1 day, 20:42:46", "throughput": 26958.58, "total_tokens": 2447137024} +{"current_steps": 9100, "total_steps": 25209, "loss": 0.9825, "lr": 3.6179677388991694e-05, "epoch": 1.0829471836485753, "percentage": 36.1, "elapsed_time": "1 day, 1:14:46", "remaining_time": "1 day, 20:41:28", "throughput": 26954.77, "total_tokens": 2449813824} +{"current_steps": 9110, "total_steps": 25209, "loss": 0.9808, "lr": 3.617020949115366e-05, "epoch": 1.0841372436722276, "percentage": 36.14, "elapsed_time": "1 day, 1:16:26", "remaining_time": "1 day, 20:39:48", "throughput": 26954.15, "total_tokens": 2452453120} +{"current_steps": 9120, "total_steps": 25209, "loss": 0.9656, "lr": 3.6160749022419886e-05, "epoch": 1.0853273036958802, "percentage": 36.18, "elapsed_time": "1 day, 1:18:06", "remaining_time": "1 day, 20:38:09", "throughput": 26953.69, "total_tokens": 2455108032} +{"current_steps": 9130, "total_steps": 25209, "loss": 0.9931, "lr": 3.6151295973079887e-05, "epoch": 1.0865173637195327, "percentage": 36.22, "elapsed_time": "1 day, 1:19:49", "remaining_time": "1 day, 20:36:35", "throughput": 26952.84, "total_tokens": 2457820480} +{"current_steps": 9140, "total_steps": 25209, "loss": 0.9762, "lr": 3.6141850333440934e-05, "epoch": 1.087707423743185, "percentage": 36.26, "elapsed_time": "1 day, 1:21:46", "remaining_time": "1 day, 20:35:25", "throughput": 26948.62, "total_tokens": 2460579392} +{"current_steps": 9150, "total_steps": 25209, "loss": 0.9655, "lr": 3.613241209382803e-05, "epoch": 1.0888974837668375, "percentage": 36.3, "elapsed_time": "1 day, 1:23:36", "remaining_time": "1 day, 20:34:02", "throughput": 26946.12, "total_tokens": 2463307008} +{"current_steps": 9160, "total_steps": 25209, "loss": 0.9704, "lr": 3.6122981244583834e-05, "epoch": 1.09008754379049, "percentage": 36.34, "elapsed_time": "1 day, 1:25:26", "remaining_time": "1 day, 20:32:41", "throughput": 26942.82, "total_tokens": 2465991360} +{"current_steps": 9170, "total_steps": 25209, "loss": 0.9778, "lr": 3.6113557776068644e-05, "epoch": 1.0912776038141423, "percentage": 36.38, "elapsed_time": "1 day, 1:27:19", "remaining_time": "1 day, 20:31:23", "throughput": 26939.97, "total_tokens": 2468754176} +{"current_steps": 9180, "total_steps": 25209, "loss": 0.9864, "lr": 3.6104141678660386e-05, "epoch": 1.0924676638377948, "percentage": 36.42, "elapsed_time": "1 day, 1:29:01", "remaining_time": "1 day, 20:29:48", "throughput": 26938.47, "total_tokens": 2471383296} +{"current_steps": 9190, "total_steps": 25209, "loss": 0.9872, "lr": 3.6094732942754487e-05, "epoch": 1.0936577238614473, "percentage": 36.46, "elapsed_time": "1 day, 1:30:41", "remaining_time": "1 day, 20:28:08", "throughput": 26938.36, "total_tokens": 2474064256} +{"current_steps": 9200, "total_steps": 25209, "loss": 0.9696, "lr": 3.60853315587639e-05, "epoch": 1.0948477838850996, "percentage": 36.49, "elapsed_time": "1 day, 1:32:23", "remaining_time": "1 day, 20:26:32", "throughput": 26938.09, "total_tokens": 2476788800} +{"current_steps": 9210, "total_steps": 25209, "loss": 0.9797, "lr": 3.607593751711909e-05, "epoch": 1.0960378439087521, "percentage": 36.53, "elapsed_time": "1 day, 1:34:05", "remaining_time": "1 day, 20:24:55", "throughput": 26937.62, "total_tokens": 2479488832} +{"current_steps": 9220, "total_steps": 25209, "loss": 0.9783, "lr": 3.60665508082679e-05, "epoch": 1.0972279039324047, "percentage": 36.57, "elapsed_time": "1 day, 1:35:48", "remaining_time": "1 day, 20:23:20", "throughput": 26936.99, "total_tokens": 2482198272} +{"current_steps": 9230, "total_steps": 25209, "loss": 0.9766, "lr": 3.6057171422675585e-05, "epoch": 1.098417963956057, "percentage": 36.61, "elapsed_time": "1 day, 1:37:36", "remaining_time": "1 day, 20:21:54", "throughput": 26935.06, "total_tokens": 2484934912} +{"current_steps": 9240, "total_steps": 25209, "loss": 0.9643, "lr": 3.604779935082474e-05, "epoch": 1.0996080239797095, "percentage": 36.65, "elapsed_time": "1 day, 1:39:30", "remaining_time": "1 day, 20:20:38", "throughput": 26930.99, "total_tokens": 2487617728} +{"current_steps": 9250, "total_steps": 25209, "loss": 0.9727, "lr": 3.603843458321526e-05, "epoch": 1.100798084003362, "percentage": 36.69, "elapsed_time": "1 day, 1:41:30", "remaining_time": "1 day, 20:19:33", "throughput": 26925.13, "total_tokens": 2490317824} +{"current_steps": 9260, "total_steps": 25209, "loss": 0.9712, "lr": 3.6029077110364355e-05, "epoch": 1.1019881440270143, "percentage": 36.73, "elapsed_time": "1 day, 1:43:21", "remaining_time": "1 day, 20:18:12", "throughput": 26922.09, "total_tokens": 2493019648} +{"current_steps": 9270, "total_steps": 25209, "loss": 0.9677, "lr": 3.60197269228064e-05, "epoch": 1.1031782040506668, "percentage": 36.77, "elapsed_time": "1 day, 1:45:10", "remaining_time": "1 day, 20:16:48", "throughput": 26919.09, "total_tokens": 2495682816} +{"current_steps": 9280, "total_steps": 25209, "loss": 0.9871, "lr": 3.601038401109299e-05, "epoch": 1.1043682640743193, "percentage": 36.81, "elapsed_time": "1 day, 1:46:51", "remaining_time": "1 day, 20:15:09", "throughput": 26918.56, "total_tokens": 2498346816} +{"current_steps": 9290, "total_steps": 25209, "loss": 0.9591, "lr": 3.6001048365792846e-05, "epoch": 1.1055583240979716, "percentage": 36.85, "elapsed_time": "1 day, 1:48:31", "remaining_time": "1 day, 20:13:29", "throughput": 26918.23, "total_tokens": 2501017344} +{"current_steps": 9300, "total_steps": 25209, "loss": 0.978, "lr": 3.599171997749182e-05, "epoch": 1.1067483841216241, "percentage": 36.89, "elapsed_time": "1 day, 1:50:13", "remaining_time": "1 day, 20:11:52", "throughput": 26917.89, "total_tokens": 2503718528} +{"current_steps": 9310, "total_steps": 25209, "loss": 0.979, "lr": 3.598239883679281e-05, "epoch": 1.1079384441452766, "percentage": 36.93, "elapsed_time": "1 day, 1:51:55", "remaining_time": "1 day, 20:10:16", "throughput": 26916.99, "total_tokens": 2506392960} +{"current_steps": 9320, "total_steps": 25209, "loss": 0.9877, "lr": 3.597308493431576e-05, "epoch": 1.109128504168929, "percentage": 36.97, "elapsed_time": "1 day, 1:53:36", "remaining_time": "1 day, 20:08:38", "throughput": 26916.74, "total_tokens": 2509087872} +{"current_steps": 9330, "total_steps": 25209, "loss": 0.987, "lr": 3.596377826069758e-05, "epoch": 1.1103185641925815, "percentage": 37.01, "elapsed_time": "1 day, 1:55:14", "remaining_time": "1 day, 20:06:54", "throughput": 26916.49, "total_tokens": 2511692032} +{"current_steps": 9340, "total_steps": 25209, "loss": 0.9959, "lr": 3.5954478806592155e-05, "epoch": 1.111508624216234, "percentage": 37.05, "elapsed_time": "1 day, 1:56:58", "remaining_time": "1 day, 20:05:20", "throughput": 26915.77, "total_tokens": 2514421568} +{"current_steps": 9350, "total_steps": 25209, "loss": 0.9767, "lr": 3.594518656267024e-05, "epoch": 1.1126986842398863, "percentage": 37.09, "elapsed_time": "1 day, 1:58:51", "remaining_time": "1 day, 20:04:04", "throughput": 26912.25, "total_tokens": 2517154944} +{"current_steps": 9360, "total_steps": 25209, "loss": 0.9826, "lr": 3.5935901519619496e-05, "epoch": 1.1138887442635388, "percentage": 37.13, "elapsed_time": "1 day, 2:00:40", "remaining_time": "1 day, 20:02:39", "throughput": 26909.37, "total_tokens": 2519818880} +{"current_steps": 9370, "total_steps": 25209, "loss": 0.9925, "lr": 3.5926623668144385e-05, "epoch": 1.1150788042871913, "percentage": 37.17, "elapsed_time": "1 day, 2:02:21", "remaining_time": "1 day, 20:00:59", "throughput": 26908.61, "total_tokens": 2522451136} +{"current_steps": 9380, "total_steps": 25209, "loss": 0.9834, "lr": 3.5917352998966194e-05, "epoch": 1.1162688643108436, "percentage": 37.21, "elapsed_time": "1 day, 2:04:01", "remaining_time": "1 day, 19:59:20", "throughput": 26908.59, "total_tokens": 2525153472} +{"current_steps": 9390, "total_steps": 25209, "loss": 0.9853, "lr": 3.5908089502822914e-05, "epoch": 1.1174589243344961, "percentage": 37.25, "elapsed_time": "1 day, 2:05:53", "remaining_time": "1 day, 19:58:00", "throughput": 26905.38, "total_tokens": 2527855936} +{"current_steps": 9400, "total_steps": 25209, "loss": 0.9884, "lr": 3.589883317046929e-05, "epoch": 1.1186489843581486, "percentage": 37.29, "elapsed_time": "1 day, 2:07:35", "remaining_time": "1 day, 19:56:23", "throughput": 26904.89, "total_tokens": 2530562048} +{"current_steps": 9410, "total_steps": 25209, "loss": 0.9835, "lr": 3.5889583992676715e-05, "epoch": 1.119839044381801, "percentage": 37.33, "elapsed_time": "1 day, 2:09:11", "remaining_time": "1 day, 19:54:37", "throughput": 26905.61, "total_tokens": 2533217152} +{"current_steps": 9420, "total_steps": 25209, "loss": 0.972, "lr": 3.5880341960233244e-05, "epoch": 1.1210291044054534, "percentage": 37.37, "elapsed_time": "1 day, 2:10:51", "remaining_time": "1 day, 19:52:56", "throughput": 26905.32, "total_tokens": 2535867648} +{"current_steps": 9430, "total_steps": 25209, "loss": 0.9766, "lr": 3.58711070639435e-05, "epoch": 1.122219164429106, "percentage": 37.41, "elapsed_time": "1 day, 2:12:41", "remaining_time": "1 day, 19:51:33", "throughput": 26901.91, "total_tokens": 2538507584} +{"current_steps": 9440, "total_steps": 25209, "loss": 0.9761, "lr": 3.586187929462869e-05, "epoch": 1.1234092244527583, "percentage": 37.45, "elapsed_time": "1 day, 2:14:37", "remaining_time": "1 day, 19:50:20", "throughput": 26897.83, "total_tokens": 2541251072} +{"current_steps": 9450, "total_steps": 25209, "loss": 0.9703, "lr": 3.585265864312651e-05, "epoch": 1.1245992844764108, "percentage": 37.49, "elapsed_time": "1 day, 2:16:35", "remaining_time": "1 day, 19:49:10", "throughput": 26892.33, "total_tokens": 2543905792} +{"current_steps": 9460, "total_steps": 25209, "loss": 0.975, "lr": 3.584344510029118e-05, "epoch": 1.1257893445000633, "percentage": 37.53, "elapsed_time": "1 day, 2:18:11", "remaining_time": "1 day, 19:47:22", "throughput": 26892.84, "total_tokens": 2546528704} +{"current_steps": 9470, "total_steps": 25209, "loss": 0.9832, "lr": 3.583423865699333e-05, "epoch": 1.1269794045237156, "percentage": 37.57, "elapsed_time": "1 day, 2:19:55", "remaining_time": "1 day, 19:45:48", "throughput": 26891.51, "total_tokens": 2549184256} +{"current_steps": 9480, "total_steps": 25209, "loss": 0.9735, "lr": 3.5825039304119994e-05, "epoch": 1.128169464547368, "percentage": 37.61, "elapsed_time": "1 day, 2:21:38", "remaining_time": "1 day, 19:44:14", "throughput": 26890.07, "total_tokens": 2551837888} +{"current_steps": 9490, "total_steps": 25209, "loss": 0.9735, "lr": 3.581584703257461e-05, "epoch": 1.1293595245710206, "percentage": 37.65, "elapsed_time": "1 day, 2:23:26", "remaining_time": "1 day, 19:42:46", "throughput": 26888.32, "total_tokens": 2554572544} +{"current_steps": 9500, "total_steps": 25209, "loss": 0.9663, "lr": 3.580666183327689e-05, "epoch": 1.130549584594673, "percentage": 37.68, "elapsed_time": "1 day, 2:25:11", "remaining_time": "1 day, 19:41:15", "throughput": 26887.1, "total_tokens": 2557286016} +{"current_steps": 9510, "total_steps": 25209, "loss": 0.9606, "lr": 3.5797483697162906e-05, "epoch": 1.1317396446183254, "percentage": 37.72, "elapsed_time": "1 day, 2:27:01", "remaining_time": "1 day, 19:39:50", "throughput": 26884.99, "total_tokens": 2560035648} +{"current_steps": 9520, "total_steps": 25209, "loss": 0.985, "lr": 3.5788312615184936e-05, "epoch": 1.132929704641978, "percentage": 37.76, "elapsed_time": "1 day, 2:28:44", "remaining_time": "1 day, 19:38:14", "throughput": 26884.03, "total_tokens": 2562695104} +{"current_steps": 9530, "total_steps": 25209, "loss": 0.9791, "lr": 3.5779148578311476e-05, "epoch": 1.1341197646656302, "percentage": 37.8, "elapsed_time": "1 day, 2:30:29", "remaining_time": "1 day, 19:36:42", "throughput": 26882.77, "total_tokens": 2565407104} +{"current_steps": 9540, "total_steps": 25209, "loss": 0.9783, "lr": 3.5769991577527236e-05, "epoch": 1.1353098246892828, "percentage": 37.84, "elapsed_time": "1 day, 2:32:20", "remaining_time": "1 day, 19:35:19", "throughput": 26880.19, "total_tokens": 2568134208} +{"current_steps": 9550, "total_steps": 25209, "loss": 0.9729, "lr": 3.5760841603833034e-05, "epoch": 1.1364998847129353, "percentage": 37.88, "elapsed_time": "1 day, 2:34:05", "remaining_time": "1 day, 19:33:47", "throughput": 26879.02, "total_tokens": 2570844608} +{"current_steps": 9560, "total_steps": 25209, "loss": 0.9726, "lr": 3.5751698648245814e-05, "epoch": 1.1376899447365876, "percentage": 37.92, "elapsed_time": "1 day, 2:35:49", "remaining_time": "1 day, 19:32:14", "throughput": 26877.84, "total_tokens": 2573539648} +{"current_steps": 9570, "total_steps": 25209, "loss": 0.9761, "lr": 3.574256270179857e-05, "epoch": 1.13888000476024, "percentage": 37.96, "elapsed_time": "1 day, 2:37:31", "remaining_time": "1 day, 19:30:36", "throughput": 26877.06, "total_tokens": 2576194304} +{"current_steps": 9580, "total_steps": 25209, "loss": 0.9777, "lr": 3.573343375554037e-05, "epoch": 1.1400700647838926, "percentage": 38.0, "elapsed_time": "1 day, 2:39:17", "remaining_time": "1 day, 19:29:07", "throughput": 26875.46, "total_tokens": 2578904768} +{"current_steps": 9590, "total_steps": 25209, "loss": 0.9679, "lr": 3.572431180053621e-05, "epoch": 1.141260124807545, "percentage": 38.04, "elapsed_time": "1 day, 2:41:05", "remaining_time": "1 day, 19:27:39", "throughput": 26872.77, "total_tokens": 2581548992} +{"current_steps": 9600, "total_steps": 25209, "loss": 0.9605, "lr": 3.571519682786711e-05, "epoch": 1.1424501848311974, "percentage": 38.08, "elapsed_time": "1 day, 2:42:51", "remaining_time": "1 day, 19:26:09", "throughput": 26871.13, "total_tokens": 2584243840} +{"current_steps": 9610, "total_steps": 25209, "loss": 0.9719, "lr": 3.570608882862996e-05, "epoch": 1.14364024485485, "percentage": 38.12, "elapsed_time": "1 day, 2:44:37", "remaining_time": "1 day, 19:24:38", "throughput": 26869.45, "total_tokens": 2586935424} +{"current_steps": 9620, "total_steps": 25209, "loss": 0.9754, "lr": 3.569698779393757e-05, "epoch": 1.1448303048785022, "percentage": 38.16, "elapsed_time": "1 day, 2:46:32", "remaining_time": "1 day, 19:23:22", "throughput": 26865.79, "total_tokens": 2589671744} +{"current_steps": 9630, "total_steps": 25209, "loss": 0.9784, "lr": 3.568789371491859e-05, "epoch": 1.1460203649021548, "percentage": 38.2, "elapsed_time": "1 day, 2:48:31", "remaining_time": "1 day, 19:22:11", "throughput": 26860.78, "total_tokens": 2592366784} +{"current_steps": 9640, "total_steps": 25209, "loss": 0.9774, "lr": 3.567880658271748e-05, "epoch": 1.1472104249258073, "percentage": 38.24, "elapsed_time": "1 day, 2:50:22", "remaining_time": "1 day, 19:20:49", "throughput": 26857.69, "total_tokens": 2595065856} +{"current_steps": 9650, "total_steps": 25209, "loss": 0.9824, "lr": 3.566972638849445e-05, "epoch": 1.1484004849494596, "percentage": 38.28, "elapsed_time": "1 day, 2:52:24", "remaining_time": "1 day, 19:19:43", "throughput": 26852.41, "total_tokens": 2597815616} +{"current_steps": 9660, "total_steps": 25209, "loss": 0.9938, "lr": 3.566065312342551e-05, "epoch": 1.149590544973112, "percentage": 38.32, "elapsed_time": "1 day, 2:54:06", "remaining_time": "1 day, 19:18:06", "throughput": 26851.51, "total_tokens": 2600474688} +{"current_steps": 9670, "total_steps": 25209, "loss": 0.9709, "lr": 3.565158677870231e-05, "epoch": 1.1507806049967646, "percentage": 38.36, "elapsed_time": "1 day, 2:55:49", "remaining_time": "1 day, 19:16:30", "throughput": 26850.75, "total_tokens": 2603155712} +{"current_steps": 9680, "total_steps": 25209, "loss": 0.988, "lr": 3.564252734553221e-05, "epoch": 1.151970665020417, "percentage": 38.4, "elapsed_time": "1 day, 2:57:29", "remaining_time": "1 day, 19:14:50", "throughput": 26850.37, "total_tokens": 2605811264} +{"current_steps": 9690, "total_steps": 25209, "loss": 0.9789, "lr": 3.563347481513818e-05, "epoch": 1.1531607250440694, "percentage": 38.44, "elapsed_time": "1 day, 2:59:12", "remaining_time": "1 day, 19:13:13", "throughput": 26849.62, "total_tokens": 2608495808} +{"current_steps": 9700, "total_steps": 25209, "loss": 0.9593, "lr": 3.56244291787588e-05, "epoch": 1.154350785067722, "percentage": 38.48, "elapsed_time": "1 day, 3:00:59", "remaining_time": "1 day, 19:11:44", "throughput": 26848.29, "total_tokens": 2611248640} +{"current_steps": 9710, "total_steps": 25209, "loss": 0.9817, "lr": 3.5615390427648216e-05, "epoch": 1.1555408450913742, "percentage": 38.52, "elapsed_time": "1 day, 3:02:36", "remaining_time": "1 day, 19:09:59", "throughput": 26848.5, "total_tokens": 2613878592} +{"current_steps": 9720, "total_steps": 25209, "loss": 0.9923, "lr": 3.5606358553076075e-05, "epoch": 1.1567309051150267, "percentage": 38.56, "elapsed_time": "1 day, 3:04:15", "remaining_time": "1 day, 19:08:17", "throughput": 26848.47, "total_tokens": 2616541184} +{"current_steps": 9730, "total_steps": 25209, "loss": 0.983, "lr": 3.5597333546327526e-05, "epoch": 1.1579209651386793, "percentage": 38.6, "elapsed_time": "1 day, 3:05:55", "remaining_time": "1 day, 19:06:36", "throughput": 26848.14, "total_tokens": 2619185088} +{"current_steps": 9740, "total_steps": 25209, "loss": 0.9895, "lr": 3.5588315398703186e-05, "epoch": 1.1591110251623316, "percentage": 38.64, "elapsed_time": "1 day, 3:07:37", "remaining_time": "1 day, 19:04:59", "throughput": 26847.71, "total_tokens": 2621882432} +{"current_steps": 9750, "total_steps": 25209, "loss": 0.9688, "lr": 3.557930410151907e-05, "epoch": 1.160301085185984, "percentage": 38.68, "elapsed_time": "1 day, 3:09:15", "remaining_time": "1 day, 19:03:15", "throughput": 26847.97, "total_tokens": 2624536896} +{"current_steps": 9760, "total_steps": 25209, "loss": 0.9705, "lr": 3.5570299646106606e-05, "epoch": 1.1614911452096366, "percentage": 38.72, "elapsed_time": "1 day, 3:10:55", "remaining_time": "1 day, 19:01:34", "throughput": 26848.09, "total_tokens": 2627226816} +{"current_steps": 9770, "total_steps": 25209, "loss": 0.9775, "lr": 3.556130202381253e-05, "epoch": 1.1626812052332889, "percentage": 38.76, "elapsed_time": "1 day, 3:12:36", "remaining_time": "1 day, 18:59:56", "throughput": 26847.59, "total_tokens": 2629907584} +{"current_steps": 9780, "total_steps": 25209, "loss": 0.9681, "lr": 3.555231122599892e-05, "epoch": 1.1638712652569414, "percentage": 38.8, "elapsed_time": "1 day, 3:14:24", "remaining_time": "1 day, 18:58:27", "throughput": 26845.86, "total_tokens": 2632626112} +{"current_steps": 9790, "total_steps": 25209, "loss": 0.9808, "lr": 3.554332724404313e-05, "epoch": 1.165061325280594, "percentage": 38.84, "elapsed_time": "1 day, 3:16:07", "remaining_time": "1 day, 18:56:51", "throughput": 26844.86, "total_tokens": 2635293952} +{"current_steps": 9800, "total_steps": 25209, "loss": 0.9676, "lr": 3.553435006933777e-05, "epoch": 1.1662513853042462, "percentage": 38.88, "elapsed_time": "1 day, 3:17:51", "remaining_time": "1 day, 18:55:17", "throughput": 26843.65, "total_tokens": 2637975424} +{"current_steps": 9810, "total_steps": 25209, "loss": 0.9835, "lr": 3.5525379693290626e-05, "epoch": 1.1674414453278987, "percentage": 38.91, "elapsed_time": "1 day, 3:19:33", "remaining_time": "1 day, 18:53:38", "throughput": 26843.15, "total_tokens": 2640646912} +{"current_steps": 9820, "total_steps": 25209, "loss": 0.9776, "lr": 3.551641610732469e-05, "epoch": 1.1686315053515512, "percentage": 38.95, "elapsed_time": "1 day, 3:21:16", "remaining_time": "1 day, 18:52:02", "throughput": 26842.38, "total_tokens": 2643337792} +{"current_steps": 9830, "total_steps": 25209, "loss": 0.9694, "lr": 3.55074593028781e-05, "epoch": 1.1698215653752035, "percentage": 38.99, "elapsed_time": "1 day, 3:22:57", "remaining_time": "1 day, 18:50:23", "throughput": 26842.03, "total_tokens": 2646014784} +{"current_steps": 9840, "total_steps": 25209, "loss": 0.9626, "lr": 3.5498509271404065e-05, "epoch": 1.171011625398856, "percentage": 39.03, "elapsed_time": "1 day, 3:24:37", "remaining_time": "1 day, 18:48:43", "throughput": 26841.71, "total_tokens": 2648681216} +{"current_steps": 9850, "total_steps": 25209, "loss": 0.9763, "lr": 3.5489566004370893e-05, "epoch": 1.1722016854225086, "percentage": 39.07, "elapsed_time": "1 day, 3:26:17", "remaining_time": "1 day, 18:47:02", "throughput": 26841.2, "total_tokens": 2651298048} +{"current_steps": 9860, "total_steps": 25209, "loss": 0.9798, "lr": 3.548062949326194e-05, "epoch": 1.1733917454461609, "percentage": 39.11, "elapsed_time": "1 day, 3:28:00", "remaining_time": "1 day, 18:45:26", "throughput": 26840.69, "total_tokens": 2654024128} +{"current_steps": 9870, "total_steps": 25209, "loss": 0.9728, "lr": 3.547169972957554e-05, "epoch": 1.1745818054698134, "percentage": 39.15, "elapsed_time": "1 day, 3:29:44", "remaining_time": "1 day, 18:43:52", "throughput": 26839.98, "total_tokens": 2656741056} +{"current_steps": 9880, "total_steps": 25209, "loss": 0.9781, "lr": 3.5462776704825e-05, "epoch": 1.175771865493466, "percentage": 39.19, "elapsed_time": "1 day, 3:31:23", "remaining_time": "1 day, 18:42:09", "throughput": 26839.76, "total_tokens": 2659364928} +{"current_steps": 9890, "total_steps": 25209, "loss": 0.9619, "lr": 3.5453860410538594e-05, "epoch": 1.1769619255171182, "percentage": 39.23, "elapsed_time": "1 day, 3:33:04", "remaining_time": "1 day, 18:40:30", "throughput": 26839.36, "total_tokens": 2662046976} +{"current_steps": 9900, "total_steps": 25209, "loss": 0.9919, "lr": 3.5444950838259455e-05, "epoch": 1.1781519855407707, "percentage": 39.27, "elapsed_time": "1 day, 3:34:49", "remaining_time": "1 day, 18:38:57", "throughput": 26838.26, "total_tokens": 2664752960} +{"current_steps": 9910, "total_steps": 25209, "loss": 0.9757, "lr": 3.543604797954563e-05, "epoch": 1.1793420455644232, "percentage": 39.31, "elapsed_time": "1 day, 3:36:35", "remaining_time": "1 day, 18:37:25", "throughput": 26837.16, "total_tokens": 2667480704} +{"current_steps": 9920, "total_steps": 25209, "loss": 0.966, "lr": 3.542715182596996e-05, "epoch": 1.1805321055880755, "percentage": 39.35, "elapsed_time": "1 day, 3:38:17", "remaining_time": "1 day, 18:35:49", "throughput": 26836.58, "total_tokens": 2670181120} +{"current_steps": 9930, "total_steps": 25209, "loss": 0.9789, "lr": 3.5418262369120115e-05, "epoch": 1.181722165611728, "percentage": 39.39, "elapsed_time": "1 day, 3:40:04", "remaining_time": "1 day, 18:34:18", "throughput": 26835.41, "total_tokens": 2672933568} +{"current_steps": 9940, "total_steps": 25209, "loss": 0.9837, "lr": 3.5409379600598526e-05, "epoch": 1.1829122256353806, "percentage": 39.43, "elapsed_time": "1 day, 3:41:46", "remaining_time": "1 day, 18:32:40", "throughput": 26834.71, "total_tokens": 2675593664} +{"current_steps": 9950, "total_steps": 25209, "loss": 0.9797, "lr": 3.540050351202235e-05, "epoch": 1.1841022856590329, "percentage": 39.47, "elapsed_time": "1 day, 3:43:34", "remaining_time": "1 day, 18:31:11", "throughput": 26833.58, "total_tokens": 2678373248} +{"current_steps": 9960, "total_steps": 25209, "loss": 0.9724, "lr": 3.539163409502347e-05, "epoch": 1.1852923456826854, "percentage": 39.51, "elapsed_time": "1 day, 3:45:22", "remaining_time": "1 day, 18:29:43", "throughput": 26832.41, "total_tokens": 2681155904} +{"current_steps": 9970, "total_steps": 25209, "loss": 0.9829, "lr": 3.5382771341248416e-05, "epoch": 1.186482405706338, "percentage": 39.55, "elapsed_time": "1 day, 3:47:03", "remaining_time": "1 day, 18:28:05", "throughput": 26832.02, "total_tokens": 2683843136} +{"current_steps": 9980, "total_steps": 25209, "loss": 0.9789, "lr": 3.537391524235835e-05, "epoch": 1.1876724657299902, "percentage": 39.59, "elapsed_time": "1 day, 3:48:46", "remaining_time": "1 day, 18:26:27", "throughput": 26831.67, "total_tokens": 2686556608} +{"current_steps": 9990, "total_steps": 25209, "loss": 0.9661, "lr": 3.5365065790029055e-05, "epoch": 1.1888625257536427, "percentage": 39.63, "elapsed_time": "1 day, 3:50:27", "remaining_time": "1 day, 18:24:48", "throughput": 26831.46, "total_tokens": 2689244928} +{"current_steps": 10000, "total_steps": 25209, "loss": 0.9714, "lr": 3.535622297595087e-05, "epoch": 1.1900525857772952, "percentage": 39.67, "elapsed_time": "1 day, 3:52:09", "remaining_time": "1 day, 18:23:10", "throughput": 26830.87, "total_tokens": 2691916416} +{"current_steps": 10000, "total_steps": 25209, "eval_loss": 1.0167350769042969, "epoch": 1.1900525857772952, "percentage": 39.67, "elapsed_time": "1 day, 3:52:11", "remaining_time": "1 day, 18:23:13", "throughput": 26830.32, "total_tokens": 2691916416} +{"current_steps": 10010, "total_steps": 25209, "loss": 0.9775, "lr": 3.534738679182869e-05, "epoch": 1.1912426458009475, "percentage": 39.71, "elapsed_time": "1 day, 3:54:26", "remaining_time": "1 day, 18:22:26", "throughput": 26821.18, "total_tokens": 2694635328} +{"current_steps": 10020, "total_steps": 25209, "loss": 0.9866, "lr": 3.533855722938188e-05, "epoch": 1.1924327058246, "percentage": 39.75, "elapsed_time": "1 day, 3:56:11", "remaining_time": "1 day, 18:20:52", "throughput": 26820.17, "total_tokens": 2697334272} +{"current_steps": 10030, "total_steps": 25209, "loss": 0.9911, "lr": 3.5329734280344325e-05, "epoch": 1.1936227658482526, "percentage": 39.79, "elapsed_time": "1 day, 3:57:54", "remaining_time": "1 day, 18:19:16", "throughput": 26819.55, "total_tokens": 2700039104} +{"current_steps": 10040, "total_steps": 25209, "loss": 0.9787, "lr": 3.5320917936464294e-05, "epoch": 1.1948128258719048, "percentage": 39.83, "elapsed_time": "1 day, 3:59:34", "remaining_time": "1 day, 18:17:35", "throughput": 26819.22, "total_tokens": 2702692160} +{"current_steps": 10050, "total_steps": 25209, "loss": 0.9822, "lr": 3.5312108189504505e-05, "epoch": 1.1960028858955574, "percentage": 39.87, "elapsed_time": "1 day, 4:01:14", "remaining_time": "1 day, 18:15:55", "throughput": 26818.97, "total_tokens": 2705357248} +{"current_steps": 10060, "total_steps": 25209, "loss": 0.9819, "lr": 3.530330503124204e-05, "epoch": 1.1971929459192099, "percentage": 39.91, "elapsed_time": "1 day, 4:02:56", "remaining_time": "1 day, 18:14:17", "throughput": 26818.52, "total_tokens": 2708041792} +{"current_steps": 10070, "total_steps": 25209, "loss": 0.9656, "lr": 3.5294508453468325e-05, "epoch": 1.1983830059428622, "percentage": 39.95, "elapsed_time": "1 day, 4:04:35", "remaining_time": "1 day, 18:12:35", "throughput": 26818.38, "total_tokens": 2710691328} +{"current_steps": 10080, "total_steps": 25209, "loss": 0.973, "lr": 3.528571844798908e-05, "epoch": 1.1995730659665147, "percentage": 39.99, "elapsed_time": "1 day, 4:06:16", "remaining_time": "1 day, 18:10:55", "throughput": 26818.39, "total_tokens": 2713403200} +{"current_steps": 10090, "total_steps": 25209, "loss": 0.987, "lr": 3.527693500662431e-05, "epoch": 1.2007631259901672, "percentage": 40.03, "elapsed_time": "1 day, 4:07:55", "remaining_time": "1 day, 18:09:13", "throughput": 26818.45, "total_tokens": 2716061824} +{"current_steps": 10100, "total_steps": 25209, "loss": 0.9786, "lr": 3.5268158121208294e-05, "epoch": 1.2019531860138195, "percentage": 40.07, "elapsed_time": "1 day, 4:09:34", "remaining_time": "1 day, 18:07:30", "throughput": 26818.87, "total_tokens": 2718746176} +{"current_steps": 10110, "total_steps": 25209, "loss": 0.9609, "lr": 3.525938778358949e-05, "epoch": 1.203143246037472, "percentage": 40.1, "elapsed_time": "1 day, 4:11:21", "remaining_time": "1 day, 18:06:00", "throughput": 26817.22, "total_tokens": 2721457536} +{"current_steps": 10120, "total_steps": 25209, "loss": 0.9816, "lr": 3.5250623985630537e-05, "epoch": 1.2043333060611245, "percentage": 40.14, "elapsed_time": "1 day, 4:13:03", "remaining_time": "1 day, 18:04:22", "throughput": 26816.68, "total_tokens": 2724138368} +{"current_steps": 10130, "total_steps": 25209, "loss": 0.9878, "lr": 3.524186671920826e-05, "epoch": 1.2055233660847768, "percentage": 40.18, "elapsed_time": "1 day, 4:14:46", "remaining_time": "1 day, 18:02:44", "throughput": 26816.24, "total_tokens": 2726839424} +{"current_steps": 10140, "total_steps": 25209, "loss": 0.9721, "lr": 3.523311597621358e-05, "epoch": 1.2067134261084294, "percentage": 40.22, "elapsed_time": "1 day, 4:16:28", "remaining_time": "1 day, 18:01:07", "throughput": 26815.35, "total_tokens": 2729504000} +{"current_steps": 10150, "total_steps": 25209, "loss": 0.9737, "lr": 3.5224371748551505e-05, "epoch": 1.2079034861320819, "percentage": 40.26, "elapsed_time": "1 day, 4:18:08", "remaining_time": "1 day, 17:59:27", "throughput": 26815.25, "total_tokens": 2732178176} +{"current_steps": 10160, "total_steps": 25209, "loss": 0.971, "lr": 3.521563402814109e-05, "epoch": 1.2090935461557342, "percentage": 40.3, "elapsed_time": "1 day, 4:19:55", "remaining_time": "1 day, 17:57:55", "throughput": 26814.16, "total_tokens": 2734925312} +{"current_steps": 10170, "total_steps": 25209, "loss": 0.9703, "lr": 3.5206902806915436e-05, "epoch": 1.2102836061793867, "percentage": 40.34, "elapsed_time": "1 day, 4:21:32", "remaining_time": "1 day, 17:56:10", "throughput": 26814.75, "total_tokens": 2737589504} +{"current_steps": 10180, "total_steps": 25209, "loss": 0.9888, "lr": 3.5198178076821644e-05, "epoch": 1.2114736662030392, "percentage": 40.38, "elapsed_time": "1 day, 4:23:11", "remaining_time": "1 day, 17:54:27", "throughput": 26815.07, "total_tokens": 2740269120} +{"current_steps": 10190, "total_steps": 25209, "loss": 0.9832, "lr": 3.5189459829820743e-05, "epoch": 1.2126637262266915, "percentage": 40.42, "elapsed_time": "1 day, 4:24:55", "remaining_time": "1 day, 17:52:53", "throughput": 26814.41, "total_tokens": 2743000640} +{"current_steps": 10200, "total_steps": 25209, "loss": 0.9821, "lr": 3.5180748057887714e-05, "epoch": 1.213853786250344, "percentage": 40.46, "elapsed_time": "1 day, 4:26:37", "remaining_time": "1 day, 17:51:15", "throughput": 26814.01, "total_tokens": 2745690368} +{"current_steps": 10210, "total_steps": 25209, "loss": 0.974, "lr": 3.517204275301144e-05, "epoch": 1.2150438462739965, "percentage": 40.5, "elapsed_time": "1 day, 4:28:17", "remaining_time": "1 day, 17:49:33", "throughput": 26813.93, "total_tokens": 2748361152} +{"current_steps": 10220, "total_steps": 25209, "loss": 0.9717, "lr": 3.5163343907194676e-05, "epoch": 1.2162339062976488, "percentage": 40.54, "elapsed_time": "1 day, 4:29:59", "remaining_time": "1 day, 17:47:56", "throughput": 26813.71, "total_tokens": 2751077888} +{"current_steps": 10230, "total_steps": 25209, "loss": 0.9731, "lr": 3.5154651512453995e-05, "epoch": 1.2174239663213013, "percentage": 40.58, "elapsed_time": "1 day, 4:31:40", "remaining_time": "1 day, 17:46:17", "throughput": 26813.54, "total_tokens": 2753775360} +{"current_steps": 10240, "total_steps": 25209, "loss": 0.9641, "lr": 3.514596556081981e-05, "epoch": 1.2186140263449539, "percentage": 40.62, "elapsed_time": "1 day, 4:33:18", "remaining_time": "1 day, 17:44:32", "throughput": 26813.87, "total_tokens": 2756426752} +{"current_steps": 10250, "total_steps": 25209, "loss": 0.9733, "lr": 3.513728604433628e-05, "epoch": 1.2198040863686062, "percentage": 40.66, "elapsed_time": "1 day, 4:35:00", "remaining_time": "1 day, 17:42:54", "throughput": 26813.8, "total_tokens": 2759155008} +{"current_steps": 10260, "total_steps": 25209, "loss": 0.9755, "lr": 3.5128612955061334e-05, "epoch": 1.2209941463922587, "percentage": 40.7, "elapsed_time": "1 day, 4:36:40", "remaining_time": "1 day, 17:41:14", "throughput": 26813.71, "total_tokens": 2761835520} +{"current_steps": 10270, "total_steps": 25209, "loss": 0.9872, "lr": 3.5119946285066595e-05, "epoch": 1.2221842064159112, "percentage": 40.74, "elapsed_time": "1 day, 4:38:28", "remaining_time": "1 day, 17:39:44", "throughput": 26812.49, "total_tokens": 2764592320} +{"current_steps": 10280, "total_steps": 25209, "loss": 0.9949, "lr": 3.511128602643739e-05, "epoch": 1.2233742664395635, "percentage": 40.78, "elapsed_time": "1 day, 4:40:10", "remaining_time": "1 day, 17:38:06", "throughput": 26811.71, "total_tokens": 2767260416} +{"current_steps": 10290, "total_steps": 25209, "loss": 0.9814, "lr": 3.510263217127269e-05, "epoch": 1.224564326463216, "percentage": 40.82, "elapsed_time": "1 day, 4:41:50", "remaining_time": "1 day, 17:36:24", "throughput": 26811.7, "total_tokens": 2769924096} +{"current_steps": 10300, "total_steps": 25209, "loss": 0.9652, "lr": 3.50939847116851e-05, "epoch": 1.2257543864868685, "percentage": 40.86, "elapsed_time": "1 day, 4:43:32", "remaining_time": "1 day, 17:34:46", "throughput": 26811.09, "total_tokens": 2772596672} +{"current_steps": 10310, "total_steps": 25209, "loss": 0.9679, "lr": 3.508534363980081e-05, "epoch": 1.2269444465105208, "percentage": 40.9, "elapsed_time": "1 day, 4:45:09", "remaining_time": "1 day, 17:33:01", "throughput": 26811.32, "total_tokens": 2775227200} +{"current_steps": 10320, "total_steps": 25209, "loss": 0.978, "lr": 3.507670894775958e-05, "epoch": 1.2281345065341733, "percentage": 40.94, "elapsed_time": "1 day, 4:46:49", "remaining_time": "1 day, 17:31:21", "throughput": 26811.36, "total_tokens": 2777924800} +{"current_steps": 10330, "total_steps": 25209, "loss": 0.9773, "lr": 3.506808062771471e-05, "epoch": 1.2293245665578258, "percentage": 40.98, "elapsed_time": "1 day, 4:48:30", "remaining_time": "1 day, 17:29:41", "throughput": 26811.33, "total_tokens": 2780616768} +{"current_steps": 10340, "total_steps": 25209, "loss": 0.9756, "lr": 3.505945867183298e-05, "epoch": 1.2305146265814781, "percentage": 41.02, "elapsed_time": "1 day, 4:50:11", "remaining_time": "1 day, 17:28:01", "throughput": 26811.33, "total_tokens": 2783327488} +{"current_steps": 10350, "total_steps": 25209, "loss": 0.966, "lr": 3.505084307229468e-05, "epoch": 1.2317046866051307, "percentage": 41.06, "elapsed_time": "1 day, 4:51:59", "remaining_time": "1 day, 17:26:32", "throughput": 26809.65, "total_tokens": 2786043712} +{"current_steps": 10360, "total_steps": 25209, "loss": 0.9751, "lr": 3.5042233821293525e-05, "epoch": 1.2328947466287832, "percentage": 41.1, "elapsed_time": "1 day, 4:53:51", "remaining_time": "1 day, 17:25:08", "throughput": 26806.73, "total_tokens": 2788737984} +{"current_steps": 10370, "total_steps": 25209, "loss": 0.9716, "lr": 3.503363091103664e-05, "epoch": 1.2340848066524355, "percentage": 41.14, "elapsed_time": "1 day, 4:55:34", "remaining_time": "1 day, 17:23:31", "throughput": 26806.12, "total_tokens": 2791443456} +{"current_steps": 10380, "total_steps": 25209, "loss": 0.9903, "lr": 3.5025034333744545e-05, "epoch": 1.235274866676088, "percentage": 41.18, "elapsed_time": "1 day, 4:57:23", "remaining_time": "1 day, 17:22:04", "throughput": 26804.12, "total_tokens": 2794166208} +{"current_steps": 10390, "total_steps": 25209, "loss": 0.9734, "lr": 3.501644408165112e-05, "epoch": 1.2364649266997405, "percentage": 41.22, "elapsed_time": "1 day, 4:59:07", "remaining_time": "1 day, 17:20:28", "throughput": 26803.33, "total_tokens": 2796859072} +{"current_steps": 10400, "total_steps": 25209, "loss": 0.9953, "lr": 3.500786014700357e-05, "epoch": 1.2376549867233928, "percentage": 41.26, "elapsed_time": "1 day, 5:00:47", "remaining_time": "1 day, 17:18:47", "throughput": 26803.2, "total_tokens": 2799537088} +{"current_steps": 10410, "total_steps": 25209, "loss": 0.9823, "lr": 3.499928252206237e-05, "epoch": 1.2388450467470453, "percentage": 41.29, "elapsed_time": "1 day, 5:02:28", "remaining_time": "1 day, 17:17:07", "throughput": 26803.12, "total_tokens": 2802225152} +{"current_steps": 10420, "total_steps": 25209, "loss": 0.9838, "lr": 3.499071119910131e-05, "epoch": 1.2400351067706978, "percentage": 41.33, "elapsed_time": "1 day, 5:04:11", "remaining_time": "1 day, 17:15:30", "throughput": 26803.1, "total_tokens": 2804979648} +{"current_steps": 10430, "total_steps": 25209, "loss": 0.9673, "lr": 3.498214617040739e-05, "epoch": 1.2412251667943501, "percentage": 41.37, "elapsed_time": "1 day, 5:05:50", "remaining_time": "1 day, 17:13:48", "throughput": 26802.88, "total_tokens": 2807619840} +{"current_steps": 10440, "total_steps": 25209, "loss": 0.9755, "lr": 3.49735874282808e-05, "epoch": 1.2424152268180026, "percentage": 41.41, "elapsed_time": "1 day, 5:07:30", "remaining_time": "1 day, 17:12:06", "throughput": 26803.05, "total_tokens": 2810307136} +{"current_steps": 10450, "total_steps": 25209, "loss": 0.9704, "lr": 3.4965034965034965e-05, "epoch": 1.2436052868416552, "percentage": 41.45, "elapsed_time": "1 day, 5:09:17", "remaining_time": "1 day, 17:10:36", "throughput": 26801.93, "total_tokens": 2813066176} +{"current_steps": 10460, "total_steps": 25209, "loss": 0.9661, "lr": 3.495648877299642e-05, "epoch": 1.2447953468653075, "percentage": 41.49, "elapsed_time": "1 day, 5:10:57", "remaining_time": "1 day, 17:08:55", "throughput": 26802.09, "total_tokens": 2815762432} +{"current_steps": 10470, "total_steps": 25209, "loss": 0.9792, "lr": 3.494794884450483e-05, "epoch": 1.24598540688896, "percentage": 41.53, "elapsed_time": "1 day, 5:12:41", "remaining_time": "1 day, 17:07:19", "throughput": 26801.22, "total_tokens": 2818445248} +{"current_steps": 10480, "total_steps": 25209, "loss": 0.9903, "lr": 3.4939415171912954e-05, "epoch": 1.2471754669126125, "percentage": 41.57, "elapsed_time": "1 day, 5:14:23", "remaining_time": "1 day, 17:05:41", "throughput": 26800.77, "total_tokens": 2821152320} +{"current_steps": 10490, "total_steps": 25209, "loss": 0.9928, "lr": 3.4930887747586616e-05, "epoch": 1.2483655269362648, "percentage": 41.61, "elapsed_time": "1 day, 5:16:02", "remaining_time": "1 day, 17:03:58", "throughput": 26800.87, "total_tokens": 2823800384} +{"current_steps": 10500, "total_steps": 25209, "loss": 0.9634, "lr": 3.492236656390469e-05, "epoch": 1.2495555869599173, "percentage": 41.65, "elapsed_time": "1 day, 5:17:39", "remaining_time": "1 day, 17:02:13", "throughput": 26801.65, "total_tokens": 2826476352} +{"current_steps": 10510, "total_steps": 25209, "loss": 0.973, "lr": 3.4913851613259034e-05, "epoch": 1.2507456469835696, "percentage": 41.69, "elapsed_time": "1 day, 5:19:21", "remaining_time": "1 day, 17:00:35", "throughput": 26801.38, "total_tokens": 2829198272} +{"current_steps": 10520, "total_steps": 25209, "loss": 0.9621, "lr": 3.490534288805452e-05, "epoch": 1.2519357070072221, "percentage": 41.73, "elapsed_time": "1 day, 5:21:02", "remaining_time": "1 day, 16:58:56", "throughput": 26801.27, "total_tokens": 2831898368} +{"current_steps": 10530, "total_steps": 25209, "loss": 0.9766, "lr": 3.489684038070891e-05, "epoch": 1.2531257670308746, "percentage": 41.77, "elapsed_time": "1 day, 5:22:40", "remaining_time": "1 day, 16:57:11", "throughput": 26801.9, "total_tokens": 2834577472} +{"current_steps": 10540, "total_steps": 25209, "loss": 0.9898, "lr": 3.488834408365296e-05, "epoch": 1.2543158270545272, "percentage": 41.81, "elapsed_time": "1 day, 5:24:18", "remaining_time": "1 day, 16:55:27", "throughput": 26802.37, "total_tokens": 2837256384} +{"current_steps": 10550, "total_steps": 25209, "loss": 0.9672, "lr": 3.487985398933027e-05, "epoch": 1.2555058870781795, "percentage": 41.85, "elapsed_time": "1 day, 5:25:56", "remaining_time": "1 day, 16:53:44", "throughput": 26802.77, "total_tokens": 2839936256} +{"current_steps": 10560, "total_steps": 25209, "loss": 0.9709, "lr": 3.4871370090197324e-05, "epoch": 1.256695947101832, "percentage": 41.89, "elapsed_time": "1 day, 5:27:41", "remaining_time": "1 day, 16:52:10", "throughput": 26801.82, "total_tokens": 2842642240} +{"current_steps": 10570, "total_steps": 25209, "loss": 0.9794, "lr": 3.486289237872343e-05, "epoch": 1.2578860071254843, "percentage": 41.93, "elapsed_time": "1 day, 5:29:18", "remaining_time": "1 day, 16:50:25", "throughput": 26802.44, "total_tokens": 2845318784} +{"current_steps": 10580, "total_steps": 25209, "loss": 0.9719, "lr": 3.485442084739075e-05, "epoch": 1.2590760671491368, "percentage": 41.97, "elapsed_time": "1 day, 5:30:56", "remaining_time": "1 day, 16:48:41", "throughput": 26802.86, "total_tokens": 2847984960} +{"current_steps": 10590, "total_steps": 25209, "loss": 0.9901, "lr": 3.484595548869416e-05, "epoch": 1.2602661271727893, "percentage": 42.01, "elapsed_time": "1 day, 5:32:34", "remaining_time": "1 day, 16:46:57", "throughput": 26803.06, "total_tokens": 2850627648} +{"current_steps": 10600, "total_steps": 25209, "loss": 0.9771, "lr": 3.4837496295141335e-05, "epoch": 1.2614561871964418, "percentage": 42.05, "elapsed_time": "1 day, 5:34:17", "remaining_time": "1 day, 16:45:21", "throughput": 26802.11, "total_tokens": 2853295104} +{"current_steps": 10610, "total_steps": 25209, "loss": 0.979, "lr": 3.482904325925266e-05, "epoch": 1.262646247220094, "percentage": 42.09, "elapsed_time": "1 day, 5:35:55", "remaining_time": "1 day, 16:43:36", "throughput": 26802.82, "total_tokens": 2855985792} +{"current_steps": 10620, "total_steps": 25209, "loss": 0.9848, "lr": 3.482059637356124e-05, "epoch": 1.2638363072437466, "percentage": 42.13, "elapsed_time": "1 day, 5:37:37", "remaining_time": "1 day, 16:41:58", "throughput": 26802.57, "total_tokens": 2858704064} +{"current_steps": 10630, "total_steps": 25209, "loss": 0.9764, "lr": 3.481215563061281e-05, "epoch": 1.265026367267399, "percentage": 42.17, "elapsed_time": "1 day, 5:39:20", "remaining_time": "1 day, 16:40:22", "throughput": 26801.97, "total_tokens": 2861400960} +{"current_steps": 10640, "total_steps": 25209, "loss": 0.9682, "lr": 3.4803721022965785e-05, "epoch": 1.2662164272910514, "percentage": 42.21, "elapsed_time": "1 day, 5:40:58", "remaining_time": "1 day, 16:38:38", "throughput": 26802.13, "total_tokens": 2864047616} +{"current_steps": 10650, "total_steps": 25209, "loss": 0.9887, "lr": 3.479529254319117e-05, "epoch": 1.267406487314704, "percentage": 42.25, "elapsed_time": "1 day, 5:42:41", "remaining_time": "1 day, 16:37:00", "throughput": 26801.92, "total_tokens": 2866772160} +{"current_steps": 10660, "total_steps": 25209, "loss": 0.9645, "lr": 3.478687018387257e-05, "epoch": 1.2685965473383565, "percentage": 42.29, "elapsed_time": "1 day, 5:44:21", "remaining_time": "1 day, 16:35:19", "throughput": 26802.25, "total_tokens": 2869484480} +{"current_steps": 10670, "total_steps": 25209, "loss": 0.9705, "lr": 3.477845393760616e-05, "epoch": 1.2697866073620088, "percentage": 42.33, "elapsed_time": "1 day, 5:46:00", "remaining_time": "1 day, 16:33:37", "throughput": 26802.73, "total_tokens": 2872197504} +{"current_steps": 10680, "total_steps": 25209, "loss": 0.978, "lr": 3.4770043797000614e-05, "epoch": 1.2709766673856613, "percentage": 42.37, "elapsed_time": "1 day, 5:47:37", "remaining_time": "1 day, 16:31:52", "throughput": 26803.32, "total_tokens": 2874859520} +{"current_steps": 10690, "total_steps": 25209, "loss": 0.9711, "lr": 3.4761639754677146e-05, "epoch": 1.2721667274093136, "percentage": 42.41, "elapsed_time": "1 day, 5:49:15", "remaining_time": "1 day, 16:30:09", "throughput": 26803.49, "total_tokens": 2877513024} +{"current_steps": 10700, "total_steps": 25209, "loss": 0.9828, "lr": 3.4753241803269435e-05, "epoch": 1.273356787432966, "percentage": 42.45, "elapsed_time": "1 day, 5:50:50", "remaining_time": "1 day, 16:28:20", "throughput": 26804.46, "total_tokens": 2880143232} +{"current_steps": 10710, "total_steps": 25209, "loss": 0.9808, "lr": 3.474484993542361e-05, "epoch": 1.2745468474566186, "percentage": 42.48, "elapsed_time": "1 day, 5:52:31", "remaining_time": "1 day, 16:26:40", "throughput": 26804.36, "total_tokens": 2882838272} +{"current_steps": 10720, "total_steps": 25209, "loss": 0.9574, "lr": 3.473646414379822e-05, "epoch": 1.2757369074802711, "percentage": 42.52, "elapsed_time": "1 day, 5:54:09", "remaining_time": "1 day, 16:24:57", "throughput": 26804.8, "total_tokens": 2885525120} +{"current_steps": 10730, "total_steps": 25209, "loss": 0.9863, "lr": 3.472808442106422e-05, "epoch": 1.2769269675039234, "percentage": 42.56, "elapsed_time": "1 day, 5:55:47", "remaining_time": "1 day, 16:23:14", "throughput": 26805.02, "total_tokens": 2888182784} +{"current_steps": 10740, "total_steps": 25209, "loss": 0.9809, "lr": 3.4719710759904936e-05, "epoch": 1.278117027527576, "percentage": 42.6, "elapsed_time": "1 day, 5:57:30", "remaining_time": "1 day, 16:21:36", "throughput": 26804.71, "total_tokens": 2890890176} +{"current_steps": 10750, "total_steps": 25209, "loss": 0.9671, "lr": 3.471134315301603e-05, "epoch": 1.2793070875512282, "percentage": 42.64, "elapsed_time": "1 day, 5:59:04", "remaining_time": "1 day, 16:19:48", "throughput": 26805.76, "total_tokens": 2893544896} +{"current_steps": 10760, "total_steps": 25209, "loss": 0.9843, "lr": 3.470298159310549e-05, "epoch": 1.2804971475748808, "percentage": 42.68, "elapsed_time": "1 day, 6:00:48", "remaining_time": "1 day, 16:18:12", "throughput": 26805.53, "total_tokens": 2896299072} +{"current_steps": 10770, "total_steps": 25209, "loss": 0.9866, "lr": 3.4694626072893585e-05, "epoch": 1.2816872075985333, "percentage": 42.72, "elapsed_time": "1 day, 6:02:30", "remaining_time": "1 day, 16:16:33", "throughput": 26805.65, "total_tokens": 2899034624} +{"current_steps": 10780, "total_steps": 25209, "loss": 0.982, "lr": 3.468627658511285e-05, "epoch": 1.2828772676221858, "percentage": 42.76, "elapsed_time": "1 day, 6:04:10", "remaining_time": "1 day, 16:14:53", "throughput": 26805.81, "total_tokens": 2901751680} +{"current_steps": 10790, "total_steps": 25209, "loss": 0.9698, "lr": 3.467793312250806e-05, "epoch": 1.284067327645838, "percentage": 42.8, "elapsed_time": "1 day, 6:05:51", "remaining_time": "1 day, 16:13:13", "throughput": 26805.71, "total_tokens": 2904448768} +{"current_steps": 10800, "total_steps": 25209, "loss": 0.9677, "lr": 3.466959567783619e-05, "epoch": 1.2852573876694906, "percentage": 42.84, "elapsed_time": "1 day, 6:07:31", "remaining_time": "1 day, 16:11:31", "throughput": 26805.86, "total_tokens": 2907126016} +{"current_steps": 10810, "total_steps": 25209, "loss": 0.9711, "lr": 3.466126424386642e-05, "epoch": 1.286447447693143, "percentage": 42.88, "elapsed_time": "1 day, 6:09:11", "remaining_time": "1 day, 16:09:50", "throughput": 26806.07, "total_tokens": 2909827456} +{"current_steps": 10820, "total_steps": 25209, "loss": 0.9836, "lr": 3.4652938813380056e-05, "epoch": 1.2876375077167954, "percentage": 42.92, "elapsed_time": "1 day, 6:10:49", "remaining_time": "1 day, 16:08:08", "throughput": 26806.88, "total_tokens": 2912566528} +{"current_steps": 10830, "total_steps": 25209, "loss": 0.9789, "lr": 3.464461937917057e-05, "epoch": 1.288827567740448, "percentage": 42.96, "elapsed_time": "1 day, 6:12:33", "remaining_time": "1 day, 16:06:32", "throughput": 26806.47, "total_tokens": 2915296000} +{"current_steps": 10840, "total_steps": 25209, "loss": 0.9759, "lr": 3.4636305934043525e-05, "epoch": 1.2900176277641004, "percentage": 43.0, "elapsed_time": "1 day, 6:14:11", "remaining_time": "1 day, 16:04:48", "throughput": 26806.76, "total_tokens": 2917948480} +{"current_steps": 10850, "total_steps": 25209, "loss": 0.9674, "lr": 3.4627998470816544e-05, "epoch": 1.2912076877877527, "percentage": 43.04, "elapsed_time": "1 day, 6:15:53", "remaining_time": "1 day, 16:03:10", "throughput": 26806.25, "total_tokens": 2920644864} +{"current_steps": 10860, "total_steps": 25209, "loss": 0.9769, "lr": 3.4619696982319334e-05, "epoch": 1.2923977478114053, "percentage": 43.08, "elapsed_time": "1 day, 6:17:30", "remaining_time": "1 day, 16:01:25", "throughput": 26807.0, "total_tokens": 2923326336} +{"current_steps": 10870, "total_steps": 25209, "loss": 0.9885, "lr": 3.461140146139361e-05, "epoch": 1.2935878078350576, "percentage": 43.12, "elapsed_time": "1 day, 6:19:15", "remaining_time": "1 day, 15:59:51", "throughput": 26805.96, "total_tokens": 2926026560} +{"current_steps": 10880, "total_steps": 25209, "loss": 0.9752, "lr": 3.460311190089309e-05, "epoch": 1.29477786785871, "percentage": 43.16, "elapsed_time": "1 day, 6:20:53", "remaining_time": "1 day, 15:58:07", "throughput": 26806.32, "total_tokens": 2928692928} +{"current_steps": 10890, "total_steps": 25209, "loss": 0.9656, "lr": 3.459482829368348e-05, "epoch": 1.2959679278823626, "percentage": 43.2, "elapsed_time": "1 day, 6:22:34", "remaining_time": "1 day, 15:56:27", "throughput": 26806.29, "total_tokens": 2931379520} +{"current_steps": 10900, "total_steps": 25209, "loss": 0.9843, "lr": 3.4586550632642425e-05, "epoch": 1.297157987906015, "percentage": 43.24, "elapsed_time": "1 day, 6:24:15", "remaining_time": "1 day, 15:54:48", "throughput": 26806.02, "total_tokens": 2934078272} +{"current_steps": 10910, "total_steps": 25209, "loss": 0.9785, "lr": 3.457827891065949e-05, "epoch": 1.2983480479296674, "percentage": 43.28, "elapsed_time": "1 day, 6:25:53", "remaining_time": "1 day, 15:53:04", "throughput": 26806.11, "total_tokens": 2936715328} +{"current_steps": 10920, "total_steps": 25209, "loss": 0.9458, "lr": 3.457001312063614e-05, "epoch": 1.29953810795332, "percentage": 43.32, "elapsed_time": "1 day, 6:27:39", "remaining_time": "1 day, 15:51:30", "throughput": 26805.32, "total_tokens": 2939446272} +{"current_steps": 10930, "total_steps": 25209, "loss": 0.9795, "lr": 3.45617532554857e-05, "epoch": 1.3007281679769722, "percentage": 43.36, "elapsed_time": "1 day, 6:29:14", "remaining_time": "1 day, 15:49:44", "throughput": 26806.37, "total_tokens": 2942129536} +{"current_steps": 10940, "total_steps": 25209, "loss": 0.9782, "lr": 3.455349930813339e-05, "epoch": 1.3019182280006247, "percentage": 43.4, "elapsed_time": "1 day, 6:30:55", "remaining_time": "1 day, 15:48:03", "throughput": 26806.49, "total_tokens": 2944835968} +{"current_steps": 10950, "total_steps": 25209, "loss": 0.9696, "lr": 3.45452512715162e-05, "epoch": 1.3031082880242773, "percentage": 43.44, "elapsed_time": "1 day, 6:32:34", "remaining_time": "1 day, 15:46:21", "throughput": 26806.69, "total_tokens": 2947513792} +{"current_steps": 10960, "total_steps": 25209, "loss": 0.965, "lr": 3.4537009138582935e-05, "epoch": 1.3042983480479298, "percentage": 43.48, "elapsed_time": "1 day, 6:34:16", "remaining_time": "1 day, 15:44:43", "throughput": 26806.68, "total_tokens": 2950243648} +{"current_steps": 10970, "total_steps": 25209, "loss": 0.9786, "lr": 3.4528772902294174e-05, "epoch": 1.305488408071582, "percentage": 43.52, "elapsed_time": "1 day, 6:35:55", "remaining_time": "1 day, 15:43:01", "throughput": 26806.88, "total_tokens": 2952924160} +{"current_steps": 10980, "total_steps": 25209, "loss": 0.9779, "lr": 3.452054255562222e-05, "epoch": 1.3066784680952346, "percentage": 43.56, "elapsed_time": "1 day, 6:37:37", "remaining_time": "1 day, 15:41:23", "throughput": 26806.69, "total_tokens": 2955644544} +{"current_steps": 10990, "total_steps": 25209, "loss": 0.9708, "lr": 3.451231809155115e-05, "epoch": 1.3078685281188869, "percentage": 43.6, "elapsed_time": "1 day, 6:39:16", "remaining_time": "1 day, 15:39:40", "throughput": 26807.0, "total_tokens": 2958320448} +{"current_steps": 11000, "total_steps": 25209, "loss": 0.9754, "lr": 3.450409950307666e-05, "epoch": 1.3090585881425394, "percentage": 43.64, "elapsed_time": "1 day, 6:41:02", "remaining_time": "1 day, 15:38:06", "throughput": 26806.46, "total_tokens": 2961096320} +{"current_steps": 11010, "total_steps": 25209, "loss": 0.962, "lr": 3.449588678320619e-05, "epoch": 1.310248648166192, "percentage": 43.67, "elapsed_time": "1 day, 6:42:40", "remaining_time": "1 day, 15:36:23", "throughput": 26806.9, "total_tokens": 2963782720} +{"current_steps": 11020, "total_steps": 25209, "loss": 0.9672, "lr": 3.4487679924958767e-05, "epoch": 1.3114387081898444, "percentage": 43.71, "elapsed_time": "1 day, 6:44:20", "remaining_time": "1 day, 15:34:43", "throughput": 26806.94, "total_tokens": 2966482112} +{"current_steps": 11030, "total_steps": 25209, "loss": 0.982, "lr": 3.4479478921365076e-05, "epoch": 1.3126287682134967, "percentage": 43.75, "elapsed_time": "1 day, 6:46:03", "remaining_time": "1 day, 15:33:05", "throughput": 26807.08, "total_tokens": 2969245376} +{"current_steps": 11040, "total_steps": 25209, "loss": 0.9751, "lr": 3.447128376546738e-05, "epoch": 1.3138188282371492, "percentage": 43.79, "elapsed_time": "1 day, 6:47:42", "remaining_time": "1 day, 15:31:23", "throughput": 26807.45, "total_tokens": 2971942400} +{"current_steps": 11050, "total_steps": 25209, "loss": 0.976, "lr": 3.4463094450319505e-05, "epoch": 1.3150088882608015, "percentage": 43.83, "elapsed_time": "1 day, 6:49:25", "remaining_time": "1 day, 15:29:47", "throughput": 26806.98, "total_tokens": 2974661824} +{"current_steps": 11060, "total_steps": 25209, "loss": 0.96, "lr": 3.4454910968986855e-05, "epoch": 1.316198948284454, "percentage": 43.87, "elapsed_time": "1 day, 6:51:02", "remaining_time": "1 day, 15:28:02", "throughput": 26807.45, "total_tokens": 2977314432} +{"current_steps": 11070, "total_steps": 25209, "loss": 0.9772, "lr": 3.4446733314546336e-05, "epoch": 1.3173890083081066, "percentage": 43.91, "elapsed_time": "1 day, 6:52:40", "remaining_time": "1 day, 15:26:18", "throughput": 26807.83, "total_tokens": 2979970048} +{"current_steps": 11080, "total_steps": 25209, "loss": 0.9724, "lr": 3.443856148008633e-05, "epoch": 1.318579068331759, "percentage": 43.95, "elapsed_time": "1 day, 6:54:25", "remaining_time": "1 day, 15:24:44", "throughput": 26806.53, "total_tokens": 2982654400} +{"current_steps": 11090, "total_steps": 25209, "loss": 0.9692, "lr": 3.443039545870672e-05, "epoch": 1.3197691283554114, "percentage": 43.99, "elapsed_time": "1 day, 6:56:06", "remaining_time": "1 day, 15:23:04", "throughput": 26806.77, "total_tokens": 2985379200} +{"current_steps": 11100, "total_steps": 25209, "loss": 0.977, "lr": 3.442223524351883e-05, "epoch": 1.320959188379064, "percentage": 44.03, "elapsed_time": "1 day, 6:57:44", "remaining_time": "1 day, 15:21:20", "throughput": 26807.42, "total_tokens": 2988075328} +{"current_steps": 11110, "total_steps": 25209, "loss": 0.9631, "lr": 3.44140808276454e-05, "epoch": 1.3221492484027162, "percentage": 44.07, "elapsed_time": "1 day, 6:59:28", "remaining_time": "1 day, 15:19:44", "throughput": 26806.96, "total_tokens": 2990809280} +{"current_steps": 11120, "total_steps": 25209, "loss": 0.979, "lr": 3.4405932204220575e-05, "epoch": 1.3233393084263687, "percentage": 44.11, "elapsed_time": "1 day, 7:01:07", "remaining_time": "1 day, 15:18:02", "throughput": 26807.05, "total_tokens": 2993474944} +{"current_steps": 11130, "total_steps": 25209, "loss": 0.9666, "lr": 3.4397789366389876e-05, "epoch": 1.3245293684500212, "percentage": 44.15, "elapsed_time": "1 day, 7:02:46", "remaining_time": "1 day, 15:16:20", "throughput": 26807.62, "total_tokens": 2996195136} +{"current_steps": 11140, "total_steps": 25209, "loss": 0.976, "lr": 3.438965230731016e-05, "epoch": 1.3257194284736737, "percentage": 44.19, "elapsed_time": "1 day, 7:04:25", "remaining_time": "1 day, 15:14:37", "throughput": 26808.23, "total_tokens": 2998912256} +{"current_steps": 11150, "total_steps": 25209, "loss": 0.9863, "lr": 3.438152102014964e-05, "epoch": 1.326909488497326, "percentage": 44.23, "elapsed_time": "1 day, 7:06:02", "remaining_time": "1 day, 15:12:53", "throughput": 26808.75, "total_tokens": 3001583168} +{"current_steps": 11160, "total_steps": 25209, "loss": 0.9651, "lr": 3.437339549808778e-05, "epoch": 1.3280995485209786, "percentage": 44.27, "elapsed_time": "1 day, 7:07:46", "remaining_time": "1 day, 15:11:17", "throughput": 26808.17, "total_tokens": 3004293376} +{"current_steps": 11170, "total_steps": 25209, "loss": 0.9745, "lr": 3.43652757343154e-05, "epoch": 1.3292896085446309, "percentage": 44.31, "elapsed_time": "1 day, 7:09:25", "remaining_time": "1 day, 15:09:34", "throughput": 26808.36, "total_tokens": 3006966848} +{"current_steps": 11180, "total_steps": 25209, "loss": 0.9556, "lr": 3.435716172203449e-05, "epoch": 1.3304796685682834, "percentage": 44.35, "elapsed_time": "1 day, 7:11:07", "remaining_time": "1 day, 15:07:57", "throughput": 26807.7, "total_tokens": 3009643072} +{"current_steps": 11190, "total_steps": 25209, "loss": 0.9859, "lr": 3.434905345445833e-05, "epoch": 1.3316697285919359, "percentage": 44.39, "elapsed_time": "1 day, 7:12:44", "remaining_time": "1 day, 15:06:11", "throughput": 26808.35, "total_tokens": 3012298176} +{"current_steps": 11200, "total_steps": 25209, "loss": 0.9642, "lr": 3.4340950924811374e-05, "epoch": 1.3328597886155884, "percentage": 44.43, "elapsed_time": "1 day, 7:14:22", "remaining_time": "1 day, 15:04:28", "throughput": 26808.83, "total_tokens": 3014987264} +{"current_steps": 11210, "total_steps": 25209, "loss": 0.9534, "lr": 3.433285412632927e-05, "epoch": 1.3340498486392407, "percentage": 44.47, "elapsed_time": "1 day, 7:15:58", "remaining_time": "1 day, 15:02:42", "throughput": 26809.94, "total_tokens": 3017687744} +{"current_steps": 11220, "total_steps": 25209, "loss": 0.9665, "lr": 3.4324763052258835e-05, "epoch": 1.3352399086628932, "percentage": 44.51, "elapsed_time": "1 day, 7:17:39", "remaining_time": "1 day, 15:01:03", "throughput": 26809.5, "total_tokens": 3020352320} +{"current_steps": 11230, "total_steps": 25209, "loss": 0.9674, "lr": 3.4316677695858003e-05, "epoch": 1.3364299686865455, "percentage": 44.55, "elapsed_time": "1 day, 7:19:15", "remaining_time": "1 day, 14:59:16", "throughput": 26810.49, "total_tokens": 3023028224} +{"current_steps": 11240, "total_steps": 25209, "loss": 0.9908, "lr": 3.430859805039583e-05, "epoch": 1.337620028710198, "percentage": 44.59, "elapsed_time": "1 day, 7:20:55", "remaining_time": "1 day, 14:57:35", "throughput": 26810.72, "total_tokens": 3025724224} +{"current_steps": 11250, "total_steps": 25209, "loss": 0.9767, "lr": 3.430052410915246e-05, "epoch": 1.3388100887338505, "percentage": 44.63, "elapsed_time": "1 day, 7:22:31", "remaining_time": "1 day, 14:55:49", "throughput": 26811.4, "total_tokens": 3028378496} +{"current_steps": 11260, "total_steps": 25209, "loss": 0.9734, "lr": 3.4292455865419086e-05, "epoch": 1.340000148757503, "percentage": 44.67, "elapsed_time": "1 day, 7:24:07", "remaining_time": "1 day, 14:54:03", "throughput": 26812.34, "total_tokens": 3031059776} +{"current_steps": 11270, "total_steps": 25209, "loss": 0.9865, "lr": 3.4284393312497973e-05, "epoch": 1.3411902087811554, "percentage": 44.71, "elapsed_time": "1 day, 7:25:49", "remaining_time": "1 day, 14:52:25", "throughput": 26812.13, "total_tokens": 3033772160} +{"current_steps": 11280, "total_steps": 25209, "loss": 0.9771, "lr": 3.427633644370238e-05, "epoch": 1.3423802688048079, "percentage": 44.75, "elapsed_time": "1 day, 7:27:30", "remaining_time": "1 day, 14:50:46", "throughput": 26812.08, "total_tokens": 3036478272} +{"current_steps": 11290, "total_steps": 25209, "loss": 0.9645, "lr": 3.4268285252356564e-05, "epoch": 1.3435703288284602, "percentage": 44.79, "elapsed_time": "1 day, 7:29:08", "remaining_time": "1 day, 14:49:02", "throughput": 26813.1, "total_tokens": 3039213952} +{"current_steps": 11300, "total_steps": 25209, "loss": 0.97, "lr": 3.426023973179575e-05, "epoch": 1.3447603888521127, "percentage": 44.83, "elapsed_time": "1 day, 7:30:48", "remaining_time": "1 day, 14:47:21", "throughput": 26813.13, "total_tokens": 3041904896} +{"current_steps": 11310, "total_steps": 25209, "loss": 0.9682, "lr": 3.425219987536614e-05, "epoch": 1.3459504488757652, "percentage": 44.86, "elapsed_time": "1 day, 7:32:24", "remaining_time": "1 day, 14:45:36", "throughput": 26813.97, "total_tokens": 3044586240} +{"current_steps": 11320, "total_steps": 25209, "loss": 0.9568, "lr": 3.4244165676424815e-05, "epoch": 1.3471405088994177, "percentage": 44.9, "elapsed_time": "1 day, 7:33:59", "remaining_time": "1 day, 14:43:49", "throughput": 26814.49, "total_tokens": 3047188416} +{"current_steps": 11330, "total_steps": 25209, "loss": 0.9756, "lr": 3.423613712833979e-05, "epoch": 1.34833056892307, "percentage": 44.94, "elapsed_time": "1 day, 7:35:39", "remaining_time": "1 day, 14:42:08", "throughput": 26814.73, "total_tokens": 3049888384} +{"current_steps": 11340, "total_steps": 25209, "loss": 0.9781, "lr": 3.422811422448995e-05, "epoch": 1.3495206289467225, "percentage": 44.98, "elapsed_time": "1 day, 7:37:13", "remaining_time": "1 day, 14:40:19", "throughput": 26815.59, "total_tokens": 3052504832} +{"current_steps": 11350, "total_steps": 25209, "loss": 0.9898, "lr": 3.422009695826503e-05, "epoch": 1.3507106889703748, "percentage": 45.02, "elapsed_time": "1 day, 7:38:51", "remaining_time": "1 day, 14:38:36", "throughput": 26816.06, "total_tokens": 3055186944} +{"current_steps": 11360, "total_steps": 25209, "loss": 0.9694, "lr": 3.4212085323065626e-05, "epoch": 1.3519007489940273, "percentage": 45.06, "elapsed_time": "1 day, 7:40:30", "remaining_time": "1 day, 14:36:54", "throughput": 26816.33, "total_tokens": 3057875712} +{"current_steps": 11370, "total_steps": 25209, "loss": 0.9773, "lr": 3.4204079312303103e-05, "epoch": 1.3530908090176799, "percentage": 45.1, "elapsed_time": "1 day, 7:42:15", "remaining_time": "1 day, 14:35:19", "throughput": 26815.73, "total_tokens": 3060621056} +{"current_steps": 11380, "total_steps": 25209, "loss": 0.9738, "lr": 3.419607891939964e-05, "epoch": 1.3542808690413324, "percentage": 45.14, "elapsed_time": "1 day, 7:43:58", "remaining_time": "1 day, 14:33:43", "throughput": 26815.55, "total_tokens": 3063372544} +{"current_steps": 11390, "total_steps": 25209, "loss": 0.9623, "lr": 3.4188084137788166e-05, "epoch": 1.3554709290649847, "percentage": 45.18, "elapsed_time": "1 day, 7:45:42", "remaining_time": "1 day, 14:32:07", "throughput": 26815.12, "total_tokens": 3066119232} +{"current_steps": 11400, "total_steps": 25209, "loss": 0.9644, "lr": 3.418009496091238e-05, "epoch": 1.3566609890886372, "percentage": 45.22, "elapsed_time": "1 day, 7:47:21", "remaining_time": "1 day, 14:30:24", "throughput": 26815.43, "total_tokens": 3068793984} +{"current_steps": 11410, "total_steps": 25209, "loss": 0.9761, "lr": 3.417211138222666e-05, "epoch": 1.3578510491122895, "percentage": 45.26, "elapsed_time": "1 day, 7:48:52", "remaining_time": "1 day, 14:28:32", "throughput": 26816.85, "total_tokens": 3071392576} +{"current_steps": 11420, "total_steps": 25209, "loss": 0.9791, "lr": 3.416413339519612e-05, "epoch": 1.359041109135942, "percentage": 45.3, "elapsed_time": "1 day, 7:50:35", "remaining_time": "1 day, 14:26:56", "throughput": 26816.5, "total_tokens": 3074128576} +{"current_steps": 11430, "total_steps": 25209, "loss": 0.9622, "lr": 3.4156160993296524e-05, "epoch": 1.3602311691595945, "percentage": 45.34, "elapsed_time": "1 day, 7:52:10", "remaining_time": "1 day, 14:25:08", "throughput": 26817.41, "total_tokens": 3076767232} +{"current_steps": 11440, "total_steps": 25209, "loss": 0.9728, "lr": 3.4148194170014295e-05, "epoch": 1.361421229183247, "percentage": 45.38, "elapsed_time": "1 day, 7:53:51", "remaining_time": "1 day, 14:23:29", "throughput": 26817.45, "total_tokens": 3079498048} +{"current_steps": 11450, "total_steps": 25209, "loss": 0.9698, "lr": 3.4140232918846484e-05, "epoch": 1.3626112892068993, "percentage": 45.42, "elapsed_time": "1 day, 7:55:27", "remaining_time": "1 day, 14:21:43", "throughput": 26818.23, "total_tokens": 3082157312} +{"current_steps": 11460, "total_steps": 25209, "loss": 0.9632, "lr": 3.4132277233300753e-05, "epoch": 1.3638013492305519, "percentage": 45.46, "elapsed_time": "1 day, 7:57:08", "remaining_time": "1 day, 14:20:03", "throughput": 26818.2, "total_tokens": 3084845952} +{"current_steps": 11470, "total_steps": 25209, "loss": 0.9806, "lr": 3.4124327106895356e-05, "epoch": 1.3649914092542041, "percentage": 45.5, "elapsed_time": "1 day, 7:58:42", "remaining_time": "1 day, 14:18:16", "throughput": 26819.17, "total_tokens": 3087499392} +{"current_steps": 11480, "total_steps": 25209, "loss": 0.9688, "lr": 3.4116382533159097e-05, "epoch": 1.3661814692778567, "percentage": 45.54, "elapsed_time": "1 day, 8:00:23", "remaining_time": "1 day, 14:16:36", "throughput": 26819.08, "total_tokens": 3090188160} +{"current_steps": 11490, "total_steps": 25209, "loss": 0.9742, "lr": 3.4108443505631335e-05, "epoch": 1.3673715293015092, "percentage": 45.58, "elapsed_time": "1 day, 8:02:05", "remaining_time": "1 day, 14:14:57", "throughput": 26818.64, "total_tokens": 3092869888} +{"current_steps": 11500, "total_steps": 25209, "loss": 0.9732, "lr": 3.410051001786192e-05, "epoch": 1.3685615893251617, "percentage": 45.62, "elapsed_time": "1 day, 8:03:44", "remaining_time": "1 day, 14:13:15", "throughput": 26819.15, "total_tokens": 3095580288} +{"current_steps": 11510, "total_steps": 25209, "loss": 0.9643, "lr": 3.409258206341124e-05, "epoch": 1.369751649348814, "percentage": 45.66, "elapsed_time": "1 day, 8:05:26", "remaining_time": "1 day, 14:11:37", "throughput": 26818.87, "total_tokens": 3098297344} +{"current_steps": 11520, "total_steps": 25209, "loss": 0.9759, "lr": 3.4084659635850134e-05, "epoch": 1.3709417093724665, "percentage": 45.7, "elapsed_time": "1 day, 8:07:01", "remaining_time": "1 day, 14:09:50", "throughput": 26819.96, "total_tokens": 3100952384} +{"current_steps": 11530, "total_steps": 25209, "loss": 0.9805, "lr": 3.40767427287599e-05, "epoch": 1.3721317693961188, "percentage": 45.74, "elapsed_time": "1 day, 8:08:38", "remaining_time": "1 day, 14:08:06", "throughput": 26820.45, "total_tokens": 3103631488} +{"current_steps": 11540, "total_steps": 25209, "loss": 0.9673, "lr": 3.406883133573224e-05, "epoch": 1.3733218294197713, "percentage": 45.78, "elapsed_time": "1 day, 8:10:18", "remaining_time": "1 day, 14:06:25", "throughput": 26820.78, "total_tokens": 3106329792} +{"current_steps": 11550, "total_steps": 25209, "loss": 0.9848, "lr": 3.406092545036932e-05, "epoch": 1.3745118894434238, "percentage": 45.82, "elapsed_time": "1 day, 8:11:53", "remaining_time": "1 day, 14:04:38", "throughput": 26821.54, "total_tokens": 3108974272} +{"current_steps": 11560, "total_steps": 25209, "loss": 0.9723, "lr": 3.405302506628365e-05, "epoch": 1.3757019494670764, "percentage": 45.86, "elapsed_time": "1 day, 8:13:33", "remaining_time": "1 day, 14:02:58", "throughput": 26821.59, "total_tokens": 3111670080} +{"current_steps": 11570, "total_steps": 25209, "loss": 0.9715, "lr": 3.404513017709813e-05, "epoch": 1.3768920094907287, "percentage": 45.9, "elapsed_time": "1 day, 8:15:09", "remaining_time": "1 day, 14:01:13", "throughput": 26822.34, "total_tokens": 3114339456} +{"current_steps": 11580, "total_steps": 25209, "loss": 0.9613, "lr": 3.403724077644598e-05, "epoch": 1.3780820695143812, "percentage": 45.94, "elapsed_time": "1 day, 8:16:49", "remaining_time": "1 day, 13:59:32", "throughput": 26822.62, "total_tokens": 3117045632} +{"current_steps": 11590, "total_steps": 25209, "loss": 0.9634, "lr": 3.402935685797077e-05, "epoch": 1.3792721295380335, "percentage": 45.98, "elapsed_time": "1 day, 8:18:27", "remaining_time": "1 day, 13:57:49", "throughput": 26823.33, "total_tokens": 3119758272} +{"current_steps": 11600, "total_steps": 25209, "loss": 0.9655, "lr": 3.4021478415326355e-05, "epoch": 1.380462189561686, "percentage": 46.02, "elapsed_time": "1 day, 8:20:08", "remaining_time": "1 day, 13:56:09", "throughput": 26822.94, "total_tokens": 3122414912} +{"current_steps": 11610, "total_steps": 25209, "loss": 0.9774, "lr": 3.401360544217687e-05, "epoch": 1.3816522495853385, "percentage": 46.05, "elapsed_time": "1 day, 8:21:49", "remaining_time": "1 day, 13:54:30", "throughput": 26822.95, "total_tokens": 3125138048} +{"current_steps": 11620, "total_steps": 25209, "loss": 0.9688, "lr": 3.400573793219672e-05, "epoch": 1.382842309608991, "percentage": 46.09, "elapsed_time": "1 day, 8:23:32", "remaining_time": "1 day, 13:52:52", "throughput": 26822.97, "total_tokens": 3127895808} +{"current_steps": 11630, "total_steps": 25209, "loss": 0.9654, "lr": 3.3997875879070546e-05, "epoch": 1.3840323696326433, "percentage": 46.13, "elapsed_time": "1 day, 8:25:08", "remaining_time": "1 day, 13:51:07", "throughput": 26823.59, "total_tokens": 3130553600} +{"current_steps": 11640, "total_steps": 25209, "loss": 0.9693, "lr": 3.399001927649318e-05, "epoch": 1.3852224296562958, "percentage": 46.17, "elapsed_time": "1 day, 8:26:48", "remaining_time": "1 day, 13:49:26", "throughput": 26824.07, "total_tokens": 3133289408} +{"current_steps": 11650, "total_steps": 25209, "loss": 0.9668, "lr": 3.398216811816968e-05, "epoch": 1.3864124896799481, "percentage": 46.21, "elapsed_time": "1 day, 8:28:26", "remaining_time": "1 day, 13:47:43", "throughput": 26824.71, "total_tokens": 3135990784} +{"current_steps": 11660, "total_steps": 25209, "loss": 0.9738, "lr": 3.397432239781527e-05, "epoch": 1.3876025497036006, "percentage": 46.25, "elapsed_time": "1 day, 8:30:00", "remaining_time": "1 day, 13:45:54", "throughput": 26825.46, "total_tokens": 3138582208} +{"current_steps": 11670, "total_steps": 25209, "loss": 0.966, "lr": 3.396648210915531e-05, "epoch": 1.3887926097272532, "percentage": 46.29, "elapsed_time": "1 day, 8:31:38", "remaining_time": "1 day, 13:44:11", "throughput": 26825.86, "total_tokens": 3141254144} +{"current_steps": 11680, "total_steps": 25209, "loss": 0.9728, "lr": 3.3958647245925315e-05, "epoch": 1.3899826697509057, "percentage": 46.33, "elapsed_time": "1 day, 8:33:24", "remaining_time": "1 day, 13:42:38", "throughput": 26825.17, "total_tokens": 3144021568} +{"current_steps": 11690, "total_steps": 25209, "loss": 0.9864, "lr": 3.3950817801870885e-05, "epoch": 1.391172729774558, "percentage": 46.37, "elapsed_time": "1 day, 8:35:04", "remaining_time": "1 day, 13:40:58", "throughput": 26825.45, "total_tokens": 3146754752} +{"current_steps": 11700, "total_steps": 25209, "loss": 0.9737, "lr": 3.3942993770747735e-05, "epoch": 1.3923627897982105, "percentage": 46.41, "elapsed_time": "1 day, 8:36:45", "remaining_time": "1 day, 13:39:17", "throughput": 26825.47, "total_tokens": 3149447680} +{"current_steps": 11710, "total_steps": 25209, "loss": 0.9654, "lr": 3.3935175146321626e-05, "epoch": 1.3935528498218628, "percentage": 46.45, "elapsed_time": "1 day, 8:38:28", "remaining_time": "1 day, 13:37:41", "throughput": 26825.33, "total_tokens": 3152209472} +{"current_steps": 11720, "total_steps": 25209, "loss": 0.9768, "lr": 3.392736192236839e-05, "epoch": 1.3947429098455153, "percentage": 46.49, "elapsed_time": "1 day, 8:40:10", "remaining_time": "1 day, 13:36:03", "throughput": 26825.36, "total_tokens": 3154957184} +{"current_steps": 11730, "total_steps": 25209, "loss": 0.9598, "lr": 3.391955409267387e-05, "epoch": 1.3959329698691678, "percentage": 46.53, "elapsed_time": "1 day, 8:41:53", "remaining_time": "1 day, 13:34:25", "throughput": 26825.05, "total_tokens": 3157672832} +{"current_steps": 11740, "total_steps": 25209, "loss": 0.9869, "lr": 3.3911751651033896e-05, "epoch": 1.3971230298928203, "percentage": 46.57, "elapsed_time": "1 day, 8:43:33", "remaining_time": "1 day, 13:32:44", "throughput": 26825.39, "total_tokens": 3160389824} +{"current_steps": 11750, "total_steps": 25209, "loss": 0.9698, "lr": 3.3903954591254334e-05, "epoch": 1.3983130899164726, "percentage": 46.61, "elapsed_time": "1 day, 8:45:10", "remaining_time": "1 day, 13:31:00", "throughput": 26825.8, "total_tokens": 3163049408} +{"current_steps": 11760, "total_steps": 25209, "loss": 0.9631, "lr": 3.389616290715097e-05, "epoch": 1.3995031499401251, "percentage": 46.65, "elapsed_time": "1 day, 8:46:49", "remaining_time": "1 day, 13:29:18", "throughput": 26825.82, "total_tokens": 3165703552} +{"current_steps": 11770, "total_steps": 25209, "loss": 0.9674, "lr": 3.388837659254955e-05, "epoch": 1.4006932099637774, "percentage": 46.69, "elapsed_time": "1 day, 8:48:27", "remaining_time": "1 day, 13:27:35", "throughput": 26825.99, "total_tokens": 3168349760} +{"current_steps": 11780, "total_steps": 25209, "loss": 0.986, "lr": 3.3880595641285746e-05, "epoch": 1.40188326998743, "percentage": 46.73, "elapsed_time": "1 day, 8:50:08", "remaining_time": "1 day, 13:25:55", "throughput": 26826.41, "total_tokens": 3171104128} +{"current_steps": 11790, "total_steps": 25209, "loss": 0.9835, "lr": 3.387282004720513e-05, "epoch": 1.4030733300110825, "percentage": 46.77, "elapsed_time": "1 day, 8:51:42", "remaining_time": "1 day, 13:24:08", "throughput": 26827.66, "total_tokens": 3173781248} +{"current_steps": 11800, "total_steps": 25209, "loss": 0.9534, "lr": 3.386504980416316e-05, "epoch": 1.404263390034735, "percentage": 46.81, "elapsed_time": "1 day, 8:53:22", "remaining_time": "1 day, 13:22:27", "throughput": 26827.99, "total_tokens": 3176494272} +{"current_steps": 11810, "total_steps": 25209, "loss": 0.9719, "lr": 3.385728490602515e-05, "epoch": 1.4054534500583873, "percentage": 46.85, "elapsed_time": "1 day, 8:54:59", "remaining_time": "1 day, 13:20:43", "throughput": 26828.67, "total_tokens": 3179194368} +{"current_steps": 11820, "total_steps": 25209, "loss": 0.996, "lr": 3.384952534666625e-05, "epoch": 1.4066435100820398, "percentage": 46.89, "elapsed_time": "1 day, 8:56:39", "remaining_time": "1 day, 13:19:02", "throughput": 26828.89, "total_tokens": 3181902272} +{"current_steps": 11830, "total_steps": 25209, "loss": 0.9864, "lr": 3.3841771119971455e-05, "epoch": 1.407833570105692, "percentage": 46.93, "elapsed_time": "1 day, 8:58:18", "remaining_time": "1 day, 13:17:20", "throughput": 26829.27, "total_tokens": 3184594688} +{"current_steps": 11840, "total_steps": 25209, "loss": 0.9631, "lr": 3.383402221983554e-05, "epoch": 1.4090236301293446, "percentage": 46.97, "elapsed_time": "1 day, 8:59:55", "remaining_time": "1 day, 13:15:36", "throughput": 26829.9, "total_tokens": 3187258240} +{"current_steps": 11850, "total_steps": 25209, "loss": 0.975, "lr": 3.3826278640163064e-05, "epoch": 1.4102136901529971, "percentage": 47.01, "elapsed_time": "1 day, 9:01:34", "remaining_time": "1 day, 13:13:54", "throughput": 26830.39, "total_tokens": 3189984448} +{"current_steps": 11860, "total_steps": 25209, "loss": 0.9736, "lr": 3.3818540374868354e-05, "epoch": 1.4114037501766497, "percentage": 47.05, "elapsed_time": "1 day, 9:03:11", "remaining_time": "1 day, 13:12:10", "throughput": 26831.0, "total_tokens": 3192657920} +{"current_steps": 11870, "total_steps": 25209, "loss": 0.9859, "lr": 3.381080741787547e-05, "epoch": 1.412593810200302, "percentage": 47.09, "elapsed_time": "1 day, 9:04:50", "remaining_time": "1 day, 13:10:28", "throughput": 26831.61, "total_tokens": 3195392064} +{"current_steps": 11880, "total_steps": 25209, "loss": 0.9873, "lr": 3.38030797631182e-05, "epoch": 1.4137838702239545, "percentage": 47.13, "elapsed_time": "1 day, 9:06:27", "remaining_time": "1 day, 13:08:44", "throughput": 26832.53, "total_tokens": 3198103168} +{"current_steps": 11890, "total_steps": 25209, "loss": 0.9795, "lr": 3.379535740454003e-05, "epoch": 1.4149739302476068, "percentage": 47.17, "elapsed_time": "1 day, 9:08:05", "remaining_time": "1 day, 13:07:01", "throughput": 26833.05, "total_tokens": 3200782976} +{"current_steps": 11900, "total_steps": 25209, "loss": 0.9717, "lr": 3.3787640336094126e-05, "epoch": 1.4161639902712593, "percentage": 47.21, "elapsed_time": "1 day, 9:09:42", "remaining_time": "1 day, 13:05:17", "throughput": 26833.68, "total_tokens": 3203470400} +{"current_steps": 11910, "total_steps": 25209, "loss": 0.9701, "lr": 3.3779928551743325e-05, "epoch": 1.4173540502949118, "percentage": 47.25, "elapsed_time": "1 day, 9:11:19", "remaining_time": "1 day, 13:03:34", "throughput": 26834.66, "total_tokens": 3206203392} +{"current_steps": 11920, "total_steps": 25209, "loss": 0.948, "lr": 3.3772222045460084e-05, "epoch": 1.4185441103185643, "percentage": 47.28, "elapsed_time": "1 day, 9:12:58", "remaining_time": "1 day, 13:01:52", "throughput": 26835.0, "total_tokens": 3208893632} +{"current_steps": 11930, "total_steps": 25209, "loss": 0.9734, "lr": 3.37645208112265e-05, "epoch": 1.4197341703422166, "percentage": 47.32, "elapsed_time": "1 day, 9:14:34", "remaining_time": "1 day, 13:00:06", "throughput": 26835.75, "total_tokens": 3211550016} +{"current_steps": 11940, "total_steps": 25209, "loss": 0.9637, "lr": 3.3756824843034255e-05, "epoch": 1.4209242303658691, "percentage": 47.36, "elapsed_time": "1 day, 9:16:10", "remaining_time": "1 day, 12:58:22", "throughput": 26836.44, "total_tokens": 3214221184} +{"current_steps": 11950, "total_steps": 25209, "loss": 0.9699, "lr": 3.374913413488464e-05, "epoch": 1.4221142903895214, "percentage": 47.4, "elapsed_time": "1 day, 9:17:47", "remaining_time": "1 day, 12:56:38", "throughput": 26837.09, "total_tokens": 3216907968} +{"current_steps": 11960, "total_steps": 25209, "loss": 0.9776, "lr": 3.374144868078848e-05, "epoch": 1.423304350413174, "percentage": 47.44, "elapsed_time": "1 day, 9:19:27", "remaining_time": "1 day, 12:54:56", "throughput": 26836.89, "total_tokens": 3219550848} +{"current_steps": 11970, "total_steps": 25209, "loss": 0.9777, "lr": 3.373376847476615e-05, "epoch": 1.4244944104368265, "percentage": 47.48, "elapsed_time": "1 day, 9:21:05", "remaining_time": "1 day, 12:53:14", "throughput": 26837.15, "total_tokens": 3222226112} +{"current_steps": 11980, "total_steps": 25209, "loss": 0.9736, "lr": 3.3726093510847566e-05, "epoch": 1.425684470460479, "percentage": 47.52, "elapsed_time": "1 day, 9:22:42", "remaining_time": "1 day, 12:51:30", "throughput": 26837.79, "total_tokens": 3224899264} +{"current_steps": 11990, "total_steps": 25209, "loss": 0.9831, "lr": 3.371842378307212e-05, "epoch": 1.4268745304841313, "percentage": 47.56, "elapsed_time": "1 day, 9:24:23", "remaining_time": "1 day, 12:49:51", "throughput": 26837.8, "total_tokens": 3227616896} +{"current_steps": 12000, "total_steps": 25209, "loss": 0.9693, "lr": 3.371075928548872e-05, "epoch": 1.4280645905077838, "percentage": 47.6, "elapsed_time": "1 day, 9:25:59", "remaining_time": "1 day, 12:48:05", "throughput": 26838.86, "total_tokens": 3230309312} +{"current_steps": 12010, "total_steps": 25209, "loss": 0.975, "lr": 3.37031000121557e-05, "epoch": 1.429254650531436, "percentage": 47.64, "elapsed_time": "1 day, 9:27:36", "remaining_time": "1 day, 12:46:21", "throughput": 26839.3, "total_tokens": 3232956608} +{"current_steps": 12020, "total_steps": 25209, "loss": 0.9666, "lr": 3.369544595714088e-05, "epoch": 1.4304447105550886, "percentage": 47.68, "elapsed_time": "1 day, 9:29:15", "remaining_time": "1 day, 12:44:40", "throughput": 26839.43, "total_tokens": 3235645760} +{"current_steps": 12030, "total_steps": 25209, "loss": 0.9647, "lr": 3.368779711452148e-05, "epoch": 1.4316347705787411, "percentage": 47.72, "elapsed_time": "1 day, 9:30:56", "remaining_time": "1 day, 12:43:00", "throughput": 26839.52, "total_tokens": 3238364224} +{"current_steps": 12040, "total_steps": 25209, "loss": 0.9725, "lr": 3.368015347838413e-05, "epoch": 1.4328248306023936, "percentage": 47.76, "elapsed_time": "1 day, 9:32:34", "remaining_time": "1 day, 12:41:17", "throughput": 26839.97, "total_tokens": 3241042368} +{"current_steps": 12050, "total_steps": 25209, "loss": 0.9624, "lr": 3.3672515042824855e-05, "epoch": 1.434014890626046, "percentage": 47.8, "elapsed_time": "1 day, 9:34:06", "remaining_time": "1 day, 12:39:28", "throughput": 26841.35, "total_tokens": 3243694208} +{"current_steps": 12060, "total_steps": 25209, "loss": 0.969, "lr": 3.366488180194904e-05, "epoch": 1.4352049506496984, "percentage": 47.84, "elapsed_time": "1 day, 9:35:45", "remaining_time": "1 day, 12:37:46", "throughput": 26842.01, "total_tokens": 3246411136} +{"current_steps": 12070, "total_steps": 25209, "loss": 0.9664, "lr": 3.365725374987143e-05, "epoch": 1.4363950106733507, "percentage": 47.88, "elapsed_time": "1 day, 9:37:24", "remaining_time": "1 day, 12:36:05", "throughput": 26842.28, "total_tokens": 3249120832} +{"current_steps": 12080, "total_steps": 25209, "loss": 0.9799, "lr": 3.36496308807161e-05, "epoch": 1.4375850706970033, "percentage": 47.92, "elapsed_time": "1 day, 9:39:06", "remaining_time": "1 day, 12:34:26", "throughput": 26842.42, "total_tokens": 3251866752} +{"current_steps": 12090, "total_steps": 25209, "loss": 0.973, "lr": 3.3642013188616426e-05, "epoch": 1.4387751307206558, "percentage": 47.96, "elapsed_time": "1 day, 9:40:39", "remaining_time": "1 day, 12:32:37", "throughput": 26843.42, "total_tokens": 3254471488} +{"current_steps": 12100, "total_steps": 25209, "loss": 0.9715, "lr": 3.3634400667715074e-05, "epoch": 1.4399651907443083, "percentage": 48.0, "elapsed_time": "1 day, 9:42:14", "remaining_time": "1 day, 12:30:52", "throughput": 26844.19, "total_tokens": 3257122560} +{"current_steps": 12110, "total_steps": 25209, "loss": 0.9795, "lr": 3.3626793312164013e-05, "epoch": 1.4411552507679606, "percentage": 48.04, "elapsed_time": "1 day, 9:43:51", "remaining_time": "1 day, 12:29:08", "throughput": 26844.73, "total_tokens": 3259799680} +{"current_steps": 12120, "total_steps": 25209, "loss": 0.9873, "lr": 3.361919111612443e-05, "epoch": 1.442345310791613, "percentage": 48.08, "elapsed_time": "1 day, 9:45:31", "remaining_time": "1 day, 12:27:27", "throughput": 26844.95, "total_tokens": 3262494784} +{"current_steps": 12130, "total_steps": 25209, "loss": 0.9728, "lr": 3.361159407376678e-05, "epoch": 1.4435353708152654, "percentage": 48.12, "elapsed_time": "1 day, 9:47:04", "remaining_time": "1 day, 12:25:39", "throughput": 26846.13, "total_tokens": 3265138496} +{"current_steps": 12140, "total_steps": 25209, "loss": 0.9692, "lr": 3.3604002179270685e-05, "epoch": 1.444725430838918, "percentage": 48.16, "elapsed_time": "1 day, 9:48:40", "remaining_time": "1 day, 12:23:55", "throughput": 26846.66, "total_tokens": 3267791168} +{"current_steps": 12150, "total_steps": 25209, "loss": 0.9677, "lr": 3.359641542682504e-05, "epoch": 1.4459154908625704, "percentage": 48.2, "elapsed_time": "1 day, 9:50:23", "remaining_time": "1 day, 12:22:17", "throughput": 26846.4, "total_tokens": 3270525376} +{"current_steps": 12160, "total_steps": 25209, "loss": 0.9638, "lr": 3.3588833810627854e-05, "epoch": 1.447105550886223, "percentage": 48.24, "elapsed_time": "1 day, 9:52:03", "remaining_time": "1 day, 12:20:37", "throughput": 26846.73, "total_tokens": 3273252096} +{"current_steps": 12170, "total_steps": 25209, "loss": 0.9711, "lr": 3.358125732488632e-05, "epoch": 1.4482956109098752, "percentage": 48.28, "elapsed_time": "1 day, 9:53:41", "remaining_time": "1 day, 12:18:54", "throughput": 26847.08, "total_tokens": 3275926144} +{"current_steps": 12180, "total_steps": 25209, "loss": 0.98, "lr": 3.357368596381679e-05, "epoch": 1.4494856709335278, "percentage": 48.32, "elapsed_time": "1 day, 9:55:23", "remaining_time": "1 day, 12:17:16", "throughput": 26847.22, "total_tokens": 3278678912} +{"current_steps": 12190, "total_steps": 25209, "loss": 0.9707, "lr": 3.356611972164471e-05, "epoch": 1.45067573095718, "percentage": 48.36, "elapsed_time": "1 day, 9:56:56", "remaining_time": "1 day, 12:15:27", "throughput": 26848.56, "total_tokens": 3281328960} +{"current_steps": 12200, "total_steps": 25209, "loss": 0.9738, "lr": 3.355855859260466e-05, "epoch": 1.4518657909808326, "percentage": 48.4, "elapsed_time": "1 day, 9:58:38", "remaining_time": "1 day, 12:13:49", "throughput": 26848.54, "total_tokens": 3284070848} +{"current_steps": 12210, "total_steps": 25209, "loss": 0.9633, "lr": 3.3551002570940285e-05, "epoch": 1.453055851004485, "percentage": 48.44, "elapsed_time": "1 day, 10:00:15", "remaining_time": "1 day, 12:12:06", "throughput": 26849.0, "total_tokens": 3286739072} +{"current_steps": 12220, "total_steps": 25209, "loss": 0.9712, "lr": 3.354345165090431e-05, "epoch": 1.4542459110281376, "percentage": 48.47, "elapsed_time": "1 day, 10:01:54", "remaining_time": "1 day, 12:10:24", "throughput": 26849.3, "total_tokens": 3289432000} +{"current_steps": 12230, "total_steps": 25209, "loss": 0.9804, "lr": 3.3535905826758515e-05, "epoch": 1.45543597105179, "percentage": 48.51, "elapsed_time": "1 day, 10:03:32", "remaining_time": "1 day, 12:08:41", "throughput": 26850.02, "total_tokens": 3292147200} +{"current_steps": 12240, "total_steps": 25209, "loss": 0.9703, "lr": 3.352836509277369e-05, "epoch": 1.4566260310754424, "percentage": 48.55, "elapsed_time": "1 day, 10:05:09", "remaining_time": "1 day, 12:06:58", "throughput": 26850.9, "total_tokens": 3294866688} +{"current_steps": 12250, "total_steps": 25209, "loss": 0.9765, "lr": 3.352082944322966e-05, "epoch": 1.4578160910990947, "percentage": 48.59, "elapsed_time": "1 day, 10:06:45", "remaining_time": "1 day, 12:05:13", "throughput": 26851.92, "total_tokens": 3297572416} +{"current_steps": 12260, "total_steps": 25209, "loss": 0.9739, "lr": 3.351329887241524e-05, "epoch": 1.4590061511227472, "percentage": 48.63, "elapsed_time": "1 day, 10:08:21", "remaining_time": "1 day, 12:03:28", "throughput": 26852.82, "total_tokens": 3300241856} +{"current_steps": 12270, "total_steps": 25209, "loss": 0.9684, "lr": 3.3505773374628225e-05, "epoch": 1.4601962111463997, "percentage": 48.67, "elapsed_time": "1 day, 10:10:02", "remaining_time": "1 day, 12:01:49", "throughput": 26852.9, "total_tokens": 3302980288} +{"current_steps": 12280, "total_steps": 25209, "loss": 0.9723, "lr": 3.3498252944175354e-05, "epoch": 1.4613862711700523, "percentage": 48.71, "elapsed_time": "1 day, 10:11:40", "remaining_time": "1 day, 12:00:06", "throughput": 26853.42, "total_tokens": 3305672448} +{"current_steps": 12290, "total_steps": 25209, "loss": 0.9684, "lr": 3.3490737575372326e-05, "epoch": 1.4625763311937046, "percentage": 48.75, "elapsed_time": "1 day, 10:13:19", "remaining_time": "1 day, 11:58:24", "throughput": 26853.93, "total_tokens": 3308392896} +{"current_steps": 12300, "total_steps": 25209, "loss": 0.9796, "lr": 3.348322726254375e-05, "epoch": 1.463766391217357, "percentage": 48.79, "elapsed_time": "1 day, 10:14:52", "remaining_time": "1 day, 11:56:36", "throughput": 26855.1, "total_tokens": 3311020032} +{"current_steps": 12310, "total_steps": 25209, "loss": 0.9725, "lr": 3.347572200002315e-05, "epoch": 1.4649564512410094, "percentage": 48.83, "elapsed_time": "1 day, 10:16:34", "remaining_time": "1 day, 11:54:58", "throughput": 26854.58, "total_tokens": 3313713728} +{"current_steps": 12320, "total_steps": 25209, "loss": 0.9856, "lr": 3.3468221782152924e-05, "epoch": 1.466146511264662, "percentage": 48.87, "elapsed_time": "1 day, 10:18:13", "remaining_time": "1 day, 11:53:17", "throughput": 26854.85, "total_tokens": 3316412672} +{"current_steps": 12330, "total_steps": 25209, "loss": 0.9627, "lr": 3.346072660328435e-05, "epoch": 1.4673365712883144, "percentage": 48.91, "elapsed_time": "1 day, 10:19:52", "remaining_time": "1 day, 11:51:35", "throughput": 26855.4, "total_tokens": 3319123264} +{"current_steps": 12340, "total_steps": 25209, "loss": 0.9841, "lr": 3.345323645777756e-05, "epoch": 1.468526631311967, "percentage": 48.95, "elapsed_time": "1 day, 10:21:28", "remaining_time": "1 day, 11:49:51", "throughput": 26856.13, "total_tokens": 3321801408} +{"current_steps": 12350, "total_steps": 25209, "loss": 0.9667, "lr": 3.34457513400015e-05, "epoch": 1.4697166913356192, "percentage": 48.99, "elapsed_time": "1 day, 10:23:02", "remaining_time": "1 day, 11:48:03", "throughput": 26857.51, "total_tokens": 3324479296} +{"current_steps": 12360, "total_steps": 25209, "loss": 0.969, "lr": 3.343827124433396e-05, "epoch": 1.4709067513592717, "percentage": 49.03, "elapsed_time": "1 day, 10:24:38", "remaining_time": "1 day, 11:46:19", "throughput": 26858.34, "total_tokens": 3327164992} +{"current_steps": 12370, "total_steps": 25209, "loss": 0.9562, "lr": 3.343079616516151e-05, "epoch": 1.472096811382924, "percentage": 49.07, "elapsed_time": "1 day, 10:26:17", "remaining_time": "1 day, 11:44:38", "throughput": 26858.51, "total_tokens": 3329856384} +{"current_steps": 12380, "total_steps": 25209, "loss": 0.9835, "lr": 3.3423326096879495e-05, "epoch": 1.4732868714065765, "percentage": 49.11, "elapsed_time": "1 day, 10:28:02", "remaining_time": "1 day, 11:43:02", "throughput": 26858.11, "total_tokens": 3332618304} +{"current_steps": 12390, "total_steps": 25209, "loss": 0.9722, "lr": 3.341586103389203e-05, "epoch": 1.474476931430229, "percentage": 49.15, "elapsed_time": "1 day, 10:29:45", "remaining_time": "1 day, 11:41:25", "throughput": 26857.88, "total_tokens": 3335362688} +{"current_steps": 12400, "total_steps": 25209, "loss": 0.9566, "lr": 3.3408400970611995e-05, "epoch": 1.4756669914538816, "percentage": 49.19, "elapsed_time": "1 day, 10:31:20", "remaining_time": "1 day, 11:39:39", "throughput": 26858.76, "total_tokens": 3338022592} +{"current_steps": 12410, "total_steps": 25209, "loss": 0.9741, "lr": 3.340094590146095e-05, "epoch": 1.4768570514775339, "percentage": 49.23, "elapsed_time": "1 day, 10:33:01", "remaining_time": "1 day, 11:38:00", "throughput": 26858.92, "total_tokens": 3340747264} +{"current_steps": 12420, "total_steps": 25209, "loss": 0.9609, "lr": 3.3393495820869215e-05, "epoch": 1.4780471115011864, "percentage": 49.27, "elapsed_time": "1 day, 10:34:38", "remaining_time": "1 day, 11:36:16", "throughput": 26859.47, "total_tokens": 3343430144} +{"current_steps": 12430, "total_steps": 25209, "loss": 0.9601, "lr": 3.338605072327576e-05, "epoch": 1.4792371715248387, "percentage": 49.31, "elapsed_time": "1 day, 10:36:16", "remaining_time": "1 day, 11:34:34", "throughput": 26860.05, "total_tokens": 3346144448} +{"current_steps": 12440, "total_steps": 25209, "loss": 0.9692, "lr": 3.337861060312827e-05, "epoch": 1.4804272315484912, "percentage": 49.35, "elapsed_time": "1 day, 10:37:52", "remaining_time": "1 day, 11:32:50", "throughput": 26860.51, "total_tokens": 3348779136} +{"current_steps": 12450, "total_steps": 25209, "loss": 0.9704, "lr": 3.337117545488306e-05, "epoch": 1.4816172915721437, "percentage": 49.39, "elapsed_time": "1 day, 10:39:29", "remaining_time": "1 day, 11:31:05", "throughput": 26860.99, "total_tokens": 3351426496} +{"current_steps": 12460, "total_steps": 25209, "loss": 0.9641, "lr": 3.33637452730051e-05, "epoch": 1.4828073515957962, "percentage": 49.43, "elapsed_time": "1 day, 10:41:03", "remaining_time": "1 day, 11:29:19", "throughput": 26862.08, "total_tokens": 3354091968} +{"current_steps": 12470, "total_steps": 25209, "loss": 0.9848, "lr": 3.335632005196796e-05, "epoch": 1.4839974116194485, "percentage": 49.47, "elapsed_time": "1 day, 10:42:36", "remaining_time": "1 day, 11:27:32", "throughput": 26863.3, "total_tokens": 3356753984} +{"current_steps": 12480, "total_steps": 25209, "loss": 0.9656, "lr": 3.334889978625383e-05, "epoch": 1.485187471643101, "percentage": 49.51, "elapsed_time": "1 day, 10:44:11", "remaining_time": "1 day, 11:25:46", "throughput": 26864.35, "total_tokens": 3359415936} +{"current_steps": 12490, "total_steps": 25209, "loss": 0.9549, "lr": 3.3341484470353515e-05, "epoch": 1.4863775316667533, "percentage": 49.55, "elapsed_time": "1 day, 10:45:50", "remaining_time": "1 day, 11:24:04", "throughput": 26864.59, "total_tokens": 3362113664} +{"current_steps": 12500, "total_steps": 25209, "loss": 0.9843, "lr": 3.333407409876635e-05, "epoch": 1.4875675916904059, "percentage": 49.59, "elapsed_time": "1 day, 10:47:27", "remaining_time": "1 day, 11:22:21", "throughput": 26865.01, "total_tokens": 3364762368} +{"current_steps": 12510, "total_steps": 25209, "loss": 0.9674, "lr": 3.332666866600024e-05, "epoch": 1.4887576517140584, "percentage": 49.63, "elapsed_time": "1 day, 10:49:05", "remaining_time": "1 day, 11:20:39", "throughput": 26865.49, "total_tokens": 3367473600} +{"current_steps": 12520, "total_steps": 25209, "loss": 0.9719, "lr": 3.331926816657162e-05, "epoch": 1.489947711737711, "percentage": 49.66, "elapsed_time": "1 day, 10:50:47", "remaining_time": "1 day, 11:19:01", "throughput": 26865.37, "total_tokens": 3370202944} +{"current_steps": 12530, "total_steps": 25209, "loss": 0.9779, "lr": 3.331187259500546e-05, "epoch": 1.4911377717613632, "percentage": 49.7, "elapsed_time": "1 day, 10:52:20", "remaining_time": "1 day, 11:17:13", "throughput": 26866.46, "total_tokens": 3372819776} +{"current_steps": 12540, "total_steps": 25209, "loss": 0.9811, "lr": 3.3304481945835235e-05, "epoch": 1.4923278317850157, "percentage": 49.74, "elapsed_time": "1 day, 10:53:57", "remaining_time": "1 day, 11:15:29", "throughput": 26867.12, "total_tokens": 3375505088} +{"current_steps": 12550, "total_steps": 25209, "loss": 0.9602, "lr": 3.329709621360288e-05, "epoch": 1.493517891808668, "percentage": 49.78, "elapsed_time": "1 day, 10:55:36", "remaining_time": "1 day, 11:13:48", "throughput": 26867.29, "total_tokens": 3378194816} +{"current_steps": 12560, "total_steps": 25209, "loss": 0.9894, "lr": 3.328971539285882e-05, "epoch": 1.4947079518323205, "percentage": 49.82, "elapsed_time": "1 day, 10:57:11", "remaining_time": "1 day, 11:12:03", "throughput": 26868.26, "total_tokens": 3380880832} +{"current_steps": 12570, "total_steps": 25209, "loss": 0.9737, "lr": 3.3282339478161935e-05, "epoch": 1.495898011855973, "percentage": 49.86, "elapsed_time": "1 day, 10:58:48", "remaining_time": "1 day, 11:10:19", "throughput": 26868.87, "total_tokens": 3383554176} +{"current_steps": 12580, "total_steps": 25209, "loss": 0.9762, "lr": 3.327496846407953e-05, "epoch": 1.4970880718796256, "percentage": 49.9, "elapsed_time": "1 day, 11:00:25", "remaining_time": "1 day, 11:08:36", "throughput": 26869.65, "total_tokens": 3386254528} +{"current_steps": 12590, "total_steps": 25209, "loss": 0.9703, "lr": 3.3267602345187304e-05, "epoch": 1.4982781319032779, "percentage": 49.94, "elapsed_time": "1 day, 11:02:05", "remaining_time": "1 day, 11:06:55", "throughput": 26869.5, "total_tokens": 3388921408} +{"current_steps": 12600, "total_steps": 25209, "loss": 0.9765, "lr": 3.326024111606942e-05, "epoch": 1.4994681919269304, "percentage": 49.98, "elapsed_time": "1 day, 11:03:41", "remaining_time": "1 day, 11:05:11", "throughput": 26870.51, "total_tokens": 3391630208} +{"current_steps": 12610, "total_steps": 25209, "loss": 0.9675, "lr": 3.325288477131839e-05, "epoch": 1.5006582519505827, "percentage": 50.02, "elapsed_time": "1 day, 11:05:17", "remaining_time": "1 day, 11:03:27", "throughput": 26871.3, "total_tokens": 3394317440} +{"current_steps": 12620, "total_steps": 25209, "loss": 0.964, "lr": 3.324553330553507e-05, "epoch": 1.5018483119742352, "percentage": 50.06, "elapsed_time": "1 day, 11:06:59", "remaining_time": "1 day, 11:01:48", "throughput": 26871.38, "total_tokens": 3397064640} +{"current_steps": 12630, "total_steps": 25209, "loss": 0.9759, "lr": 3.323818671332871e-05, "epoch": 1.5030383719978877, "percentage": 50.1, "elapsed_time": "1 day, 11:08:38", "remaining_time": "1 day, 11:00:07", "throughput": 26872.01, "total_tokens": 3399811456} +{"current_steps": 12640, "total_steps": 25209, "loss": 0.9682, "lr": 3.323084498931687e-05, "epoch": 1.5042284320215402, "percentage": 50.14, "elapsed_time": "1 day, 11:10:15", "remaining_time": "1 day, 10:58:24", "throughput": 26872.53, "total_tokens": 3402479040} +{"current_steps": 12650, "total_steps": 25209, "loss": 0.9736, "lr": 3.322350812812545e-05, "epoch": 1.5054184920451925, "percentage": 50.18, "elapsed_time": "1 day, 11:11:51", "remaining_time": "1 day, 10:56:39", "throughput": 26873.38, "total_tokens": 3405154176} +{"current_steps": 12660, "total_steps": 25209, "loss": 0.9593, "lr": 3.321617612438862e-05, "epoch": 1.5066085520688448, "percentage": 50.22, "elapsed_time": "1 day, 11:13:27", "remaining_time": "1 day, 10:54:55", "throughput": 26874.28, "total_tokens": 3407855808} +{"current_steps": 12670, "total_steps": 25209, "loss": 0.9698, "lr": 3.320884897274886e-05, "epoch": 1.5077986120924973, "percentage": 50.26, "elapsed_time": "1 day, 11:15:00", "remaining_time": "1 day, 10:53:08", "throughput": 26875.22, "total_tokens": 3410486400} +{"current_steps": 12680, "total_steps": 25209, "loss": 0.9764, "lr": 3.320152666785692e-05, "epoch": 1.5089886721161498, "percentage": 50.3, "elapsed_time": "1 day, 11:16:44", "remaining_time": "1 day, 10:51:32", "throughput": 26874.79, "total_tokens": 3413227968} +{"current_steps": 12690, "total_steps": 25209, "loss": 0.9618, "lr": 3.319420920437179e-05, "epoch": 1.5101787321398024, "percentage": 50.34, "elapsed_time": "1 day, 11:18:22", "remaining_time": "1 day, 10:49:49", "throughput": 26875.46, "total_tokens": 3415933888} +{"current_steps": 12700, "total_steps": 25209, "loss": 0.9644, "lr": 3.31868965769607e-05, "epoch": 1.5113687921634549, "percentage": 50.38, "elapsed_time": "1 day, 11:19:59", "remaining_time": "1 day, 10:48:06", "throughput": 26875.82, "total_tokens": 3418598400} +{"current_steps": 12710, "total_steps": 25209, "loss": 0.9718, "lr": 3.317958878029911e-05, "epoch": 1.5125588521871072, "percentage": 50.42, "elapsed_time": "1 day, 11:21:37", "remaining_time": "1 day, 10:46:24", "throughput": 26876.61, "total_tokens": 3421326336} +{"current_steps": 12720, "total_steps": 25209, "loss": 0.9656, "lr": 3.3172285809070665e-05, "epoch": 1.5137489122107595, "percentage": 50.46, "elapsed_time": "1 day, 11:23:16", "remaining_time": "1 day, 10:44:43", "throughput": 26877.02, "total_tokens": 3424046912} +{"current_steps": 12730, "total_steps": 25209, "loss": 0.9718, "lr": 3.3164987657967214e-05, "epoch": 1.514938972234412, "percentage": 50.5, "elapsed_time": "1 day, 11:24:54", "remaining_time": "1 day, 10:43:00", "throughput": 26878.13, "total_tokens": 3426817408} +{"current_steps": 12740, "total_steps": 25209, "loss": 0.9612, "lr": 3.315769432168877e-05, "epoch": 1.5161290322580645, "percentage": 50.54, "elapsed_time": "1 day, 11:26:29", "remaining_time": "1 day, 10:41:15", "throughput": 26879.03, "total_tokens": 3429475264} +{"current_steps": 12750, "total_steps": 25209, "loss": 0.9671, "lr": 3.315040579494349e-05, "epoch": 1.517319092281717, "percentage": 50.58, "elapsed_time": "1 day, 11:28:03", "remaining_time": "1 day, 10:39:29", "throughput": 26880.18, "total_tokens": 3432155264} +{"current_steps": 12760, "total_steps": 25209, "loss": 0.9703, "lr": 3.31431220724477e-05, "epoch": 1.5185091523053695, "percentage": 50.62, "elapsed_time": "1 day, 11:29:41", "remaining_time": "1 day, 10:37:46", "throughput": 26880.91, "total_tokens": 3434872768} +{"current_steps": 12770, "total_steps": 25209, "loss": 0.9745, "lr": 3.3135843148925834e-05, "epoch": 1.5196992123290218, "percentage": 50.66, "elapsed_time": "1 day, 11:31:20", "remaining_time": "1 day, 10:36:05", "throughput": 26881.44, "total_tokens": 3437614656} +{"current_steps": 12780, "total_steps": 25209, "loss": 0.9652, "lr": 3.3128569019110414e-05, "epoch": 1.5208892723526741, "percentage": 50.7, "elapsed_time": "1 day, 11:32:57", "remaining_time": "1 day, 10:34:22", "throughput": 26882.19, "total_tokens": 3440322304} +{"current_steps": 12790, "total_steps": 25209, "loss": 0.9762, "lr": 3.312129967774207e-05, "epoch": 1.5220793323763266, "percentage": 50.74, "elapsed_time": "1 day, 11:34:33", "remaining_time": "1 day, 10:32:38", "throughput": 26882.95, "total_tokens": 3443003904} +{"current_steps": 12800, "total_steps": 25209, "loss": 0.9762, "lr": 3.311403511956952e-05, "epoch": 1.5232693923999792, "percentage": 50.78, "elapsed_time": "1 day, 11:36:03", "remaining_time": "1 day, 10:30:48", "throughput": 26884.57, "total_tokens": 3445628096} +{"current_steps": 12810, "total_steps": 25209, "loss": 0.9689, "lr": 3.310677533934952e-05, "epoch": 1.5244594524236317, "percentage": 50.82, "elapsed_time": "1 day, 11:37:42", "remaining_time": "1 day, 10:29:07", "throughput": 26884.53, "total_tokens": 3448286912} +{"current_steps": 12820, "total_steps": 25209, "loss": 0.9676, "lr": 3.309952033184686e-05, "epoch": 1.5256495124472842, "percentage": 50.85, "elapsed_time": "1 day, 11:39:19", "remaining_time": "1 day, 10:27:24", "throughput": 26885.49, "total_tokens": 3451006720} +{"current_steps": 12830, "total_steps": 25209, "loss": 0.9738, "lr": 3.309227009183439e-05, "epoch": 1.5268395724709365, "percentage": 50.89, "elapsed_time": "1 day, 11:41:04", "remaining_time": "1 day, 10:25:48", "throughput": 26885.16, "total_tokens": 3453777152} +{"current_steps": 12840, "total_steps": 25209, "loss": 0.963, "lr": 3.308502461409295e-05, "epoch": 1.5280296324945888, "percentage": 50.93, "elapsed_time": "1 day, 11:42:41", "remaining_time": "1 day, 10:24:05", "throughput": 26885.64, "total_tokens": 3456468800} +{"current_steps": 12850, "total_steps": 25209, "loss": 0.9685, "lr": 3.3077783893411386e-05, "epoch": 1.5292196925182413, "percentage": 50.97, "elapsed_time": "1 day, 11:44:22", "remaining_time": "1 day, 10:22:26", "throughput": 26885.92, "total_tokens": 3459202240} +{"current_steps": 12860, "total_steps": 25209, "loss": 0.9808, "lr": 3.30705479245865e-05, "epoch": 1.5304097525418938, "percentage": 51.01, "elapsed_time": "1 day, 11:45:59", "remaining_time": "1 day, 10:20:42", "throughput": 26886.5, "total_tokens": 3461883904} +{"current_steps": 12870, "total_steps": 25209, "loss": 0.9513, "lr": 3.3063316702423094e-05, "epoch": 1.5315998125655463, "percentage": 51.05, "elapsed_time": "1 day, 11:47:31", "remaining_time": "1 day, 10:18:55", "throughput": 26887.51, "total_tokens": 3464501440} +{"current_steps": 12880, "total_steps": 25209, "loss": 0.9623, "lr": 3.305609022173388e-05, "epoch": 1.5327898725891989, "percentage": 51.09, "elapsed_time": "1 day, 11:49:09", "remaining_time": "1 day, 10:17:12", "throughput": 26887.85, "total_tokens": 3467170304} +{"current_steps": 12890, "total_steps": 25209, "loss": 0.9674, "lr": 3.304886847733954e-05, "epoch": 1.5339799326128511, "percentage": 51.13, "elapsed_time": "1 day, 11:50:44", "remaining_time": "1 day, 10:15:28", "throughput": 26888.54, "total_tokens": 3469829312} +{"current_steps": 12900, "total_steps": 25209, "loss": 0.968, "lr": 3.304165146406865e-05, "epoch": 1.5351699926365034, "percentage": 51.17, "elapsed_time": "1 day, 11:52:18", "remaining_time": "1 day, 10:13:42", "throughput": 26889.45, "total_tokens": 3472473088} +{"current_steps": 12910, "total_steps": 25209, "loss": 0.9745, "lr": 3.30344391767577e-05, "epoch": 1.536360052660156, "percentage": 51.21, "elapsed_time": "1 day, 11:53:58", "remaining_time": "1 day, 10:12:01", "throughput": 26889.57, "total_tokens": 3475162752} +{"current_steps": 12920, "total_steps": 25209, "loss": 0.9754, "lr": 3.302723161025104e-05, "epoch": 1.5375501126838085, "percentage": 51.25, "elapsed_time": "1 day, 11:55:35", "remaining_time": "1 day, 10:10:18", "throughput": 26890.19, "total_tokens": 3477849344} +{"current_steps": 12930, "total_steps": 25209, "loss": 0.9605, "lr": 3.302002875940093e-05, "epoch": 1.538740172707461, "percentage": 51.29, "elapsed_time": "1 day, 11:57:15", "remaining_time": "1 day, 10:08:38", "throughput": 26890.35, "total_tokens": 3480566272} +{"current_steps": 12940, "total_steps": 25209, "loss": 0.9623, "lr": 3.3012830619067466e-05, "epoch": 1.5399302327311135, "percentage": 51.33, "elapsed_time": "1 day, 11:58:52", "remaining_time": "1 day, 10:06:55", "throughput": 26890.91, "total_tokens": 3483256576} +{"current_steps": 12950, "total_steps": 25209, "loss": 0.9703, "lr": 3.300563718411857e-05, "epoch": 1.5411202927547658, "percentage": 51.37, "elapsed_time": "1 day, 12:00:30", "remaining_time": "1 day, 10:05:13", "throughput": 26891.57, "total_tokens": 3485965952} +{"current_steps": 12960, "total_steps": 25209, "loss": 0.9655, "lr": 3.299844844943e-05, "epoch": 1.542310352778418, "percentage": 51.41, "elapsed_time": "1 day, 12:02:04", "remaining_time": "1 day, 10:03:27", "throughput": 26892.66, "total_tokens": 3488634752} +{"current_steps": 12970, "total_steps": 25209, "loss": 0.9737, "lr": 3.299126440988535e-05, "epoch": 1.5435004128020706, "percentage": 51.45, "elapsed_time": "1 day, 12:03:40", "remaining_time": "1 day, 10:01:44", "throughput": 26893.29, "total_tokens": 3491311616} +{"current_steps": 12980, "total_steps": 25209, "loss": 0.9635, "lr": 3.298408506037596e-05, "epoch": 1.5446904728257231, "percentage": 51.49, "elapsed_time": "1 day, 12:05:22", "remaining_time": "1 day, 10:00:05", "throughput": 26893.42, "total_tokens": 3494049984} +{"current_steps": 12990, "total_steps": 25209, "loss": 0.9674, "lr": 3.297691039580097e-05, "epoch": 1.5458805328493757, "percentage": 51.53, "elapsed_time": "1 day, 12:06:59", "remaining_time": "1 day, 9:58:22", "throughput": 26894.32, "total_tokens": 3496776832} +{"current_steps": 13000, "total_steps": 25209, "loss": 0.9666, "lr": 3.29697404110673e-05, "epoch": 1.5470705928730282, "percentage": 51.57, "elapsed_time": "1 day, 12:08:41", "remaining_time": "1 day, 9:56:43", "throughput": 26894.12, "total_tokens": 3499494656} +{"current_steps": 13010, "total_steps": 25209, "loss": 0.9694, "lr": 3.2962575101089594e-05, "epoch": 1.5482606528966805, "percentage": 51.61, "elapsed_time": "1 day, 12:10:22", "remaining_time": "1 day, 9:55:04", "throughput": 26894.04, "total_tokens": 3502212544} +{"current_steps": 13020, "total_steps": 25209, "loss": 0.9814, "lr": 3.295541446079024e-05, "epoch": 1.5494507129203328, "percentage": 51.65, "elapsed_time": "1 day, 12:11:56", "remaining_time": "1 day, 9:53:18", "throughput": 26895.2, "total_tokens": 3504885632} +{"current_steps": 13030, "total_steps": 25209, "loss": 0.9637, "lr": 3.2948258485099336e-05, "epoch": 1.5506407729439853, "percentage": 51.69, "elapsed_time": "1 day, 12:13:34", "remaining_time": "1 day, 9:51:37", "throughput": 26895.53, "total_tokens": 3507580416} +{"current_steps": 13040, "total_steps": 25209, "loss": 0.9669, "lr": 3.29411071689547e-05, "epoch": 1.5518308329676378, "percentage": 51.73, "elapsed_time": "1 day, 12:15:13", "remaining_time": "1 day, 9:49:56", "throughput": 26896.13, "total_tokens": 3510319680} +{"current_steps": 13050, "total_steps": 25209, "loss": 0.9601, "lr": 3.2933960507301826e-05, "epoch": 1.5530208929912903, "percentage": 51.77, "elapsed_time": "1 day, 12:16:47", "remaining_time": "1 day, 9:48:10", "throughput": 26897.13, "total_tokens": 3512968704} +{"current_steps": 13060, "total_steps": 25209, "loss": 0.9747, "lr": 3.292681849509387e-05, "epoch": 1.5542109530149428, "percentage": 51.81, "elapsed_time": "1 day, 12:18:23", "remaining_time": "1 day, 9:46:26", "throughput": 26897.99, "total_tokens": 3515654848} +{"current_steps": 13070, "total_steps": 25209, "loss": 0.9801, "lr": 3.291968112729166e-05, "epoch": 1.5554010130385951, "percentage": 51.85, "elapsed_time": "1 day, 12:19:59", "remaining_time": "1 day, 9:44:42", "throughput": 26898.63, "total_tokens": 3518334208} +{"current_steps": 13080, "total_steps": 25209, "loss": 0.9697, "lr": 3.291254839886367e-05, "epoch": 1.5565910730622474, "percentage": 51.89, "elapsed_time": "1 day, 12:21:34", "remaining_time": "1 day, 9:42:57", "throughput": 26899.48, "total_tokens": 3520994432} +{"current_steps": 13090, "total_steps": 25209, "loss": 0.9659, "lr": 3.2905420304785995e-05, "epoch": 1.5577811330859, "percentage": 51.93, "elapsed_time": "1 day, 12:23:13", "remaining_time": "1 day, 9:41:16", "throughput": 26899.98, "total_tokens": 3523720768} +{"current_steps": 13100, "total_steps": 25209, "loss": 0.9638, "lr": 3.289829684004235e-05, "epoch": 1.5589711931095525, "percentage": 51.97, "elapsed_time": "1 day, 12:24:54", "remaining_time": "1 day, 9:39:37", "throughput": 26900.17, "total_tokens": 3526460032} +{"current_steps": 13110, "total_steps": 25209, "loss": 0.9697, "lr": 3.289117799962402e-05, "epoch": 1.560161253133205, "percentage": 52.01, "elapsed_time": "1 day, 12:26:33", "remaining_time": "1 day, 9:37:56", "throughput": 26900.56, "total_tokens": 3529171520} +{"current_steps": 13120, "total_steps": 25209, "loss": 0.9757, "lr": 3.2884063778529914e-05, "epoch": 1.5613513131568575, "percentage": 52.04, "elapsed_time": "1 day, 12:28:04", "remaining_time": "1 day, 9:36:08", "throughput": 26901.91, "total_tokens": 3531817408} +{"current_steps": 13130, "total_steps": 25209, "loss": 0.9914, "lr": 3.28769541717665e-05, "epoch": 1.5625413731805098, "percentage": 52.08, "elapsed_time": "1 day, 12:29:43", "remaining_time": "1 day, 9:34:26", "throughput": 26902.49, "total_tokens": 3534545152} +{"current_steps": 13140, "total_steps": 25209, "loss": 0.9636, "lr": 3.2869849174347775e-05, "epoch": 1.563731433204162, "percentage": 52.12, "elapsed_time": "1 day, 12:31:27", "remaining_time": "1 day, 9:32:50", "throughput": 26902.23, "total_tokens": 3537297216} +{"current_steps": 13150, "total_steps": 25209, "loss": 0.9695, "lr": 3.2862748781295294e-05, "epoch": 1.5649214932278146, "percentage": 52.16, "elapsed_time": "1 day, 12:33:06", "remaining_time": "1 day, 9:31:09", "throughput": 26902.7, "total_tokens": 3540033600} +{"current_steps": 13160, "total_steps": 25209, "loss": 0.9642, "lr": 3.2855652987638146e-05, "epoch": 1.5661115532514671, "percentage": 52.2, "elapsed_time": "1 day, 12:34:45", "remaining_time": "1 day, 9:29:28", "throughput": 26903.01, "total_tokens": 3542729664} +{"current_steps": 13170, "total_steps": 25209, "loss": 0.99, "lr": 3.284856178841291e-05, "epoch": 1.5673016132751196, "percentage": 52.24, "elapsed_time": "1 day, 12:36:20", "remaining_time": "1 day, 9:27:43", "throughput": 26903.63, "total_tokens": 3545373632} +{"current_steps": 13180, "total_steps": 25209, "loss": 0.9676, "lr": 3.284147517866367e-05, "epoch": 1.5684916732987721, "percentage": 52.28, "elapsed_time": "1 day, 12:37:54", "remaining_time": "1 day, 9:25:57", "throughput": 26904.93, "total_tokens": 3548069184} +{"current_steps": 13190, "total_steps": 25209, "loss": 0.9665, "lr": 3.2834393153441976e-05, "epoch": 1.5696817333224244, "percentage": 52.32, "elapsed_time": "1 day, 12:39:31", "remaining_time": "1 day, 9:24:15", "throughput": 26905.38, "total_tokens": 3550740928} +{"current_steps": 13200, "total_steps": 25209, "loss": 0.9566, "lr": 3.282731570780689e-05, "epoch": 1.5708717933460767, "percentage": 52.36, "elapsed_time": "1 day, 12:41:12", "remaining_time": "1 day, 9:22:35", "throughput": 26905.38, "total_tokens": 3553460480} +{"current_steps": 13210, "total_steps": 25209, "loss": 0.9718, "lr": 3.2820242836824875e-05, "epoch": 1.5720618533697293, "percentage": 52.4, "elapsed_time": "1 day, 12:42:52", "remaining_time": "1 day, 9:20:55", "throughput": 26905.46, "total_tokens": 3556157056} +{"current_steps": 13220, "total_steps": 25209, "loss": 0.9849, "lr": 3.2813174535569854e-05, "epoch": 1.5732519133933818, "percentage": 52.44, "elapsed_time": "1 day, 12:44:27", "remaining_time": "1 day, 9:19:11", "throughput": 26906.26, "total_tokens": 3558822272} +{"current_steps": 13230, "total_steps": 25209, "loss": 0.9692, "lr": 3.280611079912318e-05, "epoch": 1.5744419734170343, "percentage": 52.48, "elapsed_time": "1 day, 12:46:06", "remaining_time": "1 day, 9:17:30", "throughput": 26906.43, "total_tokens": 3561505664} +{"current_steps": 13240, "total_steps": 25209, "loss": 0.9651, "lr": 3.279905162257358e-05, "epoch": 1.5756320334406868, "percentage": 52.52, "elapsed_time": "1 day, 12:47:40", "remaining_time": "1 day, 9:15:45", "throughput": 26907.15, "total_tokens": 3564144832} +{"current_steps": 13250, "total_steps": 25209, "loss": 0.9793, "lr": 3.279199700101723e-05, "epoch": 1.576822093464339, "percentage": 52.56, "elapsed_time": "1 day, 12:49:16", "remaining_time": "1 day, 9:14:01", "throughput": 26907.76, "total_tokens": 3566811712} +{"current_steps": 13260, "total_steps": 25209, "loss": 0.9614, "lr": 3.2784946929557644e-05, "epoch": 1.5780121534879914, "percentage": 52.6, "elapsed_time": "1 day, 12:50:49", "remaining_time": "1 day, 9:12:14", "throughput": 26909.0, "total_tokens": 3569465600} +{"current_steps": 13270, "total_steps": 25209, "loss": 0.9698, "lr": 3.277790140330571e-05, "epoch": 1.579202213511644, "percentage": 52.64, "elapsed_time": "1 day, 12:52:26", "remaining_time": "1 day, 9:10:31", "throughput": 26909.6, "total_tokens": 3572152064} +{"current_steps": 13280, "total_steps": 25209, "loss": 0.9752, "lr": 3.277086041737968e-05, "epoch": 1.5803922735352964, "percentage": 52.68, "elapsed_time": "1 day, 12:54:00", "remaining_time": "1 day, 9:08:46", "throughput": 26910.79, "total_tokens": 3574852032} +{"current_steps": 13290, "total_steps": 25209, "loss": 0.9657, "lr": 3.276382396690513e-05, "epoch": 1.581582333558949, "percentage": 52.72, "elapsed_time": "1 day, 12:55:39", "remaining_time": "1 day, 9:07:05", "throughput": 26911.13, "total_tokens": 3577544384} +{"current_steps": 13300, "total_steps": 25209, "loss": 0.9634, "lr": 3.275679204701496e-05, "epoch": 1.5827723935826015, "percentage": 52.76, "elapsed_time": "1 day, 12:57:19", "remaining_time": "1 day, 9:05:25", "throughput": 26911.29, "total_tokens": 3580277632} +{"current_steps": 13310, "total_steps": 25209, "loss": 0.9752, "lr": 3.274976465284939e-05, "epoch": 1.5839624536062538, "percentage": 52.8, "elapsed_time": "1 day, 12:58:58", "remaining_time": "1 day, 9:03:44", "throughput": 26911.84, "total_tokens": 3583012096} +{"current_steps": 13320, "total_steps": 25209, "loss": 0.9704, "lr": 3.274274177955593e-05, "epoch": 1.585152513629906, "percentage": 52.84, "elapsed_time": "1 day, 13:00:38", "remaining_time": "1 day, 9:02:04", "throughput": 26912.07, "total_tokens": 3585723648} +{"current_steps": 13330, "total_steps": 25209, "loss": 0.9595, "lr": 3.273572342228937e-05, "epoch": 1.5863425736535586, "percentage": 52.88, "elapsed_time": "1 day, 13:02:19", "remaining_time": "1 day, 9:00:24", "throughput": 26912.41, "total_tokens": 3588477888} +{"current_steps": 13340, "total_steps": 25209, "loss": 0.9481, "lr": 3.272870957621176e-05, "epoch": 1.587532633677211, "percentage": 52.92, "elapsed_time": "1 day, 13:03:58", "remaining_time": "1 day, 8:58:44", "throughput": 26913.13, "total_tokens": 3591252800} +{"current_steps": 13350, "total_steps": 25209, "loss": 0.9565, "lr": 3.2721700236492414e-05, "epoch": 1.5887226937008636, "percentage": 52.96, "elapsed_time": "1 day, 13:05:36", "remaining_time": "1 day, 8:57:02", "throughput": 26913.69, "total_tokens": 3593963648} +{"current_steps": 13360, "total_steps": 25209, "loss": 0.9597, "lr": 3.271469539830788e-05, "epoch": 1.5899127537245161, "percentage": 53.0, "elapsed_time": "1 day, 13:07:15", "remaining_time": "1 day, 8:55:21", "throughput": 26914.36, "total_tokens": 3596702784} +{"current_steps": 13370, "total_steps": 25209, "loss": 0.9804, "lr": 3.270769505684193e-05, "epoch": 1.5911028137481684, "percentage": 53.04, "elapsed_time": "1 day, 13:08:47", "remaining_time": "1 day, 8:53:34", "throughput": 26915.69, "total_tokens": 3599364160} +{"current_steps": 13380, "total_steps": 25209, "loss": 0.9473, "lr": 3.2700699207285544e-05, "epoch": 1.5922928737718207, "percentage": 53.08, "elapsed_time": "1 day, 13:10:22", "remaining_time": "1 day, 8:51:50", "throughput": 26916.44, "total_tokens": 3602038400} +{"current_steps": 13390, "total_steps": 25209, "loss": 0.9583, "lr": 3.269370784483691e-05, "epoch": 1.5934829337954732, "percentage": 53.12, "elapsed_time": "1 day, 13:11:59", "remaining_time": "1 day, 8:50:07", "throughput": 26917.04, "total_tokens": 3604723520} +{"current_steps": 13400, "total_steps": 25209, "loss": 0.9706, "lr": 3.268672096470138e-05, "epoch": 1.5946729938191258, "percentage": 53.16, "elapsed_time": "1 day, 13:13:35", "remaining_time": "1 day, 8:48:23", "throughput": 26918.03, "total_tokens": 3607430912} +{"current_steps": 13410, "total_steps": 25209, "loss": 0.9776, "lr": 3.2679738562091506e-05, "epoch": 1.5958630538427783, "percentage": 53.2, "elapsed_time": "1 day, 13:15:11", "remaining_time": "1 day, 8:46:39", "throughput": 26918.69, "total_tokens": 3610098688} +{"current_steps": 13420, "total_steps": 25209, "loss": 0.9638, "lr": 3.2672760632226964e-05, "epoch": 1.5970531138664308, "percentage": 53.23, "elapsed_time": "1 day, 13:16:49", "remaining_time": "1 day, 8:44:58", "throughput": 26918.91, "total_tokens": 3612781696} +{"current_steps": 13430, "total_steps": 25209, "loss": 0.9713, "lr": 3.266578717033458e-05, "epoch": 1.598243173890083, "percentage": 53.27, "elapsed_time": "1 day, 13:18:28", "remaining_time": "1 day, 8:43:17", "throughput": 26918.99, "total_tokens": 3615460992} +{"current_steps": 13440, "total_steps": 25209, "loss": 0.9756, "lr": 3.265881817164833e-05, "epoch": 1.5994332339137354, "percentage": 53.31, "elapsed_time": "1 day, 13:20:05", "remaining_time": "1 day, 8:41:34", "throughput": 26919.69, "total_tokens": 3618148288} +{"current_steps": 13450, "total_steps": 25209, "loss": 0.9682, "lr": 3.265185363140928e-05, "epoch": 1.600623293937388, "percentage": 53.35, "elapsed_time": "1 day, 13:21:46", "remaining_time": "1 day, 8:39:55", "throughput": 26919.91, "total_tokens": 3620898944} +{"current_steps": 13460, "total_steps": 25209, "loss": 0.9702, "lr": 3.26448935448656e-05, "epoch": 1.6018133539610404, "percentage": 53.39, "elapsed_time": "1 day, 13:23:22", "remaining_time": "1 day, 8:38:12", "throughput": 26920.39, "total_tokens": 3623563328} +{"current_steps": 13470, "total_steps": 25209, "loss": 0.9551, "lr": 3.263793790727256e-05, "epoch": 1.603003413984693, "percentage": 53.43, "elapsed_time": "1 day, 13:24:59", "remaining_time": "1 day, 8:36:29", "throughput": 26920.9, "total_tokens": 3626230208} +{"current_steps": 13480, "total_steps": 25209, "loss": 0.968, "lr": 3.2630986713892495e-05, "epoch": 1.6041934740083454, "percentage": 53.47, "elapsed_time": "1 day, 13:26:37", "remaining_time": "1 day, 8:34:47", "throughput": 26921.4, "total_tokens": 3628937856} +{"current_steps": 13490, "total_steps": 25209, "loss": 0.9682, "lr": 3.26240399599948e-05, "epoch": 1.6053835340319977, "percentage": 53.51, "elapsed_time": "1 day, 13:28:18", "remaining_time": "1 day, 8:33:08", "throughput": 26921.82, "total_tokens": 3631715840} +{"current_steps": 13500, "total_steps": 25209, "loss": 0.9773, "lr": 3.2617097640855914e-05, "epoch": 1.60657359405565, "percentage": 53.55, "elapsed_time": "1 day, 13:29:52", "remaining_time": "1 day, 8:31:23", "throughput": 26922.73, "total_tokens": 3634356800} +{"current_steps": 13510, "total_steps": 25209, "loss": 0.9776, "lr": 3.2610159751759314e-05, "epoch": 1.6077636540793026, "percentage": 53.59, "elapsed_time": "1 day, 13:31:35", "remaining_time": "1 day, 8:29:45", "throughput": 26922.55, "total_tokens": 3637110016} +{"current_steps": 13520, "total_steps": 25209, "loss": 0.9675, "lr": 3.26032262879955e-05, "epoch": 1.608953714102955, "percentage": 53.63, "elapsed_time": "1 day, 13:33:15", "remaining_time": "1 day, 8:28:06", "throughput": 26922.77, "total_tokens": 3639840128} +{"current_steps": 13530, "total_steps": 25209, "loss": 0.9696, "lr": 3.259629724486198e-05, "epoch": 1.6101437741266076, "percentage": 53.67, "elapsed_time": "1 day, 13:34:51", "remaining_time": "1 day, 8:26:22", "throughput": 26923.48, "total_tokens": 3642526528} +{"current_steps": 13540, "total_steps": 25209, "loss": 0.9634, "lr": 3.258937261766323e-05, "epoch": 1.61133383415026, "percentage": 53.71, "elapsed_time": "1 day, 13:36:31", "remaining_time": "1 day, 8:24:42", "throughput": 26923.77, "total_tokens": 3645251264} +{"current_steps": 13550, "total_steps": 25209, "loss": 0.9698, "lr": 3.258245240171074e-05, "epoch": 1.6125238941739124, "percentage": 53.75, "elapsed_time": "1 day, 13:38:07", "remaining_time": "1 day, 8:22:59", "throughput": 26924.46, "total_tokens": 3647928640} +{"current_steps": 13560, "total_steps": 25209, "loss": 0.9649, "lr": 3.2575536592322935e-05, "epoch": 1.6137139541975647, "percentage": 53.79, "elapsed_time": "1 day, 13:39:42", "remaining_time": "1 day, 8:21:14", "throughput": 26925.49, "total_tokens": 3650615488} +{"current_steps": 13570, "total_steps": 25209, "loss": 0.9654, "lr": 3.256862518482523e-05, "epoch": 1.6149040142212172, "percentage": 53.83, "elapsed_time": "1 day, 13:41:19", "remaining_time": "1 day, 8:19:32", "throughput": 26925.8, "total_tokens": 3653277952} +{"current_steps": 13580, "total_steps": 25209, "loss": 0.96, "lr": 3.256171817454994e-05, "epoch": 1.6160940742448697, "percentage": 53.87, "elapsed_time": "1 day, 13:42:52", "remaining_time": "1 day, 8:17:46", "throughput": 26927.03, "total_tokens": 3655960576} +{"current_steps": 13590, "total_steps": 25209, "loss": 0.9885, "lr": 3.255481555683633e-05, "epoch": 1.6172841342685222, "percentage": 53.91, "elapsed_time": "1 day, 13:44:26", "remaining_time": "1 day, 8:16:01", "throughput": 26928.13, "total_tokens": 3658639744} +{"current_steps": 13600, "total_steps": 25209, "loss": 0.975, "lr": 3.254791732703057e-05, "epoch": 1.6184741942921748, "percentage": 53.95, "elapsed_time": "1 day, 13:46:04", "remaining_time": "1 day, 8:14:19", "throughput": 26928.58, "total_tokens": 3661328704} +{"current_steps": 13610, "total_steps": 25209, "loss": 0.9592, "lr": 3.254102348048575e-05, "epoch": 1.619664254315827, "percentage": 53.99, "elapsed_time": "1 day, 13:47:46", "remaining_time": "1 day, 8:12:41", "throughput": 26928.23, "total_tokens": 3664023808} +{"current_steps": 13620, "total_steps": 25209, "loss": 0.9697, "lr": 3.25341340125618e-05, "epoch": 1.6208543143394794, "percentage": 54.03, "elapsed_time": "1 day, 13:49:23", "remaining_time": "1 day, 8:10:59", "throughput": 26928.8, "total_tokens": 3666731456} +{"current_steps": 13630, "total_steps": 25209, "loss": 0.9761, "lr": 3.2527248918625575e-05, "epoch": 1.6220443743631319, "percentage": 54.07, "elapsed_time": "1 day, 13:51:00", "remaining_time": "1 day, 8:09:16", "throughput": 26929.71, "total_tokens": 3669455424} +{"current_steps": 13640, "total_steps": 25209, "loss": 0.9787, "lr": 3.252036819405075e-05, "epoch": 1.6232344343867844, "percentage": 54.11, "elapsed_time": "1 day, 13:52:39", "remaining_time": "1 day, 8:07:35", "throughput": 26929.91, "total_tokens": 3672143360} +{"current_steps": 13650, "total_steps": 25209, "loss": 0.9644, "lr": 3.251349183421788e-05, "epoch": 1.624424494410437, "percentage": 54.15, "elapsed_time": "1 day, 13:54:17", "remaining_time": "1 day, 8:05:54", "throughput": 26930.33, "total_tokens": 3674845440} +{"current_steps": 13660, "total_steps": 25209, "loss": 0.9798, "lr": 3.250661983451434e-05, "epoch": 1.6256145544340894, "percentage": 54.19, "elapsed_time": "1 day, 13:55:55", "remaining_time": "1 day, 8:04:11", "throughput": 26930.94, "total_tokens": 3677555136} +{"current_steps": 13670, "total_steps": 25209, "loss": 0.9679, "lr": 3.2499752190334326e-05, "epoch": 1.6268046144577417, "percentage": 54.23, "elapsed_time": "1 day, 13:57:32", "remaining_time": "1 day, 8:02:29", "throughput": 26931.42, "total_tokens": 3680249088} +{"current_steps": 13680, "total_steps": 25209, "loss": 0.9545, "lr": 3.2492888897078834e-05, "epoch": 1.627994674481394, "percentage": 54.27, "elapsed_time": "1 day, 13:59:10", "remaining_time": "1 day, 8:00:48", "throughput": 26932.08, "total_tokens": 3682986688} +{"current_steps": 13690, "total_steps": 25209, "loss": 0.9667, "lr": 3.248602995015567e-05, "epoch": 1.6291847345050465, "percentage": 54.31, "elapsed_time": "1 day, 14:00:46", "remaining_time": "1 day, 7:59:04", "throughput": 26932.79, "total_tokens": 3685646272} +{"current_steps": 13700, "total_steps": 25209, "loss": 0.9614, "lr": 3.247917534497943e-05, "epoch": 1.630374794528699, "percentage": 54.35, "elapsed_time": "1 day, 14:02:17", "remaining_time": "1 day, 7:57:17", "throughput": 26934.0, "total_tokens": 3688280832} +{"current_steps": 13710, "total_steps": 25209, "loss": 0.9541, "lr": 3.247232507697145e-05, "epoch": 1.6315648545523516, "percentage": 54.39, "elapsed_time": "1 day, 14:03:49", "remaining_time": "1 day, 7:55:30", "throughput": 26935.13, "total_tokens": 3690897216} +{"current_steps": 13720, "total_steps": 25209, "loss": 0.9646, "lr": 3.246547914155985e-05, "epoch": 1.632754914576004, "percentage": 54.43, "elapsed_time": "1 day, 14:05:25", "remaining_time": "1 day, 7:53:47", "throughput": 26935.79, "total_tokens": 3693573568} +{"current_steps": 13730, "total_steps": 25209, "loss": 0.9751, "lr": 3.245863753417949e-05, "epoch": 1.6339449745996564, "percentage": 54.46, "elapsed_time": "1 day, 14:07:00", "remaining_time": "1 day, 7:52:03", "throughput": 26936.6, "total_tokens": 3696264704} +{"current_steps": 13740, "total_steps": 25209, "loss": 0.9547, "lr": 3.2451800250271944e-05, "epoch": 1.6351350346233087, "percentage": 54.5, "elapsed_time": "1 day, 14:08:38", "remaining_time": "1 day, 7:50:21", "throughput": 26937.04, "total_tokens": 3698947840} +{"current_steps": 13750, "total_steps": 25209, "loss": 0.951, "lr": 3.244496728528553e-05, "epoch": 1.6363250946469612, "percentage": 54.54, "elapsed_time": "1 day, 14:10:16", "remaining_time": "1 day, 7:48:40", "throughput": 26937.58, "total_tokens": 3701680384} +{"current_steps": 13760, "total_steps": 25209, "loss": 0.9819, "lr": 3.243813863467525e-05, "epoch": 1.6375151546706137, "percentage": 54.58, "elapsed_time": "1 day, 14:11:50", "remaining_time": "1 day, 7:46:55", "throughput": 26938.68, "total_tokens": 3704357888} +{"current_steps": 13770, "total_steps": 25209, "loss": 0.9744, "lr": 3.243131429390281e-05, "epoch": 1.6387052146942662, "percentage": 54.62, "elapsed_time": "1 day, 14:13:25", "remaining_time": "1 day, 7:45:11", "throughput": 26939.41, "total_tokens": 3707013952} +{"current_steps": 13780, "total_steps": 25209, "loss": 0.9626, "lr": 3.2424494258436594e-05, "epoch": 1.6398952747179187, "percentage": 54.66, "elapsed_time": "1 day, 14:15:03", "remaining_time": "1 day, 7:43:30", "throughput": 26939.91, "total_tokens": 3709725184} +{"current_steps": 13790, "total_steps": 25209, "loss": 0.9739, "lr": 3.241767852375166e-05, "epoch": 1.641085334741571, "percentage": 54.7, "elapsed_time": "1 day, 14:16:42", "remaining_time": "1 day, 7:41:48", "throughput": 26940.08, "total_tokens": 3712401472} +{"current_steps": 13800, "total_steps": 25209, "loss": 0.9533, "lr": 3.241086708532971e-05, "epoch": 1.6422753947652233, "percentage": 54.74, "elapsed_time": "1 day, 14:18:24", "remaining_time": "1 day, 7:40:10", "throughput": 26940.02, "total_tokens": 3715145344} +{"current_steps": 13810, "total_steps": 25209, "loss": 0.9791, "lr": 3.24040599386591e-05, "epoch": 1.6434654547888758, "percentage": 54.78, "elapsed_time": "1 day, 14:19:55", "remaining_time": "1 day, 7:38:23", "throughput": 26941.22, "total_tokens": 3717774528} +{"current_steps": 13820, "total_steps": 25209, "loss": 0.9675, "lr": 3.23972570792348e-05, "epoch": 1.6446555148125284, "percentage": 54.82, "elapsed_time": "1 day, 14:21:36", "remaining_time": "1 day, 7:36:44", "throughput": 26941.68, "total_tokens": 3720539392} +{"current_steps": 13830, "total_steps": 25209, "loss": 0.9635, "lr": 3.239045850255842e-05, "epoch": 1.6458455748361809, "percentage": 54.86, "elapsed_time": "1 day, 14:23:11", "remaining_time": "1 day, 7:35:00", "throughput": 26942.65, "total_tokens": 3723241152} +{"current_steps": 13840, "total_steps": 25209, "loss": 0.9712, "lr": 3.238366420413817e-05, "epoch": 1.6470356348598334, "percentage": 54.9, "elapsed_time": "1 day, 14:24:48", "remaining_time": "1 day, 7:33:18", "throughput": 26943.3, "total_tokens": 3725959808} +{"current_steps": 13850, "total_steps": 25209, "loss": 0.9608, "lr": 3.237687417948882e-05, "epoch": 1.6482256948834857, "percentage": 54.94, "elapsed_time": "1 day, 14:26:23", "remaining_time": "1 day, 7:31:34", "throughput": 26944.02, "total_tokens": 3728620416} +{"current_steps": 13860, "total_steps": 25209, "loss": 0.9637, "lr": 3.2370088424131776e-05, "epoch": 1.649415754907138, "percentage": 54.98, "elapsed_time": "1 day, 14:28:00", "remaining_time": "1 day, 7:29:52", "throughput": 26944.65, "total_tokens": 3731306112} +{"current_steps": 13870, "total_steps": 25209, "loss": 0.9633, "lr": 3.236330693359497e-05, "epoch": 1.6506058149307905, "percentage": 55.02, "elapsed_time": "1 day, 14:29:38", "remaining_time": "1 day, 7:28:10", "throughput": 26945.31, "total_tokens": 3734031808} +{"current_steps": 13880, "total_steps": 25209, "loss": 0.9753, "lr": 3.2356529703412894e-05, "epoch": 1.651795874954443, "percentage": 55.06, "elapsed_time": "1 day, 14:31:14", "remaining_time": "1 day, 7:26:27", "throughput": 26945.89, "total_tokens": 3736717632} +{"current_steps": 13890, "total_steps": 25209, "loss": 0.9624, "lr": 3.234975672912661e-05, "epoch": 1.6529859349780955, "percentage": 55.1, "elapsed_time": "1 day, 14:32:53", "remaining_time": "1 day, 7:24:47", "throughput": 26946.08, "total_tokens": 3739410432} +{"current_steps": 13900, "total_steps": 25209, "loss": 0.9677, "lr": 3.234298800628368e-05, "epoch": 1.654175995001748, "percentage": 55.14, "elapsed_time": "1 day, 14:34:33", "remaining_time": "1 day, 7:23:07", "throughput": 26946.32, "total_tokens": 3742131072} +{"current_steps": 13910, "total_steps": 25209, "loss": 0.9729, "lr": 3.2336223530438195e-05, "epoch": 1.6553660550254004, "percentage": 55.18, "elapsed_time": "1 day, 14:36:07", "remaining_time": "1 day, 7:21:22", "throughput": 26947.32, "total_tokens": 3744803072} +{"current_steps": 13920, "total_steps": 25209, "loss": 0.9743, "lr": 3.232946329715076e-05, "epoch": 1.6565561150490526, "percentage": 55.22, "elapsed_time": "1 day, 14:37:44", "remaining_time": "1 day, 7:19:39", "throughput": 26947.88, "total_tokens": 3747484800} +{"current_steps": 13930, "total_steps": 25209, "loss": 0.9576, "lr": 3.2322707301988456e-05, "epoch": 1.6577461750727052, "percentage": 55.26, "elapsed_time": "1 day, 14:39:20", "remaining_time": "1 day, 7:17:56", "throughput": 26948.58, "total_tokens": 3750166848} +{"current_steps": 13940, "total_steps": 25209, "loss": 0.9652, "lr": 3.231595554052488e-05, "epoch": 1.6589362350963577, "percentage": 55.3, "elapsed_time": "1 day, 14:40:57", "remaining_time": "1 day, 7:16:14", "throughput": 26949.07, "total_tokens": 3752862336} +{"current_steps": 13950, "total_steps": 25209, "loss": 0.9571, "lr": 3.230920800834005e-05, "epoch": 1.6601262951200102, "percentage": 55.34, "elapsed_time": "1 day, 14:42:33", "remaining_time": "1 day, 7:14:31", "throughput": 26949.64, "total_tokens": 3755534080} +{"current_steps": 13960, "total_steps": 25209, "loss": 0.9547, "lr": 3.2302464701020486e-05, "epoch": 1.6613163551436627, "percentage": 55.38, "elapsed_time": "1 day, 14:44:12", "remaining_time": "1 day, 7:12:51", "throughput": 26950.15, "total_tokens": 3758270784} +{"current_steps": 13970, "total_steps": 25209, "loss": 0.979, "lr": 3.2295725614159126e-05, "epoch": 1.662506415167315, "percentage": 55.42, "elapsed_time": "1 day, 14:45:47", "remaining_time": "1 day, 7:11:07", "throughput": 26951.08, "total_tokens": 3760950976} +{"current_steps": 13980, "total_steps": 25209, "loss": 0.9735, "lr": 3.228899074335536e-05, "epoch": 1.6636964751909673, "percentage": 55.46, "elapsed_time": "1 day, 14:47:20", "remaining_time": "1 day, 7:09:22", "throughput": 26952.1, "total_tokens": 3763611200} +{"current_steps": 13990, "total_steps": 25209, "loss": 0.9652, "lr": 3.228226008421498e-05, "epoch": 1.6648865352146198, "percentage": 55.5, "elapsed_time": "1 day, 14:48:59", "remaining_time": "1 day, 7:07:41", "throughput": 26952.47, "total_tokens": 3766329216} +{"current_steps": 14000, "total_steps": 25209, "loss": 0.9665, "lr": 3.2275533632350193e-05, "epoch": 1.6660765952382723, "percentage": 55.54, "elapsed_time": "1 day, 14:50:36", "remaining_time": "1 day, 7:05:58", "throughput": 26953.04, "total_tokens": 3769011520} +{"current_steps": 14010, "total_steps": 25209, "loss": 0.9584, "lr": 3.226881138337963e-05, "epoch": 1.6672666552619249, "percentage": 55.58, "elapsed_time": "1 day, 14:52:09", "remaining_time": "1 day, 7:04:13", "throughput": 26954.18, "total_tokens": 3771671552} +{"current_steps": 14020, "total_steps": 25209, "loss": 0.9678, "lr": 3.2262093332928256e-05, "epoch": 1.6684567152855774, "percentage": 55.62, "elapsed_time": "1 day, 14:53:42", "remaining_time": "1 day, 7:02:28", "throughput": 26955.05, "total_tokens": 3774326400} +{"current_steps": 14030, "total_steps": 25209, "loss": 0.9687, "lr": 3.225537947662746e-05, "epoch": 1.6696467753092297, "percentage": 55.65, "elapsed_time": "1 day, 14:55:22", "remaining_time": "1 day, 7:00:48", "throughput": 26955.27, "total_tokens": 3777044416} +{"current_steps": 14040, "total_steps": 25209, "loss": 0.97, "lr": 3.224866981011494e-05, "epoch": 1.670836835332882, "percentage": 55.69, "elapsed_time": "1 day, 14:56:58", "remaining_time": "1 day, 6:59:05", "throughput": 26955.87, "total_tokens": 3779713088} +{"current_steps": 14050, "total_steps": 25209, "loss": 0.9763, "lr": 3.22419643290348e-05, "epoch": 1.6720268953565345, "percentage": 55.73, "elapsed_time": "1 day, 14:58:33", "remaining_time": "1 day, 6:57:21", "throughput": 26956.82, "total_tokens": 3782404736} +{"current_steps": 14060, "total_steps": 25209, "loss": 0.9731, "lr": 3.2235263029037446e-05, "epoch": 1.673216955380187, "percentage": 55.77, "elapsed_time": "1 day, 15:00:13", "remaining_time": "1 day, 6:55:41", "throughput": 26957.01, "total_tokens": 3785122304} +{"current_steps": 14070, "total_steps": 25209, "loss": 0.9705, "lr": 3.222856590577962e-05, "epoch": 1.6744070154038395, "percentage": 55.81, "elapsed_time": "1 day, 15:01:56", "remaining_time": "1 day, 6:54:04", "throughput": 26957.07, "total_tokens": 3787908800} +{"current_steps": 14080, "total_steps": 25209, "loss": 0.9727, "lr": 3.222187295492436e-05, "epoch": 1.675597075427492, "percentage": 55.85, "elapsed_time": "1 day, 15:03:37", "remaining_time": "1 day, 6:52:25", "throughput": 26957.32, "total_tokens": 3790664000} +{"current_steps": 14090, "total_steps": 25209, "loss": 0.9558, "lr": 3.221518417214104e-05, "epoch": 1.6767871354511443, "percentage": 55.89, "elapsed_time": "1 day, 15:05:13", "remaining_time": "1 day, 6:50:42", "throughput": 26957.91, "total_tokens": 3793338112} +{"current_steps": 14100, "total_steps": 25209, "loss": 0.9628, "lr": 3.22084995531053e-05, "epoch": 1.6779771954747966, "percentage": 55.93, "elapsed_time": "1 day, 15:06:54", "remaining_time": "1 day, 6:49:03", "throughput": 26957.82, "total_tokens": 3796056512} +{"current_steps": 14110, "total_steps": 25209, "loss": 0.9647, "lr": 3.220181909349907e-05, "epoch": 1.6791672554984491, "percentage": 55.97, "elapsed_time": "1 day, 15:08:31", "remaining_time": "1 day, 6:47:21", "throughput": 26958.55, "total_tokens": 3798761536} +{"current_steps": 14120, "total_steps": 25209, "loss": 0.9731, "lr": 3.219514278901053e-05, "epoch": 1.6803573155221017, "percentage": 56.01, "elapsed_time": "1 day, 15:10:08", "remaining_time": "1 day, 6:45:39", "throughput": 26959.1, "total_tokens": 3801452416} +{"current_steps": 14130, "total_steps": 25209, "loss": 0.9666, "lr": 3.218847063533413e-05, "epoch": 1.6815473755457542, "percentage": 56.05, "elapsed_time": "1 day, 15:11:44", "remaining_time": "1 day, 6:43:56", "throughput": 26959.95, "total_tokens": 3804162048} +{"current_steps": 14140, "total_steps": 25209, "loss": 0.968, "lr": 3.218180262817055e-05, "epoch": 1.6827374355694067, "percentage": 56.09, "elapsed_time": "1 day, 15:13:25", "remaining_time": "1 day, 6:42:17", "throughput": 26960.1, "total_tokens": 3806916032} +{"current_steps": 14150, "total_steps": 25209, "loss": 0.9625, "lr": 3.217513876322674e-05, "epoch": 1.683927495593059, "percentage": 56.13, "elapsed_time": "1 day, 15:15:05", "remaining_time": "1 day, 6:40:38", "throughput": 26960.29, "total_tokens": 3809644224} +{"current_steps": 14160, "total_steps": 25209, "loss": 0.9758, "lr": 3.216847903621581e-05, "epoch": 1.6851175556167113, "percentage": 56.17, "elapsed_time": "1 day, 15:16:40", "remaining_time": "1 day, 6:38:54", "throughput": 26961.28, "total_tokens": 3812345472} +{"current_steps": 14170, "total_steps": 25209, "loss": 0.9651, "lr": 3.216182344285713e-05, "epoch": 1.6863076156403638, "percentage": 56.21, "elapsed_time": "1 day, 15:18:21", "remaining_time": "1 day, 6:37:15", "throughput": 26961.49, "total_tokens": 3815080064} +{"current_steps": 14180, "total_steps": 25209, "loss": 0.9549, "lr": 3.215517197887625e-05, "epoch": 1.6874976756640163, "percentage": 56.25, "elapsed_time": "1 day, 15:19:55", "remaining_time": "1 day, 6:35:30", "throughput": 26962.06, "total_tokens": 3817697472} +{"current_steps": 14190, "total_steps": 25209, "loss": 0.9795, "lr": 3.214852464000488e-05, "epoch": 1.6886877356876688, "percentage": 56.29, "elapsed_time": "1 day, 15:21:37", "remaining_time": "1 day, 6:33:52", "throughput": 26961.9, "total_tokens": 3820425984} +{"current_steps": 14200, "total_steps": 25209, "loss": 0.967, "lr": 3.2141881421980945e-05, "epoch": 1.6898777957113214, "percentage": 56.33, "elapsed_time": "1 day, 15:23:12", "remaining_time": "1 day, 6:32:08", "throughput": 26962.81, "total_tokens": 3823116992} +{"current_steps": 14210, "total_steps": 25209, "loss": 0.9701, "lr": 3.213524232054851e-05, "epoch": 1.6910678557349736, "percentage": 56.37, "elapsed_time": "1 day, 15:24:46", "remaining_time": "1 day, 6:30:24", "throughput": 26963.62, "total_tokens": 3825778112} +{"current_steps": 14220, "total_steps": 25209, "loss": 0.9578, "lr": 3.21286073314578e-05, "epoch": 1.692257915758626, "percentage": 56.41, "elapsed_time": "1 day, 15:26:28", "remaining_time": "1 day, 6:28:46", "throughput": 26963.63, "total_tokens": 3828528000} +{"current_steps": 14230, "total_steps": 25209, "loss": 0.9713, "lr": 3.2121976450465155e-05, "epoch": 1.6934479757822785, "percentage": 56.45, "elapsed_time": "1 day, 15:28:02", "remaining_time": "1 day, 6:27:01", "throughput": 26964.58, "total_tokens": 3831187968} +{"current_steps": 14240, "total_steps": 25209, "loss": 0.9635, "lr": 3.211534967333308e-05, "epoch": 1.694638035805931, "percentage": 56.49, "elapsed_time": "1 day, 15:29:40", "remaining_time": "1 day, 6:25:21", "throughput": 26965.09, "total_tokens": 3833920384} +{"current_steps": 14250, "total_steps": 25209, "loss": 0.9687, "lr": 3.210872699583019e-05, "epoch": 1.6958280958295835, "percentage": 56.53, "elapsed_time": "1 day, 15:31:18", "remaining_time": "1 day, 6:23:39", "throughput": 26965.65, "total_tokens": 3836635392} +{"current_steps": 14260, "total_steps": 25209, "loss": 0.9665, "lr": 3.210210841373118e-05, "epoch": 1.697018155853236, "percentage": 56.57, "elapsed_time": "1 day, 15:32:54", "remaining_time": "1 day, 6:21:56", "throughput": 26966.24, "total_tokens": 3839299264} +{"current_steps": 14270, "total_steps": 25209, "loss": 0.9619, "lr": 3.2095493922816855e-05, "epoch": 1.6982082158768883, "percentage": 56.61, "elapsed_time": "1 day, 15:34:30", "remaining_time": "1 day, 6:20:14", "throughput": 26966.69, "total_tokens": 3841959040} +{"current_steps": 14280, "total_steps": 25209, "loss": 0.9532, "lr": 3.2088883518874105e-05, "epoch": 1.6993982759005406, "percentage": 56.65, "elapsed_time": "1 day, 15:36:05", "remaining_time": "1 day, 6:18:30", "throughput": 26967.35, "total_tokens": 3844608704} +{"current_steps": 14290, "total_steps": 25209, "loss": 0.9666, "lr": 3.208227719769589e-05, "epoch": 1.7005883359241931, "percentage": 56.69, "elapsed_time": "1 day, 15:37:44", "remaining_time": "1 day, 6:16:50", "throughput": 26967.67, "total_tokens": 3847341824} +{"current_steps": 14300, "total_steps": 25209, "loss": 0.9705, "lr": 3.207567495508124e-05, "epoch": 1.7017783959478456, "percentage": 56.73, "elapsed_time": "1 day, 15:39:20", "remaining_time": "1 day, 6:15:07", "throughput": 26968.47, "total_tokens": 3850044224} +{"current_steps": 14310, "total_steps": 25209, "loss": 0.9513, "lr": 3.2069076786835205e-05, "epoch": 1.7029684559714982, "percentage": 56.77, "elapsed_time": "1 day, 15:40:58", "remaining_time": "1 day, 6:13:26", "throughput": 26969.09, "total_tokens": 3852762240} +{"current_steps": 14320, "total_steps": 25209, "loss": 0.966, "lr": 3.2062482688768904e-05, "epoch": 1.7041585159951507, "percentage": 56.81, "elapsed_time": "1 day, 15:42:31", "remaining_time": "1 day, 6:11:40", "throughput": 26969.98, "total_tokens": 3855390976} +{"current_steps": 14330, "total_steps": 25209, "loss": 0.9625, "lr": 3.205589265669947e-05, "epoch": 1.705348576018803, "percentage": 56.84, "elapsed_time": "1 day, 15:44:10", "remaining_time": "1 day, 6:10:00", "throughput": 26970.62, "total_tokens": 3858170240} +{"current_steps": 14340, "total_steps": 25209, "loss": 0.9708, "lr": 3.204930668645005e-05, "epoch": 1.7065386360424553, "percentage": 56.88, "elapsed_time": "1 day, 15:45:42", "remaining_time": "1 day, 6:08:15", "throughput": 26971.81, "total_tokens": 3860818752} +{"current_steps": 14350, "total_steps": 25209, "loss": 0.9578, "lr": 3.20427247738498e-05, "epoch": 1.7077286960661078, "percentage": 56.92, "elapsed_time": "1 day, 15:47:26", "remaining_time": "1 day, 6:06:38", "throughput": 26971.38, "total_tokens": 3863569600} +{"current_steps": 14360, "total_steps": 25209, "loss": 0.9743, "lr": 3.2036146914733854e-05, "epoch": 1.7089187560897603, "percentage": 56.96, "elapsed_time": "1 day, 15:49:01", "remaining_time": "1 day, 6:04:54", "throughput": 26971.98, "total_tokens": 3866203392} +{"current_steps": 14370, "total_steps": 25209, "loss": 0.9667, "lr": 3.202957310494336e-05, "epoch": 1.7101088161134128, "percentage": 57.0, "elapsed_time": "1 day, 15:50:36", "remaining_time": "1 day, 6:03:11", "throughput": 26972.53, "total_tokens": 3868847872} +{"current_steps": 14380, "total_steps": 25209, "loss": 0.9653, "lr": 3.202300334032542e-05, "epoch": 1.7112988761370653, "percentage": 57.04, "elapsed_time": "1 day, 15:52:11", "remaining_time": "1 day, 6:01:28", "throughput": 26973.24, "total_tokens": 3871518464} +{"current_steps": 14390, "total_steps": 25209, "loss": 0.972, "lr": 3.201643761673308e-05, "epoch": 1.7124889361607176, "percentage": 57.08, "elapsed_time": "1 day, 15:53:49", "remaining_time": "1 day, 5:59:46", "throughput": 26973.83, "total_tokens": 3874228096} +{"current_steps": 14400, "total_steps": 25209, "loss": 0.9561, "lr": 3.200987593002536e-05, "epoch": 1.71367899618437, "percentage": 57.12, "elapsed_time": "1 day, 15:55:25", "remaining_time": "1 day, 5:58:04", "throughput": 26974.28, "total_tokens": 3876895360} +{"current_steps": 14410, "total_steps": 25209, "loss": 0.9599, "lr": 3.200331827606721e-05, "epoch": 1.7148690562080224, "percentage": 57.16, "elapsed_time": "1 day, 15:57:01", "remaining_time": "1 day, 5:56:21", "throughput": 26975.03, "total_tokens": 3879587456} +{"current_steps": 14420, "total_steps": 25209, "loss": 0.974, "lr": 3.199676465072951e-05, "epoch": 1.716059116231675, "percentage": 57.2, "elapsed_time": "1 day, 15:58:34", "remaining_time": "1 day, 5:54:36", "throughput": 26976.08, "total_tokens": 3882238080} +{"current_steps": 14430, "total_steps": 25209, "loss": 0.9641, "lr": 3.1990215049889046e-05, "epoch": 1.7172491762553275, "percentage": 57.24, "elapsed_time": "1 day, 16:00:17", "remaining_time": "1 day, 5:52:58", "throughput": 26975.87, "total_tokens": 3884992448} +{"current_steps": 14440, "total_steps": 25209, "loss": 0.9636, "lr": 3.198366946942851e-05, "epoch": 1.71843923627898, "percentage": 57.28, "elapsed_time": "1 day, 16:01:54", "remaining_time": "1 day, 5:51:16", "throughput": 26976.59, "total_tokens": 3887709120} +{"current_steps": 14450, "total_steps": 25209, "loss": 0.962, "lr": 3.1977127905236514e-05, "epoch": 1.7196292963026323, "percentage": 57.32, "elapsed_time": "1 day, 16:03:36", "remaining_time": "1 day, 5:49:39", "throughput": 26976.47, "total_tokens": 3890459008} +{"current_steps": 14460, "total_steps": 25209, "loss": 0.9677, "lr": 3.197059035320752e-05, "epoch": 1.7208193563262846, "percentage": 57.36, "elapsed_time": "1 day, 16:05:12", "remaining_time": "1 day, 5:47:56", "throughput": 26977.07, "total_tokens": 3893124416} +{"current_steps": 14470, "total_steps": 25209, "loss": 0.9655, "lr": 3.196405680924189e-05, "epoch": 1.722009416349937, "percentage": 57.4, "elapsed_time": "1 day, 16:06:52", "remaining_time": "1 day, 5:46:16", "throughput": 26977.19, "total_tokens": 3895848896} +{"current_steps": 14480, "total_steps": 25209, "loss": 0.9656, "lr": 3.195752726924582e-05, "epoch": 1.7231994763735896, "percentage": 57.44, "elapsed_time": "1 day, 16:08:32", "remaining_time": "1 day, 5:44:36", "throughput": 26977.73, "total_tokens": 3898611968} +{"current_steps": 14490, "total_steps": 25209, "loss": 0.9722, "lr": 3.195100172913139e-05, "epoch": 1.7243895363972421, "percentage": 57.48, "elapsed_time": "1 day, 16:10:10", "remaining_time": "1 day, 5:42:55", "throughput": 26978.11, "total_tokens": 3901306944} +{"current_steps": 14500, "total_steps": 25209, "loss": 0.9689, "lr": 3.19444801848165e-05, "epoch": 1.7255795964208944, "percentage": 57.52, "elapsed_time": "1 day, 16:11:46", "remaining_time": "1 day, 5:41:13", "throughput": 26978.57, "total_tokens": 3903967296} +{"current_steps": 14510, "total_steps": 25209, "loss": 0.9561, "lr": 3.1937962632224885e-05, "epoch": 1.726769656444547, "percentage": 57.56, "elapsed_time": "1 day, 16:13:24", "remaining_time": "1 day, 5:39:31", "throughput": 26978.76, "total_tokens": 3906641088} +{"current_steps": 14520, "total_steps": 25209, "loss": 0.9644, "lr": 3.193144906728609e-05, "epoch": 1.7279597164681992, "percentage": 57.6, "elapsed_time": "1 day, 16:14:56", "remaining_time": "1 day, 5:37:46", "throughput": 26979.8, "total_tokens": 3909269248} +{"current_steps": 14530, "total_steps": 25209, "loss": 0.9674, "lr": 3.1924939485935494e-05, "epoch": 1.7291497764918518, "percentage": 57.64, "elapsed_time": "1 day, 16:16:29", "remaining_time": "1 day, 5:36:02", "throughput": 26980.58, "total_tokens": 3911910784} +{"current_steps": 14540, "total_steps": 25209, "loss": 0.9633, "lr": 3.1918433884114253e-05, "epoch": 1.7303398365155043, "percentage": 57.68, "elapsed_time": "1 day, 16:18:07", "remaining_time": "1 day, 5:34:20", "throughput": 26981.02, "total_tokens": 3914598144} +{"current_steps": 14550, "total_steps": 25209, "loss": 0.9635, "lr": 3.191193225776931e-05, "epoch": 1.7315298965391568, "percentage": 57.72, "elapsed_time": "1 day, 16:19:42", "remaining_time": "1 day, 5:32:37", "throughput": 26981.66, "total_tokens": 3917269376} +{"current_steps": 14560, "total_steps": 25209, "loss": 0.9613, "lr": 3.190543460285339e-05, "epoch": 1.732719956562809, "percentage": 57.76, "elapsed_time": "1 day, 16:21:23", "remaining_time": "1 day, 5:30:58", "throughput": 26982.05, "total_tokens": 3920033472} +{"current_steps": 14570, "total_steps": 25209, "loss": 0.9616, "lr": 3.189894091532499e-05, "epoch": 1.7339100165864616, "percentage": 57.8, "elapsed_time": "1 day, 16:22:59", "remaining_time": "1 day, 5:29:15", "throughput": 26982.74, "total_tokens": 3922727040} +{"current_steps": 14580, "total_steps": 25209, "loss": 0.9586, "lr": 3.1892451191148346e-05, "epoch": 1.735100076610114, "percentage": 57.84, "elapsed_time": "1 day, 16:24:37", "remaining_time": "1 day, 5:27:34", "throughput": 26983.22, "total_tokens": 3925442304} +{"current_steps": 14590, "total_steps": 25209, "loss": 0.9593, "lr": 3.1885965426293465e-05, "epoch": 1.7362901366337664, "percentage": 57.88, "elapsed_time": "1 day, 16:26:15", "remaining_time": "1 day, 5:25:53", "throughput": 26983.77, "total_tokens": 3928166080} +{"current_steps": 14600, "total_steps": 25209, "loss": 0.9654, "lr": 3.187948361673606e-05, "epoch": 1.737480196657419, "percentage": 57.92, "elapsed_time": "1 day, 16:27:48", "remaining_time": "1 day, 5:24:08", "throughput": 26984.83, "total_tokens": 3930826560} +{"current_steps": 14610, "total_steps": 25209, "loss": 0.9723, "lr": 3.187300575845759e-05, "epoch": 1.7386702566810714, "percentage": 57.96, "elapsed_time": "1 day, 16:29:27", "remaining_time": "1 day, 5:22:28", "throughput": 26985.09, "total_tokens": 3933538432} +{"current_steps": 14620, "total_steps": 25209, "loss": 0.969, "lr": 3.186653184744521e-05, "epoch": 1.7398603167047237, "percentage": 58.0, "elapsed_time": "1 day, 16:31:04", "remaining_time": "1 day, 5:20:47", "throughput": 26985.68, "total_tokens": 3936253056} +{"current_steps": 14630, "total_steps": 25209, "loss": 0.9616, "lr": 3.18600618796918e-05, "epoch": 1.7410503767283763, "percentage": 58.03, "elapsed_time": "1 day, 16:32:39", "remaining_time": "1 day, 5:19:03", "throughput": 26986.57, "total_tokens": 3938950336} +{"current_steps": 14640, "total_steps": 25209, "loss": 0.9746, "lr": 3.185359585119591e-05, "epoch": 1.7422404367520286, "percentage": 58.07, "elapsed_time": "1 day, 16:34:14", "remaining_time": "1 day, 5:17:20", "throughput": 26987.22, "total_tokens": 3941604096} +{"current_steps": 14650, "total_steps": 25209, "loss": 0.9632, "lr": 3.184713375796178e-05, "epoch": 1.743430496775681, "percentage": 58.11, "elapsed_time": "1 day, 16:35:48", "remaining_time": "1 day, 5:15:36", "throughput": 26988.21, "total_tokens": 3944283136} +{"current_steps": 14660, "total_steps": 25209, "loss": 0.9581, "lr": 3.1840675595999344e-05, "epoch": 1.7446205567993336, "percentage": 58.15, "elapsed_time": "1 day, 16:37:25", "remaining_time": "1 day, 5:13:54", "throughput": 26988.62, "total_tokens": 3946964160} +{"current_steps": 14670, "total_steps": 25209, "loss": 0.9562, "lr": 3.1834221361324155e-05, "epoch": 1.745810616822986, "percentage": 58.19, "elapsed_time": "1 day, 16:39:04", "remaining_time": "1 day, 5:12:14", "throughput": 26988.93, "total_tokens": 3949682688} +{"current_steps": 14680, "total_steps": 25209, "loss": 0.9613, "lr": 3.182777104995744e-05, "epoch": 1.7470006768466384, "percentage": 58.23, "elapsed_time": "1 day, 16:40:34", "remaining_time": "1 day, 5:10:27", "throughput": 26990.23, "total_tokens": 3952299520} +{"current_steps": 14690, "total_steps": 25209, "loss": 0.9631, "lr": 3.182132465792609e-05, "epoch": 1.748190736870291, "percentage": 58.27, "elapsed_time": "1 day, 16:42:10", "remaining_time": "1 day, 5:08:45", "throughput": 26990.9, "total_tokens": 3955003392} +{"current_steps": 14700, "total_steps": 25209, "loss": 0.9608, "lr": 3.181488218126259e-05, "epoch": 1.7493807968939432, "percentage": 58.31, "elapsed_time": "1 day, 16:43:49", "remaining_time": "1 day, 5:07:05", "throughput": 26991.03, "total_tokens": 3957686336} +{"current_steps": 14710, "total_steps": 25209, "loss": 0.9638, "lr": 3.180844361600506e-05, "epoch": 1.7505708569175957, "percentage": 58.35, "elapsed_time": "1 day, 16:45:24", "remaining_time": "1 day, 5:05:21", "throughput": 26991.87, "total_tokens": 3960361408} +{"current_steps": 14720, "total_steps": 25209, "loss": 0.9751, "lr": 3.180200895819722e-05, "epoch": 1.7517609169412482, "percentage": 58.39, "elapsed_time": "1 day, 16:47:02", "remaining_time": "1 day, 5:03:41", "throughput": 26991.99, "total_tokens": 3963040448} +{"current_steps": 14730, "total_steps": 25209, "loss": 0.969, "lr": 3.1795578203888424e-05, "epoch": 1.7529509769649008, "percentage": 58.43, "elapsed_time": "1 day, 16:48:42", "remaining_time": "1 day, 5:02:01", "throughput": 26992.13, "total_tokens": 3965747648} +{"current_steps": 14740, "total_steps": 25209, "loss": 0.9482, "lr": 3.178915134913357e-05, "epoch": 1.754141036988553, "percentage": 58.47, "elapsed_time": "1 day, 16:50:19", "remaining_time": "1 day, 5:00:19", "throughput": 26992.72, "total_tokens": 3968451456} +{"current_steps": 14750, "total_steps": 25209, "loss": 0.9554, "lr": 3.178272838999316e-05, "epoch": 1.7553310970122056, "percentage": 58.51, "elapsed_time": "1 day, 16:51:53", "remaining_time": "1 day, 4:58:35", "throughput": 26993.71, "total_tokens": 3971133056} +{"current_steps": 14760, "total_steps": 25209, "loss": 0.9529, "lr": 3.1776309322533274e-05, "epoch": 1.7565211570358579, "percentage": 58.55, "elapsed_time": "1 day, 16:53:30", "remaining_time": "1 day, 4:56:54", "throughput": 26994.07, "total_tokens": 3973806144} +{"current_steps": 14770, "total_steps": 25209, "loss": 0.9771, "lr": 3.1769894142825536e-05, "epoch": 1.7577112170595104, "percentage": 58.59, "elapsed_time": "1 day, 16:55:04", "remaining_time": "1 day, 4:55:10", "throughput": 26994.75, "total_tokens": 3976434496} +{"current_steps": 14780, "total_steps": 25209, "loss": 0.9792, "lr": 3.176348284694712e-05, "epoch": 1.758901277083163, "percentage": 58.63, "elapsed_time": "1 day, 16:56:43", "remaining_time": "1 day, 4:53:30", "throughput": 26995.22, "total_tokens": 3979192640} +{"current_steps": 14790, "total_steps": 25209, "loss": 0.9855, "lr": 3.175707543098075e-05, "epoch": 1.7600913371068154, "percentage": 58.67, "elapsed_time": "1 day, 16:58:17", "remaining_time": "1 day, 4:51:46", "throughput": 26996.1, "total_tokens": 3981847872} +{"current_steps": 14800, "total_steps": 25209, "loss": 0.9573, "lr": 3.1750671891014653e-05, "epoch": 1.7612813971304677, "percentage": 58.71, "elapsed_time": "1 day, 16:59:51", "remaining_time": "1 day, 4:50:02", "throughput": 26996.87, "total_tokens": 3984519104} +{"current_steps": 14810, "total_steps": 25209, "loss": 0.9559, "lr": 3.174427222314262e-05, "epoch": 1.7624714571541202, "percentage": 58.75, "elapsed_time": "1 day, 17:01:32", "remaining_time": "1 day, 4:48:23", "throughput": 26997.05, "total_tokens": 3987266816} +{"current_steps": 14820, "total_steps": 25209, "loss": 0.9664, "lr": 3.173787642346391e-05, "epoch": 1.7636615171777725, "percentage": 58.79, "elapsed_time": "1 day, 17:03:09", "remaining_time": "1 day, 4:46:42", "throughput": 26997.57, "total_tokens": 3989962048} +{"current_steps": 14830, "total_steps": 25209, "loss": 0.9578, "lr": 3.173148448808331e-05, "epoch": 1.764851577201425, "percentage": 58.83, "elapsed_time": "1 day, 17:04:46", "remaining_time": "1 day, 4:45:00", "throughput": 26998.07, "total_tokens": 3992642176} +{"current_steps": 14840, "total_steps": 25209, "loss": 0.9604, "lr": 3.172509641311107e-05, "epoch": 1.7660416372250776, "percentage": 58.87, "elapsed_time": "1 day, 17:06:22", "remaining_time": "1 day, 4:43:17", "throughput": 26998.88, "total_tokens": 3995348736} +{"current_steps": 14850, "total_steps": 25209, "loss": 0.9755, "lr": 3.171871219466293e-05, "epoch": 1.76723169724873, "percentage": 58.91, "elapsed_time": "1 day, 17:08:01", "remaining_time": "1 day, 4:41:37", "throughput": 26999.18, "total_tokens": 3998071488} +{"current_steps": 14860, "total_steps": 25209, "loss": 0.9718, "lr": 3.171233182886011e-05, "epoch": 1.7684217572723824, "percentage": 58.95, "elapsed_time": "1 day, 17:09:39", "remaining_time": "1 day, 4:39:57", "throughput": 26999.57, "total_tokens": 4000783296} +{"current_steps": 14870, "total_steps": 25209, "loss": 0.9689, "lr": 3.170595531182928e-05, "epoch": 1.769611817296035, "percentage": 58.99, "elapsed_time": "1 day, 17:11:17", "remaining_time": "1 day, 4:38:15", "throughput": 27000.29, "total_tokens": 4003522304} +{"current_steps": 14880, "total_steps": 25209, "loss": 0.9751, "lr": 3.169958263970256e-05, "epoch": 1.7708018773196872, "percentage": 59.03, "elapsed_time": "1 day, 17:12:58", "remaining_time": "1 day, 4:36:37", "throughput": 27000.08, "total_tokens": 4006232512} +{"current_steps": 14890, "total_steps": 25209, "loss": 0.9679, "lr": 3.169321380861751e-05, "epoch": 1.7719919373433397, "percentage": 59.07, "elapsed_time": "1 day, 17:14:37", "remaining_time": "1 day, 4:34:56", "throughput": 27000.51, "total_tokens": 4008957504} +{"current_steps": 14900, "total_steps": 25209, "loss": 0.954, "lr": 3.168684881471711e-05, "epoch": 1.7731819973669922, "percentage": 59.11, "elapsed_time": "1 day, 17:16:16", "remaining_time": "1 day, 4:33:17", "throughput": 27000.85, "total_tokens": 4011696192} +{"current_steps": 14910, "total_steps": 25209, "loss": 0.9767, "lr": 3.168048765414979e-05, "epoch": 1.7743720573906447, "percentage": 59.15, "elapsed_time": "1 day, 17:17:53", "remaining_time": "1 day, 4:31:35", "throughput": 27001.41, "total_tokens": 4014406912} +{"current_steps": 14920, "total_steps": 25209, "loss": 0.9665, "lr": 3.167413032306936e-05, "epoch": 1.775562117414297, "percentage": 59.19, "elapsed_time": "1 day, 17:19:30", "remaining_time": "1 day, 4:29:54", "throughput": 27001.82, "total_tokens": 4017086208} +{"current_steps": 14930, "total_steps": 25209, "loss": 0.9602, "lr": 3.166777681763504e-05, "epoch": 1.7767521774379496, "percentage": 59.22, "elapsed_time": "1 day, 17:21:09", "remaining_time": "1 day, 4:28:13", "throughput": 27002.02, "total_tokens": 4019789696} +{"current_steps": 14940, "total_steps": 25209, "loss": 0.9612, "lr": 3.166142713401144e-05, "epoch": 1.7779422374616018, "percentage": 59.26, "elapsed_time": "1 day, 17:22:48", "remaining_time": "1 day, 4:26:33", "throughput": 27002.65, "total_tokens": 4022534400} +{"current_steps": 14950, "total_steps": 25209, "loss": 0.9695, "lr": 3.165508126836857e-05, "epoch": 1.7791322974852544, "percentage": 59.3, "elapsed_time": "1 day, 17:24:25", "remaining_time": "1 day, 4:24:51", "throughput": 27003.01, "total_tokens": 4025221312} +{"current_steps": 14960, "total_steps": 25209, "loss": 0.9658, "lr": 3.164873921688177e-05, "epoch": 1.7803223575089069, "percentage": 59.34, "elapsed_time": "1 day, 17:26:02", "remaining_time": "1 day, 4:23:10", "throughput": 27003.6, "total_tokens": 4027927616} +{"current_steps": 14970, "total_steps": 25209, "loss": 0.9663, "lr": 3.164240097573178e-05, "epoch": 1.7815124175325594, "percentage": 59.38, "elapsed_time": "1 day, 17:27:36", "remaining_time": "1 day, 4:21:26", "throughput": 27004.23, "total_tokens": 4030552256} +{"current_steps": 14980, "total_steps": 25209, "loss": 0.9651, "lr": 3.163606654110467e-05, "epoch": 1.7827024775562117, "percentage": 59.42, "elapsed_time": "1 day, 17:29:15", "remaining_time": "1 day, 4:19:46", "throughput": 27004.49, "total_tokens": 4033259264} +{"current_steps": 14990, "total_steps": 25209, "loss": 0.9706, "lr": 3.162973590919187e-05, "epoch": 1.7838925375798642, "percentage": 59.46, "elapsed_time": "1 day, 17:30:52", "remaining_time": "1 day, 4:18:05", "throughput": 27005.03, "total_tokens": 4035974400} +{"current_steps": 15000, "total_steps": 25209, "loss": 0.9638, "lr": 3.162340907619012e-05, "epoch": 1.7850825976035165, "percentage": 59.5, "elapsed_time": "1 day, 17:32:26", "remaining_time": "1 day, 4:16:21", "throughput": 27005.89, "total_tokens": 4038642624} +{"current_steps": 15000, "total_steps": 25209, "eval_loss": 1.0152374505996704, "epoch": 1.7850825976035165, "percentage": 59.5, "elapsed_time": "1 day, 17:32:28", "remaining_time": "1 day, 4:16:22", "throughput": 27005.54, "total_tokens": 4038642624} +{"current_steps": 15010, "total_steps": 25209, "loss": 0.9567, "lr": 3.1617086038301516e-05, "epoch": 1.786272657627169, "percentage": 59.54, "elapsed_time": "1 day, 17:34:40", "remaining_time": "1 day, 4:15:04", "throughput": 26999.94, "total_tokens": 4041365504} +{"current_steps": 15020, "total_steps": 25209, "loss": 0.98, "lr": 3.161076679173344e-05, "epoch": 1.7874627176508215, "percentage": 59.58, "elapsed_time": "1 day, 17:36:17", "remaining_time": "1 day, 4:13:23", "throughput": 27000.21, "total_tokens": 4044032896} +{"current_steps": 15030, "total_steps": 25209, "loss": 0.9642, "lr": 3.1604451332698575e-05, "epoch": 1.788652777674474, "percentage": 59.62, "elapsed_time": "1 day, 17:37:57", "remaining_time": "1 day, 4:11:43", "throughput": 27000.32, "total_tokens": 4046735360} +{"current_steps": 15040, "total_steps": 25209, "loss": 0.959, "lr": 3.1598139657414923e-05, "epoch": 1.7898428376981264, "percentage": 59.66, "elapsed_time": "1 day, 17:39:32", "remaining_time": "1 day, 4:10:01", "throughput": 27000.75, "total_tokens": 4049380416} +{"current_steps": 15050, "total_steps": 25209, "loss": 0.97, "lr": 3.159183176210574e-05, "epoch": 1.7910328977217789, "percentage": 59.7, "elapsed_time": "1 day, 17:41:06", "remaining_time": "1 day, 4:08:17", "throughput": 27001.49, "total_tokens": 4052026752} +{"current_steps": 15060, "total_steps": 25209, "loss": 0.9655, "lr": 3.1585527642999595e-05, "epoch": 1.7922229577454312, "percentage": 59.74, "elapsed_time": "1 day, 17:42:46", "remaining_time": "1 day, 4:06:37", "throughput": 27001.37, "total_tokens": 4054705344} +{"current_steps": 15070, "total_steps": 25209, "loss": 0.9603, "lr": 3.1579227296330294e-05, "epoch": 1.7934130177690837, "percentage": 59.78, "elapsed_time": "1 day, 17:44:23", "remaining_time": "1 day, 4:04:56", "throughput": 27001.89, "total_tokens": 4057399680} +{"current_steps": 15080, "total_steps": 25209, "loss": 0.9705, "lr": 3.157293071833691e-05, "epoch": 1.7946030777927362, "percentage": 59.82, "elapsed_time": "1 day, 17:45:59", "remaining_time": "1 day, 4:03:14", "throughput": 27002.55, "total_tokens": 4060085952} +{"current_steps": 15090, "total_steps": 25209, "loss": 0.9729, "lr": 3.156663790526375e-05, "epoch": 1.7957931378163887, "percentage": 59.86, "elapsed_time": "1 day, 17:47:34", "remaining_time": "1 day, 4:01:31", "throughput": 27003.03, "total_tokens": 4062738240} +{"current_steps": 15100, "total_steps": 25209, "loss": 0.9695, "lr": 3.156034885336039e-05, "epoch": 1.796983197840041, "percentage": 59.9, "elapsed_time": "1 day, 17:49:13", "remaining_time": "1 day, 3:59:51", "throughput": 27003.09, "total_tokens": 4065419392} +{"current_steps": 15110, "total_steps": 25209, "loss": 0.9741, "lr": 3.155406355888161e-05, "epoch": 1.7981732578636935, "percentage": 59.94, "elapsed_time": "1 day, 17:50:52", "remaining_time": "1 day, 3:58:10", "throughput": 27003.39, "total_tokens": 4068119168} +{"current_steps": 15120, "total_steps": 25209, "loss": 0.9643, "lr": 3.1547782018087407e-05, "epoch": 1.7993633178873458, "percentage": 59.98, "elapsed_time": "1 day, 17:52:32", "remaining_time": "1 day, 3:56:31", "throughput": 27003.33, "total_tokens": 4070812864} +{"current_steps": 15130, "total_steps": 25209, "loss": 0.9573, "lr": 3.154150422724299e-05, "epoch": 1.8005533779109983, "percentage": 60.02, "elapsed_time": "1 day, 17:54:09", "remaining_time": "1 day, 3:54:50", "throughput": 27003.75, "total_tokens": 4073509888} +{"current_steps": 15140, "total_steps": 25209, "loss": 0.9648, "lr": 3.1535230182618783e-05, "epoch": 1.8017434379346509, "percentage": 60.06, "elapsed_time": "1 day, 17:55:48", "remaining_time": "1 day, 3:53:09", "throughput": 27003.95, "total_tokens": 4076208512} +{"current_steps": 15150, "total_steps": 25209, "loss": 0.9471, "lr": 3.1528959880490387e-05, "epoch": 1.8029334979583034, "percentage": 60.1, "elapsed_time": "1 day, 17:57:33", "remaining_time": "1 day, 3:51:33", "throughput": 27003.59, "total_tokens": 4078978752} +{"current_steps": 15160, "total_steps": 25209, "loss": 0.9644, "lr": 3.152269331713859e-05, "epoch": 1.8041235579819557, "percentage": 60.14, "elapsed_time": "1 day, 17:59:11", "remaining_time": "1 day, 3:49:52", "throughput": 27004.07, "total_tokens": 4081692352} +{"current_steps": 15170, "total_steps": 25209, "loss": 0.9615, "lr": 3.151643048884935e-05, "epoch": 1.8053136180056082, "percentage": 60.18, "elapsed_time": "1 day, 18:00:45", "remaining_time": "1 day, 3:48:09", "throughput": 27004.88, "total_tokens": 4084358912} +{"current_steps": 15180, "total_steps": 25209, "loss": 0.9688, "lr": 3.151017139191379e-05, "epoch": 1.8065036780292605, "percentage": 60.22, "elapsed_time": "1 day, 18:02:21", "remaining_time": "1 day, 3:46:27", "throughput": 27005.62, "total_tokens": 4087070016} +{"current_steps": 15190, "total_steps": 25209, "loss": 0.9453, "lr": 3.150391602262818e-05, "epoch": 1.807693738052913, "percentage": 60.26, "elapsed_time": "1 day, 18:03:57", "remaining_time": "1 day, 3:44:44", "throughput": 27006.33, "total_tokens": 4089758912} +{"current_steps": 15200, "total_steps": 25209, "loss": 0.9604, "lr": 3.149766437729394e-05, "epoch": 1.8088837980765655, "percentage": 60.3, "elapsed_time": "1 day, 18:05:35", "remaining_time": "1 day, 3:43:03", "throughput": 27006.61, "total_tokens": 4092447296} +{"current_steps": 15210, "total_steps": 25209, "loss": 0.9577, "lr": 3.1491416452217635e-05, "epoch": 1.810073858100218, "percentage": 60.34, "elapsed_time": "1 day, 18:07:10", "remaining_time": "1 day, 3:41:21", "throughput": 27007.15, "total_tokens": 4095118016} +{"current_steps": 15220, "total_steps": 25209, "loss": 0.953, "lr": 3.1485172243710954e-05, "epoch": 1.8112639181238703, "percentage": 60.38, "elapsed_time": "1 day, 18:08:51", "remaining_time": "1 day, 3:39:42", "throughput": 27007.02, "total_tokens": 4097811648} +{"current_steps": 15230, "total_steps": 25209, "loss": 0.9579, "lr": 3.1478931748090676e-05, "epoch": 1.8124539781475228, "percentage": 60.41, "elapsed_time": "1 day, 18:10:28", "remaining_time": "1 day, 3:38:01", "throughput": 27007.79, "total_tokens": 4100555968} +{"current_steps": 15240, "total_steps": 25209, "loss": 0.9485, "lr": 3.147269496167873e-05, "epoch": 1.8136440381711751, "percentage": 60.45, "elapsed_time": "1 day, 18:12:05", "remaining_time": "1 day, 3:36:19", "throughput": 27008.14, "total_tokens": 4103229312} +{"current_steps": 15250, "total_steps": 25209, "loss": 0.9752, "lr": 3.1466461880802105e-05, "epoch": 1.8148340981948277, "percentage": 60.49, "elapsed_time": "1 day, 18:13:40", "remaining_time": "1 day, 3:34:36", "throughput": 27008.93, "total_tokens": 4105907776} +{"current_steps": 15260, "total_steps": 25209, "loss": 0.954, "lr": 3.146023250179291e-05, "epoch": 1.8160241582184802, "percentage": 60.53, "elapsed_time": "1 day, 18:15:18", "remaining_time": "1 day, 3:32:56", "throughput": 27009.12, "total_tokens": 4108587584} +{"current_steps": 15270, "total_steps": 25209, "loss": 0.9695, "lr": 3.145400682098833e-05, "epoch": 1.8172142182421327, "percentage": 60.57, "elapsed_time": "1 day, 18:16:55", "remaining_time": "1 day, 3:31:14", "throughput": 27009.9, "total_tokens": 4111321472} +{"current_steps": 15280, "total_steps": 25209, "loss": 0.9809, "lr": 3.14477848347306e-05, "epoch": 1.818404278265785, "percentage": 60.61, "elapsed_time": "1 day, 18:18:34", "remaining_time": "1 day, 3:29:34", "throughput": 27010.07, "total_tokens": 4114027904} +{"current_steps": 15290, "total_steps": 25209, "loss": 0.9584, "lr": 3.144156653936703e-05, "epoch": 1.8195943382894375, "percentage": 60.65, "elapsed_time": "1 day, 18:20:09", "remaining_time": "1 day, 3:27:51", "throughput": 27010.5, "total_tokens": 4116659264} +{"current_steps": 15300, "total_steps": 25209, "loss": 0.9613, "lr": 3.1435351931250004e-05, "epoch": 1.8207843983130898, "percentage": 60.69, "elapsed_time": "1 day, 18:21:45", "remaining_time": "1 day, 3:26:09", "throughput": 27011.07, "total_tokens": 4119346112} +{"current_steps": 15310, "total_steps": 25209, "loss": 0.9616, "lr": 3.142914100673692e-05, "epoch": 1.8219744583367423, "percentage": 60.73, "elapsed_time": "1 day, 18:23:20", "remaining_time": "1 day, 3:24:27", "throughput": 27012.08, "total_tokens": 4122064448} +{"current_steps": 15320, "total_steps": 25209, "loss": 0.9706, "lr": 3.1422933762190235e-05, "epoch": 1.8231645183603948, "percentage": 60.77, "elapsed_time": "1 day, 18:24:59", "remaining_time": "1 day, 3:22:46", "throughput": 27012.44, "total_tokens": 4124783232} +{"current_steps": 15330, "total_steps": 25209, "loss": 0.9524, "lr": 3.141673019397741e-05, "epoch": 1.8243545783840474, "percentage": 60.81, "elapsed_time": "1 day, 18:26:32", "remaining_time": "1 day, 3:21:02", "throughput": 27013.55, "total_tokens": 4127457984} +{"current_steps": 15340, "total_steps": 25209, "loss": 0.9681, "lr": 3.141053029847095e-05, "epoch": 1.8255446384076996, "percentage": 60.85, "elapsed_time": "1 day, 18:28:08", "remaining_time": "1 day, 3:19:21", "throughput": 27013.98, "total_tokens": 4130132992} +{"current_steps": 15350, "total_steps": 25209, "loss": 0.9684, "lr": 3.140433407204835e-05, "epoch": 1.8267346984313522, "percentage": 60.89, "elapsed_time": "1 day, 18:29:43", "remaining_time": "1 day, 3:17:38", "throughput": 27014.97, "total_tokens": 4132848256} +{"current_steps": 15360, "total_steps": 25209, "loss": 0.9655, "lr": 3.1398141511092124e-05, "epoch": 1.8279247584550045, "percentage": 60.93, "elapsed_time": "1 day, 18:31:18", "remaining_time": "1 day, 3:15:55", "throughput": 27015.73, "total_tokens": 4135528832} +{"current_steps": 15370, "total_steps": 25209, "loss": 0.9592, "lr": 3.1391952611989736e-05, "epoch": 1.829114818478657, "percentage": 60.97, "elapsed_time": "1 day, 18:32:47", "remaining_time": "1 day, 3:14:09", "throughput": 27017.14, "total_tokens": 4138158336} +{"current_steps": 15380, "total_steps": 25209, "loss": 0.9835, "lr": 3.138576737113369e-05, "epoch": 1.8303048785023095, "percentage": 61.01, "elapsed_time": "1 day, 18:34:25", "remaining_time": "1 day, 3:12:28", "throughput": 27017.75, "total_tokens": 4140883648} +{"current_steps": 15390, "total_steps": 25209, "loss": 0.9628, "lr": 3.137958578492143e-05, "epoch": 1.831494938525962, "percentage": 61.05, "elapsed_time": "1 day, 18:36:00", "remaining_time": "1 day, 3:10:45", "throughput": 27018.4, "total_tokens": 4143555264} +{"current_steps": 15400, "total_steps": 25209, "loss": 0.9691, "lr": 3.137340784975535e-05, "epoch": 1.8326849985496143, "percentage": 61.09, "elapsed_time": "1 day, 18:37:37", "remaining_time": "1 day, 3:09:04", "throughput": 27018.91, "total_tokens": 4146249728} +{"current_steps": 15410, "total_steps": 25209, "loss": 0.9476, "lr": 3.136723356204285e-05, "epoch": 1.8338750585732668, "percentage": 61.13, "elapsed_time": "1 day, 18:39:13", "remaining_time": "1 day, 3:07:22", "throughput": 27019.62, "total_tokens": 4148946944} +{"current_steps": 15420, "total_steps": 25209, "loss": 0.9675, "lr": 3.136106291819622e-05, "epoch": 1.8350651185969191, "percentage": 61.17, "elapsed_time": "1 day, 18:40:47", "remaining_time": "1 day, 3:05:39", "throughput": 27020.42, "total_tokens": 4151628608} +{"current_steps": 15430, "total_steps": 25209, "loss": 0.9572, "lr": 3.1354895914632736e-05, "epoch": 1.8362551786205716, "percentage": 61.21, "elapsed_time": "1 day, 18:42:28", "remaining_time": "1 day, 3:04:00", "throughput": 27020.63, "total_tokens": 4154388416} +{"current_steps": 15440, "total_steps": 25209, "loss": 0.9597, "lr": 3.1348732547774575e-05, "epoch": 1.8374452386442242, "percentage": 61.25, "elapsed_time": "1 day, 18:44:07", "remaining_time": "1 day, 3:02:20", "throughput": 27021.04, "total_tokens": 4157121152} +{"current_steps": 15450, "total_steps": 25209, "loss": 0.9732, "lr": 3.134257281404883e-05, "epoch": 1.8386352986678767, "percentage": 61.29, "elapsed_time": "1 day, 18:45:45", "remaining_time": "1 day, 3:00:39", "throughput": 27021.24, "total_tokens": 4159803968} +{"current_steps": 15460, "total_steps": 25209, "loss": 0.9671, "lr": 3.133641670988755e-05, "epoch": 1.839825358691529, "percentage": 61.33, "elapsed_time": "1 day, 18:47:20", "remaining_time": "1 day, 2:58:57", "throughput": 27021.94, "total_tokens": 4162475392} +{"current_steps": 15470, "total_steps": 25209, "loss": 0.9662, "lr": 3.133026423172764e-05, "epoch": 1.8410154187151815, "percentage": 61.37, "elapsed_time": "1 day, 18:48:57", "remaining_time": "1 day, 2:57:15", "throughput": 27022.41, "total_tokens": 4165167552} +{"current_steps": 15480, "total_steps": 25209, "loss": 0.961, "lr": 3.1324115376010897e-05, "epoch": 1.8422054787388338, "percentage": 61.41, "elapsed_time": "1 day, 18:50:33", "remaining_time": "1 day, 2:55:34", "throughput": 27022.85, "total_tokens": 4167835008} +{"current_steps": 15490, "total_steps": 25209, "loss": 0.9618, "lr": 3.131797013918406e-05, "epoch": 1.8433955387624863, "percentage": 61.45, "elapsed_time": "1 day, 18:52:16", "remaining_time": "1 day, 2:53:56", "throughput": 27022.91, "total_tokens": 4170629376} +{"current_steps": 15500, "total_steps": 25209, "loss": 0.9718, "lr": 3.13118285176987e-05, "epoch": 1.8445855987861388, "percentage": 61.49, "elapsed_time": "1 day, 18:53:49", "remaining_time": "1 day, 2:52:12", "throughput": 27023.74, "total_tokens": 4173273216} +{"current_steps": 15510, "total_steps": 25209, "loss": 0.9539, "lr": 3.130569050801126e-05, "epoch": 1.8457756588097913, "percentage": 61.53, "elapsed_time": "1 day, 18:55:24", "remaining_time": "1 day, 2:50:30", "throughput": 27024.5, "total_tokens": 4175947520} +{"current_steps": 15520, "total_steps": 25209, "loss": 0.9689, "lr": 3.129955610658306e-05, "epoch": 1.8469657188334436, "percentage": 61.57, "elapsed_time": "1 day, 18:56:57", "remaining_time": "1 day, 2:48:46", "throughput": 27025.42, "total_tokens": 4178604224} +{"current_steps": 15530, "total_steps": 25209, "loss": 0.9793, "lr": 3.129342530988025e-05, "epoch": 1.8481557788570961, "percentage": 61.6, "elapsed_time": "1 day, 18:58:33", "remaining_time": "1 day, 2:47:04", "throughput": 27025.88, "total_tokens": 4181258688} +{"current_steps": 15540, "total_steps": 25209, "loss": 0.972, "lr": 3.128729811437385e-05, "epoch": 1.8493458388807484, "percentage": 61.64, "elapsed_time": "1 day, 19:00:10", "remaining_time": "1 day, 2:45:22", "throughput": 27026.08, "total_tokens": 4183908352} +{"current_steps": 15550, "total_steps": 25209, "loss": 0.9654, "lr": 3.12811745165397e-05, "epoch": 1.850535898904401, "percentage": 61.68, "elapsed_time": "1 day, 19:01:46", "remaining_time": "1 day, 2:43:41", "throughput": 27026.59, "total_tokens": 4186607872} +{"current_steps": 15560, "total_steps": 25209, "loss": 0.9774, "lr": 3.127505451285846e-05, "epoch": 1.8517259589280535, "percentage": 61.72, "elapsed_time": "1 day, 19:03:25", "remaining_time": "1 day, 2:42:01", "throughput": 27026.85, "total_tokens": 4189322752} +{"current_steps": 15570, "total_steps": 25209, "loss": 0.9649, "lr": 3.126893809981563e-05, "epoch": 1.852916018951706, "percentage": 61.76, "elapsed_time": "1 day, 19:05:02", "remaining_time": "1 day, 2:40:20", "throughput": 27027.18, "total_tokens": 4191995392} +{"current_steps": 15580, "total_steps": 25209, "loss": 0.9596, "lr": 3.126282527390149e-05, "epoch": 1.8541060789753583, "percentage": 61.8, "elapsed_time": "1 day, 19:06:37", "remaining_time": "1 day, 2:38:37", "throughput": 27027.97, "total_tokens": 4194661504} +{"current_steps": 15590, "total_steps": 25209, "loss": 0.9602, "lr": 3.1256716031611146e-05, "epoch": 1.8552961389990108, "percentage": 61.84, "elapsed_time": "1 day, 19:08:18", "remaining_time": "1 day, 2:36:59", "throughput": 27027.84, "total_tokens": 4197388864} +{"current_steps": 15600, "total_steps": 25209, "loss": 0.9581, "lr": 3.1250610369444475e-05, "epoch": 1.856486199022663, "percentage": 61.88, "elapsed_time": "1 day, 19:09:54", "remaining_time": "1 day, 2:35:17", "throughput": 27028.45, "total_tokens": 4200084864} +{"current_steps": 15610, "total_steps": 25209, "loss": 0.9686, "lr": 3.124450828390616e-05, "epoch": 1.8576762590463156, "percentage": 61.92, "elapsed_time": "1 day, 19:11:30", "remaining_time": "1 day, 2:33:35", "throughput": 27029.03, "total_tokens": 4202757696} +{"current_steps": 15620, "total_steps": 25209, "loss": 0.9631, "lr": 3.123840977150566e-05, "epoch": 1.8588663190699681, "percentage": 61.96, "elapsed_time": "1 day, 19:13:09", "remaining_time": "1 day, 2:31:55", "throughput": 27029.24, "total_tokens": 4205458880} +{"current_steps": 15630, "total_steps": 25209, "loss": 0.9594, "lr": 3.123231482875717e-05, "epoch": 1.8600563790936206, "percentage": 62.0, "elapsed_time": "1 day, 19:14:41", "remaining_time": "1 day, 2:30:11", "throughput": 27030.28, "total_tokens": 4208123776} +{"current_steps": 15640, "total_steps": 25209, "loss": 0.9503, "lr": 3.122622345217967e-05, "epoch": 1.861246439117273, "percentage": 62.04, "elapsed_time": "1 day, 19:16:16", "remaining_time": "1 day, 2:28:28", "throughput": 27031.15, "total_tokens": 4210816064} +{"current_steps": 15650, "total_steps": 25209, "loss": 0.9666, "lr": 3.12201356382969e-05, "epoch": 1.8624364991409255, "percentage": 62.08, "elapsed_time": "1 day, 19:17:57", "remaining_time": "1 day, 2:26:49", "throughput": 27031.34, "total_tokens": 4213565312} +{"current_steps": 15660, "total_steps": 25209, "loss": 0.9683, "lr": 3.1214051383637304e-05, "epoch": 1.8636265591645778, "percentage": 62.12, "elapsed_time": "1 day, 19:19:32", "remaining_time": "1 day, 2:25:07", "throughput": 27032.07, "total_tokens": 4216253568} +{"current_steps": 15670, "total_steps": 25209, "loss": 0.9555, "lr": 3.1207970684734104e-05, "epoch": 1.8648166191882303, "percentage": 62.16, "elapsed_time": "1 day, 19:21:16", "remaining_time": "1 day, 2:23:30", "throughput": 27031.71, "total_tokens": 4219015104} +{"current_steps": 15680, "total_steps": 25209, "loss": 0.9577, "lr": 3.120189353812521e-05, "epoch": 1.8660066792118828, "percentage": 62.2, "elapsed_time": "1 day, 19:22:54", "remaining_time": "1 day, 2:21:50", "throughput": 27031.94, "total_tokens": 4221707328} +{"current_steps": 15690, "total_steps": 25209, "loss": 0.9602, "lr": 3.1195819940353294e-05, "epoch": 1.8671967392355353, "percentage": 62.24, "elapsed_time": "1 day, 19:24:30", "remaining_time": "1 day, 2:20:08", "throughput": 27032.67, "total_tokens": 4224410624} +{"current_steps": 15700, "total_steps": 25209, "loss": 0.9639, "lr": 3.1189749887965684e-05, "epoch": 1.8683867992591876, "percentage": 62.28, "elapsed_time": "1 day, 19:26:04", "remaining_time": "1 day, 2:18:25", "throughput": 27033.44, "total_tokens": 4227080128} +{"current_steps": 15710, "total_steps": 25209, "loss": 0.9539, "lr": 3.118368337751443e-05, "epoch": 1.8695768592828401, "percentage": 62.32, "elapsed_time": "1 day, 19:27:40", "remaining_time": "1 day, 2:16:43", "throughput": 27034.25, "total_tokens": 4229789248} +{"current_steps": 15720, "total_steps": 25209, "loss": 0.9637, "lr": 3.1177620405556305e-05, "epoch": 1.8707669193064924, "percentage": 62.36, "elapsed_time": "1 day, 19:29:11", "remaining_time": "1 day, 2:14:58", "throughput": 27035.25, "total_tokens": 4232419072} +{"current_steps": 15730, "total_steps": 25209, "loss": 0.9648, "lr": 3.117156096865272e-05, "epoch": 1.871956979330145, "percentage": 62.4, "elapsed_time": "1 day, 19:30:51", "remaining_time": "1 day, 2:13:19", "throughput": 27035.42, "total_tokens": 4235146624} +{"current_steps": 15740, "total_steps": 25209, "loss": 0.9585, "lr": 3.116550506336979e-05, "epoch": 1.8731470393537974, "percentage": 62.44, "elapsed_time": "1 day, 19:32:27", "remaining_time": "1 day, 2:11:37", "throughput": 27036.05, "total_tokens": 4237842240} +{"current_steps": 15750, "total_steps": 25209, "loss": 0.9588, "lr": 3.11594526862783e-05, "epoch": 1.87433709937745, "percentage": 62.48, "elapsed_time": "1 day, 19:34:04", "remaining_time": "1 day, 2:09:56", "throughput": 27036.59, "total_tokens": 4240533952} +{"current_steps": 15760, "total_steps": 25209, "loss": 0.9658, "lr": 3.115340383395367e-05, "epoch": 1.8755271594011023, "percentage": 62.52, "elapsed_time": "1 day, 19:35:46", "remaining_time": "1 day, 2:08:17", "throughput": 27036.62, "total_tokens": 4243290240} +{"current_steps": 15770, "total_steps": 25209, "loss": 0.9627, "lr": 3.1147358502975995e-05, "epoch": 1.8767172194247548, "percentage": 62.56, "elapsed_time": "1 day, 19:37:23", "remaining_time": "1 day, 2:06:36", "throughput": 27036.97, "total_tokens": 4245978048} +{"current_steps": 15780, "total_steps": 25209, "loss": 0.9673, "lr": 3.114131668993e-05, "epoch": 1.877907279448407, "percentage": 62.6, "elapsed_time": "1 day, 19:38:57", "remaining_time": "1 day, 2:04:54", "throughput": 27037.64, "total_tokens": 4248640576} +{"current_steps": 15790, "total_steps": 25209, "loss": 0.9484, "lr": 3.113527839140507e-05, "epoch": 1.8790973394720596, "percentage": 62.64, "elapsed_time": "1 day, 19:40:35", "remaining_time": "1 day, 2:03:13", "throughput": 27038.04, "total_tokens": 4251334400} +{"current_steps": 15800, "total_steps": 25209, "loss": 0.9624, "lr": 3.112924360399517e-05, "epoch": 1.880287399495712, "percentage": 62.68, "elapsed_time": "1 day, 19:42:13", "remaining_time": "1 day, 2:01:33", "throughput": 27038.38, "total_tokens": 4254044096} +{"current_steps": 15810, "total_steps": 25209, "loss": 0.9641, "lr": 3.112321232429894e-05, "epoch": 1.8814774595193646, "percentage": 62.72, "elapsed_time": "1 day, 19:43:51", "remaining_time": "1 day, 1:59:52", "throughput": 27038.66, "total_tokens": 4256728896} +{"current_steps": 15820, "total_steps": 25209, "loss": 0.9619, "lr": 3.11171845489196e-05, "epoch": 1.882667519543017, "percentage": 62.76, "elapsed_time": "1 day, 19:45:26", "remaining_time": "1 day, 1:58:10", "throughput": 27039.63, "total_tokens": 4259454528} +{"current_steps": 15830, "total_steps": 25209, "loss": 0.9626, "lr": 3.1111160274464965e-05, "epoch": 1.8838575795666694, "percentage": 62.8, "elapsed_time": "1 day, 19:47:04", "remaining_time": "1 day, 1:56:29", "throughput": 27040.09, "total_tokens": 4262170240} +{"current_steps": 15840, "total_steps": 25209, "loss": 0.9662, "lr": 3.1105139497547466e-05, "epoch": 1.8850476395903217, "percentage": 62.83, "elapsed_time": "1 day, 19:48:40", "remaining_time": "1 day, 1:54:47", "throughput": 27040.63, "total_tokens": 4264850688} +{"current_steps": 15850, "total_steps": 25209, "loss": 0.957, "lr": 3.109912221478411e-05, "epoch": 1.8862376996139743, "percentage": 62.87, "elapsed_time": "1 day, 19:50:17", "remaining_time": "1 day, 1:53:06", "throughput": 27040.89, "total_tokens": 4267513536} +{"current_steps": 15860, "total_steps": 25209, "loss": 0.9666, "lr": 3.10931084227965e-05, "epoch": 1.8874277596376268, "percentage": 62.91, "elapsed_time": "1 day, 19:51:54", "remaining_time": "1 day, 1:51:26", "throughput": 27041.19, "total_tokens": 4270204096} +{"current_steps": 15870, "total_steps": 25209, "loss": 0.964, "lr": 3.108709811821079e-05, "epoch": 1.8886178196612793, "percentage": 62.95, "elapsed_time": "1 day, 19:53:28", "remaining_time": "1 day, 1:49:43", "throughput": 27042.02, "total_tokens": 4272879680} +{"current_steps": 15880, "total_steps": 25209, "loss": 0.9702, "lr": 3.1081091297657696e-05, "epoch": 1.8898078796849316, "percentage": 62.99, "elapsed_time": "1 day, 19:55:06", "remaining_time": "1 day, 1:48:02", "throughput": 27042.54, "total_tokens": 4275595264} +{"current_steps": 15890, "total_steps": 25209, "loss": 0.9628, "lr": 3.107508795777251e-05, "epoch": 1.890997939708584, "percentage": 63.03, "elapsed_time": "1 day, 19:56:38", "remaining_time": "1 day, 1:46:18", "throughput": 27043.54, "total_tokens": 4278241920} +{"current_steps": 15900, "total_steps": 25209, "loss": 0.9624, "lr": 3.1069088095195056e-05, "epoch": 1.8921879997322364, "percentage": 63.07, "elapsed_time": "1 day, 19:58:17", "remaining_time": "1 day, 1:44:38", "throughput": 27043.67, "total_tokens": 4280956608} +{"current_steps": 15910, "total_steps": 25209, "loss": 0.958, "lr": 3.1063091706569703e-05, "epoch": 1.893378059755889, "percentage": 63.11, "elapsed_time": "1 day, 19:59:57", "remaining_time": "1 day, 1:42:59", "throughput": 27043.9, "total_tokens": 4283679168} +{"current_steps": 15920, "total_steps": 25209, "loss": 0.9568, "lr": 3.105709878854535e-05, "epoch": 1.8945681197795414, "percentage": 63.15, "elapsed_time": "1 day, 20:01:33", "remaining_time": "1 day, 1:41:17", "throughput": 27044.35, "total_tokens": 4286358976} +{"current_steps": 15930, "total_steps": 25209, "loss": 0.9683, "lr": 3.105110933777541e-05, "epoch": 1.895758179803194, "percentage": 63.19, "elapsed_time": "1 day, 20:03:13", "remaining_time": "1 day, 1:39:38", "throughput": 27044.67, "total_tokens": 4289108800} +{"current_steps": 15940, "total_steps": 25209, "loss": 0.9491, "lr": 3.104512335091783e-05, "epoch": 1.8969482398268462, "percentage": 63.23, "elapsed_time": "1 day, 20:04:55", "remaining_time": "1 day, 1:38:00", "throughput": 27044.75, "total_tokens": 4291875264} +{"current_steps": 15950, "total_steps": 25209, "loss": 0.9827, "lr": 3.1039140824635074e-05, "epoch": 1.8981382998504988, "percentage": 63.27, "elapsed_time": "1 day, 20:06:32", "remaining_time": "1 day, 1:36:19", "throughput": 27045.31, "total_tokens": 4294599936} +{"current_steps": 15960, "total_steps": 25209, "loss": 0.9667, "lr": 3.103316175559406e-05, "epoch": 1.899328359874151, "percentage": 63.31, "elapsed_time": "1 day, 20:08:09", "remaining_time": "1 day, 1:34:38", "throughput": 27045.82, "total_tokens": 4297287424} +{"current_steps": 15970, "total_steps": 25209, "loss": 0.9538, "lr": 3.102718614046624e-05, "epoch": 1.9005184198978036, "percentage": 63.35, "elapsed_time": "1 day, 20:09:44", "remaining_time": "1 day, 1:32:56", "throughput": 27046.18, "total_tokens": 4299931520} +{"current_steps": 15980, "total_steps": 25209, "loss": 0.9661, "lr": 3.1021213975927546e-05, "epoch": 1.901708479921456, "percentage": 63.39, "elapsed_time": "1 day, 20:11:27", "remaining_time": "1 day, 1:31:18", "throughput": 27046.09, "total_tokens": 4302690688} +{"current_steps": 15990, "total_steps": 25209, "loss": 0.9637, "lr": 3.1015245258658374e-05, "epoch": 1.9028985399451086, "percentage": 63.43, "elapsed_time": "1 day, 20:13:07", "remaining_time": "1 day, 1:29:39", "throughput": 27046.25, "total_tokens": 4305418112} +{"current_steps": 16000, "total_steps": 25209, "loss": 0.9678, "lr": 3.1009279985343606e-05, "epoch": 1.904088599968761, "percentage": 63.47, "elapsed_time": "1 day, 20:14:43", "remaining_time": "1 day, 1:27:57", "throughput": 27046.54, "total_tokens": 4308063616} +{"current_steps": 16010, "total_steps": 25209, "loss": 0.9692, "lr": 3.100331815267255e-05, "epoch": 1.9052786599924134, "percentage": 63.51, "elapsed_time": "1 day, 20:16:19", "remaining_time": "1 day, 1:26:15", "throughput": 27047.24, "total_tokens": 4310766208} +{"current_steps": 16020, "total_steps": 25209, "loss": 0.9578, "lr": 3.099735975733902e-05, "epoch": 1.9064687200160657, "percentage": 63.55, "elapsed_time": "1 day, 20:17:55", "remaining_time": "1 day, 1:24:34", "throughput": 27047.71, "total_tokens": 4313440512} +{"current_steps": 16030, "total_steps": 25209, "loss": 0.9696, "lr": 3.099140479604123e-05, "epoch": 1.9076587800397182, "percentage": 63.59, "elapsed_time": "1 day, 20:19:30", "remaining_time": "1 day, 1:22:52", "throughput": 27048.14, "total_tokens": 4316073600} +{"current_steps": 16040, "total_steps": 25209, "loss": 0.9679, "lr": 3.098545326548186e-05, "epoch": 1.9088488400633707, "percentage": 63.63, "elapsed_time": "1 day, 20:21:08", "remaining_time": "1 day, 1:21:11", "throughput": 27048.17, "total_tokens": 4318744000} +{"current_steps": 16050, "total_steps": 25209, "loss": 0.9526, "lr": 3.0979505162368014e-05, "epoch": 1.9100389000870233, "percentage": 63.67, "elapsed_time": "1 day, 20:22:44", "remaining_time": "1 day, 1:19:30", "throughput": 27048.69, "total_tokens": 4321423552} +{"current_steps": 16060, "total_steps": 25209, "loss": 0.9673, "lr": 3.097356048341121e-05, "epoch": 1.9112289601106756, "percentage": 63.71, "elapsed_time": "1 day, 20:24:26", "remaining_time": "1 day, 1:17:51", "throughput": 27048.63, "total_tokens": 4324160768} +{"current_steps": 16070, "total_steps": 25209, "loss": 0.9584, "lr": 3.0967619225327396e-05, "epoch": 1.912419020134328, "percentage": 63.75, "elapsed_time": "1 day, 20:26:03", "remaining_time": "1 day, 1:16:10", "throughput": 27049.32, "total_tokens": 4326892032} +{"current_steps": 16080, "total_steps": 25209, "loss": 0.9463, "lr": 3.0961681384836924e-05, "epoch": 1.9136090801579804, "percentage": 63.79, "elapsed_time": "1 day, 20:27:38", "remaining_time": "1 day, 1:14:28", "throughput": 27050.13, "total_tokens": 4329593792} +{"current_steps": 16090, "total_steps": 25209, "loss": 0.9651, "lr": 3.095574695866453e-05, "epoch": 1.9147991401816329, "percentage": 63.83, "elapsed_time": "1 day, 20:29:14", "remaining_time": "1 day, 1:12:47", "throughput": 27050.69, "total_tokens": 4332283136} +{"current_steps": 16100, "total_steps": 25209, "loss": 0.9691, "lr": 3.0949815943539355e-05, "epoch": 1.9159892002052854, "percentage": 63.87, "elapsed_time": "1 day, 20:30:52", "remaining_time": "1 day, 1:11:06", "throughput": 27051.1, "total_tokens": 4334993152} +{"current_steps": 16110, "total_steps": 25209, "loss": 0.9617, "lr": 3.094388833619495e-05, "epoch": 1.917179260228938, "percentage": 63.91, "elapsed_time": "1 day, 20:32:30", "remaining_time": "1 day, 1:09:26", "throughput": 27051.19, "total_tokens": 4337681600} +{"current_steps": 16120, "total_steps": 25209, "loss": 0.9524, "lr": 3.0937964133369196e-05, "epoch": 1.9183693202525902, "percentage": 63.95, "elapsed_time": "1 day, 20:34:10", "remaining_time": "1 day, 1:07:47", "throughput": 27051.16, "total_tokens": 4340358848} +{"current_steps": 16130, "total_steps": 25209, "loss": 0.9742, "lr": 3.093204333180437e-05, "epoch": 1.9195593802762427, "percentage": 63.99, "elapsed_time": "1 day, 20:35:48", "remaining_time": "1 day, 1:06:06", "throughput": 27051.46, "total_tokens": 4343058176} +{"current_steps": 16140, "total_steps": 25209, "loss": 0.9572, "lr": 3.0926125928247114e-05, "epoch": 1.920749440299895, "percentage": 64.02, "elapsed_time": "1 day, 20:37:23", "remaining_time": "1 day, 1:04:25", "throughput": 27051.94, "total_tokens": 4345731520} +{"current_steps": 16150, "total_steps": 25209, "loss": 0.9667, "lr": 3.092021191944842e-05, "epoch": 1.9219395003235475, "percentage": 64.06, "elapsed_time": "1 day, 20:39:00", "remaining_time": "1 day, 1:02:43", "throughput": 27052.51, "total_tokens": 4348423616} +{"current_steps": 16160, "total_steps": 25209, "loss": 0.9789, "lr": 3.091430130216363e-05, "epoch": 1.9231295603472, "percentage": 64.1, "elapsed_time": "1 day, 20:40:37", "remaining_time": "1 day, 1:01:03", "throughput": 27052.83, "total_tokens": 4351110144} +{"current_steps": 16170, "total_steps": 25209, "loss": 0.9819, "lr": 3.090839407315242e-05, "epoch": 1.9243196203708526, "percentage": 64.14, "elapsed_time": "1 day, 20:42:13", "remaining_time": "1 day, 0:59:21", "throughput": 27053.59, "total_tokens": 4353827520} +{"current_steps": 16180, "total_steps": 25209, "loss": 0.9534, "lr": 3.0902490229178794e-05, "epoch": 1.9255096803945049, "percentage": 64.18, "elapsed_time": "1 day, 20:43:49", "remaining_time": "1 day, 0:57:39", "throughput": 27054.24, "total_tokens": 4356522816} +{"current_steps": 16190, "total_steps": 25209, "loss": 0.96, "lr": 3.0896589767011104e-05, "epoch": 1.9266997404181574, "percentage": 64.22, "elapsed_time": "1 day, 20:45:32", "remaining_time": "1 day, 0:56:02", "throughput": 27054.13, "total_tokens": 4359292800} +{"current_steps": 16200, "total_steps": 25209, "loss": 0.9743, "lr": 3.0890692683421985e-05, "epoch": 1.9278898004418097, "percentage": 64.26, "elapsed_time": "1 day, 20:47:10", "remaining_time": "1 day, 0:54:22", "throughput": 27054.31, "total_tokens": 4361991552} +{"current_steps": 16210, "total_steps": 25209, "loss": 0.9599, "lr": 3.088479897518843e-05, "epoch": 1.9290798604654622, "percentage": 64.3, "elapsed_time": "1 day, 20:48:49", "remaining_time": "1 day, 0:52:42", "throughput": 27054.66, "total_tokens": 4364722304} +{"current_steps": 16220, "total_steps": 25209, "loss": 0.9711, "lr": 3.087890863909168e-05, "epoch": 1.9302699204891147, "percentage": 64.34, "elapsed_time": "1 day, 20:50:22", "remaining_time": "1 day, 0:50:59", "throughput": 27055.32, "total_tokens": 4367344704} +{"current_steps": 16230, "total_steps": 25209, "loss": 0.9668, "lr": 3.087302167191732e-05, "epoch": 1.9314599805127672, "percentage": 64.38, "elapsed_time": "1 day, 20:51:56", "remaining_time": "1 day, 0:49:16", "throughput": 27056.13, "total_tokens": 4370011968} +{"current_steps": 16240, "total_steps": 25209, "loss": 0.9699, "lr": 3.086713807045518e-05, "epoch": 1.9326500405364195, "percentage": 64.42, "elapsed_time": "1 day, 20:53:36", "remaining_time": "1 day, 0:47:37", "throughput": 27056.29, "total_tokens": 4372750656} +{"current_steps": 16250, "total_steps": 25209, "loss": 0.9652, "lr": 3.086125783149941e-05, "epoch": 1.933840100560072, "percentage": 64.46, "elapsed_time": "1 day, 20:55:11", "remaining_time": "1 day, 0:45:55", "throughput": 27056.75, "total_tokens": 4375396672} +{"current_steps": 16260, "total_steps": 25209, "loss": 0.9622, "lr": 3.0855380951848404e-05, "epoch": 1.9350301605837243, "percentage": 64.5, "elapsed_time": "1 day, 20:56:48", "remaining_time": "1 day, 0:44:14", "throughput": 27057.17, "total_tokens": 4378076480} +{"current_steps": 16270, "total_steps": 25209, "loss": 0.9612, "lr": 3.084950742830484e-05, "epoch": 1.9362202206073769, "percentage": 64.54, "elapsed_time": "1 day, 20:58:20", "remaining_time": "1 day, 0:42:30", "throughput": 27058.16, "total_tokens": 4380720320} +{"current_steps": 16280, "total_steps": 25209, "loss": 0.9565, "lr": 3.0843637257675654e-05, "epoch": 1.9374102806310294, "percentage": 64.58, "elapsed_time": "1 day, 21:00:01", "remaining_time": "1 day, 0:40:51", "throughput": 27058.2, "total_tokens": 4383457920} +{"current_steps": 16290, "total_steps": 25209, "loss": 0.9523, "lr": 3.083777043677202e-05, "epoch": 1.938600340654682, "percentage": 64.62, "elapsed_time": "1 day, 21:01:38", "remaining_time": "1 day, 0:39:10", "throughput": 27058.47, "total_tokens": 4386129024} +{"current_steps": 16300, "total_steps": 25209, "loss": 0.9544, "lr": 3.083190696240936e-05, "epoch": 1.9397904006783342, "percentage": 64.66, "elapsed_time": "1 day, 21:03:13", "remaining_time": "1 day, 0:37:29", "throughput": 27059.02, "total_tokens": 4388810240} +{"current_steps": 16310, "total_steps": 25209, "loss": 0.9698, "lr": 3.082604683140735e-05, "epoch": 1.9409804607019867, "percentage": 64.7, "elapsed_time": "1 day, 21:04:49", "remaining_time": "1 day, 0:35:47", "throughput": 27059.62, "total_tokens": 4391495936} +{"current_steps": 16320, "total_steps": 25209, "loss": 0.9634, "lr": 3.082019004058987e-05, "epoch": 1.942170520725639, "percentage": 64.74, "elapsed_time": "1 day, 21:06:28", "remaining_time": "1 day, 0:34:07", "throughput": 27059.83, "total_tokens": 4394200832} +{"current_steps": 16330, "total_steps": 25209, "loss": 0.9586, "lr": 3.081433658678505e-05, "epoch": 1.9433605807492915, "percentage": 64.78, "elapsed_time": "1 day, 21:08:01", "remaining_time": "1 day, 0:32:24", "throughput": 27060.92, "total_tokens": 4396890752} +{"current_steps": 16340, "total_steps": 25209, "loss": 0.9473, "lr": 3.080848646682521e-05, "epoch": 1.944550640772944, "percentage": 64.82, "elapsed_time": "1 day, 21:09:35", "remaining_time": "1 day, 0:30:42", "throughput": 27061.73, "total_tokens": 4399579264} +{"current_steps": 16350, "total_steps": 25209, "loss": 0.9471, "lr": 3.080263967754689e-05, "epoch": 1.9457407007965966, "percentage": 64.86, "elapsed_time": "1 day, 21:11:13", "remaining_time": "1 day, 0:29:02", "throughput": 27062.08, "total_tokens": 4402275072} +{"current_steps": 16360, "total_steps": 25209, "loss": 0.9761, "lr": 3.079679621579083e-05, "epoch": 1.9469307608202489, "percentage": 64.9, "elapsed_time": "1 day, 21:12:51", "remaining_time": "1 day, 0:27:21", "throughput": 27062.49, "total_tokens": 4404989888} +{"current_steps": 16370, "total_steps": 25209, "loss": 0.9694, "lr": 3.079095607840197e-05, "epoch": 1.9481208208439014, "percentage": 64.94, "elapsed_time": "1 day, 21:14:29", "remaining_time": "1 day, 0:25:41", "throughput": 27062.6, "total_tokens": 4407683584} +{"current_steps": 16380, "total_steps": 25209, "loss": 0.9533, "lr": 3.0785119262229416e-05, "epoch": 1.9493108808675537, "percentage": 64.98, "elapsed_time": "1 day, 21:16:06", "remaining_time": "1 day, 0:24:00", "throughput": 27063.01, "total_tokens": 4410364672} +{"current_steps": 16390, "total_steps": 25209, "loss": 0.9589, "lr": 3.0779285764126485e-05, "epoch": 1.9505009408912062, "percentage": 65.02, "elapsed_time": "1 day, 21:17:43", "remaining_time": "1 day, 0:22:20", "throughput": 27063.5, "total_tokens": 4413077504} +{"current_steps": 16400, "total_steps": 25209, "loss": 0.9544, "lr": 3.077345558095064e-05, "epoch": 1.9516910009148587, "percentage": 65.06, "elapsed_time": "1 day, 21:19:19", "remaining_time": "1 day, 0:20:38", "throughput": 27064.03, "total_tokens": 4415756224} +{"current_steps": 16410, "total_steps": 25209, "loss": 0.9479, "lr": 3.076762870956352e-05, "epoch": 1.9528810609385112, "percentage": 65.1, "elapsed_time": "1 day, 21:20:55", "remaining_time": "1 day, 0:18:57", "throughput": 27064.62, "total_tokens": 4418456512} +{"current_steps": 16420, "total_steps": 25209, "loss": 0.9585, "lr": 3.076180514683092e-05, "epoch": 1.9540711209621635, "percentage": 65.14, "elapsed_time": "1 day, 21:22:33", "remaining_time": "1 day, 0:17:17", "throughput": 27064.67, "total_tokens": 4421121984} +{"current_steps": 16430, "total_steps": 25209, "loss": 0.9618, "lr": 3.075598488962278e-05, "epoch": 1.955261180985816, "percentage": 65.18, "elapsed_time": "1 day, 21:24:11", "remaining_time": "1 day, 0:15:36", "throughput": 27065.1, "total_tokens": 4423839680} +{"current_steps": 16440, "total_steps": 25209, "loss": 0.9678, "lr": 3.0750167934813207e-05, "epoch": 1.9564512410094683, "percentage": 65.21, "elapsed_time": "1 day, 21:25:47", "remaining_time": "1 day, 0:13:55", "throughput": 27065.65, "total_tokens": 4426525632} +{"current_steps": 16450, "total_steps": 25209, "loss": 0.9643, "lr": 3.074435427928041e-05, "epoch": 1.9576413010331208, "percentage": 65.25, "elapsed_time": "1 day, 21:27:25", "remaining_time": "1 day, 0:12:14", "throughput": 27066.25, "total_tokens": 4429268608} +{"current_steps": 16460, "total_steps": 25209, "loss": 0.9708, "lr": 3.073854391990675e-05, "epoch": 1.9588313610567734, "percentage": 65.29, "elapsed_time": "1 day, 21:29:05", "remaining_time": "1 day, 0:10:35", "throughput": 27066.28, "total_tokens": 4431970944} +{"current_steps": 16470, "total_steps": 25209, "loss": 0.9712, "lr": 3.073273685357871e-05, "epoch": 1.9600214210804259, "percentage": 65.33, "elapsed_time": "1 day, 21:30:44", "remaining_time": "1 day, 0:08:56", "throughput": 27066.22, "total_tokens": 4434653568} +{"current_steps": 16480, "total_steps": 25209, "loss": 0.9628, "lr": 3.072693307718689e-05, "epoch": 1.9612114811040782, "percentage": 65.37, "elapsed_time": "1 day, 21:32:27", "remaining_time": "1 day, 0:07:18", "throughput": 27065.88, "total_tokens": 4437379712} +{"current_steps": 16490, "total_steps": 25209, "loss": 0.9633, "lr": 3.0721132587626e-05, "epoch": 1.9624015411277305, "percentage": 65.41, "elapsed_time": "1 day, 21:34:03", "remaining_time": "1 day, 0:05:37", "throughput": 27066.6, "total_tokens": 4440095680} +{"current_steps": 16500, "total_steps": 25209, "loss": 0.9568, "lr": 3.071533538179482e-05, "epoch": 1.963591601151383, "percentage": 65.45, "elapsed_time": "1 day, 21:35:39", "remaining_time": "1 day, 0:03:55", "throughput": 27067.25, "total_tokens": 4442793920} +{"current_steps": 16510, "total_steps": 25209, "loss": 0.9653, "lr": 3.070954145659627e-05, "epoch": 1.9647816611750355, "percentage": 65.49, "elapsed_time": "1 day, 21:37:17", "remaining_time": "1 day, 0:02:15", "throughput": 27067.56, "total_tokens": 4445512000} +{"current_steps": 16520, "total_steps": 25209, "loss": 0.9654, "lr": 3.070375080893734e-05, "epoch": 1.965971721198688, "percentage": 65.53, "elapsed_time": "1 day, 21:38:54", "remaining_time": "1 day, 0:00:35", "throughput": 27067.82, "total_tokens": 4448190592} +{"current_steps": 16530, "total_steps": 25209, "loss": 0.9706, "lr": 3.06979634357291e-05, "epoch": 1.9671617812223405, "percentage": 65.57, "elapsed_time": "1 day, 21:40:28", "remaining_time": "23:58:52", "throughput": 27068.58, "total_tokens": 4450839680} +{"current_steps": 16540, "total_steps": 25209, "loss": 0.9674, "lr": 3.0692179333886686e-05, "epoch": 1.9683518412459928, "percentage": 65.61, "elapsed_time": "1 day, 21:42:08", "remaining_time": "23:57:13", "throughput": 27068.6, "total_tokens": 4453561664} +{"current_steps": 16550, "total_steps": 25209, "loss": 0.9694, "lr": 3.068639850032933e-05, "epoch": 1.9695419012696451, "percentage": 65.65, "elapsed_time": "1 day, 21:43:48", "remaining_time": "23:55:33", "throughput": 27068.84, "total_tokens": 4456293760} +{"current_steps": 16560, "total_steps": 25209, "loss": 0.9566, "lr": 3.068062093198028e-05, "epoch": 1.9707319612932976, "percentage": 65.69, "elapsed_time": "1 day, 21:45:28", "remaining_time": "23:53:54", "throughput": 27068.92, "total_tokens": 4459012160} +{"current_steps": 16570, "total_steps": 25209, "loss": 0.9554, "lr": 3.067484662576687e-05, "epoch": 1.9719220213169502, "percentage": 65.73, "elapsed_time": "1 day, 21:47:03", "remaining_time": "23:52:12", "throughput": 27069.51, "total_tokens": 4461678912} +{"current_steps": 16580, "total_steps": 25209, "loss": 0.9531, "lr": 3.066907557862048e-05, "epoch": 1.9731120813406027, "percentage": 65.77, "elapsed_time": "1 day, 21:48:40", "remaining_time": "23:50:32", "throughput": 27070.0, "total_tokens": 4464411072} +{"current_steps": 16590, "total_steps": 25209, "loss": 0.9532, "lr": 3.066330778747651e-05, "epoch": 1.9743021413642552, "percentage": 65.81, "elapsed_time": "1 day, 21:50:21", "remaining_time": "23:48:53", "throughput": 27070.27, "total_tokens": 4467164224} +{"current_steps": 16600, "total_steps": 25209, "loss": 0.9754, "lr": 3.065754324927441e-05, "epoch": 1.9754922013879075, "percentage": 65.85, "elapsed_time": "1 day, 21:52:00", "remaining_time": "23:47:13", "throughput": 27070.49, "total_tokens": 4469887040} +{"current_steps": 16610, "total_steps": 25209, "loss": 0.9668, "lr": 3.065178196095765e-05, "epoch": 1.9766822614115598, "percentage": 65.89, "elapsed_time": "1 day, 21:53:33", "remaining_time": "23:45:31", "throughput": 27071.14, "total_tokens": 4472520960} +{"current_steps": 16620, "total_steps": 25209, "loss": 0.9711, "lr": 3.064602391947372e-05, "epoch": 1.9778723214352123, "percentage": 65.93, "elapsed_time": "1 day, 21:55:16", "remaining_time": "23:43:53", "throughput": 27071.12, "total_tokens": 4475291200} +{"current_steps": 16630, "total_steps": 25209, "loss": 0.9856, "lr": 3.0640269121774126e-05, "epoch": 1.9790623814588648, "percentage": 65.97, "elapsed_time": "1 day, 21:56:55", "remaining_time": "23:42:13", "throughput": 27071.31, "total_tokens": 4478006400} +{"current_steps": 16640, "total_steps": 25209, "loss": 0.9707, "lr": 3.063451756481437e-05, "epoch": 1.9802524414825173, "percentage": 66.01, "elapsed_time": "1 day, 21:58:29", "remaining_time": "23:40:31", "throughput": 27071.95, "total_tokens": 4480662144} +{"current_steps": 16650, "total_steps": 25209, "loss": 0.9627, "lr": 3.062876924555396e-05, "epoch": 1.9814425015061699, "percentage": 66.05, "elapsed_time": "1 day, 22:00:05", "remaining_time": "23:38:50", "throughput": 27072.46, "total_tokens": 4483339648} +{"current_steps": 16660, "total_steps": 25209, "loss": 0.9678, "lr": 3.06230241609564e-05, "epoch": 1.9826325615298221, "percentage": 66.09, "elapsed_time": "1 day, 22:01:39", "remaining_time": "23:37:07", "throughput": 27073.09, "total_tokens": 4485987456} +{"current_steps": 16670, "total_steps": 25209, "loss": 0.9651, "lr": 3.061728230798916e-05, "epoch": 1.9838226215534744, "percentage": 66.13, "elapsed_time": "1 day, 22:03:14", "remaining_time": "23:35:26", "throughput": 27073.63, "total_tokens": 4488662528} +{"current_steps": 16680, "total_steps": 25209, "loss": 0.9417, "lr": 3.061154368362373e-05, "epoch": 1.985012681577127, "percentage": 66.17, "elapsed_time": "1 day, 22:04:53", "remaining_time": "23:33:46", "throughput": 27074.05, "total_tokens": 4491397888} +{"current_steps": 16690, "total_steps": 25209, "loss": 0.9599, "lr": 3.060580828483552e-05, "epoch": 1.9862027416007795, "percentage": 66.21, "elapsed_time": "1 day, 22:06:22", "remaining_time": "23:32:01", "throughput": 27075.29, "total_tokens": 4494023808} +{"current_steps": 16700, "total_steps": 25209, "loss": 0.9571, "lr": 3.060007610860395e-05, "epoch": 1.987392801624432, "percentage": 66.25, "elapsed_time": "1 day, 22:07:59", "remaining_time": "23:30:20", "throughput": 27075.83, "total_tokens": 4496731136} +{"current_steps": 16710, "total_steps": 25209, "loss": 0.9706, "lr": 3.059434715191236e-05, "epoch": 1.9885828616480845, "percentage": 66.29, "elapsed_time": "1 day, 22:09:38", "remaining_time": "23:28:41", "throughput": 27076.0, "total_tokens": 4499447680} +{"current_steps": 16720, "total_steps": 25209, "loss": 0.9609, "lr": 3.0588621411748074e-05, "epoch": 1.9897729216717368, "percentage": 66.33, "elapsed_time": "1 day, 22:11:11", "remaining_time": "23:26:58", "throughput": 27076.89, "total_tokens": 4502118656} +{"current_steps": 16730, "total_steps": 25209, "loss": 0.9729, "lr": 3.0582898885102344e-05, "epoch": 1.990962981695389, "percentage": 66.37, "elapsed_time": "1 day, 22:12:45", "remaining_time": "23:25:16", "throughput": 27077.78, "total_tokens": 4504802176} +{"current_steps": 16740, "total_steps": 25209, "loss": 0.9534, "lr": 3.0577179568970366e-05, "epoch": 1.9921530417190416, "percentage": 66.4, "elapsed_time": "1 day, 22:14:21", "remaining_time": "23:23:35", "throughput": 27078.3, "total_tokens": 4507485248} +{"current_steps": 16750, "total_steps": 25209, "loss": 0.9519, "lr": 3.057146346035127e-05, "epoch": 1.9933431017426941, "percentage": 66.44, "elapsed_time": "1 day, 22:15:52", "remaining_time": "23:21:51", "throughput": 27078.97, "total_tokens": 4510081152} +{"current_steps": 16760, "total_steps": 25209, "loss": 0.9543, "lr": 3.056575055624811e-05, "epoch": 1.9945331617663467, "percentage": 66.48, "elapsed_time": "1 day, 22:17:28", "remaining_time": "23:20:10", "throughput": 27079.38, "total_tokens": 4512744064} +{"current_steps": 16770, "total_steps": 25209, "loss": 0.9661, "lr": 3.0560040853667846e-05, "epoch": 1.9957232217899992, "percentage": 66.52, "elapsed_time": "1 day, 22:19:08", "remaining_time": "23:18:30", "throughput": 27079.36, "total_tokens": 4515429504} +{"current_steps": 16780, "total_steps": 25209, "loss": 0.9605, "lr": 3.0554334349621366e-05, "epoch": 1.9969132818136515, "percentage": 66.56, "elapsed_time": "1 day, 22:20:45", "remaining_time": "23:16:50", "throughput": 27079.54, "total_tokens": 4518097984} +{"current_steps": 16790, "total_steps": 25209, "loss": 0.9375, "lr": 3.054863104112347e-05, "epoch": 1.9981033418373038, "percentage": 66.6, "elapsed_time": "1 day, 22:22:22", "remaining_time": "23:15:09", "throughput": 27079.96, "total_tokens": 4520782528} +{"current_steps": 16800, "total_steps": 25209, "loss": 0.9597, "lr": 3.0542930925192835e-05, "epoch": 1.9992934018609563, "percentage": 66.64, "elapsed_time": "1 day, 22:23:59", "remaining_time": "23:13:29", "throughput": 27080.27, "total_tokens": 4523479808} +{"current_steps": 16810, "total_steps": 25209, "loss": 0.9439, "lr": 3.053723399885205e-05, "epoch": 2.000476024009461, "percentage": 66.68, "elapsed_time": "1 day, 22:25:35", "remaining_time": "23:11:48", "throughput": 27080.67, "total_tokens": 4526146624} +{"current_steps": 16820, "total_steps": 25209, "loss": 0.9165, "lr": 3.0531540259127565e-05, "epoch": 2.0016660840331135, "percentage": 66.72, "elapsed_time": "1 day, 22:27:15", "remaining_time": "23:10:09", "throughput": 27080.64, "total_tokens": 4528850624} +{"current_steps": 16830, "total_steps": 25209, "loss": 0.9179, "lr": 3.052584970304976e-05, "epoch": 2.002856144056766, "percentage": 66.76, "elapsed_time": "1 day, 22:28:57", "remaining_time": "23:08:30", "throughput": 27080.66, "total_tokens": 4531597056} +{"current_steps": 16840, "total_steps": 25209, "loss": 0.9082, "lr": 3.052016232765282e-05, "epoch": 2.004046204080418, "percentage": 66.8, "elapsed_time": "1 day, 22:30:36", "remaining_time": "23:06:51", "throughput": 27080.92, "total_tokens": 4534344832} +{"current_steps": 16850, "total_steps": 25209, "loss": 0.923, "lr": 3.0514478129974845e-05, "epoch": 2.0052362641040706, "percentage": 66.84, "elapsed_time": "1 day, 22:32:12", "remaining_time": "23:05:10", "throughput": 27081.59, "total_tokens": 4537045952} +{"current_steps": 16860, "total_steps": 25209, "loss": 0.9176, "lr": 3.0508797107057785e-05, "epoch": 2.006426324127723, "percentage": 66.88, "elapsed_time": "1 day, 22:33:47", "remaining_time": "23:03:28", "throughput": 27082.31, "total_tokens": 4539737408} +{"current_steps": 16870, "total_steps": 25209, "loss": 0.919, "lr": 3.0503119255947432e-05, "epoch": 2.0076163841513757, "percentage": 66.92, "elapsed_time": "1 day, 22:35:23", "remaining_time": "23:01:47", "throughput": 27082.68, "total_tokens": 4542393920} +{"current_steps": 16880, "total_steps": 25209, "loss": 0.9271, "lr": 3.049744457369344e-05, "epoch": 2.008806444175028, "percentage": 66.96, "elapsed_time": "1 day, 22:37:02", "remaining_time": "23:00:07", "throughput": 27082.83, "total_tokens": 4545100480} +{"current_steps": 16890, "total_steps": 25209, "loss": 0.9134, "lr": 3.049177305734929e-05, "epoch": 2.0099965041986807, "percentage": 67.0, "elapsed_time": "1 day, 22:38:37", "remaining_time": "22:58:25", "throughput": 27083.4, "total_tokens": 4547771200} +{"current_steps": 16900, "total_steps": 25209, "loss": 0.9225, "lr": 3.04861047039723e-05, "epoch": 2.0111865642223328, "percentage": 67.04, "elapsed_time": "1 day, 22:40:13", "remaining_time": "22:56:45", "throughput": 27083.9, "total_tokens": 4550463808} +{"current_steps": 16910, "total_steps": 25209, "loss": 0.9093, "lr": 3.0480439510623638e-05, "epoch": 2.0123766242459853, "percentage": 67.08, "elapsed_time": "1 day, 22:41:49", "remaining_time": "22:55:03", "throughput": 27084.53, "total_tokens": 4553165312} +{"current_steps": 16920, "total_steps": 25209, "loss": 0.9355, "lr": 3.0474777474368255e-05, "epoch": 2.013566684269638, "percentage": 67.12, "elapsed_time": "1 day, 22:43:22", "remaining_time": "22:53:21", "throughput": 27085.21, "total_tokens": 4555808448} +{"current_steps": 16930, "total_steps": 25209, "loss": 0.9071, "lr": 3.046911859227495e-05, "epoch": 2.0147567442932903, "percentage": 67.16, "elapsed_time": "1 day, 22:45:01", "remaining_time": "22:51:41", "throughput": 27085.48, "total_tokens": 4558537088} +{"current_steps": 16940, "total_steps": 25209, "loss": 0.9192, "lr": 3.0463462861416302e-05, "epoch": 2.015946804316943, "percentage": 67.2, "elapsed_time": "1 day, 22:46:37", "remaining_time": "22:50:00", "throughput": 27085.79, "total_tokens": 4561189376} +{"current_steps": 16950, "total_steps": 25209, "loss": 0.9258, "lr": 3.045781027886873e-05, "epoch": 2.0171368643405954, "percentage": 67.24, "elapsed_time": "1 day, 22:48:08", "remaining_time": "22:48:17", "throughput": 27086.72, "total_tokens": 4563804544} +{"current_steps": 16960, "total_steps": 25209, "loss": 0.916, "lr": 3.0452160841712408e-05, "epoch": 2.0183269243642474, "percentage": 67.28, "elapsed_time": "1 day, 22:49:48", "remaining_time": "22:46:38", "throughput": 27087.12, "total_tokens": 4566585600} +{"current_steps": 16970, "total_steps": 25209, "loss": 0.9264, "lr": 3.044651454703133e-05, "epoch": 2.0195169843879, "percentage": 67.32, "elapsed_time": "1 day, 22:51:19", "remaining_time": "22:44:54", "throughput": 27088.28, "total_tokens": 4569231360} +{"current_steps": 16980, "total_steps": 25209, "loss": 0.9266, "lr": 3.0440871391913257e-05, "epoch": 2.0207070444115525, "percentage": 67.36, "elapsed_time": "1 day, 22:52:59", "remaining_time": "22:43:15", "throughput": 27088.05, "total_tokens": 4571918976} +{"current_steps": 16990, "total_steps": 25209, "loss": 0.9331, "lr": 3.043523137344973e-05, "epoch": 2.021897104435205, "percentage": 67.4, "elapsed_time": "1 day, 22:54:39", "remaining_time": "22:41:36", "throughput": 27088.29, "total_tokens": 4574656576} +{"current_steps": 17000, "total_steps": 25209, "loss": 0.9175, "lr": 3.0429594488736074e-05, "epoch": 2.0230871644588575, "percentage": 67.44, "elapsed_time": "1 day, 22:56:13", "remaining_time": "22:39:54", "throughput": 27088.91, "total_tokens": 4577308928} +{"current_steps": 17010, "total_steps": 25209, "loss": 0.9265, "lr": 3.0423960734871348e-05, "epoch": 2.02427722448251, "percentage": 67.48, "elapsed_time": "1 day, 22:57:47", "remaining_time": "22:38:12", "throughput": 27089.39, "total_tokens": 4579933632} +{"current_steps": 17020, "total_steps": 25209, "loss": 0.912, "lr": 3.0418330108958404e-05, "epoch": 2.025467284506162, "percentage": 67.52, "elapsed_time": "1 day, 22:59:20", "remaining_time": "22:36:29", "throughput": 27090.01, "total_tokens": 4582563136} +{"current_steps": 17030, "total_steps": 25209, "loss": 0.9265, "lr": 3.0412702608103828e-05, "epoch": 2.0266573445298146, "percentage": 67.56, "elapsed_time": "1 day, 23:00:59", "remaining_time": "22:34:50", "throughput": 27090.27, "total_tokens": 4585296192} +{"current_steps": 17040, "total_steps": 25209, "loss": 0.9183, "lr": 3.0407078229417944e-05, "epoch": 2.027847404553467, "percentage": 67.59, "elapsed_time": "1 day, 23:02:30", "remaining_time": "22:33:07", "throughput": 27091.18, "total_tokens": 4587914880} +{"current_steps": 17050, "total_steps": 25209, "loss": 0.9215, "lr": 3.0401456970014836e-05, "epoch": 2.0290374645771196, "percentage": 67.63, "elapsed_time": "1 day, 23:04:05", "remaining_time": "22:31:25", "throughput": 27091.95, "total_tokens": 4590608448} +{"current_steps": 17060, "total_steps": 25209, "loss": 0.9218, "lr": 3.039583882701231e-05, "epoch": 2.030227524600772, "percentage": 67.67, "elapsed_time": "1 day, 23:05:38", "remaining_time": "22:29:42", "throughput": 27092.63, "total_tokens": 4593238272} +{"current_steps": 17070, "total_steps": 25209, "loss": 0.9332, "lr": 3.0390223797531887e-05, "epoch": 2.0314175846244247, "percentage": 67.71, "elapsed_time": "1 day, 23:07:15", "remaining_time": "22:28:02", "throughput": 27093.0, "total_tokens": 4595924032} +{"current_steps": 17080, "total_steps": 25209, "loss": 0.926, "lr": 3.0384611878698837e-05, "epoch": 2.0326076446480768, "percentage": 67.75, "elapsed_time": "1 day, 23:08:52", "remaining_time": "22:26:22", "throughput": 27093.43, "total_tokens": 4598643520} +{"current_steps": 17090, "total_steps": 25209, "loss": 0.9248, "lr": 3.0379003067642113e-05, "epoch": 2.0337977046717293, "percentage": 67.79, "elapsed_time": "1 day, 23:10:28", "remaining_time": "22:24:40", "throughput": 27094.04, "total_tokens": 4601334720} +{"current_steps": 17100, "total_steps": 25209, "loss": 0.9024, "lr": 3.037339736149441e-05, "epoch": 2.034987764695382, "percentage": 67.83, "elapsed_time": "1 day, 23:11:57", "remaining_time": "22:22:56", "throughput": 27095.06, "total_tokens": 4603931008} +{"current_steps": 17110, "total_steps": 25209, "loss": 0.9289, "lr": 3.0367794757392092e-05, "epoch": 2.0361778247190343, "percentage": 67.87, "elapsed_time": "1 day, 23:13:32", "remaining_time": "22:21:15", "throughput": 27095.62, "total_tokens": 4606595840} +{"current_steps": 17120, "total_steps": 25209, "loss": 0.9208, "lr": 3.0362195252475245e-05, "epoch": 2.037367884742687, "percentage": 67.91, "elapsed_time": "1 day, 23:15:13", "remaining_time": "22:19:36", "throughput": 27095.61, "total_tokens": 4609333952} +{"current_steps": 17130, "total_steps": 25209, "loss": 0.9189, "lr": 3.0356598843887634e-05, "epoch": 2.0385579447663393, "percentage": 67.95, "elapsed_time": "1 day, 23:16:47", "remaining_time": "22:17:54", "throughput": 27096.29, "total_tokens": 4612005120} +{"current_steps": 17140, "total_steps": 25209, "loss": 0.9325, "lr": 3.03510055287767e-05, "epoch": 2.0397480047899914, "percentage": 67.99, "elapsed_time": "1 day, 23:18:24", "remaining_time": "22:16:14", "throughput": 27096.81, "total_tokens": 4614715904} +{"current_steps": 17150, "total_steps": 25209, "loss": 0.9082, "lr": 3.0345415304293578e-05, "epoch": 2.040938064813644, "percentage": 68.03, "elapsed_time": "1 day, 23:20:02", "remaining_time": "22:14:34", "throughput": 27097.3, "total_tokens": 4617456000} +{"current_steps": 17160, "total_steps": 25209, "loss": 0.9187, "lr": 3.0339828167593065e-05, "epoch": 2.0421281248372964, "percentage": 68.07, "elapsed_time": "1 day, 23:21:41", "remaining_time": "22:12:54", "throughput": 27097.7, "total_tokens": 4620205888} +{"current_steps": 17170, "total_steps": 25209, "loss": 0.9335, "lr": 3.033424411583363e-05, "epoch": 2.043318184860949, "percentage": 68.11, "elapsed_time": "1 day, 23:23:13", "remaining_time": "22:11:12", "throughput": 27098.36, "total_tokens": 4622815488} +{"current_steps": 17180, "total_steps": 25209, "loss": 0.9152, "lr": 3.0328663146177387e-05, "epoch": 2.0445082448846015, "percentage": 68.15, "elapsed_time": "1 day, 23:24:50", "remaining_time": "22:09:31", "throughput": 27098.85, "total_tokens": 4625506624} +{"current_steps": 17190, "total_steps": 25209, "loss": 0.9161, "lr": 3.032308525579013e-05, "epoch": 2.045698304908254, "percentage": 68.19, "elapsed_time": "1 day, 23:26:25", "remaining_time": "22:07:50", "throughput": 27099.39, "total_tokens": 4628184576} +{"current_steps": 17200, "total_steps": 25209, "loss": 0.9196, "lr": 3.031751044184127e-05, "epoch": 2.046888364931906, "percentage": 68.23, "elapsed_time": "1 day, 23:28:03", "remaining_time": "22:06:09", "throughput": 27099.79, "total_tokens": 4630899520} +{"current_steps": 17210, "total_steps": 25209, "loss": 0.9223, "lr": 3.0311938701503872e-05, "epoch": 2.0480784249555586, "percentage": 68.27, "elapsed_time": "1 day, 23:29:37", "remaining_time": "22:04:28", "throughput": 27100.58, "total_tokens": 4633592576} +{"current_steps": 17220, "total_steps": 25209, "loss": 0.9304, "lr": 3.0306370031954646e-05, "epoch": 2.049268484979211, "percentage": 68.31, "elapsed_time": "1 day, 23:31:18", "remaining_time": "22:02:49", "throughput": 27100.6, "total_tokens": 4636334592} +{"current_steps": 17230, "total_steps": 25209, "loss": 0.9229, "lr": 3.030080443037393e-05, "epoch": 2.0504585450028636, "percentage": 68.35, "elapsed_time": "1 day, 23:33:01", "remaining_time": "22:01:12", "throughput": 27100.29, "total_tokens": 4639067136} +{"current_steps": 17240, "total_steps": 25209, "loss": 0.9087, "lr": 3.0295241893945663e-05, "epoch": 2.051648605026516, "percentage": 68.39, "elapsed_time": "1 day, 23:34:39", "remaining_time": "21:59:31", "throughput": 27100.48, "total_tokens": 4641747072} +{"current_steps": 17250, "total_steps": 25209, "loss": 0.9225, "lr": 3.028968241985743e-05, "epoch": 2.0528386650501687, "percentage": 68.43, "elapsed_time": "1 day, 23:36:18", "remaining_time": "21:57:52", "throughput": 27100.62, "total_tokens": 4644467584} +{"current_steps": 17260, "total_steps": 25209, "loss": 0.9293, "lr": 3.0284126005300405e-05, "epoch": 2.0540287250738207, "percentage": 68.47, "elapsed_time": "1 day, 23:37:56", "remaining_time": "21:56:12", "throughput": 27100.92, "total_tokens": 4647168000} +{"current_steps": 17270, "total_steps": 25209, "loss": 0.9221, "lr": 3.0278572647469385e-05, "epoch": 2.0552187850974732, "percentage": 68.51, "elapsed_time": "1 day, 23:39:31", "remaining_time": "21:54:31", "throughput": 27101.59, "total_tokens": 4649867008} +{"current_steps": 17280, "total_steps": 25209, "loss": 0.925, "lr": 3.027302234356275e-05, "epoch": 2.0564088451211258, "percentage": 68.55, "elapsed_time": "1 day, 23:41:08", "remaining_time": "21:52:51", "throughput": 27102.12, "total_tokens": 4652591872} +{"current_steps": 17290, "total_steps": 25209, "loss": 0.9409, "lr": 3.0267475090782494e-05, "epoch": 2.0575989051447783, "percentage": 68.59, "elapsed_time": "1 day, 23:42:45", "remaining_time": "21:51:10", "throughput": 27102.56, "total_tokens": 4655295488} +{"current_steps": 17300, "total_steps": 25209, "loss": 0.9322, "lr": 3.026193088633418e-05, "epoch": 2.058788965168431, "percentage": 68.63, "elapsed_time": "1 day, 23:44:18", "remaining_time": "21:49:28", "throughput": 27103.45, "total_tokens": 4657971648} +{"current_steps": 17310, "total_steps": 25209, "loss": 0.9247, "lr": 3.0256389727426952e-05, "epoch": 2.0599790251920833, "percentage": 68.67, "elapsed_time": "1 day, 23:45:55", "remaining_time": "21:47:47", "throughput": 27103.97, "total_tokens": 4660685504} +{"current_steps": 17320, "total_steps": 25209, "loss": 0.92, "lr": 3.0250851611273555e-05, "epoch": 2.0611690852157354, "percentage": 68.71, "elapsed_time": "1 day, 23:47:31", "remaining_time": "21:46:06", "throughput": 27104.47, "total_tokens": 4663368512} +{"current_steps": 17330, "total_steps": 25209, "loss": 0.9173, "lr": 3.0245316535090273e-05, "epoch": 2.062359145239388, "percentage": 68.75, "elapsed_time": "1 day, 23:49:08", "remaining_time": "21:44:26", "throughput": 27105.15, "total_tokens": 4666097216} +{"current_steps": 17340, "total_steps": 25209, "loss": 0.9227, "lr": 3.023978449609697e-05, "epoch": 2.0635492052630404, "percentage": 68.78, "elapsed_time": "1 day, 23:50:46", "remaining_time": "21:42:46", "throughput": 27105.37, "total_tokens": 4668806656} +{"current_steps": 17350, "total_steps": 25209, "loss": 0.9371, "lr": 3.023425549151707e-05, "epoch": 2.064739265286693, "percentage": 68.82, "elapsed_time": "1 day, 23:52:20", "remaining_time": "21:41:04", "throughput": 27105.99, "total_tokens": 4671451392} +{"current_steps": 17360, "total_steps": 25209, "loss": 0.9081, "lr": 3.022872951857754e-05, "epoch": 2.0659293253103455, "percentage": 68.86, "elapsed_time": "1 day, 23:53:55", "remaining_time": "21:39:23", "throughput": 27106.37, "total_tokens": 4674108032} +{"current_steps": 17370, "total_steps": 25209, "loss": 0.9255, "lr": 3.0223206574508904e-05, "epoch": 2.067119385333998, "percentage": 68.9, "elapsed_time": "1 day, 23:55:34", "remaining_time": "21:37:43", "throughput": 27106.8, "total_tokens": 4676852416} +{"current_steps": 17380, "total_steps": 25209, "loss": 0.9052, "lr": 3.0217686656545224e-05, "epoch": 2.06830944535765, "percentage": 68.94, "elapsed_time": "1 day, 23:57:13", "remaining_time": "21:36:04", "throughput": 27106.75, "total_tokens": 4679541056} +{"current_steps": 17390, "total_steps": 25209, "loss": 0.9213, "lr": 3.0212169761924077e-05, "epoch": 2.0694995053813026, "percentage": 68.98, "elapsed_time": "1 day, 23:58:50", "remaining_time": "21:34:24", "throughput": 27107.1, "total_tokens": 4682229376} +{"current_steps": 17400, "total_steps": 25209, "loss": 0.9025, "lr": 3.0206655887886604e-05, "epoch": 2.070689565404955, "percentage": 69.02, "elapsed_time": "2 days, 0:00:24", "remaining_time": "21:32:42", "throughput": 27107.88, "total_tokens": 4684913344} +{"current_steps": 17410, "total_steps": 25209, "loss": 0.9411, "lr": 3.0201145031677448e-05, "epoch": 2.0718796254286076, "percentage": 69.06, "elapsed_time": "2 days, 0:02:02", "remaining_time": "21:31:02", "throughput": 27108.14, "total_tokens": 4687617024} +{"current_steps": 17420, "total_steps": 25209, "loss": 0.9291, "lr": 3.019563719054477e-05, "epoch": 2.07306968545226, "percentage": 69.1, "elapsed_time": "2 days, 0:03:43", "remaining_time": "21:29:23", "throughput": 27108.21, "total_tokens": 4690349824} +{"current_steps": 17430, "total_steps": 25209, "loss": 0.9173, "lr": 3.019013236174025e-05, "epoch": 2.0742597454759126, "percentage": 69.14, "elapsed_time": "2 days, 0:05:18", "remaining_time": "21:27:42", "throughput": 27108.77, "total_tokens": 4693037888} +{"current_steps": 17440, "total_steps": 25209, "loss": 0.922, "lr": 3.018463054251906e-05, "epoch": 2.0754498054995647, "percentage": 69.18, "elapsed_time": "2 days, 0:07:03", "remaining_time": "21:26:06", "throughput": 27108.58, "total_tokens": 4695855232} +{"current_steps": 17450, "total_steps": 25209, "loss": 0.9191, "lr": 3.017913173013989e-05, "epoch": 2.076639865523217, "percentage": 69.22, "elapsed_time": "2 days, 0:08:47", "remaining_time": "21:24:28", "throughput": 27108.44, "total_tokens": 4698641792} +{"current_steps": 17460, "total_steps": 25209, "loss": 0.9049, "lr": 3.017363592186491e-05, "epoch": 2.0778299255468697, "percentage": 69.26, "elapsed_time": "2 days, 0:10:23", "remaining_time": "21:22:47", "throughput": 27108.89, "total_tokens": 4701316416} +{"current_steps": 17470, "total_steps": 25209, "loss": 0.9212, "lr": 3.0168143114959797e-05, "epoch": 2.0790199855705223, "percentage": 69.3, "elapsed_time": "2 days, 0:11:57", "remaining_time": "21:21:06", "throughput": 27109.65, "total_tokens": 4703996416} +{"current_steps": 17480, "total_steps": 25209, "loss": 0.9327, "lr": 3.016265330669369e-05, "epoch": 2.0802100455941748, "percentage": 69.34, "elapsed_time": "2 days, 0:13:30", "remaining_time": "21:19:24", "throughput": 27110.38, "total_tokens": 4706644352} +{"current_steps": 17490, "total_steps": 25209, "loss": 0.9239, "lr": 3.0157166494339223e-05, "epoch": 2.0814001056178273, "percentage": 69.38, "elapsed_time": "2 days, 0:15:07", "remaining_time": "21:17:43", "throughput": 27110.91, "total_tokens": 4709379200} +{"current_steps": 17500, "total_steps": 25209, "loss": 0.9098, "lr": 3.0151682675172482e-05, "epoch": 2.0825901656414794, "percentage": 69.42, "elapsed_time": "2 days, 0:16:45", "remaining_time": "21:16:04", "throughput": 27111.16, "total_tokens": 4712082176} +{"current_steps": 17510, "total_steps": 25209, "loss": 0.9158, "lr": 3.0146201846473034e-05, "epoch": 2.083780225665132, "percentage": 69.46, "elapsed_time": "2 days, 0:18:22", "remaining_time": "21:14:23", "throughput": 27111.65, "total_tokens": 4714770048} +{"current_steps": 17520, "total_steps": 25209, "loss": 0.9128, "lr": 3.01407240055239e-05, "epoch": 2.0849702856887844, "percentage": 69.5, "elapsed_time": "2 days, 0:19:57", "remaining_time": "21:12:42", "throughput": 27112.15, "total_tokens": 4717452160} +{"current_steps": 17530, "total_steps": 25209, "loss": 0.901, "lr": 3.013524914961157e-05, "epoch": 2.086160345712437, "percentage": 69.54, "elapsed_time": "2 days, 0:21:31", "remaining_time": "21:11:00", "throughput": 27112.94, "total_tokens": 4720120640} +{"current_steps": 17540, "total_steps": 25209, "loss": 0.9282, "lr": 3.012977727602596e-05, "epoch": 2.0873504057360894, "percentage": 69.58, "elapsed_time": "2 days, 0:23:07", "remaining_time": "21:09:20", "throughput": 27113.32, "total_tokens": 4722815168} +{"current_steps": 17550, "total_steps": 25209, "loss": 0.9234, "lr": 3.0124308382060446e-05, "epoch": 2.088540465759742, "percentage": 69.62, "elapsed_time": "2 days, 0:24:42", "remaining_time": "21:07:38", "throughput": 27114.1, "total_tokens": 4725518464} +{"current_steps": 17560, "total_steps": 25209, "loss": 0.9347, "lr": 3.011884246501183e-05, "epoch": 2.089730525783394, "percentage": 69.66, "elapsed_time": "2 days, 0:26:15", "remaining_time": "21:05:56", "throughput": 27114.89, "total_tokens": 4728180096} +{"current_steps": 17570, "total_steps": 25209, "loss": 0.9123, "lr": 3.0113379522180363e-05, "epoch": 2.0909205858070465, "percentage": 69.7, "elapsed_time": "2 days, 0:27:52", "remaining_time": "21:04:16", "throughput": 27115.22, "total_tokens": 4730847232} +{"current_steps": 17580, "total_steps": 25209, "loss": 0.9266, "lr": 3.0107919550869702e-05, "epoch": 2.092110645830699, "percentage": 69.74, "elapsed_time": "2 days, 0:29:29", "remaining_time": "21:02:35", "throughput": 27115.71, "total_tokens": 4733569728} +{"current_steps": 17590, "total_steps": 25209, "loss": 0.9133, "lr": 3.0102462548386933e-05, "epoch": 2.0933007058543516, "percentage": 69.78, "elapsed_time": "2 days, 0:31:08", "remaining_time": "21:00:56", "throughput": 27115.87, "total_tokens": 4736290880} +{"current_steps": 17600, "total_steps": 25209, "loss": 0.9039, "lr": 3.0097008512042572e-05, "epoch": 2.094490765878004, "percentage": 69.82, "elapsed_time": "2 days, 0:32:49", "remaining_time": "20:59:18", "throughput": 27116.07, "total_tokens": 4739063616} +{"current_steps": 17610, "total_steps": 25209, "loss": 0.9101, "lr": 3.009155743915052e-05, "epoch": 2.0956808259016566, "percentage": 69.86, "elapsed_time": "2 days, 0:34:22", "remaining_time": "20:57:35", "throughput": 27116.91, "total_tokens": 4741728960} +{"current_steps": 17620, "total_steps": 25209, "loss": 0.9118, "lr": 3.00861093270281e-05, "epoch": 2.0968708859253087, "percentage": 69.9, "elapsed_time": "2 days, 0:36:00", "remaining_time": "20:55:56", "throughput": 27117.28, "total_tokens": 4744446784} +{"current_steps": 17630, "total_steps": 25209, "loss": 0.9084, "lr": 3.008066417299602e-05, "epoch": 2.098060945948961, "percentage": 69.94, "elapsed_time": "2 days, 0:37:38", "remaining_time": "20:54:16", "throughput": 27117.35, "total_tokens": 4747131776} +{"current_steps": 17640, "total_steps": 25209, "loss": 0.9231, "lr": 3.00752219743784e-05, "epoch": 2.0992510059726137, "percentage": 69.98, "elapsed_time": "2 days, 0:39:13", "remaining_time": "20:52:35", "throughput": 27117.92, "total_tokens": 4749803648} +{"current_steps": 17650, "total_steps": 25209, "loss": 0.913, "lr": 3.0069782728502737e-05, "epoch": 2.1004410659962662, "percentage": 70.01, "elapsed_time": "2 days, 0:40:55", "remaining_time": "20:50:57", "throughput": 27117.78, "total_tokens": 4752540096} +{"current_steps": 17660, "total_steps": 25209, "loss": 0.9217, "lr": 3.00643464326999e-05, "epoch": 2.1016311260199187, "percentage": 70.05, "elapsed_time": "2 days, 0:42:33", "remaining_time": "20:49:17", "throughput": 27118.17, "total_tokens": 4755256256} +{"current_steps": 17670, "total_steps": 25209, "loss": 0.9219, "lr": 3.0058913084304146e-05, "epoch": 2.1028211860435713, "percentage": 70.09, "elapsed_time": "2 days, 0:44:11", "remaining_time": "20:47:37", "throughput": 27118.81, "total_tokens": 4758038976} +{"current_steps": 17680, "total_steps": 25209, "loss": 0.9183, "lr": 3.0053482680653112e-05, "epoch": 2.1040112460672233, "percentage": 70.13, "elapsed_time": "2 days, 0:45:44", "remaining_time": "20:45:55", "throughput": 27119.84, "total_tokens": 4760730240} +{"current_steps": 17690, "total_steps": 25209, "loss": 0.9219, "lr": 3.0048055219087777e-05, "epoch": 2.105201306090876, "percentage": 70.17, "elapsed_time": "2 days, 0:47:22", "remaining_time": "20:44:15", "throughput": 27120.06, "total_tokens": 4763424000} +{"current_steps": 17700, "total_steps": 25209, "loss": 0.9241, "lr": 3.0042630696952507e-05, "epoch": 2.1063913661145284, "percentage": 70.21, "elapsed_time": "2 days, 0:48:59", "remaining_time": "20:42:35", "throughput": 27120.39, "total_tokens": 4766118144} +{"current_steps": 17710, "total_steps": 25209, "loss": 0.9289, "lr": 3.0037209111594994e-05, "epoch": 2.107581426138181, "percentage": 70.25, "elapsed_time": "2 days, 0:50:38", "remaining_time": "20:40:55", "throughput": 27120.71, "total_tokens": 4768859840} +{"current_steps": 17720, "total_steps": 25209, "loss": 0.9182, "lr": 3.0031790460366305e-05, "epoch": 2.1087714861618334, "percentage": 70.29, "elapsed_time": "2 days, 0:52:13", "remaining_time": "20:39:14", "throughput": 27121.16, "total_tokens": 4771524032} +{"current_steps": 17730, "total_steps": 25209, "loss": 0.9294, "lr": 3.002637474062083e-05, "epoch": 2.109961546185486, "percentage": 70.33, "elapsed_time": "2 days, 0:53:49", "remaining_time": "20:37:34", "throughput": 27121.46, "total_tokens": 4774189632} +{"current_steps": 17740, "total_steps": 25209, "loss": 0.9226, "lr": 3.0020961949716325e-05, "epoch": 2.111151606209138, "percentage": 70.37, "elapsed_time": "2 days, 0:55:31", "remaining_time": "20:35:56", "throughput": 27121.39, "total_tokens": 4776939584} +{"current_steps": 17750, "total_steps": 25209, "loss": 0.9152, "lr": 3.0015552085013847e-05, "epoch": 2.1123416662327905, "percentage": 70.41, "elapsed_time": "2 days, 0:57:08", "remaining_time": "20:34:15", "throughput": 27122.02, "total_tokens": 4779674752} +{"current_steps": 17760, "total_steps": 25209, "loss": 0.9478, "lr": 3.0010145143877805e-05, "epoch": 2.113531726256443, "percentage": 70.45, "elapsed_time": "2 days, 0:58:44", "remaining_time": "20:32:34", "throughput": 27122.44, "total_tokens": 4782340992} +{"current_steps": 17770, "total_steps": 25209, "loss": 0.9175, "lr": 3.0004741123675907e-05, "epoch": 2.1147217862800956, "percentage": 70.49, "elapsed_time": "2 days, 1:00:21", "remaining_time": "20:30:54", "throughput": 27122.71, "total_tokens": 4785035264} +{"current_steps": 17780, "total_steps": 25209, "loss": 0.9248, "lr": 2.9999340021779205e-05, "epoch": 2.115911846303748, "percentage": 70.53, "elapsed_time": "2 days, 1:01:59", "remaining_time": "20:29:15", "throughput": 27122.82, "total_tokens": 4787714688} +{"current_steps": 17790, "total_steps": 25209, "loss": 0.9107, "lr": 2.999394183556204e-05, "epoch": 2.1171019063274006, "percentage": 70.57, "elapsed_time": "2 days, 1:03:33", "remaining_time": "20:27:33", "throughput": 27123.62, "total_tokens": 4790408768} +{"current_steps": 17800, "total_steps": 25209, "loss": 0.9355, "lr": 2.998854656240207e-05, "epoch": 2.1182919663510527, "percentage": 70.61, "elapsed_time": "2 days, 1:05:12", "remaining_time": "20:25:54", "throughput": 27123.74, "total_tokens": 4793115328} +{"current_steps": 17810, "total_steps": 25209, "loss": 0.9332, "lr": 2.9983154199680257e-05, "epoch": 2.119482026374705, "percentage": 70.65, "elapsed_time": "2 days, 1:06:45", "remaining_time": "20:24:12", "throughput": 27124.52, "total_tokens": 4795767936} +{"current_steps": 17820, "total_steps": 25209, "loss": 0.9146, "lr": 2.9977764744780845e-05, "epoch": 2.1206720863983577, "percentage": 70.69, "elapsed_time": "2 days, 1:08:19", "remaining_time": "20:22:30", "throughput": 27125.09, "total_tokens": 4798409280} +{"current_steps": 17830, "total_steps": 25209, "loss": 0.9251, "lr": 2.9972378195091384e-05, "epoch": 2.12186214642201, "percentage": 70.73, "elapsed_time": "2 days, 1:09:57", "remaining_time": "20:20:50", "throughput": 27125.57, "total_tokens": 4801151040} +{"current_steps": 17840, "total_steps": 25209, "loss": 0.9155, "lr": 2.996699454800269e-05, "epoch": 2.1230522064456627, "percentage": 70.77, "elapsed_time": "2 days, 1:11:39", "remaining_time": "20:19:12", "throughput": 27125.33, "total_tokens": 4803882496} +{"current_steps": 17850, "total_steps": 25209, "loss": 0.9191, "lr": 2.9961613800908883e-05, "epoch": 2.1242422664693152, "percentage": 70.81, "elapsed_time": "2 days, 1:13:17", "remaining_time": "20:17:33", "throughput": 27125.55, "total_tokens": 4806580928} +{"current_steps": 17860, "total_steps": 25209, "loss": 0.9314, "lr": 2.995623595120733e-05, "epoch": 2.1254323264929673, "percentage": 70.85, "elapsed_time": "2 days, 1:14:52", "remaining_time": "20:15:51", "throughput": 27126.31, "total_tokens": 4809280384} +{"current_steps": 17870, "total_steps": 25209, "loss": 0.9217, "lr": 2.995086099629869e-05, "epoch": 2.12662238651662, "percentage": 70.89, "elapsed_time": "2 days, 1:16:27", "remaining_time": "20:14:10", "throughput": 27126.58, "total_tokens": 4811906944} +{"current_steps": 17880, "total_steps": 25209, "loss": 0.9148, "lr": 2.9945488933586867e-05, "epoch": 2.1278124465402724, "percentage": 70.93, "elapsed_time": "2 days, 1:18:03", "remaining_time": "20:12:30", "throughput": 27126.84, "total_tokens": 4814572672} +{"current_steps": 17890, "total_steps": 25209, "loss": 0.9136, "lr": 2.9940119760479045e-05, "epoch": 2.129002506563925, "percentage": 70.97, "elapsed_time": "2 days, 1:19:39", "remaining_time": "20:10:49", "throughput": 27127.19, "total_tokens": 4817237248} +{"current_steps": 17900, "total_steps": 25209, "loss": 0.9129, "lr": 2.9934753474385635e-05, "epoch": 2.1301925665875774, "percentage": 71.01, "elapsed_time": "2 days, 1:21:15", "remaining_time": "20:09:09", "throughput": 27127.85, "total_tokens": 4819965056} +{"current_steps": 17910, "total_steps": 25209, "loss": 0.928, "lr": 2.9929390072720314e-05, "epoch": 2.13138262661123, "percentage": 71.05, "elapsed_time": "2 days, 1:22:54", "remaining_time": "20:07:29", "throughput": 27128.23, "total_tokens": 4822698496} +{"current_steps": 17920, "total_steps": 25209, "loss": 0.9107, "lr": 2.99240295529e-05, "epoch": 2.132572686634882, "percentage": 71.09, "elapsed_time": "2 days, 1:24:29", "remaining_time": "20:05:48", "throughput": 27128.77, "total_tokens": 4825376192} +{"current_steps": 17930, "total_steps": 25209, "loss": 0.9104, "lr": 2.991867191234484e-05, "epoch": 2.1337627466585345, "percentage": 71.13, "elapsed_time": "2 days, 1:26:02", "remaining_time": "20:04:07", "throughput": 27129.6, "total_tokens": 4828052480} +{"current_steps": 17940, "total_steps": 25209, "loss": 0.9183, "lr": 2.991331714847822e-05, "epoch": 2.134952806682187, "percentage": 71.17, "elapsed_time": "2 days, 1:27:41", "remaining_time": "20:02:27", "throughput": 27129.75, "total_tokens": 4830762816} +{"current_steps": 17950, "total_steps": 25209, "loss": 0.9255, "lr": 2.990796525872675e-05, "epoch": 2.1361428667058395, "percentage": 71.2, "elapsed_time": "2 days, 1:29:15", "remaining_time": "20:00:46", "throughput": 27130.61, "total_tokens": 4833461632} +{"current_steps": 17960, "total_steps": 25209, "loss": 0.929, "lr": 2.990261624052027e-05, "epoch": 2.137332926729492, "percentage": 71.24, "elapsed_time": "2 days, 1:30:56", "remaining_time": "19:59:07", "throughput": 27130.48, "total_tokens": 4836187264} +{"current_steps": 17970, "total_steps": 25209, "loss": 0.9267, "lr": 2.989727009129182e-05, "epoch": 2.1385229867531446, "percentage": 71.28, "elapsed_time": "2 days, 1:32:35", "remaining_time": "19:57:28", "throughput": 27130.69, "total_tokens": 4838895040} +{"current_steps": 17980, "total_steps": 25209, "loss": 0.924, "lr": 2.989192680847766e-05, "epoch": 2.1397130467767966, "percentage": 71.32, "elapsed_time": "2 days, 1:34:10", "remaining_time": "19:55:47", "throughput": 27131.32, "total_tokens": 4841590016} +{"current_steps": 17990, "total_steps": 25209, "loss": 0.9134, "lr": 2.9886586389517267e-05, "epoch": 2.140903106800449, "percentage": 71.36, "elapsed_time": "2 days, 1:35:48", "remaining_time": "19:54:07", "throughput": 27131.56, "total_tokens": 4844288320} +{"current_steps": 18000, "total_steps": 25209, "loss": 0.9233, "lr": 2.98812488318533e-05, "epoch": 2.1420931668241017, "percentage": 71.4, "elapsed_time": "2 days, 1:37:25", "remaining_time": "19:52:27", "throughput": 27131.86, "total_tokens": 4846972736} +{"current_steps": 18010, "total_steps": 25209, "loss": 0.9383, "lr": 2.987591413293162e-05, "epoch": 2.143283226847754, "percentage": 71.44, "elapsed_time": "2 days, 1:38:59", "remaining_time": "19:50:46", "throughput": 27132.3, "total_tokens": 4849605760} +{"current_steps": 18020, "total_steps": 25209, "loss": 0.9231, "lr": 2.98705822902013e-05, "epoch": 2.1444732868714067, "percentage": 71.48, "elapsed_time": "2 days, 1:40:34", "remaining_time": "19:49:05", "throughput": 27133.05, "total_tokens": 4852314368} +{"current_steps": 18030, "total_steps": 25209, "loss": 0.9233, "lr": 2.9865253301114553e-05, "epoch": 2.145663346895059, "percentage": 71.52, "elapsed_time": "2 days, 1:42:15", "remaining_time": "19:47:26", "throughput": 27133.0, "total_tokens": 4855047936} +{"current_steps": 18040, "total_steps": 25209, "loss": 0.9107, "lr": 2.985992716312683e-05, "epoch": 2.1468534069187113, "percentage": 71.56, "elapsed_time": "2 days, 1:43:47", "remaining_time": "19:45:44", "throughput": 27133.68, "total_tokens": 4857676224} +{"current_steps": 18050, "total_steps": 25209, "loss": 0.9186, "lr": 2.9854603873696703e-05, "epoch": 2.148043466942364, "percentage": 71.6, "elapsed_time": "2 days, 1:45:24", "remaining_time": "19:44:04", "throughput": 27134.28, "total_tokens": 4860421120} +{"current_steps": 18060, "total_steps": 25209, "loss": 0.9128, "lr": 2.9849283430285947e-05, "epoch": 2.1492335269660163, "percentage": 71.64, "elapsed_time": "2 days, 1:47:00", "remaining_time": "19:42:23", "throughput": 27134.71, "total_tokens": 4863093696} +{"current_steps": 18070, "total_steps": 25209, "loss": 0.9254, "lr": 2.98439658303595e-05, "epoch": 2.150423586989669, "percentage": 71.68, "elapsed_time": "2 days, 1:48:37", "remaining_time": "19:40:43", "throughput": 27135.1, "total_tokens": 4865794880} +{"current_steps": 18080, "total_steps": 25209, "loss": 0.9185, "lr": 2.9838651071385442e-05, "epoch": 2.1516136470133214, "percentage": 71.72, "elapsed_time": "2 days, 1:50:07", "remaining_time": "19:39:01", "throughput": 27135.88, "total_tokens": 4868390912} +{"current_steps": 18090, "total_steps": 25209, "loss": 0.9218, "lr": 2.9833339150835037e-05, "epoch": 2.152803707036974, "percentage": 71.76, "elapsed_time": "2 days, 1:51:46", "remaining_time": "19:37:21", "throughput": 27135.87, "total_tokens": 4871075072} +{"current_steps": 18100, "total_steps": 25209, "loss": 0.9131, "lr": 2.982803006618267e-05, "epoch": 2.153993767060626, "percentage": 71.8, "elapsed_time": "2 days, 1:53:22", "remaining_time": "19:35:41", "throughput": 27136.26, "total_tokens": 4873750464} +{"current_steps": 18110, "total_steps": 25209, "loss": 0.9227, "lr": 2.982272381490588e-05, "epoch": 2.1551838270842785, "percentage": 71.84, "elapsed_time": "2 days, 1:55:05", "remaining_time": "19:34:03", "throughput": 27136.03, "total_tokens": 4876497920} +{"current_steps": 18120, "total_steps": 25209, "loss": 0.9185, "lr": 2.9817420394485363e-05, "epoch": 2.156373887107931, "percentage": 71.88, "elapsed_time": "2 days, 1:56:48", "remaining_time": "19:32:25", "throughput": 27135.79, "total_tokens": 4879253888} +{"current_steps": 18130, "total_steps": 25209, "loss": 0.9344, "lr": 2.9812119802404927e-05, "epoch": 2.1575639471315835, "percentage": 71.92, "elapsed_time": "2 days, 1:58:23", "remaining_time": "19:30:44", "throughput": 27136.4, "total_tokens": 4881945984} +{"current_steps": 18140, "total_steps": 25209, "loss": 0.9218, "lr": 2.9806822036151523e-05, "epoch": 2.158754007155236, "percentage": 71.96, "elapsed_time": "2 days, 2:00:02", "remaining_time": "19:29:05", "throughput": 27136.48, "total_tokens": 4884627328} +{"current_steps": 18150, "total_steps": 25209, "loss": 0.9157, "lr": 2.980152709321522e-05, "epoch": 2.1599440671788885, "percentage": 72.0, "elapsed_time": "2 days, 2:01:38", "remaining_time": "19:27:25", "throughput": 27136.76, "total_tokens": 4887296064} +{"current_steps": 18160, "total_steps": 25209, "loss": 0.9, "lr": 2.9796234971089214e-05, "epoch": 2.1611341272025406, "percentage": 72.04, "elapsed_time": "2 days, 2:03:12", "remaining_time": "19:25:43", "throughput": 27137.6, "total_tokens": 4889985920} +{"current_steps": 18170, "total_steps": 25209, "loss": 0.9165, "lr": 2.979094566726981e-05, "epoch": 2.162324187226193, "percentage": 72.08, "elapsed_time": "2 days, 2:04:49", "remaining_time": "19:24:03", "throughput": 27137.86, "total_tokens": 4892669120} +{"current_steps": 18180, "total_steps": 25209, "loss": 0.9227, "lr": 2.9785659179256427e-05, "epoch": 2.1635142472498456, "percentage": 72.12, "elapsed_time": "2 days, 2:06:21", "remaining_time": "19:22:21", "throughput": 27138.59, "total_tokens": 4895297408} +{"current_steps": 18190, "total_steps": 25209, "loss": 0.9213, "lr": 2.978037550455159e-05, "epoch": 2.164704307273498, "percentage": 72.16, "elapsed_time": "2 days, 2:07:55", "remaining_time": "19:20:40", "throughput": 27139.38, "total_tokens": 4897988992} +{"current_steps": 18200, "total_steps": 25209, "loss": 0.9161, "lr": 2.977509464066091e-05, "epoch": 2.1658943672971507, "percentage": 72.2, "elapsed_time": "2 days, 2:09:30", "remaining_time": "19:18:59", "throughput": 27139.8, "total_tokens": 4900658880} +{"current_steps": 18210, "total_steps": 25209, "loss": 0.9152, "lr": 2.9769816585093126e-05, "epoch": 2.167084427320803, "percentage": 72.24, "elapsed_time": "2 days, 2:11:07", "remaining_time": "19:17:19", "throughput": 27140.23, "total_tokens": 4903357376} +{"current_steps": 18220, "total_steps": 25209, "loss": 0.9162, "lr": 2.9764541335360024e-05, "epoch": 2.1682744873444553, "percentage": 72.28, "elapsed_time": "2 days, 2:12:44", "remaining_time": "19:15:39", "throughput": 27140.45, "total_tokens": 4906030144} +{"current_steps": 18230, "total_steps": 25209, "loss": 0.9245, "lr": 2.9759268888976505e-05, "epoch": 2.169464547368108, "percentage": 72.32, "elapsed_time": "2 days, 2:14:22", "remaining_time": "19:13:59", "throughput": 27140.78, "total_tokens": 4908754688} +{"current_steps": 18240, "total_steps": 25209, "loss": 0.9284, "lr": 2.9753999243460546e-05, "epoch": 2.1706546073917603, "percentage": 72.36, "elapsed_time": "2 days, 2:16:00", "remaining_time": "19:12:19", "throughput": 27141.3, "total_tokens": 4911495680} +{"current_steps": 18250, "total_steps": 25209, "loss": 0.9247, "lr": 2.974873239633319e-05, "epoch": 2.171844667415413, "percentage": 72.39, "elapsed_time": "2 days, 2:17:41", "remaining_time": "19:10:41", "throughput": 27141.17, "total_tokens": 4914217088} +{"current_steps": 18260, "total_steps": 25209, "loss": 0.9328, "lr": 2.9743468345118563e-05, "epoch": 2.1730347274390653, "percentage": 72.43, "elapsed_time": "2 days, 2:19:15", "remaining_time": "19:09:00", "throughput": 27141.83, "total_tokens": 4916899328} +{"current_steps": 18270, "total_steps": 25209, "loss": 0.9135, "lr": 2.9738207087343844e-05, "epoch": 2.174224787462718, "percentage": 72.47, "elapsed_time": "2 days, 2:20:51", "remaining_time": "19:07:20", "throughput": 27142.24, "total_tokens": 4919584576} +{"current_steps": 18280, "total_steps": 25209, "loss": 0.9253, "lr": 2.9732948620539287e-05, "epoch": 2.17541484748637, "percentage": 72.51, "elapsed_time": "2 days, 2:22:28", "remaining_time": "19:05:39", "throughput": 27142.57, "total_tokens": 4922254080} +{"current_steps": 18290, "total_steps": 25209, "loss": 0.9199, "lr": 2.9727692942238188e-05, "epoch": 2.1766049075100224, "percentage": 72.55, "elapsed_time": "2 days, 2:24:09", "remaining_time": "19:04:01", "throughput": 27142.47, "total_tokens": 4924974976} +{"current_steps": 18300, "total_steps": 25209, "loss": 0.9196, "lr": 2.97224400499769e-05, "epoch": 2.177794967533675, "percentage": 72.59, "elapsed_time": "2 days, 2:25:40", "remaining_time": "19:02:18", "throughput": 27143.17, "total_tokens": 4927585024} +{"current_steps": 18310, "total_steps": 25209, "loss": 0.921, "lr": 2.9717189941294826e-05, "epoch": 2.1789850275573275, "percentage": 72.63, "elapsed_time": "2 days, 2:27:14", "remaining_time": "19:00:37", "throughput": 27143.7, "total_tokens": 4930225088} +{"current_steps": 18320, "total_steps": 25209, "loss": 0.9287, "lr": 2.97119426137344e-05, "epoch": 2.18017508758098, "percentage": 72.67, "elapsed_time": "2 days, 2:28:48", "remaining_time": "18:58:56", "throughput": 27144.44, "total_tokens": 4932930176} +{"current_steps": 18330, "total_steps": 25209, "loss": 0.9328, "lr": 2.9706698064841103e-05, "epoch": 2.1813651476046325, "percentage": 72.71, "elapsed_time": "2 days, 2:30:23", "remaining_time": "18:57:15", "throughput": 27145.04, "total_tokens": 4935600192} +{"current_steps": 18340, "total_steps": 25209, "loss": 0.9236, "lr": 2.970145629216345e-05, "epoch": 2.1825552076282846, "percentage": 72.75, "elapsed_time": "2 days, 2:32:01", "remaining_time": "18:55:36", "throughput": 27145.23, "total_tokens": 4938295616} +{"current_steps": 18350, "total_steps": 25209, "loss": 0.9128, "lr": 2.969621729325296e-05, "epoch": 2.183745267651937, "percentage": 72.79, "elapsed_time": "2 days, 2:33:38", "remaining_time": "18:53:56", "throughput": 27145.54, "total_tokens": 4940979776} +{"current_steps": 18360, "total_steps": 25209, "loss": 0.9216, "lr": 2.969098106566421e-05, "epoch": 2.1849353276755896, "percentage": 72.83, "elapsed_time": "2 days, 2:35:15", "remaining_time": "18:52:16", "throughput": 27145.94, "total_tokens": 4943701312} +{"current_steps": 18370, "total_steps": 25209, "loss": 0.919, "lr": 2.968574760695476e-05, "epoch": 2.186125387699242, "percentage": 72.87, "elapsed_time": "2 days, 2:36:48", "remaining_time": "18:50:34", "throughput": 27146.53, "total_tokens": 4946335488} +{"current_steps": 18380, "total_steps": 25209, "loss": 0.9118, "lr": 2.9680516914685206e-05, "epoch": 2.1873154477228947, "percentage": 72.91, "elapsed_time": "2 days, 2:38:23", "remaining_time": "18:48:54", "throughput": 27147.01, "total_tokens": 4949008128} +{"current_steps": 18390, "total_steps": 25209, "loss": 0.9187, "lr": 2.9675288986419148e-05, "epoch": 2.188505507746547, "percentage": 72.95, "elapsed_time": "2 days, 2:39:59", "remaining_time": "18:47:13", "throughput": 27147.46, "total_tokens": 4951690432} +{"current_steps": 18400, "total_steps": 25209, "loss": 0.9159, "lr": 2.967006381972317e-05, "epoch": 2.1896955677701992, "percentage": 72.99, "elapsed_time": "2 days, 2:41:35", "remaining_time": "18:45:33", "throughput": 27148.1, "total_tokens": 4954411136} +{"current_steps": 18410, "total_steps": 25209, "loss": 0.9177, "lr": 2.9664841412166882e-05, "epoch": 2.1908856277938518, "percentage": 73.03, "elapsed_time": "2 days, 2:43:14", "remaining_time": "18:43:53", "throughput": 27148.33, "total_tokens": 4957128640} +{"current_steps": 18420, "total_steps": 25209, "loss": 0.9204, "lr": 2.965962176132287e-05, "epoch": 2.1920756878175043, "percentage": 73.07, "elapsed_time": "2 days, 2:44:53", "remaining_time": "18:42:14", "throughput": 27148.41, "total_tokens": 4959836096} +{"current_steps": 18430, "total_steps": 25209, "loss": 0.9192, "lr": 2.9654404864766706e-05, "epoch": 2.193265747841157, "percentage": 73.11, "elapsed_time": "2 days, 2:46:27", "remaining_time": "18:40:33", "throughput": 27148.8, "total_tokens": 4962468480} +{"current_steps": 18440, "total_steps": 25209, "loss": 0.9191, "lr": 2.9649190720076962e-05, "epoch": 2.1944558078648093, "percentage": 73.15, "elapsed_time": "2 days, 2:48:07", "remaining_time": "18:38:54", "throughput": 27148.82, "total_tokens": 4965182784} +{"current_steps": 18450, "total_steps": 25209, "loss": 0.9165, "lr": 2.9643979324835176e-05, "epoch": 2.1956458678884614, "percentage": 73.19, "elapsed_time": "2 days, 2:49:47", "remaining_time": "18:37:15", "throughput": 27148.81, "total_tokens": 4967891776} +{"current_steps": 18460, "total_steps": 25209, "loss": 0.9159, "lr": 2.9638770676625866e-05, "epoch": 2.196835927912114, "percentage": 73.23, "elapsed_time": "2 days, 2:51:22", "remaining_time": "18:35:35", "throughput": 27149.27, "total_tokens": 4970558336} +{"current_steps": 18470, "total_steps": 25209, "loss": 0.9174, "lr": 2.9633564773036517e-05, "epoch": 2.1980259879357664, "percentage": 73.27, "elapsed_time": "2 days, 2:53:00", "remaining_time": "18:33:55", "throughput": 27149.45, "total_tokens": 4973251328} +{"current_steps": 18480, "total_steps": 25209, "loss": 0.9311, "lr": 2.9628361611657578e-05, "epoch": 2.199216047959419, "percentage": 73.31, "elapsed_time": "2 days, 2:54:32", "remaining_time": "18:32:13", "throughput": 27150.24, "total_tokens": 4975887808} +{"current_steps": 18490, "total_steps": 25209, "loss": 0.9298, "lr": 2.9623161190082472e-05, "epoch": 2.2004061079830715, "percentage": 73.35, "elapsed_time": "2 days, 2:56:08", "remaining_time": "18:30:33", "throughput": 27150.72, "total_tokens": 4978595840} +{"current_steps": 18500, "total_steps": 25209, "loss": 0.9102, "lr": 2.9617963505907554e-05, "epoch": 2.201596168006724, "percentage": 73.39, "elapsed_time": "2 days, 2:57:41", "remaining_time": "18:28:51", "throughput": 27151.52, "total_tokens": 4981245824} +{"current_steps": 18510, "total_steps": 25209, "loss": 0.9244, "lr": 2.9612768556732145e-05, "epoch": 2.2027862280303765, "percentage": 73.43, "elapsed_time": "2 days, 2:59:14", "remaining_time": "18:27:10", "throughput": 27152.37, "total_tokens": 4983950784} +{"current_steps": 18520, "total_steps": 25209, "loss": 0.9402, "lr": 2.960757634015852e-05, "epoch": 2.2039762880540286, "percentage": 73.47, "elapsed_time": "2 days, 3:00:51", "remaining_time": "18:25:30", "throughput": 27152.83, "total_tokens": 4986650112} +{"current_steps": 18530, "total_steps": 25209, "loss": 0.9291, "lr": 2.9602386853791885e-05, "epoch": 2.205166348077681, "percentage": 73.51, "elapsed_time": "2 days, 3:02:26", "remaining_time": "18:23:50", "throughput": 27153.24, "total_tokens": 4989323072} +{"current_steps": 18540, "total_steps": 25209, "loss": 0.9126, "lr": 2.959720009524038e-05, "epoch": 2.2063564081013336, "percentage": 73.55, "elapsed_time": "2 days, 3:04:05", "remaining_time": "18:22:10", "throughput": 27153.39, "total_tokens": 4992020160} +{"current_steps": 18550, "total_steps": 25209, "loss": 0.9335, "lr": 2.9592016062115085e-05, "epoch": 2.207546468124986, "percentage": 73.58, "elapsed_time": "2 days, 3:05:38", "remaining_time": "18:20:29", "throughput": 27154.2, "total_tokens": 4994696768} +{"current_steps": 18560, "total_steps": 25209, "loss": 0.9134, "lr": 2.9586834752030002e-05, "epoch": 2.2087365281486386, "percentage": 73.62, "elapsed_time": "2 days, 3:07:15", "remaining_time": "18:18:49", "throughput": 27154.37, "total_tokens": 4997376512} +{"current_steps": 18570, "total_steps": 25209, "loss": 0.9092, "lr": 2.958165616260206e-05, "epoch": 2.2099265881722907, "percentage": 73.66, "elapsed_time": "2 days, 3:08:53", "remaining_time": "18:17:10", "throughput": 27154.64, "total_tokens": 5000089792} +{"current_steps": 18580, "total_steps": 25209, "loss": 0.9187, "lr": 2.9576480291451114e-05, "epoch": 2.2111166481959432, "percentage": 73.7, "elapsed_time": "2 days, 3:10:30", "remaining_time": "18:15:30", "throughput": 27155.19, "total_tokens": 5002821184} +{"current_steps": 18590, "total_steps": 25209, "loss": 0.9156, "lr": 2.957130713619991e-05, "epoch": 2.2123067082195957, "percentage": 73.74, "elapsed_time": "2 days, 3:12:06", "remaining_time": "18:13:49", "throughput": 27155.63, "total_tokens": 5005505216} +{"current_steps": 18600, "total_steps": 25209, "loss": 0.9242, "lr": 2.9566136694474138e-05, "epoch": 2.2134967682432483, "percentage": 73.78, "elapsed_time": "2 days, 3:13:41", "remaining_time": "18:12:09", "throughput": 27156.0, "total_tokens": 5008157440} +{"current_steps": 18610, "total_steps": 25209, "loss": 0.9298, "lr": 2.9560968963902365e-05, "epoch": 2.2146868282669008, "percentage": 73.82, "elapsed_time": "2 days, 3:15:19", "remaining_time": "18:10:29", "throughput": 27156.58, "total_tokens": 5010917632} +{"current_steps": 18620, "total_steps": 25209, "loss": 0.9182, "lr": 2.9555803942116062e-05, "epoch": 2.2158768882905533, "percentage": 73.86, "elapsed_time": "2 days, 3:16:56", "remaining_time": "18:08:49", "throughput": 27156.87, "total_tokens": 5013608640} +{"current_steps": 18630, "total_steps": 25209, "loss": 0.9105, "lr": 2.955064162674961e-05, "epoch": 2.217066948314206, "percentage": 73.9, "elapsed_time": "2 days, 3:18:32", "remaining_time": "18:07:09", "throughput": 27157.15, "total_tokens": 5016272704} +{"current_steps": 18640, "total_steps": 25209, "loss": 0.9263, "lr": 2.9545482015440266e-05, "epoch": 2.218257008337858, "percentage": 73.94, "elapsed_time": "2 days, 3:20:10", "remaining_time": "18:05:29", "throughput": 27157.31, "total_tokens": 5018960320} +{"current_steps": 18650, "total_steps": 25209, "loss": 0.9194, "lr": 2.954032510582819e-05, "epoch": 2.2194470683615104, "percentage": 73.98, "elapsed_time": "2 days, 3:21:43", "remaining_time": "18:03:48", "throughput": 27158.0, "total_tokens": 5021610624} +{"current_steps": 18660, "total_steps": 25209, "loss": 0.9263, "lr": 2.95351708955564e-05, "epoch": 2.220637128385163, "percentage": 74.02, "elapsed_time": "2 days, 3:23:21", "remaining_time": "18:02:09", "throughput": 27157.99, "total_tokens": 5024280704} +{"current_steps": 18670, "total_steps": 25209, "loss": 0.9231, "lr": 2.9530019382270823e-05, "epoch": 2.2218271884088154, "percentage": 74.06, "elapsed_time": "2 days, 3:24:58", "remaining_time": "18:00:28", "throughput": 27158.22, "total_tokens": 5026932928} +{"current_steps": 18680, "total_steps": 25209, "loss": 0.9332, "lr": 2.9524870563620233e-05, "epoch": 2.223017248432468, "percentage": 74.1, "elapsed_time": "2 days, 3:26:39", "remaining_time": "17:58:50", "throughput": 27158.14, "total_tokens": 5029663488} +{"current_steps": 18690, "total_steps": 25209, "loss": 0.9383, "lr": 2.9519724437256287e-05, "epoch": 2.22420730845612, "percentage": 74.14, "elapsed_time": "2 days, 3:28:17", "remaining_time": "17:57:10", "throughput": 27158.24, "total_tokens": 5032345920} +{"current_steps": 18700, "total_steps": 25209, "loss": 0.9208, "lr": 2.9514581000833496e-05, "epoch": 2.2253973684797725, "percentage": 74.18, "elapsed_time": "2 days, 3:29:50", "remaining_time": "17:55:29", "throughput": 27158.71, "total_tokens": 5034979776} +{"current_steps": 18710, "total_steps": 25209, "loss": 0.9182, "lr": 2.950944025200924e-05, "epoch": 2.226587428503425, "percentage": 74.22, "elapsed_time": "2 days, 3:31:26", "remaining_time": "17:53:49", "throughput": 27159.02, "total_tokens": 5037629440} +{"current_steps": 18720, "total_steps": 25209, "loss": 0.9153, "lr": 2.950430218844375e-05, "epoch": 2.2277774885270776, "percentage": 74.26, "elapsed_time": "2 days, 3:33:01", "remaining_time": "17:52:08", "throughput": 27159.62, "total_tokens": 5040323776} +{"current_steps": 18730, "total_steps": 25209, "loss": 0.9174, "lr": 2.9499166807800106e-05, "epoch": 2.22896754855073, "percentage": 74.3, "elapsed_time": "2 days, 3:34:39", "remaining_time": "17:50:29", "throughput": 27160.1, "total_tokens": 5043060800} +{"current_steps": 18740, "total_steps": 25209, "loss": 0.9121, "lr": 2.949403410774424e-05, "epoch": 2.2301576085743826, "percentage": 74.34, "elapsed_time": "2 days, 3:36:14", "remaining_time": "17:48:49", "throughput": 27160.44, "total_tokens": 5045728320} +{"current_steps": 18750, "total_steps": 25209, "loss": 0.9238, "lr": 2.948890408594492e-05, "epoch": 2.231347668598035, "percentage": 74.38, "elapsed_time": "2 days, 3:37:47", "remaining_time": "17:47:07", "throughput": 27161.11, "total_tokens": 5048362048} +{"current_steps": 18760, "total_steps": 25209, "loss": 0.9188, "lr": 2.9483776740073748e-05, "epoch": 2.232537728621687, "percentage": 74.42, "elapsed_time": "2 days, 3:39:28", "remaining_time": "17:45:28", "throughput": 27161.21, "total_tokens": 5051117376} +{"current_steps": 18770, "total_steps": 25209, "loss": 0.9192, "lr": 2.947865206780518e-05, "epoch": 2.2337277886453397, "percentage": 74.46, "elapsed_time": "2 days, 3:41:05", "remaining_time": "17:43:49", "throughput": 27161.58, "total_tokens": 5053842880} +{"current_steps": 18780, "total_steps": 25209, "loss": 0.9224, "lr": 2.947353006681647e-05, "epoch": 2.2349178486689922, "percentage": 74.5, "elapsed_time": "2 days, 3:42:37", "remaining_time": "17:42:07", "throughput": 27162.46, "total_tokens": 5056496960} +{"current_steps": 18790, "total_steps": 25209, "loss": 0.9163, "lr": 2.9468410734787717e-05, "epoch": 2.2361079086926448, "percentage": 74.54, "elapsed_time": "2 days, 3:44:11", "remaining_time": "17:40:26", "throughput": 27163.05, "total_tokens": 5059166464} +{"current_steps": 18800, "total_steps": 25209, "loss": 0.9366, "lr": 2.9463294069401838e-05, "epoch": 2.2372979687162973, "percentage": 74.58, "elapsed_time": "2 days, 3:45:50", "remaining_time": "17:38:47", "throughput": 27163.31, "total_tokens": 5061883392} +{"current_steps": 18810, "total_steps": 25209, "loss": 0.9207, "lr": 2.9458180068344555e-05, "epoch": 2.2384880287399493, "percentage": 74.62, "elapsed_time": "2 days, 3:47:27", "remaining_time": "17:37:07", "throughput": 27163.62, "total_tokens": 5064598336} +{"current_steps": 18820, "total_steps": 25209, "loss": 0.9151, "lr": 2.9453068729304407e-05, "epoch": 2.239678088763602, "percentage": 74.66, "elapsed_time": "2 days, 3:49:07", "remaining_time": "17:35:29", "throughput": 27163.79, "total_tokens": 5067347904} +{"current_steps": 18830, "total_steps": 25209, "loss": 0.9184, "lr": 2.944796004997274e-05, "epoch": 2.2408681487872544, "percentage": 74.7, "elapsed_time": "2 days, 3:50:44", "remaining_time": "17:33:49", "throughput": 27164.05, "total_tokens": 5070019200} +{"current_steps": 18840, "total_steps": 25209, "loss": 0.9068, "lr": 2.94428540280437e-05, "epoch": 2.242058208810907, "percentage": 74.74, "elapsed_time": "2 days, 3:52:15", "remaining_time": "17:32:07", "throughput": 27164.94, "total_tokens": 5072665920} +{"current_steps": 18850, "total_steps": 25209, "loss": 0.9144, "lr": 2.9437750661214242e-05, "epoch": 2.2432482688345594, "percentage": 74.77, "elapsed_time": "2 days, 3:53:51", "remaining_time": "17:30:27", "throughput": 27165.53, "total_tokens": 5075368256} +{"current_steps": 18860, "total_steps": 25209, "loss": 0.9198, "lr": 2.9432649947184094e-05, "epoch": 2.244438328858212, "percentage": 74.81, "elapsed_time": "2 days, 3:55:28", "remaining_time": "17:28:47", "throughput": 27165.73, "total_tokens": 5078055680} +{"current_steps": 18870, "total_steps": 25209, "loss": 0.9238, "lr": 2.942755188365579e-05, "epoch": 2.2456283888818644, "percentage": 74.85, "elapsed_time": "2 days, 3:57:06", "remaining_time": "17:27:07", "throughput": 27166.03, "total_tokens": 5080764288} +{"current_steps": 18880, "total_steps": 25209, "loss": 0.9264, "lr": 2.9422456468334635e-05, "epoch": 2.2468184489055165, "percentage": 74.89, "elapsed_time": "2 days, 3:58:44", "remaining_time": "17:25:28", "throughput": 27166.22, "total_tokens": 5083468096} +{"current_steps": 18890, "total_steps": 25209, "loss": 0.9266, "lr": 2.9417363698928734e-05, "epoch": 2.248008508929169, "percentage": 74.93, "elapsed_time": "2 days, 4:00:16", "remaining_time": "17:23:46", "throughput": 27167.05, "total_tokens": 5086111424} +{"current_steps": 18900, "total_steps": 25209, "loss": 0.9248, "lr": 2.9412273573148946e-05, "epoch": 2.2491985689528216, "percentage": 74.97, "elapsed_time": "2 days, 4:01:56", "remaining_time": "17:22:07", "throughput": 27167.08, "total_tokens": 5088833600} +{"current_steps": 18910, "total_steps": 25209, "loss": 0.9316, "lr": 2.940718608870891e-05, "epoch": 2.250388628976474, "percentage": 75.01, "elapsed_time": "2 days, 4:03:30", "remaining_time": "17:20:27", "throughput": 27167.66, "total_tokens": 5091508736} +{"current_steps": 18920, "total_steps": 25209, "loss": 0.9297, "lr": 2.940210124332504e-05, "epoch": 2.2515786890001266, "percentage": 75.05, "elapsed_time": "2 days, 4:05:05", "remaining_time": "17:18:46", "throughput": 27168.16, "total_tokens": 5094174208} +{"current_steps": 18930, "total_steps": 25209, "loss": 0.9178, "lr": 2.9397019034716504e-05, "epoch": 2.2527687490237787, "percentage": 75.09, "elapsed_time": "2 days, 4:06:45", "remaining_time": "17:17:08", "throughput": 27167.94, "total_tokens": 5096866816} +{"current_steps": 18940, "total_steps": 25209, "loss": 0.9338, "lr": 2.9391939460605233e-05, "epoch": 2.253958809047431, "percentage": 75.13, "elapsed_time": "2 days, 4:08:23", "remaining_time": "17:15:28", "throughput": 27168.3, "total_tokens": 5099583104} +{"current_steps": 18950, "total_steps": 25209, "loss": 0.9314, "lr": 2.9386862518715914e-05, "epoch": 2.2551488690710837, "percentage": 75.17, "elapsed_time": "2 days, 4:09:59", "remaining_time": "17:13:48", "throughput": 27168.57, "total_tokens": 5102233024} +{"current_steps": 18960, "total_steps": 25209, "loss": 0.9251, "lr": 2.9381788206775966e-05, "epoch": 2.256338929094736, "percentage": 75.21, "elapsed_time": "2 days, 4:11:33", "remaining_time": "17:12:07", "throughput": 27169.12, "total_tokens": 5104897216} +{"current_steps": 18970, "total_steps": 25209, "loss": 0.9359, "lr": 2.937671652251559e-05, "epoch": 2.2575289891183887, "percentage": 75.25, "elapsed_time": "2 days, 4:13:14", "remaining_time": "17:10:29", "throughput": 27169.03, "total_tokens": 5107639168} +{"current_steps": 18980, "total_steps": 25209, "loss": 0.929, "lr": 2.9371647463667696e-05, "epoch": 2.2587190491420412, "percentage": 75.29, "elapsed_time": "2 days, 4:14:50", "remaining_time": "17:08:48", "throughput": 27169.49, "total_tokens": 5110319552} +{"current_steps": 18990, "total_steps": 25209, "loss": 0.9379, "lr": 2.9366581027967943e-05, "epoch": 2.2599091091656938, "percentage": 75.33, "elapsed_time": "2 days, 4:16:28", "remaining_time": "17:07:09", "throughput": 27169.67, "total_tokens": 5113024384} +{"current_steps": 19000, "total_steps": 25209, "loss": 0.9108, "lr": 2.9361517213154726e-05, "epoch": 2.261099169189346, "percentage": 75.37, "elapsed_time": "2 days, 4:18:03", "remaining_time": "17:05:29", "throughput": 27170.38, "total_tokens": 5115738688} +{"current_steps": 19010, "total_steps": 25209, "loss": 0.9221, "lr": 2.935645601696917e-05, "epoch": 2.2622892292129984, "percentage": 75.41, "elapsed_time": "2 days, 4:19:40", "remaining_time": "17:03:49", "throughput": 27170.72, "total_tokens": 5118441088} +{"current_steps": 19020, "total_steps": 25209, "loss": 0.9161, "lr": 2.9351397437155114e-05, "epoch": 2.263479289236651, "percentage": 75.45, "elapsed_time": "2 days, 4:21:13", "remaining_time": "17:02:08", "throughput": 27171.44, "total_tokens": 5121086016} +{"current_steps": 19030, "total_steps": 25209, "loss": 0.9257, "lr": 2.934634147145913e-05, "epoch": 2.2646693492603034, "percentage": 75.49, "elapsed_time": "2 days, 4:22:47", "remaining_time": "17:00:27", "throughput": 27171.87, "total_tokens": 5123741888} +{"current_steps": 19040, "total_steps": 25209, "loss": 0.9316, "lr": 2.9341288117630495e-05, "epoch": 2.265859409283956, "percentage": 75.53, "elapsed_time": "2 days, 4:24:28", "remaining_time": "16:58:49", "throughput": 27171.78, "total_tokens": 5126461696} +{"current_steps": 19050, "total_steps": 25209, "loss": 0.9229, "lr": 2.933623737342121e-05, "epoch": 2.267049469307608, "percentage": 75.57, "elapsed_time": "2 days, 4:26:03", "remaining_time": "16:57:08", "throughput": 27172.49, "total_tokens": 5129170368} +{"current_steps": 19060, "total_steps": 25209, "loss": 0.9233, "lr": 2.9331189236585977e-05, "epoch": 2.2682395293312605, "percentage": 75.61, "elapsed_time": "2 days, 4:27:43", "remaining_time": "16:55:29", "throughput": 27172.67, "total_tokens": 5131926336} +{"current_steps": 19070, "total_steps": 25209, "loss": 0.9259, "lr": 2.9326143704882192e-05, "epoch": 2.269429589354913, "percentage": 75.65, "elapsed_time": "2 days, 4:29:20", "remaining_time": "16:53:50", "throughput": 27172.75, "total_tokens": 5134583360} +{"current_steps": 19080, "total_steps": 25209, "loss": 0.9316, "lr": 2.932110077606997e-05, "epoch": 2.2706196493785655, "percentage": 75.69, "elapsed_time": "2 days, 4:31:01", "remaining_time": "16:52:11", "throughput": 27172.74, "total_tokens": 5137320128} +{"current_steps": 19090, "total_steps": 25209, "loss": 0.9104, "lr": 2.931606044791212e-05, "epoch": 2.271809709402218, "percentage": 75.73, "elapsed_time": "2 days, 4:32:39", "remaining_time": "16:50:32", "throughput": 27172.99, "total_tokens": 5140026048} +{"current_steps": 19100, "total_steps": 25209, "loss": 0.9174, "lr": 2.9311022718174114e-05, "epoch": 2.2729997694258706, "percentage": 75.77, "elapsed_time": "2 days, 4:34:12", "remaining_time": "16:48:51", "throughput": 27173.57, "total_tokens": 5142672640} +{"current_steps": 19110, "total_steps": 25209, "loss": 0.9337, "lr": 2.930598758462415e-05, "epoch": 2.274189829449523, "percentage": 75.81, "elapsed_time": "2 days, 4:35:47", "remaining_time": "16:47:10", "throughput": 27174.06, "total_tokens": 5145338880} +{"current_steps": 19120, "total_steps": 25209, "loss": 0.9296, "lr": 2.9300955045033072e-05, "epoch": 2.275379889473175, "percentage": 75.85, "elapsed_time": "2 days, 4:37:21", "remaining_time": "16:45:30", "throughput": 27174.75, "total_tokens": 5148033216} +{"current_steps": 19130, "total_steps": 25209, "loss": 0.9341, "lr": 2.9295925097174435e-05, "epoch": 2.2765699494968277, "percentage": 75.89, "elapsed_time": "2 days, 4:39:01", "remaining_time": "16:43:51", "throughput": 27174.79, "total_tokens": 5150761280} +{"current_steps": 19140, "total_steps": 25209, "loss": 0.9308, "lr": 2.929089773882445e-05, "epoch": 2.27776000952048, "percentage": 75.93, "elapsed_time": "2 days, 4:40:39", "remaining_time": "16:42:11", "throughput": 27174.84, "total_tokens": 5153422144} +{"current_steps": 19150, "total_steps": 25209, "loss": 0.936, "lr": 2.9285872967762007e-05, "epoch": 2.2789500695441327, "percentage": 75.96, "elapsed_time": "2 days, 4:42:16", "remaining_time": "16:40:31", "throughput": 27175.17, "total_tokens": 5156110208} +{"current_steps": 19160, "total_steps": 25209, "loss": 0.9237, "lr": 2.9280850781768638e-05, "epoch": 2.2801401295677852, "percentage": 76.0, "elapsed_time": "2 days, 4:43:56", "remaining_time": "16:38:53", "throughput": 27175.16, "total_tokens": 5158827840} +{"current_steps": 19170, "total_steps": 25209, "loss": 0.9117, "lr": 2.9275831178628576e-05, "epoch": 2.2813301895914373, "percentage": 76.04, "elapsed_time": "2 days, 4:45:33", "remaining_time": "16:37:13", "throughput": 27175.74, "total_tokens": 5161579392} +{"current_steps": 19180, "total_steps": 25209, "loss": 0.9182, "lr": 2.927081415612869e-05, "epoch": 2.28252024961509, "percentage": 76.08, "elapsed_time": "2 days, 4:47:11", "remaining_time": "16:35:34", "throughput": 27175.76, "total_tokens": 5164244544} +{"current_steps": 19190, "total_steps": 25209, "loss": 0.9285, "lr": 2.9265799712058505e-05, "epoch": 2.2837103096387423, "percentage": 76.12, "elapsed_time": "2 days, 4:48:43", "remaining_time": "16:33:52", "throughput": 27176.44, "total_tokens": 5166879680} +{"current_steps": 19200, "total_steps": 25209, "loss": 0.9174, "lr": 2.926078784421019e-05, "epoch": 2.284900369662395, "percentage": 76.16, "elapsed_time": "2 days, 4:50:19", "remaining_time": "16:32:12", "throughput": 27176.79, "total_tokens": 5169559104} +{"current_steps": 19210, "total_steps": 25209, "loss": 0.9175, "lr": 2.9255778550378575e-05, "epoch": 2.2860904296860474, "percentage": 76.2, "elapsed_time": "2 days, 4:51:54", "remaining_time": "16:30:32", "throughput": 27177.06, "total_tokens": 5172192320} +{"current_steps": 19220, "total_steps": 25209, "loss": 0.9261, "lr": 2.9250771828361118e-05, "epoch": 2.2872804897097, "percentage": 76.24, "elapsed_time": "2 days, 4:53:30", "remaining_time": "16:28:52", "throughput": 27177.89, "total_tokens": 5174942528} +{"current_steps": 19230, "total_steps": 25209, "loss": 0.9284, "lr": 2.9245767675957923e-05, "epoch": 2.2884705497333524, "percentage": 76.28, "elapsed_time": "2 days, 4:55:07", "remaining_time": "16:27:12", "throughput": 27178.14, "total_tokens": 5177640128} +{"current_steps": 19240, "total_steps": 25209, "loss": 0.9017, "lr": 2.924076609097172e-05, "epoch": 2.2896606097570045, "percentage": 76.32, "elapsed_time": "2 days, 4:56:48", "remaining_time": "16:25:34", "throughput": 27178.14, "total_tokens": 5180374912} +{"current_steps": 19250, "total_steps": 25209, "loss": 0.9129, "lr": 2.9235767071207876e-05, "epoch": 2.290850669780657, "percentage": 76.36, "elapsed_time": "2 days, 4:58:19", "remaining_time": "16:23:52", "throughput": 27178.96, "total_tokens": 5183005504} +{"current_steps": 19260, "total_steps": 25209, "loss": 0.9244, "lr": 2.9230770614474383e-05, "epoch": 2.2920407298043095, "percentage": 76.4, "elapsed_time": "2 days, 4:59:53", "remaining_time": "16:22:12", "throughput": 27179.49, "total_tokens": 5185679104} +{"current_steps": 19270, "total_steps": 25209, "loss": 0.9128, "lr": 2.9225776718581842e-05, "epoch": 2.293230789827962, "percentage": 76.44, "elapsed_time": "2 days, 5:01:28", "remaining_time": "16:20:31", "throughput": 27179.92, "total_tokens": 5188342400} +{"current_steps": 19280, "total_steps": 25209, "loss": 0.919, "lr": 2.9220785381343495e-05, "epoch": 2.2944208498516145, "percentage": 76.48, "elapsed_time": "2 days, 5:03:08", "remaining_time": "16:18:52", "throughput": 27179.93, "total_tokens": 5191047168} +{"current_steps": 19290, "total_steps": 25209, "loss": 0.9252, "lr": 2.9215796600575174e-05, "epoch": 2.2956109098752666, "percentage": 76.52, "elapsed_time": "2 days, 5:04:44", "remaining_time": "16:17:12", "throughput": 27180.22, "total_tokens": 5193712896} +{"current_steps": 19300, "total_steps": 25209, "loss": 0.906, "lr": 2.9210810374095332e-05, "epoch": 2.296800969898919, "percentage": 76.56, "elapsed_time": "2 days, 5:06:18", "remaining_time": "16:15:32", "throughput": 27180.89, "total_tokens": 5196407616} +{"current_steps": 19310, "total_steps": 25209, "loss": 0.9253, "lr": 2.9205826699725026e-05, "epoch": 2.2979910299225716, "percentage": 76.6, "elapsed_time": "2 days, 5:07:53", "remaining_time": "16:13:51", "throughput": 27181.53, "total_tokens": 5199097280} +{"current_steps": 19320, "total_steps": 25209, "loss": 0.9129, "lr": 2.920084557528791e-05, "epoch": 2.299181089946224, "percentage": 76.64, "elapsed_time": "2 days, 5:09:33", "remaining_time": "16:12:13", "throughput": 27181.45, "total_tokens": 5201819904} +{"current_steps": 19330, "total_steps": 25209, "loss": 0.9144, "lr": 2.9195866998610245e-05, "epoch": 2.3003711499698767, "percentage": 76.68, "elapsed_time": "2 days, 5:11:08", "remaining_time": "16:10:33", "throughput": 27182.05, "total_tokens": 5204512640} +{"current_steps": 19340, "total_steps": 25209, "loss": 0.9258, "lr": 2.9190890967520878e-05, "epoch": 2.301561209993529, "percentage": 76.72, "elapsed_time": "2 days, 5:12:42", "remaining_time": "16:08:52", "throughput": 27182.65, "total_tokens": 5207168448} +{"current_steps": 19350, "total_steps": 25209, "loss": 0.9243, "lr": 2.9185917479851243e-05, "epoch": 2.3027512700171817, "percentage": 76.76, "elapsed_time": "2 days, 5:14:20", "remaining_time": "16:07:13", "throughput": 27182.82, "total_tokens": 5209885440} +{"current_steps": 19360, "total_steps": 25209, "loss": 0.9219, "lr": 2.9180946533435366e-05, "epoch": 2.303941330040834, "percentage": 76.8, "elapsed_time": "2 days, 5:15:57", "remaining_time": "16:05:33", "throughput": 27183.28, "total_tokens": 5212583424} +{"current_steps": 19370, "total_steps": 25209, "loss": 0.9232, "lr": 2.9175978126109853e-05, "epoch": 2.3051313900644863, "percentage": 76.84, "elapsed_time": "2 days, 5:17:35", "remaining_time": "16:03:53", "throughput": 27183.56, "total_tokens": 5215315136} +{"current_steps": 19380, "total_steps": 25209, "loss": 0.9362, "lr": 2.9171012255713885e-05, "epoch": 2.306321450088139, "percentage": 76.88, "elapsed_time": "2 days, 5:19:08", "remaining_time": "16:02:13", "throughput": 27184.26, "total_tokens": 5217974528} +{"current_steps": 19390, "total_steps": 25209, "loss": 0.9134, "lr": 2.9166048920089217e-05, "epoch": 2.3075115101117913, "percentage": 76.92, "elapsed_time": "2 days, 5:20:44", "remaining_time": "16:00:33", "throughput": 27184.82, "total_tokens": 5220683456} +{"current_steps": 19400, "total_steps": 25209, "loss": 0.9016, "lr": 2.9161088117080175e-05, "epoch": 2.308701570135444, "percentage": 76.96, "elapsed_time": "2 days, 5:22:18", "remaining_time": "15:58:52", "throughput": 27185.44, "total_tokens": 5223365056} +{"current_steps": 19410, "total_steps": 25209, "loss": 0.9141, "lr": 2.9156129844533658e-05, "epoch": 2.309891630159096, "percentage": 77.0, "elapsed_time": "2 days, 5:23:53", "remaining_time": "15:57:12", "throughput": 27185.82, "total_tokens": 5226011200} +{"current_steps": 19420, "total_steps": 25209, "loss": 0.9211, "lr": 2.9151174100299104e-05, "epoch": 2.3110816901827484, "percentage": 77.04, "elapsed_time": "2 days, 5:25:28", "remaining_time": "15:55:31", "throughput": 27186.31, "total_tokens": 5228689984} +{"current_steps": 19430, "total_steps": 25209, "loss": 0.9255, "lr": 2.9146220882228535e-05, "epoch": 2.312271750206401, "percentage": 77.08, "elapsed_time": "2 days, 5:27:07", "remaining_time": "15:53:53", "throughput": 27186.51, "total_tokens": 5231445504} +{"current_steps": 19440, "total_steps": 25209, "loss": 0.9147, "lr": 2.914127018817651e-05, "epoch": 2.3134618102300535, "percentage": 77.12, "elapsed_time": "2 days, 5:28:46", "remaining_time": "15:52:13", "throughput": 27186.69, "total_tokens": 5234145984} +{"current_steps": 19450, "total_steps": 25209, "loss": 0.9156, "lr": 2.9136322016000152e-05, "epoch": 2.314651870253706, "percentage": 77.15, "elapsed_time": "2 days, 5:30:19", "remaining_time": "15:50:33", "throughput": 27187.23, "total_tokens": 5236802688} +{"current_steps": 19460, "total_steps": 25209, "loss": 0.9171, "lr": 2.9131376363559116e-05, "epoch": 2.3158419302773585, "percentage": 77.19, "elapsed_time": "2 days, 5:31:59", "remaining_time": "15:48:54", "throughput": 27187.26, "total_tokens": 5239507904} +{"current_steps": 19470, "total_steps": 25209, "loss": 0.9153, "lr": 2.9126433228715606e-05, "epoch": 2.317031990301011, "percentage": 77.23, "elapsed_time": "2 days, 5:33:35", "remaining_time": "15:47:14", "throughput": 27187.64, "total_tokens": 5242197376} +{"current_steps": 19480, "total_steps": 25209, "loss": 0.9207, "lr": 2.9121492609334354e-05, "epoch": 2.318222050324663, "percentage": 77.27, "elapsed_time": "2 days, 5:35:12", "remaining_time": "15:45:34", "throughput": 27187.82, "total_tokens": 5244871488} +{"current_steps": 19490, "total_steps": 25209, "loss": 0.9117, "lr": 2.9116554503282656e-05, "epoch": 2.3194121103483156, "percentage": 77.31, "elapsed_time": "2 days, 5:36:51", "remaining_time": "15:43:55", "throughput": 27187.98, "total_tokens": 5247599616} +{"current_steps": 19500, "total_steps": 25209, "loss": 0.9298, "lr": 2.9111618908430303e-05, "epoch": 2.320602170371968, "percentage": 77.35, "elapsed_time": "2 days, 5:38:30", "remaining_time": "15:42:16", "throughput": 27188.15, "total_tokens": 5250311424} +{"current_steps": 19510, "total_steps": 25209, "loss": 0.9225, "lr": 2.9106685822649643e-05, "epoch": 2.3217922303956207, "percentage": 77.39, "elapsed_time": "2 days, 5:40:07", "remaining_time": "15:40:37", "throughput": 27188.42, "total_tokens": 5253010560} +{"current_steps": 19520, "total_steps": 25209, "loss": 0.9217, "lr": 2.910175524381552e-05, "epoch": 2.322982290419273, "percentage": 77.43, "elapsed_time": "2 days, 5:41:43", "remaining_time": "15:38:57", "throughput": 27188.91, "total_tokens": 5255698624} +{"current_steps": 19530, "total_steps": 25209, "loss": 0.9124, "lr": 2.9096827169805318e-05, "epoch": 2.3241723504429253, "percentage": 77.47, "elapsed_time": "2 days, 5:43:19", "remaining_time": "15:37:17", "throughput": 27189.25, "total_tokens": 5258384832} +{"current_steps": 19540, "total_steps": 25209, "loss": 0.9033, "lr": 2.9091901598498923e-05, "epoch": 2.3253624104665778, "percentage": 77.51, "elapsed_time": "2 days, 5:44:58", "remaining_time": "15:35:38", "throughput": 27189.52, "total_tokens": 5261129792} +{"current_steps": 19550, "total_steps": 25209, "loss": 0.9121, "lr": 2.9086978527778736e-05, "epoch": 2.3265524704902303, "percentage": 77.55, "elapsed_time": "2 days, 5:46:38", "remaining_time": "15:33:59", "throughput": 27189.53, "total_tokens": 5263863232} +{"current_steps": 19560, "total_steps": 25209, "loss": 0.9073, "lr": 2.9082057955529668e-05, "epoch": 2.327742530513883, "percentage": 77.59, "elapsed_time": "2 days, 5:48:16", "remaining_time": "15:32:20", "throughput": 27189.85, "total_tokens": 5266591168} +{"current_steps": 19570, "total_steps": 25209, "loss": 0.9316, "lr": 2.907713987963914e-05, "epoch": 2.3289325905375353, "percentage": 77.63, "elapsed_time": "2 days, 5:49:57", "remaining_time": "15:30:41", "throughput": 27189.93, "total_tokens": 5269345152} +{"current_steps": 19580, "total_steps": 25209, "loss": 0.925, "lr": 2.9072224297997058e-05, "epoch": 2.330122650561188, "percentage": 77.67, "elapsed_time": "2 days, 5:51:37", "remaining_time": "15:29:03", "throughput": 27190.11, "total_tokens": 5272108096} +{"current_steps": 19590, "total_steps": 25209, "loss": 0.932, "lr": 2.9067311208495834e-05, "epoch": 2.3313127105848404, "percentage": 77.71, "elapsed_time": "2 days, 5:53:10", "remaining_time": "15:27:22", "throughput": 27190.76, "total_tokens": 5274751104} +{"current_steps": 19600, "total_steps": 25209, "loss": 0.9296, "lr": 2.9062400609030372e-05, "epoch": 2.3325027706084924, "percentage": 77.75, "elapsed_time": "2 days, 5:54:44", "remaining_time": "15:25:41", "throughput": 27191.22, "total_tokens": 5277400320} +{"current_steps": 19610, "total_steps": 25209, "loss": 0.9209, "lr": 2.905749249749806e-05, "epoch": 2.333692830632145, "percentage": 77.79, "elapsed_time": "2 days, 5:56:19", "remaining_time": "15:24:01", "throughput": 27191.83, "total_tokens": 5280085824} +{"current_steps": 19620, "total_steps": 25209, "loss": 0.9215, "lr": 2.905258687179878e-05, "epoch": 2.3348828906557975, "percentage": 77.83, "elapsed_time": "2 days, 5:57:54", "remaining_time": "15:22:21", "throughput": 27192.18, "total_tokens": 5282752896} +{"current_steps": 19630, "total_steps": 25209, "loss": 0.9188, "lr": 2.904768372983488e-05, "epoch": 2.33607295067945, "percentage": 77.87, "elapsed_time": "2 days, 5:59:35", "remaining_time": "15:20:43", "throughput": 27191.98, "total_tokens": 5285466432} +{"current_steps": 19640, "total_steps": 25209, "loss": 0.9084, "lr": 2.90427830695112e-05, "epoch": 2.3372630107031025, "percentage": 77.91, "elapsed_time": "2 days, 6:01:10", "remaining_time": "15:19:02", "throughput": 27192.27, "total_tokens": 5288088896} +{"current_steps": 19650, "total_steps": 25209, "loss": 0.9154, "lr": 2.9037884888735044e-05, "epoch": 2.3384530707267546, "percentage": 77.95, "elapsed_time": "2 days, 6:02:50", "remaining_time": "15:17:24", "throughput": 27192.45, "total_tokens": 5290846080} +{"current_steps": 19660, "total_steps": 25209, "loss": 0.9234, "lr": 2.9032989185416194e-05, "epoch": 2.339643130750407, "percentage": 77.99, "elapsed_time": "2 days, 6:04:29", "remaining_time": "15:15:45", "throughput": 27192.34, "total_tokens": 5293511872} +{"current_steps": 19670, "total_steps": 25209, "loss": 0.9168, "lr": 2.9028095957466888e-05, "epoch": 2.3408331907740596, "percentage": 78.03, "elapsed_time": "2 days, 6:06:06", "remaining_time": "15:14:05", "throughput": 27192.86, "total_tokens": 5296249216} +{"current_steps": 19680, "total_steps": 25209, "loss": 0.9193, "lr": 2.9023205202801833e-05, "epoch": 2.342023250797712, "percentage": 78.07, "elapsed_time": "2 days, 6:07:45", "remaining_time": "15:12:26", "throughput": 27192.79, "total_tokens": 5298942144} +{"current_steps": 19690, "total_steps": 25209, "loss": 0.9291, "lr": 2.90183169193382e-05, "epoch": 2.3432133108213646, "percentage": 78.11, "elapsed_time": "2 days, 6:09:23", "remaining_time": "15:10:47", "throughput": 27192.92, "total_tokens": 5301621440} +{"current_steps": 19700, "total_steps": 25209, "loss": 0.9294, "lr": 2.90134311049956e-05, "epoch": 2.344403370845017, "percentage": 78.15, "elapsed_time": "2 days, 6:11:01", "remaining_time": "15:09:08", "throughput": 27193.04, "total_tokens": 5304328128} +{"current_steps": 19710, "total_steps": 25209, "loss": 0.9375, "lr": 2.90085477576961e-05, "epoch": 2.3455934308686697, "percentage": 78.19, "elapsed_time": "2 days, 6:12:35", "remaining_time": "15:07:27", "throughput": 27193.44, "total_tokens": 5306953664} +{"current_steps": 19720, "total_steps": 25209, "loss": 0.9205, "lr": 2.9003666875364226e-05, "epoch": 2.3467834908923217, "percentage": 78.23, "elapsed_time": "2 days, 6:14:12", "remaining_time": "15:05:48", "throughput": 27193.65, "total_tokens": 5309638976} +{"current_steps": 19730, "total_steps": 25209, "loss": 0.9293, "lr": 2.899878845592694e-05, "epoch": 2.3479735509159743, "percentage": 78.27, "elapsed_time": "2 days, 6:15:50", "remaining_time": "15:04:08", "throughput": 27193.92, "total_tokens": 5312346048} +{"current_steps": 19740, "total_steps": 25209, "loss": 0.9344, "lr": 2.8993912497313636e-05, "epoch": 2.349163610939627, "percentage": 78.31, "elapsed_time": "2 days, 6:17:24", "remaining_time": "15:02:28", "throughput": 27194.57, "total_tokens": 5315027840} +{"current_steps": 19750, "total_steps": 25209, "loss": 0.9232, "lr": 2.8989038997456153e-05, "epoch": 2.3503536709632793, "percentage": 78.35, "elapsed_time": "2 days, 6:19:02", "remaining_time": "15:00:48", "throughput": 27194.82, "total_tokens": 5317737024} +{"current_steps": 19760, "total_steps": 25209, "loss": 0.9208, "lr": 2.898416795428876e-05, "epoch": 2.351543730986932, "percentage": 78.38, "elapsed_time": "2 days, 6:20:42", "remaining_time": "14:59:10", "throughput": 27194.74, "total_tokens": 5320442176} +{"current_steps": 19770, "total_steps": 25209, "loss": 0.9137, "lr": 2.897929936574816e-05, "epoch": 2.352733791010584, "percentage": 78.42, "elapsed_time": "2 days, 6:22:15", "remaining_time": "14:57:29", "throughput": 27195.26, "total_tokens": 5323087616} +{"current_steps": 19780, "total_steps": 25209, "loss": 0.9179, "lr": 2.8974433229773478e-05, "epoch": 2.3539238510342364, "percentage": 78.46, "elapsed_time": "2 days, 6:23:50", "remaining_time": "14:55:49", "throughput": 27195.8, "total_tokens": 5325770432} +{"current_steps": 19790, "total_steps": 25209, "loss": 0.9183, "lr": 2.896956954430625e-05, "epoch": 2.355113911057889, "percentage": 78.5, "elapsed_time": "2 days, 6:25:26", "remaining_time": "14:54:09", "throughput": 27196.21, "total_tokens": 5328448256} +{"current_steps": 19800, "total_steps": 25209, "loss": 0.9234, "lr": 2.896470830729045e-05, "epoch": 2.3563039710815414, "percentage": 78.54, "elapsed_time": "2 days, 6:27:03", "remaining_time": "14:52:29", "throughput": 27196.43, "total_tokens": 5331131456} +{"current_steps": 19810, "total_steps": 25209, "loss": 0.9274, "lr": 2.895984951667245e-05, "epoch": 2.357494031105194, "percentage": 78.58, "elapsed_time": "2 days, 6:28:37", "remaining_time": "14:50:49", "throughput": 27196.9, "total_tokens": 5333800896} +{"current_steps": 19820, "total_steps": 25209, "loss": 0.92, "lr": 2.8954993170401047e-05, "epoch": 2.3586840911288465, "percentage": 78.62, "elapsed_time": "2 days, 6:30:18", "remaining_time": "14:49:11", "throughput": 27196.9, "total_tokens": 5336524544} +{"current_steps": 19830, "total_steps": 25209, "loss": 0.9251, "lr": 2.8950139266427423e-05, "epoch": 2.359874151152499, "percentage": 78.66, "elapsed_time": "2 days, 6:31:57", "remaining_time": "14:47:32", "throughput": 27197.03, "total_tokens": 5339241664} +{"current_steps": 19840, "total_steps": 25209, "loss": 0.9292, "lr": 2.8945287802705186e-05, "epoch": 2.361064211176151, "percentage": 78.7, "elapsed_time": "2 days, 6:33:36", "remaining_time": "14:45:53", "throughput": 27197.26, "total_tokens": 5341981056} +{"current_steps": 19850, "total_steps": 25209, "loss": 0.9201, "lr": 2.8940438777190336e-05, "epoch": 2.3622542711998036, "percentage": 78.74, "elapsed_time": "2 days, 6:35:12", "remaining_time": "14:44:13", "throughput": 27197.49, "total_tokens": 5344654272} +{"current_steps": 19860, "total_steps": 25209, "loss": 0.9255, "lr": 2.8935592187841265e-05, "epoch": 2.363444331223456, "percentage": 78.78, "elapsed_time": "2 days, 6:36:45", "remaining_time": "14:42:32", "throughput": 27198.13, "total_tokens": 5347311616} +{"current_steps": 19870, "total_steps": 25209, "loss": 0.9303, "lr": 2.893074803261876e-05, "epoch": 2.3646343912471086, "percentage": 78.82, "elapsed_time": "2 days, 6:38:23", "remaining_time": "14:40:53", "throughput": 27198.38, "total_tokens": 5350029056} +{"current_steps": 19880, "total_steps": 25209, "loss": 0.9309, "lr": 2.8925906309485995e-05, "epoch": 2.365824451270761, "percentage": 78.86, "elapsed_time": "2 days, 6:40:01", "remaining_time": "14:39:14", "throughput": 27198.61, "total_tokens": 5352722752} +{"current_steps": 19890, "total_steps": 25209, "loss": 0.9099, "lr": 2.8921067016408532e-05, "epoch": 2.367014511294413, "percentage": 78.9, "elapsed_time": "2 days, 6:41:36", "remaining_time": "14:37:34", "throughput": 27199.3, "total_tokens": 5355444480} +{"current_steps": 19900, "total_steps": 25209, "loss": 0.9219, "lr": 2.8916230151354316e-05, "epoch": 2.3682045713180657, "percentage": 78.94, "elapsed_time": "2 days, 6:43:09", "remaining_time": "14:35:53", "throughput": 27199.96, "total_tokens": 5358119552} +{"current_steps": 19910, "total_steps": 25209, "loss": 0.9234, "lr": 2.8911395712293677e-05, "epoch": 2.3693946313417182, "percentage": 78.98, "elapsed_time": "2 days, 6:44:43", "remaining_time": "14:34:13", "throughput": 27200.37, "total_tokens": 5360746304} +{"current_steps": 19920, "total_steps": 25209, "loss": 0.9321, "lr": 2.8906563697199294e-05, "epoch": 2.3705846913653708, "percentage": 79.02, "elapsed_time": "2 days, 6:46:22", "remaining_time": "14:32:34", "throughput": 27200.69, "total_tokens": 5363499968} +{"current_steps": 19930, "total_steps": 25209, "loss": 0.9146, "lr": 2.8901734104046245e-05, "epoch": 2.3717747513890233, "percentage": 79.06, "elapsed_time": "2 days, 6:47:58", "remaining_time": "14:30:54", "throughput": 27200.97, "total_tokens": 5366179008} +{"current_steps": 19940, "total_steps": 25209, "loss": 0.9149, "lr": 2.8896906930811964e-05, "epoch": 2.372964811412676, "percentage": 79.1, "elapsed_time": "2 days, 6:49:38", "remaining_time": "14:29:15", "throughput": 27200.98, "total_tokens": 5368889344} +{"current_steps": 19950, "total_steps": 25209, "loss": 0.9261, "lr": 2.8892082175476243e-05, "epoch": 2.3741548714363283, "percentage": 79.14, "elapsed_time": "2 days, 6:51:12", "remaining_time": "14:27:35", "throughput": 27201.58, "total_tokens": 5371563328} +{"current_steps": 19960, "total_steps": 25209, "loss": 0.934, "lr": 2.8887259836021246e-05, "epoch": 2.3753449314599804, "percentage": 79.18, "elapsed_time": "2 days, 6:52:49", "remaining_time": "14:25:55", "throughput": 27202.05, "total_tokens": 5374290560} +{"current_steps": 19970, "total_steps": 25209, "loss": 0.921, "lr": 2.8882439910431493e-05, "epoch": 2.376534991483633, "percentage": 79.22, "elapsed_time": "2 days, 6:54:27", "remaining_time": "14:24:16", "throughput": 27202.28, "total_tokens": 5377004288} +{"current_steps": 19980, "total_steps": 25209, "loss": 0.9251, "lr": 2.8877622396693843e-05, "epoch": 2.3777250515072854, "percentage": 79.26, "elapsed_time": "2 days, 6:56:04", "remaining_time": "14:22:37", "throughput": 27202.58, "total_tokens": 5379713984} +{"current_steps": 19990, "total_steps": 25209, "loss": 0.9148, "lr": 2.8872807292797516e-05, "epoch": 2.378915111530938, "percentage": 79.3, "elapsed_time": "2 days, 6:57:36", "remaining_time": "14:20:56", "throughput": 27203.33, "total_tokens": 5382368064} +{"current_steps": 20000, "total_steps": 25209, "loss": 0.9278, "lr": 2.8867994596734084e-05, "epoch": 2.3801051715545904, "percentage": 79.34, "elapsed_time": "2 days, 6:59:13", "remaining_time": "14:19:17", "throughput": 27203.74, "total_tokens": 5385085312} +{"current_steps": 20000, "total_steps": 25209, "eval_loss": 1.03257417678833, "epoch": 2.3801051715545904, "percentage": 79.34, "elapsed_time": "2 days, 6:59:15", "remaining_time": "14:19:17", "throughput": 27203.47, "total_tokens": 5385085312} +{"current_steps": 20010, "total_steps": 25209, "loss": 0.9339, "lr": 2.8863184306497437e-05, "epoch": 2.3812952315782425, "percentage": 79.38, "elapsed_time": "2 days, 7:01:32", "remaining_time": "14:17:48", "throughput": 27198.39, "total_tokens": 5387805376} +{"current_steps": 20020, "total_steps": 25209, "loss": 0.9223, "lr": 2.8858376420083848e-05, "epoch": 2.382485291601895, "percentage": 79.42, "elapsed_time": "2 days, 7:03:10", "remaining_time": "14:16:09", "throughput": 27198.69, "total_tokens": 5390507776} +{"current_steps": 20030, "total_steps": 25209, "loss": 0.9161, "lr": 2.8853570935491873e-05, "epoch": 2.3836753516255476, "percentage": 79.46, "elapsed_time": "2 days, 7:04:43", "remaining_time": "14:14:28", "throughput": 27199.2, "total_tokens": 5393160960} +{"current_steps": 20040, "total_steps": 25209, "loss": 0.9137, "lr": 2.8848767850722447e-05, "epoch": 2.3848654116492, "percentage": 79.5, "elapsed_time": "2 days, 7:06:17", "remaining_time": "14:12:48", "throughput": 27199.7, "total_tokens": 5395813696} +{"current_steps": 20050, "total_steps": 25209, "loss": 0.9225, "lr": 2.88439671637788e-05, "epoch": 2.3860554716728526, "percentage": 79.54, "elapsed_time": "2 days, 7:07:57", "remaining_time": "14:11:09", "throughput": 27199.76, "total_tokens": 5398535872} +{"current_steps": 20060, "total_steps": 25209, "loss": 0.9228, "lr": 2.8839168872666505e-05, "epoch": 2.387245531696505, "percentage": 79.57, "elapsed_time": "2 days, 7:09:34", "remaining_time": "14:09:30", "throughput": 27199.84, "total_tokens": 5401200320} +{"current_steps": 20070, "total_steps": 25209, "loss": 0.9274, "lr": 2.8834372975393448e-05, "epoch": 2.3884355917201576, "percentage": 79.61, "elapsed_time": "2 days, 7:11:07", "remaining_time": "14:07:49", "throughput": 27200.42, "total_tokens": 5403839424} +{"current_steps": 20080, "total_steps": 25209, "loss": 0.9251, "lr": 2.8829579469969843e-05, "epoch": 2.3896256517438097, "percentage": 79.65, "elapsed_time": "2 days, 7:12:41", "remaining_time": "14:06:09", "throughput": 27200.81, "total_tokens": 5406474240} +{"current_steps": 20090, "total_steps": 25209, "loss": 0.9142, "lr": 2.88247883544082e-05, "epoch": 2.390815711767462, "percentage": 79.69, "elapsed_time": "2 days, 7:14:12", "remaining_time": "14:04:28", "throughput": 27201.61, "total_tokens": 5409118400} +{"current_steps": 20100, "total_steps": 25209, "loss": 0.9122, "lr": 2.8819999626723366e-05, "epoch": 2.3920057717911147, "percentage": 79.73, "elapsed_time": "2 days, 7:15:49", "remaining_time": "14:02:48", "throughput": 27202.22, "total_tokens": 5411857728} +{"current_steps": 20110, "total_steps": 25209, "loss": 0.9172, "lr": 2.881521328493248e-05, "epoch": 2.3931958318147672, "percentage": 79.77, "elapsed_time": "2 days, 7:17:23", "remaining_time": "14:01:08", "throughput": 27202.82, "total_tokens": 5414540032} +{"current_steps": 20120, "total_steps": 25209, "loss": 0.9303, "lr": 2.881042932705499e-05, "epoch": 2.3943858918384198, "percentage": 79.81, "elapsed_time": "2 days, 7:19:00", "remaining_time": "13:59:28", "throughput": 27203.21, "total_tokens": 5417249152} +{"current_steps": 20130, "total_steps": 25209, "loss": 0.9247, "lr": 2.8805647751112635e-05, "epoch": 2.395575951862072, "percentage": 79.85, "elapsed_time": "2 days, 7:20:31", "remaining_time": "13:57:48", "throughput": 27203.92, "total_tokens": 5419887744} +{"current_steps": 20140, "total_steps": 25209, "loss": 0.9162, "lr": 2.8800868555129462e-05, "epoch": 2.3967660118857244, "percentage": 79.89, "elapsed_time": "2 days, 7:22:05", "remaining_time": "13:56:07", "throughput": 27204.39, "total_tokens": 5422531200} +{"current_steps": 20150, "total_steps": 25209, "loss": 0.93, "lr": 2.8796091737131814e-05, "epoch": 2.397956071909377, "percentage": 79.93, "elapsed_time": "2 days, 7:23:47", "remaining_time": "13:54:29", "throughput": 27204.12, "total_tokens": 5425240704} +{"current_steps": 20160, "total_steps": 25209, "loss": 0.9346, "lr": 2.8791317295148322e-05, "epoch": 2.3991461319330294, "percentage": 79.97, "elapsed_time": "2 days, 7:25:22", "remaining_time": "13:52:49", "throughput": 27204.68, "total_tokens": 5427939072} +{"current_steps": 20170, "total_steps": 25209, "loss": 0.9196, "lr": 2.8786545227209893e-05, "epoch": 2.400336191956682, "percentage": 80.01, "elapsed_time": "2 days, 7:26:55", "remaining_time": "13:51:09", "throughput": 27205.22, "total_tokens": 5430586880} +{"current_steps": 20180, "total_steps": 25209, "loss": 0.9185, "lr": 2.8781775531349742e-05, "epoch": 2.4015262519803344, "percentage": 80.05, "elapsed_time": "2 days, 7:28:29", "remaining_time": "13:49:29", "throughput": 27205.69, "total_tokens": 5433242496} +{"current_steps": 20190, "total_steps": 25209, "loss": 0.9319, "lr": 2.8777008205603334e-05, "epoch": 2.402716312003987, "percentage": 80.09, "elapsed_time": "2 days, 7:30:06", "remaining_time": "13:47:49", "throughput": 27205.98, "total_tokens": 5435942720} +{"current_steps": 20200, "total_steps": 25209, "loss": 0.9193, "lr": 2.877224324800844e-05, "epoch": 2.403906372027639, "percentage": 80.13, "elapsed_time": "2 days, 7:31:44", "remaining_time": "13:46:10", "throughput": 27206.17, "total_tokens": 5438647488} +{"current_steps": 20210, "total_steps": 25209, "loss": 0.9263, "lr": 2.8767480656605078e-05, "epoch": 2.4050964320512915, "percentage": 80.17, "elapsed_time": "2 days, 7:33:21", "remaining_time": "13:44:30", "throughput": 27206.44, "total_tokens": 5441336448} +{"current_steps": 20220, "total_steps": 25209, "loss": 0.918, "lr": 2.8762720429435556e-05, "epoch": 2.406286492074944, "percentage": 80.21, "elapsed_time": "2 days, 7:35:00", "remaining_time": "13:42:52", "throughput": 27206.34, "total_tokens": 5444006528} +{"current_steps": 20230, "total_steps": 25209, "loss": 0.9192, "lr": 2.8757962564544448e-05, "epoch": 2.4074765520985966, "percentage": 80.25, "elapsed_time": "2 days, 7:36:31", "remaining_time": "13:41:11", "throughput": 27207.23, "total_tokens": 5446661312} +{"current_steps": 20240, "total_steps": 25209, "loss": 0.9113, "lr": 2.8753207059978586e-05, "epoch": 2.408666612122249, "percentage": 80.29, "elapsed_time": "2 days, 7:38:06", "remaining_time": "13:39:31", "throughput": 27207.62, "total_tokens": 5449331136} +{"current_steps": 20250, "total_steps": 25209, "loss": 0.9207, "lr": 2.874845391378706e-05, "epoch": 2.409856672145901, "percentage": 80.33, "elapsed_time": "2 days, 7:39:47", "remaining_time": "13:37:52", "throughput": 27207.72, "total_tokens": 5452081216} +{"current_steps": 20260, "total_steps": 25209, "loss": 0.9127, "lr": 2.874370312402121e-05, "epoch": 2.4110467321695537, "percentage": 80.37, "elapsed_time": "2 days, 7:41:24", "remaining_time": "13:36:13", "throughput": 27208.03, "total_tokens": 5454791552} +{"current_steps": 20270, "total_steps": 25209, "loss": 0.919, "lr": 2.8738954688734647e-05, "epoch": 2.412236792193206, "percentage": 80.41, "elapsed_time": "2 days, 7:43:04", "remaining_time": "13:34:34", "throughput": 27208.02, "total_tokens": 5457499264} +{"current_steps": 20280, "total_steps": 25209, "loss": 0.9215, "lr": 2.8734208605983226e-05, "epoch": 2.4134268522168587, "percentage": 80.45, "elapsed_time": "2 days, 7:44:45", "remaining_time": "13:32:55", "throughput": 27207.95, "total_tokens": 5460230720} +{"current_steps": 20290, "total_steps": 25209, "loss": 0.917, "lr": 2.8729464873825035e-05, "epoch": 2.4146169122405112, "percentage": 80.49, "elapsed_time": "2 days, 7:46:24", "remaining_time": "13:31:17", "throughput": 27207.95, "total_tokens": 5462947328} +{"current_steps": 20300, "total_steps": 25209, "loss": 0.9212, "lr": 2.8724723490320427e-05, "epoch": 2.4158069722641637, "percentage": 80.53, "elapsed_time": "2 days, 7:48:05", "remaining_time": "13:29:38", "throughput": 27207.95, "total_tokens": 5465675456} +{"current_steps": 20310, "total_steps": 25209, "loss": 0.936, "lr": 2.8719984453531983e-05, "epoch": 2.4169970322878163, "percentage": 80.57, "elapsed_time": "2 days, 7:49:37", "remaining_time": "13:27:57", "throughput": 27208.62, "total_tokens": 5468314176} +{"current_steps": 20320, "total_steps": 25209, "loss": 0.9173, "lr": 2.871524776152452e-05, "epoch": 2.4181870923114683, "percentage": 80.61, "elapsed_time": "2 days, 7:51:15", "remaining_time": "13:26:18", "throughput": 27208.89, "total_tokens": 5471053184} +{"current_steps": 20330, "total_steps": 25209, "loss": 0.9333, "lr": 2.8710513412365093e-05, "epoch": 2.419377152335121, "percentage": 80.65, "elapsed_time": "2 days, 7:52:50", "remaining_time": "13:24:38", "throughput": 27209.28, "total_tokens": 5473709824} +{"current_steps": 20340, "total_steps": 25209, "loss": 0.9257, "lr": 2.8705781404122977e-05, "epoch": 2.4205672123587734, "percentage": 80.69, "elapsed_time": "2 days, 7:54:28", "remaining_time": "13:22:59", "throughput": 27209.36, "total_tokens": 5476387456} +{"current_steps": 20350, "total_steps": 25209, "loss": 0.9246, "lr": 2.87010517348697e-05, "epoch": 2.421757272382426, "percentage": 80.73, "elapsed_time": "2 days, 7:56:07", "remaining_time": "13:21:20", "throughput": 27209.43, "total_tokens": 5479091776} +{"current_steps": 20360, "total_steps": 25209, "loss": 0.9114, "lr": 2.8696324402678976e-05, "epoch": 2.4229473324060784, "percentage": 80.76, "elapsed_time": "2 days, 7:57:49", "remaining_time": "13:19:42", "throughput": 27209.11, "total_tokens": 5481806720} +{"current_steps": 20370, "total_steps": 25209, "loss": 0.932, "lr": 2.8691599405626764e-05, "epoch": 2.4241373924297305, "percentage": 80.8, "elapsed_time": "2 days, 7:59:22", "remaining_time": "13:18:02", "throughput": 27209.64, "total_tokens": 5484430144} +{"current_steps": 20380, "total_steps": 25209, "loss": 0.9189, "lr": 2.8686876741791234e-05, "epoch": 2.425327452453383, "percentage": 80.84, "elapsed_time": "2 days, 8:00:56", "remaining_time": "13:16:22", "throughput": 27210.14, "total_tokens": 5487113024} +{"current_steps": 20390, "total_steps": 25209, "loss": 0.9282, "lr": 2.8682156409252775e-05, "epoch": 2.4265175124770355, "percentage": 80.88, "elapsed_time": "2 days, 8:02:32", "remaining_time": "13:14:42", "throughput": 27210.65, "total_tokens": 5489820480} +{"current_steps": 20400, "total_steps": 25209, "loss": 0.912, "lr": 2.8677438406093976e-05, "epoch": 2.427707572500688, "percentage": 80.92, "elapsed_time": "2 days, 8:04:13", "remaining_time": "13:13:03", "throughput": 27210.86, "total_tokens": 5492596864} +{"current_steps": 20410, "total_steps": 25209, "loss": 0.9297, "lr": 2.867272273039964e-05, "epoch": 2.4288976325243405, "percentage": 80.96, "elapsed_time": "2 days, 8:05:48", "remaining_time": "13:11:24", "throughput": 27211.2, "total_tokens": 5495253248} +{"current_steps": 20420, "total_steps": 25209, "loss": 0.928, "lr": 2.8668009380256765e-05, "epoch": 2.430087692547993, "percentage": 81.0, "elapsed_time": "2 days, 8:07:24", "remaining_time": "13:09:44", "throughput": 27211.51, "total_tokens": 5497944256} +{"current_steps": 20430, "total_steps": 25209, "loss": 0.9418, "lr": 2.8663298353754574e-05, "epoch": 2.4312777525716456, "percentage": 81.04, "elapsed_time": "2 days, 8:09:05", "remaining_time": "13:08:05", "throughput": 27211.35, "total_tokens": 5500642752} +{"current_steps": 20440, "total_steps": 25209, "loss": 0.9215, "lr": 2.865858964898445e-05, "epoch": 2.4324678125952977, "percentage": 81.08, "elapsed_time": "2 days, 8:10:42", "remaining_time": "13:06:26", "throughput": 27211.44, "total_tokens": 5503312832} +{"current_steps": 20450, "total_steps": 25209, "loss": 0.9125, "lr": 2.8653883264040004e-05, "epoch": 2.43365787261895, "percentage": 81.12, "elapsed_time": "2 days, 8:12:21", "remaining_time": "13:04:47", "throughput": 27211.5, "total_tokens": 5506012160} +{"current_steps": 20460, "total_steps": 25209, "loss": 0.9122, "lr": 2.8649179197017017e-05, "epoch": 2.4348479326426027, "percentage": 81.16, "elapsed_time": "2 days, 8:14:00", "remaining_time": "13:03:08", "throughput": 27211.61, "total_tokens": 5508718336} +{"current_steps": 20470, "total_steps": 25209, "loss": 0.9315, "lr": 2.864447744601347e-05, "epoch": 2.436037992666255, "percentage": 81.2, "elapsed_time": "2 days, 8:15:35", "remaining_time": "13:01:28", "throughput": 27212.06, "total_tokens": 5511417024} +{"current_steps": 20480, "total_steps": 25209, "loss": 0.9406, "lr": 2.8639778009129507e-05, "epoch": 2.4372280526899077, "percentage": 81.24, "elapsed_time": "2 days, 8:17:12", "remaining_time": "12:59:49", "throughput": 27212.36, "total_tokens": 5514098944} +{"current_steps": 20490, "total_steps": 25209, "loss": 0.9182, "lr": 2.8635080884467492e-05, "epoch": 2.43841811271356, "percentage": 81.28, "elapsed_time": "2 days, 8:18:47", "remaining_time": "12:58:09", "throughput": 27212.92, "total_tokens": 5516800576} +{"current_steps": 20500, "total_steps": 25209, "loss": 0.9242, "lr": 2.8630386070131927e-05, "epoch": 2.4396081727372123, "percentage": 81.32, "elapsed_time": "2 days, 8:20:26", "remaining_time": "12:56:30", "throughput": 27212.96, "total_tokens": 5519505408} +{"current_steps": 20510, "total_steps": 25209, "loss": 0.9242, "lr": 2.8625693564229507e-05, "epoch": 2.440798232760865, "percentage": 81.36, "elapsed_time": "2 days, 8:22:01", "remaining_time": "12:54:50", "throughput": 27213.41, "total_tokens": 5522184064} +{"current_steps": 20520, "total_steps": 25209, "loss": 0.9215, "lr": 2.8621003364869102e-05, "epoch": 2.4419882927845173, "percentage": 81.4, "elapsed_time": "2 days, 8:23:38", "remaining_time": "12:53:11", "throughput": 27213.66, "total_tokens": 5524872000} +{"current_steps": 20530, "total_steps": 25209, "loss": 0.9208, "lr": 2.8616315470161738e-05, "epoch": 2.44317835280817, "percentage": 81.44, "elapsed_time": "2 days, 8:25:15", "remaining_time": "12:51:32", "throughput": 27213.93, "total_tokens": 5527564736} +{"current_steps": 20540, "total_steps": 25209, "loss": 0.919, "lr": 2.8611629878220624e-05, "epoch": 2.4443684128318224, "percentage": 81.48, "elapsed_time": "2 days, 8:26:49", "remaining_time": "12:49:52", "throughput": 27214.54, "total_tokens": 5530256256} +{"current_steps": 20550, "total_steps": 25209, "loss": 0.9198, "lr": 2.8606946587161116e-05, "epoch": 2.445558472855475, "percentage": 81.52, "elapsed_time": "2 days, 8:28:27", "remaining_time": "12:48:12", "throughput": 27214.78, "total_tokens": 5532969536} +{"current_steps": 20560, "total_steps": 25209, "loss": 0.9243, "lr": 2.860226559510072e-05, "epoch": 2.446748532879127, "percentage": 81.56, "elapsed_time": "2 days, 8:30:03", "remaining_time": "12:46:33", "throughput": 27215.13, "total_tokens": 5535643136} +{"current_steps": 20570, "total_steps": 25209, "loss": 0.9143, "lr": 2.859758690015913e-05, "epoch": 2.4479385929027795, "percentage": 81.6, "elapsed_time": "2 days, 8:31:38", "remaining_time": "12:44:53", "throughput": 27215.58, "total_tokens": 5538327808} +{"current_steps": 20580, "total_steps": 25209, "loss": 0.9162, "lr": 2.8592910500458154e-05, "epoch": 2.449128652926432, "percentage": 81.64, "elapsed_time": "2 days, 8:33:13", "remaining_time": "12:43:13", "throughput": 27215.92, "total_tokens": 5540996672} +{"current_steps": 20590, "total_steps": 25209, "loss": 0.9198, "lr": 2.858823639412178e-05, "epoch": 2.4503187129500845, "percentage": 81.68, "elapsed_time": "2 days, 8:34:51", "remaining_time": "12:41:34", "throughput": 27216.13, "total_tokens": 5543701248} +{"current_steps": 20600, "total_steps": 25209, "loss": 0.9239, "lr": 2.858356457927613e-05, "epoch": 2.451508772973737, "percentage": 81.72, "elapsed_time": "2 days, 8:36:30", "remaining_time": "12:39:55", "throughput": 27216.33, "total_tokens": 5546421760} +{"current_steps": 20610, "total_steps": 25209, "loss": 0.9223, "lr": 2.857889505404946e-05, "epoch": 2.452698832997389, "percentage": 81.76, "elapsed_time": "2 days, 8:38:04", "remaining_time": "12:38:15", "throughput": 27216.65, "total_tokens": 5549060608} +{"current_steps": 20620, "total_steps": 25209, "loss": 0.9145, "lr": 2.8574227816572184e-05, "epoch": 2.4538888930210416, "percentage": 81.8, "elapsed_time": "2 days, 8:39:37", "remaining_time": "12:36:35", "throughput": 27217.09, "total_tokens": 5551683456} +{"current_steps": 20630, "total_steps": 25209, "loss": 0.9225, "lr": 2.856956286497684e-05, "epoch": 2.455078953044694, "percentage": 81.84, "elapsed_time": "2 days, 8:41:15", "remaining_time": "12:34:56", "throughput": 27217.43, "total_tokens": 5554399168} +{"current_steps": 20640, "total_steps": 25209, "loss": 0.9264, "lr": 2.85649001973981e-05, "epoch": 2.4562690130683467, "percentage": 81.88, "elapsed_time": "2 days, 8:42:54", "remaining_time": "12:33:17", "throughput": 27217.5, "total_tokens": 5557131008} +{"current_steps": 20650, "total_steps": 25209, "loss": 0.9235, "lr": 2.8560239811972754e-05, "epoch": 2.457459073091999, "percentage": 81.92, "elapsed_time": "2 days, 8:44:34", "remaining_time": "12:31:38", "throughput": 27217.64, "total_tokens": 5559867776} +{"current_steps": 20660, "total_steps": 25209, "loss": 0.8995, "lr": 2.855558170683976e-05, "epoch": 2.4586491331156517, "percentage": 81.95, "elapsed_time": "2 days, 8:46:14", "remaining_time": "12:29:59", "throughput": 27217.7, "total_tokens": 5562602816} +{"current_steps": 20670, "total_steps": 25209, "loss": 0.9144, "lr": 2.855092588014017e-05, "epoch": 2.4598391931393038, "percentage": 81.99, "elapsed_time": "2 days, 8:47:52", "remaining_time": "12:28:20", "throughput": 27217.81, "total_tokens": 5565286080} +{"current_steps": 20680, "total_steps": 25209, "loss": 0.9217, "lr": 2.854627233001715e-05, "epoch": 2.4610292531629563, "percentage": 82.03, "elapsed_time": "2 days, 8:49:27", "remaining_time": "12:26:41", "throughput": 27218.16, "total_tokens": 5567960704} +{"current_steps": 20690, "total_steps": 25209, "loss": 0.9256, "lr": 2.8541621054615992e-05, "epoch": 2.462219313186609, "percentage": 82.07, "elapsed_time": "2 days, 8:51:05", "remaining_time": "12:25:01", "throughput": 27218.18, "total_tokens": 5570619392} +{"current_steps": 20700, "total_steps": 25209, "loss": 0.9194, "lr": 2.8536972052084122e-05, "epoch": 2.4634093732102613, "percentage": 82.11, "elapsed_time": "2 days, 8:52:44", "remaining_time": "12:23:22", "throughput": 27218.23, "total_tokens": 5573317824} +{"current_steps": 20710, "total_steps": 25209, "loss": 0.922, "lr": 2.853232532057104e-05, "epoch": 2.464599433233914, "percentage": 82.15, "elapsed_time": "2 days, 8:54:21", "remaining_time": "12:21:43", "throughput": 27218.27, "total_tokens": 5575971008} +{"current_steps": 20720, "total_steps": 25209, "loss": 0.9311, "lr": 2.8527680858228395e-05, "epoch": 2.4657894932575664, "percentage": 82.19, "elapsed_time": "2 days, 8:55:54", "remaining_time": "12:20:03", "throughput": 27218.96, "total_tokens": 5578654272} +{"current_steps": 20730, "total_steps": 25209, "loss": 0.9281, "lr": 2.8523038663209906e-05, "epoch": 2.4669795532812184, "percentage": 82.23, "elapsed_time": "2 days, 8:57:30", "remaining_time": "12:18:23", "throughput": 27219.68, "total_tokens": 5581397440} +{"current_steps": 20740, "total_steps": 25209, "loss": 0.9353, "lr": 2.8518398733671427e-05, "epoch": 2.468169613304871, "percentage": 82.27, "elapsed_time": "2 days, 8:59:05", "remaining_time": "12:16:44", "throughput": 27220.22, "total_tokens": 5584116160} +{"current_steps": 20750, "total_steps": 25209, "loss": 0.9267, "lr": 2.8513761067770877e-05, "epoch": 2.4693596733285235, "percentage": 82.31, "elapsed_time": "2 days, 9:00:40", "remaining_time": "12:15:04", "throughput": 27220.79, "total_tokens": 5586804032} +{"current_steps": 20760, "total_steps": 25209, "loss": 0.9215, "lr": 2.85091256636683e-05, "epoch": 2.470549733352176, "percentage": 82.35, "elapsed_time": "2 days, 9:02:16", "remaining_time": "12:13:24", "throughput": 27221.3, "total_tokens": 5589523008} +{"current_steps": 20770, "total_steps": 25209, "loss": 0.9207, "lr": 2.850449251952582e-05, "epoch": 2.4717397933758285, "percentage": 82.39, "elapsed_time": "2 days, 9:03:50", "remaining_time": "12:11:45", "throughput": 27221.72, "total_tokens": 5592182208} +{"current_steps": 20780, "total_steps": 25209, "loss": 0.9174, "lr": 2.849986163350766e-05, "epoch": 2.472929853399481, "percentage": 82.43, "elapsed_time": "2 days, 9:05:27", "remaining_time": "12:10:05", "throughput": 27222.1, "total_tokens": 5594898816} +{"current_steps": 20790, "total_steps": 25209, "loss": 0.9348, "lr": 2.8495233003780103e-05, "epoch": 2.474119913423133, "percentage": 82.47, "elapsed_time": "2 days, 9:07:05", "remaining_time": "12:08:26", "throughput": 27222.28, "total_tokens": 5597603776} +{"current_steps": 20800, "total_steps": 25209, "loss": 0.9227, "lr": 2.8490606628511557e-05, "epoch": 2.4753099734467856, "percentage": 82.51, "elapsed_time": "2 days, 9:08:44", "remaining_time": "12:06:47", "throughput": 27222.22, "total_tokens": 5600269248} +{"current_steps": 20810, "total_steps": 25209, "loss": 0.9192, "lr": 2.8485982505872476e-05, "epoch": 2.476500033470438, "percentage": 82.55, "elapsed_time": "2 days, 9:10:22", "remaining_time": "12:05:08", "throughput": 27222.42, "total_tokens": 5602975360} +{"current_steps": 20820, "total_steps": 25209, "loss": 0.9303, "lr": 2.8481360634035415e-05, "epoch": 2.4776900934940906, "percentage": 82.59, "elapsed_time": "2 days, 9:12:00", "remaining_time": "12:03:29", "throughput": 27222.77, "total_tokens": 5605722496} +{"current_steps": 20830, "total_steps": 25209, "loss": 0.9153, "lr": 2.847674101117499e-05, "epoch": 2.478880153517743, "percentage": 82.63, "elapsed_time": "2 days, 9:13:34", "remaining_time": "12:01:49", "throughput": 27223.32, "total_tokens": 5608399232} +{"current_steps": 20840, "total_steps": 25209, "loss": 0.9227, "lr": 2.8472123635467896e-05, "epoch": 2.4800702135413957, "percentage": 82.67, "elapsed_time": "2 days, 9:15:13", "remaining_time": "12:00:10", "throughput": 27223.64, "total_tokens": 5611168640} +{"current_steps": 20850, "total_steps": 25209, "loss": 0.9417, "lr": 2.846750850509289e-05, "epoch": 2.4812602735650477, "percentage": 82.71, "elapsed_time": "2 days, 9:16:50", "remaining_time": "11:58:31", "throughput": 27223.93, "total_tokens": 5613847424} +{"current_steps": 20860, "total_steps": 25209, "loss": 0.9293, "lr": 2.8462895618230813e-05, "epoch": 2.4824503335887003, "percentage": 82.75, "elapsed_time": "2 days, 9:18:27", "remaining_time": "11:56:52", "throughput": 27224.23, "total_tokens": 5616558720} +{"current_steps": 20870, "total_steps": 25209, "loss": 0.9347, "lr": 2.845828497306453e-05, "epoch": 2.483640393612353, "percentage": 82.79, "elapsed_time": "2 days, 9:20:09", "remaining_time": "11:55:13", "throughput": 27223.88, "total_tokens": 5619258496} +{"current_steps": 20880, "total_steps": 25209, "loss": 0.9262, "lr": 2.8453676567779018e-05, "epoch": 2.4848304536360053, "percentage": 82.83, "elapsed_time": "2 days, 9:21:41", "remaining_time": "11:53:33", "throughput": 27224.36, "total_tokens": 5621876736} +{"current_steps": 20890, "total_steps": 25209, "loss": 0.9252, "lr": 2.8449070400561267e-05, "epoch": 2.486020513659658, "percentage": 82.87, "elapsed_time": "2 days, 9:23:15", "remaining_time": "11:51:53", "throughput": 27225.0, "total_tokens": 5624570624} +{"current_steps": 20900, "total_steps": 25209, "loss": 0.9297, "lr": 2.8444466469600343e-05, "epoch": 2.4872105736833103, "percentage": 82.91, "elapsed_time": "2 days, 9:24:53", "remaining_time": "11:50:14", "throughput": 27225.15, "total_tokens": 5627262528} +{"current_steps": 20910, "total_steps": 25209, "loss": 0.9126, "lr": 2.8439864773087354e-05, "epoch": 2.4884006337069624, "percentage": 82.95, "elapsed_time": "2 days, 9:26:27", "remaining_time": "11:48:34", "throughput": 27225.48, "total_tokens": 5629892480} +{"current_steps": 20920, "total_steps": 25209, "loss": 0.936, "lr": 2.8435265309215465e-05, "epoch": 2.489590693730615, "percentage": 82.99, "elapsed_time": "2 days, 9:28:06", "remaining_time": "11:46:55", "throughput": 27225.48, "total_tokens": 5632596736} +{"current_steps": 20930, "total_steps": 25209, "loss": 0.9354, "lr": 2.843066807617987e-05, "epoch": 2.4907807537542674, "percentage": 83.03, "elapsed_time": "2 days, 9:29:40", "remaining_time": "11:45:15", "throughput": 27226.07, "total_tokens": 5635265152} +{"current_steps": 20940, "total_steps": 25209, "loss": 0.9238, "lr": 2.8426073072177827e-05, "epoch": 2.49197081377792, "percentage": 83.07, "elapsed_time": "2 days, 9:31:14", "remaining_time": "11:43:35", "throughput": 27226.36, "total_tokens": 5637892608} +{"current_steps": 20950, "total_steps": 25209, "loss": 0.9235, "lr": 2.8421480295408616e-05, "epoch": 2.4931608738015725, "percentage": 83.11, "elapsed_time": "2 days, 9:32:50", "remaining_time": "11:41:56", "throughput": 27226.91, "total_tokens": 5640620992} +{"current_steps": 20960, "total_steps": 25209, "loss": 0.9107, "lr": 2.841688974407355e-05, "epoch": 2.494350933825225, "percentage": 83.14, "elapsed_time": "2 days, 9:34:30", "remaining_time": "11:40:17", "throughput": 27226.81, "total_tokens": 5643305408} +{"current_steps": 20970, "total_steps": 25209, "loss": 0.9238, "lr": 2.8412301416375984e-05, "epoch": 2.495540993848877, "percentage": 83.18, "elapsed_time": "2 days, 9:36:09", "remaining_time": "11:38:38", "throughput": 27226.72, "total_tokens": 5645994752} +{"current_steps": 20980, "total_steps": 25209, "loss": 0.9137, "lr": 2.840771531052131e-05, "epoch": 2.4967310538725296, "percentage": 83.22, "elapsed_time": "2 days, 9:37:46", "remaining_time": "11:36:59", "throughput": 27226.86, "total_tokens": 5648656128} +{"current_steps": 20990, "total_steps": 25209, "loss": 0.9212, "lr": 2.840313142471694e-05, "epoch": 2.497921113896182, "percentage": 83.26, "elapsed_time": "2 days, 9:39:24", "remaining_time": "11:35:20", "throughput": 27227.0, "total_tokens": 5651371072} +{"current_steps": 21000, "total_steps": 25209, "loss": 0.9251, "lr": 2.83985497571723e-05, "epoch": 2.4991111739198346, "percentage": 83.3, "elapsed_time": "2 days, 9:41:03", "remaining_time": "11:33:41", "throughput": 27227.11, "total_tokens": 5654079616} +{"current_steps": 21010, "total_steps": 25209, "loss": 0.9169, "lr": 2.8393970306098843e-05, "epoch": 2.500301233943487, "percentage": 83.34, "elapsed_time": "2 days, 9:42:41", "remaining_time": "11:32:02", "throughput": 27227.22, "total_tokens": 5656761152} +{"current_steps": 21020, "total_steps": 25209, "loss": 0.9236, "lr": 2.8389393069710053e-05, "epoch": 2.501491293967139, "percentage": 83.38, "elapsed_time": "2 days, 9:44:17", "remaining_time": "11:30:23", "throughput": 27227.42, "total_tokens": 5659426304} +{"current_steps": 21030, "total_steps": 25209, "loss": 0.913, "lr": 2.8384818046221418e-05, "epoch": 2.502681353990792, "percentage": 83.42, "elapsed_time": "2 days, 9:45:53", "remaining_time": "11:28:43", "throughput": 27227.81, "total_tokens": 5662106304} +{"current_steps": 21040, "total_steps": 25209, "loss": 0.9281, "lr": 2.8380245233850434e-05, "epoch": 2.5038714140144442, "percentage": 83.46, "elapsed_time": "2 days, 9:47:29", "remaining_time": "11:27:04", "throughput": 27228.06, "total_tokens": 5664774528} +{"current_steps": 21050, "total_steps": 25209, "loss": 0.917, "lr": 2.837567463081662e-05, "epoch": 2.5050614740380968, "percentage": 83.5, "elapsed_time": "2 days, 9:49:04", "remaining_time": "11:25:24", "throughput": 27228.33, "total_tokens": 5667418688} +{"current_steps": 21060, "total_steps": 25209, "loss": 0.9158, "lr": 2.8371106235341477e-05, "epoch": 2.5062515340617493, "percentage": 83.54, "elapsed_time": "2 days, 9:50:40", "remaining_time": "11:23:45", "throughput": 27228.64, "total_tokens": 5670099328} +{"current_steps": 21070, "total_steps": 25209, "loss": 0.922, "lr": 2.836654004564855e-05, "epoch": 2.507441594085402, "percentage": 83.58, "elapsed_time": "2 days, 9:52:17", "remaining_time": "11:22:05", "throughput": 27228.9, "total_tokens": 5672812096} +{"current_steps": 21080, "total_steps": 25209, "loss": 0.9119, "lr": 2.8361976059963348e-05, "epoch": 2.5086316541090543, "percentage": 83.62, "elapsed_time": "2 days, 9:53:50", "remaining_time": "11:20:25", "throughput": 27229.46, "total_tokens": 5675458368} +{"current_steps": 21090, "total_steps": 25209, "loss": 0.9204, "lr": 2.835741427651339e-05, "epoch": 2.5098217141327064, "percentage": 83.66, "elapsed_time": "2 days, 9:55:29", "remaining_time": "11:18:46", "throughput": 27229.53, "total_tokens": 5678150784} +{"current_steps": 21100, "total_steps": 25209, "loss": 0.9265, "lr": 2.8352854693528197e-05, "epoch": 2.511011774156359, "percentage": 83.7, "elapsed_time": "2 days, 9:56:58", "remaining_time": "11:17:06", "throughput": 27230.43, "total_tokens": 5680777536} +{"current_steps": 21110, "total_steps": 25209, "loss": 0.9286, "lr": 2.8348297309239274e-05, "epoch": 2.5122018341800114, "percentage": 83.74, "elapsed_time": "2 days, 9:58:34", "remaining_time": "11:15:26", "throughput": 27230.79, "total_tokens": 5683451968} +{"current_steps": 21120, "total_steps": 25209, "loss": 0.9341, "lr": 2.834374212188012e-05, "epoch": 2.513391894203664, "percentage": 83.78, "elapsed_time": "2 days, 10:00:13", "remaining_time": "11:13:47", "throughput": 27230.78, "total_tokens": 5686143104} +{"current_steps": 21130, "total_steps": 25209, "loss": 0.9333, "lr": 2.833918912968621e-05, "epoch": 2.5145819542273165, "percentage": 83.82, "elapsed_time": "2 days, 10:01:51", "remaining_time": "11:12:08", "throughput": 27230.8, "total_tokens": 5688823616} +{"current_steps": 21140, "total_steps": 25209, "loss": 0.9197, "lr": 2.833463833089502e-05, "epoch": 2.5157720142509685, "percentage": 83.86, "elapsed_time": "2 days, 10:03:29", "remaining_time": "11:10:29", "throughput": 27230.84, "total_tokens": 5691502080} +{"current_steps": 21150, "total_steps": 25209, "loss": 0.9407, "lr": 2.8330089723745985e-05, "epoch": 2.5169620742746215, "percentage": 83.9, "elapsed_time": "2 days, 10:05:03", "remaining_time": "11:08:50", "throughput": 27231.24, "total_tokens": 5694153984} +{"current_steps": 21160, "total_steps": 25209, "loss": 0.9315, "lr": 2.8325543306480538e-05, "epoch": 2.5181521342982736, "percentage": 83.94, "elapsed_time": "2 days, 10:06:39", "remaining_time": "11:07:10", "throughput": 27231.47, "total_tokens": 5696820096} +{"current_steps": 21170, "total_steps": 25209, "loss": 0.9153, "lr": 2.832099907734208e-05, "epoch": 2.519342194321926, "percentage": 83.98, "elapsed_time": "2 days, 10:08:13", "remaining_time": "11:05:30", "throughput": 27232.14, "total_tokens": 5699506752} +{"current_steps": 21180, "total_steps": 25209, "loss": 0.9295, "lr": 2.831645703457598e-05, "epoch": 2.5205322543455786, "percentage": 84.02, "elapsed_time": "2 days, 10:09:48", "remaining_time": "11:03:51", "throughput": 27232.48, "total_tokens": 5702156544} +{"current_steps": 21190, "total_steps": 25209, "loss": 0.9286, "lr": 2.8311917176429582e-05, "epoch": 2.521722314369231, "percentage": 84.06, "elapsed_time": "2 days, 10:11:21", "remaining_time": "11:02:11", "throughput": 27233.2, "total_tokens": 5704845760} +{"current_steps": 21200, "total_steps": 25209, "loss": 0.914, "lr": 2.830737950115218e-05, "epoch": 2.5229123743928836, "percentage": 84.1, "elapsed_time": "2 days, 10:13:03", "remaining_time": "11:00:32", "throughput": 27232.94, "total_tokens": 5707562048} +{"current_steps": 21210, "total_steps": 25209, "loss": 0.9228, "lr": 2.8302844006995062e-05, "epoch": 2.5241024344165357, "percentage": 84.14, "elapsed_time": "2 days, 10:14:36", "remaining_time": "10:58:53", "throughput": 27233.51, "total_tokens": 5710233152} +{"current_steps": 21220, "total_steps": 25209, "loss": 0.9194, "lr": 2.829831069221145e-05, "epoch": 2.525292494440188, "percentage": 84.18, "elapsed_time": "2 days, 10:16:14", "remaining_time": "10:57:13", "throughput": 27233.51, "total_tokens": 5712887680} +{"current_steps": 21230, "total_steps": 25209, "loss": 0.915, "lr": 2.8293779555056532e-05, "epoch": 2.5264825544638407, "percentage": 84.22, "elapsed_time": "2 days, 10:17:52", "remaining_time": "10:55:35", "throughput": 27233.53, "total_tokens": 5715581184} +{"current_steps": 21240, "total_steps": 25209, "loss": 0.911, "lr": 2.8289250593787454e-05, "epoch": 2.5276726144874933, "percentage": 84.26, "elapsed_time": "2 days, 10:19:31", "remaining_time": "10:53:56", "throughput": 27233.67, "total_tokens": 5718304256} +{"current_steps": 21250, "total_steps": 25209, "loss": 0.9347, "lr": 2.8284723806663316e-05, "epoch": 2.5288626745111458, "percentage": 84.3, "elapsed_time": "2 days, 10:21:07", "remaining_time": "10:52:16", "throughput": 27234.18, "total_tokens": 5721020352} +{"current_steps": 21260, "total_steps": 25209, "loss": 0.918, "lr": 2.828019919194515e-05, "epoch": 2.530052734534798, "percentage": 84.33, "elapsed_time": "2 days, 10:22:42", "remaining_time": "10:50:37", "throughput": 27234.55, "total_tokens": 5723691392} +{"current_steps": 21270, "total_steps": 25209, "loss": 0.9244, "lr": 2.827567674789597e-05, "epoch": 2.531242794558451, "percentage": 84.37, "elapsed_time": "2 days, 10:24:20", "remaining_time": "10:48:58", "throughput": 27234.74, "total_tokens": 5726385856} +{"current_steps": 21280, "total_steps": 25209, "loss": 0.9442, "lr": 2.8271156472780697e-05, "epoch": 2.532432854582103, "percentage": 84.41, "elapsed_time": "2 days, 10:26:00", "remaining_time": "10:47:19", "throughput": 27234.72, "total_tokens": 5729100480} +{"current_steps": 21290, "total_steps": 25209, "loss": 0.92, "lr": 2.826663836486621e-05, "epoch": 2.5336229146057554, "percentage": 84.45, "elapsed_time": "2 days, 10:27:38", "remaining_time": "10:45:40", "throughput": 27234.77, "total_tokens": 5731787136} +{"current_steps": 21300, "total_steps": 25209, "loss": 0.9288, "lr": 2.8262122422421326e-05, "epoch": 2.534812974629408, "percentage": 84.49, "elapsed_time": "2 days, 10:29:19", "remaining_time": "10:44:02", "throughput": 27234.6, "total_tokens": 5734513984} +{"current_steps": 21310, "total_steps": 25209, "loss": 0.9232, "lr": 2.8257608643716797e-05, "epoch": 2.5360030346530604, "percentage": 84.53, "elapsed_time": "2 days, 10:30:56", "remaining_time": "10:42:22", "throughput": 27235.0, "total_tokens": 5737238272} +{"current_steps": 21320, "total_steps": 25209, "loss": 0.9206, "lr": 2.8253097027025312e-05, "epoch": 2.537193094676713, "percentage": 84.57, "elapsed_time": "2 days, 10:32:36", "remaining_time": "10:40:44", "throughput": 27235.18, "total_tokens": 5739979840} +{"current_steps": 21330, "total_steps": 25209, "loss": 0.9309, "lr": 2.8248587570621472e-05, "epoch": 2.538383154700365, "percentage": 84.61, "elapsed_time": "2 days, 10:34:09", "remaining_time": "10:39:04", "throughput": 27235.79, "total_tokens": 5742661504} +{"current_steps": 21340, "total_steps": 25209, "loss": 0.9154, "lr": 2.824408027278182e-05, "epoch": 2.5395732147240175, "percentage": 84.65, "elapsed_time": "2 days, 10:35:47", "remaining_time": "10:37:25", "throughput": 27236.04, "total_tokens": 5745377216} +{"current_steps": 21350, "total_steps": 25209, "loss": 0.9296, "lr": 2.823957513178483e-05, "epoch": 2.54076327474767, "percentage": 84.69, "elapsed_time": "2 days, 10:37:26", "remaining_time": "10:35:46", "throughput": 27236.01, "total_tokens": 5748068544} +{"current_steps": 21360, "total_steps": 25209, "loss": 0.9518, "lr": 2.8235072145910878e-05, "epoch": 2.5419533347713226, "percentage": 84.73, "elapsed_time": "2 days, 10:39:04", "remaining_time": "10:34:07", "throughput": 27236.08, "total_tokens": 5750743808} +{"current_steps": 21370, "total_steps": 25209, "loss": 0.925, "lr": 2.8230571313442273e-05, "epoch": 2.543143394794975, "percentage": 84.77, "elapsed_time": "2 days, 10:40:45", "remaining_time": "10:32:29", "throughput": 27235.97, "total_tokens": 5753471488} +{"current_steps": 21380, "total_steps": 25209, "loss": 0.9152, "lr": 2.822607263266324e-05, "epoch": 2.544333454818627, "percentage": 84.81, "elapsed_time": "2 days, 10:42:25", "remaining_time": "10:30:50", "throughput": 27235.93, "total_tokens": 5756189184} +{"current_steps": 21390, "total_steps": 25209, "loss": 0.9224, "lr": 2.822157610185991e-05, "epoch": 2.54552351484228, "percentage": 84.85, "elapsed_time": "2 days, 10:43:58", "remaining_time": "10:29:10", "throughput": 27236.48, "total_tokens": 5758847296} +{"current_steps": 21400, "total_steps": 25209, "loss": 0.922, "lr": 2.821708171932032e-05, "epoch": 2.546713574865932, "percentage": 84.89, "elapsed_time": "2 days, 10:45:33", "remaining_time": "10:27:30", "throughput": 27236.93, "total_tokens": 5761510912} +{"current_steps": 21410, "total_steps": 25209, "loss": 0.9206, "lr": 2.821258948333444e-05, "epoch": 2.5479036348895847, "percentage": 84.93, "elapsed_time": "2 days, 10:47:11", "remaining_time": "10:25:51", "throughput": 27237.12, "total_tokens": 5764224512} +{"current_steps": 21420, "total_steps": 25209, "loss": 0.9166, "lr": 2.8208099392194116e-05, "epoch": 2.5490936949132372, "percentage": 84.97, "elapsed_time": "2 days, 10:48:50", "remaining_time": "10:24:13", "throughput": 27237.25, "total_tokens": 5766944320} +{"current_steps": 21430, "total_steps": 25209, "loss": 0.9167, "lr": 2.8203611444193113e-05, "epoch": 2.5502837549368897, "percentage": 85.01, "elapsed_time": "2 days, 10:50:26", "remaining_time": "10:22:33", "throughput": 27237.68, "total_tokens": 5769651328} +{"current_steps": 21440, "total_steps": 25209, "loss": 0.9108, "lr": 2.8199125637627084e-05, "epoch": 2.5514738149605423, "percentage": 85.05, "elapsed_time": "2 days, 10:52:03", "remaining_time": "10:20:54", "throughput": 27237.93, "total_tokens": 5772364992} +{"current_steps": 21450, "total_steps": 25209, "loss": 0.9372, "lr": 2.8194641970793593e-05, "epoch": 2.5526638749841943, "percentage": 85.09, "elapsed_time": "2 days, 10:53:47", "remaining_time": "10:19:16", "throughput": 27237.75, "total_tokens": 5775141888} +{"current_steps": 21460, "total_steps": 25209, "loss": 0.9353, "lr": 2.8190160441992092e-05, "epoch": 2.553853935007847, "percentage": 85.13, "elapsed_time": "2 days, 10:55:22", "remaining_time": "10:17:37", "throughput": 27238.16, "total_tokens": 5777839360} +{"current_steps": 21470, "total_steps": 25209, "loss": 0.9332, "lr": 2.818568104952392e-05, "epoch": 2.5550439950314994, "percentage": 85.17, "elapsed_time": "2 days, 10:57:05", "remaining_time": "10:15:59", "throughput": 27237.96, "total_tokens": 5780585664} +{"current_steps": 21480, "total_steps": 25209, "loss": 0.9255, "lr": 2.8181203791692306e-05, "epoch": 2.556234055055152, "percentage": 85.21, "elapsed_time": "2 days, 10:58:42", "remaining_time": "10:14:19", "throughput": 27238.2, "total_tokens": 5783284800} +{"current_steps": 21490, "total_steps": 25209, "loss": 0.915, "lr": 2.8176728666802375e-05, "epoch": 2.5574241150788044, "percentage": 85.25, "elapsed_time": "2 days, 11:00:18", "remaining_time": "10:12:40", "throughput": 27238.57, "total_tokens": 5785986240} +{"current_steps": 21500, "total_steps": 25209, "loss": 0.923, "lr": 2.8172255673161124e-05, "epoch": 2.5586141751024565, "percentage": 85.29, "elapsed_time": "2 days, 11:01:52", "remaining_time": "10:11:00", "throughput": 27238.97, "total_tokens": 5788614784} +{"current_steps": 21510, "total_steps": 25209, "loss": 0.926, "lr": 2.8167784809077436e-05, "epoch": 2.5598042351261094, "percentage": 85.33, "elapsed_time": "2 days, 11:03:27", "remaining_time": "10:09:21", "throughput": 27239.34, "total_tokens": 5791282240} +{"current_steps": 21520, "total_steps": 25209, "loss": 0.9197, "lr": 2.816331607286207e-05, "epoch": 2.5609942951497615, "percentage": 85.37, "elapsed_time": "2 days, 11:05:07", "remaining_time": "10:07:42", "throughput": 27239.2, "total_tokens": 5793982016} +{"current_steps": 21530, "total_steps": 25209, "loss": 0.9189, "lr": 2.815884946282766e-05, "epoch": 2.562184355173414, "percentage": 85.41, "elapsed_time": "2 days, 11:06:43", "remaining_time": "10:06:03", "throughput": 27239.54, "total_tokens": 5796679808} +{"current_steps": 21540, "total_steps": 25209, "loss": 0.9319, "lr": 2.815438497728871e-05, "epoch": 2.5633744151970665, "percentage": 85.45, "elapsed_time": "2 days, 11:08:19", "remaining_time": "10:04:24", "throughput": 27240.0, "total_tokens": 5799372416} +{"current_steps": 21550, "total_steps": 25209, "loss": 0.9097, "lr": 2.8149922614561607e-05, "epoch": 2.564564475220719, "percentage": 85.49, "elapsed_time": "2 days, 11:09:54", "remaining_time": "10:02:44", "throughput": 27240.36, "total_tokens": 5802053056} +{"current_steps": 21560, "total_steps": 25209, "loss": 0.9233, "lr": 2.8145462372964588e-05, "epoch": 2.5657545352443716, "percentage": 85.53, "elapsed_time": "2 days, 11:11:28", "remaining_time": "10:01:04", "throughput": 27240.82, "total_tokens": 5804712576} +{"current_steps": 21570, "total_steps": 25209, "loss": 0.9342, "lr": 2.814100425081777e-05, "epoch": 2.5669445952680237, "percentage": 85.56, "elapsed_time": "2 days, 11:13:04", "remaining_time": "9:59:25", "throughput": 27241.2, "total_tokens": 5807415232} +{"current_steps": 21580, "total_steps": 25209, "loss": 0.9419, "lr": 2.8136548246443117e-05, "epoch": 2.568134655291676, "percentage": 85.6, "elapsed_time": "2 days, 11:14:36", "remaining_time": "9:57:45", "throughput": 27241.93, "total_tokens": 5810073664} +{"current_steps": 21590, "total_steps": 25209, "loss": 0.9134, "lr": 2.8132094358164468e-05, "epoch": 2.5693247153153287, "percentage": 85.64, "elapsed_time": "2 days, 11:16:09", "remaining_time": "9:56:05", "throughput": 27242.69, "total_tokens": 5812751616} +{"current_steps": 21600, "total_steps": 25209, "loss": 0.9253, "lr": 2.8127642584307508e-05, "epoch": 2.570514775338981, "percentage": 85.68, "elapsed_time": "2 days, 11:17:43", "remaining_time": "9:54:26", "throughput": 27243.25, "total_tokens": 5815426816} +{"current_steps": 21610, "total_steps": 25209, "loss": 0.9252, "lr": 2.8123192923199776e-05, "epoch": 2.5717048353626337, "percentage": 85.72, "elapsed_time": "2 days, 11:19:25", "remaining_time": "9:52:47", "throughput": 27243.09, "total_tokens": 5818182976} +{"current_steps": 21620, "total_steps": 25209, "loss": 0.9203, "lr": 2.8118745373170667e-05, "epoch": 2.572894895386286, "percentage": 85.76, "elapsed_time": "2 days, 11:20:56", "remaining_time": "9:51:07", "throughput": 27243.84, "total_tokens": 5820823488} +{"current_steps": 21630, "total_steps": 25209, "loss": 0.9375, "lr": 2.8114299932551423e-05, "epoch": 2.5740849554099388, "percentage": 85.8, "elapsed_time": "2 days, 11:22:30", "remaining_time": "9:49:28", "throughput": 27244.18, "total_tokens": 5823465984} +{"current_steps": 21640, "total_steps": 25209, "loss": 0.9102, "lr": 2.8109856599675145e-05, "epoch": 2.575275015433591, "percentage": 85.84, "elapsed_time": "2 days, 11:24:06", "remaining_time": "9:47:48", "throughput": 27244.7, "total_tokens": 5826190144} +{"current_steps": 21650, "total_steps": 25209, "loss": 0.9255, "lr": 2.8105415372876742e-05, "epoch": 2.5764650754572433, "percentage": 85.88, "elapsed_time": "2 days, 11:25:43", "remaining_time": "9:46:09", "throughput": 27244.85, "total_tokens": 5828863424} +{"current_steps": 21660, "total_steps": 25209, "loss": 0.9148, "lr": 2.8100976250493e-05, "epoch": 2.577655135480896, "percentage": 85.92, "elapsed_time": "2 days, 11:27:21", "remaining_time": "9:44:30", "throughput": 27244.83, "total_tokens": 5831532416} +{"current_steps": 21670, "total_steps": 25209, "loss": 0.9274, "lr": 2.8096539230862527e-05, "epoch": 2.5788451955045484, "percentage": 85.96, "elapsed_time": "2 days, 11:29:02", "remaining_time": "9:42:52", "throughput": 27244.91, "total_tokens": 5834296448} +{"current_steps": 21680, "total_steps": 25209, "loss": 0.9289, "lr": 2.809210431232578e-05, "epoch": 2.580035255528201, "percentage": 86.0, "elapsed_time": "2 days, 11:30:38", "remaining_time": "9:41:13", "throughput": 27245.37, "total_tokens": 5837011264} +{"current_steps": 21690, "total_steps": 25209, "loss": 0.9247, "lr": 2.8087671493225025e-05, "epoch": 2.581225315551853, "percentage": 86.04, "elapsed_time": "2 days, 11:32:15", "remaining_time": "9:39:33", "throughput": 27245.57, "total_tokens": 5839680832} +{"current_steps": 21700, "total_steps": 25209, "loss": 0.9161, "lr": 2.808324077190438e-05, "epoch": 2.5824153755755055, "percentage": 86.08, "elapsed_time": "2 days, 11:33:54", "remaining_time": "9:37:55", "throughput": 27245.69, "total_tokens": 5842428672} +{"current_steps": 21710, "total_steps": 25209, "loss": 0.9229, "lr": 2.807881214670978e-05, "epoch": 2.583605435599158, "percentage": 86.12, "elapsed_time": "2 days, 11:35:27", "remaining_time": "9:36:15", "throughput": 27246.08, "total_tokens": 5845035200} +{"current_steps": 21720, "total_steps": 25209, "loss": 0.9322, "lr": 2.8074385615988996e-05, "epoch": 2.5847954956228105, "percentage": 86.16, "elapsed_time": "2 days, 11:37:06", "remaining_time": "9:34:36", "throughput": 27246.14, "total_tokens": 5847735872} +{"current_steps": 21730, "total_steps": 25209, "loss": 0.9294, "lr": 2.8069961178091602e-05, "epoch": 2.585985555646463, "percentage": 86.2, "elapsed_time": "2 days, 11:38:44", "remaining_time": "9:32:57", "throughput": 27246.26, "total_tokens": 5850427392} +{"current_steps": 21740, "total_steps": 25209, "loss": 0.9196, "lr": 2.806553883136901e-05, "epoch": 2.587175615670115, "percentage": 86.24, "elapsed_time": "2 days, 11:40:19", "remaining_time": "9:31:18", "throughput": 27246.65, "total_tokens": 5853117760} +{"current_steps": 21750, "total_steps": 25209, "loss": 0.9233, "lr": 2.806111857417445e-05, "epoch": 2.588365675693768, "percentage": 86.28, "elapsed_time": "2 days, 11:41:55", "remaining_time": "9:29:39", "throughput": 27247.14, "total_tokens": 5855841216} +{"current_steps": 21760, "total_steps": 25209, "loss": 0.9293, "lr": 2.8056700404862957e-05, "epoch": 2.58955573571742, "percentage": 86.32, "elapsed_time": "2 days, 11:43:32", "remaining_time": "9:27:59", "throughput": 27247.38, "total_tokens": 5858517504} +{"current_steps": 21770, "total_steps": 25209, "loss": 0.928, "lr": 2.8052284321791383e-05, "epoch": 2.5907457957410727, "percentage": 86.36, "elapsed_time": "2 days, 11:45:12", "remaining_time": "9:26:21", "throughput": 27247.17, "total_tokens": 5861206400} +{"current_steps": 21780, "total_steps": 25209, "loss": 0.9232, "lr": 2.8047870323318382e-05, "epoch": 2.591935855764725, "percentage": 86.4, "elapsed_time": "2 days, 11:46:46", "remaining_time": "9:24:41", "throughput": 27247.65, "total_tokens": 5863876160} +{"current_steps": 21790, "total_steps": 25209, "loss": 0.9301, "lr": 2.8043458407804428e-05, "epoch": 2.5931259157883777, "percentage": 86.44, "elapsed_time": "2 days, 11:48:24", "remaining_time": "9:23:02", "throughput": 27247.72, "total_tokens": 5866554112} +{"current_steps": 21800, "total_steps": 25209, "loss": 0.9288, "lr": 2.8039048573611805e-05, "epoch": 2.59431597581203, "percentage": 86.48, "elapsed_time": "2 days, 11:49:55", "remaining_time": "9:21:22", "throughput": 27248.42, "total_tokens": 5869173312} +{"current_steps": 21810, "total_steps": 25209, "loss": 0.9307, "lr": 2.8034640819104574e-05, "epoch": 2.5955060358356823, "percentage": 86.52, "elapsed_time": "2 days, 11:51:28", "remaining_time": "9:19:43", "throughput": 27248.8, "total_tokens": 5871811264} +{"current_steps": 21820, "total_steps": 25209, "loss": 0.9248, "lr": 2.803023514264861e-05, "epoch": 2.596696095859335, "percentage": 86.56, "elapsed_time": "2 days, 11:53:05", "remaining_time": "9:18:03", "throughput": 27249.1, "total_tokens": 5874514048} +{"current_steps": 21830, "total_steps": 25209, "loss": 0.9322, "lr": 2.8025831542611596e-05, "epoch": 2.5978861558829873, "percentage": 86.6, "elapsed_time": "2 days, 11:54:40", "remaining_time": "9:16:24", "throughput": 27249.65, "total_tokens": 5877208000} +{"current_steps": 21840, "total_steps": 25209, "loss": 0.9289, "lr": 2.8021430017362994e-05, "epoch": 2.59907621590664, "percentage": 86.64, "elapsed_time": "2 days, 11:56:15", "remaining_time": "9:14:45", "throughput": 27249.9, "total_tokens": 5879862208} +{"current_steps": 21850, "total_steps": 25209, "loss": 0.918, "lr": 2.801703056527406e-05, "epoch": 2.6002662759302924, "percentage": 86.68, "elapsed_time": "2 days, 11:57:52", "remaining_time": "9:13:06", "throughput": 27250.09, "total_tokens": 5882547968} +{"current_steps": 21860, "total_steps": 25209, "loss": 0.9135, "lr": 2.801263318471784e-05, "epoch": 2.6014563359539444, "percentage": 86.72, "elapsed_time": "2 days, 11:59:28", "remaining_time": "9:11:26", "throughput": 27250.48, "total_tokens": 5885247872} +{"current_steps": 21870, "total_steps": 25209, "loss": 0.9192, "lr": 2.800823787406917e-05, "epoch": 2.6026463959775974, "percentage": 86.75, "elapsed_time": "2 days, 12:01:05", "remaining_time": "9:09:47", "throughput": 27250.84, "total_tokens": 5887963904} +{"current_steps": 21880, "total_steps": 25209, "loss": 0.9256, "lr": 2.8003844631704678e-05, "epoch": 2.6038364560012495, "percentage": 86.79, "elapsed_time": "2 days, 12:02:40", "remaining_time": "9:08:08", "throughput": 27251.26, "total_tokens": 5890637312} +{"current_steps": 21890, "total_steps": 25209, "loss": 0.9317, "lr": 2.7999453456002755e-05, "epoch": 2.605026516024902, "percentage": 86.83, "elapsed_time": "2 days, 12:04:17", "remaining_time": "9:06:29", "throughput": 27251.38, "total_tokens": 5893318592} +{"current_steps": 21900, "total_steps": 25209, "loss": 0.9193, "lr": 2.799506434534359e-05, "epoch": 2.6062165760485545, "percentage": 86.87, "elapsed_time": "2 days, 12:05:51", "remaining_time": "9:04:49", "throughput": 27251.89, "total_tokens": 5895996224} +{"current_steps": 21910, "total_steps": 25209, "loss": 0.9143, "lr": 2.7990677298109136e-05, "epoch": 2.607406636072207, "percentage": 86.91, "elapsed_time": "2 days, 12:07:26", "remaining_time": "9:03:10", "throughput": 27252.48, "total_tokens": 5898705216} +{"current_steps": 21920, "total_steps": 25209, "loss": 0.9269, "lr": 2.7986292312683125e-05, "epoch": 2.6085966960958595, "percentage": 86.95, "elapsed_time": "2 days, 12:09:02", "remaining_time": "9:01:31", "throughput": 27252.7, "total_tokens": 5901374336} +{"current_steps": 21930, "total_steps": 25209, "loss": 0.9213, "lr": 2.798190938745106e-05, "epoch": 2.6097867561195116, "percentage": 86.99, "elapsed_time": "2 days, 12:10:36", "remaining_time": "8:59:51", "throughput": 27253.11, "total_tokens": 5904030528} +{"current_steps": 21940, "total_steps": 25209, "loss": 0.9059, "lr": 2.7977528520800218e-05, "epoch": 2.610976816143164, "percentage": 87.03, "elapsed_time": "2 days, 12:12:14", "remaining_time": "8:58:12", "throughput": 27253.3, "total_tokens": 5906737472} +{"current_steps": 21950, "total_steps": 25209, "loss": 0.9213, "lr": 2.7973149711119635e-05, "epoch": 2.6121668761668166, "percentage": 87.07, "elapsed_time": "2 days, 12:13:51", "remaining_time": "8:56:33", "throughput": 27253.52, "total_tokens": 5909434432} +{"current_steps": 21960, "total_steps": 25209, "loss": 0.9209, "lr": 2.7968772956800115e-05, "epoch": 2.613356936190469, "percentage": 87.11, "elapsed_time": "2 days, 12:15:23", "remaining_time": "8:54:54", "throughput": 27254.16, "total_tokens": 5912075264} +{"current_steps": 21970, "total_steps": 25209, "loss": 0.9198, "lr": 2.796439825623423e-05, "epoch": 2.6145469962141217, "percentage": 87.15, "elapsed_time": "2 days, 12:17:02", "remaining_time": "8:53:15", "throughput": 27254.32, "total_tokens": 5914788544} +{"current_steps": 21980, "total_steps": 25209, "loss": 0.9235, "lr": 2.79600256078163e-05, "epoch": 2.6157370562377737, "percentage": 87.19, "elapsed_time": "2 days, 12:18:40", "remaining_time": "8:51:36", "throughput": 27254.29, "total_tokens": 5917469952} +{"current_steps": 21990, "total_steps": 25209, "loss": 0.9358, "lr": 2.7955655009942416e-05, "epoch": 2.6169271162614267, "percentage": 87.23, "elapsed_time": "2 days, 12:20:27", "remaining_time": "8:49:58", "throughput": 27253.2, "total_tokens": 5920146304} +{"current_steps": 22000, "total_steps": 25209, "loss": 0.9266, "lr": 2.79512864610104e-05, "epoch": 2.618117176285079, "percentage": 87.27, "elapsed_time": "2 days, 12:22:16", "remaining_time": "8:48:21", "throughput": 27251.94, "total_tokens": 5922851264} +{"current_steps": 22010, "total_steps": 25209, "loss": 0.9247, "lr": 2.794691995941986e-05, "epoch": 2.6193072363087313, "percentage": 87.31, "elapsed_time": "2 days, 12:24:00", "remaining_time": "8:46:43", "throughput": 27251.17, "total_tokens": 5925495936} +{"current_steps": 22020, "total_steps": 25209, "loss": 0.9246, "lr": 2.7942555503572115e-05, "epoch": 2.620497296332384, "percentage": 87.35, "elapsed_time": "2 days, 12:25:42", "remaining_time": "8:45:05", "throughput": 27250.52, "total_tokens": 5928152256} +{"current_steps": 22030, "total_steps": 25209, "loss": 0.9186, "lr": 2.7938193091870268e-05, "epoch": 2.6216873563560363, "percentage": 87.39, "elapsed_time": "2 days, 12:27:26", "remaining_time": "8:43:27", "throughput": 27249.74, "total_tokens": 5930817472} +{"current_steps": 22040, "total_steps": 25209, "loss": 0.9202, "lr": 2.793383272271914e-05, "epoch": 2.622877416379689, "percentage": 87.43, "elapsed_time": "2 days, 12:29:14", "remaining_time": "8:41:49", "throughput": 27248.62, "total_tokens": 5933509248} +{"current_steps": 22050, "total_steps": 25209, "loss": 0.9265, "lr": 2.7929474394525307e-05, "epoch": 2.624067476403341, "percentage": 87.47, "elapsed_time": "2 days, 12:30:56", "remaining_time": "8:40:11", "throughput": 27247.95, "total_tokens": 5936134720} +{"current_steps": 22060, "total_steps": 25209, "loss": 0.9245, "lr": 2.7925118105697078e-05, "epoch": 2.6252575364269934, "percentage": 87.51, "elapsed_time": "2 days, 12:32:42", "remaining_time": "8:38:33", "throughput": 27247.11, "total_tokens": 5938839232} +{"current_steps": 22070, "total_steps": 25209, "loss": 0.9239, "lr": 2.792076385464451e-05, "epoch": 2.626447596450646, "percentage": 87.55, "elapsed_time": "2 days, 12:34:22", "remaining_time": "8:36:54", "throughput": 27246.71, "total_tokens": 5941498816} +{"current_steps": 22080, "total_steps": 25209, "loss": 0.9218, "lr": 2.7916411639779383e-05, "epoch": 2.6276376564742985, "percentage": 87.59, "elapsed_time": "2 days, 12:36:04", "remaining_time": "8:35:16", "throughput": 27246.29, "total_tokens": 5944178304} +{"current_steps": 22090, "total_steps": 25209, "loss": 0.9251, "lr": 2.7912061459515215e-05, "epoch": 2.628827716497951, "percentage": 87.63, "elapsed_time": "2 days, 12:37:44", "remaining_time": "8:33:37", "throughput": 27246.05, "total_tokens": 5946858560} +{"current_steps": 22100, "total_steps": 25209, "loss": 0.9264, "lr": 2.7907713312267247e-05, "epoch": 2.630017776521603, "percentage": 87.67, "elapsed_time": "2 days, 12:39:29", "remaining_time": "8:31:59", "throughput": 27245.29, "total_tokens": 5949529408} +{"current_steps": 22110, "total_steps": 25209, "loss": 0.9213, "lr": 2.7903367196452457e-05, "epoch": 2.6312078365452556, "percentage": 87.71, "elapsed_time": "2 days, 12:41:14", "remaining_time": "8:30:21", "throughput": 27244.66, "total_tokens": 5952257344} +{"current_steps": 22120, "total_steps": 25209, "loss": 0.9317, "lr": 2.7899023110489554e-05, "epoch": 2.632397896568908, "percentage": 87.75, "elapsed_time": "2 days, 12:42:59", "remaining_time": "8:28:44", "throughput": 27243.94, "total_tokens": 5954975104} +{"current_steps": 22130, "total_steps": 25209, "loss": 0.9235, "lr": 2.789468105279895e-05, "epoch": 2.6335879565925606, "percentage": 87.79, "elapsed_time": "2 days, 12:44:46", "remaining_time": "8:27:06", "throughput": 27243.3, "total_tokens": 5957743744} +{"current_steps": 22140, "total_steps": 25209, "loss": 0.9152, "lr": 2.7890341021802786e-05, "epoch": 2.634778016616213, "percentage": 87.83, "elapsed_time": "2 days, 12:46:26", "remaining_time": "8:25:27", "throughput": 27242.98, "total_tokens": 5960394880} +{"current_steps": 22150, "total_steps": 25209, "loss": 0.9246, "lr": 2.7886003015924933e-05, "epoch": 2.6359680766398657, "percentage": 87.87, "elapsed_time": "2 days, 12:48:09", "remaining_time": "8:23:49", "throughput": 27242.43, "total_tokens": 5963084608} +{"current_steps": 22160, "total_steps": 25209, "loss": 0.9217, "lr": 2.788166703359096e-05, "epoch": 2.637158136663518, "percentage": 87.91, "elapsed_time": "2 days, 12:49:55", "remaining_time": "8:22:11", "throughput": 27241.71, "total_tokens": 5965801728} +{"current_steps": 22170, "total_steps": 25209, "loss": 0.916, "lr": 2.787733307322816e-05, "epoch": 2.6383481966871702, "percentage": 87.94, "elapsed_time": "2 days, 12:51:45", "remaining_time": "8:20:34", "throughput": 27240.42, "total_tokens": 5968517952} +{"current_steps": 22180, "total_steps": 25209, "loss": 0.9065, "lr": 2.7873001133265518e-05, "epoch": 2.6395382567108228, "percentage": 87.98, "elapsed_time": "2 days, 12:53:31", "remaining_time": "8:18:56", "throughput": 27239.7, "total_tokens": 5971256640} +{"current_steps": 22190, "total_steps": 25209, "loss": 0.9237, "lr": 2.7868671212133768e-05, "epoch": 2.6407283167344753, "percentage": 88.02, "elapsed_time": "2 days, 12:55:15", "remaining_time": "8:17:18", "throughput": 27239.03, "total_tokens": 5973941632} +{"current_steps": 22200, "total_steps": 25209, "loss": 0.9315, "lr": 2.7864343308265313e-05, "epoch": 2.641918376758128, "percentage": 88.06, "elapsed_time": "2 days, 12:57:00", "remaining_time": "8:15:40", "throughput": 27238.49, "total_tokens": 5976669184} +{"current_steps": 22210, "total_steps": 25209, "loss": 0.9254, "lr": 2.7860017420094258e-05, "epoch": 2.6431084367817803, "percentage": 88.1, "elapsed_time": "2 days, 12:58:41", "remaining_time": "8:14:01", "throughput": 27238.1, "total_tokens": 5979347200} +{"current_steps": 22220, "total_steps": 25209, "loss": 0.9133, "lr": 2.7855693546056445e-05, "epoch": 2.6442984968054324, "percentage": 88.14, "elapsed_time": "2 days, 13:00:20", "remaining_time": "8:12:23", "throughput": 27238.0, "total_tokens": 5982029760} +{"current_steps": 22230, "total_steps": 25209, "loss": 0.9227, "lr": 2.785137168458937e-05, "epoch": 2.645488556829085, "percentage": 88.18, "elapsed_time": "2 days, 13:02:08", "remaining_time": "8:10:45", "throughput": 27236.92, "total_tokens": 5984726528} +{"current_steps": 22240, "total_steps": 25209, "loss": 0.9276, "lr": 2.7847051834132265e-05, "epoch": 2.6466786168527374, "percentage": 88.22, "elapsed_time": "2 days, 13:03:51", "remaining_time": "8:09:07", "throughput": 27236.25, "total_tokens": 5987397952} +{"current_steps": 22250, "total_steps": 25209, "loss": 0.9268, "lr": 2.784273399312603e-05, "epoch": 2.64786867687639, "percentage": 88.26, "elapsed_time": "2 days, 13:05:31", "remaining_time": "8:07:28", "throughput": 27235.79, "total_tokens": 5990009984} +{"current_steps": 22260, "total_steps": 25209, "loss": 0.9178, "lr": 2.783841816001326e-05, "epoch": 2.6490587369000425, "percentage": 88.3, "elapsed_time": "2 days, 13:07:12", "remaining_time": "8:05:49", "throughput": 27235.26, "total_tokens": 5992655424} +{"current_steps": 22270, "total_steps": 25209, "loss": 0.928, "lr": 2.7834104333238255e-05, "epoch": 2.650248796923695, "percentage": 88.34, "elapsed_time": "2 days, 13:08:57", "remaining_time": "8:04:11", "throughput": 27234.62, "total_tokens": 5995362176} +{"current_steps": 22280, "total_steps": 25209, "loss": 0.9298, "lr": 2.7829792511246987e-05, "epoch": 2.6514388569473475, "percentage": 88.38, "elapsed_time": "2 days, 13:10:40", "remaining_time": "8:02:33", "throughput": 27233.97, "total_tokens": 5998019904} +{"current_steps": 22290, "total_steps": 25209, "loss": 0.9228, "lr": 2.7825482692487114e-05, "epoch": 2.6526289169709996, "percentage": 88.42, "elapsed_time": "2 days, 13:12:25", "remaining_time": "8:00:55", "throughput": 27233.41, "total_tokens": 6000757760} +{"current_steps": 22300, "total_steps": 25209, "loss": 0.9251, "lr": 2.7821174875407985e-05, "epoch": 2.653818976994652, "percentage": 88.46, "elapsed_time": "2 days, 13:14:11", "remaining_time": "7:59:17", "throughput": 27232.7, "total_tokens": 6003501696} +{"current_steps": 22310, "total_steps": 25209, "loss": 0.9245, "lr": 2.781686905846062e-05, "epoch": 2.6550090370183046, "percentage": 88.5, "elapsed_time": "2 days, 13:16:01", "remaining_time": "7:57:40", "throughput": 27231.74, "total_tokens": 6006263616} +{"current_steps": 22320, "total_steps": 25209, "loss": 0.9243, "lr": 2.7812565240097716e-05, "epoch": 2.656199097041957, "percentage": 88.54, "elapsed_time": "2 days, 13:17:46", "remaining_time": "7:56:02", "throughput": 27231.17, "total_tokens": 6008994240} +{"current_steps": 22330, "total_steps": 25209, "loss": 0.9379, "lr": 2.7808263418773656e-05, "epoch": 2.6573891570656096, "percentage": 88.58, "elapsed_time": "2 days, 13:19:26", "remaining_time": "7:54:23", "throughput": 27230.96, "total_tokens": 6011672448} +{"current_steps": 22340, "total_steps": 25209, "loss": 0.9133, "lr": 2.7803963592944482e-05, "epoch": 2.6585792170892617, "percentage": 88.62, "elapsed_time": "2 days, 13:21:09", "remaining_time": "7:52:44", "throughput": 27230.39, "total_tokens": 6014357568} +{"current_steps": 22350, "total_steps": 25209, "loss": 0.9189, "lr": 2.779966576106792e-05, "epoch": 2.659769277112914, "percentage": 88.66, "elapsed_time": "2 days, 13:22:51", "remaining_time": "7:51:06", "throughput": 27230.06, "total_tokens": 6017055616} +{"current_steps": 22360, "total_steps": 25209, "loss": 0.9214, "lr": 2.779536992160336e-05, "epoch": 2.6609593371365667, "percentage": 88.7, "elapsed_time": "2 days, 13:24:39", "remaining_time": "7:49:28", "throughput": 27229.22, "total_tokens": 6019828800} +{"current_steps": 22370, "total_steps": 25209, "loss": 0.9204, "lr": 2.7791076073011845e-05, "epoch": 2.6621493971602193, "percentage": 88.74, "elapsed_time": "2 days, 13:26:21", "remaining_time": "7:47:50", "throughput": 27228.72, "total_tokens": 6022496384} +{"current_steps": 22380, "total_steps": 25209, "loss": 0.9101, "lr": 2.7786784213756102e-05, "epoch": 2.6633394571838718, "percentage": 88.78, "elapsed_time": "2 days, 13:28:05", "remaining_time": "7:46:12", "throughput": 27228.21, "total_tokens": 6025210816} +{"current_steps": 22390, "total_steps": 25209, "loss": 0.9204, "lr": 2.7782494342300502e-05, "epoch": 2.6645295172075243, "percentage": 88.82, "elapsed_time": "2 days, 13:29:48", "remaining_time": "7:44:33", "throughput": 27227.81, "total_tokens": 6027926080} +{"current_steps": 22400, "total_steps": 25209, "loss": 0.9257, "lr": 2.777820645711109e-05, "epoch": 2.665719577231177, "percentage": 88.86, "elapsed_time": "2 days, 13:31:32", "remaining_time": "7:42:55", "throughput": 27227.24, "total_tokens": 6030617984} +{"current_steps": 22410, "total_steps": 25209, "loss": 0.9249, "lr": 2.777392055665556e-05, "epoch": 2.666909637254829, "percentage": 88.9, "elapsed_time": "2 days, 13:33:11", "remaining_time": "7:41:16", "throughput": 27226.99, "total_tokens": 6033261632} +{"current_steps": 22420, "total_steps": 25209, "loss": 0.9376, "lr": 2.7769636639403252e-05, "epoch": 2.6680996972784814, "percentage": 88.94, "elapsed_time": "2 days, 13:34:51", "remaining_time": "7:39:37", "throughput": 27226.66, "total_tokens": 6035915904} +{"current_steps": 22430, "total_steps": 25209, "loss": 0.9085, "lr": 2.776535470382518e-05, "epoch": 2.669289757302134, "percentage": 88.98, "elapsed_time": "2 days, 13:36:33", "remaining_time": "7:37:59", "throughput": 27226.16, "total_tokens": 6038580288} +{"current_steps": 22440, "total_steps": 25209, "loss": 0.9201, "lr": 2.776107474839399e-05, "epoch": 2.6704798173257864, "percentage": 89.02, "elapsed_time": "2 days, 13:38:16", "remaining_time": "7:36:21", "throughput": 27225.55, "total_tokens": 6041266176} +{"current_steps": 22450, "total_steps": 25209, "loss": 0.9248, "lr": 2.7756796771583976e-05, "epoch": 2.671669877349439, "percentage": 89.06, "elapsed_time": "2 days, 13:40:05", "remaining_time": "7:34:43", "throughput": 27224.55, "total_tokens": 6044003840} +{"current_steps": 22460, "total_steps": 25209, "loss": 0.9222, "lr": 2.775252077187109e-05, "epoch": 2.672859937373091, "percentage": 89.1, "elapsed_time": "2 days, 13:41:50", "remaining_time": "7:33:05", "throughput": 27223.97, "total_tokens": 6046719232} +{"current_steps": 22470, "total_steps": 25209, "loss": 0.921, "lr": 2.7748246747732902e-05, "epoch": 2.6740499973967435, "percentage": 89.13, "elapsed_time": "2 days, 13:43:31", "remaining_time": "7:31:26", "throughput": 27223.46, "total_tokens": 6049370240} +{"current_steps": 22480, "total_steps": 25209, "loss": 0.9136, "lr": 2.774397469764866e-05, "epoch": 2.675240057420396, "percentage": 89.17, "elapsed_time": "2 days, 13:45:13", "remaining_time": "7:29:48", "throughput": 27223.0, "total_tokens": 6052038976} +{"current_steps": 22490, "total_steps": 25209, "loss": 0.9286, "lr": 2.7739704620099226e-05, "epoch": 2.6764301174440486, "percentage": 89.21, "elapsed_time": "2 days, 13:46:54", "remaining_time": "7:28:09", "throughput": 27222.64, "total_tokens": 6054720000} +{"current_steps": 22500, "total_steps": 25209, "loss": 0.9182, "lr": 2.7735436513567098e-05, "epoch": 2.677620177467701, "percentage": 89.25, "elapsed_time": "2 days, 13:48:35", "remaining_time": "7:26:30", "throughput": 27222.29, "total_tokens": 6057382080} +{"current_steps": 22510, "total_steps": 25209, "loss": 0.9355, "lr": 2.7731170376536402e-05, "epoch": 2.6788102374913536, "percentage": 89.29, "elapsed_time": "2 days, 13:50:16", "remaining_time": "7:24:52", "throughput": 27221.91, "total_tokens": 6060041472} +{"current_steps": 22520, "total_steps": 25209, "loss": 0.926, "lr": 2.7726906207492925e-05, "epoch": 2.680000297515006, "percentage": 89.33, "elapsed_time": "2 days, 13:51:59", "remaining_time": "7:23:13", "throughput": 27221.37, "total_tokens": 6062735232} +{"current_steps": 22530, "total_steps": 25209, "loss": 0.9273, "lr": 2.7722644004924048e-05, "epoch": 2.681190357538658, "percentage": 89.37, "elapsed_time": "2 days, 13:53:37", "remaining_time": "7:21:34", "throughput": 27221.29, "total_tokens": 6065374400} +{"current_steps": 22540, "total_steps": 25209, "loss": 0.9272, "lr": 2.77183837673188e-05, "epoch": 2.6823804175623107, "percentage": 89.41, "elapsed_time": "2 days, 13:55:19", "remaining_time": "7:19:56", "throughput": 27220.89, "total_tokens": 6068073792} +{"current_steps": 22550, "total_steps": 25209, "loss": 0.9299, "lr": 2.7714125493167835e-05, "epoch": 2.6835704775859632, "percentage": 89.45, "elapsed_time": "2 days, 13:57:01", "remaining_time": "7:18:17", "throughput": 27220.68, "total_tokens": 6070787904} +{"current_steps": 22560, "total_steps": 25209, "loss": 0.9449, "lr": 2.770986918096342e-05, "epoch": 2.6847605376096157, "percentage": 89.49, "elapsed_time": "2 days, 13:58:47", "remaining_time": "7:16:39", "throughput": 27219.95, "total_tokens": 6073516160} +{"current_steps": 22570, "total_steps": 25209, "loss": 0.9183, "lr": 2.7705614829199454e-05, "epoch": 2.6859505976332683, "percentage": 89.53, "elapsed_time": "2 days, 14:00:31", "remaining_time": "7:15:01", "throughput": 27219.27, "total_tokens": 6076195840} +{"current_steps": 22580, "total_steps": 25209, "loss": 0.9501, "lr": 2.7701362436371437e-05, "epoch": 2.6871406576569203, "percentage": 89.57, "elapsed_time": "2 days, 14:02:13", "remaining_time": "7:13:22", "throughput": 27218.87, "total_tokens": 6078883904} +{"current_steps": 22590, "total_steps": 25209, "loss": 0.9183, "lr": 2.7697112000976492e-05, "epoch": 2.688330717680573, "percentage": 89.61, "elapsed_time": "2 days, 14:03:53", "remaining_time": "7:11:44", "throughput": 27218.53, "total_tokens": 6081542720} +{"current_steps": 22600, "total_steps": 25209, "loss": 0.9323, "lr": 2.769286352151338e-05, "epoch": 2.6895207777042254, "percentage": 89.65, "elapsed_time": "2 days, 14:05:36", "remaining_time": "7:10:05", "throughput": 27218.2, "total_tokens": 6084260032} +{"current_steps": 22610, "total_steps": 25209, "loss": 0.9358, "lr": 2.768861699648243e-05, "epoch": 2.690710837727878, "percentage": 89.69, "elapsed_time": "2 days, 14:07:22", "remaining_time": "7:08:27", "throughput": 27217.5, "total_tokens": 6086984512} +{"current_steps": 22620, "total_steps": 25209, "loss": 0.9186, "lr": 2.7684372424385613e-05, "epoch": 2.6919008977515304, "percentage": 89.73, "elapsed_time": "2 days, 14:08:59", "remaining_time": "7:06:48", "throughput": 27217.5, "total_tokens": 6089626560} +{"current_steps": 22630, "total_steps": 25209, "loss": 0.9288, "lr": 2.7680129803726496e-05, "epoch": 2.693090957775183, "percentage": 89.77, "elapsed_time": "2 days, 14:10:40", "remaining_time": "7:05:09", "throughput": 27217.37, "total_tokens": 6092336832} +{"current_steps": 22640, "total_steps": 25209, "loss": 0.9171, "lr": 2.767588913301025e-05, "epoch": 2.6942810177988354, "percentage": 89.81, "elapsed_time": "2 days, 14:12:15", "remaining_time": "7:03:30", "throughput": 27217.57, "total_tokens": 6094992576} +{"current_steps": 22650, "total_steps": 25209, "loss": 0.9169, "lr": 2.767165041074365e-05, "epoch": 2.6954710778224875, "percentage": 89.85, "elapsed_time": "2 days, 14:13:51", "remaining_time": "7:01:51", "throughput": 27217.7, "total_tokens": 6097635840} +{"current_steps": 22660, "total_steps": 25209, "loss": 0.9299, "lr": 2.766741363543507e-05, "epoch": 2.69666113784614, "percentage": 89.89, "elapsed_time": "2 days, 14:15:35", "remaining_time": "7:00:12", "throughput": 27217.17, "total_tokens": 6100322688} +{"current_steps": 22670, "total_steps": 25209, "loss": 0.9192, "lr": 2.7663178805594482e-05, "epoch": 2.6978511978697925, "percentage": 89.93, "elapsed_time": "2 days, 14:17:13", "remaining_time": "6:58:33", "throughput": 27217.14, "total_tokens": 6103007488} +{"current_steps": 22680, "total_steps": 25209, "loss": 0.9207, "lr": 2.7658945919733463e-05, "epoch": 2.699041257893445, "percentage": 89.97, "elapsed_time": "2 days, 14:18:55", "remaining_time": "6:56:55", "throughput": 27216.81, "total_tokens": 6105693504} +{"current_steps": 22690, "total_steps": 25209, "loss": 0.9272, "lr": 2.7654714976365164e-05, "epoch": 2.7002313179170976, "percentage": 90.01, "elapsed_time": "2 days, 14:20:37", "remaining_time": "6:55:16", "throughput": 27216.31, "total_tokens": 6108371008} +{"current_steps": 22700, "total_steps": 25209, "loss": 0.9313, "lr": 2.765048597400436e-05, "epoch": 2.7014213779407497, "percentage": 90.05, "elapsed_time": "2 days, 14:22:22", "remaining_time": "6:53:38", "throughput": 27215.82, "total_tokens": 6111098496} +{"current_steps": 22710, "total_steps": 25209, "loss": 0.9338, "lr": 2.7646258911167373e-05, "epoch": 2.702611437964402, "percentage": 90.09, "elapsed_time": "2 days, 14:24:03", "remaining_time": "6:51:59", "throughput": 27215.51, "total_tokens": 6113776256} +{"current_steps": 22720, "total_steps": 25209, "loss": 0.9232, "lr": 2.7642033786372145e-05, "epoch": 2.7038014979880547, "percentage": 90.13, "elapsed_time": "2 days, 14:25:44", "remaining_time": "6:50:21", "throughput": 27215.08, "total_tokens": 6116448256} +{"current_steps": 22730, "total_steps": 25209, "loss": 0.9153, "lr": 2.7637810598138193e-05, "epoch": 2.704991558011707, "percentage": 90.17, "elapsed_time": "2 days, 14:27:26", "remaining_time": "6:48:42", "throughput": 27214.66, "total_tokens": 6119108800} +{"current_steps": 22740, "total_steps": 25209, "loss": 0.9327, "lr": 2.7633589344986615e-05, "epoch": 2.7061816180353597, "percentage": 90.21, "elapsed_time": "2 days, 14:29:11", "remaining_time": "6:47:04", "throughput": 27214.19, "total_tokens": 6121878912} +{"current_steps": 22750, "total_steps": 25209, "loss": 0.9358, "lr": 2.7629370025440087e-05, "epoch": 2.7073716780590122, "percentage": 90.25, "elapsed_time": "2 days, 14:30:51", "remaining_time": "6:45:25", "throughput": 27214.01, "total_tokens": 6124542592} +{"current_steps": 22760, "total_steps": 25209, "loss": 0.913, "lr": 2.762515263802287e-05, "epoch": 2.7085617380826648, "percentage": 90.29, "elapsed_time": "2 days, 14:32:32", "remaining_time": "6:43:46", "throughput": 27213.71, "total_tokens": 6127234624} +{"current_steps": 22770, "total_steps": 25209, "loss": 0.9214, "lr": 2.762093718126081e-05, "epoch": 2.709751798106317, "percentage": 90.32, "elapsed_time": "2 days, 14:34:13", "remaining_time": "6:42:07", "throughput": 27213.4, "total_tokens": 6129905472} +{"current_steps": 22780, "total_steps": 25209, "loss": 0.9252, "lr": 2.7616723653681298e-05, "epoch": 2.7109418581299694, "percentage": 90.36, "elapsed_time": "2 days, 14:35:55", "remaining_time": "6:40:29", "throughput": 27213.02, "total_tokens": 6132597376} +{"current_steps": 22790, "total_steps": 25209, "loss": 0.9302, "lr": 2.761251205381332e-05, "epoch": 2.712131918153622, "percentage": 90.4, "elapsed_time": "2 days, 14:37:37", "remaining_time": "6:38:50", "throughput": 27212.8, "total_tokens": 6135317696} +{"current_steps": 22800, "total_steps": 25209, "loss": 0.9321, "lr": 2.760830238018744e-05, "epoch": 2.7133219781772744, "percentage": 90.44, "elapsed_time": "2 days, 14:39:20", "remaining_time": "6:37:12", "throughput": 27212.37, "total_tokens": 6138037888} +{"current_steps": 22810, "total_steps": 25209, "loss": 0.9166, "lr": 2.760409463133576e-05, "epoch": 2.714512038200927, "percentage": 90.48, "elapsed_time": "2 days, 14:40:59", "remaining_time": "6:35:33", "throughput": 27212.22, "total_tokens": 6140687808} +{"current_steps": 22820, "total_steps": 25209, "loss": 0.9195, "lr": 2.7599888805791967e-05, "epoch": 2.715702098224579, "percentage": 90.52, "elapsed_time": "2 days, 14:42:39", "remaining_time": "6:33:54", "throughput": 27212.22, "total_tokens": 6143425280} +{"current_steps": 22830, "total_steps": 25209, "loss": 0.9196, "lr": 2.759568490209132e-05, "epoch": 2.7168921582482315, "percentage": 90.56, "elapsed_time": "2 days, 14:44:22", "remaining_time": "6:32:16", "throughput": 27211.84, "total_tokens": 6146134784} +{"current_steps": 22840, "total_steps": 25209, "loss": 0.9244, "lr": 2.7591482918770613e-05, "epoch": 2.718082218271884, "percentage": 90.6, "elapsed_time": "2 days, 14:46:08", "remaining_time": "6:30:37", "throughput": 27211.18, "total_tokens": 6148855616} +{"current_steps": 22850, "total_steps": 25209, "loss": 0.9222, "lr": 2.7587282854368222e-05, "epoch": 2.7192722782955365, "percentage": 90.64, "elapsed_time": "2 days, 14:47:45", "remaining_time": "6:28:58", "throughput": 27211.29, "total_tokens": 6151532032} +{"current_steps": 22860, "total_steps": 25209, "loss": 0.9258, "lr": 2.7583084707424072e-05, "epoch": 2.720462338319189, "percentage": 90.68, "elapsed_time": "2 days, 14:49:26", "remaining_time": "6:27:19", "throughput": 27210.96, "total_tokens": 6154215104} +{"current_steps": 22870, "total_steps": 25209, "loss": 0.9228, "lr": 2.7578888476479643e-05, "epoch": 2.7216523983428416, "percentage": 90.72, "elapsed_time": "2 days, 14:51:06", "remaining_time": "6:25:41", "throughput": 27210.7, "total_tokens": 6156863552} +{"current_steps": 22880, "total_steps": 25209, "loss": 0.9206, "lr": 2.7574694160077964e-05, "epoch": 2.722842458366494, "percentage": 90.76, "elapsed_time": "2 days, 14:52:47", "remaining_time": "6:24:02", "throughput": 27210.41, "total_tokens": 6159539904} +{"current_steps": 22890, "total_steps": 25209, "loss": 0.9212, "lr": 2.757050175676362e-05, "epoch": 2.724032518390146, "percentage": 90.8, "elapsed_time": "2 days, 14:54:27", "remaining_time": "6:22:23", "throughput": 27210.34, "total_tokens": 6162255872} +{"current_steps": 22900, "total_steps": 25209, "loss": 0.9117, "lr": 2.756631126508274e-05, "epoch": 2.7252225784137987, "percentage": 90.84, "elapsed_time": "2 days, 14:56:08", "remaining_time": "6:20:44", "throughput": 27210.13, "total_tokens": 6164956736} +{"current_steps": 22910, "total_steps": 25209, "loss": 0.9019, "lr": 2.7562122683583004e-05, "epoch": 2.726412638437451, "percentage": 90.88, "elapsed_time": "2 days, 14:57:47", "remaining_time": "6:19:05", "throughput": 27209.91, "total_tokens": 6167614656} +{"current_steps": 22920, "total_steps": 25209, "loss": 0.9094, "lr": 2.7557936010813634e-05, "epoch": 2.7276026984611037, "percentage": 90.92, "elapsed_time": "2 days, 14:59:25", "remaining_time": "6:17:26", "throughput": 27210.04, "total_tokens": 6170302016} +{"current_steps": 22930, "total_steps": 25209, "loss": 0.9296, "lr": 2.75537512453254e-05, "epoch": 2.728792758484756, "percentage": 90.96, "elapsed_time": "2 days, 15:01:05", "remaining_time": "6:15:48", "throughput": 27209.97, "total_tokens": 6172994752} +{"current_steps": 22940, "total_steps": 25209, "loss": 0.9234, "lr": 2.7549568385670595e-05, "epoch": 2.7299828185084083, "percentage": 91.0, "elapsed_time": "2 days, 15:02:46", "remaining_time": "6:14:09", "throughput": 27209.82, "total_tokens": 6175725696} +{"current_steps": 22950, "total_steps": 25209, "loss": 0.9203, "lr": 2.754538743040307e-05, "epoch": 2.731172878532061, "percentage": 91.04, "elapsed_time": "2 days, 15:04:28", "remaining_time": "6:12:30", "throughput": 27209.56, "total_tokens": 6178438784} +{"current_steps": 22960, "total_steps": 25209, "loss": 0.9164, "lr": 2.75412083780782e-05, "epoch": 2.7323629385557133, "percentage": 91.08, "elapsed_time": "2 days, 15:06:08", "remaining_time": "6:10:51", "throughput": 27209.3, "total_tokens": 6181108416} +{"current_steps": 22970, "total_steps": 25209, "loss": 0.9372, "lr": 2.7537031227252898e-05, "epoch": 2.733552998579366, "percentage": 91.12, "elapsed_time": "2 days, 15:07:48", "remaining_time": "6:09:13", "throughput": 27209.06, "total_tokens": 6183767872} +{"current_steps": 22980, "total_steps": 25209, "loss": 0.9273, "lr": 2.75328559764856e-05, "epoch": 2.7347430586030184, "percentage": 91.16, "elapsed_time": "2 days, 15:09:30", "remaining_time": "6:07:34", "throughput": 27208.82, "total_tokens": 6186477760} +{"current_steps": 22990, "total_steps": 25209, "loss": 0.9311, "lr": 2.752868262433629e-05, "epoch": 2.735933118626671, "percentage": 91.2, "elapsed_time": "2 days, 15:11:13", "remaining_time": "6:05:55", "throughput": 27208.45, "total_tokens": 6189212160} +{"current_steps": 23000, "total_steps": 25209, "loss": 0.9202, "lr": 2.752451116936646e-05, "epoch": 2.7371231786503234, "percentage": 91.24, "elapsed_time": "2 days, 15:12:55", "remaining_time": "6:04:17", "throughput": 27208.14, "total_tokens": 6191914432} +{"current_steps": 23010, "total_steps": 25209, "loss": 0.927, "lr": 2.752034161013915e-05, "epoch": 2.7383132386739755, "percentage": 91.28, "elapsed_time": "2 days, 15:14:33", "remaining_time": "6:02:38", "throughput": 27208.18, "total_tokens": 6194573056} +{"current_steps": 23020, "total_steps": 25209, "loss": 0.9133, "lr": 2.7516173945218888e-05, "epoch": 2.739503298697628, "percentage": 91.32, "elapsed_time": "2 days, 15:16:13", "remaining_time": "6:00:59", "throughput": 27208.09, "total_tokens": 6197271680} +{"current_steps": 23030, "total_steps": 25209, "loss": 0.9363, "lr": 2.751200817317176e-05, "epoch": 2.7406933587212805, "percentage": 91.36, "elapsed_time": "2 days, 15:17:54", "remaining_time": "5:59:20", "throughput": 27208.02, "total_tokens": 6200004544} +{"current_steps": 23040, "total_steps": 25209, "loss": 0.9193, "lr": 2.7507844292565354e-05, "epoch": 2.741883418744933, "percentage": 91.4, "elapsed_time": "2 days, 15:19:35", "remaining_time": "5:57:41", "throughput": 27207.85, "total_tokens": 6202712320} +{"current_steps": 23050, "total_steps": 25209, "loss": 0.9164, "lr": 2.7503682301968763e-05, "epoch": 2.7430734787685855, "percentage": 91.44, "elapsed_time": "2 days, 15:21:19", "remaining_time": "5:56:03", "throughput": 27207.37, "total_tokens": 6205440000} +{"current_steps": 23060, "total_steps": 25209, "loss": 0.9218, "lr": 2.7499522199952627e-05, "epoch": 2.7442635387922376, "percentage": 91.48, "elapsed_time": "2 days, 15:23:01", "remaining_time": "5:54:24", "throughput": 27207.13, "total_tokens": 6208166528} +{"current_steps": 23070, "total_steps": 25209, "loss": 0.9219, "lr": 2.7495363985089072e-05, "epoch": 2.74545359881589, "percentage": 91.51, "elapsed_time": "2 days, 15:24:44", "remaining_time": "5:52:46", "throughput": 27206.9, "total_tokens": 6210921024} +{"current_steps": 23080, "total_steps": 25209, "loss": 0.9243, "lr": 2.7491207655951745e-05, "epoch": 2.7466436588395426, "percentage": 91.55, "elapsed_time": "2 days, 15:26:27", "remaining_time": "5:51:07", "throughput": 27206.47, "total_tokens": 6213629824} +{"current_steps": 23090, "total_steps": 25209, "loss": 0.924, "lr": 2.7487053211115797e-05, "epoch": 2.747833718863195, "percentage": 91.59, "elapsed_time": "2 days, 15:28:10", "remaining_time": "5:49:28", "throughput": 27206.16, "total_tokens": 6216343488} +{"current_steps": 23100, "total_steps": 25209, "loss": 0.9244, "lr": 2.748290064915789e-05, "epoch": 2.7490237788868477, "percentage": 91.63, "elapsed_time": "2 days, 15:29:45", "remaining_time": "5:47:49", "throughput": 27206.2, "total_tokens": 6218951040} +{"current_steps": 23110, "total_steps": 25209, "loss": 0.9238, "lr": 2.747874996865619e-05, "epoch": 2.7502138389105, "percentage": 91.67, "elapsed_time": "2 days, 15:31:25", "remaining_time": "5:46:10", "throughput": 27205.98, "total_tokens": 6221622272} +{"current_steps": 23120, "total_steps": 25209, "loss": 0.9194, "lr": 2.747460116819037e-05, "epoch": 2.7514038989341527, "percentage": 91.71, "elapsed_time": "2 days, 15:33:03", "remaining_time": "5:44:31", "throughput": 27206.16, "total_tokens": 6224323904} +{"current_steps": 23130, "total_steps": 25209, "loss": 0.931, "lr": 2.7470454246341597e-05, "epoch": 2.752593958957805, "percentage": 91.75, "elapsed_time": "2 days, 15:34:48", "remaining_time": "5:42:53", "throughput": 27205.74, "total_tokens": 6227075584} +{"current_steps": 23140, "total_steps": 25209, "loss": 0.9228, "lr": 2.746630920169254e-05, "epoch": 2.7537840189814573, "percentage": 91.79, "elapsed_time": "2 days, 15:36:30", "remaining_time": "5:41:14", "throughput": 27205.48, "total_tokens": 6229792960} +{"current_steps": 23150, "total_steps": 25209, "loss": 0.925, "lr": 2.7462166032827358e-05, "epoch": 2.75497407900511, "percentage": 91.83, "elapsed_time": "2 days, 15:38:10", "remaining_time": "5:39:35", "throughput": 27205.45, "total_tokens": 6232498176} +{"current_steps": 23160, "total_steps": 25209, "loss": 0.9121, "lr": 2.745802473833171e-05, "epoch": 2.7561641390287623, "percentage": 91.87, "elapsed_time": "2 days, 15:39:53", "remaining_time": "5:37:57", "throughput": 27205.1, "total_tokens": 6235226816} +{"current_steps": 23170, "total_steps": 25209, "loss": 0.9374, "lr": 2.7453885316792755e-05, "epoch": 2.757354199052415, "percentage": 91.91, "elapsed_time": "2 days, 15:41:35", "remaining_time": "5:36:18", "throughput": 27204.86, "total_tokens": 6237940096} +{"current_steps": 23180, "total_steps": 25209, "loss": 0.9234, "lr": 2.7449747766799135e-05, "epoch": 2.758544259076067, "percentage": 91.95, "elapsed_time": "2 days, 15:43:12", "remaining_time": "5:34:39", "throughput": 27205.06, "total_tokens": 6240634752} +{"current_steps": 23190, "total_steps": 25209, "loss": 0.9305, "lr": 2.744561208694097e-05, "epoch": 2.7597343190997194, "percentage": 91.99, "elapsed_time": "2 days, 15:44:58", "remaining_time": "5:33:00", "throughput": 27204.53, "total_tokens": 6243386048} +{"current_steps": 23200, "total_steps": 25209, "loss": 0.9105, "lr": 2.7441478275809884e-05, "epoch": 2.760924379123372, "percentage": 92.03, "elapsed_time": "2 days, 15:46:36", "remaining_time": "5:31:21", "throughput": 27204.47, "total_tokens": 6246053440} +{"current_steps": 23210, "total_steps": 25209, "loss": 0.9254, "lr": 2.743734633199898e-05, "epoch": 2.7621144391470245, "percentage": 92.07, "elapsed_time": "2 days, 15:48:17", "remaining_time": "5:29:43", "throughput": 27204.19, "total_tokens": 6248730752} +{"current_steps": 23220, "total_steps": 25209, "loss": 0.9077, "lr": 2.743321625410284e-05, "epoch": 2.763304499170677, "percentage": 92.11, "elapsed_time": "2 days, 15:49:56", "remaining_time": "5:28:04", "throughput": 27203.97, "total_tokens": 6251382848} +{"current_steps": 23230, "total_steps": 25209, "loss": 0.9195, "lr": 2.7429088040717526e-05, "epoch": 2.7644945591943295, "percentage": 92.15, "elapsed_time": "2 days, 15:51:34", "remaining_time": "5:26:25", "throughput": 27204.09, "total_tokens": 6254066240} +{"current_steps": 23240, "total_steps": 25209, "loss": 0.916, "lr": 2.7424961690440586e-05, "epoch": 2.765684619217982, "percentage": 92.19, "elapsed_time": "2 days, 15:53:20", "remaining_time": "5:24:46", "throughput": 27203.63, "total_tokens": 6256845056} +{"current_steps": 23250, "total_steps": 25209, "loss": 0.9144, "lr": 2.742083720187103e-05, "epoch": 2.766874679241634, "percentage": 92.23, "elapsed_time": "2 days, 15:55:00", "remaining_time": "5:23:07", "throughput": 27203.53, "total_tokens": 6259549952} +{"current_steps": 23260, "total_steps": 25209, "loss": 0.9246, "lr": 2.7416714573609363e-05, "epoch": 2.7680647392652866, "percentage": 92.27, "elapsed_time": "2 days, 15:56:40", "remaining_time": "5:21:28", "throughput": 27203.46, "total_tokens": 6262241344} +{"current_steps": 23270, "total_steps": 25209, "loss": 0.9225, "lr": 2.7412593804257543e-05, "epoch": 2.769254799288939, "percentage": 92.31, "elapsed_time": "2 days, 15:58:20", "remaining_time": "5:19:50", "throughput": 27203.27, "total_tokens": 6264921920} +{"current_steps": 23280, "total_steps": 25209, "loss": 0.9065, "lr": 2.740847489241901e-05, "epoch": 2.7704448593125917, "percentage": 92.35, "elapsed_time": "2 days, 16:00:02", "remaining_time": "5:18:11", "throughput": 27203.08, "total_tokens": 6267667840} +{"current_steps": 23290, "total_steps": 25209, "loss": 0.9291, "lr": 2.7404357836698668e-05, "epoch": 2.771634919336244, "percentage": 92.39, "elapsed_time": "2 days, 16:01:42", "remaining_time": "5:16:32", "throughput": 27202.92, "total_tokens": 6270350592} +{"current_steps": 23300, "total_steps": 25209, "loss": 0.9289, "lr": 2.740024263570289e-05, "epoch": 2.7728249793598962, "percentage": 92.43, "elapsed_time": "2 days, 16:03:26", "remaining_time": "5:14:53", "throughput": 27202.53, "total_tokens": 6273079168} +{"current_steps": 23310, "total_steps": 25209, "loss": 0.9356, "lr": 2.7396129288039503e-05, "epoch": 2.7740150393835488, "percentage": 92.47, "elapsed_time": "2 days, 16:05:04", "remaining_time": "5:13:14", "throughput": 27202.51, "total_tokens": 6275736256} +{"current_steps": 23320, "total_steps": 25209, "loss": 0.9168, "lr": 2.739201779231782e-05, "epoch": 2.7752050994072013, "percentage": 92.51, "elapsed_time": "2 days, 16:06:47", "remaining_time": "5:11:36", "throughput": 27202.14, "total_tokens": 6278445632} +{"current_steps": 23330, "total_steps": 25209, "loss": 0.9178, "lr": 2.7387908147148587e-05, "epoch": 2.776395159430854, "percentage": 92.55, "elapsed_time": "2 days, 16:08:30", "remaining_time": "5:09:57", "throughput": 27201.81, "total_tokens": 6281189440} +{"current_steps": 23340, "total_steps": 25209, "loss": 0.9204, "lr": 2.7383800351144027e-05, "epoch": 2.7775852194545063, "percentage": 92.59, "elapsed_time": "2 days, 16:10:09", "remaining_time": "5:08:18", "throughput": 27201.89, "total_tokens": 6283883072} +{"current_steps": 23350, "total_steps": 25209, "loss": 0.9148, "lr": 2.737969440291782e-05, "epoch": 2.778775279478159, "percentage": 92.63, "elapsed_time": "2 days, 16:11:48", "remaining_time": "5:06:39", "throughput": 27201.95, "total_tokens": 6286598208} +{"current_steps": 23360, "total_steps": 25209, "loss": 0.9226, "lr": 2.7375590301085087e-05, "epoch": 2.7799653395018113, "percentage": 92.67, "elapsed_time": "2 days, 16:13:30", "remaining_time": "5:05:00", "throughput": 27201.73, "total_tokens": 6289313920} +{"current_steps": 23370, "total_steps": 25209, "loss": 0.9287, "lr": 2.7371488044262406e-05, "epoch": 2.7811553995254634, "percentage": 92.7, "elapsed_time": "2 days, 16:15:06", "remaining_time": "5:03:21", "throughput": 27201.95, "total_tokens": 6291993216} +{"current_steps": 23380, "total_steps": 25209, "loss": 0.9257, "lr": 2.7367387631067816e-05, "epoch": 2.782345459549116, "percentage": 92.74, "elapsed_time": "2 days, 16:16:43", "remaining_time": "5:01:42", "throughput": 27201.86, "total_tokens": 6294601280} +{"current_steps": 23390, "total_steps": 25209, "loss": 0.9291, "lr": 2.73632890601208e-05, "epoch": 2.7835355195727685, "percentage": 92.78, "elapsed_time": "2 days, 16:18:22", "remaining_time": "5:00:03", "throughput": 27201.54, "total_tokens": 6297237888} +{"current_steps": 23400, "total_steps": 25209, "loss": 0.916, "lr": 2.7359192330042277e-05, "epoch": 2.784725579596421, "percentage": 92.82, "elapsed_time": "2 days, 16:20:03", "remaining_time": "4:58:24", "throughput": 27201.38, "total_tokens": 6299935424} +{"current_steps": 23410, "total_steps": 25209, "loss": 0.9151, "lr": 2.7355097439454625e-05, "epoch": 2.7859156396200735, "percentage": 92.86, "elapsed_time": "2 days, 16:21:42", "remaining_time": "4:56:45", "throughput": 27201.4, "total_tokens": 6302643200} +{"current_steps": 23420, "total_steps": 25209, "loss": 0.9115, "lr": 2.735100438698166e-05, "epoch": 2.7871056996437256, "percentage": 92.9, "elapsed_time": "2 days, 16:23:23", "remaining_time": "4:55:06", "throughput": 27201.22, "total_tokens": 6305345856} +{"current_steps": 23430, "total_steps": 25209, "loss": 0.9252, "lr": 2.7346913171248635e-05, "epoch": 2.788295759667378, "percentage": 92.94, "elapsed_time": "2 days, 16:25:03", "remaining_time": "4:53:28", "throughput": 27201.2, "total_tokens": 6308044352} +{"current_steps": 23440, "total_steps": 25209, "loss": 0.9195, "lr": 2.734282379088225e-05, "epoch": 2.7894858196910306, "percentage": 92.98, "elapsed_time": "2 days, 16:26:40", "remaining_time": "4:51:48", "throughput": 27201.2, "total_tokens": 6310685568} +{"current_steps": 23450, "total_steps": 25209, "loss": 0.9127, "lr": 2.733873624451063e-05, "epoch": 2.790675879714683, "percentage": 93.02, "elapsed_time": "2 days, 16:28:16", "remaining_time": "4:50:09", "throughput": 27201.43, "total_tokens": 6313351424} +{"current_steps": 23460, "total_steps": 25209, "loss": 0.9284, "lr": 2.733465053076335e-05, "epoch": 2.7918659397383356, "percentage": 93.06, "elapsed_time": "2 days, 16:29:56", "remaining_time": "4:48:30", "throughput": 27201.15, "total_tokens": 6316021312} +{"current_steps": 23470, "total_steps": 25209, "loss": 0.9268, "lr": 2.733056664827141e-05, "epoch": 2.793055999761988, "percentage": 93.1, "elapsed_time": "2 days, 16:31:40", "remaining_time": "4:46:52", "throughput": 27200.71, "total_tokens": 6318750592} +{"current_steps": 23480, "total_steps": 25209, "loss": 0.9176, "lr": 2.732648459566724e-05, "epoch": 2.7942460597856407, "percentage": 93.14, "elapsed_time": "2 days, 16:33:21", "remaining_time": "4:45:13", "throughput": 27200.72, "total_tokens": 6321475328} +{"current_steps": 23490, "total_steps": 25209, "loss": 0.9136, "lr": 2.73224043715847e-05, "epoch": 2.7954361198092927, "percentage": 93.18, "elapsed_time": "2 days, 16:34:59", "remaining_time": "4:43:34", "throughput": 27200.84, "total_tokens": 6324178176} +{"current_steps": 23500, "total_steps": 25209, "loss": 0.9306, "lr": 2.731832597465908e-05, "epoch": 2.7966261798329453, "percentage": 93.22, "elapsed_time": "2 days, 16:36:41", "remaining_time": "4:41:55", "throughput": 27200.43, "total_tokens": 6326861120} +{"current_steps": 23510, "total_steps": 25209, "loss": 0.9402, "lr": 2.7314249403527097e-05, "epoch": 2.7978162398565978, "percentage": 93.26, "elapsed_time": "2 days, 16:38:25", "remaining_time": "4:40:16", "throughput": 27199.99, "total_tokens": 6329585152} +{"current_steps": 23520, "total_steps": 25209, "loss": 0.9236, "lr": 2.731017465682689e-05, "epoch": 2.7990062998802503, "percentage": 93.3, "elapsed_time": "2 days, 16:40:08", "remaining_time": "4:38:38", "throughput": 27199.77, "total_tokens": 6332339648} +{"current_steps": 23530, "total_steps": 25209, "loss": 0.9267, "lr": 2.730610173319802e-05, "epoch": 2.800196359903903, "percentage": 93.34, "elapsed_time": "2 days, 16:41:49", "remaining_time": "4:36:59", "throughput": 27199.52, "total_tokens": 6335032896} +{"current_steps": 23540, "total_steps": 25209, "loss": 0.9169, "lr": 2.7302030631281454e-05, "epoch": 2.801386419927555, "percentage": 93.38, "elapsed_time": "2 days, 16:43:26", "remaining_time": "4:35:20", "throughput": 27199.62, "total_tokens": 6337693760} +{"current_steps": 23550, "total_steps": 25209, "loss": 0.9179, "lr": 2.7297961349719608e-05, "epoch": 2.8025764799512074, "percentage": 93.42, "elapsed_time": "2 days, 16:45:05", "remaining_time": "4:33:41", "throughput": 27199.69, "total_tokens": 6340404480} +{"current_steps": 23560, "total_steps": 25209, "loss": 0.9346, "lr": 2.729389388715628e-05, "epoch": 2.80376653997486, "percentage": 93.46, "elapsed_time": "2 days, 16:46:45", "remaining_time": "4:32:02", "throughput": 27199.7, "total_tokens": 6343124864} +{"current_steps": 23570, "total_steps": 25209, "loss": 0.9362, "lr": 2.728982824223671e-05, "epoch": 2.8049565999985124, "percentage": 93.5, "elapsed_time": "2 days, 16:48:22", "remaining_time": "4:30:23", "throughput": 27199.83, "total_tokens": 6345794816} +{"current_steps": 23580, "total_steps": 25209, "loss": 0.9064, "lr": 2.7285764413607527e-05, "epoch": 2.806146660022165, "percentage": 93.54, "elapsed_time": "2 days, 16:49:56", "remaining_time": "4:28:43", "throughput": 27200.29, "total_tokens": 6348450368} +{"current_steps": 23590, "total_steps": 25209, "loss": 0.9225, "lr": 2.7281702399916786e-05, "epoch": 2.8073367200458175, "percentage": 93.58, "elapsed_time": "2 days, 16:51:30", "remaining_time": "4:27:04", "throughput": 27200.61, "total_tokens": 6351079104} +{"current_steps": 23600, "total_steps": 25209, "loss": 0.9358, "lr": 2.7277642199813954e-05, "epoch": 2.80852678006947, "percentage": 93.62, "elapsed_time": "2 days, 16:53:07", "remaining_time": "4:25:25", "throughput": 27200.62, "total_tokens": 6353726336} +{"current_steps": 23610, "total_steps": 25209, "loss": 0.9237, "lr": 2.7273583811949882e-05, "epoch": 2.809716840093122, "percentage": 93.66, "elapsed_time": "2 days, 16:54:43", "remaining_time": "4:23:46", "throughput": 27200.85, "total_tokens": 6356391488} +{"current_steps": 23620, "total_steps": 25209, "loss": 0.9322, "lr": 2.7269527234976844e-05, "epoch": 2.8109069001167746, "percentage": 93.7, "elapsed_time": "2 days, 16:56:18", "remaining_time": "4:22:07", "throughput": 27201.21, "total_tokens": 6359070720} +{"current_steps": 23630, "total_steps": 25209, "loss": 0.9268, "lr": 2.726547246754852e-05, "epoch": 2.812096960140427, "percentage": 93.74, "elapsed_time": "2 days, 16:57:57", "remaining_time": "4:20:28", "throughput": 27201.33, "total_tokens": 6361787776} +{"current_steps": 23640, "total_steps": 25209, "loss": 0.9139, "lr": 2.726141950831998e-05, "epoch": 2.8132870201640796, "percentage": 93.78, "elapsed_time": "2 days, 16:59:35", "remaining_time": "4:18:49", "throughput": 27201.46, "total_tokens": 6364467712} +{"current_steps": 23650, "total_steps": 25209, "loss": 0.9079, "lr": 2.7257368355947686e-05, "epoch": 2.814477080187732, "percentage": 93.82, "elapsed_time": "2 days, 17:01:13", "remaining_time": "4:17:10", "throughput": 27201.52, "total_tokens": 6367161088} +{"current_steps": 23660, "total_steps": 25209, "loss": 0.9237, "lr": 2.7253319009089528e-05, "epoch": 2.815667140211384, "percentage": 93.86, "elapsed_time": "2 days, 17:02:51", "remaining_time": "4:15:31", "throughput": 27201.63, "total_tokens": 6369859456} +{"current_steps": 23670, "total_steps": 25209, "loss": 0.9241, "lr": 2.7249271466404758e-05, "epoch": 2.8168572002350367, "percentage": 93.9, "elapsed_time": "2 days, 17:04:32", "remaining_time": "4:13:52", "throughput": 27201.6, "total_tokens": 6372572672} +{"current_steps": 23680, "total_steps": 25209, "loss": 0.9212, "lr": 2.724522572655403e-05, "epoch": 2.8180472602586892, "percentage": 93.93, "elapsed_time": "2 days, 17:06:10", "remaining_time": "4:12:13", "throughput": 27201.75, "total_tokens": 6375295936} +{"current_steps": 23690, "total_steps": 25209, "loss": 0.9262, "lr": 2.7241181788199405e-05, "epoch": 2.8192373202823418, "percentage": 93.97, "elapsed_time": "2 days, 17:07:49", "remaining_time": "4:10:34", "throughput": 27201.72, "total_tokens": 6377971840} +{"current_steps": 23700, "total_steps": 25209, "loss": 0.921, "lr": 2.7237139650004316e-05, "epoch": 2.8204273803059943, "percentage": 94.01, "elapsed_time": "2 days, 17:09:29", "remaining_time": "4:08:55", "throughput": 27201.59, "total_tokens": 6380667776} +{"current_steps": 23710, "total_steps": 25209, "loss": 0.9234, "lr": 2.7233099310633598e-05, "epoch": 2.821617440329647, "percentage": 94.05, "elapsed_time": "2 days, 17:11:07", "remaining_time": "4:07:16", "throughput": 27201.82, "total_tokens": 6383371136} +{"current_steps": 23720, "total_steps": 25209, "loss": 0.9168, "lr": 2.722906076875345e-05, "epoch": 2.8228075003532993, "percentage": 94.09, "elapsed_time": "2 days, 17:12:46", "remaining_time": "4:05:37", "throughput": 27201.81, "total_tokens": 6386087744} +{"current_steps": 23730, "total_steps": 25209, "loss": 0.9279, "lr": 2.7225024023031487e-05, "epoch": 2.8239975603769514, "percentage": 94.13, "elapsed_time": "2 days, 17:14:27", "remaining_time": "4:03:58", "throughput": 27201.75, "total_tokens": 6388804352} +{"current_steps": 23740, "total_steps": 25209, "loss": 0.9165, "lr": 2.7220989072136676e-05, "epoch": 2.825187620400604, "percentage": 94.17, "elapsed_time": "2 days, 17:16:08", "remaining_time": "4:02:19", "throughput": 27201.51, "total_tokens": 6391505920} +{"current_steps": 23750, "total_steps": 25209, "loss": 0.9217, "lr": 2.7216955914739385e-05, "epoch": 2.8263776804242564, "percentage": 94.21, "elapsed_time": "2 days, 17:17:47", "remaining_time": "4:00:40", "throughput": 27201.45, "total_tokens": 6394171136} +{"current_steps": 23760, "total_steps": 25209, "loss": 0.9215, "lr": 2.7212924549511348e-05, "epoch": 2.827567740447909, "percentage": 94.25, "elapsed_time": "2 days, 17:19:26", "remaining_time": "3:59:01", "throughput": 27201.41, "total_tokens": 6396861760} +{"current_steps": 23770, "total_steps": 25209, "loss": 0.9102, "lr": 2.7208894975125688e-05, "epoch": 2.8287578004715614, "percentage": 94.29, "elapsed_time": "2 days, 17:21:05", "remaining_time": "3:57:22", "throughput": 27201.48, "total_tokens": 6399556608} +{"current_steps": 23780, "total_steps": 25209, "loss": 0.9191, "lr": 2.720486719025689e-05, "epoch": 2.8299478604952135, "percentage": 94.33, "elapsed_time": "2 days, 17:22:48", "remaining_time": "3:55:43", "throughput": 27201.3, "total_tokens": 6402340096} +{"current_steps": 23790, "total_steps": 25209, "loss": 0.9236, "lr": 2.7200841193580816e-05, "epoch": 2.831137920518866, "percentage": 94.37, "elapsed_time": "2 days, 17:24:28", "remaining_time": "3:54:04", "throughput": 27201.16, "total_tokens": 6405027776} +{"current_steps": 23800, "total_steps": 25209, "loss": 0.9219, "lr": 2.7196816983774708e-05, "epoch": 2.8323279805425186, "percentage": 94.41, "elapsed_time": "2 days, 17:26:12", "remaining_time": "3:52:26", "throughput": 27200.96, "total_tokens": 6407789760} +{"current_steps": 23810, "total_steps": 25209, "loss": 0.9281, "lr": 2.7192794559517166e-05, "epoch": 2.833518040566171, "percentage": 94.45, "elapsed_time": "2 days, 17:27:54", "remaining_time": "3:50:47", "throughput": 27200.69, "total_tokens": 6410503552} +{"current_steps": 23820, "total_steps": 25209, "loss": 0.9317, "lr": 2.7188773919488165e-05, "epoch": 2.8347081005898236, "percentage": 94.49, "elapsed_time": "2 days, 17:29:34", "remaining_time": "3:49:08", "throughput": 27200.59, "total_tokens": 6413207040} +{"current_steps": 23830, "total_steps": 25209, "loss": 0.925, "lr": 2.7184755062369043e-05, "epoch": 2.835898160613476, "percentage": 94.53, "elapsed_time": "2 days, 17:31:09", "remaining_time": "3:47:29", "throughput": 27201.04, "total_tokens": 6415883328} +{"current_steps": 23840, "total_steps": 25209, "loss": 0.9177, "lr": 2.7180737986842498e-05, "epoch": 2.8370882206371286, "percentage": 94.57, "elapsed_time": "2 days, 17:32:43", "remaining_time": "3:45:50", "throughput": 27201.18, "total_tokens": 6418487616} +{"current_steps": 23850, "total_steps": 25209, "loss": 0.9144, "lr": 2.71767226915926e-05, "epoch": 2.8382782806607807, "percentage": 94.61, "elapsed_time": "2 days, 17:34:25", "remaining_time": "3:44:11", "throughput": 27200.86, "total_tokens": 6421194240} +{"current_steps": 23860, "total_steps": 25209, "loss": 0.9093, "lr": 2.7172709175304767e-05, "epoch": 2.839468340684433, "percentage": 94.65, "elapsed_time": "2 days, 17:36:04", "remaining_time": "3:42:32", "throughput": 27200.9, "total_tokens": 6423883776} +{"current_steps": 23870, "total_steps": 25209, "loss": 0.9217, "lr": 2.716869743666579e-05, "epoch": 2.8406584007080857, "percentage": 94.69, "elapsed_time": "2 days, 17:37:44", "remaining_time": "3:40:53", "throughput": 27200.85, "total_tokens": 6426590464} +{"current_steps": 23880, "total_steps": 25209, "loss": 0.9184, "lr": 2.7164687474363803e-05, "epoch": 2.8418484607317382, "percentage": 94.73, "elapsed_time": "2 days, 17:39:22", "remaining_time": "3:39:14", "throughput": 27200.78, "total_tokens": 6429254784} +{"current_steps": 23890, "total_steps": 25209, "loss": 0.9214, "lr": 2.7160679287088307e-05, "epoch": 2.8430385207553908, "percentage": 94.77, "elapsed_time": "2 days, 17:41:02", "remaining_time": "3:37:35", "throughput": 27201.01, "total_tokens": 6432010880} +{"current_steps": 23900, "total_steps": 25209, "loss": 0.9314, "lr": 2.7156672873530147e-05, "epoch": 2.844228580779043, "percentage": 94.81, "elapsed_time": "2 days, 17:42:40", "remaining_time": "3:35:56", "throughput": 27201.02, "total_tokens": 6434674368} +{"current_steps": 23910, "total_steps": 25209, "loss": 0.9306, "lr": 2.715266823238152e-05, "epoch": 2.8454186408026954, "percentage": 94.85, "elapsed_time": "2 days, 17:44:15", "remaining_time": "3:34:17", "throughput": 27201.35, "total_tokens": 6437355776} +{"current_steps": 23920, "total_steps": 25209, "loss": 0.926, "lr": 2.714866536233598e-05, "epoch": 2.846608700826348, "percentage": 94.89, "elapsed_time": "2 days, 17:45:55", "remaining_time": "3:32:38", "throughput": 27201.26, "total_tokens": 6440034688} +{"current_steps": 23930, "total_steps": 25209, "loss": 0.9211, "lr": 2.7144664262088422e-05, "epoch": 2.8477987608500004, "percentage": 94.93, "elapsed_time": "2 days, 17:47:34", "remaining_time": "3:30:59", "throughput": 27201.18, "total_tokens": 6442724608} +{"current_steps": 23940, "total_steps": 25209, "loss": 0.9186, "lr": 2.7140664930335084e-05, "epoch": 2.848988820873653, "percentage": 94.97, "elapsed_time": "2 days, 17:49:19", "remaining_time": "3:29:20", "throughput": 27200.74, "total_tokens": 6445470976} +{"current_steps": 23950, "total_steps": 25209, "loss": 0.92, "lr": 2.713666736577356e-05, "epoch": 2.8501788808973054, "percentage": 95.01, "elapsed_time": "2 days, 17:50:57", "remaining_time": "3:27:41", "throughput": 27200.93, "total_tokens": 6448181248} +{"current_steps": 23960, "total_steps": 25209, "loss": 0.9122, "lr": 2.713267156710278e-05, "epoch": 2.851368940920958, "percentage": 95.05, "elapsed_time": "2 days, 17:52:39", "remaining_time": "3:26:02", "throughput": 27200.61, "total_tokens": 6450891840} +{"current_steps": 23970, "total_steps": 25209, "loss": 0.9271, "lr": 2.712867753302301e-05, "epoch": 2.85255900094461, "percentage": 95.09, "elapsed_time": "2 days, 17:54:18", "remaining_time": "3:24:23", "throughput": 27200.51, "total_tokens": 6453564160} +{"current_steps": 23980, "total_steps": 25209, "loss": 0.9351, "lr": 2.7124685262235865e-05, "epoch": 2.8537490609682625, "percentage": 95.12, "elapsed_time": "2 days, 17:55:59", "remaining_time": "3:22:44", "throughput": 27200.23, "total_tokens": 6456239552} +{"current_steps": 23990, "total_steps": 25209, "loss": 0.9237, "lr": 2.7120694753444287e-05, "epoch": 2.854939120991915, "percentage": 95.16, "elapsed_time": "2 days, 17:57:35", "remaining_time": "3:21:05", "throughput": 27200.43, "total_tokens": 6458904832} +{"current_steps": 24000, "total_steps": 25209, "loss": 0.9186, "lr": 2.7116706005352547e-05, "epoch": 2.8561291810155676, "percentage": 95.2, "elapsed_time": "2 days, 17:59:09", "remaining_time": "3:19:26", "throughput": 27200.88, "total_tokens": 6461554944} +{"current_steps": 24010, "total_steps": 25209, "loss": 0.9285, "lr": 2.7112719016666282e-05, "epoch": 2.85731924103922, "percentage": 95.24, "elapsed_time": "2 days, 18:00:46", "remaining_time": "3:17:47", "throughput": 27201.26, "total_tokens": 6464269952} +{"current_steps": 24020, "total_steps": 25209, "loss": 0.9319, "lr": 2.7108733786092427e-05, "epoch": 2.858509301062872, "percentage": 95.28, "elapsed_time": "2 days, 18:02:31", "remaining_time": "3:16:08", "throughput": 27200.78, "total_tokens": 6467038464} +{"current_steps": 24030, "total_steps": 25209, "loss": 0.9081, "lr": 2.7104750312339254e-05, "epoch": 2.8596993610865247, "percentage": 95.32, "elapsed_time": "2 days, 18:04:15", "remaining_time": "3:14:30", "throughput": 27200.48, "total_tokens": 6469772224} +{"current_steps": 24040, "total_steps": 25209, "loss": 0.9216, "lr": 2.7100768594116382e-05, "epoch": 2.860889421110177, "percentage": 95.36, "elapsed_time": "2 days, 18:05:49", "remaining_time": "3:12:50", "throughput": 27200.89, "total_tokens": 6472450112} +{"current_steps": 24050, "total_steps": 25209, "loss": 0.9256, "lr": 2.709678863013473e-05, "epoch": 2.8620794811338297, "percentage": 95.4, "elapsed_time": "2 days, 18:07:28", "remaining_time": "3:11:11", "throughput": 27200.96, "total_tokens": 6475155456} +{"current_steps": 24060, "total_steps": 25209, "loss": 0.9242, "lr": 2.7092810419106562e-05, "epoch": 2.8632695411574822, "percentage": 95.44, "elapsed_time": "2 days, 18:09:04", "remaining_time": "3:09:32", "throughput": 27201.23, "total_tokens": 6477817024} +{"current_steps": 24070, "total_steps": 25209, "loss": 0.925, "lr": 2.7088833959745457e-05, "epoch": 2.8644596011811343, "percentage": 95.48, "elapsed_time": "2 days, 18:10:39", "remaining_time": "3:07:53", "throughput": 27201.51, "total_tokens": 6480480512} +{"current_steps": 24080, "total_steps": 25209, "loss": 0.9093, "lr": 2.708485925076631e-05, "epoch": 2.8656496612047873, "percentage": 95.52, "elapsed_time": "2 days, 18:12:20", "remaining_time": "3:06:14", "throughput": 27201.31, "total_tokens": 6483180992} +{"current_steps": 24090, "total_steps": 25209, "loss": 0.9379, "lr": 2.708088629088535e-05, "epoch": 2.8668397212284393, "percentage": 95.56, "elapsed_time": "2 days, 18:13:57", "remaining_time": "3:04:35", "throughput": 27201.54, "total_tokens": 6485861568} +{"current_steps": 24100, "total_steps": 25209, "loss": 0.9105, "lr": 2.7076915078820115e-05, "epoch": 2.868029781252092, "percentage": 95.6, "elapsed_time": "2 days, 18:15:36", "remaining_time": "3:02:56", "throughput": 27201.45, "total_tokens": 6488549888} +{"current_steps": 24110, "total_steps": 25209, "loss": 0.919, "lr": 2.707294561328945e-05, "epoch": 2.8692198412757444, "percentage": 95.64, "elapsed_time": "2 days, 18:17:17", "remaining_time": "3:01:17", "throughput": 27201.23, "total_tokens": 6491241344} +{"current_steps": 24120, "total_steps": 25209, "loss": 0.9239, "lr": 2.706897789301353e-05, "epoch": 2.870409901299397, "percentage": 95.68, "elapsed_time": "2 days, 18:18:56", "remaining_time": "2:59:38", "throughput": 27201.27, "total_tokens": 6493925376} +{"current_steps": 24130, "total_steps": 25209, "loss": 0.938, "lr": 2.706501191671384e-05, "epoch": 2.8715999613230494, "percentage": 95.72, "elapsed_time": "2 days, 18:20:30", "remaining_time": "2:57:59", "throughput": 27201.69, "total_tokens": 6496606656} +{"current_steps": 24140, "total_steps": 25209, "loss": 0.9219, "lr": 2.7061047683113165e-05, "epoch": 2.8727900213467015, "percentage": 95.76, "elapsed_time": "2 days, 18:22:12", "remaining_time": "2:56:20", "throughput": 27201.33, "total_tokens": 6499278272} +{"current_steps": 24150, "total_steps": 25209, "loss": 0.9369, "lr": 2.705708519093561e-05, "epoch": 2.873980081370354, "percentage": 95.8, "elapsed_time": "2 days, 18:23:50", "remaining_time": "2:54:41", "throughput": 27201.22, "total_tokens": 6501934656} +{"current_steps": 24160, "total_steps": 25209, "loss": 0.9225, "lr": 2.705312443890658e-05, "epoch": 2.8751701413940065, "percentage": 95.84, "elapsed_time": "2 days, 18:25:39", "remaining_time": "2:53:03", "throughput": 27200.55, "total_tokens": 6504733824} +{"current_steps": 24170, "total_steps": 25209, "loss": 0.9413, "lr": 2.70491654257528e-05, "epoch": 2.876360201417659, "percentage": 95.88, "elapsed_time": "2 days, 18:27:18", "remaining_time": "2:51:24", "throughput": 27200.59, "total_tokens": 6507423616} +{"current_steps": 24180, "total_steps": 25209, "loss": 0.924, "lr": 2.7045208150202274e-05, "epoch": 2.8775502614413115, "percentage": 95.92, "elapsed_time": "2 days, 18:28:55", "remaining_time": "2:49:45", "throughput": 27200.8, "total_tokens": 6510118144} +{"current_steps": 24190, "total_steps": 25209, "loss": 0.9186, "lr": 2.704125261098433e-05, "epoch": 2.8787403214649636, "percentage": 95.96, "elapsed_time": "2 days, 18:30:27", "remaining_time": "2:48:05", "throughput": 27201.2, "total_tokens": 6512708480} +{"current_steps": 24200, "total_steps": 25209, "loss": 0.9252, "lr": 2.7037298806829586e-05, "epoch": 2.8799303814886166, "percentage": 96.0, "elapsed_time": "2 days, 18:32:07", "remaining_time": "2:46:26", "throughput": 27201.14, "total_tokens": 6515413184} +{"current_steps": 24210, "total_steps": 25209, "loss": 0.9264, "lr": 2.7033346736469967e-05, "epoch": 2.8811204415122686, "percentage": 96.04, "elapsed_time": "2 days, 18:33:44", "remaining_time": "2:44:47", "throughput": 27201.34, "total_tokens": 6518113472} +{"current_steps": 24220, "total_steps": 25209, "loss": 0.9285, "lr": 2.702939639863869e-05, "epoch": 2.882310501535921, "percentage": 96.08, "elapsed_time": "2 days, 18:35:21", "remaining_time": "2:43:08", "throughput": 27201.46, "total_tokens": 6520767616} +{"current_steps": 24230, "total_steps": 25209, "loss": 0.9211, "lr": 2.7025447792070262e-05, "epoch": 2.8835005615595737, "percentage": 96.12, "elapsed_time": "2 days, 18:36:58", "remaining_time": "2:41:29", "throughput": 27201.57, "total_tokens": 6523442432} +{"current_steps": 24240, "total_steps": 25209, "loss": 0.9117, "lr": 2.7021500915500493e-05, "epoch": 2.884690621583226, "percentage": 96.16, "elapsed_time": "2 days, 18:38:35", "remaining_time": "2:39:50", "throughput": 27201.59, "total_tokens": 6526074560} +{"current_steps": 24250, "total_steps": 25209, "loss": 0.9303, "lr": 2.701755576766648e-05, "epoch": 2.8858806816068787, "percentage": 96.2, "elapsed_time": "2 days, 18:40:14", "remaining_time": "2:38:11", "throughput": 27201.42, "total_tokens": 6528739584} +{"current_steps": 24260, "total_steps": 25209, "loss": 0.9299, "lr": 2.701361234730661e-05, "epoch": 2.887070741630531, "percentage": 96.24, "elapsed_time": "2 days, 18:41:51", "remaining_time": "2:36:32", "throughput": 27201.52, "total_tokens": 6531393408} +{"current_steps": 24270, "total_steps": 25209, "loss": 0.9276, "lr": 2.700967065316056e-05, "epoch": 2.8882608016541833, "percentage": 96.28, "elapsed_time": "2 days, 18:43:30", "remaining_time": "2:34:53", "throughput": 27201.49, "total_tokens": 6534096576} +{"current_steps": 24280, "total_steps": 25209, "loss": 0.9117, "lr": 2.70057306839693e-05, "epoch": 2.889450861677836, "percentage": 96.31, "elapsed_time": "2 days, 18:45:08", "remaining_time": "2:33:14", "throughput": 27201.66, "total_tokens": 6536796352} +{"current_steps": 24290, "total_steps": 25209, "loss": 0.9064, "lr": 2.7001792438475076e-05, "epoch": 2.8906409217014883, "percentage": 96.35, "elapsed_time": "2 days, 18:46:45", "remaining_time": "2:31:35", "throughput": 27201.75, "total_tokens": 6539457344} +{"current_steps": 24300, "total_steps": 25209, "loss": 0.9346, "lr": 2.6997855915421416e-05, "epoch": 2.891830981725141, "percentage": 96.39, "elapsed_time": "2 days, 18:48:25", "remaining_time": "2:29:56", "throughput": 27201.75, "total_tokens": 6542156736} +{"current_steps": 24310, "total_steps": 25209, "loss": 0.9332, "lr": 2.6993921113553145e-05, "epoch": 2.893021041748793, "percentage": 96.43, "elapsed_time": "2 days, 18:50:04", "remaining_time": "2:28:17", "throughput": 27201.93, "total_tokens": 6544907392} +{"current_steps": 24320, "total_steps": 25209, "loss": 0.9154, "lr": 2.6989988031616343e-05, "epoch": 2.894211101772446, "percentage": 96.47, "elapsed_time": "2 days, 18:51:48", "remaining_time": "2:26:38", "throughput": 27201.55, "total_tokens": 6547657472} +{"current_steps": 24330, "total_steps": 25209, "loss": 0.9296, "lr": 2.6986056668358396e-05, "epoch": 2.895401161796098, "percentage": 96.51, "elapsed_time": "2 days, 18:53:26", "remaining_time": "2:24:59", "throughput": 27201.55, "total_tokens": 6550318912} +{"current_steps": 24340, "total_steps": 25209, "loss": 0.9139, "lr": 2.6982127022527947e-05, "epoch": 2.8965912218197505, "percentage": 96.55, "elapsed_time": "2 days, 18:55:06", "remaining_time": "2:23:20", "throughput": 27201.57, "total_tokens": 6553032960} +{"current_steps": 24350, "total_steps": 25209, "loss": 0.9137, "lr": 2.697819909287493e-05, "epoch": 2.897781281843403, "percentage": 96.59, "elapsed_time": "2 days, 18:56:49", "remaining_time": "2:21:42", "throughput": 27201.32, "total_tokens": 6555766976} +{"current_steps": 24360, "total_steps": 25209, "loss": 0.9365, "lr": 2.697427287815053e-05, "epoch": 2.8989713418670555, "percentage": 96.63, "elapsed_time": "2 days, 18:58:27", "remaining_time": "2:20:03", "throughput": 27201.43, "total_tokens": 6558472512} +{"current_steps": 24370, "total_steps": 25209, "loss": 0.921, "lr": 2.6970348377107236e-05, "epoch": 2.900161401890708, "percentage": 96.67, "elapsed_time": "2 days, 19:00:01", "remaining_time": "2:18:23", "throughput": 27201.71, "total_tokens": 6561100416} +{"current_steps": 24380, "total_steps": 25209, "loss": 0.9235, "lr": 2.696642558849877e-05, "epoch": 2.90135146191436, "percentage": 96.71, "elapsed_time": "2 days, 19:01:43", "remaining_time": "2:16:45", "throughput": 27201.48, "total_tokens": 6563808832} +{"current_steps": 24390, "total_steps": 25209, "loss": 0.9189, "lr": 2.696250451108016e-05, "epoch": 2.9025415219380126, "percentage": 96.75, "elapsed_time": "2 days, 19:03:17", "remaining_time": "2:15:05", "throughput": 27201.78, "total_tokens": 6566453824} +{"current_steps": 24400, "total_steps": 25209, "loss": 0.9148, "lr": 2.6958585143607662e-05, "epoch": 2.903731581961665, "percentage": 96.79, "elapsed_time": "2 days, 19:04:57", "remaining_time": "2:13:27", "throughput": 27201.93, "total_tokens": 6569192064} +{"current_steps": 24410, "total_steps": 25209, "loss": 0.913, "lr": 2.695466748483883e-05, "epoch": 2.9049216419853177, "percentage": 96.83, "elapsed_time": "2 days, 19:06:34", "remaining_time": "2:11:47", "throughput": 27201.96, "total_tokens": 6571852928} +{"current_steps": 24420, "total_steps": 25209, "loss": 0.9184, "lr": 2.695075153353247e-05, "epoch": 2.90611170200897, "percentage": 96.87, "elapsed_time": "2 days, 19:08:11", "remaining_time": "2:10:08", "throughput": 27202.3, "total_tokens": 6574566016} +{"current_steps": 24430, "total_steps": 25209, "loss": 0.9343, "lr": 2.6946837288448646e-05, "epoch": 2.9073017620326222, "percentage": 96.91, "elapsed_time": "2 days, 19:09:55", "remaining_time": "2:08:30", "throughput": 27201.87, "total_tokens": 6577297024} +{"current_steps": 24440, "total_steps": 25209, "loss": 0.9283, "lr": 2.6942924748348684e-05, "epoch": 2.908491822056275, "percentage": 96.95, "elapsed_time": "2 days, 19:11:29", "remaining_time": "2:06:51", "throughput": 27202.34, "total_tokens": 6579971392} +{"current_steps": 24450, "total_steps": 25209, "loss": 0.9182, "lr": 2.693901391199517e-05, "epoch": 2.9096818820799273, "percentage": 96.99, "elapsed_time": "2 days, 19:13:12", "remaining_time": "2:05:12", "throughput": 27202.08, "total_tokens": 6582699392} +{"current_steps": 24460, "total_steps": 25209, "loss": 0.9305, "lr": 2.6935104778151943e-05, "epoch": 2.91087194210358, "percentage": 97.03, "elapsed_time": "2 days, 19:14:55", "remaining_time": "2:03:33", "throughput": 27201.8, "total_tokens": 6585426752} +{"current_steps": 24470, "total_steps": 25209, "loss": 0.9076, "lr": 2.6931197345584102e-05, "epoch": 2.9120620021272323, "percentage": 97.07, "elapsed_time": "2 days, 19:16:34", "remaining_time": "2:01:54", "throughput": 27201.78, "total_tokens": 6588125184} +{"current_steps": 24480, "total_steps": 25209, "loss": 0.9228, "lr": 2.6927291613058003e-05, "epoch": 2.913252062150885, "percentage": 97.11, "elapsed_time": "2 days, 19:18:10", "remaining_time": "2:00:15", "throughput": 27202.01, "total_tokens": 6590791936} +{"current_steps": 24490, "total_steps": 25209, "loss": 0.922, "lr": 2.6923387579341254e-05, "epoch": 2.9144421221745374, "percentage": 97.15, "elapsed_time": "2 days, 19:19:51", "remaining_time": "1:58:36", "throughput": 27201.87, "total_tokens": 6593489536} +{"current_steps": 24500, "total_steps": 25209, "loss": 0.9271, "lr": 2.6919485243202693e-05, "epoch": 2.9156321821981894, "percentage": 97.19, "elapsed_time": "2 days, 19:21:30", "remaining_time": "1:56:57", "throughput": 27201.79, "total_tokens": 6596181632} +{"current_steps": 24510, "total_steps": 25209, "loss": 0.9164, "lr": 2.6915584603412434e-05, "epoch": 2.916822242221842, "percentage": 97.23, "elapsed_time": "2 days, 19:23:10", "remaining_time": "1:55:18", "throughput": 27201.85, "total_tokens": 6598903424} +{"current_steps": 24520, "total_steps": 25209, "loss": 0.9289, "lr": 2.6911685658741827e-05, "epoch": 2.9180123022454945, "percentage": 97.27, "elapsed_time": "2 days, 19:24:47", "remaining_time": "1:53:39", "throughput": 27202.12, "total_tokens": 6601613312} +{"current_steps": 24530, "total_steps": 25209, "loss": 0.917, "lr": 2.690778840796346e-05, "epoch": 2.919202362269147, "percentage": 97.31, "elapsed_time": "2 days, 19:26:29", "remaining_time": "1:52:00", "throughput": 27202.05, "total_tokens": 6604377600} +{"current_steps": 24540, "total_steps": 25209, "loss": 0.9136, "lr": 2.6903892849851175e-05, "epoch": 2.9203924222927995, "percentage": 97.35, "elapsed_time": "2 days, 19:28:07", "remaining_time": "1:50:21", "throughput": 27202.19, "total_tokens": 6607067840} +{"current_steps": 24550, "total_steps": 25209, "loss": 0.9332, "lr": 2.6899998983180057e-05, "epoch": 2.9215824823164516, "percentage": 97.39, "elapsed_time": "2 days, 19:29:50", "remaining_time": "1:48:42", "throughput": 27201.94, "total_tokens": 6609815488} +{"current_steps": 24560, "total_steps": 25209, "loss": 0.9207, "lr": 2.689610680672642e-05, "epoch": 2.9227725423401045, "percentage": 97.43, "elapsed_time": "2 days, 19:31:31", "remaining_time": "1:47:03", "throughput": 27201.86, "total_tokens": 6612533952} +{"current_steps": 24570, "total_steps": 25209, "loss": 0.9314, "lr": 2.6892216319267843e-05, "epoch": 2.9239626023637566, "percentage": 97.47, "elapsed_time": "2 days, 19:33:11", "remaining_time": "1:45:24", "throughput": 27201.72, "total_tokens": 6615213760} +{"current_steps": 24580, "total_steps": 25209, "loss": 0.9275, "lr": 2.6888327519583107e-05, "epoch": 2.925152662387409, "percentage": 97.5, "elapsed_time": "2 days, 19:34:46", "remaining_time": "1:43:45", "throughput": 27201.97, "total_tokens": 6617873920} +{"current_steps": 24590, "total_steps": 25209, "loss": 0.9345, "lr": 2.688444040645225e-05, "epoch": 2.9263427224110616, "percentage": 97.54, "elapsed_time": "2 days, 19:36:24", "remaining_time": "1:42:06", "throughput": 27201.89, "total_tokens": 6620528896} +{"current_steps": 24600, "total_steps": 25209, "loss": 0.9284, "lr": 2.688055497865654e-05, "epoch": 2.927532782434714, "percentage": 97.58, "elapsed_time": "2 days, 19:38:06", "remaining_time": "1:40:27", "throughput": 27201.99, "total_tokens": 6623304896} +{"current_steps": 24610, "total_steps": 25209, "loss": 0.9158, "lr": 2.6876671234978483e-05, "epoch": 2.9287228424583667, "percentage": 97.62, "elapsed_time": "2 days, 19:39:41", "remaining_time": "1:38:48", "throughput": 27202.41, "total_tokens": 6626009408} +{"current_steps": 24620, "total_steps": 25209, "loss": 0.9168, "lr": 2.6872789174201807e-05, "epoch": 2.9299129024820187, "percentage": 97.66, "elapsed_time": "2 days, 19:41:19", "remaining_time": "1:37:09", "throughput": 27202.56, "total_tokens": 6628704576} +{"current_steps": 24630, "total_steps": 25209, "loss": 0.931, "lr": 2.686890879511147e-05, "epoch": 2.9311029625056713, "percentage": 97.7, "elapsed_time": "2 days, 19:42:59", "remaining_time": "1:35:30", "throughput": 27202.69, "total_tokens": 6631463744} +{"current_steps": 24640, "total_steps": 25209, "loss": 0.9274, "lr": 2.6865030096493665e-05, "epoch": 2.932293022529324, "percentage": 97.74, "elapsed_time": "2 days, 19:44:41", "remaining_time": "1:33:51", "throughput": 27202.47, "total_tokens": 6634190784} +{"current_steps": 24650, "total_steps": 25209, "loss": 0.9166, "lr": 2.6861153077135815e-05, "epoch": 2.9334830825529763, "percentage": 97.78, "elapsed_time": "2 days, 19:46:22", "remaining_time": "1:32:12", "throughput": 27202.43, "total_tokens": 6636916672} +{"current_steps": 24660, "total_steps": 25209, "loss": 0.9061, "lr": 2.6857277735826545e-05, "epoch": 2.934673142576629, "percentage": 97.82, "elapsed_time": "2 days, 19:48:00", "remaining_time": "1:30:33", "throughput": 27202.73, "total_tokens": 6639656256} +{"current_steps": 24670, "total_steps": 25209, "loss": 0.9208, "lr": 2.685340407135573e-05, "epoch": 2.935863202600281, "percentage": 97.86, "elapsed_time": "2 days, 19:49:38", "remaining_time": "1:28:54", "throughput": 27202.84, "total_tokens": 6642354432} +{"current_steps": 24680, "total_steps": 25209, "loss": 0.9266, "lr": 2.6849532082514445e-05, "epoch": 2.937053262623934, "percentage": 97.9, "elapsed_time": "2 days, 19:51:17", "remaining_time": "1:27:15", "throughput": 27203.16, "total_tokens": 6645115840} +{"current_steps": 24690, "total_steps": 25209, "loss": 0.9124, "lr": 2.6845661768095005e-05, "epoch": 2.938243322647586, "percentage": 97.94, "elapsed_time": "2 days, 19:52:53", "remaining_time": "1:25:36", "throughput": 27203.41, "total_tokens": 6647795456} +{"current_steps": 24700, "total_steps": 25209, "loss": 0.9294, "lr": 2.6841793126890925e-05, "epoch": 2.9394333826712384, "percentage": 97.98, "elapsed_time": "2 days, 19:54:31", "remaining_time": "1:23:57", "throughput": 27203.49, "total_tokens": 6650489536} +{"current_steps": 24710, "total_steps": 25209, "loss": 0.9122, "lr": 2.6837926157696946e-05, "epoch": 2.940623442694891, "percentage": 98.02, "elapsed_time": "2 days, 19:56:11", "remaining_time": "1:22:18", "throughput": 27203.63, "total_tokens": 6653226944} +{"current_steps": 24720, "total_steps": 25209, "loss": 0.9154, "lr": 2.6834060859309018e-05, "epoch": 2.9418135027185435, "percentage": 98.06, "elapsed_time": "2 days, 19:57:49", "remaining_time": "1:20:39", "throughput": 27203.64, "total_tokens": 6655906944} +{"current_steps": 24730, "total_steps": 25209, "loss": 0.9244, "lr": 2.6830197230524317e-05, "epoch": 2.943003562742196, "percentage": 98.1, "elapsed_time": "2 days, 19:59:25", "remaining_time": "1:19:00", "throughput": 27204.01, "total_tokens": 6658609472} +{"current_steps": 24740, "total_steps": 25209, "loss": 0.9195, "lr": 2.6826335270141216e-05, "epoch": 2.944193622765848, "percentage": 98.14, "elapsed_time": "2 days, 20:01:03", "remaining_time": "1:17:21", "throughput": 27204.2, "total_tokens": 6661306176} +{"current_steps": 24750, "total_steps": 25209, "loss": 0.9063, "lr": 2.6822474976959312e-05, "epoch": 2.9453836827895006, "percentage": 98.18, "elapsed_time": "2 days, 20:02:40", "remaining_time": "1:15:42", "throughput": 27204.49, "total_tokens": 6664024384} +{"current_steps": 24760, "total_steps": 25209, "loss": 0.918, "lr": 2.6818616349779397e-05, "epoch": 2.946573742813153, "percentage": 98.22, "elapsed_time": "2 days, 20:04:19", "remaining_time": "1:14:03", "throughput": 27204.56, "total_tokens": 6666745472} +{"current_steps": 24770, "total_steps": 25209, "loss": 0.9213, "lr": 2.6814759387403482e-05, "epoch": 2.9477638028368056, "percentage": 98.26, "elapsed_time": "2 days, 20:05:57", "remaining_time": "1:12:24", "throughput": 27204.69, "total_tokens": 6669422208} +{"current_steps": 24780, "total_steps": 25209, "loss": 0.9261, "lr": 2.681090408863477e-05, "epoch": 2.948953862860458, "percentage": 98.3, "elapsed_time": "2 days, 20:07:31", "remaining_time": "1:10:45", "throughput": 27205.04, "total_tokens": 6672082880} +{"current_steps": 24790, "total_steps": 25209, "loss": 0.9249, "lr": 2.6807050452277694e-05, "epoch": 2.95014392288411, "percentage": 98.34, "elapsed_time": "2 days, 20:09:12", "remaining_time": "1:09:06", "throughput": 27204.89, "total_tokens": 6674791104} +{"current_steps": 24800, "total_steps": 25209, "loss": 0.9146, "lr": 2.6803198477137853e-05, "epoch": 2.951333982907763, "percentage": 98.38, "elapsed_time": "2 days, 20:10:53", "remaining_time": "1:07:28", "throughput": 27204.75, "total_tokens": 6677499264} +{"current_steps": 24810, "total_steps": 25209, "loss": 0.926, "lr": 2.6799348162022082e-05, "epoch": 2.9525240429314152, "percentage": 98.42, "elapsed_time": "2 days, 20:12:32", "remaining_time": "1:05:49", "throughput": 27204.8, "total_tokens": 6680199168} +{"current_steps": 24820, "total_steps": 25209, "loss": 0.9209, "lr": 2.6795499505738397e-05, "epoch": 2.9537141029550678, "percentage": 98.46, "elapsed_time": "2 days, 20:14:14", "remaining_time": "1:04:10", "throughput": 27204.8, "total_tokens": 6682982656} +{"current_steps": 24830, "total_steps": 25209, "loss": 0.9245, "lr": 2.679165250709601e-05, "epoch": 2.9549041629787203, "percentage": 98.5, "elapsed_time": "2 days, 20:15:52", "remaining_time": "1:02:31", "throughput": 27204.84, "total_tokens": 6685653568} +{"current_steps": 24840, "total_steps": 25209, "loss": 0.9048, "lr": 2.678780716490533e-05, "epoch": 2.956094223002373, "percentage": 98.54, "elapsed_time": "2 days, 20:17:34", "remaining_time": "1:00:52", "throughput": 27204.73, "total_tokens": 6688399680} +{"current_steps": 24850, "total_steps": 25209, "loss": 0.9164, "lr": 2.678396347797798e-05, "epoch": 2.9572842830260253, "percentage": 98.58, "elapsed_time": "2 days, 20:19:08", "remaining_time": "0:59:13", "throughput": 27205.06, "total_tokens": 6691041216} +{"current_steps": 24860, "total_steps": 25209, "loss": 0.9319, "lr": 2.6780121445126756e-05, "epoch": 2.9584743430496774, "percentage": 98.62, "elapsed_time": "2 days, 20:20:50", "remaining_time": "0:57:34", "throughput": 27204.94, "total_tokens": 6693779712} +{"current_steps": 24870, "total_steps": 25209, "loss": 0.9205, "lr": 2.6776281065165644e-05, "epoch": 2.95966440307333, "percentage": 98.66, "elapsed_time": "2 days, 20:22:20", "remaining_time": "0:55:55", "throughput": 27205.74, "total_tokens": 6696443840} +{"current_steps": 24880, "total_steps": 25209, "loss": 0.912, "lr": 2.677244233690983e-05, "epoch": 2.9608544630969824, "percentage": 98.69, "elapsed_time": "2 days, 20:24:00", "remaining_time": "0:54:16", "throughput": 27205.71, "total_tokens": 6699139648} +{"current_steps": 24890, "total_steps": 25209, "loss": 0.9243, "lr": 2.6768605259175694e-05, "epoch": 2.962044523120635, "percentage": 98.73, "elapsed_time": "2 days, 20:25:39", "remaining_time": "0:52:37", "throughput": 27205.66, "total_tokens": 6701825728} +{"current_steps": 24900, "total_steps": 25209, "loss": 0.9384, "lr": 2.6764769830780784e-05, "epoch": 2.9632345831442874, "percentage": 98.77, "elapsed_time": "2 days, 20:27:15", "remaining_time": "0:50:58", "throughput": 27205.78, "total_tokens": 6704479488} +{"current_steps": 24910, "total_steps": 25209, "loss": 0.9401, "lr": 2.6760936050543857e-05, "epoch": 2.9644246431679395, "percentage": 98.81, "elapsed_time": "2 days, 20:28:51", "remaining_time": "0:49:19", "throughput": 27205.85, "total_tokens": 6707110336} +{"current_steps": 24920, "total_steps": 25209, "loss": 0.9212, "lr": 2.675710391728483e-05, "epoch": 2.9656147031915925, "percentage": 98.85, "elapsed_time": "2 days, 20:30:31", "remaining_time": "0:47:40", "throughput": 27205.92, "total_tokens": 6709843776} +{"current_steps": 24930, "total_steps": 25209, "loss": 0.9231, "lr": 2.6753273429824822e-05, "epoch": 2.9668047632152446, "percentage": 98.89, "elapsed_time": "2 days, 20:32:09", "remaining_time": "0:46:01", "throughput": 27206.08, "total_tokens": 6712534656} +{"current_steps": 24940, "total_steps": 25209, "loss": 0.9132, "lr": 2.6749444586986127e-05, "epoch": 2.967994823238897, "percentage": 98.93, "elapsed_time": "2 days, 20:33:48", "remaining_time": "0:44:22", "throughput": 27205.99, "total_tokens": 6715216704} +{"current_steps": 24950, "total_steps": 25209, "loss": 0.9305, "lr": 2.6745617387592214e-05, "epoch": 2.9691848832625496, "percentage": 98.97, "elapsed_time": "2 days, 20:35:25", "remaining_time": "0:42:43", "throughput": 27206.17, "total_tokens": 6717904768} +{"current_steps": 24960, "total_steps": 25209, "loss": 0.9143, "lr": 2.6741791830467728e-05, "epoch": 2.970374943286202, "percentage": 99.01, "elapsed_time": "2 days, 20:37:02", "remaining_time": "0:41:04", "throughput": 27206.51, "total_tokens": 6720615168} +{"current_steps": 24970, "total_steps": 25209, "loss": 0.9142, "lr": 2.67379679144385e-05, "epoch": 2.9715650033098546, "percentage": 99.05, "elapsed_time": "2 days, 20:38:37", "remaining_time": "0:39:25", "throughput": 27206.7, "total_tokens": 6723248192} +{"current_steps": 24980, "total_steps": 25209, "loss": 0.9013, "lr": 2.6734145638331536e-05, "epoch": 2.9727550633335067, "percentage": 99.09, "elapsed_time": "2 days, 20:40:11", "remaining_time": "0:37:46", "throughput": 27207.13, "total_tokens": 6725907968} +{"current_steps": 24990, "total_steps": 25209, "loss": 0.9268, "lr": 2.673032500097501e-05, "epoch": 2.973945123357159, "percentage": 99.13, "elapsed_time": "2 days, 20:41:49", "remaining_time": "0:36:07", "throughput": 27207.34, "total_tokens": 6728626752} +{"current_steps": 25000, "total_steps": 25209, "loss": 0.9281, "lr": 2.672650600119826e-05, "epoch": 2.9751351833808117, "percentage": 99.17, "elapsed_time": "2 days, 20:43:27", "remaining_time": "0:34:28", "throughput": 27207.62, "total_tokens": 6731377216} +{"current_steps": 25000, "total_steps": 25209, "eval_loss": 1.0308592319488525, "epoch": 2.9751351833808117, "percentage": 99.17, "elapsed_time": "2 days, 20:43:29", "remaining_time": "0:34:28", "throughput": 27207.4, "total_tokens": 6731377216} +{"current_steps": 25010, "total_steps": 25209, "loss": 0.9066, "lr": 2.672268863783181e-05, "epoch": 2.9763252434044642, "percentage": 99.21, "elapsed_time": "2 days, 20:45:30", "remaining_time": "0:32:49", "throughput": 27204.87, "total_tokens": 6734047040} +{"current_steps": 25020, "total_steps": 25209, "loss": 0.9293, "lr": 2.6718872909707347e-05, "epoch": 2.9775153034281168, "percentage": 99.25, "elapsed_time": "2 days, 20:47:06", "remaining_time": "0:31:10", "throughput": 27205.09, "total_tokens": 6736705600} +{"current_steps": 25030, "total_steps": 25209, "loss": 0.9192, "lr": 2.671505881565772e-05, "epoch": 2.978705363451769, "percentage": 99.29, "elapsed_time": "2 days, 20:48:45", "remaining_time": "0:29:31", "throughput": 27205.22, "total_tokens": 6739434240} +{"current_steps": 25040, "total_steps": 25209, "loss": 0.9182, "lr": 2.671124635451696e-05, "epoch": 2.979895423475422, "percentage": 99.33, "elapsed_time": "2 days, 20:50:27", "remaining_time": "0:27:52", "throughput": 27204.97, "total_tokens": 6742135168} +{"current_steps": 25050, "total_steps": 25209, "loss": 0.9151, "lr": 2.6707435525120237e-05, "epoch": 2.981085483499074, "percentage": 99.37, "elapsed_time": "2 days, 20:52:01", "remaining_time": "0:26:13", "throughput": 27205.36, "total_tokens": 6744786112} +{"current_steps": 25060, "total_steps": 25209, "loss": 0.9134, "lr": 2.6703626326303906e-05, "epoch": 2.9822755435227264, "percentage": 99.41, "elapsed_time": "2 days, 20:53:38", "remaining_time": "0:24:34", "throughput": 27205.59, "total_tokens": 6747497280} +{"current_steps": 25070, "total_steps": 25209, "loss": 0.9283, "lr": 2.669981875690547e-05, "epoch": 2.983465603546379, "percentage": 99.45, "elapsed_time": "2 days, 20:55:15", "remaining_time": "0:22:55", "throughput": 27205.63, "total_tokens": 6750142272} +{"current_steps": 25080, "total_steps": 25209, "loss": 0.9209, "lr": 2.6696012815763604e-05, "epoch": 2.9846556635700314, "percentage": 99.49, "elapsed_time": "2 days, 20:56:53", "remaining_time": "0:21:16", "throughput": 27205.78, "total_tokens": 6752842752} +{"current_steps": 25090, "total_steps": 25209, "loss": 0.922, "lr": 2.669220850171813e-05, "epoch": 2.985845723593684, "percentage": 99.53, "elapsed_time": "2 days, 20:58:32", "remaining_time": "0:19:37", "throughput": 27205.69, "total_tokens": 6755516416} +{"current_steps": 25100, "total_steps": 25209, "loss": 0.9253, "lr": 2.668840581361003e-05, "epoch": 2.987035783617336, "percentage": 99.57, "elapsed_time": "2 days, 21:00:12", "remaining_time": "0:17:58", "throughput": 27205.8, "total_tokens": 6758271552} +{"current_steps": 25110, "total_steps": 25209, "loss": 0.9281, "lr": 2.668460475028145e-05, "epoch": 2.9882258436409885, "percentage": 99.61, "elapsed_time": "2 days, 21:01:49", "remaining_time": "0:16:19", "throughput": 27205.96, "total_tokens": 6760949632} +{"current_steps": 25120, "total_steps": 25209, "loss": 0.9167, "lr": 2.6680805310575686e-05, "epoch": 2.989415903664641, "percentage": 99.65, "elapsed_time": "2 days, 21:03:28", "remaining_time": "0:14:40", "throughput": 27206.15, "total_tokens": 6763667776} +{"current_steps": 25130, "total_steps": 25209, "loss": 0.9158, "lr": 2.6677007493337164e-05, "epoch": 2.9906059636882936, "percentage": 99.69, "elapsed_time": "2 days, 21:05:08", "remaining_time": "0:13:01", "throughput": 27206.28, "total_tokens": 6766445568} +{"current_steps": 25140, "total_steps": 25209, "loss": 0.9111, "lr": 2.6673211297411503e-05, "epoch": 2.991796023711946, "percentage": 99.73, "elapsed_time": "2 days, 21:06:44", "remaining_time": "0:11:22", "throughput": 27206.7, "total_tokens": 6769147584} +{"current_steps": 25150, "total_steps": 25209, "loss": 0.9267, "lr": 2.6669416721645447e-05, "epoch": 2.992986083735598, "percentage": 99.77, "elapsed_time": "2 days, 21:08:20", "remaining_time": "0:09:43", "throughput": 27206.93, "total_tokens": 6771825984} +{"current_steps": 25160, "total_steps": 25209, "loss": 0.9143, "lr": 2.6665623764886876e-05, "epoch": 2.994176143759251, "percentage": 99.81, "elapsed_time": "2 days, 21:09:59", "remaining_time": "0:08:04", "throughput": 27206.99, "total_tokens": 6774523968} +{"current_steps": 25170, "total_steps": 25209, "loss": 0.9377, "lr": 2.6661832425984847e-05, "epoch": 2.995366203782903, "percentage": 99.85, "elapsed_time": "2 days, 21:11:41", "remaining_time": "0:06:25", "throughput": 27206.86, "total_tokens": 6777281728} +{"current_steps": 25180, "total_steps": 25209, "loss": 0.9184, "lr": 2.665804270378953e-05, "epoch": 2.9965562638065557, "percentage": 99.88, "elapsed_time": "2 days, 21:13:15", "remaining_time": "0:04:47", "throughput": 27207.35, "total_tokens": 6779959744} +{"current_steps": 25190, "total_steps": 25209, "loss": 0.9102, "lr": 2.665425459715228e-05, "epoch": 2.9977463238302082, "percentage": 99.92, "elapsed_time": "2 days, 21:14:56", "remaining_time": "0:03:08", "throughput": 27207.21, "total_tokens": 6782662592} +{"current_steps": 25200, "total_steps": 25209, "loss": 0.9326, "lr": 2.6650468104925547e-05, "epoch": 2.9989363838538607, "percentage": 99.96, "elapsed_time": "2 days, 21:16:38", "remaining_time": "0:01:29", "throughput": 27206.97, "total_tokens": 6785388800} +{"current_steps": 25209, "total_steps": 25209, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2 days, 21:20:11", "remaining_time": "0:00:00", "throughput": 27193.46, "total_tokens": 6787789376}