commit 3ee7e919fed7c8b6c8dad4f6a38451b26ef87389 Author: ModelHub XC Date: Sat May 2 19:15:18 2026 +0800 初始化项目,由ModelHub XC社区提供模型 Model: baban/QwenTranslate_English_Hindi Source: Original Platform diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 
index 0000000..f499802 --- /dev/null +++ b/README.md @@ -0,0 +1,63 @@ +--- +library_name: transformers +license: other +base_model: Qwen/Qwen2.5-3B-Instruct +tags: +- llama-factory +- full +- generated_from_trainer +model-index: +- name: MT_En_Hindi + results: [] +--- + + + +# MT_En_Hindi + +This model is a fine-tuned version of [Qwen/Qwen2.5-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-3B-Instruct) on the MT_En_Hindi dataset. +It achieves the following results on the evaluation set: +- Loss: 0.3296 +- Num Input Tokens Seen: 8707477248 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 5e-05 +- train_batch_size: 8 +- eval_batch_size: 16 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 8 +- gradient_accumulation_steps: 16 +- total_train_batch_size: 1024 +- total_eval_batch_size: 128 +- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: inverse_sqrt +- num_epochs: 3.0 + +### Training results + + + +### Framework versions + +- Transformers 4.52.4 +- Pytorch 2.5.1+cu124 +- Datasets 3.6.0 +- Tokenizers 0.21.1 diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..bdf7919 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,54 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0]['role'] == 'system' %} + {{- messages[0]['content'] }} + {%- else %} + {{- 'You are Qwen, created by Alibaba Cloud. You are a helpful assistant.' 
}} + {%- endif %} + {{- "\n\n# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }} +{%- else %} + {%- if messages[0]['role'] == 'system' %} + {{- '<|im_start|>system\n' + messages[0]['content'] + '<|im_end|>\n' }} + {%- else %} + {{- '<|im_start|>system\nYou are Qwen, created by Alibaba Cloud. You are a helpful assistant.<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- for message in messages %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) or (message.role == "assistant" and not message.tool_calls) %} + {{- '<|im_start|>' + message.role + '\n' + message.content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {{- '<|im_start|>' + message.role }} + {%- if message.content %} + {{- '\n' + message.content }} + {%- endif %} + {%- for tool_call in message.tool_calls %} + {%- if tool_call.function is defined %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '\n<tool_call>\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {{- tool_call.arguments | tojson }} + {{- '}\n</tool_call>' }} + {%- endfor %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if (loop.index0 == 0) or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n<tool_response>\n' }} + {{- message.content }} + {{- '\n</tool_response>' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} +{%- endif %} diff --git a/config.json b/config.json new file mode 100644 index 0000000..fb880d9 --- /dev/null +++ b/config.json @@ -0,0 +1,28 @@ 
+{ + "architectures": [ + "Qwen2ForCausalLM" + ], + "attention_dropout": 0.0, + "bos_token_id": 151643, + "eos_token_id": 151645, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 11008, + "max_position_embeddings": 32768, + "max_window_layers": 70, + "model_type": "qwen2", + "num_attention_heads": 16, + "num_hidden_layers": 36, + "num_key_value_heads": 2, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000.0, + "sliding_window": 32768, + "tie_word_embeddings": true, + "torch_dtype": "bfloat16", + "transformers_version": "4.52.4", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..028ef0a --- /dev/null +++ b/generation_config.json @@ -0,0 +1,14 @@ +{ + "bos_token_id": 151643, + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "repetition_penalty": 1.05, + "temperature": 0.7, + "top_k": 20, + "top_p": 0.8, + "transformers_version": "4.52.4" +} diff --git a/model-00001-of-00002.safetensors b/model-00001-of-00002.safetensors new file mode 100644 index 0000000..97f4988 --- /dev/null +++ b/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860d9d3f5e7e9c1e09820c77cdb45ed41beb59aaac9477dd9b47d67ba7ccf9ad +size 4957560304 diff --git a/model-00002-of-00002.safetensors b/model-00002-of-00002.safetensors new file mode 100644 index 0000000..0c41c6c --- /dev/null +++ b/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2942ece722e6c339d9d18c70e6c3c36992ccdf8fe74e1c65fb3ab1c347b4a17d +size 1214366696 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..f19a648 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,441 @@ +{ + "metadata": { + "total_size": 6171877376 + }, + 
"weight_map": { + "model.embed_tokens.weight": "model-00001-of-00002.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + 
"model.layers.10.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.input_layernorm.weight": 
"model-00001-of-00002.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.input_layernorm.weight": "model-00001-of-00002.safetensors", + 
"model.layers.14.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00001-of-00002.safetensors", 
+ "model.layers.16.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.mlp.gate_proj.weight": 
"model-00001-of-00002.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.mlp.up_proj.weight": 
"model-00001-of-00002.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + 
"model.layers.21.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.post_attention_layernorm.weight": 
"model-00001-of-00002.safetensors", + "model.layers.23.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + 
"model.layers.25.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.bias": 
"model-00001-of-00002.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.28.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.29.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + 
"model.layers.29.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.30.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + 
"model.layers.30.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.o_proj.weight": 
"model-00002-of-00002.safetensors", + "model.layers.32.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + 
"model.layers.34.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.gate_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.mlp.up_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + 
"model.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + 
"model.layers.6.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.8.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + 
"model.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.norm.weight": "model-00002-of-00002.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..ac23c0a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..51ebb3b --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version 
https://git-lfs.github.com/spec/v1 +oid sha256:9c5ae00e602b8860cbd784ba82a8aa14e8feecec692e7076590d014d7b7fdafa +size 11421896 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..fb44f02 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,208 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + 
"rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + 
"<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 131072, + "pad_token": "<|endoftext|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..097d7f1 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,3106 @@ +{"current_steps": 10, "total_steps": 29667, "loss": 1.0561, "lr": 4.9977515176118345e-05, "epoch": 0.0010112757243262375, "percentage": 0.03, "elapsed_time": "0:04:19", "remaining_time": "8 days, 21:22:49", "throughput": 13164.79, "total_tokens": 3409920} +{"current_steps": 20, "total_steps": 29667, "loss": 0.8222, "lr": 4.9952567580506e-05, "epoch": 0.002022551448652475, "percentage": 0.07, "elapsed_time": "0:08:24", "remaining_time": "8 days, 15:38:27", "throughput": 13590.89, "total_tokens": 6853504} +{"current_steps": 30, "total_steps": 29667, "loss": 0.7587, "lr": 4.992765730738634e-05, "epoch": 0.0030338271729787127, "percentage": 0.1, "elapsed_time": "0:11:30", "remaining_time": "7 days, 21:31:58", "throughput": 14902.98, "total_tokens": 10293120} +{"current_steps": 40, "total_steps": 29667, "loss": 0.723, "lr": 4.9902784263792476e-05, "epoch": 0.00404510289730495, "percentage": 0.13, "elapsed_time": "0:14:43", "remaining_time": "7 days, 13:45:13", "throughput": 15624.11, "total_tokens": 13802368} +{"current_steps": 50, "total_steps": 29667, "loss": 0.6987, "lr": 4.987794835708133e-05, "epoch": 0.005056378621631188, "percentage": 0.17, "elapsed_time": "0:17:25", "remaining_time": "7 days, 3:59:32", "throughput": 16502.5, "total_tokens": 17250048} +{"current_steps": 60, "total_steps": 29667, "loss": 0.6807, "lr": 4.985314949493234e-05, "epoch": 0.0060676543459574255, "percentage": 0.2, "elapsed_time": "0:20:49", "remaining_time": "7 days, 3:14:27", "throughput": 
16577.6, "total_tokens": 20710400} +{"current_steps": 70, "total_steps": 29667, "loss": 0.6664, "lr": 4.982838758534584e-05, "epoch": 0.007078930070283663, "percentage": 0.24, "elapsed_time": "0:23:49", "remaining_time": "6 days, 23:53:50", "throughput": 16881.28, "total_tokens": 24132480} +{"current_steps": 80, "total_steps": 29667, "loss": 0.6547, "lr": 4.980366253664179e-05, "epoch": 0.0080902057946099, "percentage": 0.27, "elapsed_time": "0:27:09", "remaining_time": "6 days, 23:26:44", "throughput": 16925.59, "total_tokens": 27587328} +{"current_steps": 90, "total_steps": 29667, "loss": 0.6496, "lr": 4.977897425745825e-05, "epoch": 0.009101481518936139, "percentage": 0.3, "elapsed_time": "0:30:20", "remaining_time": "6 days, 22:09:07", "throughput": 17055.02, "total_tokens": 31041920} +{"current_steps": 100, "total_steps": 29667, "loss": 0.6275, "lr": 4.975432265674997e-05, "epoch": 0.010112757243262376, "percentage": 0.34, "elapsed_time": "0:34:12", "remaining_time": "7 days, 0:34:46", "throughput": 16833.29, "total_tokens": 34551680} +{"current_steps": 110, "total_steps": 29667, "loss": 0.6265, "lr": 4.972970764378705e-05, "epoch": 0.011124032967588612, "percentage": 0.37, "elapsed_time": "0:37:45", "remaining_time": "7 days, 1:06:05", "throughput": 16787.1, "total_tokens": 38032768} +{"current_steps": 120, "total_steps": 29667, "loss": 0.6233, "lr": 4.970512912815344e-05, "epoch": 0.012135308691914851, "percentage": 0.4, "elapsed_time": "0:41:03", "remaining_time": "7 days, 0:30:15", "throughput": 16868.96, "total_tokens": 41559424} +{"current_steps": 130, "total_steps": 29667, "loss": 0.6158, "lr": 4.968058701974564e-05, "epoch": 0.013146584416241088, "percentage": 0.44, "elapsed_time": "0:45:37", "remaining_time": "7 days, 4:46:02", "throughput": 16459.12, "total_tokens": 45055488} +{"current_steps": 140, "total_steps": 29667, "loss": 0.6036, "lr": 4.96560812287712e-05, "epoch": 0.014157860140567326, "percentage": 0.47, "elapsed_time": "0:49:49", 
"remaining_time": "7 days, 7:08:01", "throughput": 16242.71, "total_tokens": 48555648} +{"current_steps": 150, "total_steps": 29667, "loss": 0.5977, "lr": 4.963161166574748e-05, "epoch": 0.015169135864893563, "percentage": 0.51, "elapsed_time": "0:53:49", "remaining_time": "7 days, 8:31:42", "throughput": 16109.93, "total_tokens": 52027136} +{"current_steps": 160, "total_steps": 29667, "loss": 0.5948, "lr": 4.960717824150013e-05, "epoch": 0.0161804115892198, "percentage": 0.54, "elapsed_time": "0:57:57", "remaining_time": "7 days, 10:09:40", "throughput": 15982.15, "total_tokens": 55583488} +{"current_steps": 170, "total_steps": 29667, "loss": 0.5909, "lr": 4.9582780867161893e-05, "epoch": 0.017191687313546037, "percentage": 0.57, "elapsed_time": "1:02:33", "remaining_time": "7 days, 12:53:47", "throughput": 15758.71, "total_tokens": 59145856} +{"current_steps": 180, "total_steps": 29667, "loss": 0.5873, "lr": 4.955841945417105e-05, "epoch": 0.018202963037872277, "percentage": 0.61, "elapsed_time": "1:06:19", "remaining_time": "7 days, 13:05:43", "throughput": 15743.81, "total_tokens": 62655872} +{"current_steps": 190, "total_steps": 29667, "loss": 0.5803, "lr": 4.953409391427024e-05, "epoch": 0.019214238762198514, "percentage": 0.64, "elapsed_time": "1:09:55", "remaining_time": "7 days, 12:48:17", "throughput": 15760.35, "total_tokens": 66122368} +{"current_steps": 200, "total_steps": 29667, "loss": 0.5805, "lr": 4.950980415950502e-05, "epoch": 0.02022551448652475, "percentage": 0.67, "elapsed_time": "1:13:29", "remaining_time": "7 days, 12:27:38", "throughput": 15789.85, "total_tokens": 69623680} +{"current_steps": 210, "total_steps": 29667, "loss": 0.5674, "lr": 4.9485550102222575e-05, "epoch": 0.021236790210850988, "percentage": 0.71, "elapsed_time": "1:16:34", "remaining_time": "7 days, 11:00:07", "throughput": 15910.24, "total_tokens": 73091712} +{"current_steps": 220, "total_steps": 29667, "loss": 0.57, "lr": 4.946133165507037e-05, "epoch": 
0.022248065935177225, "percentage": 0.74, "elapsed_time": "1:20:17", "remaining_time": "7 days, 11:06:54", "throughput": 15900.3, "total_tokens": 76598784} +{"current_steps": 230, "total_steps": 29667, "loss": 0.5627, "lr": 4.943714873099483e-05, "epoch": 0.023259341659503465, "percentage": 0.78, "elapsed_time": "1:23:48", "remaining_time": "7 days, 10:45:26", "throughput": 15935.54, "total_tokens": 80124928} +{"current_steps": 240, "total_steps": 29667, "loss": 0.5612, "lr": 4.9413001243240024e-05, "epoch": 0.024270617383829702, "percentage": 0.81, "elapsed_time": "1:27:26", "remaining_time": "7 days, 10:41:11", "throughput": 15933.69, "total_tokens": 83594112} +{"current_steps": 250, "total_steps": 29667, "loss": 0.5601, "lr": 4.938888910534637e-05, "epoch": 0.02528189310815594, "percentage": 0.84, "elapsed_time": "1:31:16", "remaining_time": "7 days, 11:00:34", "throughput": 15881.91, "total_tokens": 86980736} +{"current_steps": 260, "total_steps": 29667, "loss": 0.5573, "lr": 4.936481223114932e-05, "epoch": 0.026293168832482176, "percentage": 0.88, "elapsed_time": "1:34:48", "remaining_time": "7 days, 10:42:26", "throughput": 15897.98, "total_tokens": 90429440} +{"current_steps": 270, "total_steps": 29667, "loss": 0.5569, "lr": 4.934077053477808e-05, "epoch": 0.027304444556808413, "percentage": 0.91, "elapsed_time": "1:38:04", "remaining_time": "7 days, 9:58:46", "throughput": 15977.33, "total_tokens": 94023808} +{"current_steps": 280, "total_steps": 29667, "loss": 0.5574, "lr": 4.931676393065431e-05, "epoch": 0.028315720281134653, "percentage": 0.94, "elapsed_time": "1:41:08", "remaining_time": "7 days, 8:54:23", "throughput": 16079.19, "total_tokens": 97569280} +{"current_steps": 290, "total_steps": 29667, "loss": 0.5529, "lr": 4.929279233349088e-05, "epoch": 0.02932699600546089, "percentage": 0.98, "elapsed_time": "1:44:36", "remaining_time": "7 days, 8:37:25", "throughput": 16090.85, "total_tokens": 100999936} +{"current_steps": 300, "total_steps": 29667, 
"loss": 0.5504, "lr": 4.926885565829051e-05, "epoch": 0.030338271729787127, "percentage": 1.01, "elapsed_time": "1:48:47", "remaining_time": "7 days, 9:29:30", "throughput": 16005.99, "total_tokens": 104478080} +{"current_steps": 310, "total_steps": 29667, "loss": 0.5434, "lr": 4.924495382034461e-05, "epoch": 0.03134954745411336, "percentage": 1.04, "elapsed_time": "1:53:01", "remaining_time": "7 days, 10:23:01", "throughput": 15904.42, "total_tokens": 107851392} +{"current_steps": 320, "total_steps": 29667, "loss": 0.5421, "lr": 4.9221086735231975e-05, "epoch": 0.0323608231784396, "percentage": 1.08, "elapsed_time": "1:58:04", "remaining_time": "7 days, 12:28:16", "throughput": 15722.73, "total_tokens": 111384576} +{"current_steps": 330, "total_steps": 29667, "loss": 0.5428, "lr": 4.919725431881751e-05, "epoch": 0.03337209890276584, "percentage": 1.11, "elapsed_time": "2:00:48", "remaining_time": "7 days, 10:59:34", "throughput": 15846.45, "total_tokens": 114859904} +{"current_steps": 340, "total_steps": 29667, "loss": 0.5368, "lr": 4.917345648725101e-05, "epoch": 0.034383374627092074, "percentage": 1.15, "elapsed_time": "2:03:19", "remaining_time": "7 days, 9:17:15", "throughput": 15989.75, "total_tokens": 118313472} +{"current_steps": 350, "total_steps": 29667, "loss": 0.5362, "lr": 4.914969315696596e-05, "epoch": 0.03539465035141831, "percentage": 1.18, "elapsed_time": "2:06:15", "remaining_time": "7 days, 8:15:26", "throughput": 16091.14, "total_tokens": 121894784} +{"current_steps": 360, "total_steps": 29667, "loss": 0.5354, "lr": 4.912596424467818e-05, "epoch": 0.036405926075744555, "percentage": 1.21, "elapsed_time": "2:09:36", "remaining_time": "7 days, 7:50:34", "throughput": 16115.25, "total_tokens": 125312768} +{"current_steps": 370, "total_steps": 29667, "loss": 0.5389, "lr": 4.910226966738475e-05, "epoch": 0.03741720180007079, "percentage": 1.25, "elapsed_time": "2:13:15", "remaining_time": "7 days, 7:51:54", "throughput": 16109.51, "total_tokens": 
128808064} +{"current_steps": 380, "total_steps": 29667, "loss": 0.5366, "lr": 4.9078609342362666e-05, "epoch": 0.03842847752439703, "percentage": 1.28, "elapsed_time": "2:16:44", "remaining_time": "7 days, 7:38:33", "throughput": 16126.17, "total_tokens": 132303872} +{"current_steps": 390, "total_steps": 29667, "loss": 0.532, "lr": 4.905498318716775e-05, "epoch": 0.039439753248723265, "percentage": 1.31, "elapsed_time": "2:20:10", "remaining_time": "7 days, 7:23:07", "throughput": 16149.71, "total_tokens": 135831040} +{"current_steps": 400, "total_steps": 29667, "loss": 0.5272, "lr": 4.9031391119633295e-05, "epoch": 0.0404510289730495, "percentage": 1.35, "elapsed_time": "2:23:34", "remaining_time": "7 days, 7:05:10", "throughput": 16171.29, "total_tokens": 139309568} +{"current_steps": 410, "total_steps": 29667, "loss": 0.5241, "lr": 4.9007833057869e-05, "epoch": 0.04146230469737574, "percentage": 1.38, "elapsed_time": "2:27:36", "remaining_time": "7 days, 7:32:31", "throughput": 16131.53, "total_tokens": 142860928} +{"current_steps": 420, "total_steps": 29667, "loss": 0.5205, "lr": 4.898430892025967e-05, "epoch": 0.042473580421701976, "percentage": 1.42, "elapsed_time": "2:31:57", "remaining_time": "7 days, 8:22:02", "throughput": 16049.59, "total_tokens": 146336512} +{"current_steps": 430, "total_steps": 29667, "loss": 0.5253, "lr": 4.896081862546415e-05, "epoch": 0.04348485614602821, "percentage": 1.45, "elapsed_time": "2:36:31", "remaining_time": "7 days, 9:22:32", "throughput": 15945.49, "total_tokens": 149751040} +{"current_steps": 440, "total_steps": 29667, "loss": 0.5144, "lr": 4.8937362092414e-05, "epoch": 0.04449613187035445, "percentage": 1.48, "elapsed_time": "2:40:04", "remaining_time": "7 days, 9:12:32", "throughput": 15948.67, "total_tokens": 153172608} +{"current_steps": 450, "total_steps": 29667, "loss": 0.519, "lr": 4.891393924031244e-05, "epoch": 0.045507407594680686, "percentage": 1.52, "elapsed_time": "2:43:35", "remaining_time": "7 days, 
9:01:20", "throughput": 15970.6, "total_tokens": 156757632} +{"current_steps": 460, "total_steps": 29667, "loss": 0.5193, "lr": 4.8890549988633095e-05, "epoch": 0.04651868331900693, "percentage": 1.55, "elapsed_time": "2:47:07", "remaining_time": "7 days, 8:51:40", "throughput": 15984.68, "total_tokens": 160291200} +{"current_steps": 470, "total_steps": 29667, "loss": 0.5189, "lr": 4.8867194257118907e-05, "epoch": 0.04752995904333317, "percentage": 1.58, "elapsed_time": "2:50:27", "remaining_time": "7 days, 8:29:05", "throughput": 16006.9, "total_tokens": 163710464} +{"current_steps": 480, "total_steps": 29667, "loss": 0.5137, "lr": 4.884387196578093e-05, "epoch": 0.048541234767659404, "percentage": 1.62, "elapsed_time": "2:53:40", "remaining_time": "7 days, 8:00:56", "throughput": 16045.21, "total_tokens": 167205632} +{"current_steps": 490, "total_steps": 29667, "loss": 0.516, "lr": 4.882058303489718e-05, "epoch": 0.04955251049198564, "percentage": 1.65, "elapsed_time": "2:56:44", "remaining_time": "7 days, 7:24:25", "throughput": 16091.32, "total_tokens": 170646272} +{"current_steps": 500, "total_steps": 29667, "loss": 0.5144, "lr": 4.8797327385011496e-05, "epoch": 0.05056378621631188, "percentage": 1.69, "elapsed_time": "2:59:34", "remaining_time": "7 days, 6:35:01", "throughput": 16167.28, "total_tokens": 174189312} +{"current_steps": 510, "total_steps": 29667, "loss": 0.5061, "lr": 4.8774104936932425e-05, "epoch": 0.051575061940638114, "percentage": 1.72, "elapsed_time": "3:02:25", "remaining_time": "7 days, 5:49:24", "throughput": 16234.17, "total_tokens": 177692160} +{"current_steps": 520, "total_steps": 29667, "loss": 0.5115, "lr": 4.8750915611732076e-05, "epoch": 0.05258633766496435, "percentage": 1.75, "elapsed_time": "3:05:10", "remaining_time": "7 days, 4:59:28", "throughput": 16308.61, "total_tokens": 181197952} +{"current_steps": 530, "total_steps": 29667, "loss": 0.5082, "lr": 4.8727759330744986e-05, "epoch": 0.05359761338929059, "percentage": 1.79, 
"elapsed_time": "3:07:45", "remaining_time": "7 days, 4:01:48", "throughput": 16393.39, "total_tokens": 184674560} +{"current_steps": 540, "total_steps": 29667, "loss": 0.5097, "lr": 4.870463601556696e-05, "epoch": 0.054608889113616825, "percentage": 1.82, "elapsed_time": "3:10:32", "remaining_time": "7 days, 3:17:38", "throughput": 16466.95, "total_tokens": 188259200} +{"current_steps": 550, "total_steps": 29667, "loss": 0.505, "lr": 4.8681545588054075e-05, "epoch": 0.05562016483794306, "percentage": 1.85, "elapsed_time": "3:13:52", "remaining_time": "7 days, 3:04:04", "throughput": 16479.66, "total_tokens": 191705856} +{"current_steps": 560, "total_steps": 29667, "loss": 0.5094, "lr": 4.8658487970321404e-05, "epoch": 0.056631440562269306, "percentage": 1.89, "elapsed_time": "3:17:12", "remaining_time": "7 days, 2:50:27", "throughput": 16500.94, "total_tokens": 195251200} +{"current_steps": 570, "total_steps": 29667, "loss": 0.4982, "lr": 4.863546308474209e-05, "epoch": 0.05764271628659554, "percentage": 1.92, "elapsed_time": "3:20:26", "remaining_time": "7 days, 2:32:17", "throughput": 16532.39, "total_tokens": 198832000} +{"current_steps": 580, "total_steps": 29667, "loss": 0.508, "lr": 4.86124708539461e-05, "epoch": 0.05865399201092178, "percentage": 1.96, "elapsed_time": "3:23:55", "remaining_time": "7 days, 2:26:55", "throughput": 16535.96, "total_tokens": 202327424} +{"current_steps": 590, "total_steps": 29667, "loss": 0.5014, "lr": 4.8589511200819216e-05, "epoch": 0.059665267735248016, "percentage": 1.99, "elapsed_time": "3:27:27", "remaining_time": "7 days, 2:24:21", "throughput": 16538.79, "total_tokens": 205870208} +{"current_steps": 600, "total_steps": 29667, "loss": 0.5016, "lr": 4.8566584048501926e-05, "epoch": 0.06067654345957425, "percentage": 2.02, "elapsed_time": "3:30:37", "remaining_time": "7 days, 2:03:56", "throughput": 16565.57, "total_tokens": 209351680} +{"current_steps": 610, "total_steps": 29667, "loss": 0.5022, "lr": 
4.854368932038835e-05, "epoch": 0.06168781918390049, "percentage": 2.06, "elapsed_time": "3:33:38", "remaining_time": "7 days, 1:37:03", "throughput": 16598.37, "total_tokens": 212773888} +{"current_steps": 620, "total_steps": 29667, "loss": 0.4979, "lr": 4.8520826940125144e-05, "epoch": 0.06269909490822673, "percentage": 2.09, "elapsed_time": "3:37:03", "remaining_time": "7 days, 1:28:55", "throughput": 16611.27, "total_tokens": 216331264} +{"current_steps": 630, "total_steps": 29667, "loss": 0.4986, "lr": 4.849799683161046e-05, "epoch": 0.06371037063255297, "percentage": 2.12, "elapsed_time": "3:40:16", "remaining_time": "7 days, 1:12:44", "throughput": 16632.64, "total_tokens": 219828864} +{"current_steps": 640, "total_steps": 29667, "loss": 0.4991, "lr": 4.8475198918992835e-05, "epoch": 0.0647216463568792, "percentage": 2.16, "elapsed_time": "3:43:32", "remaining_time": "7 days, 0:58:54", "throughput": 16639.25, "total_tokens": 223179520} +{"current_steps": 650, "total_steps": 29667, "loss": 0.4996, "lr": 4.845243312667023e-05, "epoch": 0.06573292208120544, "percentage": 2.19, "elapsed_time": "3:46:49", "remaining_time": "7 days, 0:45:43", "throughput": 16661.38, "total_tokens": 226750976} +{"current_steps": 660, "total_steps": 29667, "loss": 0.4993, "lr": 4.842969937928884e-05, "epoch": 0.06674419780553167, "percentage": 2.22, "elapsed_time": "3:49:52", "remaining_time": "7 days, 0:22:56", "throughput": 16692.84, "total_tokens": 230234624} +{"current_steps": 670, "total_steps": 29667, "loss": 0.4898, "lr": 4.840699760174217e-05, "epoch": 0.06775547352985792, "percentage": 2.26, "elapsed_time": "3:52:29", "remaining_time": "6 days, 23:41:54", "throughput": 16750.46, "total_tokens": 233657600} +{"current_steps": 680, "total_steps": 29667, "loss": 0.4962, "lr": 4.8384327719169906e-05, "epoch": 0.06876674925418415, "percentage": 2.29, "elapsed_time": "3:55:12", "remaining_time": "6 days, 23:06:40", "throughput": 16806.33, "total_tokens": 237184512} 
+{"current_steps": 690, "total_steps": 29667, "loss": 0.4919, "lr": 4.836168965695694e-05, "epoch": 0.06977802497851039, "percentage": 2.33, "elapsed_time": "3:57:57", "remaining_time": "6 days, 22:33:19", "throughput": 16853.42, "total_tokens": 240627584} +{"current_steps": 700, "total_steps": 29667, "loss": 0.4906, "lr": 4.8339083340732304e-05, "epoch": 0.07078930070283662, "percentage": 2.36, "elapsed_time": "4:00:33", "remaining_time": "6 days, 21:54:34", "throughput": 16911.0, "total_tokens": 244083328} +{"current_steps": 710, "total_steps": 29667, "loss": 0.4887, "lr": 4.8316508696368154e-05, "epoch": 0.07180057642716287, "percentage": 2.39, "elapsed_time": "4:03:13", "remaining_time": "6 days, 21:19:51", "throughput": 16961.26, "total_tokens": 247525376} +{"current_steps": 720, "total_steps": 29667, "loss": 0.4904, "lr": 4.8293965649978714e-05, "epoch": 0.07281185215148911, "percentage": 2.43, "elapsed_time": "4:05:38", "remaining_time": "6 days, 20:36:02", "throughput": 17029.16, "total_tokens": 250989824} +{"current_steps": 730, "total_steps": 29667, "loss": 0.4878, "lr": 4.8271454127919364e-05, "epoch": 0.07382312787581534, "percentage": 2.46, "elapsed_time": "4:08:09", "remaining_time": "6 days, 19:56:36", "throughput": 17085.25, "total_tokens": 254382336} +{"current_steps": 740, "total_steps": 29667, "loss": 0.4916, "lr": 4.824897405678549e-05, "epoch": 0.07483440360014158, "percentage": 2.49, "elapsed_time": "4:10:33", "remaining_time": "6 days, 19:14:28", "throughput": 17150.85, "total_tokens": 257837824} +{"current_steps": 750, "total_steps": 29667, "loss": 0.4867, "lr": 4.8226525363411576e-05, "epoch": 0.07584567932446781, "percentage": 2.53, "elapsed_time": "4:13:01", "remaining_time": "6 days, 18:35:31", "throughput": 17213.24, "total_tokens": 261319808} +{"current_steps": 760, "total_steps": 29667, "loss": 0.4852, "lr": 4.820410797487017e-05, "epoch": 0.07685695504879406, "percentage": 2.56, "elapsed_time": "4:15:39", "remaining_time": "6 days, 
18:03:50", "throughput": 17265.76, "total_tokens": 264840960} +{"current_steps": 770, "total_steps": 29667, "loss": 0.4875, "lr": 4.818172181847091e-05, "epoch": 0.07786823077312029, "percentage": 2.6, "elapsed_time": "4:18:29", "remaining_time": "6 days, 17:40:34", "throughput": 17301.64, "total_tokens": 268332800} +{"current_steps": 780, "total_steps": 29667, "loss": 0.4854, "lr": 4.81593668217595e-05, "epoch": 0.07887950649744653, "percentage": 2.63, "elapsed_time": "4:21:11", "remaining_time": "6 days, 17:13:09", "throughput": 17344.76, "total_tokens": 271819136} +{"current_steps": 790, "total_steps": 29667, "loss": 0.484, "lr": 4.813704291251675e-05, "epoch": 0.07989078222177276, "percentage": 2.66, "elapsed_time": "4:23:39", "remaining_time": "6 days, 16:37:38", "throughput": 17403.2, "total_tokens": 275312768} +{"current_steps": 800, "total_steps": 29667, "loss": 0.488, "lr": 4.811475001875759e-05, "epoch": 0.080902057946099, "percentage": 2.7, "elapsed_time": "4:26:13", "remaining_time": "6 days, 16:06:21", "throughput": 17451.88, "total_tokens": 278766464} +{"current_steps": 810, "total_steps": 29667, "loss": 0.4863, "lr": 4.8092488068730105e-05, "epoch": 0.08191333367042525, "percentage": 2.73, "elapsed_time": "4:28:57", "remaining_time": "6 days, 15:42:04", "throughput": 17491.62, "total_tokens": 282276480} +{"current_steps": 820, "total_steps": 29667, "loss": 0.482, "lr": 4.807025699091452e-05, "epoch": 0.08292460939475148, "percentage": 2.76, "elapsed_time": "4:31:23", "remaining_time": "6 days, 15:07:06", "throughput": 17552.33, "total_tokens": 285805696} +{"current_steps": 830, "total_steps": 29667, "loss": 0.4885, "lr": 4.8048056714022325e-05, "epoch": 0.08393588511907772, "percentage": 2.8, "elapsed_time": "4:33:51", "remaining_time": "6 days, 14:34:33", "throughput": 17607.48, "total_tokens": 289311232} +{"current_steps": 840, "total_steps": 29667, "loss": 0.4837, "lr": 4.802588716699519e-05, "epoch": 0.08494716084340395, "percentage": 2.83, 
"elapsed_time": "4:36:24", "remaining_time": "6 days, 14:05:54", "throughput": 17655.92, "total_tokens": 292819968} +{"current_steps": 850, "total_steps": 29667, "loss": 0.4758, "lr": 4.8003748279004156e-05, "epoch": 0.0859584365677302, "percentage": 2.87, "elapsed_time": "4:39:12", "remaining_time": "6 days, 13:45:35", "throughput": 17684.07, "total_tokens": 296245376} +{"current_steps": 860, "total_steps": 29667, "loss": 0.4844, "lr": 4.798163997944854e-05, "epoch": 0.08696971229205643, "percentage": 2.9, "elapsed_time": "4:41:52", "remaining_time": "6 days, 13:21:37", "throughput": 17725.17, "total_tokens": 299770240} +{"current_steps": 870, "total_steps": 29667, "loss": 0.4809, "lr": 4.79595621979551e-05, "epoch": 0.08798098801638267, "percentage": 2.93, "elapsed_time": "4:44:08", "remaining_time": "6 days, 12:44:58", "throughput": 17789.72, "total_tokens": 303284096} +{"current_steps": 880, "total_steps": 29667, "loss": 0.4786, "lr": 4.793751486437702e-05, "epoch": 0.0889922637407089, "percentage": 2.97, "elapsed_time": "4:46:22", "remaining_time": "6 days, 12:08:06", "throughput": 17850.78, "total_tokens": 306723456} +{"current_steps": 890, "total_steps": 29667, "loss": 0.4794, "lr": 4.7915497908793064e-05, "epoch": 0.09000353946503514, "percentage": 3.0, "elapsed_time": "4:48:48", "remaining_time": "6 days, 11:38:24", "throughput": 17900.47, "total_tokens": 310193664} +{"current_steps": 900, "total_steps": 29667, "loss": 0.48, "lr": 4.7893511261506516e-05, "epoch": 0.09101481518936137, "percentage": 3.03, "elapsed_time": "4:51:35", "remaining_time": "6 days, 11:20:19", "throughput": 17931.38, "total_tokens": 313721088} +{"current_steps": 910, "total_steps": 29667, "loss": 0.474, "lr": 4.787155485304435e-05, "epoch": 0.09202609091368762, "percentage": 3.07, "elapsed_time": "4:54:26", "remaining_time": "6 days, 11:04:50", "throughput": 17953.08, "total_tokens": 317173760} +{"current_steps": 920, "total_steps": 29667, "loss": 0.4749, "lr": 
4.784962861415629e-05, "epoch": 0.09303736663801386, "percentage": 3.1, "elapsed_time": "4:56:56", "remaining_time": "6 days, 10:38:24", "throughput": 17995.82, "total_tokens": 320620800} +{"current_steps": 930, "total_steps": 29667, "loss": 0.4738, "lr": 4.7827732475813884e-05, "epoch": 0.09404864236234009, "percentage": 3.13, "elapsed_time": "5:00:11", "remaining_time": "6 days, 10:35:57", "throughput": 17995.61, "total_tokens": 324129152} +{"current_steps": 940, "total_steps": 29667, "loss": 0.4761, "lr": 4.7805866369209576e-05, "epoch": 0.09505991808666633, "percentage": 3.17, "elapsed_time": "5:03:30", "remaining_time": "6 days, 10:35:16", "throughput": 17993.48, "total_tokens": 327665408} +{"current_steps": 950, "total_steps": 29667, "loss": 0.4707, "lr": 4.778403022575583e-05, "epoch": 0.09607119381099256, "percentage": 3.2, "elapsed_time": "5:07:19", "remaining_time": "6 days, 10:50:05", "throughput": 17957.84, "total_tokens": 331138688} +{"current_steps": 960, "total_steps": 29667, "loss": 0.4754, "lr": 4.7762223977084195e-05, "epoch": 0.09708246953531881, "percentage": 3.24, "elapsed_time": "5:11:25", "remaining_time": "6 days, 11:12:40", "throughput": 17904.64, "total_tokens": 334560256} +{"current_steps": 970, "total_steps": 29667, "loss": 0.4705, "lr": 4.774044755504444e-05, "epoch": 0.09809374525964504, "percentage": 3.27, "elapsed_time": "5:14:33", "remaining_time": "6 days, 11:06:09", "throughput": 17912.44, "total_tokens": 338073856} +{"current_steps": 980, "total_steps": 29667, "loss": 0.4723, "lr": 4.7718700891703616e-05, "epoch": 0.09910502098397128, "percentage": 3.3, "elapsed_time": "5:17:54", "remaining_time": "6 days, 11:05:43", "throughput": 17905.41, "total_tokens": 341528576} +{"current_steps": 990, "total_steps": 29667, "loss": 0.4756, "lr": 4.7696983919345215e-05, "epoch": 0.10011629670829751, "percentage": 3.34, "elapsed_time": "5:20:57", "remaining_time": "6 days, 10:56:59", "throughput": 17919.94, "total_tokens": 345089536} 
+{"current_steps": 1000, "total_steps": 29667, "loss": 0.4747, "lr": 4.7675296570468216e-05, "epoch": 0.10112757243262376, "percentage": 3.37, "elapsed_time": "5:23:51", "remaining_time": "6 days, 10:43:59", "throughput": 17941.64, "total_tokens": 348630784} +{"current_steps": 1010, "total_steps": 29667, "loss": 0.4717, "lr": 4.76536387777863e-05, "epoch": 0.10213884815695, "percentage": 3.4, "elapsed_time": "5:27:15", "remaining_time": "6 days, 10:45:12", "throughput": 17934.81, "total_tokens": 352152320} +{"current_steps": 1020, "total_steps": 29667, "loss": 0.4728, "lr": 4.7632010474226915e-05, "epoch": 0.10315012388127623, "percentage": 3.44, "elapsed_time": "5:30:37", "remaining_time": "6 days, 10:45:38", "throughput": 17930.02, "total_tokens": 355684608} +{"current_steps": 1030, "total_steps": 29667, "loss": 0.4669, "lr": 4.761041159293035e-05, "epoch": 0.10416139960560247, "percentage": 3.47, "elapsed_time": "5:34:13", "remaining_time": "6 days, 10:52:19", "throughput": 17910.12, "total_tokens": 359156864} +{"current_steps": 1040, "total_steps": 29667, "loss": 0.4666, "lr": 4.7588842067249e-05, "epoch": 0.1051726753299287, "percentage": 3.51, "elapsed_time": "5:37:55", "remaining_time": "6 days, 11:01:43", "throughput": 17886.29, "total_tokens": 362653952} +{"current_steps": 1050, "total_steps": 29667, "loss": 0.4648, "lr": 4.756730183074637e-05, "epoch": 0.10618395105425495, "percentage": 3.54, "elapsed_time": "5:41:07", "remaining_time": "6 days, 10:57:20", "throughput": 17889.56, "total_tokens": 366163328} +{"current_steps": 1060, "total_steps": 29667, "loss": 0.4706, "lr": 4.7545790817196314e-05, "epoch": 0.10719522677858118, "percentage": 3.57, "elapsed_time": "5:43:59", "remaining_time": "6 days, 10:43:40", "throughput": 17914.96, "total_tokens": 369760768} +{"current_steps": 1070, "total_steps": 29667, "loss": 0.469, "lr": 4.752430896058212e-05, "epoch": 0.10820650250290742, "percentage": 3.61, "elapsed_time": "5:47:06", "remaining_time": "6 days, 
10:36:57", "throughput": 17920.91, "total_tokens": 373233408} +{"current_steps": 1080, "total_steps": 29667, "loss": 0.467, "lr": 4.750285619509567e-05, "epoch": 0.10921777822723365, "percentage": 3.64, "elapsed_time": "5:50:35", "remaining_time": "6 days, 10:39:51", "throughput": 17912.73, "total_tokens": 376798720} +{"current_steps": 1090, "total_steps": 29667, "loss": 0.4701, "lr": 4.7481432455136644e-05, "epoch": 0.1102290539515599, "percentage": 3.67, "elapsed_time": "5:53:54", "remaining_time": "6 days, 10:38:34", "throughput": 17907.15, "total_tokens": 380249472} +{"current_steps": 1100, "total_steps": 29667, "loss": 0.4704, "lr": 4.7460037675311584e-05, "epoch": 0.11124032967588612, "percentage": 3.71, "elapsed_time": "5:57:29", "remaining_time": "6 days, 10:43:59", "throughput": 17888.08, "total_tokens": 383687680} +{"current_steps": 1110, "total_steps": 29667, "loss": 0.4673, "lr": 4.7438671790433126e-05, "epoch": 0.11225160540021237, "percentage": 3.74, "elapsed_time": "6:00:50", "remaining_time": "6 days, 10:43:23", "throughput": 17880.65, "total_tokens": 387125376} +{"current_steps": 1120, "total_steps": 29667, "loss": 0.4615, "lr": 4.741733473551915e-05, "epoch": 0.11326288112453861, "percentage": 3.78, "elapsed_time": "6:04:02", "remaining_time": "6 days, 10:38:44", "throughput": 17879.08, "total_tokens": 390519936} +{"current_steps": 1130, "total_steps": 29667, "loss": 0.4708, "lr": 4.7396026445791966e-05, "epoch": 0.11427415684886484, "percentage": 3.81, "elapsed_time": "6:07:21", "remaining_time": "6 days, 10:37:12", "throughput": 17873.19, "total_tokens": 393949440} +{"current_steps": 1140, "total_steps": 29667, "loss": 0.4638, "lr": 4.737474685667742e-05, "epoch": 0.11528543257319109, "percentage": 3.84, "elapsed_time": "6:10:47", "remaining_time": "6 days, 10:38:32", "throughput": 17864.92, "total_tokens": 397448704} +{"current_steps": 1150, "total_steps": 29667, "loss": 0.4692, "lr": 4.7353495903804165e-05, "epoch": 0.11629670829751731, 
"percentage": 3.88, "elapsed_time": "6:13:51", "remaining_time": "6 days, 10:30:39", "throughput": 17874.15, "total_tokens": 400941440} +{"current_steps": 1160, "total_steps": 29667, "loss": 0.4648, "lr": 4.733227352300277e-05, "epoch": 0.11730798402184356, "percentage": 3.91, "elapsed_time": "6:16:54", "remaining_time": "6 days, 10:22:21", "throughput": 17886.31, "total_tokens": 404482816} +{"current_steps": 1170, "total_steps": 29667, "loss": 0.472, "lr": 4.731107965030496e-05, "epoch": 0.11831925974616979, "percentage": 3.94, "elapsed_time": "6:20:24", "remaining_time": "6 days, 10:25:33", "throughput": 17874.51, "total_tokens": 407984768} +{"current_steps": 1180, "total_steps": 29667, "loss": 0.4632, "lr": 4.728991422194278e-05, "epoch": 0.11933053547049603, "percentage": 3.98, "elapsed_time": "6:23:17", "remaining_time": "6 days, 10:13:05", "throughput": 17891.72, "total_tokens": 411457792} +{"current_steps": 1190, "total_steps": 29667, "loss": 0.4638, "lr": 4.726877717434773e-05, "epoch": 0.12034181119482226, "percentage": 4.01, "elapsed_time": "6:25:39", "remaining_time": "6 days, 9:48:44", "throughput": 17933.55, "total_tokens": 414966016} +{"current_steps": 1200, "total_steps": 29667, "loss": 0.4592, "lr": 4.724766844415013e-05, "epoch": 0.1213530869191485, "percentage": 4.04, "elapsed_time": "6:27:46", "remaining_time": "6 days, 9:19:07", "throughput": 17983.6, "total_tokens": 418421248} +{"current_steps": 1210, "total_steps": 29667, "loss": 0.4615, "lr": 4.722658796817813e-05, "epoch": 0.12236436264347475, "percentage": 4.08, "elapsed_time": "6:30:16", "remaining_time": "6 days, 8:58:42", "throughput": 18020.13, "total_tokens": 421975296} +{"current_steps": 1220, "total_steps": 29667, "loss": 0.4627, "lr": 4.7205535683457044e-05, "epoch": 0.12337563836780098, "percentage": 4.11, "elapsed_time": "6:32:57", "remaining_time": "6 days, 8:42:37", "throughput": 18046.31, "total_tokens": 425483776} +{"current_steps": 1230, "total_steps": 29667, "loss": 0.461, 
"lr": 4.7184511527208484e-05, "epoch": 0.12438691409212722, "percentage": 4.15, "elapsed_time": "6:35:32", "remaining_time": "6 days, 8:24:43", "throughput": 18081.55, "total_tokens": 429120256} +{"current_steps": 1240, "total_steps": 29667, "loss": 0.4555, "lr": 4.7163515436849644e-05, "epoch": 0.12539818981645345, "percentage": 4.18, "elapsed_time": "6:38:06", "remaining_time": "6 days, 8:06:28", "throughput": 18108.27, "total_tokens": 432535552} +{"current_steps": 1250, "total_steps": 29667, "loss": 0.462, "lr": 4.714254734999245e-05, "epoch": 0.1264094655407797, "percentage": 4.21, "elapsed_time": "6:40:28", "remaining_time": "6 days, 7:44:11", "throughput": 18143.1, "total_tokens": 435949568} +{"current_steps": 1260, "total_steps": 29667, "loss": 0.4565, "lr": 4.712160720444284e-05, "epoch": 0.12742074126510594, "percentage": 4.25, "elapsed_time": "6:43:19", "remaining_time": "6 days, 7:32:58", "throughput": 18159.93, "total_tokens": 439457536} +{"current_steps": 1270, "total_steps": 29667, "loss": 0.4589, "lr": 4.710069493819992e-05, "epoch": 0.12843201698943216, "percentage": 4.28, "elapsed_time": "6:46:19", "remaining_time": "6 days, 7:25:31", "throughput": 18168.98, "total_tokens": 442958592} +{"current_steps": 1280, "total_steps": 29667, "loss": 0.4636, "lr": 4.70798104894553e-05, "epoch": 0.1294432927137584, "percentage": 4.31, "elapsed_time": "6:49:02", "remaining_time": "6 days, 7:11:29", "throughput": 18190.47, "total_tokens": 446441216} +{"current_steps": 1290, "total_steps": 29667, "loss": 0.457, "lr": 4.705895379659219e-05, "epoch": 0.13045456843808464, "percentage": 4.35, "elapsed_time": "6:51:07", "remaining_time": "6 days, 6:43:54", "throughput": 18239.76, "total_tokens": 449934976} +{"current_steps": 1300, "total_steps": 29667, "loss": 0.459, "lr": 4.7038124798184766e-05, "epoch": 0.1314658441624109, "percentage": 4.38, "elapsed_time": "6:52:59", "remaining_time": "6 days, 6:11:46", "throughput": 18298.36, "total_tokens": 453423360} 
+{"current_steps": 1310, "total_steps": 29667, "loss": 0.4543, "lr": 4.7017323432997304e-05, "epoch": 0.13247711988673713, "percentage": 4.42, "elapsed_time": "6:54:47", "remaining_time": "6 days, 5:38:51", "throughput": 18356.88, "total_tokens": 456859008} +{"current_steps": 1320, "total_steps": 29667, "loss": 0.4564, "lr": 4.6996549639983506e-05, "epoch": 0.13348839561106335, "percentage": 4.45, "elapsed_time": "6:56:38", "remaining_time": "6 days, 5:07:32", "throughput": 18415.84, "total_tokens": 460376576} +{"current_steps": 1330, "total_steps": 29667, "loss": 0.4568, "lr": 4.697580335828569e-05, "epoch": 0.1344996713353896, "percentage": 4.48, "elapsed_time": "6:58:28", "remaining_time": "6 days, 4:36:05", "throughput": 18475.77, "total_tokens": 463901440} +{"current_steps": 1340, "total_steps": 29667, "loss": 0.4547, "lr": 4.6955084527234076e-05, "epoch": 0.13551094705971584, "percentage": 4.52, "elapsed_time": "7:00:17", "remaining_time": "6 days, 4:04:48", "throughput": 18532.59, "total_tokens": 467346816} +{"current_steps": 10, "total_steps": 29667, "loss": 1.0459, "lr": 4.9977515176118345e-05, "epoch": 0.001011282116107828, "percentage": 0.03, "elapsed_time": "0:01:49", "remaining_time": "3 days, 17:52:29", "throughput": 26427.79, "total_tokens": 2883200} +{"current_steps": 20, "total_steps": 29667, "loss": 0.8173, "lr": 4.9952567580506e-05, "epoch": 0.002022564232215656, "percentage": 0.07, "elapsed_time": "0:03:34", "remaining_time": "3 days, 16:12:01", "throughput": 27069.53, "total_tokens": 5798336} +{"current_steps": 30, "total_steps": 29667, "loss": 0.7557, "lr": 4.992765730738634e-05, "epoch": 0.003033846348323484, "percentage": 0.1, "elapsed_time": "0:05:17", "remaining_time": "3 days, 14:59:25", "throughput": 27473.62, "total_tokens": 8709184} +{"current_steps": 40, "total_steps": 29667, "loss": 0.722, "lr": 4.9902784263792476e-05, "epoch": 0.004045128464431312, "percentage": 0.13, "elapsed_time": "0:07:02", "remaining_time": "3 days, 15:01:10", 
"throughput": 27536.86, "total_tokens": 11646784} +{"current_steps": 50, "total_steps": 29667, "loss": 0.6983, "lr": 4.987794835708133e-05, "epoch": 0.00505641058053914, "percentage": 0.17, "elapsed_time": "0:08:45", "remaining_time": "3 days, 14:26:40", "throughput": 27732.42, "total_tokens": 14569920} +{"current_steps": 60, "total_steps": 29667, "loss": 0.6801, "lr": 4.985314949493234e-05, "epoch": 0.006067692696646968, "percentage": 0.2, "elapsed_time": "0:10:29", "remaining_time": "3 days, 14:20:06", "throughput": 27754.35, "total_tokens": 17481472} +{"current_steps": 70, "total_steps": 29667, "loss": 0.6657, "lr": 4.982838758534584e-05, "epoch": 0.007078974812754796, "percentage": 0.24, "elapsed_time": "0:12:13", "remaining_time": "3 days, 14:09:49", "throughput": 27773.47, "total_tokens": 20375488} +{"current_steps": 80, "total_steps": 29667, "loss": 0.6541, "lr": 4.980366253664179e-05, "epoch": 0.008090256928862624, "percentage": 0.27, "elapsed_time": "0:13:56", "remaining_time": "3 days, 13:54:18", "throughput": 27856.45, "total_tokens": 23293632} +{"current_steps": 90, "total_steps": 29667, "loss": 0.6487, "lr": 4.977897425745825e-05, "epoch": 0.009101539044970451, "percentage": 0.3, "elapsed_time": "0:15:40", "remaining_time": "3 days, 13:52:52", "throughput": 27850.75, "total_tokens": 26201472} +{"current_steps": 100, "total_steps": 29667, "loss": 0.627, "lr": 4.975432265674997e-05, "epoch": 0.01011282116107828, "percentage": 0.34, "elapsed_time": "0:17:24", "remaining_time": "3 days, 13:48:26", "throughput": 27887.03, "total_tokens": 29135424} +{"current_steps": 110, "total_steps": 29667, "loss": 0.6262, "lr": 4.972970764378705e-05, "epoch": 0.011124103277186107, "percentage": 0.37, "elapsed_time": "0:19:13", "remaining_time": "3 days, 14:05:00", "throughput": 27803.06, "total_tokens": 32066176} +{"current_steps": 120, "total_steps": 29667, "loss": 0.6229, "lr": 4.970512912815344e-05, "epoch": 0.012135385393293936, "percentage": 0.4, "elapsed_time": 
"0:21:00", "remaining_time": "3 days, 14:10:55", "throughput": 27801.07, "total_tokens": 35030720} +{"current_steps": 130, "total_steps": 29667, "loss": 0.6156, "lr": 4.968058701974564e-05, "epoch": 0.013146667509401763, "percentage": 0.44, "elapsed_time": "0:22:45", "remaining_time": "3 days, 14:12:08", "throughput": 27795.18, "total_tokens": 37963648} +{"current_steps": 140, "total_steps": 29667, "loss": 0.6032, "lr": 4.96560812287712e-05, "epoch": 0.014157949625509592, "percentage": 0.47, "elapsed_time": "0:24:30", "remaining_time": "3 days, 14:09:21", "throughput": 27821.25, "total_tokens": 40914112} +{"current_steps": 150, "total_steps": 29667, "loss": 0.5976, "lr": 4.963161166574748e-05, "epoch": 0.015169231741617419, "percentage": 0.51, "elapsed_time": "0:26:13", "remaining_time": "3 days, 14:01:47", "throughput": 27866.24, "total_tokens": 43858048} +{"current_steps": 160, "total_steps": 29667, "loss": 0.5941, "lr": 4.960717824150013e-05, "epoch": 0.01618051385772525, "percentage": 0.54, "elapsed_time": "0:28:03", "remaining_time": "3 days, 14:13:56", "throughput": 27818.66, "total_tokens": 46827776} +{"current_steps": 170, "total_steps": 29667, "loss": 0.5908, "lr": 4.9582780867161893e-05, "epoch": 0.017191795973833076, "percentage": 0.57, "elapsed_time": "0:29:51", "remaining_time": "3 days, 14:19:27", "throughput": 27810.08, "total_tokens": 49809152} +{"current_steps": 180, "total_steps": 29667, "loss": 0.5872, "lr": 4.955841945417105e-05, "epoch": 0.018203078089940903, "percentage": 0.61, "elapsed_time": "0:31:37", "remaining_time": "3 days, 14:19:37", "throughput": 27809.91, "total_tokens": 52758400} +{"current_steps": 190, "total_steps": 29667, "loss": 0.58, "lr": 4.953409391427024e-05, "epoch": 0.01921436020604873, "percentage": 0.64, "elapsed_time": "0:33:31", "remaining_time": "3 days, 14:40:12", "throughput": 27683.34, "total_tokens": 55675008} +{"current_steps": 200, "total_steps": 29667, "loss": 0.5803, "lr": 4.950980415950502e-05, "epoch": 
0.02022564232215656, "percentage": 0.67, "elapsed_time": "0:35:37", "remaining_time": "3 days, 15:28:12", "throughput": 27425.27, "total_tokens": 58614848} +{"current_steps": 210, "total_steps": 29667, "loss": 0.5673, "lr": 4.9485550102222575e-05, "epoch": 0.021236924438264387, "percentage": 0.71, "elapsed_time": "0:37:31", "remaining_time": "3 days, 15:43:45", "throughput": 27330.31, "total_tokens": 61535040} +{"current_steps": 220, "total_steps": 29667, "loss": 0.57, "lr": 4.946133165507037e-05, "epoch": 0.022248206554372214, "percentage": 0.74, "elapsed_time": "0:39:16", "remaining_time": "3 days, 15:36:26", "throughput": 27362.02, "total_tokens": 64472320} +{"current_steps": 230, "total_steps": 29667, "loss": 0.5629, "lr": 4.943714873099483e-05, "epoch": 0.02325948867048004, "percentage": 0.78, "elapsed_time": "0:41:02", "remaining_time": "3 days, 15:33:01", "throughput": 27374.15, "total_tokens": 67411776} +{"current_steps": 240, "total_steps": 29667, "loss": 0.5613, "lr": 4.9413001243240024e-05, "epoch": 0.024270770786587872, "percentage": 0.81, "elapsed_time": "0:42:45", "remaining_time": "3 days, 15:21:57", "throughput": 27415.91, "total_tokens": 70325440} +{"current_steps": 250, "total_steps": 29667, "loss": 0.5599, "lr": 4.938888910534637e-05, "epoch": 0.0252820529026957, "percentage": 0.84, "elapsed_time": "0:44:24", "remaining_time": "3 days, 15:05:13", "throughput": 27479.07, "total_tokens": 73215040} +{"current_steps": 260, "total_steps": 29667, "loss": 0.5573, "lr": 4.936481223114932e-05, "epoch": 0.026293335018803526, "percentage": 0.88, "elapsed_time": "0:46:07", "remaining_time": "3 days, 14:56:05", "throughput": 27511.56, "total_tokens": 76126272} +{"current_steps": 270, "total_steps": 29667, "loss": 0.5571, "lr": 4.934077053477808e-05, "epoch": 0.027304617134911356, "percentage": 0.91, "elapsed_time": "0:47:56", "remaining_time": "3 days, 14:59:56", "throughput": 27502.39, "total_tokens": 79113024} +{"current_steps": 280, "total_steps": 29667, 
"loss": 0.5575, "lr": 4.931676393065431e-05, "epoch": 0.028315899251019183, "percentage": 0.94, "elapsed_time": "0:49:44", "remaining_time": "3 days, 15:00:39", "throughput": 27506.15, "total_tokens": 82093632} +{"current_steps": 290, "total_steps": 29667, "loss": 0.5529, "lr": 4.929279233349088e-05, "epoch": 0.02932718136712701, "percentage": 0.98, "elapsed_time": "0:51:24", "remaining_time": "3 days, 14:48:19", "throughput": 27549.73, "total_tokens": 84987776} +{"current_steps": 300, "total_steps": 29667, "loss": 0.5507, "lr": 4.926885565829051e-05, "epoch": 0.030338463483234837, "percentage": 1.01, "elapsed_time": "0:53:09", "remaining_time": "3 days, 14:42:57", "throughput": 27568.59, "total_tokens": 87917952} +{"current_steps": 310, "total_steps": 29667, "loss": 0.5435, "lr": 4.924495382034461e-05, "epoch": 0.031349745599342664, "percentage": 1.04, "elapsed_time": "0:54:49", "remaining_time": "3 days, 14:31:13", "throughput": 27605.41, "total_tokens": 90795712} +{"current_steps": 320, "total_steps": 29667, "loss": 0.5423, "lr": 4.9221086735231975e-05, "epoch": 0.0323610277154505, "percentage": 1.08, "elapsed_time": "0:56:35", "remaining_time": "3 days, 14:29:48", "throughput": 27613.58, "total_tokens": 93758848} +{"current_steps": 330, "total_steps": 29667, "loss": 0.5425, "lr": 4.919725431881751e-05, "epoch": 0.033372309831558325, "percentage": 1.11, "elapsed_time": "0:58:18", "remaining_time": "3 days, 14:23:55", "throughput": 27632.69, "total_tokens": 96678976} +{"current_steps": 340, "total_steps": 29667, "loss": 0.5367, "lr": 4.917345648725101e-05, "epoch": 0.03438359194766615, "percentage": 1.15, "elapsed_time": "1:00:02", "remaining_time": "3 days, 14:18:40", "throughput": 27646.63, "total_tokens": 99591808} +{"current_steps": 350, "total_steps": 29667, "loss": 0.5363, "lr": 4.914969315696596e-05, "epoch": 0.03539487406377398, "percentage": 1.18, "elapsed_time": "1:01:49", "remaining_time": "3 days, 14:18:43", "throughput": 27659.11, "total_tokens": 
102603136} +{"current_steps": 360, "total_steps": 29667, "loss": 0.5354, "lr": 4.912596424467818e-05, "epoch": 0.036406156179881806, "percentage": 1.21, "elapsed_time": "1:03:30", "remaining_time": "3 days, 14:09:55", "throughput": 27690.02, "total_tokens": 105508928} +{"current_steps": 370, "total_steps": 29667, "loss": 0.5389, "lr": 4.910226966738475e-05, "epoch": 0.03741743829598963, "percentage": 1.25, "elapsed_time": "1:05:12", "remaining_time": "3 days, 14:03:37", "throughput": 27719.05, "total_tokens": 108458368} +{"current_steps": 380, "total_steps": 29667, "loss": 0.5365, "lr": 4.9078609342362666e-05, "epoch": 0.03842872041209746, "percentage": 1.28, "elapsed_time": "1:06:57", "remaining_time": "3 days, 14:00:20", "throughput": 27727.88, "total_tokens": 111392256} +{"current_steps": 390, "total_steps": 29667, "loss": 0.5323, "lr": 4.905498318716775e-05, "epoch": 0.03944000252820529, "percentage": 1.31, "elapsed_time": "1:08:42", "remaining_time": "3 days, 13:58:22", "throughput": 27734.02, "total_tokens": 114344384} +{"current_steps": 400, "total_steps": 29667, "loss": 0.5274, "lr": 4.9031391119633295e-05, "epoch": 0.04045128464431312, "percentage": 1.35, "elapsed_time": "1:10:26", "remaining_time": "3 days, 13:54:16", "throughput": 27747.81, "total_tokens": 117281344} +{"current_steps": 410, "total_steps": 29667, "loss": 0.524, "lr": 4.9007833057869e-05, "epoch": 0.04146256676042095, "percentage": 1.38, "elapsed_time": "1:12:13", "remaining_time": "3 days, 13:53:20", "throughput": 27753.77, "total_tokens": 120258816} +{"current_steps": 420, "total_steps": 29667, "loss": 0.5203, "lr": 4.898430892025967e-05, "epoch": 0.042473848876528775, "percentage": 1.42, "elapsed_time": "1:13:57", "remaining_time": "3 days, 13:50:27", "throughput": 27757.64, "total_tokens": 123182272} +{"current_steps": 430, "total_steps": 29667, "loss": 0.5252, "lr": 4.896081862546415e-05, "epoch": 0.0434851309926366, "percentage": 1.45, "elapsed_time": "1:15:40", "remaining_time": "3 
days, 13:44:49", "throughput": 27769.59, "total_tokens": 126074496} +{"current_steps": 440, "total_steps": 29667, "loss": 0.5146, "lr": 4.8937362092414e-05, "epoch": 0.04449641310874443, "percentage": 1.48, "elapsed_time": "1:17:20", "remaining_time": "3 days, 13:37:35", "throughput": 27791.86, "total_tokens": 128972288} +{"current_steps": 450, "total_steps": 29667, "loss": 0.5193, "lr": 4.891393924031244e-05, "epoch": 0.045507695224852256, "percentage": 1.52, "elapsed_time": "1:19:08", "remaining_time": "3 days, 13:38:47", "throughput": 27789.43, "total_tokens": 131968064} +{"current_steps": 460, "total_steps": 29667, "loss": 0.5193, "lr": 4.8890549988633095e-05, "epoch": 0.04651897734096008, "percentage": 1.55, "elapsed_time": "1:20:53", "remaining_time": "3 days, 13:36:17", "throughput": 27799.59, "total_tokens": 134930624} +{"current_steps": 470, "total_steps": 29667, "loss": 0.5188, "lr": 4.8867194257118907e-05, "epoch": 0.04753025945706792, "percentage": 1.58, "elapsed_time": "1:22:33", "remaining_time": "3 days, 13:28:58", "throughput": 27823.19, "total_tokens": 137831616} +{"current_steps": 480, "total_steps": 29667, "loss": 0.5135, "lr": 4.884387196578093e-05, "epoch": 0.048541541573175744, "percentage": 1.62, "elapsed_time": "1:24:17", "remaining_time": "3 days, 13:25:19", "throughput": 27837.2, "total_tokens": 140783104} +{"current_steps": 490, "total_steps": 29667, "loss": 0.5157, "lr": 4.882058303489718e-05, "epoch": 0.04955282368928357, "percentage": 1.65, "elapsed_time": "1:26:04", "remaining_time": "3 days, 13:25:09", "throughput": 27826.26, "total_tokens": 143704064} +{"current_steps": 500, "total_steps": 29667, "loss": 0.5141, "lr": 4.8797327385011496e-05, "epoch": 0.0505641058053914, "percentage": 1.69, "elapsed_time": "1:27:55", "remaining_time": "3 days, 13:28:56", "throughput": 27802.07, "total_tokens": 146667520} +{"current_steps": 510, "total_steps": 29667, "loss": 0.5058, "lr": 4.8774104936932425e-05, "epoch": 0.051575387921499224, 
"percentage": 1.72, "elapsed_time": "1:29:41", "remaining_time": "3 days, 13:27:49", "throughput": 27798.31, "total_tokens": 149599424} +{"current_steps": 520, "total_steps": 29667, "loss": 0.5112, "lr": 4.8750915611732076e-05, "epoch": 0.05258667003760705, "percentage": 1.75, "elapsed_time": "1:31:26", "remaining_time": "3 days, 13:25:34", "throughput": 27804.2, "total_tokens": 152550464} +{"current_steps": 530, "total_steps": 29667, "loss": 0.5086, "lr": 4.8727759330744986e-05, "epoch": 0.05359795215371488, "percentage": 1.79, "elapsed_time": "1:33:07", "remaining_time": "3 days, 13:19:42", "throughput": 27825.34, "total_tokens": 155477760} +{"current_steps": 540, "total_steps": 29667, "loss": 0.5097, "lr": 4.870463601556696e-05, "epoch": 0.05460923426982271, "percentage": 1.82, "elapsed_time": "1:34:55", "remaining_time": "3 days, 13:20:02", "throughput": 27824.07, "total_tokens": 158468800} +{"current_steps": 550, "total_steps": 29667, "loss": 0.505, "lr": 4.8681545588054075e-05, "epoch": 0.05562051638593054, "percentage": 1.85, "elapsed_time": "1:36:37", "remaining_time": "3 days, 13:15:38", "throughput": 27836.26, "total_tokens": 161390784} +{"current_steps": 560, "total_steps": 29667, "loss": 0.5096, "lr": 4.8658487970321404e-05, "epoch": 0.056631798502038366, "percentage": 1.89, "elapsed_time": "1:38:23", "remaining_time": "3 days, 13:14:20", "throughput": 27840.04, "total_tokens": 164361792} +{"current_steps": 570, "total_steps": 29667, "loss": 0.4983, "lr": 4.863546308474209e-05, "epoch": 0.05764308061814619, "percentage": 1.92, "elapsed_time": "1:40:09", "remaining_time": "3 days, 13:12:39", "throughput": 27845.97, "total_tokens": 167334848} +{"current_steps": 580, "total_steps": 29667, "loss": 0.5078, "lr": 4.86124708539461e-05, "epoch": 0.05865436273425402, "percentage": 1.96, "elapsed_time": "1:42:02", "remaining_time": "3 days, 13:17:32", "throughput": 27811.7, "total_tokens": 170282240} +{"current_steps": 590, "total_steps": 29667, "loss": 0.5015, 
"lr": 4.8589511200819216e-05, "epoch": 0.05966564485036185, "percentage": 1.99, "elapsed_time": "1:43:50", "remaining_time": "3 days, 13:17:40", "throughput": 27807.79, "total_tokens": 173257728} +{"current_steps": 600, "total_steps": 29667, "loss": 0.5013, "lr": 4.8566584048501926e-05, "epoch": 0.060676926966469674, "percentage": 2.02, "elapsed_time": "1:45:34", "remaining_time": "3 days, 13:14:20", "throughput": 27816.29, "total_tokens": 176194240} +{"current_steps": 610, "total_steps": 29667, "loss": 0.5021, "lr": 4.854368932038835e-05, "epoch": 0.06168820908257751, "percentage": 2.06, "elapsed_time": "1:47:14", "remaining_time": "3 days, 13:08:38", "throughput": 27832.44, "total_tokens": 179096640} +{"current_steps": 620, "total_steps": 29667, "loss": 0.4978, "lr": 4.8520826940125144e-05, "epoch": 0.06269949119868533, "percentage": 2.09, "elapsed_time": "1:49:00", "remaining_time": "3 days, 13:06:57", "throughput": 27840.22, "total_tokens": 182085760} +{"current_steps": 630, "total_steps": 29667, "loss": 0.4986, "lr": 4.849799683161046e-05, "epoch": 0.06371077331479316, "percentage": 2.12, "elapsed_time": "1:50:43", "remaining_time": "3 days, 13:03:35", "throughput": 27849.54, "total_tokens": 185026240} +{"current_steps": 640, "total_steps": 29667, "loss": 0.4993, "lr": 4.8475198918992835e-05, "epoch": 0.064722055430901, "percentage": 2.16, "elapsed_time": "1:52:21", "remaining_time": "3 days, 12:55:38", "throughput": 27867.31, "total_tokens": 187854848} +{"current_steps": 650, "total_steps": 29667, "loss": 0.4998, "lr": 4.845243312667023e-05, "epoch": 0.06573333754700882, "percentage": 2.19, "elapsed_time": "1:54:06", "remaining_time": "3 days, 12:53:58", "throughput": 27876.01, "total_tokens": 190852992} +{"current_steps": 660, "total_steps": 29667, "loss": 0.4992, "lr": 4.842969937928884e-05, "epoch": 0.06674461966311665, "percentage": 2.22, "elapsed_time": "1:55:50", "remaining_time": "3 days, 12:50:55", "throughput": 27884.37, "total_tokens": 193798272} 
+{"current_steps": 670, "total_steps": 29667, "loss": 0.4895, "lr": 4.840699760174217e-05, "epoch": 0.06775590177922447, "percentage": 2.26, "elapsed_time": "1:57:29", "remaining_time": "3 days, 12:45:12", "throughput": 27898.04, "total_tokens": 196677888} +{"current_steps": 680, "total_steps": 29667, "loss": 0.4962, "lr": 4.8384327719169906e-05, "epoch": 0.0687671838953323, "percentage": 2.29, "elapsed_time": "1:59:15", "remaining_time": "3 days, 12:43:47", "throughput": 27899.24, "total_tokens": 199635456} +{"current_steps": 690, "total_steps": 29667, "loss": 0.4917, "lr": 4.836168965695694e-05, "epoch": 0.06977846601144012, "percentage": 2.33, "elapsed_time": "2:00:57", "remaining_time": "3 days, 12:39:51", "throughput": 27909.34, "total_tokens": 202557120} +{"current_steps": 700, "total_steps": 29667, "loss": 0.4902, "lr": 4.8339083340732304e-05, "epoch": 0.07078974812754796, "percentage": 2.36, "elapsed_time": "2:02:46", "remaining_time": "3 days, 12:40:32", "throughput": 27894.33, "total_tokens": 205480832} +{"current_steps": 710, "total_steps": 29667, "loss": 0.4883, "lr": 4.8316508696368154e-05, "epoch": 0.07180103024365579, "percentage": 2.39, "elapsed_time": "2:04:27", "remaining_time": "3 days, 12:35:47", "throughput": 27906.76, "total_tokens": 208386496} +{"current_steps": 720, "total_steps": 29667, "loss": 0.4902, "lr": 4.8293965649978714e-05, "epoch": 0.07281231235976361, "percentage": 2.43, "elapsed_time": "2:06:08", "remaining_time": "3 days, 12:31:38", "throughput": 27917.76, "total_tokens": 211305088} +{"current_steps": 730, "total_steps": 29667, "loss": 0.4877, "lr": 4.8271454127919364e-05, "epoch": 0.07382359447587145, "percentage": 2.46, "elapsed_time": "2:07:48", "remaining_time": "3 days, 12:26:11", "throughput": 27931.75, "total_tokens": 214190272} +{"current_steps": 740, "total_steps": 29667, "loss": 0.4915, "lr": 4.824897405678549e-05, "epoch": 0.07483487659197927, "percentage": 2.49, "elapsed_time": "2:09:30", "remaining_time": "3 days, 
12:22:32", "throughput": 27937.26, "total_tokens": 217085888} +{"current_steps": 750, "total_steps": 29667, "loss": 0.4868, "lr": 4.8226525363411576e-05, "epoch": 0.0758461587080871, "percentage": 2.53, "elapsed_time": "2:11:12", "remaining_time": "3 days, 12:18:42", "throughput": 27948.73, "total_tokens": 220019648} +{"current_steps": 760, "total_steps": 29667, "loss": 0.4851, "lr": 4.820410797487017e-05, "epoch": 0.07685744082419492, "percentage": 2.56, "elapsed_time": "2:12:54", "remaining_time": "3 days, 12:15:15", "throughput": 27961.85, "total_tokens": 222982336} +{"current_steps": 770, "total_steps": 29667, "loss": 0.4874, "lr": 4.818172181847091e-05, "epoch": 0.07786872294030275, "percentage": 2.6, "elapsed_time": "2:14:37", "remaining_time": "3 days, 12:12:32", "throughput": 27965.91, "total_tokens": 225905920} +{"current_steps": 780, "total_steps": 29667, "loss": 0.4851, "lr": 4.81593668217595e-05, "epoch": 0.07888000505641057, "percentage": 2.63, "elapsed_time": "2:16:21", "remaining_time": "3 days, 12:10:10", "throughput": 27969.81, "total_tokens": 228844032} +{"current_steps": 790, "total_steps": 29667, "loss": 0.4839, "lr": 4.813704291251675e-05, "epoch": 0.07989128717251841, "percentage": 2.66, "elapsed_time": "2:18:05", "remaining_time": "3 days, 12:07:27", "throughput": 27975.97, "total_tokens": 231784640} +{"current_steps": 800, "total_steps": 29667, "loss": 0.4878, "lr": 4.811475001875759e-05, "epoch": 0.08090256928862624, "percentage": 2.7, "elapsed_time": "2:19:48", "remaining_time": "3 days, 12:04:30", "throughput": 27981.24, "total_tokens": 234706688} +{"current_steps": 810, "total_steps": 29667, "loss": 0.4864, "lr": 4.8092488068730105e-05, "epoch": 0.08191385140473406, "percentage": 2.73, "elapsed_time": "2:21:50", "remaining_time": "3 days, 12:13:09", "throughput": 27924.82, "total_tokens": 237650688} +{"current_steps": 820, "total_steps": 29667, "loss": 0.4821, "lr": 4.807025699091452e-05, "epoch": 0.0829251335208419, "percentage": 2.76, 
"elapsed_time": "2:23:39", "remaining_time": "3 days, 12:13:40", "throughput": 27914.24, "total_tokens": 240600768} +{"current_steps": 830, "total_steps": 29667, "loss": 0.4885, "lr": 4.8048056714022325e-05, "epoch": 0.08393641563694972, "percentage": 2.8, "elapsed_time": "2:25:22", "remaining_time": "3 days, 12:10:54", "throughput": 27921.88, "total_tokens": 243553216} +{"current_steps": 840, "total_steps": 29667, "loss": 0.4834, "lr": 4.802588716699519e-05, "epoch": 0.08494769775305755, "percentage": 2.83, "elapsed_time": "2:27:06", "remaining_time": "3 days, 12:08:13", "throughput": 27930.17, "total_tokens": 246515392} +{"current_steps": 850, "total_steps": 29667, "loss": 0.4758, "lr": 4.8003748279004156e-05, "epoch": 0.08595897986916537, "percentage": 2.87, "elapsed_time": "2:28:46", "remaining_time": "3 days, 12:03:41", "throughput": 27940.93, "total_tokens": 249407936} +{"current_steps": 860, "total_steps": 29667, "loss": 0.4843, "lr": 4.798163997944854e-05, "epoch": 0.0869702619852732, "percentage": 2.9, "elapsed_time": "2:30:30", "remaining_time": "3 days, 12:01:35", "throughput": 27944.63, "total_tokens": 252358208} +{"current_steps": 870, "total_steps": 29667, "loss": 0.4812, "lr": 4.79595621979551e-05, "epoch": 0.08798154410138104, "percentage": 2.93, "elapsed_time": "2:32:12", "remaining_time": "3 days, 11:58:12", "throughput": 27957.21, "total_tokens": 255324672} +{"current_steps": 880, "total_steps": 29667, "loss": 0.4785, "lr": 4.793751486437702e-05, "epoch": 0.08899282621748886, "percentage": 2.97, "elapsed_time": "2:33:53", "remaining_time": "3 days, 11:54:07", "throughput": 27967.73, "total_tokens": 258237312} +{"current_steps": 890, "total_steps": 29667, "loss": 0.4793, "lr": 4.7915497908793064e-05, "epoch": 0.09000410833359669, "percentage": 3.0, "elapsed_time": "2:35:36", "remaining_time": "3 days, 11:51:11", "throughput": 27971.34, "total_tokens": 261144128} +{"current_steps": 900, "total_steps": 29667, "loss": 0.4796, "lr": 
4.7893511261506516e-05, "epoch": 0.09101539044970451, "percentage": 3.03, "elapsed_time": "2:37:19", "remaining_time": "3 days, 11:48:22", "throughput": 27980.37, "total_tokens": 264107200} +{"current_steps": 910, "total_steps": 29667, "loss": 0.4738, "lr": 4.787155485304435e-05, "epoch": 0.09202667256581235, "percentage": 3.07, "elapsed_time": "2:39:00", "remaining_time": "3 days, 11:44:44", "throughput": 27990.04, "total_tokens": 267033600} +{"current_steps": 920, "total_steps": 29667, "loss": 0.4748, "lr": 4.784962861415629e-05, "epoch": 0.09303795468192017, "percentage": 3.1, "elapsed_time": "2:40:41", "remaining_time": "3 days, 11:41:11", "throughput": 27997.27, "total_tokens": 269941312} +{"current_steps": 930, "total_steps": 29667, "loss": 0.4738, "lr": 4.7827732475813884e-05, "epoch": 0.094049236798028, "percentage": 3.13, "elapsed_time": "2:42:32", "remaining_time": "3 days, 11:42:45", "throughput": 27980.29, "total_tokens": 272890240} +{"current_steps": 940, "total_steps": 29667, "loss": 0.476, "lr": 4.7805866369209576e-05, "epoch": 0.09506051891413583, "percentage": 3.17, "elapsed_time": "2:44:21", "remaining_time": "3 days, 11:42:58", "throughput": 27971.73, "total_tokens": 275847552} +{"current_steps": 950, "total_steps": 29667, "loss": 0.4706, "lr": 4.778403022575583e-05, "epoch": 0.09607180103024365, "percentage": 3.2, "elapsed_time": "2:46:03", "remaining_time": "3 days, 11:39:31", "throughput": 27981.88, "total_tokens": 278788992} +{"current_steps": 960, "total_steps": 29667, "loss": 0.4756, "lr": 4.7762223977084195e-05, "epoch": 0.09708308314635149, "percentage": 3.24, "elapsed_time": "2:47:43", "remaining_time": "3 days, 11:35:43", "throughput": 27989.67, "total_tokens": 281686464} +{"current_steps": 970, "total_steps": 29667, "loss": 0.4704, "lr": 4.774044755504444e-05, "epoch": 0.09809436526245931, "percentage": 3.27, "elapsed_time": "2:49:27", "remaining_time": "3 days, 11:33:20", "throughput": 27994.9, "total_tokens": 284637696} 
+{"current_steps": 980, "total_steps": 29667, "loss": 0.4725, "lr": 4.7718700891703616e-05, "epoch": 0.09910564737856714, "percentage": 3.3, "elapsed_time": "2:51:08", "remaining_time": "3 days, 11:29:29", "throughput": 28003.33, "total_tokens": 287538496} +{"current_steps": 990, "total_steps": 29667, "loss": 0.4756, "lr": 4.7696983919345215e-05, "epoch": 0.10011692949467496, "percentage": 3.34, "elapsed_time": "2:52:54", "remaining_time": "3 days, 11:28:21", "throughput": 28004.25, "total_tokens": 290517056} +{"current_steps": 1000, "total_steps": 29667, "loss": 0.4748, "lr": 4.7675296570468216e-05, "epoch": 0.1011282116107828, "percentage": 3.37, "elapsed_time": "2:54:40", "remaining_time": "3 days, 11:27:34", "throughput": 27999.89, "total_tokens": 293462592} +{"current_steps": 1010, "total_steps": 29667, "loss": 0.4719, "lr": 4.76536387777863e-05, "epoch": 0.10213949372689063, "percentage": 3.4, "elapsed_time": "2:56:24", "remaining_time": "3 days, 11:25:07", "throughput": 28005.27, "total_tokens": 296412864} +{"current_steps": 1020, "total_steps": 29667, "loss": 0.4729, "lr": 4.7632010474226915e-05, "epoch": 0.10315077584299845, "percentage": 3.44, "elapsed_time": "2:58:16", "remaining_time": "3 days, 11:26:50", "throughput": 27990.81, "total_tokens": 299399680} +{"current_steps": 1030, "total_steps": 29667, "loss": 0.467, "lr": 4.761041159293035e-05, "epoch": 0.10416205795910628, "percentage": 3.47, "elapsed_time": "3:00:11", "remaining_time": "3 days, 11:30:01", "throughput": 27963.21, "total_tokens": 302334656} +{"current_steps": 1040, "total_steps": 29667, "loss": 0.4667, "lr": 4.7588842067249e-05, "epoch": 0.1051733400752141, "percentage": 3.51, "elapsed_time": "3:02:16", "remaining_time": "3 days, 11:37:10", "throughput": 27914.99, "total_tokens": 305284736} +{"current_steps": 1050, "total_steps": 29667, "loss": 0.4651, "lr": 4.756730183074637e-05, "epoch": 0.10618462219132194, "percentage": 3.54, "elapsed_time": "3:04:18", "remaining_time": "3 days, 
11:43:15", "throughput": 27872.28, "total_tokens": 308229888} +{"current_steps": 1060, "total_steps": 29667, "loss": 0.4708, "lr": 4.7545790817196314e-05, "epoch": 0.10719590430742976, "percentage": 3.57, "elapsed_time": "3:06:20", "remaining_time": "3 days, 11:48:49", "throughput": 27837.1, "total_tokens": 311225152} +{"current_steps": 1070, "total_steps": 29667, "loss": 0.4688, "lr": 4.752430896058212e-05, "epoch": 0.10820718642353759, "percentage": 3.61, "elapsed_time": "3:08:22", "remaining_time": "3 days, 11:54:41", "throughput": 27794.5, "total_tokens": 314157248} +{"current_steps": 1080, "total_steps": 29667, "loss": 0.4669, "lr": 4.750285619509567e-05, "epoch": 0.10921846853964542, "percentage": 3.64, "elapsed_time": "3:10:17", "remaining_time": "3 days, 11:56:59", "throughput": 27775.33, "total_tokens": 317129728} +{"current_steps": 1090, "total_steps": 29667, "loss": 0.4702, "lr": 4.7481432455136644e-05, "epoch": 0.11022975065575324, "percentage": 3.67, "elapsed_time": "3:12:08", "remaining_time": "3 days, 11:57:32", "throughput": 27760.29, "total_tokens": 320039872} +{"current_steps": 1100, "total_steps": 29667, "loss": 0.4703, "lr": 4.7460037675311584e-05, "epoch": 0.11124103277186108, "percentage": 3.71, "elapsed_time": "3:14:03", "remaining_time": "3 days, 11:59:32", "throughput": 27736.76, "total_tokens": 322943168} +{"current_steps": 1110, "total_steps": 29667, "loss": 0.4674, "lr": 4.7438671790433126e-05, "epoch": 0.1122523148879689, "percentage": 3.74, "elapsed_time": "3:16:00", "remaining_time": "3 days, 12:02:33", "throughput": 27707.53, "total_tokens": 325843904} +{"current_steps": 1120, "total_steps": 29667, "loss": 0.4615, "lr": 4.741733473551915e-05, "epoch": 0.11326359700407673, "percentage": 3.78, "elapsed_time": "3:17:48", "remaining_time": "3 days, 12:01:42", "throughput": 27698.97, "total_tokens": 328737792} +{"current_steps": 1130, "total_steps": 29667, "loss": 0.4711, "lr": 4.7396026445791966e-05, "epoch": 0.11427487912018455, 
"percentage": 3.81, "elapsed_time": "3:19:43", "remaining_time": "3 days, 12:03:38", "throughput": 27676.87, "total_tokens": 331652288} +{"current_steps": 1140, "total_steps": 29667, "loss": 0.464, "lr": 4.737474685667742e-05, "epoch": 0.11528616123629239, "percentage": 3.84, "elapsed_time": "3:21:42", "remaining_time": "3 days, 12:07:27", "throughput": 27647.79, "total_tokens": 334606016} +{"current_steps": 1150, "total_steps": 29667, "loss": 0.4693, "lr": 4.7353495903804165e-05, "epoch": 0.11629744335240022, "percentage": 3.88, "elapsed_time": "3:23:32", "remaining_time": "3 days, 12:07:25", "throughput": 27640.02, "total_tokens": 337561856} +{"current_steps": 1160, "total_steps": 29667, "loss": 0.4648, "lr": 4.733227352300277e-05, "epoch": 0.11730872546850804, "percentage": 3.91, "elapsed_time": "3:25:17", "remaining_time": "3 days, 12:05:01", "throughput": 27644.84, "total_tokens": 340514304} +{"current_steps": 1170, "total_steps": 29667, "loss": 0.4717, "lr": 4.731107965030496e-05, "epoch": 0.11832000758461587, "percentage": 3.94, "elapsed_time": "3:27:22", "remaining_time": "3 days, 12:10:48", "throughput": 27603.61, "total_tokens": 343450880} +{"current_steps": 1180, "total_steps": 29667, "loss": 0.4636, "lr": 4.728991422194278e-05, "epoch": 0.1193312897007237, "percentage": 3.98, "elapsed_time": "3:29:37", "remaining_time": "3 days, 12:20:50", "throughput": 27537.55, "total_tokens": 346365888} +{"current_steps": 1190, "total_steps": 29667, "loss": 0.4638, "lr": 4.726877717434773e-05, "epoch": 0.12034257181683153, "percentage": 4.01, "elapsed_time": "3:31:23", "remaining_time": "3 days, 12:18:28", "throughput": 27540.91, "total_tokens": 349302784} +{"current_steps": 1200, "total_steps": 29667, "loss": 0.4593, "lr": 4.724766844415013e-05, "epoch": 0.12135385393293935, "percentage": 4.04, "elapsed_time": "3:33:05", "remaining_time": "3 days, 12:14:54", "throughput": 27548.24, "total_tokens": 352206656} +{"current_steps": 1210, "total_steps": 29667, "loss": 
0.4611, "lr": 4.722658796817813e-05, "epoch": 0.12236513604904718, "percentage": 4.08, "elapsed_time": "3:34:52", "remaining_time": "3 days, 12:13:25", "throughput": 27548.22, "total_tokens": 355162432} +{"current_steps": 1220, "total_steps": 29667, "loss": 0.4625, "lr": 4.7205535683457044e-05, "epoch": 0.12337641816515502, "percentage": 4.11, "elapsed_time": "3:36:36", "remaining_time": "3 days, 12:10:39", "throughput": 27553.61, "total_tokens": 358097216} +{"current_steps": 1230, "total_steps": 29667, "loss": 0.4615, "lr": 4.7184511527208484e-05, "epoch": 0.12438770028126284, "percentage": 4.15, "elapsed_time": "3:38:25", "remaining_time": "3 days, 12:09:45", "throughput": 27556.29, "total_tokens": 361129664} +{"current_steps": 1240, "total_steps": 29667, "loss": 0.4555, "lr": 4.7163515436849644e-05, "epoch": 0.12539898239737066, "percentage": 4.18, "elapsed_time": "3:40:05", "remaining_time": "3 days, 12:05:46", "throughput": 27565.1, "total_tokens": 364023168} +{"current_steps": 1250, "total_steps": 29667, "loss": 0.4621, "lr": 4.714254734999245e-05, "epoch": 0.1264102645134785, "percentage": 4.21, "elapsed_time": "3:41:45", "remaining_time": "3 days, 12:01:28", "throughput": 27575.96, "total_tokens": 366920512} +{"current_steps": 1260, "total_steps": 29667, "loss": 0.4565, "lr": 4.712160720444284e-05, "epoch": 0.12742154662958632, "percentage": 4.25, "elapsed_time": "3:43:29", "remaining_time": "3 days, 11:58:46", "throughput": 27580.83, "total_tokens": 369852992} +{"current_steps": 1270, "total_steps": 29667, "loss": 0.4585, "lr": 4.710069493819992e-05, "epoch": 0.12843282874569414, "percentage": 4.28, "elapsed_time": "3:45:18", "remaining_time": "3 days, 11:57:46", "throughput": 27577.79, "total_tokens": 372803584} +{"current_steps": 1280, "total_steps": 29667, "loss": 0.4636, "lr": 4.70798104894553e-05, "epoch": 0.129444110861802, "percentage": 4.31, "elapsed_time": "3:47:01", "remaining_time": "3 days, 11:54:54", "throughput": 27584.18, "total_tokens": 
375745024} +{"current_steps": 1290, "total_steps": 29667, "loss": 0.4569, "lr": 4.705895379659219e-05, "epoch": 0.1304553929779098, "percentage": 4.35, "elapsed_time": "3:48:47", "remaining_time": "3 days, 11:52:53", "throughput": 27587.17, "total_tokens": 378703040} +{"current_steps": 1300, "total_steps": 29667, "loss": 0.4589, "lr": 4.7038124798184766e-05, "epoch": 0.13146667509401763, "percentage": 4.38, "elapsed_time": "3:50:31", "remaining_time": "3 days, 11:50:16", "throughput": 27591.48, "total_tokens": 381634752} +{"current_steps": 1310, "total_steps": 29667, "loss": 0.4542, "lr": 4.7017323432997304e-05, "epoch": 0.13247795721012545, "percentage": 4.42, "elapsed_time": "3:52:16", "remaining_time": "3 days, 11:47:49", "throughput": 27593.76, "total_tokens": 384550208} +{"current_steps": 1320, "total_steps": 29667, "loss": 0.4564, "lr": 4.6996549639983506e-05, "epoch": 0.1334892393262333, "percentage": 4.45, "elapsed_time": "3:53:58", "remaining_time": "3 days, 11:44:37", "throughput": 27602.74, "total_tokens": 387502208} +{"current_steps": 1330, "total_steps": 29667, "loss": 0.4569, "lr": 4.697580335828569e-05, "epoch": 0.13450052144234112, "percentage": 4.48, "elapsed_time": "3:55:42", "remaining_time": "3 days, 11:41:51", "throughput": 27609.35, "total_tokens": 390454208} +{"current_steps": 1340, "total_steps": 29667, "loss": 0.4544, "lr": 4.6955084527234076e-05, "epoch": 0.13551180355844894, "percentage": 4.52, "elapsed_time": "3:57:22", "remaining_time": "3 days, 11:37:51", "throughput": 27618.58, "total_tokens": 393346048} +{"current_steps": 1350, "total_steps": 29667, "loss": 0.4563, "lr": 4.6934393086346034e-05, "epoch": 0.1365230856745568, "percentage": 4.55, "elapsed_time": "3:59:01", "remaining_time": "3 days, 11:33:50", "throughput": 27625.91, "total_tokens": 396209984} +{"current_steps": 1360, "total_steps": 29667, "loss": 0.4566, "lr": 4.6913728975325324e-05, "epoch": 0.1375343677906646, "percentage": 4.58, "elapsed_time": "4:00:44", 
"remaining_time": "3 days, 11:30:49", "throughput": 27631.28, "total_tokens": 399122816} +{"current_steps": 1370, "total_steps": 29667, "loss": 0.4598, "lr": 4.6893092134061393e-05, "epoch": 0.13854564990677243, "percentage": 4.62, "elapsed_time": "4:02:29", "remaining_time": "3 days, 11:28:29", "throughput": 27635.31, "total_tokens": 402070272} +{"current_steps": 1380, "total_steps": 29667, "loss": 0.4514, "lr": 4.687248250262859e-05, "epoch": 0.13955693202288025, "percentage": 4.65, "elapsed_time": "4:04:14", "remaining_time": "3 days, 11:26:18", "throughput": 27640.7, "total_tokens": 405051456} +{"current_steps": 1390, "total_steps": 29667, "loss": 0.4551, "lr": 4.685190002128548e-05, "epoch": 0.1405682141389881, "percentage": 4.69, "elapsed_time": "4:05:58", "remaining_time": "3 days, 11:23:58", "throughput": 27646.78, "total_tokens": 408029760} +{"current_steps": 1400, "total_steps": 29667, "loss": 0.4492, "lr": 4.6831344630474114e-05, "epoch": 0.14157949625509592, "percentage": 4.72, "elapsed_time": "4:07:44", "remaining_time": "3 days, 11:22:01", "throughput": 27649.59, "total_tokens": 410992320} +{"current_steps": 1410, "total_steps": 29667, "loss": 0.4526, "lr": 4.6810816270819276e-05, "epoch": 0.14259077837120374, "percentage": 4.75, "elapsed_time": "4:09:26", "remaining_time": "3 days, 11:18:45", "throughput": 27657.67, "total_tokens": 413925504} +{"current_steps": 1420, "total_steps": 29667, "loss": 0.4525, "lr": 4.679031488312777e-05, "epoch": 0.14360206048731158, "percentage": 4.79, "elapsed_time": "4:11:11", "remaining_time": "3 days, 11:16:39", "throughput": 27656.36, "total_tokens": 416812928} +{"current_steps": 1430, "total_steps": 29667, "loss": 0.4534, "lr": 4.6769840408387717e-05, "epoch": 0.1446133426034194, "percentage": 4.82, "elapsed_time": "4:12:54", "remaining_time": "3 days, 11:13:56", "throughput": 27661.86, "total_tokens": 419752576} +{"current_steps": 1440, "total_steps": 29667, "loss": 0.4528, "lr": 4.674939278776787e-05, "epoch": 
0.14562462471952722, "percentage": 4.85, "elapsed_time": "4:14:36", "remaining_time": "3 days, 11:10:49", "throughput": 27668.16, "total_tokens": 422670848} +{"current_steps": 1450, "total_steps": 29667, "loss": 0.4496, "lr": 4.672897196261683e-05, "epoch": 0.14663590683563504, "percentage": 4.89, "elapsed_time": "4:16:22", "remaining_time": "3 days, 11:08:56", "throughput": 27671.6, "total_tokens": 425648448} +{"current_steps": 1460, "total_steps": 29667, "loss": 0.4558, "lr": 4.670857787446238e-05, "epoch": 0.1476471889517429, "percentage": 4.92, "elapsed_time": "4:18:07", "remaining_time": "3 days, 11:06:48", "throughput": 27677.32, "total_tokens": 428640576} +{"current_steps": 1470, "total_steps": 29667, "loss": 0.4562, "lr": 4.668821046501082e-05, "epoch": 0.1486584710678507, "percentage": 4.96, "elapsed_time": "4:19:51", "remaining_time": "3 days, 11:04:28", "throughput": 27682.07, "total_tokens": 431602432} +{"current_steps": 1480, "total_steps": 29667, "loss": 0.446, "lr": 4.6667869676146194e-05, "epoch": 0.14966975318395853, "percentage": 4.99, "elapsed_time": "4:21:33", "remaining_time": "3 days, 11:01:31", "throughput": 27689.7, "total_tokens": 434554560} +{"current_steps": 1490, "total_steps": 29667, "loss": 0.4499, "lr": 4.6647555449929645e-05, "epoch": 0.15068103530006635, "percentage": 5.02, "elapsed_time": "4:23:11", "remaining_time": "3 days, 10:57:06", "throughput": 27700.56, "total_tokens": 437429952} +{"current_steps": 1500, "total_steps": 29667, "loss": 0.455, "lr": 4.662726772859869e-05, "epoch": 0.1516923174161742, "percentage": 5.06, "elapsed_time": "4:24:58", "remaining_time": "3 days, 10:55:43", "throughput": 27701.05, "total_tokens": 440406656} +{"current_steps": 1510, "total_steps": 29667, "loss": 0.4539, "lr": 4.660700645456655e-05, "epoch": 0.15270359953228202, "percentage": 5.09, "elapsed_time": "4:26:39", "remaining_time": "3 days, 10:52:27", "throughput": 27709.95, "total_tokens": 443351552} +{"current_steps": 1520, "total_steps": 
29667, "loss": 0.4458, "lr": 4.658677157042149e-05, "epoch": 0.15371488164838984, "percentage": 5.12, "elapsed_time": "4:28:27", "remaining_time": "3 days, 10:51:11", "throughput": 27708.44, "total_tokens": 446308224} +{"current_steps": 1530, "total_steps": 29667, "loss": 0.4511, "lr": 4.656656301892605e-05, "epoch": 0.1547261637644977, "percentage": 5.16, "elapsed_time": "4:30:13", "remaining_time": "3 days, 10:49:29", "throughput": 27708.24, "total_tokens": 449248256} +{"current_steps": 1540, "total_steps": 29667, "loss": 0.4479, "lr": 4.6546380743016465e-05, "epoch": 0.1557374458806055, "percentage": 5.19, "elapsed_time": "4:32:03", "remaining_time": "3 days, 10:48:59", "throughput": 27700.68, "total_tokens": 452175168} +{"current_steps": 1550, "total_steps": 29667, "loss": 0.4484, "lr": 4.652622468580193e-05, "epoch": 0.15674872799671333, "percentage": 5.22, "elapsed_time": "4:34:23", "remaining_time": "3 days, 10:57:35", "throughput": 27641.32, "total_tokens": 455083968} +{"current_steps": 1560, "total_steps": 29667, "loss": 0.4429, "lr": 4.650609479056392e-05, "epoch": 0.15776001011282115, "percentage": 5.26, "elapsed_time": "4:36:17", "remaining_time": "3 days, 10:58:07", "throughput": 27630.05, "total_tokens": 458045760} +{"current_steps": 1570, "total_steps": 29667, "loss": 0.4477, "lr": 4.648599100075556e-05, "epoch": 0.158771292228929, "percentage": 5.29, "elapsed_time": "4:37:59", "remaining_time": "3 days, 10:54:59", "throughput": 27637.74, "total_tokens": 460984384} +{"current_steps": 1580, "total_steps": 29667, "loss": 0.4426, "lr": 4.6465913260000945e-05, "epoch": 0.15978257434503682, "percentage": 5.33, "elapsed_time": "4:39:40", "remaining_time": "3 days, 10:51:38", "throughput": 27648.55, "total_tokens": 463953984} +{"current_steps": 1590, "total_steps": 29667, "loss": 0.4447, "lr": 4.644586151209444e-05, "epoch": 0.16079385646114464, "percentage": 5.36, "elapsed_time": "4:41:22", "remaining_time": "3 days, 10:48:31", "throughput": 27653.79, 
"total_tokens": 466852608} +{"current_steps": 1600, "total_steps": 29667, "loss": 0.4482, "lr": 4.6425835701000084e-05, "epoch": 0.16180513857725248, "percentage": 5.39, "elapsed_time": "4:43:02", "remaining_time": "3 days, 10:45:03", "throughput": 27661.21, "total_tokens": 469754560} +{"current_steps": 1610, "total_steps": 29667, "loss": 0.4483, "lr": 4.640583577085084e-05, "epoch": 0.1628164206933603, "percentage": 5.43, "elapsed_time": "4:44:43", "remaining_time": "3 days, 10:41:45", "throughput": 27670.56, "total_tokens": 472704320} +{"current_steps": 1620, "total_steps": 29667, "loss": 0.4448, "lr": 4.638586166594806e-05, "epoch": 0.16382770280946812, "percentage": 5.46, "elapsed_time": "4:46:26", "remaining_time": "3 days, 10:39:14", "throughput": 27678.61, "total_tokens": 475706560} +{"current_steps": 1630, "total_steps": 29667, "loss": 0.4482, "lr": 4.6365913330760726e-05, "epoch": 0.16483898492557594, "percentage": 5.49, "elapsed_time": "4:48:05", "remaining_time": "3 days, 10:35:20", "throughput": 27690.96, "total_tokens": 478651328} +{"current_steps": 1640, "total_steps": 29667, "loss": 0.4448, "lr": 4.6345990709924855e-05, "epoch": 0.1658502670416838, "percentage": 5.53, "elapsed_time": "4:49:47", "remaining_time": "3 days, 10:32:25", "throughput": 27696.34, "total_tokens": 481568704} +{"current_steps": 1650, "total_steps": 29667, "loss": 0.4433, "lr": 4.632609374824284e-05, "epoch": 0.1668615491577916, "percentage": 5.56, "elapsed_time": "4:51:31", "remaining_time": "3 days, 10:30:08", "throughput": 27699.07, "total_tokens": 484502656} +{"current_steps": 1660, "total_steps": 29667, "loss": 0.4502, "lr": 4.630622239068285e-05, "epoch": 0.16787283127389943, "percentage": 5.6, "elapsed_time": "4:53:20", "remaining_time": "3 days, 10:29:16", "throughput": 27696.09, "total_tokens": 487475840} +{"current_steps": 1670, "total_steps": 29667, "loss": 0.4422, "lr": 4.628637658237808e-05, "epoch": 0.16888411339000728, "percentage": 5.63, "elapsed_time": 
"4:55:02", "remaining_time": "3 days, 10:26:19", "throughput": 27702.22, "total_tokens": 490403456} +{"current_steps": 1680, "total_steps": 29667, "loss": 0.4413, "lr": 4.626655626862625e-05, "epoch": 0.1698953955061151, "percentage": 5.66, "elapsed_time": "4:56:45", "remaining_time": "3 days, 10:23:47", "throughput": 27706.97, "total_tokens": 493347968} +{"current_steps": 1690, "total_steps": 29667, "loss": 0.4424, "lr": 4.624676139488888e-05, "epoch": 0.17090667762222292, "percentage": 5.7, "elapsed_time": "4:58:27", "remaining_time": "3 days, 10:20:48", "throughput": 27713.35, "total_tokens": 496277184} +{"current_steps": 1700, "total_steps": 29667, "loss": 0.4396, "lr": 4.6226991906790686e-05, "epoch": 0.17191795973833074, "percentage": 5.73, "elapsed_time": "5:00:08", "remaining_time": "3 days, 10:17:43", "throughput": 27718.1, "total_tokens": 499165824} +{"current_steps": 1710, "total_steps": 29667, "loss": 0.4418, "lr": 4.620724775011897e-05, "epoch": 0.1729292418544386, "percentage": 5.76, "elapsed_time": "5:01:48", "remaining_time": "3 days, 10:14:10", "throughput": 27727.99, "total_tokens": 502099456} +{"current_steps": 1720, "total_steps": 29667, "loss": 0.4431, "lr": 4.618752887082297e-05, "epoch": 0.1739405239705464, "percentage": 5.8, "elapsed_time": "5:03:30", "remaining_time": "3 days, 10:11:28", "throughput": 27733.82, "total_tokens": 505046400} +{"current_steps": 1730, "total_steps": 29667, "loss": 0.4443, "lr": 4.616783521501325e-05, "epoch": 0.17495180608665423, "percentage": 5.83, "elapsed_time": "5:05:11", "remaining_time": "3 days, 10:08:17", "throughput": 27740.01, "total_tokens": 507950336} +{"current_steps": 1740, "total_steps": 29667, "loss": 0.4396, "lr": 4.614816672896108e-05, "epoch": 0.17596308820276207, "percentage": 5.87, "elapsed_time": "5:06:52", "remaining_time": "3 days, 10:05:20", "throughput": 27748.84, "total_tokens": 510925952} +{"current_steps": 1750, "total_steps": 29667, "loss": 0.4412, "lr": 4.612852335909782e-05, 
"epoch": 0.1769743703188699, "percentage": 5.9, "elapsed_time": "5:08:33", "remaining_time": "3 days, 10:02:12", "throughput": 27756.95, "total_tokens": 513869632} +{"current_steps": 1760, "total_steps": 29667, "loss": 0.4437, "lr": 4.6108905052014323e-05, "epoch": 0.17798565243497771, "percentage": 5.93, "elapsed_time": "5:10:14", "remaining_time": "3 days, 9:59:16", "throughput": 27763.02, "total_tokens": 516795712} +{"current_steps": 1770, "total_steps": 29667, "loss": 0.436, "lr": 4.608931175446027e-05, "epoch": 0.17899693455108553, "percentage": 5.97, "elapsed_time": "5:11:59", "remaining_time": "3 days, 9:57:13", "throughput": 27764.1, "total_tokens": 519721856} +{"current_steps": 1780, "total_steps": 29667, "loss": 0.4455, "lr": 4.606974341334367e-05, "epoch": 0.18000821666719338, "percentage": 6.0, "elapsed_time": "5:13:39", "remaining_time": "3 days, 9:54:09", "throughput": 27770.59, "total_tokens": 522641600} +{"current_steps": 1790, "total_steps": 29667, "loss": 0.4409, "lr": 4.605019997573011e-05, "epoch": 0.1810194987833012, "percentage": 6.03, "elapsed_time": "5:15:26", "remaining_time": "3 days, 9:52:39", "throughput": 27772.12, "total_tokens": 525634560} +{"current_steps": 1800, "total_steps": 29667, "loss": 0.4418, "lr": 4.603068138884229e-05, "epoch": 0.18203078089940902, "percentage": 6.07, "elapsed_time": "5:17:03", "remaining_time": "3 days, 9:48:39", "throughput": 27782.04, "total_tokens": 528518464} +{"current_steps": 1810, "total_steps": 29667, "loss": 0.4451, "lr": 4.6011187600059345e-05, "epoch": 0.18304206301551687, "percentage": 6.1, "elapsed_time": "5:18:47", "remaining_time": "3 days, 9:46:18", "throughput": 27787.64, "total_tokens": 531499008} +{"current_steps": 1820, "total_steps": 29667, "loss": 0.4409, "lr": 4.599171855691629e-05, "epoch": 0.1840533451316247, "percentage": 6.13, "elapsed_time": "5:20:30", "remaining_time": "3 days, 9:44:01", "throughput": 27792.3, "total_tokens": 534468416} +{"current_steps": 1830, "total_steps": 
29667, "loss": 0.4407, "lr": 4.597227420710335e-05, "epoch": 0.1850646272477325, "percentage": 6.17, "elapsed_time": "5:22:12", "remaining_time": "3 days, 9:41:15", "throughput": 27798.16, "total_tokens": 537407232} +{"current_steps": 1840, "total_steps": 29667, "loss": 0.4375, "lr": 4.595285449846551e-05, "epoch": 0.18607590936384033, "percentage": 6.2, "elapsed_time": "5:23:56", "remaining_time": "3 days, 9:39:00", "throughput": 27803.03, "total_tokens": 540383680} +{"current_steps": 1850, "total_steps": 29667, "loss": 0.4351, "lr": 4.593345937900178e-05, "epoch": 0.18708719147994818, "percentage": 6.24, "elapsed_time": "5:25:35", "remaining_time": "3 days, 9:35:33", "throughput": 27809.54, "total_tokens": 543261312} +{"current_steps": 1860, "total_steps": 29667, "loss": 0.4437, "lr": 4.591408879686472e-05, "epoch": 0.188098473596056, "percentage": 6.27, "elapsed_time": "5:27:19", "remaining_time": "3 days, 9:33:30", "throughput": 27814.42, "total_tokens": 546261824} +{"current_steps": 1870, "total_steps": 29667, "loss": 0.4378, "lr": 4.5894742700359775e-05, "epoch": 0.18910975571216382, "percentage": 6.3, "elapsed_time": "5:29:01", "remaining_time": "3 days, 9:30:51", "throughput": 27820.64, "total_tokens": 549220416} +{"current_steps": 1880, "total_steps": 29667, "loss": 0.4335, "lr": 4.587542103794477e-05, "epoch": 0.19012103782827167, "percentage": 6.34, "elapsed_time": "5:30:44", "remaining_time": "3 days, 9:28:23", "throughput": 27824.77, "total_tokens": 552160448} +{"current_steps": 1890, "total_steps": 29667, "loss": 0.4343, "lr": 4.5856123758229247e-05, "epoch": 0.1911323199443795, "percentage": 6.37, "elapsed_time": "5:32:27", "remaining_time": "3 days, 9:26:03", "throughput": 27829.46, "total_tokens": 555125568} +{"current_steps": 1900, "total_steps": 29667, "loss": 0.4348, "lr": 4.5836850809973993e-05, "epoch": 0.1921436020604873, "percentage": 6.4, "elapsed_time": "5:34:11", "remaining_time": "3 days, 9:23:56", "throughput": 27833.7, "total_tokens": 
558107584} +{"current_steps": 1910, "total_steps": 29667, "loss": 0.4349, "lr": 4.5817602142090385e-05, "epoch": 0.19315488417659513, "percentage": 6.44, "elapsed_time": "5:35:49", "remaining_time": "3 days, 9:20:19", "throughput": 27843.55, "total_tokens": 561028544} +{"current_steps": 1920, "total_steps": 29667, "loss": 0.4363, "lr": 4.579837770363989e-05, "epoch": 0.19416616629270297, "percentage": 6.47, "elapsed_time": "5:37:35", "remaining_time": "3 days, 9:18:50", "throughput": 27846.91, "total_tokens": 564066176} +{"current_steps": 1930, "total_steps": 29667, "loss": 0.4312, "lr": 4.57791774438334e-05, "epoch": 0.1951774484088108, "percentage": 6.51, "elapsed_time": "5:39:18", "remaining_time": "3 days, 9:16:17", "throughput": 27852.36, "total_tokens": 567023360} +{"current_steps": 1940, "total_steps": 29667, "loss": 0.4398, "lr": 4.576000131203078e-05, "epoch": 0.19618873052491861, "percentage": 6.54, "elapsed_time": "5:40:59", "remaining_time": "3 days, 9:13:35", "throughput": 27857.83, "total_tokens": 569962368} +{"current_steps": 1950, "total_steps": 29667, "loss": 0.4361, "lr": 4.574084925774023e-05, "epoch": 0.19720001264102646, "percentage": 6.57, "elapsed_time": "5:42:41", "remaining_time": "3 days, 9:10:56", "throughput": 27864.61, "total_tokens": 572935616} +{"current_steps": 1960, "total_steps": 29667, "loss": 0.4396, "lr": 4.5721721230617795e-05, "epoch": 0.19821129475713428, "percentage": 6.61, "elapsed_time": "5:44:21", "remaining_time": "3 days, 9:07:52", "throughput": 27871.7, "total_tokens": 575865152} +{"current_steps": 1970, "total_steps": 29667, "loss": 0.429, "lr": 4.57026171804667e-05, "epoch": 0.1992225768732421, "percentage": 6.64, "elapsed_time": "5:46:00", "remaining_time": "3 days, 9:04:35", "throughput": 27877.78, "total_tokens": 578746816} +{"current_steps": 1980, "total_steps": 29667, "loss": 0.4322, "lr": 4.568353705723692e-05, "epoch": 0.20023385898934992, "percentage": 6.67, "elapsed_time": "5:47:38", "remaining_time": "3 
days, 9:01:06", "throughput": 27884.34, "total_tokens": 581615552} +{"current_steps": 1990, "total_steps": 29667, "loss": 0.4359, "lr": 4.566448081102455e-05, "epoch": 0.20124514110545777, "percentage": 6.71, "elapsed_time": "5:49:17", "remaining_time": "3 days, 8:58:04", "throughput": 27892.23, "total_tokens": 584565056} +{"current_steps": 2000, "total_steps": 29667, "loss": 0.4324, "lr": 4.564544839207128e-05, "epoch": 0.2022564232215656, "percentage": 6.74, "elapsed_time": "5:51:00", "remaining_time": "3 days, 8:55:39", "throughput": 27895.8, "total_tokens": 587496896} +{"current_steps": 2010, "total_steps": 29667, "loss": 0.4351, "lr": 4.562643975076387e-05, "epoch": 0.2032677053376734, "percentage": 6.78, "elapsed_time": "5:52:39", "remaining_time": "3 days, 8:52:23", "throughput": 27902.67, "total_tokens": 590396928} +{"current_steps": 2020, "total_steps": 29667, "loss": 0.4373, "lr": 4.560745483763357e-05, "epoch": 0.20427898745378126, "percentage": 6.81, "elapsed_time": "5:54:22", "remaining_time": "3 days, 8:50:14", "throughput": 27905.7, "total_tokens": 593350144} +{"current_steps": 2030, "total_steps": 29667, "loss": 0.4401, "lr": 4.5588493603355595e-05, "epoch": 0.20529026956988908, "percentage": 6.84, "elapsed_time": "5:56:04", "remaining_time": "3 days, 8:47:40", "throughput": 27910.28, "total_tokens": 596286080} +{"current_steps": 2040, "total_steps": 29667, "loss": 0.436, "lr": 4.556955599874859e-05, "epoch": 0.2063015516859969, "percentage": 6.88, "elapsed_time": "5:57:43", "remaining_time": "3 days, 8:44:38", "throughput": 27916.36, "total_tokens": 599194368} +{"current_steps": 2050, "total_steps": 29667, "loss": 0.4336, "lr": 4.555064197477409e-05, "epoch": 0.20731283380210472, "percentage": 6.91, "elapsed_time": "5:59:26", "remaining_time": "3 days, 8:42:24", "throughput": 27919.88, "total_tokens": 602147968} +{"current_steps": 2060, "total_steps": 29667, "loss": 0.4297, "lr": 4.5531751482536e-05, "epoch": 0.20832411591821257, "percentage": 
6.94, "elapsed_time": "6:01:10", "remaining_time": "3 days, 8:40:18", "throughput": 27922.95, "total_tokens": 605108864} +{"current_steps": 2070, "total_steps": 29667, "loss": 0.4398, "lr": 4.5512884473280024e-05, "epoch": 0.20933539803432039, "percentage": 6.98, "elapsed_time": "6:02:55", "remaining_time": "3 days, 8:38:34", "throughput": 27925.49, "total_tokens": 608103744} +{"current_steps": 2080, "total_steps": 29667, "loss": 0.4319, "lr": 4.549404089839322e-05, "epoch": 0.2103466801504282, "percentage": 7.01, "elapsed_time": "6:04:38", "remaining_time": "3 days, 8:36:17", "throughput": 27929.76, "total_tokens": 611068288} +{"current_steps": 2090, "total_steps": 29667, "loss": 0.4364, "lr": 4.547522070940335e-05, "epoch": 0.21135796226653605, "percentage": 7.04, "elapsed_time": "6:06:18", "remaining_time": "3 days, 8:33:17", "throughput": 27935.86, "total_tokens": 613981888} +{"current_steps": 2100, "total_steps": 29667, "loss": 0.4399, "lr": 4.545642385797848e-05, "epoch": 0.21236924438264387, "percentage": 7.08, "elapsed_time": "6:08:00", "remaining_time": "3 days, 8:30:47", "throughput": 27940.22, "total_tokens": 616920640} +{"current_steps": 2110, "total_steps": 29667, "loss": 0.4337, "lr": 4.543765029592637e-05, "epoch": 0.2133805264987517, "percentage": 7.11, "elapsed_time": "6:09:43", "remaining_time": "3 days, 8:28:41", "throughput": 27943.81, "total_tokens": 619892352} +{"current_steps": 2120, "total_steps": 29667, "loss": 0.43, "lr": 4.541889997519403e-05, "epoch": 0.2143918086148595, "percentage": 7.15, "elapsed_time": "6:11:22", "remaining_time": "3 days, 8:25:42", "throughput": 27951.25, "total_tokens": 622837696} +{"current_steps": 2130, "total_steps": 29667, "loss": 0.4355, "lr": 4.5400172847867095e-05, "epoch": 0.21540309073096736, "percentage": 7.18, "elapsed_time": "6:13:09", "remaining_time": "3 days, 8:24:13", "throughput": 27950.7, "total_tokens": 625798144} +{"current_steps": 2140, "total_steps": 29667, "loss": 0.4351, "lr": 
4.5381468866169466e-05, "epoch": 0.21641437284707518, "percentage": 7.21, "elapsed_time": "6:14:50", "remaining_time": "3 days, 8:21:43", "throughput": 27955.62, "total_tokens": 628749248} +{"current_steps": 2150, "total_steps": 29667, "loss": 0.43, "lr": 4.5362787982462616e-05, "epoch": 0.217425654963183, "percentage": 7.25, "elapsed_time": "6:16:32", "remaining_time": "3 days, 8:19:11", "throughput": 27959.83, "total_tokens": 631679936} +{"current_steps": 2160, "total_steps": 29667, "loss": 0.4259, "lr": 4.5344130149245275e-05, "epoch": 0.21843693707929085, "percentage": 7.28, "elapsed_time": "6:18:15", "remaining_time": "3 days, 8:17:05", "throughput": 27961.92, "total_tokens": 634618816} +{"current_steps": 2170, "total_steps": 29667, "loss": 0.4336, "lr": 4.5325495319152715e-05, "epoch": 0.21944821919539867, "percentage": 7.31, "elapsed_time": "6:19:55", "remaining_time": "3 days, 8:14:15", "throughput": 27967.62, "total_tokens": 637545344} +{"current_steps": 2180, "total_steps": 29667, "loss": 0.4299, "lr": 4.530688344495644e-05, "epoch": 0.2204595013115065, "percentage": 7.35, "elapsed_time": "6:21:33", "remaining_time": "3 days, 8:10:58", "throughput": 27973.49, "total_tokens": 640412480} +{"current_steps": 2190, "total_steps": 29667, "loss": 0.4283, "lr": 4.528829447956357e-05, "epoch": 0.2214707834276143, "percentage": 7.38, "elapsed_time": "6:23:18", "remaining_time": "3 days, 8:09:08", "throughput": 27975.1, "total_tokens": 643376768} +{"current_steps": 2200, "total_steps": 29667, "loss": 0.4299, "lr": 4.526972837601633e-05, "epoch": 0.22248206554372216, "percentage": 7.42, "elapsed_time": "6:24:58", "remaining_time": "3 days, 8:06:23", "throughput": 27979.32, "total_tokens": 646277632} +{"current_steps": 2210, "total_steps": 29667, "loss": 0.4293, "lr": 4.525118508749165e-05, "epoch": 0.22349334765982998, "percentage": 7.45, "elapsed_time": "6:26:35", "remaining_time": "3 days, 8:02:59", "throughput": 27987.49, "total_tokens": 649182528} 
+{"current_steps": 2220, "total_steps": 29667, "loss": 0.4281, "lr": 4.5232664567300546e-05, "epoch": 0.2245046297759378, "percentage": 7.48, "elapsed_time": "6:28:18", "remaining_time": "3 days, 8:00:46", "throughput": 27991.12, "total_tokens": 652141376} +{"current_steps": 2230, "total_steps": 29667, "loss": 0.4269, "lr": 4.521416676888773e-05, "epoch": 0.22551591189204565, "percentage": 7.52, "elapsed_time": "6:30:00", "remaining_time": "3 days, 7:58:24", "throughput": 27995.01, "total_tokens": 655083968} +{"current_steps": 2240, "total_steps": 29667, "loss": 0.4224, "lr": 4.519569164583107e-05, "epoch": 0.22652719400815347, "percentage": 7.55, "elapsed_time": "6:31:38", "remaining_time": "3 days, 7:55:25", "throughput": 28000.99, "total_tokens": 657993600} +{"current_steps": 2250, "total_steps": 29667, "loss": 0.4311, "lr": 4.517723915184109e-05, "epoch": 0.22753847612426129, "percentage": 7.58, "elapsed_time": "6:33:17", "remaining_time": "3 days, 7:52:29", "throughput": 28006.25, "total_tokens": 660891328} +{"current_steps": 2260, "total_steps": 29667, "loss": 0.4313, "lr": 4.5158809240760506e-05, "epoch": 0.2285497582403691, "percentage": 7.62, "elapsed_time": "6:34:59", "remaining_time": "3 days, 7:50:03", "throughput": 28008.38, "total_tokens": 663784576} +{"current_steps": 2270, "total_steps": 29667, "loss": 0.4258, "lr": 4.514040186656375e-05, "epoch": 0.22956104035647695, "percentage": 7.65, "elapsed_time": "6:36:46", "remaining_time": "3 days, 7:48:45", "throughput": 28007.37, "total_tokens": 666759360} +{"current_steps": 2280, "total_steps": 29667, "loss": 0.428, "lr": 4.512201698335644e-05, "epoch": 0.23057232247258477, "percentage": 7.69, "elapsed_time": "6:38:27", "remaining_time": "3 days, 7:46:13", "throughput": 28011.45, "total_tokens": 669684480} +{"current_steps": 2290, "total_steps": 29667, "loss": 0.4311, "lr": 4.510365454537496e-05, "epoch": 0.2315836045886926, "percentage": 7.72, "elapsed_time": "6:40:10", "remaining_time": "3 days, 
7:44:02", "throughput": 28011.96, "total_tokens": 672573440} +{"current_steps": 2300, "total_steps": 29667, "loss": 0.425, "lr": 4.5085314506985945e-05, "epoch": 0.23259488670480044, "percentage": 7.75, "elapsed_time": "6:41:51", "remaining_time": "3 days, 7:41:38", "throughput": 28014.86, "total_tokens": 675488000} +{"current_steps": 2310, "total_steps": 29667, "loss": 0.4366, "lr": 4.50669968226858e-05, "epoch": 0.23360616882090826, "percentage": 7.79, "elapsed_time": "6:43:37", "remaining_time": "3 days, 7:40:04", "throughput": 28015.06, "total_tokens": 678454528} +{"current_steps": 2320, "total_steps": 29667, "loss": 0.4253, "lr": 4.504870144710027e-05, "epoch": 0.23461745093701608, "percentage": 7.82, "elapsed_time": "6:45:18", "remaining_time": "3 days, 7:37:38", "throughput": 28017.25, "total_tokens": 681347904} +{"current_steps": 2330, "total_steps": 29667, "loss": 0.4301, "lr": 4.5030428334983884e-05, "epoch": 0.2356287330531239, "percentage": 7.85, "elapsed_time": "6:46:59", "remaining_time": "3 days, 7:35:06", "throughput": 28021.77, "total_tokens": 684283072} +{"current_steps": 2340, "total_steps": 29667, "loss": 0.4248, "lr": 4.501217744121959e-05, "epoch": 0.23664001516923175, "percentage": 7.89, "elapsed_time": "6:48:35", "remaining_time": "3 days, 7:31:35", "throughput": 28027.96, "total_tokens": 687116416} +{"current_steps": 2350, "total_steps": 29667, "loss": 0.4258, "lr": 4.499394872081821e-05, "epoch": 0.23765129728533957, "percentage": 7.92, "elapsed_time": "6:50:18", "remaining_time": "3 days, 7:29:26", "throughput": 28030.28, "total_tokens": 690051456} +{"current_steps": 2360, "total_steps": 29667, "loss": 0.4297, "lr": 4.4975742128918e-05, "epoch": 0.2386625794014474, "percentage": 7.95, "elapsed_time": "6:52:01", "remaining_time": "3 days, 7:27:23", "throughput": 28032.08, "total_tokens": 692986624} +{"current_steps": 2370, "total_steps": 29667, "loss": 0.4281, "lr": 4.495755762078418e-05, "epoch": 0.23967386151755524, "percentage": 7.99, 
"elapsed_time": "6:53:43", "remaining_time": "3 days, 7:25:12", "throughput": 28034.96, "total_tokens": 695930560} +{"current_steps": 2380, "total_steps": 29667, "loss": 0.422, "lr": 4.49393951518085e-05, "epoch": 0.24068514363366306, "percentage": 8.02, "elapsed_time": "6:55:23", "remaining_time": "3 days, 7:22:30", "throughput": 28040.76, "total_tokens": 698871552} +{"current_steps": 2390, "total_steps": 29667, "loss": 0.4243, "lr": 4.4921254677508716e-05, "epoch": 0.24169642574977088, "percentage": 8.06, "elapsed_time": "6:57:04", "remaining_time": "3 days, 7:20:06", "throughput": 28043.78, "total_tokens": 701789184} +{"current_steps": 2400, "total_steps": 29667, "loss": 0.4219, "lr": 4.490313615352821e-05, "epoch": 0.2427077078658787, "percentage": 8.09, "elapsed_time": "6:58:47", "remaining_time": "3 days, 7:18:01", "throughput": 28046.97, "total_tokens": 704753536} +{"current_steps": 2410, "total_steps": 29667, "loss": 0.4233, "lr": 4.48850395356355e-05, "epoch": 0.24371898998198654, "percentage": 8.12, "elapsed_time": "7:00:29", "remaining_time": "3 days, 7:15:49", "throughput": 28050.46, "total_tokens": 707710272} +{"current_steps": 2420, "total_steps": 29667, "loss": 0.4253, "lr": 4.486696477972375e-05, "epoch": 0.24473027209809436, "percentage": 8.16, "elapsed_time": "7:02:13", "remaining_time": "3 days, 7:13:52", "throughput": 28053.3, "total_tokens": 710689664} +{"current_steps": 2430, "total_steps": 29667, "loss": 0.4249, "lr": 4.484891184181041e-05, "epoch": 0.24574155421420218, "percentage": 8.19, "elapsed_time": "7:03:52", "remaining_time": "3 days, 7:11:04", "throughput": 28057.93, "total_tokens": 713586112} +{"current_steps": 2440, "total_steps": 29667, "loss": 0.4261, "lr": 4.483088067803662e-05, "epoch": 0.24675283633031003, "percentage": 8.22, "elapsed_time": "7:05:32", "remaining_time": "3 days, 7:08:24", "throughput": 28061.45, "total_tokens": 716472576} +{"current_steps": 2450, "total_steps": 29667, "loss": 0.4224, "lr": 
4.481287124466697e-05, "epoch": 0.24776411844641785, "percentage": 8.26, "elapsed_time": "7:07:11", "remaining_time": "3 days, 7:05:39", "throughput": 28065.48, "total_tokens": 719358656} +{"current_steps": 2460, "total_steps": 29667, "loss": 0.4224, "lr": 4.479488349808885e-05, "epoch": 0.24877540056252567, "percentage": 8.29, "elapsed_time": "7:08:50", "remaining_time": "3 days, 7:02:53", "throughput": 28070.14, "total_tokens": 722259072} +{"current_steps": 2470, "total_steps": 29667, "loss": 0.4206, "lr": 4.4776917394812114e-05, "epoch": 0.2497866826786335, "percentage": 8.33, "elapsed_time": "7:10:31", "remaining_time": "3 days, 7:00:30", "throughput": 28073.88, "total_tokens": 725194240} +{"current_steps": 2480, "total_steps": 29667, "loss": 0.4225, "lr": 4.475897289146862e-05, "epoch": 0.2507979647947413, "percentage": 8.36, "elapsed_time": "7:12:12", "remaining_time": "3 days, 6:58:03", "throughput": 28077.96, "total_tokens": 728128192} +{"current_steps": 2490, "total_steps": 29667, "loss": 0.4154, "lr": 4.4741049944811806e-05, "epoch": 0.25180924691084916, "percentage": 8.39, "elapsed_time": "7:13:47", "remaining_time": "3 days, 6:54:39", "throughput": 28087.25, "total_tokens": 731050880} +{"current_steps": 2500, "total_steps": 29667, "loss": 0.4246, "lr": 4.472314851171621e-05, "epoch": 0.252820529026957, "percentage": 8.43, "elapsed_time": "7:15:27", "remaining_time": "3 days, 6:52:05", "throughput": 28090.9, "total_tokens": 733953856} +{"current_steps": 2510, "total_steps": 29667, "loss": 0.4187, "lr": 4.4705268549177084e-05, "epoch": 0.2538318111430648, "percentage": 8.46, "elapsed_time": "7:17:07", "remaining_time": "3 days, 6:49:30", "throughput": 28094.5, "total_tokens": 736852736} +{"current_steps": 2520, "total_steps": 29667, "loss": 0.425, "lr": 4.468741001430989e-05, "epoch": 0.25484309325917265, "percentage": 8.49, "elapsed_time": "7:18:51", "remaining_time": "3 days, 6:47:36", "throughput": 28096.19, "total_tokens": 739806912} 
+{"current_steps": 2530, "total_steps": 29667, "loss": 0.4262, "lr": 4.466957286434997e-05, "epoch": 0.2558543753752805, "percentage": 8.53, "elapsed_time": "7:20:32", "remaining_time": "3 days, 6:45:12", "throughput": 28099.7, "total_tokens": 742732096} +{"current_steps": 2540, "total_steps": 29667, "loss": 0.4237, "lr": 4.4651757056652e-05, "epoch": 0.2568656574913883, "percentage": 8.56, "elapsed_time": "7:22:08", "remaining_time": "3 days, 6:41:59", "throughput": 28106.47, "total_tokens": 745615872} +{"current_steps": 2550, "total_steps": 29667, "loss": 0.4224, "lr": 4.463396254868968e-05, "epoch": 0.25787693960749614, "percentage": 8.6, "elapsed_time": "7:23:48", "remaining_time": "3 days, 6:39:28", "throughput": 28110.7, "total_tokens": 748539968} +{"current_steps": 2560, "total_steps": 29667, "loss": 0.4221, "lr": 4.461618929805519e-05, "epoch": 0.258888221723604, "percentage": 8.63, "elapsed_time": "7:25:30", "remaining_time": "3 days, 6:37:18", "throughput": 28114.55, "total_tokens": 751510400} +{"current_steps": 2570, "total_steps": 29667, "loss": 0.4223, "lr": 4.459843726245888e-05, "epoch": 0.2598995038397118, "percentage": 8.66, "elapsed_time": "7:27:12", "remaining_time": "3 days, 6:35:15", "throughput": 28116.31, "total_tokens": 754442880} +{"current_steps": 2580, "total_steps": 29667, "loss": 0.4218, "lr": 4.458070639972875e-05, "epoch": 0.2609107859558196, "percentage": 8.7, "elapsed_time": "7:28:52", "remaining_time": "3 days, 6:32:44", "throughput": 28121.88, "total_tokens": 757403904} +{"current_steps": 2590, "total_steps": 29667, "loss": 0.4202, "lr": 4.456299666781007e-05, "epoch": 0.2619220680719274, "percentage": 8.73, "elapsed_time": "7:30:34", "remaining_time": "3 days, 6:30:26", "throughput": 28126.05, "total_tokens": 760361920} +{"current_steps": 2600, "total_steps": 29667, "loss": 0.4267, "lr": 4.4545308024764984e-05, "epoch": 0.26293335018803526, "percentage": 8.76, "elapsed_time": "7:32:17", "remaining_time": "3 days, 6:28:33", 
"throughput": 28127.79, "total_tokens": 763323840} +{"current_steps": 2610, "total_steps": 29667, "loss": 0.4233, "lr": 4.452764042877207e-05, "epoch": 0.2639446323041431, "percentage": 8.8, "elapsed_time": "7:33:56", "remaining_time": "3 days, 6:25:49", "throughput": 28132.72, "total_tokens": 766230208} +{"current_steps": 2620, "total_steps": 29667, "loss": 0.4159, "lr": 4.45099938381259e-05, "epoch": 0.2649559144202509, "percentage": 8.83, "elapsed_time": "7:35:34", "remaining_time": "3 days, 6:22:59", "throughput": 28137.96, "total_tokens": 769129920} +{"current_steps": 2630, "total_steps": 29667, "loss": 0.4169, "lr": 4.449236821123667e-05, "epoch": 0.26596719653635875, "percentage": 8.87, "elapsed_time": "7:37:13", "remaining_time": "3 days, 6:20:20", "throughput": 28141.86, "total_tokens": 772023744} +{"current_steps": 2640, "total_steps": 29667, "loss": 0.4181, "lr": 4.447476350662976e-05, "epoch": 0.2669784786524666, "percentage": 8.9, "elapsed_time": "7:38:52", "remaining_time": "3 days, 6:17:47", "throughput": 28146.59, "total_tokens": 774955584} +{"current_steps": 2650, "total_steps": 29667, "loss": 0.413, "lr": 4.4457179682945346e-05, "epoch": 0.2679897607685744, "percentage": 8.93, "elapsed_time": "7:40:30", "remaining_time": "3 days, 6:15:00", "throughput": 28152.13, "total_tokens": 777871360} +{"current_steps": 2660, "total_steps": 29667, "loss": 0.417, "lr": 4.443961669893798e-05, "epoch": 0.26900104288468224, "percentage": 8.97, "elapsed_time": "7:42:10", "remaining_time": "3 days, 6:12:27", "throughput": 28156.73, "total_tokens": 780799296} +{"current_steps": 2670, "total_steps": 29667, "loss": 0.4204, "lr": 4.4422074513476155e-05, "epoch": 0.2700123250007901, "percentage": 9.0, "elapsed_time": "7:43:45", "remaining_time": "3 days, 6:09:14", "throughput": 28163.59, "total_tokens": 783678528} +{"current_steps": 2680, "total_steps": 29667, "loss": 0.4176, "lr": 4.4404553085541955e-05, "epoch": 0.2710236071168979, "percentage": 9.03, "elapsed_time": 
"7:45:25", "remaining_time": "3 days, 6:06:46", "throughput": 28167.71, "total_tokens": 786604608} +{"current_steps": 2690, "total_steps": 29667, "loss": 0.4216, "lr": 4.438705237423063e-05, "epoch": 0.27203488923300573, "percentage": 9.07, "elapsed_time": "7:47:06", "remaining_time": "3 days, 6:04:25", "throughput": 28172.15, "total_tokens": 789563072} +{"current_steps": 2700, "total_steps": 29667, "loss": 0.4167, "lr": 4.436957233875017e-05, "epoch": 0.2730461713491136, "percentage": 9.1, "elapsed_time": "7:48:49", "remaining_time": "3 days, 6:02:27", "throughput": 28175.54, "total_tokens": 792552576} +{"current_steps": 2710, "total_steps": 29667, "loss": 0.4174, "lr": 4.4352112938420956e-05, "epoch": 0.27405745346522137, "percentage": 9.13, "elapsed_time": "7:50:32", "remaining_time": "3 days, 6:00:35", "throughput": 28176.52, "total_tokens": 795493632} +{"current_steps": 2720, "total_steps": 29667, "loss": 0.4223, "lr": 4.433467413267529e-05, "epoch": 0.2750687355813292, "percentage": 9.17, "elapsed_time": "7:52:15", "remaining_time": "3 days, 5:58:34", "throughput": 28178.77, "total_tokens": 798446336} +{"current_steps": 2730, "total_steps": 29667, "loss": 0.4175, "lr": 4.431725588105708e-05, "epoch": 0.276080017697437, "percentage": 9.2, "elapsed_time": "7:53:56", "remaining_time": "3 days, 5:56:25", "throughput": 28181.31, "total_tokens": 801383360} +{"current_steps": 2740, "total_steps": 29667, "loss": 0.4201, "lr": 4.4299858143221377e-05, "epoch": 0.27709129981354486, "percentage": 9.24, "elapsed_time": "7:55:38", "remaining_time": "3 days, 5:54:19", "throughput": 28184.09, "total_tokens": 804334912} +{"current_steps": 2750, "total_steps": 29667, "loss": 0.4215, "lr": 4.4282480878934065e-05, "epoch": 0.2781025819296527, "percentage": 9.27, "elapsed_time": "7:57:20", "remaining_time": "3 days, 5:52:08", "throughput": 28187.25, "total_tokens": 807284736} +{"current_steps": 2760, "total_steps": 29667, "loss": 0.4186, "lr": 4.4265124048071346e-05, "epoch": 
0.2791138640457605, "percentage": 9.3, "elapsed_time": "7:58:57", "remaining_time": "3 days, 5:49:24", "throughput": 28192.41, "total_tokens": 810193216} +{"current_steps": 2770, "total_steps": 29667, "loss": 0.4131, "lr": 4.4247787610619477e-05, "epoch": 0.28012514616186834, "percentage": 9.34, "elapsed_time": "8:00:39", "remaining_time": "3 days, 5:47:18", "throughput": 28194.94, "total_tokens": 813139968} +{"current_steps": 2780, "total_steps": 29667, "loss": 0.4167, "lr": 4.42304715266743e-05, "epoch": 0.2811364282779762, "percentage": 9.37, "elapsed_time": "8:02:20", "remaining_time": "3 days, 5:45:01", "throughput": 28197.01, "total_tokens": 816037952} +{"current_steps": 2790, "total_steps": 29667, "loss": 0.418, "lr": 4.421317575644092e-05, "epoch": 0.282147710394084, "percentage": 9.4, "elapsed_time": "8:04:03", "remaining_time": "3 days, 5:43:09", "throughput": 28199.97, "total_tokens": 819036288} +{"current_steps": 2800, "total_steps": 29667, "loss": 0.4156, "lr": 4.419590026023325e-05, "epoch": 0.28315899251019183, "percentage": 9.44, "elapsed_time": "8:05:47", "remaining_time": "3 days, 5:41:16", "throughput": 28200.06, "total_tokens": 821948032} +{"current_steps": 2810, "total_steps": 29667, "loss": 0.4164, "lr": 4.417864499847368e-05, "epoch": 0.2841702746262997, "percentage": 9.47, "elapsed_time": "8:07:36", "remaining_time": "3 days, 5:40:23", "throughput": 28192.41, "total_tokens": 824810624} +{"current_steps": 2820, "total_steps": 29667, "loss": 0.4186, "lr": 4.4161409931692676e-05, "epoch": 0.28518155674240747, "percentage": 9.51, "elapsed_time": "8:09:13", "remaining_time": "3 days, 5:37:30", "throughput": 28197.63, "total_tokens": 827696448} +{"current_steps": 2830, "total_steps": 29667, "loss": 0.413, "lr": 4.414419502052841e-05, "epoch": 0.2861928388585153, "percentage": 9.54, "elapsed_time": "8:10:54", "remaining_time": "3 days, 5:35:19", "throughput": 28200.78, "total_tokens": 830645248} +{"current_steps": 2840, "total_steps": 29667, 
"loss": 0.4131, "lr": 4.412700022572637e-05, "epoch": 0.28720412097462317, "percentage": 9.57, "elapsed_time": "8:12:32", "remaining_time": "3 days, 5:32:38", "throughput": 28205.48, "total_tokens": 833548352} +{"current_steps": 2850, "total_steps": 29667, "loss": 0.4138, "lr": 4.410982550813902e-05, "epoch": 0.28821540309073096, "percentage": 9.61, "elapsed_time": "8:14:10", "remaining_time": "3 days, 5:29:53", "throughput": 28211.68, "total_tokens": 836484032} +{"current_steps": 2860, "total_steps": 29667, "loss": 0.4191, "lr": 4.409267082872535e-05, "epoch": 0.2892266852068388, "percentage": 9.64, "elapsed_time": "8:15:56", "remaining_time": "3 days, 5:28:27", "throughput": 28209.37, "total_tokens": 839405440} +{"current_steps": 2870, "total_steps": 29667, "loss": 0.4132, "lr": 4.407553614855059e-05, "epoch": 0.2902379673229466, "percentage": 9.67, "elapsed_time": "8:17:40", "remaining_time": "3 days, 5:26:43", "throughput": 28208.56, "total_tokens": 842314496} +{"current_steps": 2880, "total_steps": 29667, "loss": 0.4143, "lr": 4.405842142878579e-05, "epoch": 0.29124924943905445, "percentage": 9.71, "elapsed_time": "8:19:21", "remaining_time": "3 days, 5:24:32", "throughput": 28211.47, "total_tokens": 845256384} +{"current_steps": 2890, "total_steps": 29667, "loss": 0.4167, "lr": 4.404132663070745e-05, "epoch": 0.2922605315551623, "percentage": 9.74, "elapsed_time": "8:21:02", "remaining_time": "3 days, 5:22:22", "throughput": 28214.34, "total_tokens": 848198080} +{"current_steps": 2900, "total_steps": 29667, "loss": 0.4178, "lr": 4.402425171569716e-05, "epoch": 0.2932718136712701, "percentage": 9.78, "elapsed_time": "8:22:46", "remaining_time": "3 days, 5:20:41", "throughput": 28216.24, "total_tokens": 851198208} +{"current_steps": 2910, "total_steps": 29667, "loss": 0.4128, "lr": 4.400719664524127e-05, "epoch": 0.29428309578737794, "percentage": 9.81, "elapsed_time": "8:24:27", "remaining_time": "3 days, 5:18:25", "throughput": 28220.06, "total_tokens": 
854152128} +{"current_steps": 2920, "total_steps": 29667, "loss": 0.4176, "lr": 4.399016138093044e-05, "epoch": 0.2952943779034858, "percentage": 9.84, "elapsed_time": "8:26:11", "remaining_time": "3 days, 5:16:37", "throughput": 28221.8, "total_tokens": 857127360} +{"current_steps": 2930, "total_steps": 29667, "loss": 0.4228, "lr": 4.397314588445937e-05, "epoch": 0.2963056600195936, "percentage": 9.88, "elapsed_time": "8:27:57", "remaining_time": "3 days, 5:15:14", "throughput": 28219.87, "total_tokens": 860069760} +{"current_steps": 2940, "total_steps": 29667, "loss": 0.4112, "lr": 4.395615011762637e-05, "epoch": 0.2973169421357014, "percentage": 9.91, "elapsed_time": "8:29:49", "remaining_time": "3 days, 5:14:40", "throughput": 28213.45, "total_tokens": 863027008} +{"current_steps": 2950, "total_steps": 29667, "loss": 0.4156, "lr": 4.3939174042333057e-05, "epoch": 0.29832822425180927, "percentage": 9.94, "elapsed_time": "8:31:35", "remaining_time": "3 days, 5:13:20", "throughput": 28212.66, "total_tokens": 866010944} +{"current_steps": 2960, "total_steps": 29667, "loss": 0.415, "lr": 4.3922217620583904e-05, "epoch": 0.29933950636791706, "percentage": 9.98, "elapsed_time": "8:33:19", "remaining_time": "3 days, 5:11:36", "throughput": 28212.82, "total_tokens": 868952192} +{"current_steps": 2970, "total_steps": 29667, "loss": 0.4112, "lr": 4.3905280814486025e-05, "epoch": 0.3003507884840249, "percentage": 10.01, "elapsed_time": "8:35:01", "remaining_time": "3 days, 5:09:28", "throughput": 28216.33, "total_tokens": 871921408} +{"current_steps": 2980, "total_steps": 29667, "loss": 0.4121, "lr": 4.388836358624867e-05, "epoch": 0.3013620706001327, "percentage": 10.04, "elapsed_time": "8:36:36", "remaining_time": "3 days, 5:06:21", "throughput": 28223.58, "total_tokens": 874821312} +{"current_steps": 2990, "total_steps": 29667, "loss": 0.4112, "lr": 4.3871465898182976e-05, "epoch": 0.30237335271624055, "percentage": 10.08, "elapsed_time": "8:38:20", "remaining_time": "3 
days, 5:04:38", "throughput": 28224.69, "total_tokens": 877794560} +{"current_steps": 3000, "total_steps": 29667, "loss": 0.4096, "lr": 4.385458771270156e-05, "epoch": 0.3033846348323484, "percentage": 10.11, "elapsed_time": "8:40:01", "remaining_time": "3 days, 5:02:32", "throughput": 28227.3, "total_tokens": 880740672} +{"current_steps": 3010, "total_steps": 29667, "loss": 0.413, "lr": 4.3837728992318205e-05, "epoch": 0.3043959169484562, "percentage": 10.15, "elapsed_time": "8:41:47", "remaining_time": "3 days, 5:01:06", "throughput": 28224.66, "total_tokens": 883653440} +{"current_steps": 3020, "total_steps": 29667, "loss": 0.4171, "lr": 4.382088969964746e-05, "epoch": 0.30540719906456404, "percentage": 10.18, "elapsed_time": "8:43:45", "remaining_time": "3 days, 5:01:21", "throughput": 28210.99, "total_tokens": 886537472} +{"current_steps": 3030, "total_steps": 29667, "loss": 0.4117, "lr": 4.380406979740436e-05, "epoch": 0.3064184811806719, "percentage": 10.21, "elapsed_time": "8:45:26", "remaining_time": "3 days, 4:59:12", "throughput": 28214.69, "total_tokens": 889512128} +{"current_steps": 3040, "total_steps": 29667, "loss": 0.4128, "lr": 4.3787269248403994e-05, "epoch": 0.3074297632967797, "percentage": 10.25, "elapsed_time": "8:47:05", "remaining_time": "3 days, 4:56:45", "throughput": 28219.09, "total_tokens": 892446400} +{"current_steps": 3050, "total_steps": 29667, "loss": 0.4148, "lr": 4.377048801556126e-05, "epoch": 0.3084410454128875, "percentage": 10.28, "elapsed_time": "8:48:46", "remaining_time": "3 days, 4:54:31", "throughput": 28222.76, "total_tokens": 895402368} +{"current_steps": 3060, "total_steps": 29667, "loss": 0.4123, "lr": 4.3753726061890446e-05, "epoch": 0.3094523275289954, "percentage": 10.31, "elapsed_time": "8:50:28", "remaining_time": "3 days, 4:52:29", "throughput": 28224.11, "total_tokens": 898321728} +{"current_steps": 3070, "total_steps": 29667, "loss": 0.4148, "lr": 4.373698335050488e-05, "epoch": 0.31046360964510317, 
"percentage": 10.35, "elapsed_time": "8:52:05", "remaining_time": "3 days, 4:49:50", "throughput": 28229.34, "total_tokens": 901245888} +{"current_steps": 3080, "total_steps": 29667, "loss": 0.4141, "lr": 4.372025984461667e-05, "epoch": 0.311474891761211, "percentage": 10.38, "elapsed_time": "8:53:45", "remaining_time": "3 days, 4:47:32", "throughput": 28232.78, "total_tokens": 904182080} +{"current_steps": 3090, "total_steps": 29667, "loss": 0.4148, "lr": 4.370355550753629e-05, "epoch": 0.31248617387731886, "percentage": 10.42, "elapsed_time": "8:55:29", "remaining_time": "3 days, 4:45:44", "throughput": 28234.7, "total_tokens": 907164352} +{"current_steps": 3100, "total_steps": 29667, "loss": 0.4085, "lr": 4.368687030267226e-05, "epoch": 0.31349745599342665, "percentage": 10.45, "elapsed_time": "8:57:09", "remaining_time": "3 days, 4:43:25", "throughput": 28238.57, "total_tokens": 910109184} +{"current_steps": 3110, "total_steps": 29667, "loss": 0.4132, "lr": 4.367020419353081e-05, "epoch": 0.3145087381095345, "percentage": 10.48, "elapsed_time": "8:58:50", "remaining_time": "3 days, 4:41:17", "throughput": 28241.03, "total_tokens": 913045440} +{"current_steps": 3120, "total_steps": 29667, "loss": 0.412, "lr": 4.365355714371558e-05, "epoch": 0.3155200202256423, "percentage": 10.52, "elapsed_time": "9:00:29", "remaining_time": "3 days, 4:38:47", "throughput": 28245.38, "total_tokens": 915972160} +{"current_steps": 3130, "total_steps": 29667, "loss": 0.4156, "lr": 4.3636929116927235e-05, "epoch": 0.31653130234175014, "percentage": 10.55, "elapsed_time": "9:02:10", "remaining_time": "3 days, 4:36:39", "throughput": 28248.16, "total_tokens": 918917952} +{"current_steps": 3140, "total_steps": 29667, "loss": 0.4109, "lr": 4.362032007696314e-05, "epoch": 0.317542584457858, "percentage": 10.58, "elapsed_time": "9:03:53", "remaining_time": "3 days, 4:34:52", "throughput": 28250.18, "total_tokens": 921907264} +{"current_steps": 3150, "total_steps": 29667, "loss": 0.4111, 
"lr": 4.360372998771707e-05, "epoch": 0.3185538665739658, "percentage": 10.62, "elapsed_time": "9:05:30", "remaining_time": "3 days, 4:32:11", "throughput": 28256.62, "total_tokens": 924863616} +{"current_steps": 3160, "total_steps": 29667, "loss": 0.4057, "lr": 4.358715881317884e-05, "epoch": 0.31956514869007363, "percentage": 10.65, "elapsed_time": "9:07:11", "remaining_time": "3 days, 4:29:58", "throughput": 28259.74, "total_tokens": 927805312} +{"current_steps": 3170, "total_steps": 29667, "loss": 0.4081, "lr": 4.357060651743399e-05, "epoch": 0.3205764308061815, "percentage": 10.69, "elapsed_time": "9:08:50", "remaining_time": "3 days, 4:27:31", "throughput": 28263.59, "total_tokens": 930721408} +{"current_steps": 3180, "total_steps": 29667, "loss": 0.4168, "lr": 4.3554073064663454e-05, "epoch": 0.32158771292228927, "percentage": 10.72, "elapsed_time": "9:10:31", "remaining_time": "3 days, 4:25:23", "throughput": 28266.76, "total_tokens": 933681472} +{"current_steps": 3190, "total_steps": 29667, "loss": 0.4103, "lr": 4.353755841914325e-05, "epoch": 0.3225989950383971, "percentage": 10.75, "elapsed_time": "9:12:12", "remaining_time": "3 days, 4:23:23", "throughput": 28268.7, "total_tokens": 936625600} +{"current_steps": 3200, "total_steps": 29667, "loss": 0.4079, "lr": 4.3521062545244116e-05, "epoch": 0.32361027715450497, "percentage": 10.79, "elapsed_time": "9:13:58", "remaining_time": "3 days, 4:21:50", "throughput": 28268.85, "total_tokens": 939603648} +{"current_steps": 3210, "total_steps": 29667, "loss": 0.4078, "lr": 4.350458540743126e-05, "epoch": 0.32462155927061276, "percentage": 10.82, "elapsed_time": "9:15:34", "remaining_time": "3 days, 4:19:03", "throughput": 28273.74, "total_tokens": 942485888} +{"current_steps": 3220, "total_steps": 29667, "loss": 0.4082, "lr": 4.3488126970263955e-05, "epoch": 0.3256328413867206, "percentage": 10.85, "elapsed_time": "9:17:11", "remaining_time": "3 days, 4:16:23", "throughput": 28278.08, "total_tokens": 945375680} 
+{"current_steps": 3230, "total_steps": 29667, "loss": 0.4116, "lr": 4.347168719839527e-05, "epoch": 0.32664412350282845, "percentage": 10.89, "elapsed_time": "9:18:54", "remaining_time": "3 days, 4:14:30", "throughput": 28279.68, "total_tokens": 948333440} +{"current_steps": 3240, "total_steps": 29667, "loss": 0.4118, "lr": 4.345526605657173e-05, "epoch": 0.32765540561893625, "percentage": 10.92, "elapsed_time": "9:20:35", "remaining_time": "3 days, 4:12:27", "throughput": 28280.94, "total_tokens": 951242304} +{"current_steps": 3250, "total_steps": 29667, "loss": 0.4101, "lr": 4.343886350963304e-05, "epoch": 0.3286666877350441, "percentage": 10.95, "elapsed_time": "9:22:12", "remaining_time": "3 days, 4:09:51", "throughput": 28284.84, "total_tokens": 954129792} +{"current_steps": 3260, "total_steps": 29667, "loss": 0.4104, "lr": 4.3422479522511697e-05, "epoch": 0.3296779698511519, "percentage": 10.99, "elapsed_time": "9:23:54", "remaining_time": "3 days, 4:07:50", "throughput": 28288.21, "total_tokens": 957119296} +{"current_steps": 3270, "total_steps": 29667, "loss": 0.4078, "lr": 4.340611406023272e-05, "epoch": 0.33068925196725973, "percentage": 11.02, "elapsed_time": "9:25:39", "remaining_time": "3 days, 4:06:13", "throughput": 28288.77, "total_tokens": 960098176} +{"current_steps": 3280, "total_steps": 29667, "loss": 0.41, "lr": 4.338976708791336e-05, "epoch": 0.3317005340833676, "percentage": 11.06, "elapsed_time": "9:27:27", "remaining_time": "3 days, 4:05:04", "throughput": 28286.0, "total_tokens": 963062336} +{"current_steps": 3290, "total_steps": 29667, "loss": 0.4091, "lr": 4.337343857076272e-05, "epoch": 0.3327118161994754, "percentage": 11.09, "elapsed_time": "9:29:06", "remaining_time": "3 days, 4:02:44", "throughput": 28289.36, "total_tokens": 965985728} +{"current_steps": 3300, "total_steps": 29667, "loss": 0.41, "lr": 4.33571284740815e-05, "epoch": 0.3337230983155832, "percentage": 11.12, "elapsed_time": "9:30:48", "remaining_time": "3 days, 
4:00:43", "throughput": 28291.17, "total_tokens": 968923840} +{"current_steps": 3310, "total_steps": 29667, "loss": 0.4064, "lr": 4.3340836763261675e-05, "epoch": 0.33473438043169107, "percentage": 11.16, "elapsed_time": "9:32:32", "remaining_time": "3 days, 3:59:07", "throughput": 28290.78, "total_tokens": 971872320} +{"current_steps": 3320, "total_steps": 29667, "loss": 0.4066, "lr": 4.332456340378618e-05, "epoch": 0.33574566254779886, "percentage": 11.19, "elapsed_time": "9:34:11", "remaining_time": "3 days, 3:56:43", "throughput": 28294.28, "total_tokens": 974787328} +{"current_steps": 3330, "total_steps": 29667, "loss": 0.4132, "lr": 4.3308308361228586e-05, "epoch": 0.3367569446639067, "percentage": 11.22, "elapsed_time": "9:35:44", "remaining_time": "3 days, 3:53:35", "throughput": 28301.19, "total_tokens": 977662080} +{"current_steps": 3340, "total_steps": 29667, "loss": 0.4085, "lr": 4.329207160125282e-05, "epoch": 0.33776822678001456, "percentage": 11.26, "elapsed_time": "9:37:20", "remaining_time": "3 days, 3:50:47", "throughput": 28307.38, "total_tokens": 980581248} +{"current_steps": 3350, "total_steps": 29667, "loss": 0.4062, "lr": 4.327585308961287e-05, "epoch": 0.33877950889612235, "percentage": 11.29, "elapsed_time": "9:38:57", "remaining_time": "3 days, 3:48:07", "throughput": 28312.33, "total_tokens": 983485952} +{"current_steps": 3360, "total_steps": 29667, "loss": 0.4057, "lr": 4.325965279215243e-05, "epoch": 0.3397907910122302, "percentage": 11.33, "elapsed_time": "9:40:34", "remaining_time": "3 days, 3:45:34", "throughput": 28317.23, "total_tokens": 986411584} +{"current_steps": 3370, "total_steps": 29667, "loss": 0.4079, "lr": 4.3243470674804686e-05, "epoch": 0.34080207312833805, "percentage": 11.36, "elapsed_time": "9:42:11", "remaining_time": "3 days, 3:43:00", "throughput": 28321.72, "total_tokens": 989323776} +{"current_steps": 3380, "total_steps": 29667, "loss": 0.41, "lr": 4.3227306703591904e-05, "epoch": 0.34181335524444584, 
"percentage": 11.39, "elapsed_time": "9:43:56", "remaining_time": "3 days, 3:41:23", "throughput": 28324.05, "total_tokens": 992364672} +{"current_steps": 3390, "total_steps": 29667, "loss": 0.4065, "lr": 4.32111608446252e-05, "epoch": 0.3428246373605537, "percentage": 11.43, "elapsed_time": "9:45:36", "remaining_time": "3 days, 3:39:17", "throughput": 28326.56, "total_tokens": 995308544} +{"current_steps": 3400, "total_steps": 29667, "loss": 0.4122, "lr": 4.319503306410426e-05, "epoch": 0.3438359194766615, "percentage": 11.46, "elapsed_time": "9:47:17", "remaining_time": "3 days, 3:37:13", "throughput": 28328.93, "total_tokens": 998252288} +{"current_steps": 3410, "total_steps": 29667, "loss": 0.412, "lr": 4.317892332831699e-05, "epoch": 0.3448472015927693, "percentage": 11.49, "elapsed_time": "9:48:56", "remaining_time": "3 days, 3:34:52", "throughput": 28332.37, "total_tokens": 1001172800} +{"current_steps": 3420, "total_steps": 29667, "loss": 0.4026, "lr": 4.316283160363922e-05, "epoch": 0.3458584837088772, "percentage": 11.53, "elapsed_time": "9:50:38", "remaining_time": "3 days, 3:32:53", "throughput": 28333.49, "total_tokens": 1004090496} +{"current_steps": 3430, "total_steps": 29667, "loss": 0.4102, "lr": 4.314675785653447e-05, "epoch": 0.34686976582498497, "percentage": 11.56, "elapsed_time": "9:52:17", "remaining_time": "3 days, 3:30:33", "throughput": 28337.15, "total_tokens": 1007023936} +{"current_steps": 3440, "total_steps": 29667, "loss": 0.409, "lr": 4.3130702053553606e-05, "epoch": 0.3478810479410928, "percentage": 11.6, "elapsed_time": "9:53:56", "remaining_time": "3 days, 3:28:17", "throughput": 28340.57, "total_tokens": 1009959296} +{"current_steps": 3450, "total_steps": 29667, "loss": 0.4032, "lr": 4.3114664161334546e-05, "epoch": 0.34889233005720066, "percentage": 11.63, "elapsed_time": "9:55:30", "remaining_time": "3 days, 3:25:19", "throughput": 28347.21, "total_tokens": 1012854272} +{"current_steps": 3460, "total_steps": 29667, "loss": 
0.4086, "lr": 4.3098644146601984e-05, "epoch": 0.34990361217330845, "percentage": 11.66, "elapsed_time": "9:57:15", "remaining_time": "3 days, 3:23:45", "throughput": 28345.13, "total_tokens": 1015751872} +{"current_steps": 3470, "total_steps": 29667, "loss": 0.4076, "lr": 4.30826419761671e-05, "epoch": 0.3509148942894163, "percentage": 11.7, "elapsed_time": "9:58:54", "remaining_time": "3 days, 3:21:28", "throughput": 28348.79, "total_tokens": 1018695488} +{"current_steps": 3480, "total_steps": 29667, "loss": 0.4066, "lr": 4.30666576169273e-05, "epoch": 0.35192617640552415, "percentage": 11.73, "elapsed_time": "10:00:32", "remaining_time": "3 days, 3:19:01", "throughput": 28351.97, "total_tokens": 1021581568} +{"current_steps": 3490, "total_steps": 29667, "loss": 0.4068, "lr": 4.305069103586585e-05, "epoch": 0.35293745852163194, "percentage": 11.76, "elapsed_time": "10:02:12", "remaining_time": "3 days, 3:16:57", "throughput": 28352.86, "total_tokens": 1024472832} +{"current_steps": 3500, "total_steps": 29667, "loss": 0.4044, "lr": 4.303474220005164e-05, "epoch": 0.3539487406377398, "percentage": 11.8, "elapsed_time": "10:03:56", "remaining_time": "3 days, 3:15:11", "throughput": 28353.95, "total_tokens": 1027437568} +{"current_steps": 3510, "total_steps": 29667, "loss": 0.4039, "lr": 4.3018811076638944e-05, "epoch": 0.35496002275384764, "percentage": 11.83, "elapsed_time": "10:05:34", "remaining_time": "3 days, 3:12:52", "throughput": 28357.85, "total_tokens": 1030379712} +{"current_steps": 3520, "total_steps": 29667, "loss": 0.4042, "lr": 4.300289763286704e-05, "epoch": 0.35597130486995543, "percentage": 11.87, "elapsed_time": "10:07:16", "remaining_time": "3 days, 3:10:54", "throughput": 28359.99, "total_tokens": 1033337984} +{"current_steps": 3530, "total_steps": 29667, "loss": 0.4055, "lr": 4.298700183606e-05, "epoch": 0.3569825869860633, "percentage": 11.9, "elapsed_time": "10:08:58", "remaining_time": "3 days, 3:08:56", "throughput": 28361.52, 
"total_tokens": 1036274176} +{"current_steps": 3540, "total_steps": 29667, "loss": 0.4088, "lr": 4.297112365362637e-05, "epoch": 0.35799386910217107, "percentage": 11.93, "elapsed_time": "10:10:33", "remaining_time": "3 days, 3:06:12", "throughput": 28365.89, "total_tokens": 1039135104} +{"current_steps": 3550, "total_steps": 29667, "loss": 0.4073, "lr": 4.295526305305891e-05, "epoch": 0.3590051512182789, "percentage": 11.97, "elapsed_time": "10:12:13", "remaining_time": "3 days, 3:04:07", "throughput": 28368.39, "total_tokens": 1042081024} +{"current_steps": 3560, "total_steps": 29667, "loss": 0.4027, "lr": 4.293942000193429e-05, "epoch": 0.36001643333438677, "percentage": 12.0, "elapsed_time": "10:13:50", "remaining_time": "3 days, 3:01:34", "throughput": 28372.64, "total_tokens": 1044982528} +{"current_steps": 3570, "total_steps": 29667, "loss": 0.405, "lr": 4.2923594467912866e-05, "epoch": 0.36102771545049456, "percentage": 12.03, "elapsed_time": "10:15:31", "remaining_time": "3 days, 2:59:31", "throughput": 28374.73, "total_tokens": 1047918208} +{"current_steps": 3580, "total_steps": 29667, "loss": 0.4079, "lr": 4.290778641873832e-05, "epoch": 0.3620389975666024, "percentage": 12.07, "elapsed_time": "10:17:07", "remaining_time": "3 days, 2:56:51", "throughput": 28379.58, "total_tokens": 1050813696} +{"current_steps": 3590, "total_steps": 29667, "loss": 0.4044, "lr": 4.2891995822237455e-05, "epoch": 0.36305027968271025, "percentage": 12.1, "elapsed_time": "10:18:51", "remaining_time": "3 days, 2:55:14", "throughput": 28380.55, "total_tokens": 1053809984} +{"current_steps": 3600, "total_steps": 29667, "loss": 0.4042, "lr": 4.28762226463199e-05, "epoch": 0.36406156179881805, "percentage": 12.13, "elapsed_time": "10:20:28", "remaining_time": "3 days, 2:52:42", "throughput": 28385.51, "total_tokens": 1056738240} +{"current_steps": 3610, "total_steps": 29667, "loss": 0.4041, "lr": 4.286046685897781e-05, "epoch": 0.3650728439149259, "percentage": 12.17, 
"elapsed_time": "10:22:09", "remaining_time": "3 days, 2:50:43", "throughput": 28387.56, "total_tokens": 1059690304} +{"current_steps": 3620, "total_steps": 29667, "loss": 0.4034, "lr": 4.284472842828562e-05, "epoch": 0.36608412603103374, "percentage": 12.2, "elapsed_time": "10:23:51", "remaining_time": "3 days, 2:48:54", "throughput": 28389.02, "total_tokens": 1062656640} +{"current_steps": 3630, "total_steps": 29667, "loss": 0.4064, "lr": 4.282900732239977e-05, "epoch": 0.36709540814714153, "percentage": 12.24, "elapsed_time": "10:25:29", "remaining_time": "3 days, 2:46:26", "throughput": 28392.61, "total_tokens": 1065549248} +{"current_steps": 3640, "total_steps": 29667, "loss": 0.4052, "lr": 4.281330350955845e-05, "epoch": 0.3681066902632494, "percentage": 12.27, "elapsed_time": "10:27:11", "remaining_time": "3 days, 2:44:35", "throughput": 28394.25, "total_tokens": 1068516160} +{"current_steps": 3650, "total_steps": 29667, "loss": 0.4033, "lr": 4.279761695808125e-05, "epoch": 0.36911797237935723, "percentage": 12.3, "elapsed_time": "10:28:53", "remaining_time": "3 days, 2:42:44", "throughput": 28395.99, "total_tokens": 1071488768} +{"current_steps": 3660, "total_steps": 29667, "loss": 0.4065, "lr": 4.278194763636904e-05, "epoch": 0.370129254495465, "percentage": 12.34, "elapsed_time": "10:30:33", "remaining_time": "3 days, 2:40:32", "throughput": 28399.79, "total_tokens": 1074453760} +{"current_steps": 3670, "total_steps": 29667, "loss": 0.4031, "lr": 4.276629551290354e-05, "epoch": 0.37114053661157287, "percentage": 12.37, "elapsed_time": "10:32:12", "remaining_time": "3 days, 2:38:19", "throughput": 28403.49, "total_tokens": 1077410432} +{"current_steps": 3680, "total_steps": 29667, "loss": 0.4048, "lr": 4.2750660556247175e-05, "epoch": 0.37215181872768066, "percentage": 12.4, "elapsed_time": "10:33:59", "remaining_time": "3 days, 2:37:01", "throughput": 28401.08, "total_tokens": 1080358144} +{"current_steps": 3690, "total_steps": 29667, "loss": 0.4075, 
"lr": 4.273504273504274e-05, "epoch": 0.3731631008437885, "percentage": 12.44, "elapsed_time": "10:35:44", "remaining_time": "3 days, 2:35:31", "throughput": 28401.32, "total_tokens": 1083355456} +{"current_steps": 3700, "total_steps": 29667, "loss": 0.4011, "lr": 4.271944201801317e-05, "epoch": 0.37417438295989636, "percentage": 12.47, "elapsed_time": "10:37:21", "remaining_time": "3 days, 2:33:05", "throughput": 28404.27, "total_tokens": 1086233280} +{"current_steps": 3710, "total_steps": 29667, "loss": 0.4005, "lr": 4.270385837396127e-05, "epoch": 0.37518566507600415, "percentage": 12.51, "elapsed_time": "10:39:01", "remaining_time": "3 days, 2:30:58", "throughput": 28407.41, "total_tokens": 1089194112} +{"current_steps": 3720, "total_steps": 29667, "loss": 0.4087, "lr": 4.268829177176945e-05, "epoch": 0.376196947192112, "percentage": 12.54, "elapsed_time": "10:40:38", "remaining_time": "3 days, 2:28:28", "throughput": 28412.27, "total_tokens": 1092124288} +{"current_steps": 3730, "total_steps": 29667, "loss": 0.4046, "lr": 4.2672742180399455e-05, "epoch": 0.37720822930821984, "percentage": 12.57, "elapsed_time": "10:42:19", "remaining_time": "3 days, 2:26:28", "throughput": 28414.53, "total_tokens": 1095079040} +{"current_steps": 3740, "total_steps": 29667, "loss": 0.3976, "lr": 4.265720956889213e-05, "epoch": 0.37821951142432764, "percentage": 12.61, "elapsed_time": "10:43:53", "remaining_time": "3 days, 2:23:44", "throughput": 28418.63, "total_tokens": 1097924736} +{"current_steps": 3750, "total_steps": 29667, "loss": 0.403, "lr": 4.2641693906367113e-05, "epoch": 0.3792307935404355, "percentage": 12.64, "elapsed_time": "10:45:34", "remaining_time": "3 days, 2:21:41", "throughput": 28421.26, "total_tokens": 1100881216} +{"current_steps": 3760, "total_steps": 29667, "loss": 0.4047, "lr": 4.2626195162022646e-05, "epoch": 0.38024207565654333, "percentage": 12.67, "elapsed_time": "10:47:12", "remaining_time": "3 days, 2:19:24", "throughput": 28423.77, 
"total_tokens": 1103774976} +{"current_steps": 3770, "total_steps": 29667, "loss": 0.4041, "lr": 4.2610713305135255e-05, "epoch": 0.3812533577726511, "percentage": 12.71, "elapsed_time": "10:48:49", "remaining_time": "3 days, 2:16:53", "throughput": 28427.72, "total_tokens": 1106667200} +{"current_steps": 3780, "total_steps": 29667, "loss": 0.4057, "lr": 4.2595248305059546e-05, "epoch": 0.382264639888759, "percentage": 12.74, "elapsed_time": "10:50:28", "remaining_time": "3 days, 2:14:40", "throughput": 28430.6, "total_tokens": 1109594112} +{"current_steps": 3790, "total_steps": 29667, "loss": 0.406, "lr": 4.2579800131227916e-05, "epoch": 0.3832759220048668, "percentage": 12.78, "elapsed_time": "10:52:07", "remaining_time": "3 days, 2:12:30", "throughput": 28433.8, "total_tokens": 1112542336} +{"current_steps": 3800, "total_steps": 29667, "loss": 0.4033, "lr": 4.256436875315028e-05, "epoch": 0.3842872041209746, "percentage": 12.81, "elapsed_time": "10:53:45", "remaining_time": "3 days, 2:10:12", "throughput": 28436.4, "total_tokens": 1115432448} +{"current_steps": 3810, "total_steps": 29667, "loss": 0.405, "lr": 4.2548954140413895e-05, "epoch": 0.38529848623708246, "percentage": 12.84, "elapsed_time": "10:55:20", "remaining_time": "3 days, 2:07:29", "throughput": 28440.92, "total_tokens": 1118297216} +{"current_steps": 3820, "total_steps": 29667, "loss": 0.4046, "lr": 4.253355626268302e-05, "epoch": 0.38630976835319025, "percentage": 12.88, "elapsed_time": "10:56:52", "remaining_time": "3 days, 2:04:36", "throughput": 28446.24, "total_tokens": 1121149504} +{"current_steps": 3830, "total_steps": 29667, "loss": 0.4037, "lr": 4.2518175089698716e-05, "epoch": 0.3873210504692981, "percentage": 12.91, "elapsed_time": "10:58:28", "remaining_time": "3 days, 2:02:05", "throughput": 28450.04, "total_tokens": 1124029312} +{"current_steps": 3840, "total_steps": 29667, "loss": 0.4003, "lr": 4.25028105912786e-05, "epoch": 0.38833233258540595, "percentage": 12.94, "elapsed_time": 
"11:00:06", "remaining_time": "3 days, 1:59:44", "throughput": 28453.84, "total_tokens": 1126957056} +{"current_steps": 3850, "total_steps": 29667, "loss": 0.4044, "lr": 4.2487462737316565e-05, "epoch": 0.38934361470151374, "percentage": 12.98, "elapsed_time": "11:01:43", "remaining_time": "3 days, 1:57:18", "throughput": 28457.93, "total_tokens": 1129871936} +{"current_steps": 3860, "total_steps": 29667, "loss": 0.3999, "lr": 4.2472131497782555e-05, "epoch": 0.3903548968176216, "percentage": 13.01, "elapsed_time": "11:03:25", "remaining_time": "3 days, 1:55:26", "throughput": 28460.21, "total_tokens": 1132861376} +{"current_steps": 3870, "total_steps": 29667, "loss": 0.4029, "lr": 4.245681684272231e-05, "epoch": 0.39136617893372944, "percentage": 13.04, "elapsed_time": "11:05:05", "remaining_time": "3 days, 1:53:24", "throughput": 28462.57, "total_tokens": 1135806848} +{"current_steps": 3880, "total_steps": 29667, "loss": 0.4036, "lr": 4.244151874225712e-05, "epoch": 0.39237746104983723, "percentage": 13.08, "elapsed_time": "11:06:50", "remaining_time": "3 days, 1:51:57", "throughput": 28461.79, "total_tokens": 1138781568} +{"current_steps": 3890, "total_steps": 29667, "loss": 0.4049, "lr": 4.2426237166583596e-05, "epoch": 0.3933887431659451, "percentage": 13.11, "elapsed_time": "11:08:30", "remaining_time": "3 days, 1:49:49", "throughput": 28463.79, "total_tokens": 1141689152} +{"current_steps": 3900, "total_steps": 29667, "loss": 0.4036, "lr": 4.241097208597339e-05, "epoch": 0.3944000252820529, "percentage": 13.15, "elapsed_time": "11:10:07", "remaining_time": "3 days, 1:47:28", "throughput": 28467.23, "total_tokens": 1144599872} +{"current_steps": 3910, "total_steps": 29667, "loss": 0.4006, "lr": 4.2395723470773005e-05, "epoch": 0.3954113073981607, "percentage": 13.18, "elapsed_time": "11:11:47", "remaining_time": "3 days, 1:45:23", "throughput": 28470.35, "total_tokens": 1147562688} +{"current_steps": 3920, "total_steps": 29667, "loss": 0.401, "lr": 
4.238049129140347e-05, "epoch": 0.39642258951426856, "percentage": 13.21, "elapsed_time": "11:13:27", "remaining_time": "3 days, 1:43:24", "throughput": 28472.35, "total_tokens": 1150510464} +{"current_steps": 3930, "total_steps": 29667, "loss": 0.4017, "lr": 4.236527551836022e-05, "epoch": 0.3974338716303764, "percentage": 13.25, "elapsed_time": "11:15:09", "remaining_time": "3 days, 1:41:33", "throughput": 28473.26, "total_tokens": 1153450432} +{"current_steps": 3940, "total_steps": 29667, "loss": 0.4059, "lr": 4.235007612221274e-05, "epoch": 0.3984451537464842, "percentage": 13.28, "elapsed_time": "11:16:48", "remaining_time": "3 days, 1:39:21", "throughput": 28476.08, "total_tokens": 1156371200} +{"current_steps": 3950, "total_steps": 29667, "loss": 0.4036, "lr": 4.2334893073604386e-05, "epoch": 0.39945643586259205, "percentage": 13.31, "elapsed_time": "11:18:27", "remaining_time": "3 days, 1:37:12", "throughput": 28478.99, "total_tokens": 1159313088} +{"current_steps": 3960, "total_steps": 29667, "loss": 0.3994, "lr": 4.231972634325214e-05, "epoch": 0.40046771797869984, "percentage": 13.35, "elapsed_time": "11:20:09", "remaining_time": "3 days, 1:35:20", "throughput": 28480.64, "total_tokens": 1162274496} +{"current_steps": 3970, "total_steps": 29667, "loss": 0.3996, "lr": 4.230457590194635e-05, "epoch": 0.4014790000948077, "percentage": 13.38, "elapsed_time": "11:21:49", "remaining_time": "3 days, 1:33:18", "throughput": 28481.81, "total_tokens": 1165174336} +{"current_steps": 3980, "total_steps": 29667, "loss": 0.4008, "lr": 4.228944172055053e-05, "epoch": 0.40249028221091554, "percentage": 13.42, "elapsed_time": "11:23:27", "remaining_time": "3 days, 1:31:04", "throughput": 28486.18, "total_tokens": 1168153856} +{"current_steps": 3990, "total_steps": 29667, "loss": 0.4015, "lr": 4.22743237700011e-05, "epoch": 0.40350156432702333, "percentage": 13.45, "elapsed_time": "11:25:07", "remaining_time": "3 days, 1:29:02", "throughput": 28488.07, "total_tokens": 
1171081152} +{"current_steps": 4000, "total_steps": 29667, "loss": 0.4046, "lr": 4.225922202130716e-05, "epoch": 0.4045128464431312, "percentage": 13.48, "elapsed_time": "11:26:51", "remaining_time": "3 days, 1:27:20", "throughput": 28489.4, "total_tokens": 1174076928} +{"current_steps": 4010, "total_steps": 29667, "loss": 0.3995, "lr": 4.224413644555024e-05, "epoch": 0.405524128559239, "percentage": 13.52, "elapsed_time": "11:28:28", "remaining_time": "3 days, 1:25:04", "throughput": 28493.06, "total_tokens": 1177013312} +{"current_steps": 4020, "total_steps": 29667, "loss": 0.4019, "lr": 4.222906701388411e-05, "epoch": 0.4065354106753468, "percentage": 13.55, "elapsed_time": "11:30:10", "remaining_time": "3 days, 1:23:14", "throughput": 28494.13, "total_tokens": 1179965888} +{"current_steps": 4030, "total_steps": 29667, "loss": 0.3965, "lr": 4.2214013697534466e-05, "epoch": 0.40754669279145467, "percentage": 13.58, "elapsed_time": "11:31:46", "remaining_time": "3 days, 1:20:44", "throughput": 28498.81, "total_tokens": 1182884352} +{"current_steps": 4040, "total_steps": 29667, "loss": 0.3957, "lr": 4.219897646779882e-05, "epoch": 0.4085579749075625, "percentage": 13.62, "elapsed_time": "11:33:30", "remaining_time": "3 days, 1:19:06", "throughput": 28500.2, "total_tokens": 1185900224} +{"current_steps": 4050, "total_steps": 29667, "loss": 0.4005, "lr": 4.2183955296046145e-05, "epoch": 0.4095692570236703, "percentage": 13.65, "elapsed_time": "11:35:11", "remaining_time": "3 days, 1:17:13", "throughput": 28501.54, "total_tokens": 1188842176} +{"current_steps": 4060, "total_steps": 29667, "loss": 0.4, "lr": 4.2168950153716746e-05, "epoch": 0.41058053913977816, "percentage": 13.69, "elapsed_time": "11:36:53", "remaining_time": "3 days, 1:15:24", "throughput": 28502.56, "total_tokens": 1191795264} +{"current_steps": 4070, "total_steps": 29667, "loss": 0.3996, "lr": 4.215396101232197e-05, "epoch": 0.411591821255886, "percentage": 13.72, "elapsed_time": "11:38:32", 
"remaining_time": "3 days, 1:13:15", "throughput": 28505.64, "total_tokens": 1194742848} +{"current_steps": 4080, "total_steps": 29667, "loss": 0.4017, "lr": 4.213898784344398e-05, "epoch": 0.4126031033719938, "percentage": 13.75, "elapsed_time": "11:40:09", "remaining_time": "3 days, 1:10:58", "throughput": 28509.42, "total_tokens": 1197680384} +{"current_steps": 4090, "total_steps": 29667, "loss": 0.399, "lr": 4.21240306187356e-05, "epoch": 0.41361438548810164, "percentage": 13.79, "elapsed_time": "11:41:50", "remaining_time": "3 days, 1:09:02", "throughput": 28511.59, "total_tokens": 1200648512} +{"current_steps": 4100, "total_steps": 29667, "loss": 0.3982, "lr": 4.2109089309919967e-05, "epoch": 0.41462566760420944, "percentage": 13.82, "elapsed_time": "11:43:30", "remaining_time": "3 days, 1:06:59", "throughput": 28513.24, "total_tokens": 1203564928} +{"current_steps": 4110, "total_steps": 29667, "loss": 0.397, "lr": 4.2094163888790445e-05, "epoch": 0.4156369497203173, "percentage": 13.85, "elapsed_time": "11:45:18", "remaining_time": "3 days, 1:05:49", "throughput": 28511.24, "total_tokens": 1206565568} +{"current_steps": 4120, "total_steps": 29667, "loss": 0.3972, "lr": 4.2079254327210294e-05, "epoch": 0.41664823183642513, "percentage": 13.89, "elapsed_time": "11:46:55", "remaining_time": "3 days, 1:03:25", "throughput": 28513.98, "total_tokens": 1209427648} +{"current_steps": 4130, "total_steps": 29667, "loss": 0.4004, "lr": 4.206436059711249e-05, "epoch": 0.4176595139525329, "percentage": 13.92, "elapsed_time": "11:48:39", "remaining_time": "3 days, 1:01:52", "throughput": 28512.48, "total_tokens": 1212345536} +{"current_steps": 4140, "total_steps": 29667, "loss": 0.3978, "lr": 4.20494826704995e-05, "epoch": 0.41867079606864077, "percentage": 13.95, "elapsed_time": "11:50:30", "remaining_time": "3 days, 1:00:58", "throughput": 28507.3, "total_tokens": 1215284096} +{"current_steps": 4150, "total_steps": 29667, "loss": 0.4028, "lr": 4.203462051944307e-05, 
"epoch": 0.4196820781847486, "percentage": 13.99, "elapsed_time": "11:52:15", "remaining_time": "3 days, 0:59:29", "throughput": 28504.13, "total_tokens": 1218152384} +{"current_steps": 4160, "total_steps": 29667, "loss": 0.4015, "lr": 4.201977411608398e-05, "epoch": 0.4206933603008564, "percentage": 14.02, "elapsed_time": "11:54:02", "remaining_time": "3 days, 0:58:08", "throughput": 28500.81, "total_tokens": 1221048000} +{"current_steps": 4170, "total_steps": 29667, "loss": 0.401, "lr": 4.200494343263185e-05, "epoch": 0.42170464241696426, "percentage": 14.06, "elapsed_time": "11:55:54", "remaining_time": "3 days, 0:57:22", "throughput": 28493.8, "total_tokens": 1223946880} +{"current_steps": 4180, "total_steps": 29667, "loss": 0.3971, "lr": 4.1990128441364914e-05, "epoch": 0.4227159245330721, "percentage": 14.09, "elapsed_time": "11:57:35", "remaining_time": "3 days, 0:55:24", "throughput": 28495.9, "total_tokens": 1226901696} +{"current_steps": 4190, "total_steps": 29667, "loss": 0.3991, "lr": 4.197532911462977e-05, "epoch": 0.4237272066491799, "percentage": 14.12, "elapsed_time": "11:59:15", "remaining_time": "3 days, 0:53:25", "throughput": 28497.43, "total_tokens": 1229828544} +{"current_steps": 4200, "total_steps": 29667, "loss": 0.4011, "lr": 4.196054542484125e-05, "epoch": 0.42473848876528775, "percentage": 14.16, "elapsed_time": "12:00:57", "remaining_time": "3 days, 0:51:35", "throughput": 28497.96, "total_tokens": 1232751552} +{"current_steps": 4210, "total_steps": 29667, "loss": 0.3961, "lr": 4.1945777344482084e-05, "epoch": 0.4257497708813956, "percentage": 14.19, "elapsed_time": "12:02:54", "remaining_time": "3 days, 0:51:17", "throughput": 28488.68, "total_tokens": 1235688128} +{"current_steps": 4220, "total_steps": 29667, "loss": 0.3982, "lr": 4.19310248461028e-05, "epoch": 0.4267610529975034, "percentage": 14.22, "elapsed_time": "12:04:42", "remaining_time": "3 days, 0:50:05", "throughput": 28486.21, "total_tokens": 1238659584} +{"current_steps": 
4230, "total_steps": 29667, "loss": 0.4031, "lr": 4.1916287902321405e-05, "epoch": 0.42777233511361124, "percentage": 14.26, "elapsed_time": "12:06:38", "remaining_time": "3 days, 0:49:38", "throughput": 28478.91, "total_tokens": 1241637952} +{"current_steps": 4240, "total_steps": 29667, "loss": 0.4015, "lr": 4.190156648582328e-05, "epoch": 0.428783617229719, "percentage": 14.29, "elapsed_time": "12:08:18", "remaining_time": "3 days, 0:47:38", "throughput": 28480.57, "total_tokens": 1244565568} +{"current_steps": 4250, "total_steps": 29667, "loss": 0.3962, "lr": 4.188686056936087e-05, "epoch": 0.4297948993458269, "percentage": 14.33, "elapsed_time": "12:10:09", "remaining_time": "3 days, 0:46:41", "throughput": 28474.75, "total_tokens": 1247467264} +{"current_steps": 4260, "total_steps": 29667, "loss": 0.395, "lr": 4.187217012575352e-05, "epoch": 0.4308061814619347, "percentage": 14.36, "elapsed_time": "12:11:52", "remaining_time": "3 days, 0:44:59", "throughput": 28473.97, "total_tokens": 1250371136} +{"current_steps": 4270, "total_steps": 29667, "loss": 0.3976, "lr": 4.185749512788727e-05, "epoch": 0.4318174635780425, "percentage": 14.39, "elapsed_time": "12:13:34", "remaining_time": "3 days, 0:43:09", "throughput": 28474.74, "total_tokens": 1253305088} +{"current_steps": 4280, "total_steps": 29667, "loss": 0.401, "lr": 4.184283554871462e-05, "epoch": 0.43282874569415036, "percentage": 14.43, "elapsed_time": "12:15:19", "remaining_time": "3 days, 0:41:35", "throughput": 28474.13, "total_tokens": 1256256960} +{"current_steps": 4290, "total_steps": 29667, "loss": 0.3985, "lr": 4.1828191361254344e-05, "epoch": 0.4338400278102582, "percentage": 14.46, "elapsed_time": "12:17:12", "remaining_time": "3 days, 0:40:52", "throughput": 28467.66, "total_tokens": 1259195648} +{"current_steps": 4300, "total_steps": 29667, "loss": 0.3986, "lr": 4.181356253859127e-05, "epoch": 0.434851309926366, "percentage": 14.49, "elapsed_time": "12:19:02", "remaining_time": "3 days, 
0:39:51", "throughput": 28463.75, "total_tokens": 1262164096} +{"current_steps": 4310, "total_steps": 29667, "loss": 0.3965, "lr": 4.179894905387606e-05, "epoch": 0.43586259204247385, "percentage": 14.53, "elapsed_time": "12:20:43", "remaining_time": "3 days, 0:37:52", "throughput": 28464.75, "total_tokens": 1265066624} +{"current_steps": 4320, "total_steps": 29667, "loss": 0.3949, "lr": 4.178435088032502e-05, "epoch": 0.4368738741585817, "percentage": 14.56, "elapsed_time": "12:22:32", "remaining_time": "3 days, 0:36:43", "throughput": 28460.96, "total_tokens": 1267997760} +{"current_steps": 4330, "total_steps": 29667, "loss": 0.4017, "lr": 4.176976799121989e-05, "epoch": 0.4378851562746895, "percentage": 14.6, "elapsed_time": "12:24:21", "remaining_time": "3 days, 0:35:33", "throughput": 28457.73, "total_tokens": 1270951168} +{"current_steps": 4340, "total_steps": 29667, "loss": 0.3942, "lr": 4.1755200359907657e-05, "epoch": 0.43889643839079734, "percentage": 14.63, "elapsed_time": "12:26:10", "remaining_time": "3 days, 0:34:30", "throughput": 28454.15, "total_tokens": 1273919936} +{"current_steps": 4350, "total_steps": 29667, "loss": 0.3959, "lr": 4.174064795980028e-05, "epoch": 0.4399077205069052, "percentage": 14.66, "elapsed_time": "12:27:54", "remaining_time": "3 days, 0:32:47", "throughput": 28453.94, "total_tokens": 1276844928} +{"current_steps": 4360, "total_steps": 29667, "loss": 0.4, "lr": 4.17261107643746e-05, "epoch": 0.440919002623013, "percentage": 14.7, "elapsed_time": "12:29:31", "remaining_time": "3 days, 0:30:33", "throughput": 28456.99, "total_tokens": 1279765760} +{"current_steps": 4370, "total_steps": 29667, "loss": 0.3972, "lr": 4.171158874717204e-05, "epoch": 0.4419302847391208, "percentage": 14.73, "elapsed_time": "12:31:09", "remaining_time": "3 days, 0:28:19", "throughput": 28460.27, "total_tokens": 1282697664} +{"current_steps": 4380, "total_steps": 29667, "loss": 0.3959, "lr": 4.169708188179844e-05, "epoch": 0.4429415668552286, 
"percentage": 14.76, "elapsed_time": "12:32:45", "remaining_time": "3 days, 0:25:51", "throughput": 28464.04, "total_tokens": 1285584192} +{"current_steps": 4390, "total_steps": 29667, "loss": 0.3907, "lr": 4.1682590141923846e-05, "epoch": 0.44395284897133647, "percentage": 14.8, "elapsed_time": "12:34:27", "remaining_time": "3 days, 0:24:05", "throughput": 28465.03, "total_tokens": 1288549184} +{"current_steps": 4400, "total_steps": 29667, "loss": 0.3953, "lr": 4.1668113501282335e-05, "epoch": 0.4449641310874443, "percentage": 14.83, "elapsed_time": "12:36:09", "remaining_time": "3 days, 0:22:11", "throughput": 28466.71, "total_tokens": 1291507520} +{"current_steps": 4410, "total_steps": 29667, "loss": 0.3944, "lr": 4.165365193367178e-05, "epoch": 0.4459754132035521, "percentage": 14.87, "elapsed_time": "12:37:48", "remaining_time": "3 days, 0:20:07", "throughput": 28469.32, "total_tokens": 1294456960} +{"current_steps": 4420, "total_steps": 29667, "loss": 0.3946, "lr": 4.163920541295369e-05, "epoch": 0.44698669531965995, "percentage": 14.9, "elapsed_time": "12:39:26", "remaining_time": "3 days, 0:17:53", "throughput": 28471.89, "total_tokens": 1297352768} +{"current_steps": 4430, "total_steps": 29667, "loss": 0.3997, "lr": 4.1624773913052946e-05, "epoch": 0.4479979774357678, "percentage": 14.93, "elapsed_time": "12:41:05", "remaining_time": "3 days, 0:15:51", "throughput": 28474.03, "total_tokens": 1300292544} +{"current_steps": 4440, "total_steps": 29667, "loss": 0.3976, "lr": 4.161035740795769e-05, "epoch": 0.4490092595518756, "percentage": 14.97, "elapsed_time": "12:42:45", "remaining_time": "3 days, 0:13:47", "throughput": 28476.31, "total_tokens": 1303229760} +{"current_steps": 4450, "total_steps": 29667, "loss": 0.3961, "lr": 4.1595955871719055e-05, "epoch": 0.45002054166798344, "percentage": 15.0, "elapsed_time": "12:44:24", "remaining_time": "3 days, 0:11:41", "throughput": 28478.1, "total_tokens": 1306130048} +{"current_steps": 4460, "total_steps": 
29667, "loss": 0.3935, "lr": 4.158156927845101e-05, "epoch": 0.4510318237840913, "percentage": 15.03, "elapsed_time": "12:46:06", "remaining_time": "3 days, 0:09:54", "throughput": 28478.73, "total_tokens": 1309073664} +{"current_steps": 4470, "total_steps": 29667, "loss": 0.3961, "lr": 4.156719760233016e-05, "epoch": 0.4520431059001991, "percentage": 15.07, "elapsed_time": "12:47:44", "remaining_time": "3 days, 0:07:40", "throughput": 28481.7, "total_tokens": 1311987904} +{"current_steps": 4480, "total_steps": 29667, "loss": 0.394, "lr": 4.155284081759552e-05, "epoch": 0.45305438801630693, "percentage": 15.1, "elapsed_time": "12:49:25", "remaining_time": "3 days, 0:05:47", "throughput": 28483.75, "total_tokens": 1314966784} +{"current_steps": 4490, "total_steps": 29667, "loss": 0.3928, "lr": 4.1538498898548356e-05, "epoch": 0.4540656701324148, "percentage": 15.13, "elapsed_time": "12:51:05", "remaining_time": "3 days, 0:03:48", "throughput": 28486.21, "total_tokens": 1317939648} +{"current_steps": 4500, "total_steps": 29667, "loss": 0.3967, "lr": 4.1524171819552e-05, "epoch": 0.45507695224852257, "percentage": 15.17, "elapsed_time": "12:52:41", "remaining_time": "3 days, 0:01:22", "throughput": 28490.16, "total_tokens": 1320839296} +{"current_steps": 4510, "total_steps": 29667, "loss": 0.393, "lr": 4.15098595550316e-05, "epoch": 0.4560882343646304, "percentage": 15.2, "elapsed_time": "12:54:24", "remaining_time": "2 days, 23:59:41", "throughput": 28490.24, "total_tokens": 1323784768} +{"current_steps": 4520, "total_steps": 29667, "loss": 0.3984, "lr": 4.1495562079474e-05, "epoch": 0.4570995164807382, "percentage": 15.24, "elapsed_time": "12:56:00", "remaining_time": "2 days, 23:57:18", "throughput": 28493.35, "total_tokens": 1326663360} +{"current_steps": 4530, "total_steps": 29667, "loss": 0.396, "lr": 4.148127936742749e-05, "epoch": 0.45811079859684606, "percentage": 15.27, "elapsed_time": "12:57:38", "remaining_time": "2 days, 23:55:09", "throughput": 28496.46, 
"total_tokens": 1329607552} +{"current_steps": 4540, "total_steps": 29667, "loss": 0.3918, "lr": 4.146701139350166e-05, "epoch": 0.4591220807129539, "percentage": 15.3, "elapsed_time": "12:59:20", "remaining_time": "2 days, 23:53:18", "throughput": 28497.5, "total_tokens": 1332553024} +{"current_steps": 4550, "total_steps": 29667, "loss": 0.3965, "lr": 4.1452758132367196e-05, "epoch": 0.4601333628290617, "percentage": 15.34, "elapsed_time": "13:01:01", "remaining_time": "2 days, 23:51:24", "throughput": 28499.85, "total_tokens": 1335540608} +{"current_steps": 4560, "total_steps": 29667, "loss": 0.3972, "lr": 4.1438519558755656e-05, "epoch": 0.46114464494516955, "percentage": 15.37, "elapsed_time": "13:02:40", "remaining_time": "2 days, 23:49:23", "throughput": 28501.56, "total_tokens": 1338460928} +{"current_steps": 4570, "total_steps": 29667, "loss": 0.3926, "lr": 4.1424295647459336e-05, "epoch": 0.4621559270612774, "percentage": 15.4, "elapsed_time": "13:04:18", "remaining_time": "2 days, 23:47:09", "throughput": 28504.47, "total_tokens": 1341374720} +{"current_steps": 4580, "total_steps": 29667, "loss": 0.3977, "lr": 4.141008637333106e-05, "epoch": 0.4631672091773852, "percentage": 15.44, "elapsed_time": "13:05:57", "remaining_time": "2 days, 23:45:03", "throughput": 28506.57, "total_tokens": 1344288704} +{"current_steps": 4590, "total_steps": 29667, "loss": 0.3956, "lr": 4.1395891711283974e-05, "epoch": 0.46417849129349303, "percentage": 15.47, "elapsed_time": "13:07:33", "remaining_time": "2 days, 23:42:45", "throughput": 28509.28, "total_tokens": 1347168448} +{"current_steps": 4600, "total_steps": 29667, "loss": 0.3961, "lr": 4.1381711636291395e-05, "epoch": 0.4651897734096009, "percentage": 15.51, "elapsed_time": "13:09:10", "remaining_time": "2 days, 23:40:28", "throughput": 28513.12, "total_tokens": 1350108608} +{"current_steps": 4610, "total_steps": 29667, "loss": 0.3896, "lr": 4.1367546123386604e-05, "epoch": 0.4662010555257087, "percentage": 15.54, 
"elapsed_time": "13:10:51", "remaining_time": "2 days, 23:38:36", "throughput": 28515.11, "total_tokens": 1353088000} +{"current_steps": 4620, "total_steps": 29667, "loss": 0.3962, "lr": 4.1353395147662673e-05, "epoch": 0.4672123376418165, "percentage": 15.57, "elapsed_time": "13:12:30", "remaining_time": "2 days, 23:36:34", "throughput": 28517.22, "total_tokens": 1356020928} +{"current_steps": 4630, "total_steps": 29667, "loss": 0.3952, "lr": 4.133925868427225e-05, "epoch": 0.46822361975792437, "percentage": 15.61, "elapsed_time": "13:14:10", "remaining_time": "2 days, 23:34:35", "throughput": 28519.49, "total_tokens": 1358979072} +{"current_steps": 4640, "total_steps": 29667, "loss": 0.3958, "lr": 4.132513670842744e-05, "epoch": 0.46923490187403216, "percentage": 15.64, "elapsed_time": "13:15:54", "remaining_time": "2 days, 23:32:57", "throughput": 28519.05, "total_tokens": 1361922560} +{"current_steps": 4650, "total_steps": 29667, "loss": 0.3972, "lr": 4.1311029195399534e-05, "epoch": 0.47024618399014, "percentage": 15.67, "elapsed_time": "13:17:32", "remaining_time": "2 days, 23:30:45", "throughput": 28521.41, "total_tokens": 1364817152} +{"current_steps": 4660, "total_steps": 29667, "loss": 0.3938, "lr": 4.129693612051892e-05, "epoch": 0.4712574661062478, "percentage": 15.71, "elapsed_time": "13:19:09", "remaining_time": "2 days, 23:28:33", "throughput": 28524.69, "total_tokens": 1367750848} +{"current_steps": 4670, "total_steps": 29667, "loss": 0.3939, "lr": 4.1282857459174826e-05, "epoch": 0.47226874822235565, "percentage": 15.74, "elapsed_time": "13:20:47", "remaining_time": "2 days, 23:26:20", "throughput": 28527.98, "total_tokens": 1370685504} +{"current_steps": 4680, "total_steps": 29667, "loss": 0.3905, "lr": 4.1268793186815184e-05, "epoch": 0.4732800303384635, "percentage": 15.78, "elapsed_time": "13:22:29", "remaining_time": "2 days, 23:24:34", "throughput": 28529.08, "total_tokens": 1373659136} +{"current_steps": 4690, "total_steps": 29667, "loss": 
0.3916, "lr": 4.1254743278946456e-05, "epoch": 0.4742913124545713, "percentage": 15.81, "elapsed_time": "13:24:05", "remaining_time": "2 days, 23:22:14", "throughput": 28532.42, "total_tokens": 1376556032} +{"current_steps": 4700, "total_steps": 29667, "loss": 0.3955, "lr": 4.1240707711133394e-05, "epoch": 0.47530259457067914, "percentage": 15.84, "elapsed_time": "13:25:43", "remaining_time": "2 days, 23:20:06", "throughput": 28534.48, "total_tokens": 1379454080} +{"current_steps": 4710, "total_steps": 29667, "loss": 0.3939, "lr": 4.122668645899893e-05, "epoch": 0.476313876686787, "percentage": 15.88, "elapsed_time": "13:27:23", "remaining_time": "2 days, 23:18:08", "throughput": 28536.25, "total_tokens": 1382391744} +{"current_steps": 4720, "total_steps": 29667, "loss": 0.3943, "lr": 4.1212679498223975e-05, "epoch": 0.4773251588028948, "percentage": 15.91, "elapsed_time": "13:28:58", "remaining_time": "2 days, 23:15:45", "throughput": 28540.33, "total_tokens": 1385308032} +{"current_steps": 4730, "total_steps": 29667, "loss": 0.392, "lr": 4.1198686804547215e-05, "epoch": 0.4783364409190026, "percentage": 15.94, "elapsed_time": "13:30:37", "remaining_time": "2 days, 23:13:43", "throughput": 28542.78, "total_tokens": 1388258368} +{"current_steps": 4740, "total_steps": 29667, "loss": 0.3927, "lr": 4.118470835376499e-05, "epoch": 0.4793477230351105, "percentage": 15.98, "elapsed_time": "13:32:16", "remaining_time": "2 days, 23:11:40", "throughput": 28545.02, "total_tokens": 1391195648} +{"current_steps": 4750, "total_steps": 29667, "loss": 0.392, "lr": 4.117074412173107e-05, "epoch": 0.48035900515121827, "percentage": 16.01, "elapsed_time": "13:33:50", "remaining_time": "2 days, 23:09:09", "throughput": 28548.97, "total_tokens": 1394063232} +{"current_steps": 4760, "total_steps": 29667, "loss": 0.3921, "lr": 4.115679408435648e-05, "epoch": 0.4813702872673261, "percentage": 16.04, "elapsed_time": "13:35:28", "remaining_time": "2 days, 23:07:03", "throughput": 28550.94, 
"total_tokens": 1396963328} +{"current_steps": 4770, "total_steps": 29667, "loss": 0.3972, "lr": 4.114285821760937e-05, "epoch": 0.48238156938343396, "percentage": 16.08, "elapsed_time": "13:37:06", "remaining_time": "2 days, 23:04:54", "throughput": 28554.1, "total_tokens": 1399910656} +{"current_steps": 4780, "total_steps": 29667, "loss": 0.3916, "lr": 4.11289364975148e-05, "epoch": 0.48339285149954175, "percentage": 16.11, "elapsed_time": "13:38:49", "remaining_time": "2 days, 23:03:13", "throughput": 28554.98, "total_tokens": 1402901696} +{"current_steps": 4790, "total_steps": 29667, "loss": 0.3942, "lr": 4.111502890015456e-05, "epoch": 0.4844041336156496, "percentage": 16.15, "elapsed_time": "13:40:23", "remaining_time": "2 days, 23:00:41", "throughput": 28559.22, "total_tokens": 1405771712} +{"current_steps": 4800, "total_steps": 29667, "loss": 0.3911, "lr": 4.1101135401667056e-05, "epoch": 0.4854154157317574, "percentage": 16.18, "elapsed_time": "13:41:59", "remaining_time": "2 days, 22:58:26", "throughput": 28562.12, "total_tokens": 1408673600} +{"current_steps": 4810, "total_steps": 29667, "loss": 0.3889, "lr": 4.108725597824708e-05, "epoch": 0.48642669784786524, "percentage": 16.21, "elapsed_time": "13:43:39", "remaining_time": "2 days, 22:56:26", "throughput": 28565.14, "total_tokens": 1411662016} +{"current_steps": 4820, "total_steps": 29667, "loss": 0.3919, "lr": 4.107339060614564e-05, "epoch": 0.4874379799639731, "percentage": 16.25, "elapsed_time": "13:45:17", "remaining_time": "2 days, 22:54:22", "throughput": 28567.45, "total_tokens": 1414594816} +{"current_steps": 4830, "total_steps": 29667, "loss": 0.3903, "lr": 4.1059539261669825e-05, "epoch": 0.4884492620800809, "percentage": 16.28, "elapsed_time": "13:46:54", "remaining_time": "2 days, 22:52:10", "throughput": 28570.46, "total_tokens": 1417513728} +{"current_steps": 4840, "total_steps": 29667, "loss": 0.3899, "lr": 4.104570192118262e-05, "epoch": 0.48946054419618873, "percentage": 16.31, 
"elapsed_time": "13:48:33", "remaining_time": "2 days, 22:50:05", "throughput": 28573.05, "total_tokens": 1420455040} +{"current_steps": 4850, "total_steps": 29667, "loss": 0.3916, "lr": 4.1031878561102714e-05, "epoch": 0.4904718263122966, "percentage": 16.35, "elapsed_time": "13:50:09", "remaining_time": "2 days, 22:47:52", "throughput": 28576.35, "total_tokens": 1423382976} +{"current_steps": 4860, "total_steps": 29667, "loss": 0.3908, "lr": 4.1018069157904385e-05, "epoch": 0.49148310842840437, "percentage": 16.38, "elapsed_time": "13:51:47", "remaining_time": "2 days, 22:45:44", "throughput": 28579.5, "total_tokens": 1426331904} +{"current_steps": 4870, "total_steps": 29667, "loss": 0.3917, "lr": 4.100427368811727e-05, "epoch": 0.4924943905445122, "percentage": 16.42, "elapsed_time": "13:53:28", "remaining_time": "2 days, 22:43:51", "throughput": 28581.21, "total_tokens": 1429298304} +{"current_steps": 4880, "total_steps": 29667, "loss": 0.389, "lr": 4.099049212832622e-05, "epoch": 0.49350567266062006, "percentage": 16.45, "elapsed_time": "13:55:04", "remaining_time": "2 days, 22:41:37", "throughput": 28583.87, "total_tokens": 1432190656} +{"current_steps": 4890, "total_steps": 29667, "loss": 0.39, "lr": 4.0976724455171155e-05, "epoch": 0.49451695477672786, "percentage": 16.48, "elapsed_time": "13:56:44", "remaining_time": "2 days, 22:39:37", "throughput": 28585.79, "total_tokens": 1435123712} +{"current_steps": 4900, "total_steps": 29667, "loss": 0.3919, "lr": 4.096297064534688e-05, "epoch": 0.4955282368928357, "percentage": 16.52, "elapsed_time": "13:58:22", "remaining_time": "2 days, 22:37:34", "throughput": 28587.7, "total_tokens": 1438039872} +{"current_steps": 4910, "total_steps": 29667, "loss": 0.3924, "lr": 4.0949230675602904e-05, "epoch": 0.49653951900894355, "percentage": 16.55, "elapsed_time": "14:00:05", "remaining_time": "2 days, 22:35:50", "throughput": 28588.77, "total_tokens": 1441021952} +{"current_steps": 4920, "total_steps": 29667, "loss": 
0.3875, "lr": 4.09355045227433e-05, "epoch": 0.49755080112505135, "percentage": 16.58, "elapsed_time": "14:01:48", "remaining_time": "2 days, 22:34:11", "throughput": 28590.23, "total_tokens": 1444049472} +{"current_steps": 4930, "total_steps": 29667, "loss": 0.3897, "lr": 4.092179216362654e-05, "epoch": 0.4985620832411592, "percentage": 16.62, "elapsed_time": "14:03:27", "remaining_time": "2 days, 22:32:12", "throughput": 28592.26, "total_tokens": 1446995456} +{"current_steps": 4940, "total_steps": 29667, "loss": 0.3912, "lr": 4.090809357516532e-05, "epoch": 0.499573365357267, "percentage": 16.65, "elapsed_time": "14:05:08", "remaining_time": "2 days, 22:30:18", "throughput": 28593.98, "total_tokens": 1449951808} +{"current_steps": 4950, "total_steps": 29667, "loss": 0.3935, "lr": 4.089440873432638e-05, "epoch": 0.5005846474733748, "percentage": 16.69, "elapsed_time": "14:06:45", "remaining_time": "2 days, 22:28:09", "throughput": 28596.33, "total_tokens": 1452856832} +{"current_steps": 4960, "total_steps": 29667, "loss": 0.394, "lr": 4.088073761813037e-05, "epoch": 0.5015959295894826, "percentage": 16.72, "elapsed_time": "14:08:26", "remaining_time": "2 days, 22:26:20", "throughput": 28597.76, "total_tokens": 1455824384} +{"current_steps": 4970, "total_steps": 29667, "loss": 0.3943, "lr": 4.086708020365172e-05, "epoch": 0.5026072117055905, "percentage": 16.75, "elapsed_time": "14:10:05", "remaining_time": "2 days, 22:24:18", "throughput": 28599.8, "total_tokens": 1458751296} +{"current_steps": 4980, "total_steps": 29667, "loss": 0.3926, "lr": 4.0853436468018354e-05, "epoch": 0.5036184938216983, "percentage": 16.79, "elapsed_time": "14:11:42", "remaining_time": "2 days, 22:22:05", "throughput": 28602.83, "total_tokens": 1461669760} +{"current_steps": 4990, "total_steps": 29667, "loss": 0.3944, "lr": 4.0839806388411686e-05, "epoch": 0.5046297759378061, "percentage": 16.82, "elapsed_time": "14:13:23", "remaining_time": "2 days, 22:20:15", "throughput": 28604.23, 
"total_tokens": 1464629824} +{"current_steps": 5000, "total_steps": 29667, "loss": 0.3946, "lr": 4.0826189942066346e-05, "epoch": 0.505641058053914, "percentage": 16.85, "elapsed_time": "14:14:58", "remaining_time": "2 days, 22:17:53", "throughput": 28607.38, "total_tokens": 1467501760} +{"current_steps": 5000, "total_steps": 29667, "eval_loss": 0.33851784467697144, "epoch": 0.505641058053914, "percentage": 16.85, "elapsed_time": "14:14:59", "remaining_time": "2 days, 22:18:02", "throughput": 28606.39, "total_tokens": 1467501760} +{"current_steps": 5010, "total_steps": 29667, "loss": 0.3941, "lr": 4.081258710627008e-05, "epoch": 0.5066523401700218, "percentage": 16.89, "elapsed_time": "14:17:09", "remaining_time": "2 days, 22:18:32", "throughput": 28591.93, "total_tokens": 1470466944} +{"current_steps": 5020, "total_steps": 29667, "loss": 0.3887, "lr": 4.0798997858363557e-05, "epoch": 0.5076636222861296, "percentage": 16.92, "elapsed_time": "14:18:47", "remaining_time": "2 days, 22:16:25", "throughput": 28594.86, "total_tokens": 1473408768} +{"current_steps": 5030, "total_steps": 29667, "loss": 0.3945, "lr": 4.078542217574024e-05, "epoch": 0.5086749044022375, "percentage": 16.95, "elapsed_time": "14:20:27", "remaining_time": "2 days, 22:14:31", "throughput": 28596.78, "total_tokens": 1476377088} +{"current_steps": 5040, "total_steps": 29667, "loss": 0.3914, "lr": 4.0771860035846196e-05, "epoch": 0.5096861865183453, "percentage": 16.99, "elapsed_time": "14:22:07", "remaining_time": "2 days, 22:12:36", "throughput": 28598.23, "total_tokens": 1479316096} +{"current_steps": 5050, "total_steps": 29667, "loss": 0.3917, "lr": 4.0758311416179965e-05, "epoch": 0.5106974686344531, "percentage": 17.02, "elapsed_time": "14:23:42", "remaining_time": "2 days, 22:10:14", "throughput": 28602.79, "total_tokens": 1482256448} +{"current_steps": 5060, "total_steps": 29667, "loss": 0.3875, "lr": 4.0744776294292386e-05, "epoch": 0.511708750750561, "percentage": 17.06, "elapsed_time": 
"14:25:22", "remaining_time": "2 days, 22:08:19", "throughput": 28604.59, "total_tokens": 1485208768} +{"current_steps": 5070, "total_steps": 29667, "loss": 0.3919, "lr": 4.073125464778646e-05, "epoch": 0.5127200328666688, "percentage": 17.09, "elapsed_time": "14:27:00", "remaining_time": "2 days, 22:06:15", "throughput": 28607.29, "total_tokens": 1488159680} +{"current_steps": 5080, "total_steps": 29667, "loss": 0.3854, "lr": 4.071774645431717e-05, "epoch": 0.5137313149827766, "percentage": 17.12, "elapsed_time": "14:28:37", "remaining_time": "2 days, 22:04:04", "throughput": 28610.63, "total_tokens": 1491102464} +{"current_steps": 5090, "total_steps": 29667, "loss": 0.3887, "lr": 4.070425169159135e-05, "epoch": 0.5147425970988845, "percentage": 17.16, "elapsed_time": "14:30:16", "remaining_time": "2 days, 22:02:05", "throughput": 28612.9, "total_tokens": 1494057728} +{"current_steps": 5100, "total_steps": 29667, "loss": 0.3876, "lr": 4.069077033736751e-05, "epoch": 0.5157538792149923, "percentage": 17.19, "elapsed_time": "14:31:53", "remaining_time": "2 days, 21:59:58", "throughput": 28615.75, "total_tokens": 1496999168} +{"current_steps": 5110, "total_steps": 29667, "loss": 0.394, "lr": 4.06773023694557e-05, "epoch": 0.5167651613311001, "percentage": 17.22, "elapsed_time": "14:33:32", "remaining_time": "2 days, 21:57:58", "throughput": 28617.14, "total_tokens": 1499902784} +{"current_steps": 5120, "total_steps": 29667, "loss": 0.3927, "lr": 4.066384776571732e-05, "epoch": 0.517776443447208, "percentage": 17.26, "elapsed_time": "14:35:10", "remaining_time": "2 days, 21:55:50", "throughput": 28619.6, "total_tokens": 1502816832} +{"current_steps": 5130, "total_steps": 29667, "loss": 0.3889, "lr": 4.065040650406504e-05, "epoch": 0.5187877255633158, "percentage": 17.29, "elapsed_time": "14:36:46", "remaining_time": "2 days, 21:53:38", "throughput": 28621.9, "total_tokens": 1505694400} +{"current_steps": 5140, "total_steps": 29667, "loss": 0.3913, "lr": 
4.0636978562462576e-05, "epoch": 0.5197990076794236, "percentage": 17.33, "elapsed_time": "14:38:26", "remaining_time": "2 days, 21:51:46", "throughput": 28623.24, "total_tokens": 1508641024} +{"current_steps": 5150, "total_steps": 29667, "loss": 0.3891, "lr": 4.062356391892456e-05, "epoch": 0.5208102897955313, "percentage": 17.36, "elapsed_time": "14:40:03", "remaining_time": "2 days, 21:49:37", "throughput": 28626.07, "total_tokens": 1511568704} +{"current_steps": 5160, "total_steps": 29667, "loss": 0.3871, "lr": 4.0610162551516395e-05, "epoch": 0.5218215719116392, "percentage": 17.39, "elapsed_time": "14:41:42", "remaining_time": "2 days, 21:47:38", "throughput": 28627.15, "total_tokens": 1514459904} +{"current_steps": 5170, "total_steps": 29667, "loss": 0.3904, "lr": 4.059677443835412e-05, "epoch": 0.522832854027747, "percentage": 17.43, "elapsed_time": "14:43:22", "remaining_time": "2 days, 21:45:42", "throughput": 28628.76, "total_tokens": 1517403456} +{"current_steps": 5180, "total_steps": 29667, "loss": 0.386, "lr": 4.058339955760423e-05, "epoch": 0.5238441361438548, "percentage": 17.46, "elapsed_time": "14:45:02", "remaining_time": "2 days, 21:43:45", "throughput": 28630.45, "total_tokens": 1520338112} +{"current_steps": 5190, "total_steps": 29667, "loss": 0.3871, "lr": 4.0570037887483535e-05, "epoch": 0.5248554182599627, "percentage": 17.49, "elapsed_time": "14:46:41", "remaining_time": "2 days, 21:41:48", "throughput": 28632.37, "total_tokens": 1523284224} +{"current_steps": 5200, "total_steps": 29667, "loss": 0.3858, "lr": 4.0556689406259025e-05, "epoch": 0.5258667003760705, "percentage": 17.53, "elapsed_time": "14:48:18", "remaining_time": "2 days, 21:39:41", "throughput": 28634.91, "total_tokens": 1526207744} +{"current_steps": 5210, "total_steps": 29667, "loss": 0.3927, "lr": 4.054335409224771e-05, "epoch": 0.5268779824921783, "percentage": 17.56, "elapsed_time": "14:49:54", "remaining_time": "2 days, 21:37:26", "throughput": 28637.69, 
"total_tokens": 1529095424} +{"current_steps": 5220, "total_steps": 29667, "loss": 0.3892, "lr": 4.053003192381646e-05, "epoch": 0.5278892646082862, "percentage": 17.6, "elapsed_time": "14:51:35", "remaining_time": "2 days, 21:35:36", "throughput": 28638.87, "total_tokens": 1532049152} +{"current_steps": 5230, "total_steps": 29667, "loss": 0.3924, "lr": 4.051672287938189e-05, "epoch": 0.528900546724394, "percentage": 17.63, "elapsed_time": "14:53:14", "remaining_time": "2 days, 21:33:36", "throughput": 28640.92, "total_tokens": 1534985344} +{"current_steps": 5240, "total_steps": 29667, "loss": 0.3946, "lr": 4.050342693741019e-05, "epoch": 0.5299118288405018, "percentage": 17.66, "elapsed_time": "14:54:53", "remaining_time": "2 days, 21:31:38", "throughput": 28642.59, "total_tokens": 1537911744} +{"current_steps": 5250, "total_steps": 29667, "loss": 0.3908, "lr": 4.049014407641699e-05, "epoch": 0.5309231109566097, "percentage": 17.7, "elapsed_time": "14:56:35", "remaining_time": "2 days, 21:29:53", "throughput": 28644.06, "total_tokens": 1540909952} +{"current_steps": 5260, "total_steps": 29667, "loss": 0.3908, "lr": 4.047687427496717e-05, "epoch": 0.5319343930727175, "percentage": 17.73, "elapsed_time": "14:58:11", "remaining_time": "2 days, 21:27:44", "throughput": 28646.72, "total_tokens": 1543823488} +{"current_steps": 5270, "total_steps": 29667, "loss": 0.3899, "lr": 4.046361751167479e-05, "epoch": 0.5329456751888253, "percentage": 17.76, "elapsed_time": "14:59:40", "remaining_time": "2 days, 21:25:00", "throughput": 28651.47, "total_tokens": 1546633792} +{"current_steps": 5280, "total_steps": 29667, "loss": 0.3915, "lr": 4.045037376520292e-05, "epoch": 0.5339569573049332, "percentage": 17.8, "elapsed_time": "15:01:21", "remaining_time": "2 days, 21:23:08", "throughput": 28652.52, "total_tokens": 1549567936} +{"current_steps": 5290, "total_steps": 29667, "loss": 0.3884, "lr": 4.043714301426344e-05, "epoch": 0.534968239421041, "percentage": 17.83, 
"elapsed_time": "15:03:02", "remaining_time": "2 days, 21:21:19", "throughput": 28653.7, "total_tokens": 1552523712} +{"current_steps": 5300, "total_steps": 29667, "loss": 0.3868, "lr": 4.042392523761696e-05, "epoch": 0.5359795215371488, "percentage": 17.86, "elapsed_time": "15:04:42", "remaining_time": "2 days, 21:19:24", "throughput": 28654.26, "total_tokens": 1555413504} +{"current_steps": 5310, "total_steps": 29667, "loss": 0.3881, "lr": 4.041072041407267e-05, "epoch": 0.5369908036532567, "percentage": 17.9, "elapsed_time": "15:06:18", "remaining_time": "2 days, 21:17:16", "throughput": 28657.45, "total_tokens": 1558363072} +{"current_steps": 5320, "total_steps": 29667, "loss": 0.389, "lr": 4.039752852248815e-05, "epoch": 0.5380020857693645, "percentage": 17.93, "elapsed_time": "15:07:54", "remaining_time": "2 days, 21:15:02", "throughput": 28660.01, "total_tokens": 1561239488} +{"current_steps": 5330, "total_steps": 29667, "loss": 0.3843, "lr": 4.0384349541769286e-05, "epoch": 0.5390133678854723, "percentage": 17.97, "elapsed_time": "15:09:36", "remaining_time": "2 days, 21:13:17", "throughput": 28660.88, "total_tokens": 1564200896} +{"current_steps": 5340, "total_steps": 29667, "loss": 0.3898, "lr": 4.037118345087011e-05, "epoch": 0.5400246500015802, "percentage": 18.0, "elapsed_time": "15:11:14", "remaining_time": "2 days, 21:11:16", "throughput": 28662.44, "total_tokens": 1567105152} +{"current_steps": 5350, "total_steps": 29667, "loss": 0.3804, "lr": 4.0358030228792636e-05, "epoch": 0.541035932117688, "percentage": 18.03, "elapsed_time": "15:12:52", "remaining_time": "2 days, 21:09:15", "throughput": 28664.95, "total_tokens": 1570061504} +{"current_steps": 5360, "total_steps": 29667, "loss": 0.3903, "lr": 4.034488985458673e-05, "epoch": 0.5420472142337958, "percentage": 18.07, "elapsed_time": "15:14:26", "remaining_time": "2 days, 21:06:51", "throughput": 28669.22, "total_tokens": 1572967872} +{"current_steps": 5370, "total_steps": 29667, "loss": 0.3862, 
"lr": 4.033176230735001e-05, "epoch": 0.5430584963499037, "percentage": 18.1, "elapsed_time": "15:16:05", "remaining_time": "2 days, 21:04:57", "throughput": 28670.85, "total_tokens": 1575917632} +{"current_steps": 5380, "total_steps": 29667, "loss": 0.3852, "lr": 4.0318647566227626e-05, "epoch": 0.5440697784660115, "percentage": 18.13, "elapsed_time": "15:17:48", "remaining_time": "2 days, 21:03:17", "throughput": 28671.53, "total_tokens": 1578905792} +{"current_steps": 5390, "total_steps": 29667, "loss": 0.3885, "lr": 4.0305545610412205e-05, "epoch": 0.5450810605821192, "percentage": 18.17, "elapsed_time": "15:19:28", "remaining_time": "2 days, 21:01:22", "throughput": 28673.02, "total_tokens": 1581844864} +{"current_steps": 5400, "total_steps": 29667, "loss": 0.3896, "lr": 4.029245641914365e-05, "epoch": 0.5460923426982272, "percentage": 18.2, "elapsed_time": "15:21:06", "remaining_time": "2 days, 20:59:20", "throughput": 28675.21, "total_tokens": 1584769984} +{"current_steps": 5410, "total_steps": 29667, "loss": 0.3898, "lr": 4.027937997170904e-05, "epoch": 0.5471036248143349, "percentage": 18.24, "elapsed_time": "15:22:45", "remaining_time": "2 days, 20:57:22", "throughput": 28677.3, "total_tokens": 1587720576} +{"current_steps": 5420, "total_steps": 29667, "loss": 0.3897, "lr": 4.026631624744247e-05, "epoch": 0.5481149069304427, "percentage": 18.27, "elapsed_time": "15:24:20", "remaining_time": "2 days, 20:55:08", "throughput": 28679.94, "total_tokens": 1590598400} +{"current_steps": 5430, "total_steps": 29667, "loss": 0.3864, "lr": 4.025326522572493e-05, "epoch": 0.5491261890465505, "percentage": 18.3, "elapsed_time": "15:25:56", "remaining_time": "2 days, 20:52:59", "throughput": 28681.93, "total_tokens": 1593473728} +{"current_steps": 5440, "total_steps": 29667, "loss": 0.3875, "lr": 4.024022688598415e-05, "epoch": 0.5501374711626584, "percentage": 18.34, "elapsed_time": "15:27:36", "remaining_time": "2 days, 20:51:07", "throughput": 28682.73, 
"total_tokens": 1596390016} +{"current_steps": 5450, "total_steps": 29667, "loss": 0.3855, "lr": 4.0227201207694494e-05, "epoch": 0.5511487532787662, "percentage": 18.37, "elapsed_time": "15:29:12", "remaining_time": "2 days, 20:48:55", "throughput": 28685.72, "total_tokens": 1599299904} +{"current_steps": 5460, "total_steps": 29667, "loss": 0.3884, "lr": 4.021418817037677e-05, "epoch": 0.552160035394874, "percentage": 18.4, "elapsed_time": "15:30:46", "remaining_time": "2 days, 20:46:34", "throughput": 28689.25, "total_tokens": 1602181952} +{"current_steps": 5470, "total_steps": 29667, "loss": 0.3828, "lr": 4.0201187753598174e-05, "epoch": 0.5531713175109819, "percentage": 18.44, "elapsed_time": "15:32:25", "remaining_time": "2 days, 20:44:37", "throughput": 28691.05, "total_tokens": 1605123328} +{"current_steps": 5480, "total_steps": 29667, "loss": 0.3847, "lr": 4.018819993697208e-05, "epoch": 0.5541825996270897, "percentage": 18.47, "elapsed_time": "15:34:04", "remaining_time": "2 days, 20:42:41", "throughput": 28693.09, "total_tokens": 1608079168} +{"current_steps": 5490, "total_steps": 29667, "loss": 0.396, "lr": 4.017522470015793e-05, "epoch": 0.5551938817431975, "percentage": 18.51, "elapsed_time": "15:35:43", "remaining_time": "2 days, 20:40:45", "throughput": 28695.3, "total_tokens": 1611053312} +{"current_steps": 5500, "total_steps": 29667, "loss": 0.3805, "lr": 4.0162262022861144e-05, "epoch": 0.5562051638593054, "percentage": 18.54, "elapsed_time": "15:37:19", "remaining_time": "2 days, 20:38:38", "throughput": 28697.8, "total_tokens": 1613960960} +{"current_steps": 5510, "total_steps": 29667, "loss": 0.3864, "lr": 4.0149311884832906e-05, "epoch": 0.5572164459754132, "percentage": 18.57, "elapsed_time": "15:38:56", "remaining_time": "2 days, 20:36:31", "throughput": 28700.35, "total_tokens": 1616881024} +{"current_steps": 5520, "total_steps": 29667, "loss": 0.3895, "lr": 4.0136374265870116e-05, "epoch": 0.558227728091521, "percentage": 18.61, 
"elapsed_time": "15:40:37", "remaining_time": "2 days, 20:34:43", "throughput": 28701.81, "total_tokens": 1619859840} +{"current_steps": 5530, "total_steps": 29667, "loss": 0.3882, "lr": 4.0123449145815174e-05, "epoch": 0.5592390102076289, "percentage": 18.64, "elapsed_time": "15:42:17", "remaining_time": "2 days, 20:32:51", "throughput": 28702.51, "total_tokens": 1622767040} +{"current_steps": 5540, "total_steps": 29667, "loss": 0.3863, "lr": 4.011053650455592e-05, "epoch": 0.5602502923237367, "percentage": 18.67, "elapsed_time": "15:43:55", "remaining_time": "2 days, 20:30:50", "throughput": 28704.28, "total_tokens": 1625683072} +{"current_steps": 5550, "total_steps": 29667, "loss": 0.3861, "lr": 4.0097636322025466e-05, "epoch": 0.5612615744398445, "percentage": 18.71, "elapsed_time": "15:45:33", "remaining_time": "2 days, 20:28:50", "throughput": 28706.18, "total_tokens": 1628606016} +{"current_steps": 5560, "total_steps": 29667, "loss": 0.3898, "lr": 4.008474857820206e-05, "epoch": 0.5622728565559524, "percentage": 18.74, "elapsed_time": "15:47:12", "remaining_time": "2 days, 20:26:53", "throughput": 28708.37, "total_tokens": 1631565632} +{"current_steps": 5570, "total_steps": 29667, "loss": 0.388, "lr": 4.007187325310899e-05, "epoch": 0.5632841386720602, "percentage": 18.78, "elapsed_time": "15:48:51", "remaining_time": "2 days, 20:24:56", "throughput": 28710.39, "total_tokens": 1634515136} +{"current_steps": 5580, "total_steps": 29667, "loss": 0.3911, "lr": 4.00590103268144e-05, "epoch": 0.564295420788168, "percentage": 18.81, "elapsed_time": "15:50:27", "remaining_time": "2 days, 20:22:50", "throughput": 28713.44, "total_tokens": 1637466432} +{"current_steps": 5590, "total_steps": 29667, "loss": 0.3833, "lr": 4.004615977943124e-05, "epoch": 0.5653067029042759, "percentage": 18.84, "elapsed_time": "15:52:07", "remaining_time": "2 days, 20:20:57", "throughput": 28715.11, "total_tokens": 1640427520} +{"current_steps": 5600, "total_steps": 29667, "loss": 0.3868, 
"lr": 4.0033321591117025e-05, "epoch": 0.5663179850203837, "percentage": 18.88, "elapsed_time": "15:53:44", "remaining_time": "2 days, 20:18:53", "throughput": 28717.96, "total_tokens": 1643374912} +{"current_steps": 5610, "total_steps": 29667, "loss": 0.3918, "lr": 4.002049574207381e-05, "epoch": 0.5673292671364915, "percentage": 18.91, "elapsed_time": "15:55:23", "remaining_time": "2 days, 20:16:57", "throughput": 28719.96, "total_tokens": 1646335232} +{"current_steps": 5620, "total_steps": 29667, "loss": 0.3901, "lr": 4.000768221254803e-05, "epoch": 0.5683405492525994, "percentage": 18.94, "elapsed_time": "15:57:05", "remaining_time": "2 days, 20:15:11", "throughput": 28719.93, "total_tokens": 1649244032} +{"current_steps": 5630, "total_steps": 29667, "loss": 0.3886, "lr": 3.999488098283034e-05, "epoch": 0.5693518313687072, "percentage": 18.98, "elapsed_time": "15:58:43", "remaining_time": "2 days, 20:13:11", "throughput": 28721.48, "total_tokens": 1652146752} +{"current_steps": 5640, "total_steps": 29667, "loss": 0.3858, "lr": 3.9982092033255506e-05, "epoch": 0.5703631134848149, "percentage": 19.01, "elapsed_time": "16:00:21", "remaining_time": "2 days, 20:11:12", "throughput": 28723.39, "total_tokens": 1655078336} +{"current_steps": 5650, "total_steps": 29667, "loss": 0.3856, "lr": 3.996931534420232e-05, "epoch": 0.5713743956009228, "percentage": 19.04, "elapsed_time": "16:02:00", "remaining_time": "2 days, 20:09:16", "throughput": 28724.51, "total_tokens": 1657985408} +{"current_steps": 5660, "total_steps": 29667, "loss": 0.3832, "lr": 3.995655089609339e-05, "epoch": 0.5723856777170306, "percentage": 19.08, "elapsed_time": "16:03:39", "remaining_time": "2 days, 20:07:21", "throughput": 28726.01, "total_tokens": 1660918656} +{"current_steps": 5670, "total_steps": 29667, "loss": 0.3842, "lr": 3.994379866939511e-05, "epoch": 0.5733969598331384, "percentage": 19.11, "elapsed_time": "16:05:15", "remaining_time": "2 days, 20:05:12", "throughput": 28728.45, 
"total_tokens": 1663811904} +{"current_steps": 5680, "total_steps": 29667, "loss": 0.3879, "lr": 3.993105864461745e-05, "epoch": 0.5744082419492463, "percentage": 19.15, "elapsed_time": "16:06:52", "remaining_time": "2 days, 20:03:08", "throughput": 28730.15, "total_tokens": 1666696320} +{"current_steps": 5690, "total_steps": 29667, "loss": 0.3857, "lr": 3.9918330802313866e-05, "epoch": 0.5754195240653541, "percentage": 19.18, "elapsed_time": "16:08:32", "remaining_time": "2 days, 20:01:20", "throughput": 28730.98, "total_tokens": 1669640192} +{"current_steps": 5700, "total_steps": 29667, "loss": 0.3879, "lr": 3.9905615123081206e-05, "epoch": 0.5764308061814619, "percentage": 19.21, "elapsed_time": "16:10:12", "remaining_time": "2 days, 19:59:26", "throughput": 28732.94, "total_tokens": 1672607232} +{"current_steps": 5710, "total_steps": 29667, "loss": 0.3834, "lr": 3.989291158755953e-05, "epoch": 0.5774420882975697, "percentage": 19.25, "elapsed_time": "16:11:47", "remaining_time": "2 days, 19:57:17", "throughput": 28735.24, "total_tokens": 1675486848} +{"current_steps": 5720, "total_steps": 29667, "loss": 0.3864, "lr": 3.988022017643201e-05, "epoch": 0.5784533704136776, "percentage": 19.28, "elapsed_time": "16:13:25", "remaining_time": "2 days, 19:55:18", "throughput": 28737.07, "total_tokens": 1678413312} +{"current_steps": 5730, "total_steps": 29667, "loss": 0.3882, "lr": 3.9867540870424826e-05, "epoch": 0.5794646525297854, "percentage": 19.31, "elapsed_time": "16:15:03", "remaining_time": "2 days, 19:53:16", "throughput": 28738.61, "total_tokens": 1681300928} +{"current_steps": 5740, "total_steps": 29667, "loss": 0.3846, "lr": 3.985487365030702e-05, "epoch": 0.5804759346458932, "percentage": 19.35, "elapsed_time": "16:16:43", "remaining_time": "2 days, 19:51:26", "throughput": 28739.75, "total_tokens": 1684244736} +{"current_steps": 5750, "total_steps": 29667, "loss": 0.3839, "lr": 3.984221849689036e-05, "epoch": 0.5814872167620011, "percentage": 19.38, 
"elapsed_time": "16:18:20", "remaining_time": "2 days, 19:49:25", "throughput": 28742.36, "total_tokens": 1687201536} +{"current_steps": 5760, "total_steps": 29667, "loss": 0.3878, "lr": 3.982957539102927e-05, "epoch": 0.5824984988781089, "percentage": 19.42, "elapsed_time": "16:20:01", "remaining_time": "2 days, 19:47:36", "throughput": 28743.43, "total_tokens": 1690153728} +{"current_steps": 5770, "total_steps": 29667, "loss": 0.3897, "lr": 3.981694431362065e-05, "epoch": 0.5835097809942167, "percentage": 19.45, "elapsed_time": "16:21:41", "remaining_time": "2 days, 19:45:47", "throughput": 28744.14, "total_tokens": 1693083968} +{"current_steps": 5780, "total_steps": 29667, "loss": 0.3862, "lr": 3.9804325245603786e-05, "epoch": 0.5845210631103246, "percentage": 19.48, "elapsed_time": "16:23:22", "remaining_time": "2 days, 19:44:00", "throughput": 28745.14, "total_tokens": 1696041472} +{"current_steps": 5790, "total_steps": 29667, "loss": 0.3857, "lr": 3.9791718167960226e-05, "epoch": 0.5855323452264324, "percentage": 19.52, "elapsed_time": "16:25:04", "remaining_time": "2 days, 19:42:16", "throughput": 28745.84, "total_tokens": 1699001536} +{"current_steps": 5800, "total_steps": 29667, "loss": 0.3826, "lr": 3.9779123061713665e-05, "epoch": 0.5865436273425402, "percentage": 19.55, "elapsed_time": "16:26:43", "remaining_time": "2 days, 19:40:23", "throughput": 28746.84, "total_tokens": 1701922432} +{"current_steps": 5810, "total_steps": 29667, "loss": 0.3858, "lr": 3.976653990792979e-05, "epoch": 0.5875549094586481, "percentage": 19.58, "elapsed_time": "16:28:21", "remaining_time": "2 days, 19:38:21", "throughput": 28748.68, "total_tokens": 1704828672} +{"current_steps": 5820, "total_steps": 29667, "loss": 0.3855, "lr": 3.9753968687716206e-05, "epoch": 0.5885661915747559, "percentage": 19.62, "elapsed_time": "16:29:58", "remaining_time": "2 days, 19:36:22", "throughput": 28750.42, "total_tokens": 1707742144} +{"current_steps": 5830, "total_steps": 29667, "loss": 
0.3827, "lr": 3.974140938222232e-05, "epoch": 0.5895774736908637, "percentage": 19.65, "elapsed_time": "16:31:37", "remaining_time": "2 days, 19:34:25", "throughput": 28751.52, "total_tokens": 1710637376} +{"current_steps": 5840, "total_steps": 29667, "loss": 0.3868, "lr": 3.972886197263915e-05, "epoch": 0.5905887558069716, "percentage": 19.69, "elapsed_time": "16:33:15", "remaining_time": "2 days, 19:32:28", "throughput": 28753.2, "total_tokens": 1713568512} +{"current_steps": 5850, "total_steps": 29667, "loss": 0.3864, "lr": 3.97163264401993e-05, "epoch": 0.5916000379230794, "percentage": 19.72, "elapsed_time": "16:34:50", "remaining_time": "2 days, 19:30:18", "throughput": 28755.44, "total_tokens": 1716440448} +{"current_steps": 5860, "total_steps": 29667, "loss": 0.3872, "lr": 3.970380276617677e-05, "epoch": 0.5926113200391872, "percentage": 19.75, "elapsed_time": "16:36:29", "remaining_time": "2 days, 19:28:21", "throughput": 28756.84, "total_tokens": 1719353216} +{"current_steps": 5870, "total_steps": 29667, "loss": 0.3894, "lr": 3.96912909318869e-05, "epoch": 0.593622602155295, "percentage": 19.79, "elapsed_time": "16:38:07", "remaining_time": "2 days, 19:26:25", "throughput": 28758.76, "total_tokens": 1722299968} +{"current_steps": 5880, "total_steps": 29667, "loss": 0.3876, "lr": 3.96787909186862e-05, "epoch": 0.5946338842714028, "percentage": 19.82, "elapsed_time": "16:39:48", "remaining_time": "2 days, 19:24:36", "throughput": 28759.79, "total_tokens": 1725245824} +{"current_steps": 5890, "total_steps": 29667, "loss": 0.3918, "lr": 3.9666302707972244e-05, "epoch": 0.5956451663875106, "percentage": 19.85, "elapsed_time": "16:41:25", "remaining_time": "2 days, 19:22:35", "throughput": 28761.52, "total_tokens": 1728151296} +{"current_steps": 5900, "total_steps": 29667, "loss": 0.385, "lr": 3.965382628118358e-05, "epoch": 0.5966564485036185, "percentage": 19.89, "elapsed_time": "16:43:02", "remaining_time": "2 days, 19:20:32", "throughput": 28763.56, 
"total_tokens": 1731056256} +{"current_steps": 5910, "total_steps": 29667, "loss": 0.3868, "lr": 3.964136161979959e-05, "epoch": 0.5976677306197263, "percentage": 19.92, "elapsed_time": "16:44:42", "remaining_time": "2 days, 19:18:43", "throughput": 28764.36, "total_tokens": 1733985792} +{"current_steps": 5920, "total_steps": 29667, "loss": 0.3855, "lr": 3.9628908705340406e-05, "epoch": 0.5986790127358341, "percentage": 19.95, "elapsed_time": "16:46:23", "remaining_time": "2 days, 19:16:57", "throughput": 28765.58, "total_tokens": 1736967232} +{"current_steps": 5930, "total_steps": 29667, "loss": 0.385, "lr": 3.961646751936673e-05, "epoch": 0.599690294851942, "percentage": 19.99, "elapsed_time": "16:48:02", "remaining_time": "2 days, 19:15:03", "throughput": 28766.9, "total_tokens": 1739892480} +{"current_steps": 5940, "total_steps": 29667, "loss": 0.3861, "lr": 3.960403804347979e-05, "epoch": 0.6007015769680498, "percentage": 20.02, "elapsed_time": "16:49:40", "remaining_time": "2 days, 19:13:03", "throughput": 28768.79, "total_tokens": 1742815488} +{"current_steps": 5950, "total_steps": 29667, "loss": 0.3872, "lr": 3.959162025932119e-05, "epoch": 0.6017128590841576, "percentage": 20.06, "elapsed_time": "16:51:22", "remaining_time": "2 days, 19:11:24", "throughput": 28768.7, "total_tokens": 1745765504} +{"current_steps": 5960, "total_steps": 29667, "loss": 0.3895, "lr": 3.95792141485728e-05, "epoch": 0.6027241412002654, "percentage": 20.09, "elapsed_time": "16:53:01", "remaining_time": "2 days, 19:09:28", "throughput": 28770.29, "total_tokens": 1748694336} +{"current_steps": 5970, "total_steps": 29667, "loss": 0.3851, "lr": 3.956681969295664e-05, "epoch": 0.6037354233163733, "percentage": 20.12, "elapsed_time": "16:54:41", "remaining_time": "2 days, 19:07:38", "throughput": 28771.46, "total_tokens": 1751643904} +{"current_steps": 5980, "total_steps": 29667, "loss": 0.3804, "lr": 3.955443687423479e-05, "epoch": 0.6047467054324811, "percentage": 20.16, 
"elapsed_time": "16:56:17", "remaining_time": "2 days, 19:05:35", "throughput": 28773.2, "total_tokens": 1754525376} +{"current_steps": 5990, "total_steps": 29667, "loss": 0.3862, "lr": 3.954206567420924e-05, "epoch": 0.6057579875485889, "percentage": 20.19, "elapsed_time": "16:57:57", "remaining_time": "2 days, 19:03:44", "throughput": 28774.27, "total_tokens": 1757459264} +{"current_steps": 6000, "total_steps": 29667, "loss": 0.3838, "lr": 3.952970607472179e-05, "epoch": 0.6067692696646968, "percentage": 20.22, "elapsed_time": "16:59:36", "remaining_time": "2 days, 19:01:49", "throughput": 28775.34, "total_tokens": 1760362880} +{"current_steps": 6010, "total_steps": 29667, "loss": 0.3885, "lr": 3.951735805765399e-05, "epoch": 0.6077805517808046, "percentage": 20.26, "elapsed_time": "17:01:13", "remaining_time": "2 days, 18:59:51", "throughput": 28777.88, "total_tokens": 1763335104} +{"current_steps": 6020, "total_steps": 29667, "loss": 0.3819, "lr": 3.950502160492692e-05, "epoch": 0.6087918338969124, "percentage": 20.29, "elapsed_time": "17:02:52", "remaining_time": "2 days, 18:57:53", "throughput": 28779.33, "total_tokens": 1766246592} +{"current_steps": 6030, "total_steps": 29667, "loss": 0.3863, "lr": 3.9492696698501205e-05, "epoch": 0.6098031160130203, "percentage": 20.33, "elapsed_time": "17:04:30", "remaining_time": "2 days, 18:55:58", "throughput": 28781.41, "total_tokens": 1769212800} +{"current_steps": 6040, "total_steps": 29667, "loss": 0.3846, "lr": 3.9480383320376784e-05, "epoch": 0.6108143981291281, "percentage": 20.36, "elapsed_time": "17:06:12", "remaining_time": "2 days, 18:54:14", "throughput": 28781.87, "total_tokens": 1772159616} +{"current_steps": 6050, "total_steps": 29667, "loss": 0.385, "lr": 3.94680814525929e-05, "epoch": 0.6118256802452359, "percentage": 20.39, "elapsed_time": "17:07:50", "remaining_time": "2 days, 18:52:20", "throughput": 28783.29, "total_tokens": 1775091840} +{"current_steps": 6060, "total_steps": 29667, "loss": 0.3856, 
"lr": 3.945579107722792e-05, "epoch": 0.6128369623613438, "percentage": 20.43, "elapsed_time": "17:09:24", "remaining_time": "2 days, 18:50:06", "throughput": 28786.56, "total_tokens": 1777991104} +{"current_steps": 6070, "total_steps": 29667, "loss": 0.3875, "lr": 3.9443512176399276e-05, "epoch": 0.6138482444774516, "percentage": 20.46, "elapsed_time": "17:11:01", "remaining_time": "2 days, 18:48:03", "throughput": 28788.63, "total_tokens": 1780894400} +{"current_steps": 6080, "total_steps": 29667, "loss": 0.3836, "lr": 3.9431244732263307e-05, "epoch": 0.6148595265935594, "percentage": 20.49, "elapsed_time": "17:12:45", "remaining_time": "2 days, 18:46:32", "throughput": 28788.69, "total_tokens": 1783916544} +{"current_steps": 6090, "total_steps": 29667, "loss": 0.386, "lr": 3.941898872701519e-05, "epoch": 0.6158708087096673, "percentage": 20.53, "elapsed_time": "17:14:23", "remaining_time": "2 days, 18:44:34", "throughput": 28791.04, "total_tokens": 1786870400} +{"current_steps": 6100, "total_steps": 29667, "loss": 0.3836, "lr": 3.940674414288882e-05, "epoch": 0.616882090825775, "percentage": 20.56, "elapsed_time": "17:16:00", "remaining_time": "2 days, 18:42:34", "throughput": 28793.39, "total_tokens": 1789822336} +{"current_steps": 6110, "total_steps": 29667, "loss": 0.3867, "lr": 3.939451096215668e-05, "epoch": 0.6178933729418828, "percentage": 20.6, "elapsed_time": "17:17:43", "remaining_time": "2 days, 18:40:56", "throughput": 28793.5, "total_tokens": 1792791872} +{"current_steps": 6120, "total_steps": 29667, "loss": 0.387, "lr": 3.938228916712978e-05, "epoch": 0.6189046550579907, "percentage": 20.63, "elapsed_time": "17:19:21", "remaining_time": "2 days, 18:38:59", "throughput": 28795.61, "total_tokens": 1795744512} +{"current_steps": 6130, "total_steps": 29667, "loss": 0.3856, "lr": 3.937007874015748e-05, "epoch": 0.6199159371740985, "percentage": 20.66, "elapsed_time": "17:20:59", "remaining_time": "2 days, 18:37:02", "throughput": 28797.05, 
"total_tokens": 1798655168} +{"current_steps": 6140, "total_steps": 29667, "loss": 0.3847, "lr": 3.935787966362748e-05, "epoch": 0.6209272192902063, "percentage": 20.7, "elapsed_time": "17:22:38", "remaining_time": "2 days, 18:35:10", "throughput": 28798.48, "total_tokens": 1801603328} +{"current_steps": 6150, "total_steps": 29667, "loss": 0.3846, "lr": 3.9345691919965595e-05, "epoch": 0.6219385014063142, "percentage": 20.73, "elapsed_time": "17:24:15", "remaining_time": "2 days, 18:33:08", "throughput": 28799.68, "total_tokens": 1804461824} +{"current_steps": 6160, "total_steps": 29667, "loss": 0.3811, "lr": 3.9333515491635764e-05, "epoch": 0.622949783522422, "percentage": 20.76, "elapsed_time": "17:25:53", "remaining_time": "2 days, 18:31:12", "throughput": 28802.07, "total_tokens": 1807433600} +{"current_steps": 6170, "total_steps": 29667, "loss": 0.3795, "lr": 3.932135036113987e-05, "epoch": 0.6239610656385298, "percentage": 20.8, "elapsed_time": "17:27:29", "remaining_time": "2 days, 18:29:06", "throughput": 28804.53, "total_tokens": 1810346048} +{"current_steps": 6180, "total_steps": 29667, "loss": 0.385, "lr": 3.930919651101764e-05, "epoch": 0.6249723477546377, "percentage": 20.83, "elapsed_time": "17:29:10", "remaining_time": "2 days, 18:27:22", "throughput": 28805.28, "total_tokens": 1813308352} +{"current_steps": 6190, "total_steps": 29667, "loss": 0.3823, "lr": 3.9297053923846576e-05, "epoch": 0.6259836298707455, "percentage": 20.86, "elapsed_time": "17:30:45", "remaining_time": "2 days, 18:25:16", "throughput": 28807.64, "total_tokens": 1816205376} +{"current_steps": 6200, "total_steps": 29667, "loss": 0.3835, "lr": 3.928492258224183e-05, "epoch": 0.6269949119868533, "percentage": 20.9, "elapsed_time": "17:32:23", "remaining_time": "2 days, 18:23:18", "throughput": 28809.92, "total_tokens": 1819158720} +{"current_steps": 6210, "total_steps": 29667, "loss": 0.3813, "lr": 3.927280246885609e-05, "epoch": 0.6280061941029612, "percentage": 20.93, 
"elapsed_time": "17:34:01", "remaining_time": "2 days, 18:21:23", "throughput": 28811.64, "total_tokens": 1822105280} +{"current_steps": 6220, "total_steps": 29667, "loss": 0.3845, "lr": 3.9260693566379486e-05, "epoch": 0.629017476219069, "percentage": 20.97, "elapsed_time": "17:35:41", "remaining_time": "2 days, 18:19:33", "throughput": 28813.31, "total_tokens": 1825078464} +{"current_steps": 6230, "total_steps": 29667, "loss": 0.3775, "lr": 3.924859585753948e-05, "epoch": 0.6300287583351768, "percentage": 21.0, "elapsed_time": "17:37:23", "remaining_time": "2 days, 18:17:50", "throughput": 28813.99, "total_tokens": 1828051456} +{"current_steps": 6240, "total_steps": 29667, "loss": 0.3835, "lr": 3.923650932510079e-05, "epoch": 0.6310400404512846, "percentage": 21.03, "elapsed_time": "17:38:58", "remaining_time": "2 days, 18:15:46", "throughput": 28815.96, "total_tokens": 1830937280} +{"current_steps": 6250, "total_steps": 29667, "loss": 0.384, "lr": 3.9224433951865215e-05, "epoch": 0.6320513225673925, "percentage": 21.07, "elapsed_time": "17:40:34", "remaining_time": "2 days, 18:13:41", "throughput": 28817.85, "total_tokens": 1833814912} +{"current_steps": 6260, "total_steps": 29667, "loss": 0.3871, "lr": 3.921236972067165e-05, "epoch": 0.6330626046835003, "percentage": 21.1, "elapsed_time": "17:42:13", "remaining_time": "2 days, 18:11:48", "throughput": 28819.18, "total_tokens": 1836751808} +{"current_steps": 6270, "total_steps": 29667, "loss": 0.3797, "lr": 3.920031661439585e-05, "epoch": 0.6340738867996081, "percentage": 21.13, "elapsed_time": "17:43:50", "remaining_time": "2 days, 18:09:49", "throughput": 28821.27, "total_tokens": 1839686400} +{"current_steps": 6280, "total_steps": 29667, "loss": 0.3835, "lr": 3.918827461595045e-05, "epoch": 0.635085168915716, "percentage": 21.17, "elapsed_time": "17:45:24", "remaining_time": "2 days, 18:07:38", "throughput": 28824.11, "total_tokens": 1842574400} +{"current_steps": 6290, "total_steps": 29667, "loss": 0.3844, 
"lr": 3.9176243708284746e-05, "epoch": 0.6360964510318238, "percentage": 21.2, "elapsed_time": "17:47:03", "remaining_time": "2 days, 18:05:44", "throughput": 28825.25, "total_tokens": 1845486400} +{"current_steps": 6300, "total_steps": 29667, "loss": 0.3828, "lr": 3.9164223874384715e-05, "epoch": 0.6371077331479316, "percentage": 21.24, "elapsed_time": "17:48:42", "remaining_time": "2 days, 18:03:53", "throughput": 28826.99, "total_tokens": 1848459776} +{"current_steps": 6310, "total_steps": 29667, "loss": 0.3846, "lr": 3.91522150972728e-05, "epoch": 0.6381190152640395, "percentage": 21.27, "elapsed_time": "17:50:19", "remaining_time": "2 days, 18:01:52", "throughput": 28828.88, "total_tokens": 1851363968} +{"current_steps": 6320, "total_steps": 29667, "loss": 0.3846, "lr": 3.9140217360007896e-05, "epoch": 0.6391302973801473, "percentage": 21.3, "elapsed_time": "17:51:56", "remaining_time": "2 days, 17:59:55", "throughput": 28830.66, "total_tokens": 1854295744} +{"current_steps": 6330, "total_steps": 29667, "loss": 0.3827, "lr": 3.912823064568521e-05, "epoch": 0.640141579496255, "percentage": 21.34, "elapsed_time": "17:53:33", "remaining_time": "2 days, 17:57:54", "throughput": 28832.51, "total_tokens": 1857198208} +{"current_steps": 6340, "total_steps": 29667, "loss": 0.3825, "lr": 3.9116254937436155e-05, "epoch": 0.641152861612363, "percentage": 21.37, "elapsed_time": "17:55:12", "remaining_time": "2 days, 17:56:03", "throughput": 28833.56, "total_tokens": 1860128896} +{"current_steps": 6350, "total_steps": 29667, "loss": 0.3842, "lr": 3.910429021842825e-05, "epoch": 0.6421641437284707, "percentage": 21.4, "elapsed_time": "17:56:53", "remaining_time": "2 days, 17:54:17", "throughput": 28834.65, "total_tokens": 1863096896} +{"current_steps": 6360, "total_steps": 29667, "loss": 0.3835, "lr": 3.9092336471865084e-05, "epoch": 0.6431754258445785, "percentage": 21.44, "elapsed_time": "17:58:28", "remaining_time": "2 days, 17:52:11", "throughput": 28837.24, 
"total_tokens": 1866006016} +{"current_steps": 6370, "total_steps": 29667, "loss": 0.3871, "lr": 3.908039368098611e-05, "epoch": 0.6441867079606864, "percentage": 21.47, "elapsed_time": "18:00:06", "remaining_time": "2 days, 17:50:15", "throughput": 28838.96, "total_tokens": 1868944960} +{"current_steps": 6380, "total_steps": 29667, "loss": 0.3805, "lr": 3.9068461829066633e-05, "epoch": 0.6451979900767942, "percentage": 21.51, "elapsed_time": "18:01:40", "remaining_time": "2 days, 17:48:07", "throughput": 28841.62, "total_tokens": 1871844096} +{"current_steps": 6390, "total_steps": 29667, "loss": 0.3901, "lr": 3.9056540899417656e-05, "epoch": 0.646209272192902, "percentage": 21.54, "elapsed_time": "18:03:19", "remaining_time": "2 days, 17:46:16", "throughput": 28842.85, "total_tokens": 1874781952} +{"current_steps": 6400, "total_steps": 29667, "loss": 0.3802, "lr": 3.904463087538585e-05, "epoch": 0.6472205543090099, "percentage": 21.57, "elapsed_time": "18:04:56", "remaining_time": "2 days, 17:44:14", "throughput": 28845.01, "total_tokens": 1877696640} +{"current_steps": 6410, "total_steps": 29667, "loss": 0.3847, "lr": 3.903273174035336e-05, "epoch": 0.6482318364251177, "percentage": 21.61, "elapsed_time": "18:06:35", "remaining_time": "2 days, 17:42:24", "throughput": 28845.88, "total_tokens": 1880615680} +{"current_steps": 6420, "total_steps": 29667, "loss": 0.3846, "lr": 3.902084347773779e-05, "epoch": 0.6492431185412255, "percentage": 21.64, "elapsed_time": "18:08:12", "remaining_time": "2 days, 17:40:26", "throughput": 28847.35, "total_tokens": 1883517696} +{"current_steps": 6430, "total_steps": 29667, "loss": 0.384, "lr": 3.900896607099207e-05, "epoch": 0.6502544006573334, "percentage": 21.67, "elapsed_time": "18:09:51", "remaining_time": "2 days, 17:38:34", "throughput": 28848.52, "total_tokens": 1886449536} +{"current_steps": 6440, "total_steps": 29667, "loss": 0.3742, "lr": 3.899709950360437e-05, "epoch": 0.6512656827734412, "percentage": 21.71, 
"elapsed_time": "18:11:33", "remaining_time": "2 days, 17:36:54", "throughput": 28849.2, "total_tokens": 1889437952} +{"current_steps": 6450, "total_steps": 29667, "loss": 0.38, "lr": 3.8985243759097997e-05, "epoch": 0.652276964889549, "percentage": 21.74, "elapsed_time": "18:13:09", "remaining_time": "2 days, 17:34:51", "throughput": 28850.95, "total_tokens": 1892318080} +{"current_steps": 6460, "total_steps": 29667, "loss": 0.3849, "lr": 3.897339882103129e-05, "epoch": 0.6532882470056569, "percentage": 21.78, "elapsed_time": "18:14:45", "remaining_time": "2 days, 17:32:49", "throughput": 28853.03, "total_tokens": 1895225920} +{"current_steps": 6470, "total_steps": 29667, "loss": 0.383, "lr": 3.8961564672997544e-05, "epoch": 0.6542995291217647, "percentage": 21.81, "elapsed_time": "18:16:23", "remaining_time": "2 days, 17:30:52", "throughput": 28854.9, "total_tokens": 1898162240} +{"current_steps": 6480, "total_steps": 29667, "loss": 0.3859, "lr": 3.8949741298624924e-05, "epoch": 0.6553108112378725, "percentage": 21.84, "elapsed_time": "18:18:01", "remaining_time": "2 days, 17:28:59", "throughput": 28855.99, "total_tokens": 1901071104} +{"current_steps": 6490, "total_steps": 29667, "loss": 0.3846, "lr": 3.8937928681576305e-05, "epoch": 0.6563220933539804, "percentage": 21.88, "elapsed_time": "18:19:38", "remaining_time": "2 days, 17:27:03", "throughput": 28857.77, "total_tokens": 1904005056} +{"current_steps": 6500, "total_steps": 29667, "loss": 0.3856, "lr": 3.8926126805549276e-05, "epoch": 0.6573333754700882, "percentage": 21.91, "elapsed_time": "18:21:18", "remaining_time": "2 days, 17:25:12", "throughput": 28858.97, "total_tokens": 1906945344} +{"current_steps": 6510, "total_steps": 29667, "loss": 0.3825, "lr": 3.891433565427596e-05, "epoch": 0.658344657586196, "percentage": 21.94, "elapsed_time": "18:22:54", "remaining_time": "2 days, 17:23:13", "throughput": 28860.44, "total_tokens": 1909838016} +{"current_steps": 6520, "total_steps": 29667, "loss": 0.3853, 
"lr": 3.8902555211522964e-05, "epoch": 0.6593559397023038, "percentage": 21.98, "elapsed_time": "18:24:28", "remaining_time": "2 days, 17:21:04", "throughput": 28862.91, "total_tokens": 1912714816} +{"current_steps": 6530, "total_steps": 29667, "loss": 0.3801, "lr": 3.889078546109127e-05, "epoch": 0.6603672218184117, "percentage": 22.01, "elapsed_time": "18:26:07", "remaining_time": "2 days, 17:19:11", "throughput": 28864.23, "total_tokens": 1915635968} +{"current_steps": 6540, "total_steps": 29667, "loss": 0.3861, "lr": 3.887902638681616e-05, "epoch": 0.6613785039345195, "percentage": 22.04, "elapsed_time": "18:27:50", "remaining_time": "2 days, 17:17:34", "throughput": 28864.22, "total_tokens": 1918612224} +{"current_steps": 6550, "total_steps": 29667, "loss": 0.3811, "lr": 3.886727797256707e-05, "epoch": 0.6623897860506273, "percentage": 22.08, "elapsed_time": "18:29:25", "remaining_time": "2 days, 17:15:29", "throughput": 28866.45, "total_tokens": 1921503680} +{"current_steps": 6560, "total_steps": 29667, "loss": 0.3847, "lr": 3.88555402022476e-05, "epoch": 0.6634010681667352, "percentage": 22.11, "elapsed_time": "18:31:03", "remaining_time": "2 days, 17:13:34", "throughput": 28868.38, "total_tokens": 1924454720} +{"current_steps": 6570, "total_steps": 29667, "loss": 0.3854, "lr": 3.884381305979528e-05, "epoch": 0.664412350282843, "percentage": 22.15, "elapsed_time": "18:32:42", "remaining_time": "2 days, 17:11:44", "throughput": 28869.17, "total_tokens": 1927373440} +{"current_steps": 6580, "total_steps": 29667, "loss": 0.378, "lr": 3.883209652918163e-05, "epoch": 0.6654236323989507, "percentage": 22.18, "elapsed_time": "18:34:24", "remaining_time": "2 days, 17:10:04", "throughput": 28869.42, "total_tokens": 1930338752} +{"current_steps": 6590, "total_steps": 29667, "loss": 0.3816, "lr": 3.8820390594411935e-05, "epoch": 0.6664349145150587, "percentage": 22.21, "elapsed_time": "18:36:00", "remaining_time": "2 days, 17:08:03", "throughput": 28871.06, 
"total_tokens": 1933217216} +{"current_steps": 6600, "total_steps": 29667, "loss": 0.3837, "lr": 3.880869523952524e-05, "epoch": 0.6674461966311664, "percentage": 22.25, "elapsed_time": "18:37:36", "remaining_time": "2 days, 17:06:03", "throughput": 28873.34, "total_tokens": 1936154368} +{"current_steps": 6610, "total_steps": 29667, "loss": 0.3797, "lr": 3.879701044859422e-05, "epoch": 0.6684574787472742, "percentage": 22.28, "elapsed_time": "18:39:12", "remaining_time": "2 days, 17:04:01", "throughput": 28875.08, "total_tokens": 1939033536} +{"current_steps": 6620, "total_steps": 29667, "loss": 0.3817, "lr": 3.87853362057251e-05, "epoch": 0.6694687608633821, "percentage": 22.31, "elapsed_time": "18:40:51", "remaining_time": "2 days, 17:02:10", "throughput": 28876.4, "total_tokens": 1941981824} +{"current_steps": 6630, "total_steps": 29667, "loss": 0.3775, "lr": 3.8773672495057576e-05, "epoch": 0.6704800429794899, "percentage": 22.35, "elapsed_time": "18:42:32", "remaining_time": "2 days, 17:00:28", "throughput": 28877.47, "total_tokens": 1944979968} +{"current_steps": 6640, "total_steps": 29667, "loss": 0.3847, "lr": 3.8762019300764674e-05, "epoch": 0.6714913250955977, "percentage": 22.38, "elapsed_time": "18:44:11", "remaining_time": "2 days, 16:58:35", "throughput": 28878.8, "total_tokens": 1947909120} +{"current_steps": 6650, "total_steps": 29667, "loss": 0.3817, "lr": 3.875037660705273e-05, "epoch": 0.6725026072117056, "percentage": 22.42, "elapsed_time": "18:45:45", "remaining_time": "2 days, 16:56:29", "throughput": 28881.43, "total_tokens": 1950815104} +{"current_steps": 6660, "total_steps": 29667, "loss": 0.3792, "lr": 3.873874439816127e-05, "epoch": 0.6735138893278134, "percentage": 22.45, "elapsed_time": "18:47:21", "remaining_time": "2 days, 16:54:27", "throughput": 28883.78, "total_tokens": 1953738944} +{"current_steps": 6670, "total_steps": 29667, "loss": 0.3793, "lr": 3.872712265836289e-05, "epoch": 0.6745251714439212, "percentage": 22.48, 
"elapsed_time": "18:48:52", "remaining_time": "2 days, 16:52:08", "throughput": 28887.32, "total_tokens": 1956602752} +{"current_steps": 6680, "total_steps": 29667, "loss": 0.3807, "lr": 3.8715511371963225e-05, "epoch": 0.6755364535600291, "percentage": 22.52, "elapsed_time": "18:50:31", "remaining_time": "2 days, 16:50:21", "throughput": 28888.41, "total_tokens": 1959558208} +{"current_steps": 6690, "total_steps": 29667, "loss": 0.3836, "lr": 3.87039105233008e-05, "epoch": 0.6765477356761369, "percentage": 22.55, "elapsed_time": "18:52:13", "remaining_time": "2 days, 16:48:39", "throughput": 28888.91, "total_tokens": 1962527424} +{"current_steps": 6700, "total_steps": 29667, "loss": 0.3785, "lr": 3.8692320096746975e-05, "epoch": 0.6775590177922447, "percentage": 22.58, "elapsed_time": "18:53:47", "remaining_time": "2 days, 16:46:31", "throughput": 28891.29, "total_tokens": 1965399360} +{"current_steps": 6710, "total_steps": 29667, "loss": 0.3802, "lr": 3.868074007670589e-05, "epoch": 0.6785702999083526, "percentage": 22.62, "elapsed_time": "18:55:28", "remaining_time": "2 days, 16:44:48", "throughput": 28891.76, "total_tokens": 1968353600} +{"current_steps": 6720, "total_steps": 29667, "loss": 0.3851, "lr": 3.866917044761428e-05, "epoch": 0.6795815820244604, "percentage": 22.65, "elapsed_time": "18:57:07", "remaining_time": "2 days, 16:42:59", "throughput": 28893.04, "total_tokens": 1971308992} +{"current_steps": 6730, "total_steps": 29667, "loss": 0.3824, "lr": 3.8657611193941486e-05, "epoch": 0.6805928641405682, "percentage": 22.69, "elapsed_time": "18:58:45", "remaining_time": "2 days, 16:41:03", "throughput": 28895.14, "total_tokens": 1974262720} +{"current_steps": 6740, "total_steps": 29667, "loss": 0.382, "lr": 3.8646062300189315e-05, "epoch": 0.6816041462566761, "percentage": 22.72, "elapsed_time": "19:00:27", "remaining_time": "2 days, 16:39:24", "throughput": 28895.56, "total_tokens": 1977241408} +{"current_steps": 6750, "total_steps": 29667, "loss": 
0.3802, "lr": 3.8634523750891984e-05, "epoch": 0.6826154283727839, "percentage": 22.75, "elapsed_time": "19:02:03", "remaining_time": "2 days, 16:37:24", "throughput": 28897.15, "total_tokens": 1980132160} +{"current_steps": 6760, "total_steps": 29667, "loss": 0.379, "lr": 3.862299553061597e-05, "epoch": 0.6836267104888917, "percentage": 22.79, "elapsed_time": "19:03:38", "remaining_time": "2 days, 16:35:22", "throughput": 28898.77, "total_tokens": 1982999104} +{"current_steps": 6770, "total_steps": 29667, "loss": 0.3796, "lr": 3.861147762396e-05, "epoch": 0.6846379926049996, "percentage": 22.82, "elapsed_time": "19:05:17", "remaining_time": "2 days, 16:33:30", "throughput": 28900.15, "total_tokens": 1985942784} +{"current_steps": 6780, "total_steps": 29667, "loss": 0.3782, "lr": 3.859997001555494e-05, "epoch": 0.6856492747211074, "percentage": 22.85, "elapsed_time": "19:06:55", "remaining_time": "2 days, 16:31:36", "throughput": 28901.74, "total_tokens": 1988875968} +{"current_steps": 6790, "total_steps": 29667, "loss": 0.3854, "lr": 3.8588472690063676e-05, "epoch": 0.6866605568372152, "percentage": 22.89, "elapsed_time": "19:08:31", "remaining_time": "2 days, 16:29:39", "throughput": 28903.68, "total_tokens": 1991809216} +{"current_steps": 6800, "total_steps": 29667, "loss": 0.3784, "lr": 3.857698563218106e-05, "epoch": 0.687671838953323, "percentage": 22.92, "elapsed_time": "19:10:05", "remaining_time": "2 days, 16:27:30", "throughput": 28906.08, "total_tokens": 1994675904} +{"current_steps": 6810, "total_steps": 29667, "loss": 0.3778, "lr": 3.8565508826633836e-05, "epoch": 0.6886831210694309, "percentage": 22.95, "elapsed_time": "19:11:42", "remaining_time": "2 days, 16:25:35", "throughput": 28908.25, "total_tokens": 1997635904} +{"current_steps": 6820, "total_steps": 29667, "loss": 0.3821, "lr": 3.855404225818049e-05, "epoch": 0.6896944031855387, "percentage": 22.99, "elapsed_time": "19:13:14", "remaining_time": "2 days, 16:23:23", "throughput": 28911.43, 
"total_tokens": 2000525312} +{"current_steps": 6830, "total_steps": 29667, "loss": 0.3777, "lr": 3.8542585911611286e-05, "epoch": 0.6907056853016464, "percentage": 23.02, "elapsed_time": "19:14:54", "remaining_time": "2 days, 16:21:35", "throughput": 28912.53, "total_tokens": 2003482304} +{"current_steps": 6840, "total_steps": 29667, "loss": 0.3804, "lr": 3.853113977174803e-05, "epoch": 0.6917169674177543, "percentage": 23.06, "elapsed_time": "19:16:37", "remaining_time": "2 days, 16:19:59", "throughput": 28912.71, "total_tokens": 2006475520} +{"current_steps": 6850, "total_steps": 29667, "loss": 0.3799, "lr": 3.851970382344411e-05, "epoch": 0.6927282495338621, "percentage": 23.09, "elapsed_time": "19:18:15", "remaining_time": "2 days, 16:18:05", "throughput": 28914.06, "total_tokens": 2009396544} +{"current_steps": 6860, "total_steps": 29667, "loss": 0.3817, "lr": 3.850827805158433e-05, "epoch": 0.6937395316499699, "percentage": 23.12, "elapsed_time": "19:19:58", "remaining_time": "2 days, 16:16:30", "throughput": 28914.19, "total_tokens": 2012390976} +{"current_steps": 6870, "total_steps": 29667, "loss": 0.3797, "lr": 3.8496862441084896e-05, "epoch": 0.6947508137660778, "percentage": 23.16, "elapsed_time": "19:21:36", "remaining_time": "2 days, 16:14:36", "throughput": 28915.44, "total_tokens": 2015300224} +{"current_steps": 6880, "total_steps": 29667, "loss": 0.3777, "lr": 3.848545697689328e-05, "epoch": 0.6957620958821856, "percentage": 23.19, "elapsed_time": "19:23:16", "remaining_time": "2 days, 16:12:51", "throughput": 28916.01, "total_tokens": 2018241856} +{"current_steps": 6890, "total_steps": 29667, "loss": 0.3835, "lr": 3.8474061643988136e-05, "epoch": 0.6967733779982934, "percentage": 23.22, "elapsed_time": "19:24:57", "remaining_time": "2 days, 16:11:08", "throughput": 28916.45, "total_tokens": 2021193664} +{"current_steps": 6900, "total_steps": 29667, "loss": 0.3825, "lr": 3.846267642737925e-05, "epoch": 0.6977846601144013, "percentage": 23.26, 
"elapsed_time": "19:26:34", "remaining_time": "2 days, 16:09:10", "throughput": 28918.26, "total_tokens": 2024109952} +{"current_steps": 6910, "total_steps": 29667, "loss": 0.3811, "lr": 3.8451301312107455e-05, "epoch": 0.6987959422305091, "percentage": 23.29, "elapsed_time": "19:28:16", "remaining_time": "2 days, 16:07:30", "throughput": 28918.61, "total_tokens": 2027079296} +{"current_steps": 6920, "total_steps": 29667, "loss": 0.3805, "lr": 3.843993628324451e-05, "epoch": 0.6998072243466169, "percentage": 23.33, "elapsed_time": "19:29:54", "remaining_time": "2 days, 16:05:38", "throughput": 28920.1, "total_tokens": 2030025984} +{"current_steps": 6930, "total_steps": 29667, "loss": 0.3793, "lr": 3.8428581325893034e-05, "epoch": 0.7008185064627248, "percentage": 23.36, "elapsed_time": "19:31:32", "remaining_time": "2 days, 16:03:45", "throughput": 28921.78, "total_tokens": 2032974848} +{"current_steps": 6940, "total_steps": 29667, "loss": 0.3839, "lr": 3.8417236425186484e-05, "epoch": 0.7018297885788326, "percentage": 23.39, "elapsed_time": "19:33:08", "remaining_time": "2 days, 16:01:48", "throughput": 28923.6, "total_tokens": 2035898688} +{"current_steps": 6950, "total_steps": 29667, "loss": 0.3816, "lr": 3.840590156628895e-05, "epoch": 0.7028410706949404, "percentage": 23.43, "elapsed_time": "19:34:48", "remaining_time": "2 days, 16:00:00", "throughput": 28925.0, "total_tokens": 2038872512} +{"current_steps": 6960, "total_steps": 29667, "loss": 0.3778, "lr": 3.8394576734395205e-05, "epoch": 0.7038523528110483, "percentage": 23.46, "elapsed_time": "19:36:27", "remaining_time": "2 days, 15:58:10", "throughput": 28926.44, "total_tokens": 2041835072} +{"current_steps": 6970, "total_steps": 29667, "loss": 0.3815, "lr": 3.838326191473054e-05, "epoch": 0.7048636349271561, "percentage": 23.49, "elapsed_time": "19:38:03", "remaining_time": "2 days, 15:56:13", "throughput": 28928.08, "total_tokens": 2044744832} +{"current_steps": 6980, "total_steps": 29667, "loss": 
0.3784, "lr": 3.837195709255069e-05, "epoch": 0.7058749170432639, "percentage": 23.53, "elapsed_time": "19:39:40", "remaining_time": "2 days, 15:54:15", "throughput": 28930.0, "total_tokens": 2047669120} +{"current_steps": 6990, "total_steps": 29667, "loss": 0.3858, "lr": 3.8360662253141796e-05, "epoch": 0.7068861991593718, "percentage": 23.56, "elapsed_time": "19:41:24", "remaining_time": "2 days, 15:52:42", "throughput": 28929.81, "total_tokens": 2050663552} +{"current_steps": 7000, "total_steps": 29667, "loss": 0.381, "lr": 3.834937738182029e-05, "epoch": 0.7078974812754796, "percentage": 23.6, "elapsed_time": "19:43:03", "remaining_time": "2 days, 15:50:53", "throughput": 28930.94, "total_tokens": 2053611008} +{"current_steps": 7010, "total_steps": 29667, "loss": 0.3805, "lr": 3.833810246393281e-05, "epoch": 0.7089087633915874, "percentage": 23.63, "elapsed_time": "19:44:39", "remaining_time": "2 days, 15:48:55", "throughput": 28932.82, "total_tokens": 2056529664} +{"current_steps": 7020, "total_steps": 29667, "loss": 0.3823, "lr": 3.832683748485616e-05, "epoch": 0.7099200455076953, "percentage": 23.66, "elapsed_time": "19:46:17", "remaining_time": "2 days, 15:47:03", "throughput": 28934.49, "total_tokens": 2059484864} +{"current_steps": 7030, "total_steps": 29667, "loss": 0.3776, "lr": 3.8315582429997184e-05, "epoch": 0.7109313276238031, "percentage": 23.7, "elapsed_time": "19:47:50", "remaining_time": "2 days, 15:44:55", "throughput": 28938.06, "total_tokens": 2062434880} +{"current_steps": 7040, "total_steps": 29667, "loss": 0.3812, "lr": 3.830433728479272e-05, "epoch": 0.7119426097399109, "percentage": 23.73, "elapsed_time": "19:49:27", "remaining_time": "2 days, 15:42:58", "throughput": 28939.92, "total_tokens": 2065364032} +{"current_steps": 7050, "total_steps": 29667, "loss": 0.3822, "lr": 3.829310203470948e-05, "epoch": 0.7129538918560188, "percentage": 23.76, "elapsed_time": "19:51:10", "remaining_time": "2 days, 15:41:23", "throughput": 28939.7, 
"total_tokens": 2068334272} +{"current_steps": 7060, "total_steps": 29667, "loss": 0.376, "lr": 3.828187666524403e-05, "epoch": 0.7139651739721266, "percentage": 23.8, "elapsed_time": "19:52:46", "remaining_time": "2 days, 15:39:24", "throughput": 28941.35, "total_tokens": 2071223616} +{"current_steps": 7070, "total_steps": 29667, "loss": 0.3848, "lr": 3.827066116192266e-05, "epoch": 0.7149764560882343, "percentage": 23.83, "elapsed_time": "19:54:27", "remaining_time": "2 days, 15:37:41", "throughput": 28942.21, "total_tokens": 2074210176} +{"current_steps": 7080, "total_steps": 29667, "loss": 0.3754, "lr": 3.825945551030135e-05, "epoch": 0.7159877382043421, "percentage": 23.86, "elapsed_time": "19:56:03", "remaining_time": "2 days, 15:35:44", "throughput": 28944.15, "total_tokens": 2077141696} +{"current_steps": 7090, "total_steps": 29667, "loss": 0.3843, "lr": 3.824825969596561e-05, "epoch": 0.71699902032045, "percentage": 23.9, "elapsed_time": "19:57:41", "remaining_time": "2 days, 15:33:50", "throughput": 28945.47, "total_tokens": 2080054464} +{"current_steps": 7100, "total_steps": 29667, "loss": 0.3743, "lr": 3.823707370453054e-05, "epoch": 0.7180103024365578, "percentage": 23.93, "elapsed_time": "19:59:18", "remaining_time": "2 days, 15:31:56", "throughput": 28947.16, "total_tokens": 2082993152} +{"current_steps": 7110, "total_steps": 29667, "loss": 0.3802, "lr": 3.8225897521640614e-05, "epoch": 0.7190215845526656, "percentage": 23.97, "elapsed_time": "20:00:58", "remaining_time": "2 days, 15:30:09", "throughput": 28948.05, "total_tokens": 2085939968} +{"current_steps": 7120, "total_steps": 29667, "loss": 0.3826, "lr": 3.8214731132969675e-05, "epoch": 0.7200328666687735, "percentage": 24.0, "elapsed_time": "20:02:40", "remaining_time": "2 days, 15:28:30", "throughput": 28947.97, "total_tokens": 2088893120} +{"current_steps": 7130, "total_steps": 29667, "loss": 0.3818, "lr": 3.820357452422084e-05, "epoch": 0.7210441487848813, "percentage": 24.03, 
"elapsed_time": "20:04:19", "remaining_time": "2 days, 15:26:42", "throughput": 28948.85, "total_tokens": 2091823488} +{"current_steps": 7140, "total_steps": 29667, "loss": 0.38, "lr": 3.8192427681126445e-05, "epoch": 0.7220554309009891, "percentage": 24.07, "elapsed_time": "20:05:58", "remaining_time": "2 days, 15:24:54", "throughput": 28950.11, "total_tokens": 2094791936} +{"current_steps": 7150, "total_steps": 29667, "loss": 0.3803, "lr": 3.818129058944793e-05, "epoch": 0.723066713017097, "percentage": 24.1, "elapsed_time": "20:07:39", "remaining_time": "2 days, 15:23:10", "throughput": 28951.17, "total_tokens": 2097780288} +{"current_steps": 7160, "total_steps": 29667, "loss": 0.3813, "lr": 3.817016323497578e-05, "epoch": 0.7240779951332048, "percentage": 24.13, "elapsed_time": "20:09:21", "remaining_time": "2 days, 15:21:32", "throughput": 28950.96, "total_tokens": 2100725248} +{"current_steps": 7170, "total_steps": 29667, "loss": 0.3751, "lr": 3.8159045603529455e-05, "epoch": 0.7250892772493126, "percentage": 24.17, "elapsed_time": "20:11:01", "remaining_time": "2 days, 15:19:48", "throughput": 28951.71, "total_tokens": 2103685632} +{"current_steps": 7180, "total_steps": 29667, "loss": 0.3762, "lr": 3.8147937680957334e-05, "epoch": 0.7261005593654205, "percentage": 24.2, "elapsed_time": "20:12:44", "remaining_time": "2 days, 15:18:10", "throughput": 28952.39, "total_tokens": 2106700992} +{"current_steps": 7190, "total_steps": 29667, "loss": 0.377, "lr": 3.813683945313658e-05, "epoch": 0.7271118414815283, "percentage": 24.24, "elapsed_time": "20:14:25", "remaining_time": "2 days, 15:16:27", "throughput": 28952.83, "total_tokens": 2109656896} +{"current_steps": 7200, "total_steps": 29667, "loss": 0.3775, "lr": 3.812575090597313e-05, "epoch": 0.7281231235976361, "percentage": 24.27, "elapsed_time": "20:16:00", "remaining_time": "2 days, 15:14:27", "throughput": 28954.79, "total_tokens": 2112558848} +{"current_steps": 7210, "total_steps": 29667, "loss": 0.382, 
"lr": 3.811467202540156e-05, "epoch": 0.729134405713744, "percentage": 24.3, "elapsed_time": "20:17:40", "remaining_time": "2 days, 15:12:41", "throughput": 28955.5, "total_tokens": 2115502912} +{"current_steps": 7220, "total_steps": 29667, "loss": 0.3761, "lr": 3.810360279738507e-05, "epoch": 0.7301456878298518, "percentage": 24.34, "elapsed_time": "20:19:21", "remaining_time": "2 days, 15:11:00", "throughput": 28956.17, "total_tokens": 2118488064} +{"current_steps": 7230, "total_steps": 29667, "loss": 0.3747, "lr": 3.809254320791535e-05, "epoch": 0.7311569699459596, "percentage": 24.37, "elapsed_time": "20:21:01", "remaining_time": "2 days, 15:09:12", "throughput": 28957.1, "total_tokens": 2121426304} +{"current_steps": 7240, "total_steps": 29667, "loss": 0.3811, "lr": 3.808149324301256e-05, "epoch": 0.7321682520620675, "percentage": 24.4, "elapsed_time": "20:22:38", "remaining_time": "2 days, 15:07:18", "throughput": 28958.57, "total_tokens": 2124348416} +{"current_steps": 7250, "total_steps": 29667, "loss": 0.383, "lr": 3.807045288872522e-05, "epoch": 0.7331795341781753, "percentage": 24.44, "elapsed_time": "20:24:13", "remaining_time": "2 days, 15:05:18", "throughput": 28960.57, "total_tokens": 2127256512} +{"current_steps": 7260, "total_steps": 29667, "loss": 0.3819, "lr": 3.805942213113015e-05, "epoch": 0.7341908162942831, "percentage": 24.47, "elapsed_time": "20:25:51", "remaining_time": "2 days, 15:03:26", "throughput": 28961.97, "total_tokens": 2130193408} +{"current_steps": 7270, "total_steps": 29667, "loss": 0.3793, "lr": 3.8048400956332385e-05, "epoch": 0.735202098410391, "percentage": 24.51, "elapsed_time": "20:27:32", "remaining_time": "2 days, 15:01:44", "throughput": 28962.3, "total_tokens": 2133145536} +{"current_steps": 7280, "total_steps": 29667, "loss": 0.374, "lr": 3.803738935046512e-05, "epoch": 0.7362133805264988, "percentage": 24.54, "elapsed_time": "20:29:11", "remaining_time": "2 days, 14:59:55", "throughput": 28963.54, "total_tokens": 
2136096128} +{"current_steps": 7290, "total_steps": 29667, "loss": 0.3779, "lr": 3.802638729968962e-05, "epoch": 0.7372246626426066, "percentage": 24.57, "elapsed_time": "20:30:51", "remaining_time": "2 days, 14:58:10", "throughput": 28964.34, "total_tokens": 2139061312} +{"current_steps": 7300, "total_steps": 29667, "loss": 0.3808, "lr": 3.8015394790195145e-05, "epoch": 0.7382359447587145, "percentage": 24.61, "elapsed_time": "20:32:30", "remaining_time": "2 days, 14:56:22", "throughput": 28964.91, "total_tokens": 2141971456} +{"current_steps": 7310, "total_steps": 29667, "loss": 0.3781, "lr": 3.800441180819891e-05, "epoch": 0.7392472268748222, "percentage": 24.64, "elapsed_time": "20:34:07", "remaining_time": "2 days, 14:54:27", "throughput": 28966.54, "total_tokens": 2144894400} +{"current_steps": 7320, "total_steps": 29667, "loss": 0.3858, "lr": 3.7993438339945965e-05, "epoch": 0.74025850899093, "percentage": 24.67, "elapsed_time": "20:35:46", "remaining_time": "2 days, 14:52:38", "throughput": 28966.99, "total_tokens": 2147793600} +{"current_steps": 7330, "total_steps": 29667, "loss": 0.3791, "lr": 3.798247437170914e-05, "epoch": 0.741269791107038, "percentage": 24.71, "elapsed_time": "20:37:27", "remaining_time": "2 days, 14:50:56", "throughput": 28967.55, "total_tokens": 2150758080} +{"current_steps": 7340, "total_steps": 29667, "loss": 0.3792, "lr": 3.797151988978901e-05, "epoch": 0.7422810732231457, "percentage": 24.74, "elapsed_time": "20:39:07", "remaining_time": "2 days, 14:49:11", "throughput": 28968.25, "total_tokens": 2153709184} +{"current_steps": 7350, "total_steps": 29667, "loss": 0.3791, "lr": 3.796057488051377e-05, "epoch": 0.7432923553392535, "percentage": 24.78, "elapsed_time": "20:40:45", "remaining_time": "2 days, 14:47:22", "throughput": 28968.94, "total_tokens": 2156620608} +{"current_steps": 7360, "total_steps": 29667, "loss": 0.3782, "lr": 3.794963933023918e-05, "epoch": 0.7443036374553613, "percentage": 24.81, "elapsed_time": 
"20:42:23", "remaining_time": "2 days, 14:45:29", "throughput": 28970.18, "total_tokens": 2159533696} +{"current_steps": 7370, "total_steps": 29667, "loss": 0.3792, "lr": 3.79387132253485e-05, "epoch": 0.7453149195714692, "percentage": 24.84, "elapsed_time": "20:43:58", "remaining_time": "2 days, 14:43:30", "throughput": 28972.0, "total_tokens": 2162438400} +{"current_steps": 7380, "total_steps": 29667, "loss": 0.3758, "lr": 3.792779655225243e-05, "epoch": 0.746326201687577, "percentage": 24.88, "elapsed_time": "20:45:34", "remaining_time": "2 days, 14:41:33", "throughput": 28973.64, "total_tokens": 2165343104} +{"current_steps": 7390, "total_steps": 29667, "loss": 0.3765, "lr": 3.791688929738902e-05, "epoch": 0.7473374838036848, "percentage": 24.91, "elapsed_time": "20:47:15", "remaining_time": "2 days, 14:39:51", "throughput": 28974.71, "total_tokens": 2168346816} +{"current_steps": 7400, "total_steps": 29667, "loss": 0.3745, "lr": 3.79059914472236e-05, "epoch": 0.7483487659197927, "percentage": 24.94, "elapsed_time": "20:48:55", "remaining_time": "2 days, 14:38:05", "throughput": 28975.64, "total_tokens": 2171306368} +{"current_steps": 7410, "total_steps": 29667, "loss": 0.38, "lr": 3.7895102988248716e-05, "epoch": 0.7493600480359005, "percentage": 24.98, "elapsed_time": "20:50:30", "remaining_time": "2 days, 14:36:05", "throughput": 28977.85, "total_tokens": 2174228800} +{"current_steps": 7420, "total_steps": 29667, "loss": 0.3775, "lr": 3.7884223906984064e-05, "epoch": 0.7503713301520083, "percentage": 25.01, "elapsed_time": "20:52:06", "remaining_time": "2 days, 14:34:07", "throughput": 28979.69, "total_tokens": 2177140416} +{"current_steps": 7430, "total_steps": 29667, "loss": 0.3806, "lr": 3.787335418997641e-05, "epoch": 0.7513826122681162, "percentage": 25.04, "elapsed_time": "20:53:45", "remaining_time": "2 days, 14:32:19", "throughput": 28980.82, "total_tokens": 2180095168} +{"current_steps": 7440, "total_steps": 29667, "loss": 0.3803, "lr": 
3.786249382379952e-05, "epoch": 0.752393894384224, "percentage": 25.08, "elapsed_time": "20:55:22", "remaining_time": "2 days, 14:30:25", "throughput": 28981.82, "total_tokens": 2182981568} +{"current_steps": 7450, "total_steps": 29667, "loss": 0.3786, "lr": 3.785164279505411e-05, "epoch": 0.7534051765003318, "percentage": 25.11, "elapsed_time": "20:57:00", "remaining_time": "2 days, 14:28:34", "throughput": 28982.91, "total_tokens": 2185898112} +{"current_steps": 7460, "total_steps": 29667, "loss": 0.3772, "lr": 3.7840801090367744e-05, "epoch": 0.7544164586164397, "percentage": 25.15, "elapsed_time": "20:58:40", "remaining_time": "2 days, 14:26:51", "throughput": 28983.56, "total_tokens": 2188865536} +{"current_steps": 7470, "total_steps": 29667, "loss": 0.3762, "lr": 3.782996869639479e-05, "epoch": 0.7554277407325475, "percentage": 25.18, "elapsed_time": "21:00:20", "remaining_time": "2 days, 14:25:06", "throughput": 28984.33, "total_tokens": 2191817600} +{"current_steps": 7480, "total_steps": 29667, "loss": 0.3796, "lr": 3.7819145599816354e-05, "epoch": 0.7564390228486553, "percentage": 25.21, "elapsed_time": "21:02:02", "remaining_time": "2 days, 14:23:24", "throughput": 28984.75, "total_tokens": 2194783424} +{"current_steps": 7490, "total_steps": 29667, "loss": 0.3791, "lr": 3.780833178734018e-05, "epoch": 0.7574503049647632, "percentage": 25.25, "elapsed_time": "21:03:42", "remaining_time": "2 days, 14:21:42", "throughput": 28985.39, "total_tokens": 2197753792} +{"current_steps": 7500, "total_steps": 29667, "loss": 0.381, "lr": 3.77975272457006e-05, "epoch": 0.758461587080871, "percentage": 25.28, "elapsed_time": "21:05:23", "remaining_time": "2 days, 14:19:59", "throughput": 28985.83, "total_tokens": 2200703104} +{"current_steps": 7510, "total_steps": 29667, "loss": 0.3755, "lr": 3.778673196165851e-05, "epoch": 0.7594728691969788, "percentage": 25.31, "elapsed_time": "21:07:00", "remaining_time": "2 days, 14:18:04", "throughput": 28987.64, "total_tokens": 
2203643072} +{"current_steps": 7520, "total_steps": 29667, "loss": 0.3765, "lr": 3.7775945922001186e-05, "epoch": 0.7604841513130867, "percentage": 25.35, "elapsed_time": "21:08:40", "remaining_time": "2 days, 14:16:20", "throughput": 28988.1, "total_tokens": 2206587648} +{"current_steps": 7530, "total_steps": 29667, "loss": 0.3761, "lr": 3.776516911354236e-05, "epoch": 0.7614954334291945, "percentage": 25.38, "elapsed_time": "21:10:19", "remaining_time": "2 days, 14:14:33", "throughput": 28989.03, "total_tokens": 2209532352} +{"current_steps": 7540, "total_steps": 29667, "loss": 0.3782, "lr": 3.775440152312205e-05, "epoch": 0.7625067155453022, "percentage": 25.42, "elapsed_time": "21:11:57", "remaining_time": "2 days, 14:12:41", "throughput": 28990.18, "total_tokens": 2212449600} +{"current_steps": 7550, "total_steps": 29667, "loss": 0.38, "lr": 3.774364313760652e-05, "epoch": 0.7635179976614102, "percentage": 25.45, "elapsed_time": "21:13:34", "remaining_time": "2 days, 14:10:49", "throughput": 28991.27, "total_tokens": 2215359104} +{"current_steps": 7560, "total_steps": 29667, "loss": 0.3778, "lr": 3.7732893943888224e-05, "epoch": 0.764529279777518, "percentage": 25.48, "elapsed_time": "21:15:13", "remaining_time": "2 days, 14:09:01", "throughput": 28991.81, "total_tokens": 2218270848} +{"current_steps": 7570, "total_steps": 29667, "loss": 0.3814, "lr": 3.772215392888574e-05, "epoch": 0.7655405618936257, "percentage": 25.52, "elapsed_time": "21:16:50", "remaining_time": "2 days, 14:07:07", "throughput": 28993.26, "total_tokens": 2221186176} +{"current_steps": 7580, "total_steps": 29667, "loss": 0.3781, "lr": 3.771142307954368e-05, "epoch": 0.7665518440097336, "percentage": 25.55, "elapsed_time": "21:18:26", "remaining_time": "2 days, 14:05:11", "throughput": 28994.81, "total_tokens": 2224091904} +{"current_steps": 7590, "total_steps": 29667, "loss": 0.3776, "lr": 3.770070138283264e-05, "epoch": 0.7675631261258414, "percentage": 25.58, "elapsed_time": "21:20:01", 
"remaining_time": "2 days, 14:03:10", "throughput": 28997.03, "total_tokens": 2227000960} +{"current_steps": 7600, "total_steps": 29667, "loss": 0.3779, "lr": 3.768998882574915e-05, "epoch": 0.7685744082419492, "percentage": 25.62, "elapsed_time": "21:21:42", "remaining_time": "2 days, 14:01:30", "throughput": 28997.17, "total_tokens": 2229955136} +{"current_steps": 7610, "total_steps": 29667, "loss": 0.3725, "lr": 3.767928539531557e-05, "epoch": 0.7695856903580571, "percentage": 25.65, "elapsed_time": "21:23:21", "remaining_time": "2 days, 13:59:43", "throughput": 28997.83, "total_tokens": 2232881216} +{"current_steps": 7620, "total_steps": 29667, "loss": 0.3771, "lr": 3.7668591078580055e-05, "epoch": 0.7705969724741649, "percentage": 25.69, "elapsed_time": "21:24:56", "remaining_time": "2 days, 13:57:44", "throughput": 28999.66, "total_tokens": 2235779264} +{"current_steps": 7630, "total_steps": 29667, "loss": 0.3802, "lr": 3.765790586261647e-05, "epoch": 0.7716082545902727, "percentage": 25.72, "elapsed_time": "21:26:32", "remaining_time": "2 days, 13:55:49", "throughput": 29001.3, "total_tokens": 2238695424} +{"current_steps": 7640, "total_steps": 29667, "loss": 0.3807, "lr": 3.7647229734524326e-05, "epoch": 0.7726195367063805, "percentage": 25.75, "elapsed_time": "21:28:11", "remaining_time": "2 days, 13:53:58", "throughput": 29002.6, "total_tokens": 2241640960} +{"current_steps": 7650, "total_steps": 29667, "loss": 0.3754, "lr": 3.7636562681428744e-05, "epoch": 0.7736308188224884, "percentage": 25.79, "elapsed_time": "21:29:51", "remaining_time": "2 days, 13:52:16", "throughput": 29003.13, "total_tokens": 2244607168} +{"current_steps": 7660, "total_steps": 29667, "loss": 0.3832, "lr": 3.7625904690480346e-05, "epoch": 0.7746421009385962, "percentage": 25.82, "elapsed_time": "21:31:31", "remaining_time": "2 days, 13:50:29", "throughput": 29003.64, "total_tokens": 2247522112} +{"current_steps": 7670, "total_steps": 29667, "loss": 0.3788, "lr": 
3.7615255748855224e-05, "epoch": 0.775653383054704, "percentage": 25.85, "elapsed_time": "21:33:07", "remaining_time": "2 days, 13:48:36", "throughput": 29005.4, "total_tokens": 2250464960} +{"current_steps": 7680, "total_steps": 29667, "loss": 0.3778, "lr": 3.7604615843754845e-05, "epoch": 0.7766646651708119, "percentage": 25.89, "elapsed_time": "21:34:48", "remaining_time": "2 days, 13:46:52", "throughput": 29005.68, "total_tokens": 2253401088} +{"current_steps": 7690, "total_steps": 29667, "loss": 0.3822, "lr": 3.759398496240601e-05, "epoch": 0.7776759472869197, "percentage": 25.92, "elapsed_time": "21:36:29", "remaining_time": "2 days, 13:45:10", "throughput": 29006.33, "total_tokens": 2256375360} +{"current_steps": 7700, "total_steps": 29667, "loss": 0.3782, "lr": 3.7583363092060815e-05, "epoch": 0.7786872294030275, "percentage": 25.95, "elapsed_time": "21:38:10", "remaining_time": "2 days, 13:43:29", "throughput": 29006.45, "total_tokens": 2259313472} +{"current_steps": 7710, "total_steps": 29667, "loss": 0.3797, "lr": 3.757275021999649e-05, "epoch": 0.7796985115191354, "percentage": 25.99, "elapsed_time": "21:39:48", "remaining_time": "2 days, 13:41:39", "throughput": 29007.42, "total_tokens": 2262231680} +{"current_steps": 7720, "total_steps": 29667, "loss": 0.3786, "lr": 3.7562146333515445e-05, "epoch": 0.7807097936352432, "percentage": 26.02, "elapsed_time": "21:41:26", "remaining_time": "2 days, 13:39:50", "throughput": 29009.01, "total_tokens": 2265213120} +{"current_steps": 7730, "total_steps": 29667, "loss": 0.377, "lr": 3.7551551419945167e-05, "epoch": 0.781721075751351, "percentage": 26.06, "elapsed_time": "21:43:07", "remaining_time": "2 days, 13:38:07", "throughput": 29009.97, "total_tokens": 2268204416} +{"current_steps": 7740, "total_steps": 29667, "loss": 0.3785, "lr": 3.7540965466638104e-05, "epoch": 0.7827323578674589, "percentage": 26.09, "elapsed_time": "21:44:46", "remaining_time": "2 days, 13:36:21", "throughput": 29010.53, 
"total_tokens": 2271136000} +{"current_steps": 7750, "total_steps": 29667, "loss": 0.3789, "lr": 3.753038846097172e-05, "epoch": 0.7837436399835667, "percentage": 26.12, "elapsed_time": "21:46:25", "remaining_time": "2 days, 13:34:33", "throughput": 29011.64, "total_tokens": 2274083328} +{"current_steps": 7760, "total_steps": 29667, "loss": 0.3827, "lr": 3.751982039034827e-05, "epoch": 0.7847549220996745, "percentage": 26.16, "elapsed_time": "21:48:02", "remaining_time": "2 days, 13:32:40", "throughput": 29013.06, "total_tokens": 2277004160} +{"current_steps": 7770, "total_steps": 29667, "loss": 0.3801, "lr": 3.75092612421949e-05, "epoch": 0.7857662042157824, "percentage": 26.19, "elapsed_time": "21:49:42", "remaining_time": "2 days, 13:30:57", "throughput": 29013.58, "total_tokens": 2279967936} +{"current_steps": 7780, "total_steps": 29667, "loss": 0.3781, "lr": 3.7498711003963475e-05, "epoch": 0.7867774863318902, "percentage": 26.22, "elapsed_time": "21:51:21", "remaining_time": "2 days, 13:29:10", "throughput": 29014.42, "total_tokens": 2282903936} +{"current_steps": 7790, "total_steps": 29667, "loss": 0.3801, "lr": 3.748816966313058e-05, "epoch": 0.787788768447998, "percentage": 26.26, "elapsed_time": "21:53:01", "remaining_time": "2 days, 13:27:25", "throughput": 29014.95, "total_tokens": 2285837248} +{"current_steps": 7800, "total_steps": 29667, "loss": 0.376, "lr": 3.7477637207197374e-05, "epoch": 0.7888000505641058, "percentage": 26.29, "elapsed_time": "21:54:41", "remaining_time": "2 days, 13:25:39", "throughput": 29016.21, "total_tokens": 2288829120} +{"current_steps": 7810, "total_steps": 29667, "loss": 0.3769, "lr": 3.7467113623689666e-05, "epoch": 0.7898113326802136, "percentage": 26.33, "elapsed_time": "21:56:24", "remaining_time": "2 days, 13:24:04", "throughput": 29016.09, "total_tokens": 2291810496} +{"current_steps": 7820, "total_steps": 29667, "loss": 0.3781, "lr": 3.745659890015768e-05, "epoch": 0.7908226147963214, "percentage": 26.36, 
"elapsed_time": "21:58:02", "remaining_time": "2 days, 13:22:14", "throughput": 29016.79, "total_tokens": 2294714560} +{"current_steps": 7830, "total_steps": 29667, "loss": 0.3764, "lr": 3.744609302417615e-05, "epoch": 0.7918338969124293, "percentage": 26.39, "elapsed_time": "21:59:40", "remaining_time": "2 days, 13:20:24", "throughput": 29018.19, "total_tokens": 2297666176} +{"current_steps": 7840, "total_steps": 29667, "loss": 0.3743, "lr": 3.7435595983344175e-05, "epoch": 0.7928451790285371, "percentage": 26.43, "elapsed_time": "22:01:18", "remaining_time": "2 days, 13:18:36", "throughput": 29019.2, "total_tokens": 2300605696} +{"current_steps": 7850, "total_steps": 29667, "loss": 0.375, "lr": 3.7425107765285155e-05, "epoch": 0.7938564611446449, "percentage": 26.46, "elapsed_time": "22:02:57", "remaining_time": "2 days, 13:16:48", "throughput": 29020.09, "total_tokens": 2303536192} +{"current_steps": 7860, "total_steps": 29667, "loss": 0.3837, "lr": 3.741462835764676e-05, "epoch": 0.7948677432607528, "percentage": 26.49, "elapsed_time": "22:04:34", "remaining_time": "2 days, 13:14:55", "throughput": 29021.15, "total_tokens": 2306431680} +{"current_steps": 7870, "total_steps": 29667, "loss": 0.3772, "lr": 3.740415774810088e-05, "epoch": 0.7958790253768606, "percentage": 26.53, "elapsed_time": "22:06:16", "remaining_time": "2 days, 13:13:18", "throughput": 29021.29, "total_tokens": 2309424064} +{"current_steps": 7880, "total_steps": 29667, "loss": 0.3783, "lr": 3.739369592434351e-05, "epoch": 0.7968903074929684, "percentage": 26.56, "elapsed_time": "22:07:57", "remaining_time": "2 days, 13:11:37", "throughput": 29021.69, "total_tokens": 2312387584} +{"current_steps": 7890, "total_steps": 29667, "loss": 0.3782, "lr": 3.738324287409473e-05, "epoch": 0.7979015896090763, "percentage": 26.6, "elapsed_time": "22:09:34", "remaining_time": "2 days, 13:09:44", "throughput": 29023.66, "total_tokens": 2315355520} +{"current_steps": 7900, "total_steps": 29667, "loss": 0.3764, 
"lr": 3.7372798585098644e-05, "epoch": 0.7989128717251841, "percentage": 26.63, "elapsed_time": "22:11:10", "remaining_time": "2 days, 13:07:48", "throughput": 29024.81, "total_tokens": 2318230848} +{"current_steps": 7910, "total_steps": 29667, "loss": 0.3756, "lr": 3.736236304512331e-05, "epoch": 0.7999241538412919, "percentage": 26.66, "elapsed_time": "22:12:47", "remaining_time": "2 days, 13:05:56", "throughput": 29026.49, "total_tokens": 2321183232} +{"current_steps": 7920, "total_steps": 29667, "loss": 0.3771, "lr": 3.735193624196067e-05, "epoch": 0.8009354359573997, "percentage": 26.7, "elapsed_time": "22:14:27", "remaining_time": "2 days, 13:04:11", "throughput": 29027.16, "total_tokens": 2324126592} +{"current_steps": 7930, "total_steps": 29667, "loss": 0.3777, "lr": 3.7341518163426514e-05, "epoch": 0.8019467180735076, "percentage": 26.73, "elapsed_time": "22:16:02", "remaining_time": "2 days, 13:02:15", "throughput": 29028.51, "total_tokens": 2327008384} +{"current_steps": 7940, "total_steps": 29667, "loss": 0.3764, "lr": 3.73311087973604e-05, "epoch": 0.8029580001896154, "percentage": 26.76, "elapsed_time": "22:17:37", "remaining_time": "2 days, 13:00:16", "throughput": 29030.71, "total_tokens": 2329935360} +{"current_steps": 7950, "total_steps": 29667, "loss": 0.3782, "lr": 3.732070813162561e-05, "epoch": 0.8039692823057232, "percentage": 26.8, "elapsed_time": "22:19:15", "remaining_time": "2 days, 12:58:26", "throughput": 29031.72, "total_tokens": 2332850048} +{"current_steps": 7960, "total_steps": 29667, "loss": 0.3754, "lr": 3.731031615410908e-05, "epoch": 0.8049805644218311, "percentage": 26.83, "elapsed_time": "22:20:52", "remaining_time": "2 days, 12:56:33", "throughput": 29033.73, "total_tokens": 2335825344} +{"current_steps": 7970, "total_steps": 29667, "loss": 0.3782, "lr": 3.729993285272132e-05, "epoch": 0.8059918465379389, "percentage": 26.86, "elapsed_time": "22:22:30", "remaining_time": "2 days, 12:54:45", "throughput": 29034.46, 
"total_tokens": 2338744576} +{"current_steps": 7980, "total_steps": 29667, "loss": 0.3772, "lr": 3.7289558215396414e-05, "epoch": 0.8070031286540467, "percentage": 26.9, "elapsed_time": "22:24:10", "remaining_time": "2 days, 12:53:00", "throughput": 29035.25, "total_tokens": 2341698496} +{"current_steps": 7990, "total_steps": 29667, "loss": 0.3778, "lr": 3.727919223009191e-05, "epoch": 0.8080144107701546, "percentage": 26.93, "elapsed_time": "22:25:49", "remaining_time": "2 days, 12:51:14", "throughput": 29036.02, "total_tokens": 2344636608} +{"current_steps": 8000, "total_steps": 29667, "loss": 0.3733, "lr": 3.726883488478877e-05, "epoch": 0.8090256928862624, "percentage": 26.97, "elapsed_time": "22:27:28", "remaining_time": "2 days, 12:49:27", "throughput": 29036.81, "total_tokens": 2347579648} +{"current_steps": 8010, "total_steps": 29667, "loss": 0.3754, "lr": 3.7258486167491323e-05, "epoch": 0.8100369750023702, "percentage": 27.0, "elapsed_time": "22:29:04", "remaining_time": "2 days, 12:47:32", "throughput": 29038.24, "total_tokens": 2350479488} +{"current_steps": 8020, "total_steps": 29667, "loss": 0.377, "lr": 3.724814606622721e-05, "epoch": 0.811048257118478, "percentage": 27.03, "elapsed_time": "22:30:46", "remaining_time": "2 days, 12:45:53", "throughput": 29038.28, "total_tokens": 2353441856} +{"current_steps": 8030, "total_steps": 29667, "loss": 0.3805, "lr": 3.7237814569047294e-05, "epoch": 0.8120595392345858, "percentage": 27.07, "elapsed_time": "22:32:23", "remaining_time": "2 days, 12:44:02", "throughput": 29039.65, "total_tokens": 2356377216} +{"current_steps": 8040, "total_steps": 29667, "loss": 0.3737, "lr": 3.7227491664025656e-05, "epoch": 0.8130708213506936, "percentage": 27.1, "elapsed_time": "22:34:02", "remaining_time": "2 days, 12:42:15", "throughput": 29040.76, "total_tokens": 2359335552} +{"current_steps": 8050, "total_steps": 29667, "loss": 0.3746, "lr": 3.721717733925948e-05, "epoch": 0.8140821034668015, "percentage": 27.13, 
"elapsed_time": "22:35:35", "remaining_time": "2 days, 12:40:14", "throughput": 29042.88, "total_tokens": 2362228736} +{"current_steps": 8060, "total_steps": 29667, "loss": 0.3749, "lr": 3.720687158286904e-05, "epoch": 0.8150933855829093, "percentage": 27.17, "elapsed_time": "22:37:08", "remaining_time": "2 days, 12:38:11", "throughput": 29045.22, "total_tokens": 2365110720} +{"current_steps": 8070, "total_steps": 29667, "loss": 0.3758, "lr": 3.719657438299762e-05, "epoch": 0.8161046676990171, "percentage": 27.2, "elapsed_time": "22:38:52", "remaining_time": "2 days, 12:36:37", "throughput": 29044.99, "total_tokens": 2368102784} +{"current_steps": 8080, "total_steps": 29667, "loss": 0.3775, "lr": 3.7186285727811446e-05, "epoch": 0.817115949815125, "percentage": 27.24, "elapsed_time": "22:40:33", "remaining_time": "2 days, 12:34:55", "throughput": 29045.36, "total_tokens": 2371064960} +{"current_steps": 8090, "total_steps": 29667, "loss": 0.3784, "lr": 3.717600560549967e-05, "epoch": 0.8181272319312328, "percentage": 27.27, "elapsed_time": "22:42:13", "remaining_time": "2 days, 12:33:14", "throughput": 29045.8, "total_tokens": 2374026496} +{"current_steps": 8100, "total_steps": 29667, "loss": 0.3758, "lr": 3.716573400427426e-05, "epoch": 0.8191385140473406, "percentage": 27.3, "elapsed_time": "22:43:52", "remaining_time": "2 days, 12:31:27", "throughput": 29046.77, "total_tokens": 2376983616} +{"current_steps": 8110, "total_steps": 29667, "loss": 0.3712, "lr": 3.7155470912370004e-05, "epoch": 0.8201497961634485, "percentage": 27.34, "elapsed_time": "22:45:35", "remaining_time": "2 days, 12:29:50", "throughput": 29046.79, "total_tokens": 2379958464} +{"current_steps": 8120, "total_steps": 29667, "loss": 0.3737, "lr": 3.714521631804439e-05, "epoch": 0.8211610782795563, "percentage": 27.37, "elapsed_time": "22:47:11", "remaining_time": "2 days, 12:27:56", "throughput": 29048.5, "total_tokens": 2382895424} +{"current_steps": 8130, "total_steps": 29667, "loss": 0.374, 
"lr": 3.713497020957759e-05, "epoch": 0.8221723603956641, "percentage": 27.4, "elapsed_time": "22:48:55", "remaining_time": "2 days, 12:26:22", "throughput": 29048.63, "total_tokens": 2385915392} +{"current_steps": 8140, "total_steps": 29667, "loss": 0.3806, "lr": 3.712473257527238e-05, "epoch": 0.823183642511772, "percentage": 27.44, "elapsed_time": "22:50:36", "remaining_time": "2 days, 12:24:43", "throughput": 29048.6, "total_tokens": 2388864576} +{"current_steps": 8150, "total_steps": 29667, "loss": 0.3747, "lr": 3.711450340345412e-05, "epoch": 0.8241949246278798, "percentage": 27.47, "elapsed_time": "22:52:15", "remaining_time": "2 days, 12:22:56", "throughput": 29049.57, "total_tokens": 2391818560} +{"current_steps": 8160, "total_steps": 29667, "loss": 0.3688, "lr": 3.710428268247067e-05, "epoch": 0.8252062067439876, "percentage": 27.51, "elapsed_time": "22:53:51", "remaining_time": "2 days, 12:21:02", "throughput": 29051.3, "total_tokens": 2394749504} +{"current_steps": 8170, "total_steps": 29667, "loss": 0.3758, "lr": 3.709407040069233e-05, "epoch": 0.8262174888600955, "percentage": 27.54, "elapsed_time": "22:55:31", "remaining_time": "2 days, 12:19:18", "throughput": 29051.88, "total_tokens": 2397703232} +{"current_steps": 8180, "total_steps": 29667, "loss": 0.373, "lr": 3.708386654651179e-05, "epoch": 0.8272287709762033, "percentage": 27.57, "elapsed_time": "22:57:11", "remaining_time": "2 days, 12:17:33", "throughput": 29052.59, "total_tokens": 2400649536} +{"current_steps": 8190, "total_steps": 29667, "loss": 0.3781, "lr": 3.707367110834409e-05, "epoch": 0.8282400530923111, "percentage": 27.61, "elapsed_time": "22:58:48", "remaining_time": "2 days, 12:15:42", "throughput": 29054.22, "total_tokens": 2403610304} +{"current_steps": 8200, "total_steps": 29667, "loss": 0.3766, "lr": 3.7063484074626555e-05, "epoch": 0.8292513352084189, "percentage": 27.64, "elapsed_time": "23:00:25", "remaining_time": "2 days, 12:13:52", "throughput": 29055.63, 
"total_tokens": 2406560448} +{"current_steps": 8210, "total_steps": 29667, "loss": 0.3763, "lr": 3.7053305433818725e-05, "epoch": 0.8302626173245268, "percentage": 27.67, "elapsed_time": "23:02:01", "remaining_time": "2 days, 12:11:56", "throughput": 29057.21, "total_tokens": 2409459264} +{"current_steps": 8220, "total_steps": 29667, "loss": 0.3742, "lr": 3.704313517440232e-05, "epoch": 0.8312738994406346, "percentage": 27.71, "elapsed_time": "23:03:41", "remaining_time": "2 days, 12:10:14", "throughput": 29057.71, "total_tokens": 2412425088} +{"current_steps": 8230, "total_steps": 29667, "loss": 0.378, "lr": 3.703297328488118e-05, "epoch": 0.8322851815567424, "percentage": 27.74, "elapsed_time": "23:05:20", "remaining_time": "2 days, 12:08:26", "throughput": 29058.87, "total_tokens": 2415375040} +{"current_steps": 8240, "total_steps": 29667, "loss": 0.3734, "lr": 3.70228197537812e-05, "epoch": 0.8332964636728503, "percentage": 27.77, "elapsed_time": "23:06:54", "remaining_time": "2 days, 12:06:29", "throughput": 29060.37, "total_tokens": 2418257920} +{"current_steps": 8250, "total_steps": 29667, "loss": 0.3751, "lr": 3.7012674569650305e-05, "epoch": 0.834307745788958, "percentage": 27.81, "elapsed_time": "23:08:28", "remaining_time": "2 days, 12:04:29", "throughput": 29062.23, "total_tokens": 2421139968} +{"current_steps": 8260, "total_steps": 29667, "loss": 0.3744, "lr": 3.700253772105835e-05, "epoch": 0.8353190279050658, "percentage": 27.84, "elapsed_time": "23:10:05", "remaining_time": "2 days, 12:02:37", "throughput": 29063.56, "total_tokens": 2424064000} +{"current_steps": 8270, "total_steps": 29667, "loss": 0.3729, "lr": 3.699240919659711e-05, "epoch": 0.8363303100211738, "percentage": 27.88, "elapsed_time": "23:11:43", "remaining_time": "2 days, 12:00:49", "throughput": 29064.64, "total_tokens": 2427003136} +{"current_steps": 8280, "total_steps": 29667, "loss": 0.3782, "lr": 3.698228898488019e-05, "epoch": 0.8373415921372815, "percentage": 27.91, 
"elapsed_time": "23:13:23", "remaining_time": "2 days, 11:59:04", "throughput": 29065.44, "total_tokens": 2429958656} +{"current_steps": 8290, "total_steps": 29667, "loss": 0.3728, "lr": 3.6972177074543e-05, "epoch": 0.8383528742533893, "percentage": 27.94, "elapsed_time": "23:15:02", "remaining_time": "2 days, 11:57:19", "throughput": 29066.27, "total_tokens": 2432916544} +{"current_steps": 8300, "total_steps": 29667, "loss": 0.3755, "lr": 3.69620734542427e-05, "epoch": 0.8393641563694972, "percentage": 27.98, "elapsed_time": "23:16:36", "remaining_time": "2 days, 11:55:21", "throughput": 29067.86, "total_tokens": 2435791296} +{"current_steps": 8310, "total_steps": 29667, "loss": 0.3738, "lr": 3.695197811265811e-05, "epoch": 0.840375438485605, "percentage": 28.01, "elapsed_time": "23:18:15", "remaining_time": "2 days, 11:53:33", "throughput": 29068.57, "total_tokens": 2438713536} +{"current_steps": 8320, "total_steps": 29667, "loss": 0.3798, "lr": 3.6941891038489694e-05, "epoch": 0.8413867206017128, "percentage": 28.04, "elapsed_time": "23:19:52", "remaining_time": "2 days, 11:51:44", "throughput": 29069.69, "total_tokens": 2441644096} +{"current_steps": 8330, "total_steps": 29667, "loss": 0.3771, "lr": 3.693181222045952e-05, "epoch": 0.8423980027178207, "percentage": 28.08, "elapsed_time": "23:21:33", "remaining_time": "2 days, 11:50:02", "throughput": 29069.97, "total_tokens": 2444596544} +{"current_steps": 8340, "total_steps": 29667, "loss": 0.3714, "lr": 3.692174164731113e-05, "epoch": 0.8434092848339285, "percentage": 28.11, "elapsed_time": "23:23:08", "remaining_time": "2 days, 11:48:07", "throughput": 29071.54, "total_tokens": 2447498944} +{"current_steps": 8350, "total_steps": 29667, "loss": 0.3724, "lr": 3.6911679307809595e-05, "epoch": 0.8444205669500363, "percentage": 28.15, "elapsed_time": "23:24:47", "remaining_time": "2 days, 11:46:20", "throughput": 29072.68, "total_tokens": 2450459520} +{"current_steps": 8360, "total_steps": 29667, "loss": 0.3771, 
"lr": 3.690162519074137e-05, "epoch": 0.8454318490661442, "percentage": 28.18, "elapsed_time": "23:26:28", "remaining_time": "2 days, 11:44:39", "throughput": 29073.23, "total_tokens": 2453439296} +{"current_steps": 8370, "total_steps": 29667, "loss": 0.3791, "lr": 3.689157928491431e-05, "epoch": 0.846443131182252, "percentage": 28.21, "elapsed_time": "23:28:07", "remaining_time": "2 days, 11:42:52", "throughput": 29073.88, "total_tokens": 2456371136} +{"current_steps": 8380, "total_steps": 29667, "loss": 0.3732, "lr": 3.6881541579157566e-05, "epoch": 0.8474544132983598, "percentage": 28.25, "elapsed_time": "23:29:43", "remaining_time": "2 days, 11:41:00", "throughput": 29075.11, "total_tokens": 2459279296} +{"current_steps": 8390, "total_steps": 29667, "loss": 0.3742, "lr": 3.687151206232154e-05, "epoch": 0.8484656954144677, "percentage": 28.28, "elapsed_time": "23:31:21", "remaining_time": "2 days, 11:39:10", "throughput": 29075.83, "total_tokens": 2462172864} +{"current_steps": 8400, "total_steps": 29667, "loss": 0.3719, "lr": 3.686149072327788e-05, "epoch": 0.8494769775305755, "percentage": 28.31, "elapsed_time": "23:32:56", "remaining_time": "2 days, 11:37:16", "throughput": 29077.76, "total_tokens": 2465115200} +{"current_steps": 8410, "total_steps": 29667, "loss": 0.3748, "lr": 3.685147755091937e-05, "epoch": 0.8504882596466833, "percentage": 28.35, "elapsed_time": "23:34:35", "remaining_time": "2 days, 11:35:30", "throughput": 29078.36, "total_tokens": 2468045184} +{"current_steps": 8420, "total_steps": 29667, "loss": 0.3716, "lr": 3.684147253415992e-05, "epoch": 0.8514995417627912, "percentage": 28.38, "elapsed_time": "23:36:16", "remaining_time": "2 days, 11:33:50", "throughput": 29078.66, "total_tokens": 2471010304} +{"current_steps": 8430, "total_steps": 29667, "loss": 0.3735, "lr": 3.683147566193448e-05, "epoch": 0.852510823878899, "percentage": 28.42, "elapsed_time": "23:37:52", "remaining_time": "2 days, 11:31:55", "throughput": 29080.23, 
"total_tokens": 2473923456} +{"current_steps": 8440, "total_steps": 29667, "loss": 0.3768, "lr": 3.6821486923199025e-05, "epoch": 0.8535221059950068, "percentage": 28.45, "elapsed_time": "23:39:24", "remaining_time": "2 days, 11:29:53", "throughput": 29082.28, "total_tokens": 2476786624} +{"current_steps": 8450, "total_steps": 29667, "loss": 0.372, "lr": 3.681150630693046e-05, "epoch": 0.8545333881111147, "percentage": 28.48, "elapsed_time": "23:41:03", "remaining_time": "2 days, 11:28:07", "throughput": 29082.8, "total_tokens": 2479711296} +{"current_steps": 8460, "total_steps": 29667, "loss": 0.3775, "lr": 3.6801533802126615e-05, "epoch": 0.8555446702272225, "percentage": 28.52, "elapsed_time": "23:42:36", "remaining_time": "2 days, 11:26:06", "throughput": 29085.0, "total_tokens": 2482595072} +{"current_steps": 8470, "total_steps": 29667, "loss": 0.3743, "lr": 3.679156939780617e-05, "epoch": 0.8565559523433303, "percentage": 28.55, "elapsed_time": "23:44:14", "remaining_time": "2 days, 11:24:17", "throughput": 29086.2, "total_tokens": 2485536704} +{"current_steps": 8480, "total_steps": 29667, "loss": 0.3831, "lr": 3.6781613083008594e-05, "epoch": 0.857567234459438, "percentage": 28.58, "elapsed_time": "23:45:54", "remaining_time": "2 days, 11:22:34", "throughput": 29086.97, "total_tokens": 2488513856} +{"current_steps": 8490, "total_steps": 29667, "loss": 0.3813, "lr": 3.677166484679412e-05, "epoch": 0.858578516575546, "percentage": 28.62, "elapsed_time": "23:47:31", "remaining_time": "2 days, 11:20:45", "throughput": 29087.65, "total_tokens": 2491409536} +{"current_steps": 8500, "total_steps": 29667, "loss": 0.3751, "lr": 3.676172467824368e-05, "epoch": 0.8595897986916538, "percentage": 28.65, "elapsed_time": "23:49:09", "remaining_time": "2 days, 11:18:56", "throughput": 29088.38, "total_tokens": 2494314688} +{"current_steps": 8510, "total_steps": 29667, "loss": 0.3748, "lr": 3.675179256645885e-05, "epoch": 0.8606010808077615, "percentage": 28.69, 
"elapsed_time": "23:50:46", "remaining_time": "2 days, 11:17:05", "throughput": 29090.08, "total_tokens": 2497281600} +{"current_steps": 8520, "total_steps": 29667, "loss": 0.3778, "lr": 3.674186850056181e-05, "epoch": 0.8616123629238694, "percentage": 28.72, "elapsed_time": "23:52:26", "remaining_time": "2 days, 11:15:22", "throughput": 29090.77, "total_tokens": 2500246080} +{"current_steps": 8530, "total_steps": 29667, "loss": 0.3734, "lr": 3.67319524696953e-05, "epoch": 0.8626236450399772, "percentage": 28.75, "elapsed_time": "23:54:06", "remaining_time": "2 days, 11:13:39", "throughput": 29091.13, "total_tokens": 2503185856} +{"current_steps": 8540, "total_steps": 29667, "loss": 0.3727, "lr": 3.6722044463022536e-05, "epoch": 0.863634927156085, "percentage": 28.79, "elapsed_time": "23:55:43", "remaining_time": "2 days, 11:11:49", "throughput": 29092.37, "total_tokens": 2506117312} +{"current_steps": 8550, "total_steps": 29667, "loss": 0.3785, "lr": 3.6712144469727214e-05, "epoch": 0.8646462092721929, "percentage": 28.82, "elapsed_time": "23:57:23", "remaining_time": "2 days, 11:10:05", "throughput": 29093.04, "total_tokens": 2509072640} +{"current_steps": 8560, "total_steps": 29667, "loss": 0.3775, "lr": 3.67022524790134e-05, "epoch": 0.8656574913883007, "percentage": 28.85, "elapsed_time": "23:59:01", "remaining_time": "2 days, 11:08:18", "throughput": 29093.74, "total_tokens": 2512003200} +{"current_steps": 8570, "total_steps": 29667, "loss": 0.3704, "lr": 3.6692368480105546e-05, "epoch": 0.8666687735044085, "percentage": 28.89, "elapsed_time": "1 day, 0:00:37", "remaining_time": "2 days, 11:06:24", "throughput": 29095.26, "total_tokens": 2514908224} +{"current_steps": 8580, "total_steps": 29667, "loss": 0.3731, "lr": 3.6682492462248374e-05, "epoch": 0.8676800556205164, "percentage": 28.92, "elapsed_time": "1 day, 0:02:08", "remaining_time": "2 days, 11:04:20", "throughput": 29097.7, "total_tokens": 2517782720} +{"current_steps": 8590, "total_steps": 29667, 
"loss": 0.3778, "lr": 3.667262441470689e-05, "epoch": 0.8686913377366242, "percentage": 28.95, "elapsed_time": "1 day, 0:03:43", "remaining_time": "2 days, 11:02:26", "throughput": 29099.06, "total_tokens": 2520674048} +{"current_steps": 8600, "total_steps": 29667, "loss": 0.3765, "lr": 3.6662764326766255e-05, "epoch": 0.869702619852732, "percentage": 28.99, "elapsed_time": "1 day, 0:05:23", "remaining_time": "2 days, 11:00:43", "throughput": 29100.03, "total_tokens": 2523667200} +{"current_steps": 8610, "total_steps": 29667, "loss": 0.3768, "lr": 3.665291218773185e-05, "epoch": 0.8707139019688399, "percentage": 29.02, "elapsed_time": "1 day, 0:07:02", "remaining_time": "2 days, 10:58:56", "throughput": 29100.78, "total_tokens": 2526602368} +{"current_steps": 8620, "total_steps": 29667, "loss": 0.3744, "lr": 3.664306798692912e-05, "epoch": 0.8717251840849477, "percentage": 29.06, "elapsed_time": "1 day, 0:08:40", "remaining_time": "2 days, 10:57:08", "throughput": 29101.79, "total_tokens": 2529531712} +{"current_steps": 8630, "total_steps": 29667, "loss": 0.3744, "lr": 3.6633231713703576e-05, "epoch": 0.8727364662010555, "percentage": 29.09, "elapsed_time": "1 day, 0:10:15", "remaining_time": "2 days, 10:55:14", "throughput": 29103.2, "total_tokens": 2532437440} +{"current_steps": 8640, "total_steps": 29667, "loss": 0.377, "lr": 3.6623403357420745e-05, "epoch": 0.8737477483171634, "percentage": 29.12, "elapsed_time": "1 day, 0:11:52", "remaining_time": "2 days, 10:53:24", "throughput": 29103.98, "total_tokens": 2535323648} +{"current_steps": 8650, "total_steps": 29667, "loss": 0.3747, "lr": 3.661358290746611e-05, "epoch": 0.8747590304332712, "percentage": 29.16, "elapsed_time": "1 day, 0:13:30", "remaining_time": "2 days, 10:51:35", "throughput": 29105.18, "total_tokens": 2538269952} +{"current_steps": 8660, "total_steps": 29667, "loss": 0.3804, "lr": 3.6603770353245056e-05, "epoch": 0.875770312549379, "percentage": 29.19, "elapsed_time": "1 day, 0:15:08", 
"remaining_time": "2 days, 10:49:48", "throughput": 29105.72, "total_tokens": 2541169856} +{"current_steps": 8670, "total_steps": 29667, "loss": 0.3727, "lr": 3.659396568418286e-05, "epoch": 0.8767815946654869, "percentage": 29.22, "elapsed_time": "1 day, 0:16:49", "remaining_time": "2 days, 10:48:09", "throughput": 29105.71, "total_tokens": 2544126912} +{"current_steps": 8680, "total_steps": 29667, "loss": 0.3793, "lr": 3.658416888972459e-05, "epoch": 0.8777928767815947, "percentage": 29.26, "elapsed_time": "1 day, 0:18:27", "remaining_time": "2 days, 10:46:21", "throughput": 29106.66, "total_tokens": 2547064704} +{"current_steps": 8690, "total_steps": 29667, "loss": 0.3712, "lr": 3.6574379959335106e-05, "epoch": 0.8788041588977025, "percentage": 29.29, "elapsed_time": "1 day, 0:20:03", "remaining_time": "2 days, 10:44:28", "throughput": 29107.98, "total_tokens": 2549963392} +{"current_steps": 8700, "total_steps": 29667, "loss": 0.3722, "lr": 3.6564598882498976e-05, "epoch": 0.8798154410138104, "percentage": 29.33, "elapsed_time": "1 day, 0:21:41", "remaining_time": "2 days, 10:42:40", "throughput": 29109.28, "total_tokens": 2552925696} +{"current_steps": 8710, "total_steps": 29667, "loss": 0.3769, "lr": 3.655482564872043e-05, "epoch": 0.8808267231299182, "percentage": 29.36, "elapsed_time": "1 day, 0:23:22", "remaining_time": "2 days, 10:41:00", "throughput": 29109.58, "total_tokens": 2555892096} +{"current_steps": 8720, "total_steps": 29667, "loss": 0.3738, "lr": 3.654506024752336e-05, "epoch": 0.881838005246026, "percentage": 29.39, "elapsed_time": "1 day, 0:25:02", "remaining_time": "2 days, 10:39:17", "throughput": 29109.8, "total_tokens": 2558827392} +{"current_steps": 8730, "total_steps": 29667, "loss": 0.3687, "lr": 3.653530266845121e-05, "epoch": 0.8828492873621338, "percentage": 29.43, "elapsed_time": "1 day, 0:26:40", "remaining_time": "2 days, 10:37:29", "throughput": 29110.83, "total_tokens": 2561756736} +{"current_steps": 8740, "total_steps": 29667, 
"loss": 0.372, "lr": 3.652555290106696e-05, "epoch": 0.8838605694782417, "percentage": 29.46, "elapsed_time": "1 day, 0:28:18", "remaining_time": "2 days, 10:35:41", "throughput": 29111.99, "total_tokens": 2564708736} +{"current_steps": 8750, "total_steps": 29667, "loss": 0.371, "lr": 3.6515810934953084e-05, "epoch": 0.8848718515943494, "percentage": 29.49, "elapsed_time": "1 day, 0:29:52", "remaining_time": "2 days, 10:33:45", "throughput": 29113.55, "total_tokens": 2567599552} +{"current_steps": 8760, "total_steps": 29667, "loss": 0.3718, "lr": 3.650607675971151e-05, "epoch": 0.8858831337104572, "percentage": 29.53, "elapsed_time": "1 day, 0:31:34", "remaining_time": "2 days, 10:32:07", "throughput": 29113.51, "total_tokens": 2570556800} +{"current_steps": 8770, "total_steps": 29667, "loss": 0.3729, "lr": 3.649635036496351e-05, "epoch": 0.8868944158265651, "percentage": 29.56, "elapsed_time": "1 day, 0:33:15", "remaining_time": "2 days, 10:30:26", "throughput": 29113.69, "total_tokens": 2573512832} +{"current_steps": 8780, "total_steps": 29667, "loss": 0.3777, "lr": 3.6486631740349746e-05, "epoch": 0.8879056979426729, "percentage": 29.6, "elapsed_time": "1 day, 0:34:57", "remaining_time": "2 days, 10:28:49", "throughput": 29113.76, "total_tokens": 2576498560} +{"current_steps": 8790, "total_steps": 29667, "loss": 0.3811, "lr": 3.647692087553018e-05, "epoch": 0.8889169800587807, "percentage": 29.63, "elapsed_time": "1 day, 0:36:39", "remaining_time": "2 days, 10:27:10", "throughput": 29113.95, "total_tokens": 2579468672} +{"current_steps": 8800, "total_steps": 29667, "loss": 0.3711, "lr": 3.6467217760184005e-05, "epoch": 0.8899282621748886, "percentage": 29.66, "elapsed_time": "1 day, 0:38:17", "remaining_time": "2 days, 10:25:24", "throughput": 29114.77, "total_tokens": 2582415168} +{"current_steps": 8810, "total_steps": 29667, "loss": 0.3669, "lr": 3.6457522384009625e-05, "epoch": 0.8909395442909964, "percentage": 29.7, "elapsed_time": "1 day, 0:39:57", 
"remaining_time": "2 days, 10:23:40", "throughput": 29115.5, "total_tokens": 2585370176} +{"current_steps": 8820, "total_steps": 29667, "loss": 0.3782, "lr": 3.644783473672462e-05, "epoch": 0.8919508264071042, "percentage": 29.73, "elapsed_time": "1 day, 0:41:37", "remaining_time": "2 days, 10:21:59", "throughput": 29115.74, "total_tokens": 2588324608} +{"current_steps": 8830, "total_steps": 29667, "loss": 0.3764, "lr": 3.643815480806568e-05, "epoch": 0.8929621085232121, "percentage": 29.76, "elapsed_time": "1 day, 0:43:12", "remaining_time": "2 days, 10:20:03", "throughput": 29116.96, "total_tokens": 2591188544} +{"current_steps": 8840, "total_steps": 29667, "loss": 0.3667, "lr": 3.6428482587788555e-05, "epoch": 0.8939733906393199, "percentage": 29.8, "elapsed_time": "1 day, 0:44:50", "remaining_time": "2 days, 10:18:16", "throughput": 29117.85, "total_tokens": 2594116160} +{"current_steps": 8850, "total_steps": 29667, "loss": 0.3743, "lr": 3.641881806566803e-05, "epoch": 0.8949846727554277, "percentage": 29.83, "elapsed_time": "1 day, 0:46:33", "remaining_time": "2 days, 10:16:41", "throughput": 29117.56, "total_tokens": 2597102208} +{"current_steps": 8860, "total_steps": 29667, "loss": 0.3748, "lr": 3.640916123149788e-05, "epoch": 0.8959959548715356, "percentage": 29.86, "elapsed_time": "1 day, 0:48:08", "remaining_time": "2 days, 10:14:47", "throughput": 29119.04, "total_tokens": 2600006400} +{"current_steps": 8870, "total_steps": 29667, "loss": 0.3728, "lr": 3.639951207509079e-05, "epoch": 0.8970072369876434, "percentage": 29.9, "elapsed_time": "1 day, 0:49:49", "remaining_time": "2 days, 10:13:05", "throughput": 29119.83, "total_tokens": 2602993216} +{"current_steps": 8880, "total_steps": 29667, "loss": 0.37, "lr": 3.6389870586278333e-05, "epoch": 0.8980185191037512, "percentage": 29.93, "elapsed_time": "1 day, 0:51:30", "remaining_time": "2 days, 10:11:26", "throughput": 29119.9, "total_tokens": 2605956096} +{"current_steps": 8890, "total_steps": 29667, 
"loss": 0.373, "lr": 3.6380236754910965e-05, "epoch": 0.8990298012198591, "percentage": 29.97, "elapsed_time": "1 day, 0:53:07", "remaining_time": "2 days, 10:09:37", "throughput": 29120.93, "total_tokens": 2608874816} +{"current_steps": 8900, "total_steps": 29667, "loss": 0.3743, "lr": 3.6370610570857897e-05, "epoch": 0.9000410833359669, "percentage": 30.0, "elapsed_time": "1 day, 0:54:41", "remaining_time": "2 days, 10:07:40", "throughput": 29122.93, "total_tokens": 2611785664} +{"current_steps": 8910, "total_steps": 29667, "loss": 0.3745, "lr": 3.6360992024007114e-05, "epoch": 0.9010523654520747, "percentage": 30.03, "elapsed_time": "1 day, 0:56:17", "remaining_time": "2 days, 10:05:47", "throughput": 29124.01, "total_tokens": 2614666816} +{"current_steps": 8920, "total_steps": 29667, "loss": 0.372, "lr": 3.6351381104265304e-05, "epoch": 0.9020636475681826, "percentage": 30.07, "elapsed_time": "1 day, 0:57:56", "remaining_time": "2 days, 10:04:04", "throughput": 29124.65, "total_tokens": 2617633536} +{"current_steps": 8930, "total_steps": 29667, "loss": 0.3726, "lr": 3.634177780155783e-05, "epoch": 0.9030749296842904, "percentage": 30.1, "elapsed_time": "1 day, 0:59:34", "remaining_time": "2 days, 10:02:15", "throughput": 29125.85, "total_tokens": 2620575744} +{"current_steps": 8940, "total_steps": 29667, "loss": 0.3714, "lr": 3.633218210582867e-05, "epoch": 0.9040862118003982, "percentage": 30.13, "elapsed_time": "1 day, 1:01:11", "remaining_time": "2 days, 10:00:25", "throughput": 29126.92, "total_tokens": 2623493952} +{"current_steps": 8950, "total_steps": 29667, "loss": 0.3716, "lr": 3.6322594007040376e-05, "epoch": 0.9050974939165061, "percentage": 30.17, "elapsed_time": "1 day, 1:02:48", "remaining_time": "2 days, 9:58:37", "throughput": 29127.87, "total_tokens": 2626418944} +{"current_steps": 8960, "total_steps": 29667, "loss": 0.3767, "lr": 3.631301349517403e-05, "epoch": 0.9061087760326139, "percentage": 30.2, "elapsed_time": "1 day, 1:04:28", 
"remaining_time": "2 days, 9:56:54", "throughput": 29128.51, "total_tokens": 2629378048} +{"current_steps": 8970, "total_steps": 29667, "loss": 0.376, "lr": 3.6303440560229216e-05, "epoch": 0.9071200581487217, "percentage": 30.24, "elapsed_time": "1 day, 1:06:06", "remaining_time": "2 days, 9:55:07", "throughput": 29129.33, "total_tokens": 2632314688} +{"current_steps": 8980, "total_steps": 29667, "loss": 0.3747, "lr": 3.629387519222395e-05, "epoch": 0.9081313402648296, "percentage": 30.27, "elapsed_time": "1 day, 1:07:44", "remaining_time": "2 days, 9:53:21", "throughput": 29130.04, "total_tokens": 2635247488} +{"current_steps": 8990, "total_steps": 29667, "loss": 0.3755, "lr": 3.628431738119464e-05, "epoch": 0.9091426223809373, "percentage": 30.3, "elapsed_time": "1 day, 1:09:22", "remaining_time": "2 days, 9:51:32", "throughput": 29130.96, "total_tokens": 2638158464} +{"current_steps": 9000, "total_steps": 29667, "loss": 0.3718, "lr": 3.62747671171961e-05, "epoch": 0.9101539044970451, "percentage": 30.34, "elapsed_time": "1 day, 1:10:58", "remaining_time": "2 days, 9:49:42", "throughput": 29132.05, "total_tokens": 2641077120} +{"current_steps": 9010, "total_steps": 29667, "loss": 0.3795, "lr": 3.626522439030138e-05, "epoch": 0.9111651866131529, "percentage": 30.37, "elapsed_time": "1 day, 1:12:34", "remaining_time": "2 days, 9:47:50", "throughput": 29133.45, "total_tokens": 2643989504} +{"current_steps": 9020, "total_steps": 29667, "loss": 0.3732, "lr": 3.6255689190601863e-05, "epoch": 0.9121764687292608, "percentage": 30.4, "elapsed_time": "1 day, 1:14:15", "remaining_time": "2 days, 9:46:10", "throughput": 29133.45, "total_tokens": 2646931904} +{"current_steps": 9030, "total_steps": 29667, "loss": 0.3729, "lr": 3.624616150820714e-05, "epoch": 0.9131877508453686, "percentage": 30.44, "elapsed_time": "1 day, 1:15:51", "remaining_time": "2 days, 9:44:19", "throughput": 29134.82, "total_tokens": 2649865088} +{"current_steps": 9040, "total_steps": 29667, "loss": 
0.3761, "lr": 3.623664133324499e-05, "epoch": 0.9141990329614764, "percentage": 30.47, "elapsed_time": "1 day, 1:17:30", "remaining_time": "2 days, 9:42:33", "throughput": 29135.44, "total_tokens": 2652786880} +{"current_steps": 9050, "total_steps": 29667, "loss": 0.3776, "lr": 3.622712865586131e-05, "epoch": 0.9152103150775843, "percentage": 30.51, "elapsed_time": "1 day, 1:19:11", "remaining_time": "2 days, 9:40:53", "throughput": 29135.48, "total_tokens": 2655733888} +{"current_steps": 9060, "total_steps": 29667, "loss": 0.3739, "lr": 3.621762346622014e-05, "epoch": 0.9162215971936921, "percentage": 30.54, "elapsed_time": "1 day, 1:20:47", "remaining_time": "2 days, 9:39:02", "throughput": 29136.86, "total_tokens": 2658657792} +{"current_steps": 9070, "total_steps": 29667, "loss": 0.3755, "lr": 3.620812575450352e-05, "epoch": 0.9172328793097999, "percentage": 30.57, "elapsed_time": "1 day, 1:22:23", "remaining_time": "2 days, 9:37:11", "throughput": 29137.57, "total_tokens": 2661532224} +{"current_steps": 9080, "total_steps": 29667, "loss": 0.3776, "lr": 3.6198635510911556e-05, "epoch": 0.9182441614259078, "percentage": 30.61, "elapsed_time": "1 day, 1:24:00", "remaining_time": "2 days, 9:35:22", "throughput": 29138.51, "total_tokens": 2664444800} +{"current_steps": 9090, "total_steps": 29667, "loss": 0.3699, "lr": 3.618915272566228e-05, "epoch": 0.9192554435420156, "percentage": 30.64, "elapsed_time": "1 day, 1:25:40", "remaining_time": "2 days, 9:33:38", "throughput": 29138.77, "total_tokens": 2667364416} +{"current_steps": 9100, "total_steps": 29667, "loss": 0.3719, "lr": 3.6179677388991694e-05, "epoch": 0.9202667256581234, "percentage": 30.67, "elapsed_time": "1 day, 1:27:19", "remaining_time": "2 days, 9:31:55", "throughput": 29139.57, "total_tokens": 2670338624} +{"current_steps": 9110, "total_steps": 29667, "loss": 0.3715, "lr": 3.617020949115366e-05, "epoch": 0.9212780077742313, "percentage": 30.71, "elapsed_time": "1 day, 1:28:56", "remaining_time": "2 
days, 9:30:06", "throughput": 29140.97, "total_tokens": 2673289664} +{"current_steps": 9120, "total_steps": 29667, "loss": 0.3707, "lr": 3.6160749022419886e-05, "epoch": 0.9222892898903391, "percentage": 30.74, "elapsed_time": "1 day, 1:30:34", "remaining_time": "2 days, 9:28:19", "throughput": 29142.06, "total_tokens": 2676243904} +{"current_steps": 9130, "total_steps": 29667, "loss": 0.369, "lr": 3.6151295973079887e-05, "epoch": 0.9233005720064469, "percentage": 30.77, "elapsed_time": "1 day, 1:32:11", "remaining_time": "2 days, 9:26:30", "throughput": 29143.49, "total_tokens": 2679200192} +{"current_steps": 9140, "total_steps": 29667, "loss": 0.3726, "lr": 3.6141850333440934e-05, "epoch": 0.9243118541225548, "percentage": 30.81, "elapsed_time": "1 day, 1:33:48", "remaining_time": "2 days, 9:24:41", "throughput": 29144.4, "total_tokens": 2682111424} +{"current_steps": 9150, "total_steps": 29667, "loss": 0.372, "lr": 3.613241209382803e-05, "epoch": 0.9253231362386626, "percentage": 30.84, "elapsed_time": "1 day, 1:35:28", "remaining_time": "2 days, 9:22:59", "throughput": 29145.18, "total_tokens": 2685102144} +{"current_steps": 9160, "total_steps": 29667, "loss": 0.3738, "lr": 3.6122981244583834e-05, "epoch": 0.9263344183547704, "percentage": 30.88, "elapsed_time": "1 day, 1:37:02", "remaining_time": "2 days, 9:21:04", "throughput": 29146.77, "total_tokens": 2688000896} +{"current_steps": 9170, "total_steps": 29667, "loss": 0.3714, "lr": 3.6113557776068644e-05, "epoch": 0.9273457004708783, "percentage": 30.91, "elapsed_time": "1 day, 1:38:43", "remaining_time": "2 days, 9:19:23", "throughput": 29147.46, "total_tokens": 2690988288} +{"current_steps": 9180, "total_steps": 29667, "loss": 0.3696, "lr": 3.6104141678660386e-05, "epoch": 0.9283569825869861, "percentage": 30.94, "elapsed_time": "1 day, 1:40:20", "remaining_time": "2 days, 9:17:34", "throughput": 29148.74, "total_tokens": 2693937984} +{"current_steps": 9190, "total_steps": 29667, "loss": 0.3752, "lr": 
3.6094732942754487e-05, "epoch": 0.9293682647030939, "percentage": 30.98, "elapsed_time": "1 day, 1:42:00", "remaining_time": "2 days, 9:15:51", "throughput": 29148.82, "total_tokens": 2696848704} +{"current_steps": 9200, "total_steps": 29667, "loss": 0.3735, "lr": 3.60853315587639e-05, "epoch": 0.9303795468192018, "percentage": 31.01, "elapsed_time": "1 day, 1:43:36", "remaining_time": "2 days, 9:14:01", "throughput": 29150.08, "total_tokens": 2699781376} +{"current_steps": 9210, "total_steps": 29667, "loss": 0.3733, "lr": 3.607593751711909e-05, "epoch": 0.9313908289353096, "percentage": 31.04, "elapsed_time": "1 day, 1:45:19", "remaining_time": "2 days, 9:12:25", "throughput": 29150.24, "total_tokens": 2702792128} +{"current_steps": 9220, "total_steps": 29667, "loss": 0.3751, "lr": 3.60665508082679e-05, "epoch": 0.9324021110514173, "percentage": 31.08, "elapsed_time": "1 day, 1:47:02", "remaining_time": "2 days, 9:10:50", "throughput": 29150.05, "total_tokens": 2705775680} +{"current_steps": 9230, "total_steps": 29667, "loss": 0.3743, "lr": 3.6057171422675585e-05, "epoch": 0.9334133931675253, "percentage": 31.11, "elapsed_time": "1 day, 1:48:43", "remaining_time": "2 days, 9:09:10", "throughput": 29150.07, "total_tokens": 2708724544} +{"current_steps": 9240, "total_steps": 29667, "loss": 0.3765, "lr": 3.604779935082474e-05, "epoch": 0.934424675283633, "percentage": 31.15, "elapsed_time": "1 day, 1:50:21", "remaining_time": "2 days, 9:07:23", "throughput": 29150.51, "total_tokens": 2711619392} +{"current_steps": 9250, "total_steps": 29667, "loss": 0.3747, "lr": 3.603843458321526e-05, "epoch": 0.9354359573997408, "percentage": 31.18, "elapsed_time": "1 day, 1:52:01", "remaining_time": "2 days, 9:05:41", "throughput": 29151.23, "total_tokens": 2714601216} +{"current_steps": 9260, "total_steps": 29667, "loss": 0.3741, "lr": 3.6029077110364355e-05, "epoch": 0.9364472395158487, "percentage": 31.21, "elapsed_time": "1 day, 1:53:39", "remaining_time": "2 days, 9:03:54", 
"throughput": 29152.28, "total_tokens": 2717546944} +{"current_steps": 9270, "total_steps": 29667, "loss": 0.3734, "lr": 3.60197269228064e-05, "epoch": 0.9374585216319565, "percentage": 31.25, "elapsed_time": "1 day, 1:55:16", "remaining_time": "2 days, 9:02:06", "throughput": 29153.25, "total_tokens": 2720485056} +{"current_steps": 9280, "total_steps": 29667, "loss": 0.3727, "lr": 3.601038401109299e-05, "epoch": 0.9384698037480643, "percentage": 31.28, "elapsed_time": "1 day, 1:56:58", "remaining_time": "2 days, 9:00:28", "throughput": 29153.29, "total_tokens": 2723459456} +{"current_steps": 9290, "total_steps": 29667, "loss": 0.3723, "lr": 3.6001048365792846e-05, "epoch": 0.9394810858641721, "percentage": 31.31, "elapsed_time": "1 day, 1:58:35", "remaining_time": "2 days, 8:58:41", "throughput": 29153.9, "total_tokens": 2726355392} +{"current_steps": 9300, "total_steps": 29667, "loss": 0.3724, "lr": 3.599171997749182e-05, "epoch": 0.94049236798028, "percentage": 31.35, "elapsed_time": "1 day, 2:00:11", "remaining_time": "2 days, 8:56:50", "throughput": 29155.08, "total_tokens": 2729264576} +{"current_steps": 9310, "total_steps": 29667, "loss": 0.3724, "lr": 3.598239883679281e-05, "epoch": 0.9415036500963878, "percentage": 31.38, "elapsed_time": "1 day, 2:01:55", "remaining_time": "2 days, 8:55:16", "throughput": 29155.06, "total_tokens": 2732289024} +{"current_steps": 9320, "total_steps": 29667, "loss": 0.3825, "lr": 3.597308493431576e-05, "epoch": 0.9425149322124956, "percentage": 31.42, "elapsed_time": "1 day, 2:03:36", "remaining_time": "2 days, 8:53:36", "throughput": 29155.23, "total_tokens": 2735253120} +{"current_steps": 9330, "total_steps": 29667, "loss": 0.3729, "lr": 3.596377826069758e-05, "epoch": 0.9435262143286035, "percentage": 31.45, "elapsed_time": "1 day, 2:05:16", "remaining_time": "2 days, 8:51:54", "throughput": 29155.58, "total_tokens": 2738199232} +{"current_steps": 9340, "total_steps": 29667, "loss": 0.3708, "lr": 3.5954478806592155e-05, 
"epoch": 0.9445374964447113, "percentage": 31.48, "elapsed_time": "1 day, 2:06:59", "remaining_time": "2 days, 8:50:18", "throughput": 29155.56, "total_tokens": 2741200384} +{"current_steps": 9350, "total_steps": 29667, "loss": 0.3707, "lr": 3.594518656267024e-05, "epoch": 0.9455487785608191, "percentage": 31.52, "elapsed_time": "1 day, 2:08:41", "remaining_time": "2 days, 8:48:40", "throughput": 29155.85, "total_tokens": 2744195520} +{"current_steps": 9360, "total_steps": 29667, "loss": 0.3694, "lr": 3.5935901519619496e-05, "epoch": 0.946560060676927, "percentage": 31.55, "elapsed_time": "1 day, 2:10:18", "remaining_time": "2 days, 8:46:51", "throughput": 29156.64, "total_tokens": 2747095040} +{"current_steps": 9370, "total_steps": 29667, "loss": 0.3772, "lr": 3.5926623668144385e-05, "epoch": 0.9475713427930348, "percentage": 31.58, "elapsed_time": "1 day, 2:11:55", "remaining_time": "2 days, 8:45:03", "throughput": 29157.48, "total_tokens": 2749999040} +{"current_steps": 9380, "total_steps": 29667, "loss": 0.372, "lr": 3.5917352998966194e-05, "epoch": 0.9485826249091426, "percentage": 31.62, "elapsed_time": "1 day, 2:13:32", "remaining_time": "2 days, 8:43:14", "throughput": 29158.14, "total_tokens": 2752884864} +{"current_steps": 9390, "total_steps": 29667, "loss": 0.3683, "lr": 3.5908089502822914e-05, "epoch": 0.9495939070252505, "percentage": 31.65, "elapsed_time": "1 day, 2:15:12", "remaining_time": "2 days, 8:41:33", "throughput": 29158.28, "total_tokens": 2755829120} +{"current_steps": 9400, "total_steps": 29667, "loss": 0.3745, "lr": 3.589883317046929e-05, "epoch": 0.9506051891413583, "percentage": 31.69, "elapsed_time": "1 day, 2:16:51", "remaining_time": "2 days, 8:39:47", "throughput": 29158.86, "total_tokens": 2758752448} +{"current_steps": 9410, "total_steps": 29667, "loss": 0.3759, "lr": 3.5889583992676715e-05, "epoch": 0.9516164712574661, "percentage": 31.72, "elapsed_time": "1 day, 2:18:28", "remaining_time": "2 days, 8:37:59", "throughput": 
29159.82, "total_tokens": 2761675648} +{"current_steps": 9420, "total_steps": 29667, "loss": 0.3739, "lr": 3.5880341960233244e-05, "epoch": 0.952627753373574, "percentage": 31.75, "elapsed_time": "1 day, 2:20:06", "remaining_time": "2 days, 8:36:14", "throughput": 29160.61, "total_tokens": 2764629440} +{"current_steps": 9430, "total_steps": 29667, "loss": 0.3763, "lr": 3.58711070639435e-05, "epoch": 0.9536390354896818, "percentage": 31.79, "elapsed_time": "1 day, 2:21:43", "remaining_time": "2 days, 8:34:24", "throughput": 29161.9, "total_tokens": 2767562560} +{"current_steps": 9440, "total_steps": 29667, "loss": 0.3719, "lr": 3.586187929462869e-05, "epoch": 0.9546503176057896, "percentage": 31.82, "elapsed_time": "1 day, 2:23:26", "remaining_time": "2 days, 8:32:48", "throughput": 29162.09, "total_tokens": 2770573824} +{"current_steps": 9450, "total_steps": 29667, "loss": 0.3755, "lr": 3.585265864312651e-05, "epoch": 0.9556615997218975, "percentage": 31.85, "elapsed_time": "1 day, 2:24:57", "remaining_time": "2 days, 8:30:48", "throughput": 29164.21, "total_tokens": 2773443136} +{"current_steps": 9460, "total_steps": 29667, "loss": 0.3691, "lr": 3.584344510029118e-05, "epoch": 0.9566728818380053, "percentage": 31.89, "elapsed_time": "1 day, 2:26:36", "remaining_time": "2 days, 8:29:03", "throughput": 29165.37, "total_tokens": 2776430848} +{"current_steps": 9470, "total_steps": 29667, "loss": 0.3722, "lr": 3.583423865699333e-05, "epoch": 0.957684163954113, "percentage": 31.92, "elapsed_time": "1 day, 2:28:14", "remaining_time": "2 days, 8:27:18", "throughput": 29165.71, "total_tokens": 2779344640} +{"current_steps": 9480, "total_steps": 29667, "loss": 0.3742, "lr": 3.5825039304119994e-05, "epoch": 0.958695446070221, "percentage": 31.95, "elapsed_time": "1 day, 2:29:54", "remaining_time": "2 days, 8:25:35", "throughput": 29166.47, "total_tokens": 2782307520} +{"current_steps": 9490, "total_steps": 29667, "loss": 0.3726, "lr": 3.581584703257461e-05, "epoch": 
0.9597067281863287, "percentage": 31.99, "elapsed_time": "1 day, 2:31:33", "remaining_time": "2 days, 8:23:51", "throughput": 29166.98, "total_tokens": 2785251392} +{"current_steps": 9500, "total_steps": 29667, "loss": 0.3741, "lr": 3.580666183327689e-05, "epoch": 0.9607180103024365, "percentage": 32.02, "elapsed_time": "1 day, 2:33:12", "remaining_time": "2 days, 8:22:08", "throughput": 29167.57, "total_tokens": 2788215424} +{"current_steps": 9510, "total_steps": 29667, "loss": 0.3749, "lr": 3.5797483697162906e-05, "epoch": 0.9617292924185444, "percentage": 32.06, "elapsed_time": "1 day, 2:34:52", "remaining_time": "2 days, 8:20:26", "throughput": 29167.95, "total_tokens": 2791157376} +{"current_steps": 9520, "total_steps": 29667, "loss": 0.369, "lr": 3.5788312615184936e-05, "epoch": 0.9627405745346522, "percentage": 32.09, "elapsed_time": "1 day, 2:36:32", "remaining_time": "2 days, 8:18:44", "throughput": 29168.3, "total_tokens": 2794110336} +{"current_steps": 9530, "total_steps": 29667, "loss": 0.3758, "lr": 3.5779148578311476e-05, "epoch": 0.96375185665076, "percentage": 32.12, "elapsed_time": "1 day, 2:38:09", "remaining_time": "2 days, 8:16:56", "throughput": 29169.24, "total_tokens": 2797036736} +{"current_steps": 9540, "total_steps": 29667, "loss": 0.3698, "lr": 3.5769991577527236e-05, "epoch": 0.9647631387668679, "percentage": 32.16, "elapsed_time": "1 day, 2:39:51", "remaining_time": "2 days, 8:15:18", "throughput": 29169.33, "total_tokens": 2800022208} +{"current_steps": 9550, "total_steps": 29667, "loss": 0.3761, "lr": 3.5760841603833034e-05, "epoch": 0.9657744208829757, "percentage": 32.19, "elapsed_time": "1 day, 2:41:26", "remaining_time": "2 days, 8:13:26", "throughput": 29170.62, "total_tokens": 2802911360} +{"current_steps": 9560, "total_steps": 29667, "loss": 0.374, "lr": 3.5751698648245814e-05, "epoch": 0.9667857029990835, "percentage": 32.22, "elapsed_time": "1 day, 2:43:02", "remaining_time": "2 days, 8:11:36", "throughput": 29171.71, 
"total_tokens": 2805822464} +{"current_steps": 9570, "total_steps": 29667, "loss": 0.3734, "lr": 3.574256270179857e-05, "epoch": 0.9677969851151913, "percentage": 32.26, "elapsed_time": "1 day, 2:44:45", "remaining_time": "2 days, 8:09:58", "throughput": 29171.44, "total_tokens": 2808778240} +{"current_steps": 9580, "total_steps": 29667, "loss": 0.3734, "lr": 3.573343375554037e-05, "epoch": 0.9688082672312992, "percentage": 32.29, "elapsed_time": "1 day, 2:46:24", "remaining_time": "2 days, 8:08:14", "throughput": 29172.27, "total_tokens": 2811746368} +{"current_steps": 9590, "total_steps": 29667, "loss": 0.3737, "lr": 3.572431180053621e-05, "epoch": 0.969819549347407, "percentage": 32.33, "elapsed_time": "1 day, 2:48:04", "remaining_time": "2 days, 8:06:34", "throughput": 29172.6, "total_tokens": 2814716736} +{"current_steps": 9600, "total_steps": 29667, "loss": 0.3729, "lr": 3.571519682786711e-05, "epoch": 0.9708308314635148, "percentage": 32.36, "elapsed_time": "1 day, 2:49:46", "remaining_time": "2 days, 8:04:56", "throughput": 29172.66, "total_tokens": 2817695936} +{"current_steps": 9610, "total_steps": 29667, "loss": 0.3751, "lr": 3.570608882862996e-05, "epoch": 0.9718421135796227, "percentage": 32.39, "elapsed_time": "1 day, 2:51:28", "remaining_time": "2 days, 8:03:18", "throughput": 29172.3, "total_tokens": 2820625024} +{"current_steps": 9620, "total_steps": 29667, "loss": 0.3703, "lr": 3.569698779393757e-05, "epoch": 0.9728533956957305, "percentage": 32.43, "elapsed_time": "1 day, 2:53:07", "remaining_time": "2 days, 8:01:35", "throughput": 29172.54, "total_tokens": 2823549120} +{"current_steps": 9630, "total_steps": 29667, "loss": 0.3693, "lr": 3.568789371491859e-05, "epoch": 0.9738646778118383, "percentage": 32.46, "elapsed_time": "1 day, 2:54:49", "remaining_time": "2 days, 7:59:56", "throughput": 29172.52, "total_tokens": 2826508928} +{"current_steps": 9640, "total_steps": 29667, "loss": 0.3718, "lr": 3.567880658271748e-05, "epoch": 
0.9748759599279462, "percentage": 32.49, "elapsed_time": "1 day, 2:56:29", "remaining_time": "2 days, 7:58:13", "throughput": 29173.1, "total_tokens": 2829472256} +{"current_steps": 9650, "total_steps": 29667, "loss": 0.3715, "lr": 3.566972638849445e-05, "epoch": 0.975887242044054, "percentage": 32.53, "elapsed_time": "1 day, 2:58:05", "remaining_time": "2 days, 7:56:25", "throughput": 29174.16, "total_tokens": 2832402560} +{"current_steps": 9660, "total_steps": 29667, "loss": 0.3772, "lr": 3.566065312342551e-05, "epoch": 0.9768985241601618, "percentage": 32.56, "elapsed_time": "1 day, 2:59:40", "remaining_time": "2 days, 7:54:31", "throughput": 29175.26, "total_tokens": 2835255232} +{"current_steps": 9670, "total_steps": 29667, "loss": 0.3732, "lr": 3.565158677870231e-05, "epoch": 0.9779098062762697, "percentage": 32.6, "elapsed_time": "1 day, 3:01:17", "remaining_time": "2 days, 7:52:43", "throughput": 29176.17, "total_tokens": 2838177472} +{"current_steps": 9680, "total_steps": 29667, "loss": 0.3688, "lr": 3.564252734553221e-05, "epoch": 0.9789210883923775, "percentage": 32.63, "elapsed_time": "1 day, 3:02:57", "remaining_time": "2 days, 7:51:01", "throughput": 29176.62, "total_tokens": 2841132160} +{"current_steps": 9690, "total_steps": 29667, "loss": 0.3739, "lr": 3.563347481513818e-05, "epoch": 0.9799323705084853, "percentage": 32.66, "elapsed_time": "1 day, 3:04:37", "remaining_time": "2 days, 7:49:20", "throughput": 29176.77, "total_tokens": 2844084992} +{"current_steps": 9700, "total_steps": 29667, "loss": 0.374, "lr": 3.56244291787588e-05, "epoch": 0.9809436526245932, "percentage": 32.7, "elapsed_time": "1 day, 3:06:17", "remaining_time": "2 days, 7:47:39", "throughput": 29177.52, "total_tokens": 2847074304} +{"current_steps": 9710, "total_steps": 29667, "loss": 0.3696, "lr": 3.5615390427648216e-05, "epoch": 0.981954934740701, "percentage": 32.73, "elapsed_time": "1 day, 3:07:54", "remaining_time": "2 days, 7:45:50", "throughput": 29178.97, 
"total_tokens": 2850035904} +{"current_steps": 9720, "total_steps": 29667, "loss": 0.3726, "lr": 3.5606358553076075e-05, "epoch": 0.9829662168568087, "percentage": 32.76, "elapsed_time": "1 day, 3:09:31", "remaining_time": "2 days, 7:44:02", "throughput": 29179.4, "total_tokens": 2852911424} +{"current_steps": 9730, "total_steps": 29667, "loss": 0.3766, "lr": 3.5597333546327526e-05, "epoch": 0.9839774989729166, "percentage": 32.8, "elapsed_time": "1 day, 3:11:06", "remaining_time": "2 days, 7:42:10", "throughput": 29180.6, "total_tokens": 2855793920} +{"current_steps": 9740, "total_steps": 29667, "loss": 0.3705, "lr": 3.5588315398703186e-05, "epoch": 0.9849887810890244, "percentage": 32.83, "elapsed_time": "1 day, 3:12:45", "remaining_time": "2 days, 7:40:27", "throughput": 29181.18, "total_tokens": 2858753088} +{"current_steps": 9750, "total_steps": 29667, "loss": 0.3749, "lr": 3.557930410151907e-05, "epoch": 0.9860000632051322, "percentage": 32.86, "elapsed_time": "1 day, 3:14:26", "remaining_time": "2 days, 7:38:47", "throughput": 29181.48, "total_tokens": 2861735424} +{"current_steps": 9760, "total_steps": 29667, "loss": 0.3725, "lr": 3.5570299646106606e-05, "epoch": 0.9870113453212401, "percentage": 32.9, "elapsed_time": "1 day, 3:16:02", "remaining_time": "2 days, 7:36:57", "throughput": 29182.73, "total_tokens": 2864653632} +{"current_steps": 9770, "total_steps": 29667, "loss": 0.3729, "lr": 3.556130202381253e-05, "epoch": 0.9880226274373479, "percentage": 32.93, "elapsed_time": "1 day, 3:17:41", "remaining_time": "2 days, 7:35:12", "throughput": 29183.05, "total_tokens": 2867559360} +{"current_steps": 9780, "total_steps": 29667, "loss": 0.3701, "lr": 3.555231122599892e-05, "epoch": 0.9890339095534557, "percentage": 32.97, "elapsed_time": "1 day, 3:19:17", "remaining_time": "2 days, 7:33:24", "throughput": 29184.1, "total_tokens": 2870483328} +{"current_steps": 9790, "total_steps": 29667, "loss": 0.3709, "lr": 3.554332724404313e-05, "epoch": 
0.9900451916695636, "percentage": 33.0, "elapsed_time": "1 day, 3:20:57", "remaining_time": "2 days, 7:31:42", "throughput": 29184.73, "total_tokens": 2873465664} +{"current_steps": 9800, "total_steps": 29667, "loss": 0.3721, "lr": 3.553435006933777e-05, "epoch": 0.9910564737856714, "percentage": 33.03, "elapsed_time": "1 day, 3:22:33", "remaining_time": "2 days, 7:29:52", "throughput": 29185.86, "total_tokens": 2876379840} +{"current_steps": 9810, "total_steps": 29667, "loss": 0.3696, "lr": 3.5525379693290626e-05, "epoch": 0.9920677559017792, "percentage": 33.07, "elapsed_time": "1 day, 3:24:12", "remaining_time": "2 days, 7:28:08", "throughput": 29186.23, "total_tokens": 2879292800} +{"current_steps": 9820, "total_steps": 29667, "loss": 0.3759, "lr": 3.551641610732469e-05, "epoch": 0.9930790380178871, "percentage": 33.1, "elapsed_time": "1 day, 3:25:51", "remaining_time": "2 days, 7:26:24", "throughput": 29186.69, "total_tokens": 2882230656} +{"current_steps": 9830, "total_steps": 29667, "loss": 0.3673, "lr": 3.55074593028781e-05, "epoch": 0.9940903201339949, "percentage": 33.13, "elapsed_time": "1 day, 3:27:30", "remaining_time": "2 days, 7:24:40", "throughput": 29187.38, "total_tokens": 2885174336} +{"current_steps": 9840, "total_steps": 29667, "loss": 0.371, "lr": 3.5498509271404065e-05, "epoch": 0.9951016022501027, "percentage": 33.17, "elapsed_time": "1 day, 3:29:08", "remaining_time": "2 days, 7:22:56", "throughput": 29188.03, "total_tokens": 2888125504} +{"current_steps": 9850, "total_steps": 29667, "loss": 0.3694, "lr": 3.5489566004370893e-05, "epoch": 0.9961128843662105, "percentage": 33.2, "elapsed_time": "1 day, 3:30:42", "remaining_time": "2 days, 7:21:00", "throughput": 29189.97, "total_tokens": 2891034560} +{"current_steps": 9860, "total_steps": 29667, "loss": 0.3688, "lr": 3.548062949326194e-05, "epoch": 0.9971241664823184, "percentage": 33.24, "elapsed_time": "1 day, 3:32:21", "remaining_time": "2 days, 7:19:18", "throughput": 29190.59, 
"total_tokens": 2894011840} +{"current_steps": 9870, "total_steps": 29667, "loss": 0.3727, "lr": 3.547169972957554e-05, "epoch": 0.9981354485984262, "percentage": 33.27, "elapsed_time": "1 day, 3:34:00", "remaining_time": "2 days, 7:17:34", "throughput": 29190.98, "total_tokens": 2896928320} +{"current_steps": 9880, "total_steps": 29667, "loss": 0.3709, "lr": 3.5462776704825e-05, "epoch": 0.999146730714534, "percentage": 33.3, "elapsed_time": "1 day, 3:35:41", "remaining_time": "2 days, 7:15:53", "throughput": 29191.05, "total_tokens": 2899872320} +{"current_steps": 9890, "total_steps": 29667, "loss": 0.3665, "lr": 3.5453860410538594e-05, "epoch": 1.0001011282116108, "percentage": 33.34, "elapsed_time": "1 day, 3:37:18", "remaining_time": "2 days, 7:14:05", "throughput": 29190.62, "total_tokens": 2902657472} +{"current_steps": 9900, "total_steps": 29667, "loss": 0.3615, "lr": 3.5444950838259455e-05, "epoch": 1.0011124103277187, "percentage": 33.37, "elapsed_time": "1 day, 3:38:57", "remaining_time": "2 days, 7:12:23", "throughput": 29191.11, "total_tokens": 2905616512} +{"current_steps": 9910, "total_steps": 29667, "loss": 0.3546, "lr": 3.543604797954563e-05, "epoch": 1.0021236924438264, "percentage": 33.4, "elapsed_time": "1 day, 3:40:41", "remaining_time": "2 days, 7:10:49", "throughput": 29190.68, "total_tokens": 2908599808} +{"current_steps": 9920, "total_steps": 29667, "loss": 0.359, "lr": 3.542715182596996e-05, "epoch": 1.0031349745599343, "percentage": 33.44, "elapsed_time": "1 day, 3:42:20", "remaining_time": "2 days, 7:09:06", "throughput": 29191.26, "total_tokens": 2911554176} +{"current_steps": 9930, "total_steps": 29667, "loss": 0.3594, "lr": 3.5418262369120115e-05, "epoch": 1.0041462566760422, "percentage": 33.47, "elapsed_time": "1 day, 3:44:00", "remaining_time": "2 days, 7:07:23", "throughput": 29191.75, "total_tokens": 2914506112} +{"current_steps": 9940, "total_steps": 29667, "loss": 0.361, "lr": 3.5409379600598526e-05, "epoch": 
1.0051575387921499, "percentage": 33.51, "elapsed_time": "1 day, 3:45:35", "remaining_time": "2 days, 7:05:33", "throughput": 29192.91, "total_tokens": 2917413696} +{"current_steps": 9950, "total_steps": 29667, "loss": 0.356, "lr": 3.540050351202235e-05, "epoch": 1.0061688209082578, "percentage": 33.54, "elapsed_time": "1 day, 3:47:17", "remaining_time": "2 days, 7:03:54", "throughput": 29193.3, "total_tokens": 2920421952} +{"current_steps": 9960, "total_steps": 29667, "loss": 0.3588, "lr": 3.539163409502347e-05, "epoch": 1.0071801030243657, "percentage": 33.57, "elapsed_time": "1 day, 3:48:53", "remaining_time": "2 days, 7:02:05", "throughput": 29194.34, "total_tokens": 2923327680} +{"current_steps": 9970, "total_steps": 29667, "loss": 0.3611, "lr": 3.5382771341248416e-05, "epoch": 1.0081913851404734, "percentage": 33.61, "elapsed_time": "1 day, 3:50:27", "remaining_time": "2 days, 7:00:13", "throughput": 29195.94, "total_tokens": 2926249408} +{"current_steps": 9980, "total_steps": 29667, "loss": 0.3591, "lr": 3.537391524235835e-05, "epoch": 1.0092026672565813, "percentage": 33.64, "elapsed_time": "1 day, 3:52:06", "remaining_time": "2 days, 6:58:28", "throughput": 29196.6, "total_tokens": 2929188224} +{"current_steps": 9990, "total_steps": 29667, "loss": 0.36, "lr": 3.5365065790029055e-05, "epoch": 1.0102139493726892, "percentage": 33.67, "elapsed_time": "1 day, 3:53:44", "remaining_time": "2 days, 6:56:43", "throughput": 29197.14, "total_tokens": 2932117376} +{"current_steps": 10000, "total_steps": 29667, "loss": 0.3608, "lr": 3.535622297595087e-05, "epoch": 1.0112252314887968, "percentage": 33.71, "elapsed_time": "1 day, 3:55:24", "remaining_time": "2 days, 6:55:02", "throughput": 29197.46, "total_tokens": 2935067456} +{"current_steps": 10000, "total_steps": 29667, "eval_loss": 0.33349609375, "epoch": 1.0112252314887968, "percentage": 33.71, "elapsed_time": "1 day, 3:55:26", "remaining_time": "2 days, 6:55:05", "throughput": 29196.95, "total_tokens": 
2935067456} +{"current_steps": 10010, "total_steps": 29667, "loss": 0.3584, "lr": 3.534738679182869e-05, "epoch": 1.0122365136049047, "percentage": 33.74, "elapsed_time": "1 day, 3:57:32", "remaining_time": "2 days, 6:54:15", "throughput": 29189.64, "total_tokens": 2938024064} +{"current_steps": 10020, "total_steps": 29667, "loss": 0.3565, "lr": 3.533855722938188e-05, "epoch": 1.0132477957210126, "percentage": 33.77, "elapsed_time": "1 day, 3:59:09", "remaining_time": "2 days, 6:52:27", "throughput": 29190.56, "total_tokens": 2940932032} +{"current_steps": 10030, "total_steps": 29667, "loss": 0.3593, "lr": 3.5329734280344325e-05, "epoch": 1.0142590778371203, "percentage": 33.81, "elapsed_time": "1 day, 4:00:52", "remaining_time": "2 days, 6:50:52", "throughput": 29190.34, "total_tokens": 2943928192} +{"current_steps": 10040, "total_steps": 29667, "loss": 0.3569, "lr": 3.5320917936464294e-05, "epoch": 1.0152703599532282, "percentage": 33.84, "elapsed_time": "1 day, 4:02:30", "remaining_time": "2 days, 6:49:06", "throughput": 29191.69, "total_tokens": 2946916032} +{"current_steps": 10050, "total_steps": 29667, "loss": 0.3574, "lr": 3.5312108189504505e-05, "epoch": 1.0162816420693361, "percentage": 33.88, "elapsed_time": "1 day, 4:04:09", "remaining_time": "2 days, 6:47:23", "throughput": 29192.28, "total_tokens": 2949875392} +{"current_steps": 10060, "total_steps": 29667, "loss": 0.3583, "lr": 3.530330503124204e-05, "epoch": 1.0172929241854438, "percentage": 33.91, "elapsed_time": "1 day, 4:05:43", "remaining_time": "2 days, 6:45:30", "throughput": 29193.7, "total_tokens": 2952764480} +{"current_steps": 10070, "total_steps": 29667, "loss": 0.3569, "lr": 3.5294508453468325e-05, "epoch": 1.0183042063015517, "percentage": 33.94, "elapsed_time": "1 day, 4:07:21", "remaining_time": "2 days, 6:43:42", "throughput": 29194.78, "total_tokens": 2955710464} +{"current_steps": 10080, "total_steps": 29667, "loss": 0.3604, "lr": 3.528571844798908e-05, "epoch": 1.0193154884176596, 
"percentage": 33.98, "elapsed_time": "1 day, 4:09:01", "remaining_time": "2 days, 6:42:02", "throughput": 29194.93, "total_tokens": 2958661184} +{"current_steps": 10090, "total_steps": 29667, "loss": 0.3625, "lr": 3.527693500662431e-05, "epoch": 1.0203267705337673, "percentage": 34.01, "elapsed_time": "1 day, 4:10:43", "remaining_time": "2 days, 6:40:24", "throughput": 29194.89, "total_tokens": 2961633344} +{"current_steps": 10100, "total_steps": 29667, "loss": 0.3602, "lr": 3.5268158121208294e-05, "epoch": 1.0213380526498752, "percentage": 34.04, "elapsed_time": "1 day, 4:12:25", "remaining_time": "2 days, 6:38:47", "throughput": 29194.66, "total_tokens": 2964599808} +{"current_steps": 10110, "total_steps": 29667, "loss": 0.3525, "lr": 3.525938778358949e-05, "epoch": 1.022349334765983, "percentage": 34.08, "elapsed_time": "1 day, 4:14:02", "remaining_time": "2 days, 6:36:58", "throughput": 29195.8, "total_tokens": 2967523712} +{"current_steps": 10120, "total_steps": 29667, "loss": 0.3612, "lr": 3.5250623985630537e-05, "epoch": 1.0233606168820908, "percentage": 34.11, "elapsed_time": "1 day, 4:15:42", "remaining_time": "2 days, 6:35:18", "throughput": 29196.18, "total_tokens": 2970498560} +{"current_steps": 10130, "total_steps": 29667, "loss": 0.3542, "lr": 3.524186671920826e-05, "epoch": 1.0243718989981987, "percentage": 34.15, "elapsed_time": "1 day, 4:17:19", "remaining_time": "2 days, 6:33:31", "throughput": 29196.84, "total_tokens": 2973402496} +{"current_steps": 10140, "total_steps": 29667, "loss": 0.3587, "lr": 3.523311597621358e-05, "epoch": 1.0253831811143064, "percentage": 34.18, "elapsed_time": "1 day, 4:18:53", "remaining_time": "2 days, 6:31:36", "throughput": 29198.51, "total_tokens": 2976295424} +{"current_steps": 10150, "total_steps": 29667, "loss": 0.3596, "lr": 3.5224371748551505e-05, "epoch": 1.0263944632304143, "percentage": 34.21, "elapsed_time": "1 day, 4:20:31", "remaining_time": "2 days, 6:29:51", "throughput": 29199.28, "total_tokens": 
2979245440} +{"current_steps": 10160, "total_steps": 29667, "loss": 0.3628, "lr": 3.521563402814109e-05, "epoch": 1.0274057453465222, "percentage": 34.25, "elapsed_time": "1 day, 4:22:13", "remaining_time": "2 days, 6:28:14", "throughput": 29199.49, "total_tokens": 2982249792} +{"current_steps": 10170, "total_steps": 29667, "loss": 0.3616, "lr": 3.5206902806915436e-05, "epoch": 1.0284170274626299, "percentage": 34.28, "elapsed_time": "1 day, 4:23:49", "remaining_time": "2 days, 6:26:25", "throughput": 29200.3, "total_tokens": 2985142656} +{"current_steps": 10180, "total_steps": 29667, "loss": 0.3597, "lr": 3.5198178076821644e-05, "epoch": 1.0294283095787378, "percentage": 34.31, "elapsed_time": "1 day, 4:25:24", "remaining_time": "2 days, 6:24:34", "throughput": 29201.66, "total_tokens": 2988047232} +{"current_steps": 10190, "total_steps": 29667, "loss": 0.354, "lr": 3.5189459829820743e-05, "epoch": 1.0304395916948457, "percentage": 34.35, "elapsed_time": "1 day, 4:27:03", "remaining_time": "2 days, 6:22:50", "throughput": 29202.36, "total_tokens": 2990998400} +{"current_steps": 10200, "total_steps": 29667, "loss": 0.36, "lr": 3.5180748057887714e-05, "epoch": 1.0314508738109534, "percentage": 34.38, "elapsed_time": "1 day, 4:28:38", "remaining_time": "2 days, 6:20:59", "throughput": 29203.56, "total_tokens": 2993903552} +{"current_steps": 10210, "total_steps": 29667, "loss": 0.3609, "lr": 3.517204275301144e-05, "epoch": 1.0324621559270613, "percentage": 34.42, "elapsed_time": "1 day, 4:30:14", "remaining_time": "2 days, 6:19:11", "throughput": 29204.77, "total_tokens": 2996842176} +{"current_steps": 10220, "total_steps": 29667, "loss": 0.3605, "lr": 3.5163343907194676e-05, "epoch": 1.0334734380431692, "percentage": 34.45, "elapsed_time": "1 day, 4:31:55", "remaining_time": "2 days, 6:17:30", "throughput": 29204.98, "total_tokens": 2999797888} +{"current_steps": 10230, "total_steps": 29667, "loss": 0.36, "lr": 3.5154651512453995e-05, "epoch": 1.0344847201592768, 
"percentage": 34.48, "elapsed_time": "1 day, 4:33:32", "remaining_time": "2 days, 6:15:43", "throughput": 29205.57, "total_tokens": 3002701312} +{"current_steps": 10240, "total_steps": 29667, "loss": 0.3581, "lr": 3.514596556081981e-05, "epoch": 1.0354960022753847, "percentage": 34.52, "elapsed_time": "1 day, 4:35:10", "remaining_time": "2 days, 6:13:58", "throughput": 29206.29, "total_tokens": 3005634688} +{"current_steps": 10250, "total_steps": 29667, "loss": 0.3561, "lr": 3.513728604433628e-05, "epoch": 1.0365072843914926, "percentage": 34.55, "elapsed_time": "1 day, 4:36:49", "remaining_time": "2 days, 6:12:14", "throughput": 29206.76, "total_tokens": 3008561664} +{"current_steps": 10260, "total_steps": 29667, "loss": 0.3553, "lr": 3.5128612955061334e-05, "epoch": 1.0375185665076003, "percentage": 34.58, "elapsed_time": "1 day, 4:38:28", "remaining_time": "2 days, 6:10:31", "throughput": 29207.39, "total_tokens": 3011518976} +{"current_steps": 10270, "total_steps": 29667, "loss": 0.362, "lr": 3.5119946285066595e-05, "epoch": 1.0385298486237082, "percentage": 34.62, "elapsed_time": "1 day, 4:40:09", "remaining_time": "2 days, 6:08:52", "throughput": 29207.24, "total_tokens": 3014470272} +{"current_steps": 10280, "total_steps": 29667, "loss": 0.3615, "lr": 3.511128602643739e-05, "epoch": 1.0395411307398161, "percentage": 34.65, "elapsed_time": "1 day, 4:41:47", "remaining_time": "2 days, 6:07:07", "throughput": 29207.93, "total_tokens": 3017399552} +{"current_steps": 10290, "total_steps": 29667, "loss": 0.3583, "lr": 3.510263217127269e-05, "epoch": 1.0405524128559238, "percentage": 34.69, "elapsed_time": "1 day, 4:43:26", "remaining_time": "2 days, 6:05:24", "throughput": 29208.12, "total_tokens": 3020320896} +{"current_steps": 10300, "total_steps": 29667, "loss": 0.3608, "lr": 3.50939847116851e-05, "epoch": 1.0415636949720317, "percentage": 34.72, "elapsed_time": "1 day, 4:45:03", "remaining_time": "2 days, 6:03:36", "throughput": 29208.8, "total_tokens": 
3023215680} +{"current_steps": 10310, "total_steps": 29667, "loss": 0.363, "lr": 3.508534363980081e-05, "epoch": 1.0425749770881396, "percentage": 34.75, "elapsed_time": "1 day, 4:46:41", "remaining_time": "2 days, 6:01:51", "throughput": 29209.66, "total_tokens": 3026157632} +{"current_steps": 10320, "total_steps": 29667, "loss": 0.3608, "lr": 3.507670894775958e-05, "epoch": 1.0435862592042473, "percentage": 34.79, "elapsed_time": "1 day, 4:48:18", "remaining_time": "2 days, 6:00:04", "throughput": 29210.45, "total_tokens": 3029079168} +{"current_steps": 10330, "total_steps": 29667, "loss": 0.3636, "lr": 3.506808062771471e-05, "epoch": 1.0445975413203552, "percentage": 34.82, "elapsed_time": "1 day, 4:49:56", "remaining_time": "2 days, 5:58:18", "throughput": 29211.33, "total_tokens": 3032026240} +{"current_steps": 10340, "total_steps": 29667, "loss": 0.3613, "lr": 3.505945867183298e-05, "epoch": 1.045608823436463, "percentage": 34.85, "elapsed_time": "1 day, 4:51:32", "remaining_time": "2 days, 5:56:29", "throughput": 29212.11, "total_tokens": 3034904704} +{"current_steps": 10350, "total_steps": 29667, "loss": 0.3623, "lr": 3.505084307229468e-05, "epoch": 1.0466201055525708, "percentage": 34.89, "elapsed_time": "1 day, 4:53:09", "remaining_time": "2 days, 5:54:44", "throughput": 29212.76, "total_tokens": 3037833920} +{"current_steps": 10360, "total_steps": 29667, "loss": 0.3603, "lr": 3.5042233821293525e-05, "epoch": 1.0476313876686787, "percentage": 34.92, "elapsed_time": "1 day, 4:54:45", "remaining_time": "2 days, 5:52:54", "throughput": 29214.03, "total_tokens": 3040746560} +{"current_steps": 10370, "total_steps": 29667, "loss": 0.3566, "lr": 3.503363091103664e-05, "epoch": 1.0486426697847866, "percentage": 34.95, "elapsed_time": "1 day, 4:56:22", "remaining_time": "2 days, 5:51:08", "throughput": 29214.73, "total_tokens": 3043671744} +{"current_steps": 10380, "total_steps": 29667, "loss": 0.3601, "lr": 3.5025034333744545e-05, "epoch": 1.0496539519008943, 
"percentage": 34.99, "elapsed_time": "1 day, 4:57:59", "remaining_time": "2 days, 5:49:21", "throughput": 29215.63, "total_tokens": 3046593408} +{"current_steps": 10390, "total_steps": 29667, "loss": 0.3568, "lr": 3.501644408165112e-05, "epoch": 1.0506652340170022, "percentage": 35.02, "elapsed_time": "1 day, 4:59:36", "remaining_time": "2 days, 5:47:34", "throughput": 29216.16, "total_tokens": 3049492800} +{"current_steps": 10400, "total_steps": 29667, "loss": 0.3609, "lr": 3.500786014700357e-05, "epoch": 1.05167651613311, "percentage": 35.06, "elapsed_time": "1 day, 5:01:15", "remaining_time": "2 days, 5:45:51", "throughput": 29216.77, "total_tokens": 3052438912} +{"current_steps": 10410, "total_steps": 29667, "loss": 0.3574, "lr": 3.499928252206237e-05, "epoch": 1.0526877982492178, "percentage": 35.09, "elapsed_time": "1 day, 5:02:56", "remaining_time": "2 days, 5:44:11", "throughput": 29216.89, "total_tokens": 3055394752} +{"current_steps": 10420, "total_steps": 29667, "loss": 0.3536, "lr": 3.499071119910131e-05, "epoch": 1.0536990803653257, "percentage": 35.12, "elapsed_time": "1 day, 5:04:35", "remaining_time": "2 days, 5:42:28", "throughput": 29217.55, "total_tokens": 3058359296} +{"current_steps": 10430, "total_steps": 29667, "loss": 0.358, "lr": 3.498214617040739e-05, "epoch": 1.0547103624814336, "percentage": 35.16, "elapsed_time": "1 day, 5:06:14", "remaining_time": "2 days, 5:40:45", "throughput": 29217.72, "total_tokens": 3061272000} +{"current_steps": 10440, "total_steps": 29667, "loss": 0.3625, "lr": 3.49735874282808e-05, "epoch": 1.0557216445975413, "percentage": 35.19, "elapsed_time": "1 day, 5:07:57", "remaining_time": "2 days, 5:39:08", "throughput": 29217.62, "total_tokens": 3064263488} +{"current_steps": 10450, "total_steps": 29667, "loss": 0.3553, "lr": 3.4965034965034965e-05, "epoch": 1.0567329267136492, "percentage": 35.22, "elapsed_time": "1 day, 5:09:39", "remaining_time": "2 days, 5:37:31", "throughput": 29217.59, "total_tokens": 
3067248832} +{"current_steps": 10460, "total_steps": 29667, "loss": 0.3558, "lr": 3.495648877299642e-05, "epoch": 1.057744208829757, "percentage": 35.26, "elapsed_time": "1 day, 5:11:22", "remaining_time": "2 days, 5:35:55", "throughput": 29217.57, "total_tokens": 3070243584} +{"current_steps": 10470, "total_steps": 29667, "loss": 0.3626, "lr": 3.494794884450483e-05, "epoch": 1.0587554909458647, "percentage": 35.29, "elapsed_time": "1 day, 5:12:57", "remaining_time": "2 days, 5:34:04", "throughput": 29218.83, "total_tokens": 3073152384} +{"current_steps": 10480, "total_steps": 29667, "loss": 0.3594, "lr": 3.4939415171912954e-05, "epoch": 1.0597667730619726, "percentage": 35.33, "elapsed_time": "1 day, 5:14:32", "remaining_time": "2 days, 5:32:15", "throughput": 29219.84, "total_tokens": 3076050560} +{"current_steps": 10490, "total_steps": 29667, "loss": 0.3572, "lr": 3.4930887747586616e-05, "epoch": 1.0607780551780805, "percentage": 35.36, "elapsed_time": "1 day, 5:16:14", "remaining_time": "2 days, 5:30:37", "throughput": 29219.48, "total_tokens": 3078984320} +{"current_steps": 10500, "total_steps": 29667, "loss": 0.3585, "lr": 3.492236656390469e-05, "epoch": 1.0617893372941882, "percentage": 35.39, "elapsed_time": "1 day, 5:17:53", "remaining_time": "2 days, 5:28:53", "throughput": 29220.0, "total_tokens": 3081926976} +{"current_steps": 10510, "total_steps": 29667, "loss": 0.3579, "lr": 3.4913851613259034e-05, "epoch": 1.0628006194102961, "percentage": 35.43, "elapsed_time": "1 day, 5:19:30", "remaining_time": "2 days, 5:27:07", "throughput": 29221.08, "total_tokens": 3084888384} +{"current_steps": 10520, "total_steps": 29667, "loss": 0.3649, "lr": 3.490534288805452e-05, "epoch": 1.063811901526404, "percentage": 35.46, "elapsed_time": "1 day, 5:21:06", "remaining_time": "2 days, 5:25:19", "throughput": 29221.92, "total_tokens": 3087786432} +{"current_steps": 10530, "total_steps": 29667, "loss": 0.3594, "lr": 3.489684038070891e-05, "epoch": 1.0648231836425117, 
"percentage": 35.49, "elapsed_time": "1 day, 5:22:44", "remaining_time": "2 days, 5:23:34", "throughput": 29222.37, "total_tokens": 3090698752} +{"current_steps": 10540, "total_steps": 29667, "loss": 0.3616, "lr": 3.488834408365296e-05, "epoch": 1.0658344657586196, "percentage": 35.53, "elapsed_time": "1 day, 5:24:27", "remaining_time": "2 days, 5:21:58", "throughput": 29221.98, "total_tokens": 3093652928} +{"current_steps": 10550, "total_steps": 29667, "loss": 0.3608, "lr": 3.487985398933027e-05, "epoch": 1.0668457478747275, "percentage": 35.56, "elapsed_time": "1 day, 5:26:05", "remaining_time": "2 days, 5:20:13", "throughput": 29222.45, "total_tokens": 3096570688} +{"current_steps": 10560, "total_steps": 29667, "loss": 0.356, "lr": 3.4871370090197324e-05, "epoch": 1.0678570299908352, "percentage": 35.6, "elapsed_time": "1 day, 5:27:43", "remaining_time": "2 days, 5:18:28", "throughput": 29223.43, "total_tokens": 3099534656} +{"current_steps": 10570, "total_steps": 29667, "loss": 0.3591, "lr": 3.486289237872343e-05, "epoch": 1.068868312106943, "percentage": 35.63, "elapsed_time": "1 day, 5:29:20", "remaining_time": "2 days, 5:16:42", "throughput": 29223.9, "total_tokens": 3102430336} +{"current_steps": 10580, "total_steps": 29667, "loss": 0.3571, "lr": 3.485442084739075e-05, "epoch": 1.069879594223051, "percentage": 35.66, "elapsed_time": "1 day, 5:30:57", "remaining_time": "2 days, 5:14:55", "throughput": 29224.67, "total_tokens": 3105349056} +{"current_steps": 10590, "total_steps": 29667, "loss": 0.358, "lr": 3.484595548869416e-05, "epoch": 1.0708908763391587, "percentage": 35.7, "elapsed_time": "1 day, 5:32:42", "remaining_time": "2 days, 5:13:22", "throughput": 29224.4, "total_tokens": 3108368640} +{"current_steps": 10600, "total_steps": 29667, "loss": 0.3623, "lr": 3.4837496295141335e-05, "epoch": 1.0719021584552666, "percentage": 35.73, "elapsed_time": "1 day, 5:34:16", "remaining_time": "2 days, 5:11:31", "throughput": 29225.55, "total_tokens": 3111248704} 
+{"current_steps": 10610, "total_steps": 29667, "loss": 0.3565, "lr": 3.482904325925266e-05, "epoch": 1.0729134405713745, "percentage": 35.76, "elapsed_time": "1 day, 5:35:55", "remaining_time": "2 days, 5:09:48", "throughput": 29226.14, "total_tokens": 3114204096} +{"current_steps": 10620, "total_steps": 29667, "loss": 0.3624, "lr": 3.482059637356124e-05, "epoch": 1.0739247226874822, "percentage": 35.8, "elapsed_time": "1 day, 5:37:35", "remaining_time": "2 days, 5:08:07", "throughput": 29226.16, "total_tokens": 3117131712} +{"current_steps": 10630, "total_steps": 29667, "loss": 0.3586, "lr": 3.481215563061281e-05, "epoch": 1.07493600480359, "percentage": 35.83, "elapsed_time": "1 day, 5:39:11", "remaining_time": "2 days, 5:06:17", "throughput": 29227.29, "total_tokens": 3120046272} +{"current_steps": 10640, "total_steps": 29667, "loss": 0.3599, "lr": 3.4803721022965785e-05, "epoch": 1.075947286919698, "percentage": 35.86, "elapsed_time": "1 day, 5:40:47", "remaining_time": "2 days, 5:04:31", "throughput": 29228.46, "total_tokens": 3123001536} +{"current_steps": 10650, "total_steps": 29667, "loss": 0.3607, "lr": 3.479529254319117e-05, "epoch": 1.0769585690358057, "percentage": 35.9, "elapsed_time": "1 day, 5:42:26", "remaining_time": "2 days, 5:02:46", "throughput": 29229.16, "total_tokens": 3125951168} +{"current_steps": 10660, "total_steps": 29667, "loss": 0.3607, "lr": 3.478687018387257e-05, "epoch": 1.0779698511519136, "percentage": 35.93, "elapsed_time": "1 day, 5:44:04", "remaining_time": "2 days, 5:01:02", "throughput": 29229.72, "total_tokens": 3128883904} +{"current_steps": 10670, "total_steps": 29667, "loss": 0.3586, "lr": 3.477845393760616e-05, "epoch": 1.0789811332680213, "percentage": 35.97, "elapsed_time": "1 day, 5:45:39", "remaining_time": "2 days, 4:59:12", "throughput": 29230.83, "total_tokens": 3131775680} +{"current_steps": 10680, "total_steps": 29667, "loss": 0.3563, "lr": 3.4770043797000614e-05, "epoch": 1.0799924153841292, "percentage": 
36.0, "elapsed_time": "1 day, 5:47:19", "remaining_time": "2 days, 4:57:30", "throughput": 29231.45, "total_tokens": 3134754752} +{"current_steps": 10690, "total_steps": 29667, "loss": 0.3567, "lr": 3.4761639754677146e-05, "epoch": 1.081003697500237, "percentage": 36.03, "elapsed_time": "1 day, 5:48:53", "remaining_time": "2 days, 4:55:39", "throughput": 29232.59, "total_tokens": 3137636032} +{"current_steps": 10700, "total_steps": 29667, "loss": 0.3604, "lr": 3.4753241803269435e-05, "epoch": 1.082014979616345, "percentage": 36.07, "elapsed_time": "1 day, 5:50:29", "remaining_time": "2 days, 4:53:50", "throughput": 29233.63, "total_tokens": 3140547392} +{"current_steps": 10710, "total_steps": 29667, "loss": 0.3566, "lr": 3.474484993542361e-05, "epoch": 1.0830262617324526, "percentage": 36.1, "elapsed_time": "1 day, 5:52:10", "remaining_time": "2 days, 4:52:11", "throughput": 29233.82, "total_tokens": 3143516480} +{"current_steps": 10720, "total_steps": 29667, "loss": 0.3573, "lr": 3.473646414379822e-05, "epoch": 1.0840375438485605, "percentage": 36.13, "elapsed_time": "1 day, 5:53:46", "remaining_time": "2 days, 4:50:24", "throughput": 29234.94, "total_tokens": 3146458176} +{"current_steps": 10730, "total_steps": 29667, "loss": 0.3631, "lr": 3.472808442106422e-05, "epoch": 1.0850488259646682, "percentage": 36.17, "elapsed_time": "1 day, 5:55:25", "remaining_time": "2 days, 4:48:40", "throughput": 29235.58, "total_tokens": 3149409024} +{"current_steps": 10740, "total_steps": 29667, "loss": 0.3553, "lr": 3.4719710759904936e-05, "epoch": 1.0860601080807761, "percentage": 36.2, "elapsed_time": "1 day, 5:57:04", "remaining_time": "2 days, 4:46:58", "throughput": 29236.1, "total_tokens": 3152379328} +{"current_steps": 10750, "total_steps": 29667, "loss": 0.359, "lr": 3.471134315301603e-05, "epoch": 1.087071390196884, "percentage": 36.24, "elapsed_time": "1 day, 5:58:44", "remaining_time": "2 days, 4:45:16", "throughput": 29236.39, "total_tokens": 3155314944} 
+{"current_steps": 10760, "total_steps": 29667, "loss": 0.3629, "lr": 3.470298159310549e-05, "epoch": 1.0880826723129917, "percentage": 36.27, "elapsed_time": "1 day, 6:00:22", "remaining_time": "2 days, 4:43:31", "throughput": 29236.94, "total_tokens": 3158232960} +{"current_steps": 10770, "total_steps": 29667, "loss": 0.3578, "lr": 3.4694626072893585e-05, "epoch": 1.0890939544290996, "percentage": 36.3, "elapsed_time": "1 day, 6:01:57", "remaining_time": "2 days, 4:41:42", "throughput": 29237.89, "total_tokens": 3161123968} +{"current_steps": 10780, "total_steps": 29667, "loss": 0.3584, "lr": 3.468627658511285e-05, "epoch": 1.0901052365452075, "percentage": 36.34, "elapsed_time": "1 day, 6:03:35", "remaining_time": "2 days, 4:39:57", "throughput": 29238.5, "total_tokens": 3164050624} +{"current_steps": 10790, "total_steps": 29667, "loss": 0.356, "lr": 3.467793312250806e-05, "epoch": 1.0911165186613152, "percentage": 36.37, "elapsed_time": "1 day, 6:05:14", "remaining_time": "2 days, 4:38:15", "throughput": 29238.88, "total_tokens": 3167000832} +{"current_steps": 10800, "total_steps": 29667, "loss": 0.3637, "lr": 3.466959567783619e-05, "epoch": 1.092127800777423, "percentage": 36.4, "elapsed_time": "1 day, 6:06:55", "remaining_time": "2 days, 4:36:35", "throughput": 29238.91, "total_tokens": 3169950656} +{"current_steps": 10810, "total_steps": 29667, "loss": 0.3646, "lr": 3.466126424386642e-05, "epoch": 1.093139082893531, "percentage": 36.44, "elapsed_time": "1 day, 6:08:35", "remaining_time": "2 days, 4:34:54", "throughput": 29239.3, "total_tokens": 3172912640} +{"current_steps": 10820, "total_steps": 29667, "loss": 0.3588, "lr": 3.4652938813380056e-05, "epoch": 1.0941503650096387, "percentage": 36.47, "elapsed_time": "1 day, 6:10:14", "remaining_time": "2 days, 4:33:11", "throughput": 29239.77, "total_tokens": 3175862336} +{"current_steps": 10830, "total_steps": 29667, "loss": 0.3572, "lr": 3.464461937917057e-05, "epoch": 1.0951616471257466, "percentage": 36.51, 
"elapsed_time": "1 day, 6:11:50", "remaining_time": "2 days, 4:31:23", "throughput": 29240.65, "total_tokens": 3178765248} +{"current_steps": 10840, "total_steps": 29667, "loss": 0.3605, "lr": 3.4636305934043525e-05, "epoch": 1.0961729292418545, "percentage": 36.54, "elapsed_time": "1 day, 6:13:26", "remaining_time": "2 days, 4:29:36", "throughput": 29241.53, "total_tokens": 3181676736} +{"current_steps": 10850, "total_steps": 29667, "loss": 0.359, "lr": 3.4627998470816544e-05, "epoch": 1.0971842113579622, "percentage": 36.57, "elapsed_time": "1 day, 6:15:04", "remaining_time": "2 days, 4:27:51", "throughput": 29242.22, "total_tokens": 3184615744} +{"current_steps": 10860, "total_steps": 29667, "loss": 0.3592, "lr": 3.4619696982319334e-05, "epoch": 1.09819549347407, "percentage": 36.61, "elapsed_time": "1 day, 6:16:41", "remaining_time": "2 days, 4:26:04", "throughput": 29243.27, "total_tokens": 3187548096} +{"current_steps": 10870, "total_steps": 29667, "loss": 0.3583, "lr": 3.461140146139361e-05, "epoch": 1.099206775590178, "percentage": 36.64, "elapsed_time": "1 day, 6:18:17", "remaining_time": "2 days, 4:24:17", "throughput": 29244.11, "total_tokens": 3190470080} +{"current_steps": 10880, "total_steps": 29667, "loss": 0.3616, "lr": 3.460311190089309e-05, "epoch": 1.1002180577062857, "percentage": 36.67, "elapsed_time": "1 day, 6:19:57", "remaining_time": "2 days, 4:22:35", "throughput": 29244.53, "total_tokens": 3193417280} +{"current_steps": 10890, "total_steps": 29667, "loss": 0.3576, "lr": 3.459482829368348e-05, "epoch": 1.1012293398223936, "percentage": 36.71, "elapsed_time": "1 day, 6:21:36", "remaining_time": "2 days, 4:20:53", "throughput": 29245.03, "total_tokens": 3196374656} +{"current_steps": 10900, "total_steps": 29667, "loss": 0.3603, "lr": 3.4586550632642425e-05, "epoch": 1.1022406219385015, "percentage": 36.74, "elapsed_time": "1 day, 6:23:13", "remaining_time": "2 days, 4:19:07", "throughput": 29245.69, "total_tokens": 3199289280} 
+{"current_steps": 10910, "total_steps": 29667, "loss": 0.3606, "lr": 3.457827891065949e-05, "epoch": 1.1032519040546092, "percentage": 36.77, "elapsed_time": "1 day, 6:24:51", "remaining_time": "2 days, 4:17:22", "throughput": 29246.25, "total_tokens": 3202214848} +{"current_steps": 10920, "total_steps": 29667, "loss": 0.3578, "lr": 3.457001312063614e-05, "epoch": 1.104263186170717, "percentage": 36.81, "elapsed_time": "1 day, 6:26:29", "remaining_time": "2 days, 4:15:38", "throughput": 29247.07, "total_tokens": 3205175040} +{"current_steps": 10930, "total_steps": 29667, "loss": 0.3562, "lr": 3.45617532554857e-05, "epoch": 1.105274468286825, "percentage": 36.84, "elapsed_time": "1 day, 6:28:08", "remaining_time": "2 days, 4:13:55", "throughput": 29247.49, "total_tokens": 3208103744} +{"current_steps": 10940, "total_steps": 29667, "loss": 0.3577, "lr": 3.455349930813339e-05, "epoch": 1.1062857504029326, "percentage": 36.88, "elapsed_time": "1 day, 6:29:45", "remaining_time": "2 days, 4:12:10", "throughput": 29248.65, "total_tokens": 3211087360} +{"current_steps": 10950, "total_steps": 29667, "loss": 0.3593, "lr": 3.45452512715162e-05, "epoch": 1.1072970325190405, "percentage": 36.91, "elapsed_time": "1 day, 6:31:22", "remaining_time": "2 days, 4:10:23", "throughput": 29249.29, "total_tokens": 3213987712} +{"current_steps": 10960, "total_steps": 29667, "loss": 0.3588, "lr": 3.4537009138582935e-05, "epoch": 1.1083083146351485, "percentage": 36.94, "elapsed_time": "1 day, 6:33:00", "remaining_time": "2 days, 4:08:39", "throughput": 29249.95, "total_tokens": 3216923072} +{"current_steps": 10970, "total_steps": 29667, "loss": 0.3579, "lr": 3.4528772902294174e-05, "epoch": 1.1093195967512561, "percentage": 36.98, "elapsed_time": "1 day, 6:34:35", "remaining_time": "2 days, 4:06:50", "throughput": 29250.82, "total_tokens": 3219806784} +{"current_steps": 10980, "total_steps": 29667, "loss": 0.3538, "lr": 3.452054255562222e-05, "epoch": 1.110330878867364, "percentage": 
37.01, "elapsed_time": "1 day, 6:36:15", "remaining_time": "2 days, 4:05:08", "throughput": 29251.25, "total_tokens": 3222762048} +{"current_steps": 10990, "total_steps": 29667, "loss": 0.3551, "lr": 3.451231809155115e-05, "epoch": 1.111342160983472, "percentage": 37.04, "elapsed_time": "1 day, 6:37:51", "remaining_time": "2 days, 4:03:21", "throughput": 29251.93, "total_tokens": 3225660608} +{"current_steps": 11000, "total_steps": 29667, "loss": 0.3591, "lr": 3.450409950307666e-05, "epoch": 1.1123534430995796, "percentage": 37.08, "elapsed_time": "1 day, 6:39:28", "remaining_time": "2 days, 4:01:35", "throughput": 29252.53, "total_tokens": 3228558336} +{"current_steps": 11010, "total_steps": 29667, "loss": 0.3614, "lr": 3.449588678320619e-05, "epoch": 1.1133647252156875, "percentage": 37.11, "elapsed_time": "1 day, 6:41:06", "remaining_time": "2 days, 3:59:51", "throughput": 29253.1, "total_tokens": 3231491904} +{"current_steps": 11020, "total_steps": 29667, "loss": 0.3585, "lr": 3.4487679924958767e-05, "epoch": 1.1143760073317954, "percentage": 37.15, "elapsed_time": "1 day, 6:42:46", "remaining_time": "2 days, 3:58:10", "throughput": 29253.31, "total_tokens": 3234443968} +{"current_steps": 11030, "total_steps": 29667, "loss": 0.3598, "lr": 3.4479478921365076e-05, "epoch": 1.115387289447903, "percentage": 37.18, "elapsed_time": "1 day, 6:44:22", "remaining_time": "2 days, 3:56:22", "throughput": 29254.59, "total_tokens": 3237387456} +{"current_steps": 11040, "total_steps": 29667, "loss": 0.3563, "lr": 3.447128376546738e-05, "epoch": 1.116398571564011, "percentage": 37.21, "elapsed_time": "1 day, 6:46:00", "remaining_time": "2 days, 3:54:38", "throughput": 29255.02, "total_tokens": 3240308608} +{"current_steps": 11050, "total_steps": 29667, "loss": 0.3577, "lr": 3.4463094450319505e-05, "epoch": 1.117409853680119, "percentage": 37.25, "elapsed_time": "1 day, 6:47:40", "remaining_time": "2 days, 3:52:57", "throughput": 29255.11, "total_tokens": 3243232448} 
+{"current_steps": 11060, "total_steps": 29667, "loss": 0.3596, "lr": 3.4454910968986855e-05, "epoch": 1.1184211357962266, "percentage": 37.28, "elapsed_time": "1 day, 6:49:21", "remaining_time": "2 days, 3:51:17", "throughput": 29255.3, "total_tokens": 3246206592} +{"current_steps": 11070, "total_steps": 29667, "loss": 0.3558, "lr": 3.4446733314546336e-05, "epoch": 1.1194324179123345, "percentage": 37.31, "elapsed_time": "1 day, 6:50:54", "remaining_time": "2 days, 3:49:25", "throughput": 29256.76, "total_tokens": 3249096960} +{"current_steps": 11080, "total_steps": 29667, "loss": 0.3622, "lr": 3.443856148008633e-05, "epoch": 1.1204437000284424, "percentage": 37.35, "elapsed_time": "1 day, 6:52:30", "remaining_time": "2 days, 3:47:38", "throughput": 29257.44, "total_tokens": 3251980224} +{"current_steps": 11090, "total_steps": 29667, "loss": 0.3604, "lr": 3.443039545870672e-05, "epoch": 1.12145498214455, "percentage": 37.38, "elapsed_time": "1 day, 6:54:07", "remaining_time": "2 days, 3:45:52", "throughput": 29257.98, "total_tokens": 3254878592} +{"current_steps": 11100, "total_steps": 29667, "loss": 0.3592, "lr": 3.442223524351883e-05, "epoch": 1.122466264260658, "percentage": 37.42, "elapsed_time": "1 day, 6:55:39", "remaining_time": "2 days, 3:43:57", "throughput": 29259.47, "total_tokens": 3257729856} +{"current_steps": 11110, "total_steps": 29667, "loss": 0.3575, "lr": 3.44140808276454e-05, "epoch": 1.123477546376766, "percentage": 37.45, "elapsed_time": "1 day, 6:57:16", "remaining_time": "2 days, 3:42:12", "throughput": 29260.17, "total_tokens": 3260653568} +{"current_steps": 11120, "total_steps": 29667, "loss": 0.355, "lr": 3.4405932204220575e-05, "epoch": 1.1244888284928736, "percentage": 37.48, "elapsed_time": "1 day, 6:58:53", "remaining_time": "2 days, 3:40:25", "throughput": 29261.07, "total_tokens": 3263583744} +{"current_steps": 11130, "total_steps": 29667, "loss": 0.3604, "lr": 3.4397789366389876e-05, "epoch": 1.1255001106089815, "percentage": 
37.52, "elapsed_time": "1 day, 7:00:31", "remaining_time": "2 days, 3:38:42", "throughput": 29261.42, "total_tokens": 3266499648} +{"current_steps": 11140, "total_steps": 29667, "loss": 0.3584, "lr": 3.438965230731016e-05, "epoch": 1.1265113927250892, "percentage": 37.55, "elapsed_time": "1 day, 7:02:08", "remaining_time": "2 days, 3:36:55", "throughput": 29262.15, "total_tokens": 3269409344} +{"current_steps": 11150, "total_steps": 29667, "loss": 0.3571, "lr": 3.438152102014964e-05, "epoch": 1.127522674841197, "percentage": 37.58, "elapsed_time": "1 day, 7:03:49", "remaining_time": "2 days, 3:35:17", "throughput": 29262.54, "total_tokens": 3272411648} +{"current_steps": 11160, "total_steps": 29667, "loss": 0.3596, "lr": 3.437339549808778e-05, "epoch": 1.128533956957305, "percentage": 37.62, "elapsed_time": "1 day, 7:05:29", "remaining_time": "2 days, 3:33:35", "throughput": 29262.87, "total_tokens": 3275368512} +{"current_steps": 11170, "total_steps": 29667, "loss": 0.3595, "lr": 3.43652757343154e-05, "epoch": 1.1295452390734129, "percentage": 37.65, "elapsed_time": "1 day, 7:07:06", "remaining_time": "2 days, 3:31:51", "throughput": 29263.34, "total_tokens": 3278280000} +{"current_steps": 11180, "total_steps": 29667, "loss": 0.3632, "lr": 3.435716172203449e-05, "epoch": 1.1305565211895205, "percentage": 37.68, "elapsed_time": "1 day, 7:08:43", "remaining_time": "2 days, 3:30:04", "throughput": 29263.95, "total_tokens": 3281164480} +{"current_steps": 11190, "total_steps": 29667, "loss": 0.3633, "lr": 3.434905345445833e-05, "epoch": 1.1315678033056285, "percentage": 37.72, "elapsed_time": "1 day, 7:10:20", "remaining_time": "2 days, 3:28:18", "throughput": 29264.64, "total_tokens": 3284081024} +{"current_steps": 11200, "total_steps": 29667, "loss": 0.3609, "lr": 3.4340950924811374e-05, "epoch": 1.1325790854217361, "percentage": 37.75, "elapsed_time": "1 day, 7:11:58", "remaining_time": "2 days, 3:26:34", "throughput": 29265.04, "total_tokens": 3287000576} 
+{"current_steps": 11210, "total_steps": 29667, "loss": 0.3585, "lr": 3.433285412632927e-05, "epoch": 1.133590367537844, "percentage": 37.79, "elapsed_time": "1 day, 7:13:36", "remaining_time": "2 days, 3:24:51", "throughput": 29265.46, "total_tokens": 3289920576} +{"current_steps": 11220, "total_steps": 29667, "loss": 0.3584, "lr": 3.4324763052258835e-05, "epoch": 1.134601649653952, "percentage": 37.82, "elapsed_time": "1 day, 7:15:14", "remaining_time": "2 days, 3:23:06", "throughput": 29266.14, "total_tokens": 3292856000} +{"current_steps": 11230, "total_steps": 29667, "loss": 0.3633, "lr": 3.4316677695858003e-05, "epoch": 1.1356129317700598, "percentage": 37.85, "elapsed_time": "1 day, 7:16:51", "remaining_time": "2 days, 3:21:21", "throughput": 29266.82, "total_tokens": 3295783360} +{"current_steps": 11240, "total_steps": 29667, "loss": 0.3606, "lr": 3.430859805039583e-05, "epoch": 1.1366242138861675, "percentage": 37.89, "elapsed_time": "1 day, 7:18:27", "remaining_time": "2 days, 3:19:34", "throughput": 29268.01, "total_tokens": 3298732480} +{"current_steps": 11250, "total_steps": 29667, "loss": 0.3586, "lr": 3.430052410915246e-05, "epoch": 1.1376354960022754, "percentage": 37.92, "elapsed_time": "1 day, 7:23:06", "remaining_time": "2 days, 3:22:46", "throughput": 29221.76, "total_tokens": 3301671424} +{"current_steps": 11260, "total_steps": 29667, "loss": 0.3609, "lr": 3.4292455865419086e-05, "epoch": 1.138646778118383, "percentage": 37.95, "elapsed_time": "1 day, 7:27:24", "remaining_time": "2 days, 3:25:23", "throughput": 29181.18, "total_tokens": 3304605632} +{"current_steps": 11270, "total_steps": 29667, "loss": 0.3616, "lr": 3.4284393312497973e-05, "epoch": 1.139658060234491, "percentage": 37.99, "elapsed_time": "1 day, 7:31:48", "remaining_time": "2 days, 3:28:10", "throughput": 29138.66, "total_tokens": 3307496128} +{"current_steps": 11280, "total_steps": 29667, "loss": 0.3581, "lr": 3.427633644370238e-05, "epoch": 1.140669342350599, "percentage": 
38.02, "elapsed_time": "1 day, 7:35:52", "remaining_time": "2 days, 3:30:22", "throughput": 29102.34, "total_tokens": 3310465472} +{"current_steps": 11290, "total_steps": 29667, "loss": 0.3555, "lr": 3.4268285252356564e-05, "epoch": 1.1416806244667068, "percentage": 38.06, "elapsed_time": "1 day, 7:39:36", "remaining_time": "2 days, 3:32:02", "throughput": 29071.13, "total_tokens": 3313432960} +{"current_steps": 11300, "total_steps": 29667, "loss": 0.3572, "lr": 3.426023973179575e-05, "epoch": 1.1426919065828145, "percentage": 38.09, "elapsed_time": "1 day, 7:42:46", "remaining_time": "2 days, 3:32:45", "throughput": 29048.51, "total_tokens": 3316364736} +{"current_steps": 11310, "total_steps": 29667, "loss": 0.3584, "lr": 3.425219987536614e-05, "epoch": 1.1437031886989224, "percentage": 38.12, "elapsed_time": "1 day, 7:45:25", "remaining_time": "2 days, 3:32:39", "throughput": 29033.77, "total_tokens": 3319311488} +{"current_steps": 11320, "total_steps": 29667, "loss": 0.356, "lr": 3.4244165676424815e-05, "epoch": 1.14471447081503, "percentage": 38.16, "elapsed_time": "1 day, 7:48:04", "remaining_time": "2 days, 3:32:31", "throughput": 29019.74, "total_tokens": 3322304192} +{"current_steps": 11330, "total_steps": 29667, "loss": 0.3554, "lr": 3.423613712833979e-05, "epoch": 1.145725752931138, "percentage": 38.19, "elapsed_time": "1 day, 7:50:24", "remaining_time": "2 days, 3:31:53", "throughput": 29009.85, "total_tokens": 3325231936} +{"current_steps": 11340, "total_steps": 29667, "loss": 0.3554, "lr": 3.422811422448995e-05, "epoch": 1.146737035047246, "percentage": 38.22, "elapsed_time": "1 day, 7:54:28", "remaining_time": "2 days, 3:34:03", "throughput": 28973.84, "total_tokens": 3328175808} +{"current_steps": 11350, "total_steps": 29667, "loss": 0.3549, "lr": 3.422009695826503e-05, "epoch": 1.1477483171633536, "percentage": 38.26, "elapsed_time": "1 day, 7:59:13", "remaining_time": "2 days, 3:37:18", "throughput": 28928.3, "total_tokens": 3331194496} 
+{"current_steps": 11360, "total_steps": 29667, "loss": 0.3604, "lr": 3.4212085323065626e-05, "epoch": 1.1487595992794615, "percentage": 38.29, "elapsed_time": "1 day, 8:03:54", "remaining_time": "2 days, 3:40:25", "throughput": 28883.76, "total_tokens": 3334168704} +{"current_steps": 11370, "total_steps": 29667, "loss": 0.3592, "lr": 3.4204079312303103e-05, "epoch": 1.1497708813955694, "percentage": 38.33, "elapsed_time": "1 day, 8:07:45", "remaining_time": "2 days, 3:42:12", "throughput": 28851.26, "total_tokens": 3337083264} +{"current_steps": 11380, "total_steps": 29667, "loss": 0.3615, "lr": 3.419607891939964e-05, "epoch": 1.150782163511677, "percentage": 38.36, "elapsed_time": "1 day, 8:12:23", "remaining_time": "2 days, 3:45:15", "throughput": 28807.4, "total_tokens": 3340041664} +{"current_steps": 11390, "total_steps": 29667, "loss": 0.3594, "lr": 3.4188084137788166e-05, "epoch": 1.151793445627785, "percentage": 38.39, "elapsed_time": "1 day, 8:17:08", "remaining_time": "2 days, 3:48:26", "throughput": 28762.15, "total_tokens": 3342974720} +{"current_steps": 11400, "total_steps": 29667, "loss": 0.3558, "lr": 3.418009496091238e-05, "epoch": 1.1528047277438929, "percentage": 38.43, "elapsed_time": "1 day, 8:22:04", "remaining_time": "2 days, 3:51:55", "throughput": 28714.27, "total_tokens": 3345926464} +{"current_steps": 11410, "total_steps": 29667, "loss": 0.3554, "lr": 3.417211138222666e-05, "epoch": 1.1538160098600005, "percentage": 38.46, "elapsed_time": "1 day, 8:26:10", "remaining_time": "2 days, 3:54:03", "throughput": 28679.25, "total_tokens": 3348896192} +{"current_steps": 11420, "total_steps": 29667, "loss": 0.359, "lr": 3.416413339519612e-05, "epoch": 1.1548272919761084, "percentage": 38.49, "elapsed_time": "1 day, 8:30:19", "remaining_time": "2 days, 3:56:15", "throughput": 28643.15, "total_tokens": 3351811200} +{"current_steps": 11430, "total_steps": 29667, "loss": 0.3615, "lr": 3.4156160993296524e-05, "epoch": 1.1558385740922164, "percentage": 
38.53, "elapsed_time": "1 day, 8:33:53", "remaining_time": "2 days, 3:57:30", "throughput": 28616.34, "total_tokens": 3354791552} +{"current_steps": 11440, "total_steps": 29667, "loss": 0.3574, "lr": 3.4148194170014295e-05, "epoch": 1.156849856208324, "percentage": 38.56, "elapsed_time": "1 day, 8:37:17", "remaining_time": "2 days, 3:58:30", "throughput": 28591.3, "total_tokens": 3357704000} +{"current_steps": 11450, "total_steps": 29667, "loss": 0.3619, "lr": 3.4140232918846484e-05, "epoch": 1.157861138324432, "percentage": 38.6, "elapsed_time": "1 day, 8:40:55", "remaining_time": "2 days, 3:59:49", "throughput": 28563.49, "total_tokens": 3360641920} +{"current_steps": 11460, "total_steps": 29667, "loss": 0.3574, "lr": 3.4132277233300753e-05, "epoch": 1.1588724204405398, "percentage": 38.63, "elapsed_time": "1 day, 8:44:25", "remaining_time": "2 days, 4:00:58", "throughput": 28537.65, "total_tokens": 3363617152} +{"current_steps": 11470, "total_steps": 29667, "loss": 0.3574, "lr": 3.4124327106895356e-05, "epoch": 1.1598837025566475, "percentage": 38.66, "elapsed_time": "1 day, 8:47:44", "remaining_time": "2 days, 4:01:48", "throughput": 28514.57, "total_tokens": 3366569728} +{"current_steps": 11480, "total_steps": 29667, "loss": 0.3593, "lr": 3.4116382533159097e-05, "epoch": 1.1608949846727554, "percentage": 38.7, "elapsed_time": "1 day, 8:50:52", "remaining_time": "2 days, 4:02:19", "throughput": 28493.78, "total_tokens": 3369455744} +{"current_steps": 11490, "total_steps": 29667, "loss": 0.3571, "lr": 3.4108443505631335e-05, "epoch": 1.1619062667888633, "percentage": 38.73, "elapsed_time": "1 day, 8:54:23", "remaining_time": "2 days, 4:03:27", "throughput": 28468.23, "total_tokens": 3372440896} +{"current_steps": 11500, "total_steps": 29667, "loss": 0.3546, "lr": 3.410051001786192e-05, "epoch": 1.162917548904971, "percentage": 38.76, "elapsed_time": "1 day, 8:57:14", "remaining_time": "2 days, 4:03:32", "throughput": 28451.4, "total_tokens": 3375328896} 
+{"current_steps": 11510, "total_steps": 29667, "loss": 0.3619, "lr": 3.409258206341124e-05, "epoch": 1.163928831021079, "percentage": 38.8, "elapsed_time": "1 day, 9:00:00", "remaining_time": "2 days, 4:03:26", "throughput": 28436.22, "total_tokens": 3378226432} +{"current_steps": 11520, "total_steps": 29667, "loss": 0.3547, "lr": 3.4084659635850134e-05, "epoch": 1.1649401131371868, "percentage": 38.83, "elapsed_time": "1 day, 9:02:56", "remaining_time": "2 days, 4:03:39", "throughput": 28418.73, "total_tokens": 3381170816} +{"current_steps": 11530, "total_steps": 29667, "loss": 0.3597, "lr": 3.40767427287599e-05, "epoch": 1.1659513952532945, "percentage": 38.86, "elapsed_time": "1 day, 9:05:47", "remaining_time": "2 days, 4:03:42", "throughput": 28402.74, "total_tokens": 3384127616} +{"current_steps": 11540, "total_steps": 29667, "loss": 0.3596, "lr": 3.406883133573224e-05, "epoch": 1.1669626773694024, "percentage": 38.9, "elapsed_time": "1 day, 9:08:40", "remaining_time": "2 days, 4:03:47", "throughput": 28386.11, "total_tokens": 3387035968} +{"current_steps": 11550, "total_steps": 29667, "loss": 0.3601, "lr": 3.406092545036932e-05, "epoch": 1.1679739594855103, "percentage": 38.93, "elapsed_time": "1 day, 9:11:31", "remaining_time": "2 days, 4:03:51", "throughput": 28369.67, "total_tokens": 3389946688} +{"current_steps": 11560, "total_steps": 29667, "loss": 0.3577, "lr": 3.405302506628365e-05, "epoch": 1.168985241601618, "percentage": 38.97, "elapsed_time": "1 day, 9:14:30", "remaining_time": "2 days, 4:04:06", "throughput": 28351.73, "total_tokens": 3392876864} +{"current_steps": 11570, "total_steps": 29667, "loss": 0.3596, "lr": 3.404513017709813e-05, "epoch": 1.169996523717726, "percentage": 39.0, "elapsed_time": "1 day, 9:17:14", "remaining_time": "2 days, 4:03:56", "throughput": 28337.8, "total_tokens": 3395847552} +{"current_steps": 11580, "total_steps": 29667, "loss": 0.3621, "lr": 3.403724077644598e-05, "epoch": 1.1710078058338338, "percentage": 39.03, 
"elapsed_time": "1 day, 9:20:02", "remaining_time": "2 days, 4:03:53", "throughput": 28322.63, "total_tokens": 3398784192} +{"current_steps": 11590, "total_steps": 29667, "loss": 0.3583, "lr": 3.402935685797077e-05, "epoch": 1.1720190879499415, "percentage": 39.07, "elapsed_time": "1 day, 9:22:50", "remaining_time": "2 days, 4:03:49", "throughput": 28308.29, "total_tokens": 3401806912} +{"current_steps": 11600, "total_steps": 29667, "loss": 0.3597, "lr": 3.4021478415326355e-05, "epoch": 1.1730303700660494, "percentage": 39.1, "elapsed_time": "1 day, 9:25:52", "remaining_time": "2 days, 4:04:09", "throughput": 28289.58, "total_tokens": 3404736064} +{"current_steps": 11610, "total_steps": 29667, "loss": 0.3544, "lr": 3.401360544217687e-05, "epoch": 1.1740416521821573, "percentage": 39.13, "elapsed_time": "1 day, 9:28:39", "remaining_time": "2 days, 4:04:03", "throughput": 28274.63, "total_tokens": 3407649024} +{"current_steps": 11620, "total_steps": 29667, "loss": 0.3626, "lr": 3.400573793219672e-05, "epoch": 1.175052934298265, "percentage": 39.17, "elapsed_time": "1 day, 9:31:09", "remaining_time": "2 days, 4:03:31", "throughput": 28263.68, "total_tokens": 3410559936} +{"current_steps": 11630, "total_steps": 29667, "loss": 0.364, "lr": 3.3997875879070546e-05, "epoch": 1.1760642164143729, "percentage": 39.2, "elapsed_time": "1 day, 9:33:47", "remaining_time": "2 days, 4:03:12", "throughput": 28250.66, "total_tokens": 3413466688} +{"current_steps": 11640, "total_steps": 29667, "loss": 0.3585, "lr": 3.399001927649318e-05, "epoch": 1.1770754985304808, "percentage": 39.24, "elapsed_time": "1 day, 9:36:37", "remaining_time": "2 days, 4:03:10", "throughput": 28234.89, "total_tokens": 3416355584} +{"current_steps": 11650, "total_steps": 29667, "loss": 0.3558, "lr": 3.398216811816968e-05, "epoch": 1.1780867806465884, "percentage": 39.27, "elapsed_time": "1 day, 9:39:32", "remaining_time": "2 days, 4:03:16", "throughput": 28218.17, "total_tokens": 3419278208} 
+{"current_steps": 11660, "total_steps": 29667, "loss": 0.3546, "lr": 3.397432239781527e-05, "epoch": 1.1790980627626964, "percentage": 39.3, "elapsed_time": "1 day, 9:42:44", "remaining_time": "2 days, 4:03:48", "throughput": 28197.84, "total_tokens": 3422220736} +{"current_steps": 11670, "total_steps": 29667, "loss": 0.3525, "lr": 3.396648210915531e-05, "epoch": 1.180109344878804, "percentage": 39.34, "elapsed_time": "1 day, 9:46:31", "remaining_time": "2 days, 4:05:14", "throughput": 28169.32, "total_tokens": 3425162944} +{"current_steps": 11680, "total_steps": 29667, "loss": 0.366, "lr": 3.3958647245925315e-05, "epoch": 1.181120626994912, "percentage": 39.37, "elapsed_time": "1 day, 9:48:47", "remaining_time": "2 days, 4:04:17", "throughput": 28162.17, "total_tokens": 3428098816} +{"current_steps": 11690, "total_steps": 29667, "loss": 0.3576, "lr": 3.3950817801870885e-05, "epoch": 1.1821319091110198, "percentage": 39.4, "elapsed_time": "1 day, 9:51:32", "remaining_time": "2 days, 4:04:08", "throughput": 28147.43, "total_tokens": 3430972352} +{"current_steps": 11700, "total_steps": 29667, "loss": 0.3576, "lr": 3.3942993770747735e-05, "epoch": 1.1831431912271277, "percentage": 39.44, "elapsed_time": "1 day, 9:54:51", "remaining_time": "2 days, 4:04:48", "throughput": 28125.37, "total_tokens": 3433871168} +{"current_steps": 11710, "total_steps": 29667, "loss": 0.362, "lr": 3.3935175146321626e-05, "epoch": 1.1841544733432354, "percentage": 39.47, "elapsed_time": "1 day, 9:57:41", "remaining_time": "2 days, 4:04:44", "throughput": 28110.24, "total_tokens": 3436796736} +{"current_steps": 11720, "total_steps": 29667, "loss": 0.3518, "lr": 3.392736192236839e-05, "epoch": 1.1851657554593433, "percentage": 39.51, "elapsed_time": "1 day, 10:01:44", "remaining_time": "2 days, 4:06:33", "throughput": 28078.53, "total_tokens": 3439756864} +{"current_steps": 11730, "total_steps": 29667, "loss": 0.3561, "lr": 3.391955409267387e-05, "epoch": 1.186177037575451, "percentage": 
39.54, "elapsed_time": "1 day, 10:06:50", "remaining_time": "2 days, 4:09:56", "throughput": 28032.23, "total_tokens": 3442659712} +{"current_steps": 11740, "total_steps": 29667, "loss": 0.3581, "lr": 3.3911751651033896e-05, "epoch": 1.187188319691559, "percentage": 39.57, "elapsed_time": "1 day, 10:10:31", "remaining_time": "2 days, 4:11:09", "throughput": 28006.09, "total_tokens": 3445629184} +{"current_steps": 11750, "total_steps": 29667, "loss": 0.3626, "lr": 3.3903954591254334e-05, "epoch": 1.1881996018076668, "percentage": 39.61, "elapsed_time": "1 day, 10:14:30", "remaining_time": "2 days, 4:12:48", "throughput": 27975.79, "total_tokens": 3448578112} +{"current_steps": 11760, "total_steps": 29667, "loss": 0.3615, "lr": 3.389616290715097e-05, "epoch": 1.1892108839237747, "percentage": 39.64, "elapsed_time": "1 day, 10:17:46", "remaining_time": "2 days, 4:13:22", "throughput": 27954.84, "total_tokens": 3451482496} +{"current_steps": 11770, "total_steps": 29667, "loss": 0.3595, "lr": 3.388837659254955e-05, "epoch": 1.1902221660398824, "percentage": 39.67, "elapsed_time": "1 day, 10:21:14", "remaining_time": "2 days, 4:14:14", "throughput": 27931.6, "total_tokens": 3454431680} +{"current_steps": 11780, "total_steps": 29667, "loss": 0.3559, "lr": 3.3880595641285746e-05, "epoch": 1.1912334481559903, "percentage": 39.71, "elapsed_time": "1 day, 10:24:26", "remaining_time": "2 days, 4:14:41", "throughput": 27911.77, "total_tokens": 3457340992} +{"current_steps": 11790, "total_steps": 29667, "loss": 0.3578, "lr": 3.387282004720513e-05, "epoch": 1.192244730272098, "percentage": 39.74, "elapsed_time": "1 day, 10:27:27", "remaining_time": "2 days, 4:14:51", "throughput": 27894.56, "total_tokens": 3460257536} +{"current_steps": 11800, "total_steps": 29667, "loss": 0.3563, "lr": 3.386504980416316e-05, "epoch": 1.1932560123882059, "percentage": 39.77, "elapsed_time": "1 day, 10:31:01", "remaining_time": "2 days, 4:15:50", "throughput": 27870.28, "total_tokens": 3463204544} 
+{"current_steps": 11810, "total_steps": 29667, "loss": 0.3585, "lr": 3.385728490602515e-05, "epoch": 1.1942672945043138, "percentage": 39.81, "elapsed_time": "1 day, 10:34:41", "remaining_time": "2 days, 4:16:59", "throughput": 27844.37, "total_tokens": 3466119552} +{"current_steps": 11820, "total_steps": 29667, "loss": 0.3566, "lr": 3.384952534666625e-05, "epoch": 1.1952785766204217, "percentage": 39.84, "elapsed_time": "1 day, 10:38:24", "remaining_time": "2 days, 4:18:10", "throughput": 27818.1, "total_tokens": 3469033728} +{"current_steps": 11830, "total_steps": 29667, "loss": 0.3601, "lr": 3.3841771119971455e-05, "epoch": 1.1962898587365294, "percentage": 39.88, "elapsed_time": "1 day, 10:41:52", "remaining_time": "2 days, 4:18:59", "throughput": 27795.48, "total_tokens": 3471994816} +{"current_steps": 11840, "total_steps": 29667, "loss": 0.3598, "lr": 3.383402221983554e-05, "epoch": 1.1973011408526373, "percentage": 39.91, "elapsed_time": "1 day, 10:44:38", "remaining_time": "2 days, 4:18:45", "throughput": 27782.13, "total_tokens": 3474947392} +{"current_steps": 11850, "total_steps": 29667, "loss": 0.3647, "lr": 3.3826278640163064e-05, "epoch": 1.198312422968745, "percentage": 39.94, "elapsed_time": "1 day, 10:47:38", "remaining_time": "2 days, 4:18:52", "throughput": 27765.62, "total_tokens": 3477885440} +{"current_steps": 11860, "total_steps": 29667, "loss": 0.3572, "lr": 3.3818540374868354e-05, "epoch": 1.1993237050848529, "percentage": 39.98, "elapsed_time": "1 day, 10:51:07", "remaining_time": "2 days, 4:19:41", "throughput": 27742.56, "total_tokens": 3480790464} +{"current_steps": 11870, "total_steps": 29667, "loss": 0.3613, "lr": 3.381080741787547e-05, "epoch": 1.2003349872009608, "percentage": 40.01, "elapsed_time": "1 day, 10:55:02", "remaining_time": "2 days, 4:21:09", "throughput": 27713.83, "total_tokens": 3483700160} +{"current_steps": 11880, "total_steps": 29667, "loss": 0.3599, "lr": 3.38030797631182e-05, "epoch": 1.2013462693170684, 
"percentage": 40.04, "elapsed_time": "1 day, 10:58:54", "remaining_time": "2 days, 4:22:31", "throughput": 27686.5, "total_tokens": 3486685824} +{"current_steps": 11890, "total_steps": 29667, "loss": 0.3618, "lr": 3.379535740454003e-05, "epoch": 1.2023575514331764, "percentage": 40.08, "elapsed_time": "1 day, 11:03:26", "remaining_time": "2 days, 4:24:54", "throughput": 27650.33, "total_tokens": 3489661952} +{"current_steps": 11900, "total_steps": 29667, "loss": 0.3614, "lr": 3.3787640336094126e-05, "epoch": 1.2033688335492843, "percentage": 40.11, "elapsed_time": "1 day, 11:08:11", "remaining_time": "2 days, 4:27:35", "throughput": 27611.43, "total_tokens": 3492616768} +{"current_steps": 11910, "total_steps": 29667, "loss": 0.3616, "lr": 3.3779928551743325e-05, "epoch": 1.204380115665392, "percentage": 40.15, "elapsed_time": "1 day, 11:11:46", "remaining_time": "2 days, 4:28:30", "throughput": 27587.84, "total_tokens": 3495553152} +{"current_steps": 11920, "total_steps": 29667, "loss": 0.3578, "lr": 3.3772222045460084e-05, "epoch": 1.2053913977814998, "percentage": 40.18, "elapsed_time": "1 day, 11:15:59", "remaining_time": "2 days, 4:30:23", "throughput": 27555.91, "total_tokens": 3498491712} +{"current_steps": 11930, "total_steps": 29667, "loss": 0.3557, "lr": 3.37645208112265e-05, "epoch": 1.2064026798976077, "percentage": 40.21, "elapsed_time": "1 day, 11:19:30", "remaining_time": "2 days, 4:31:11", "throughput": 27533.44, "total_tokens": 3501434560} +{"current_steps": 11940, "total_steps": 29667, "loss": 0.3571, "lr": 3.3756824843034255e-05, "epoch": 1.2074139620137154, "percentage": 40.25, "elapsed_time": "1 day, 11:23:01", "remaining_time": "2 days, 4:31:59", "throughput": 27510.92, "total_tokens": 3504379072} +{"current_steps": 11950, "total_steps": 29667, "loss": 0.3565, "lr": 3.374913413488464e-05, "epoch": 1.2084252441298233, "percentage": 40.28, "elapsed_time": "1 day, 11:25:54", "remaining_time": "2 days, 4:31:51", "throughput": 27496.64, 
"total_tokens": 3507317696} +{"current_steps": 11960, "total_steps": 29667, "loss": 0.3551, "lr": 3.374144868078848e-05, "epoch": 1.2094365262459312, "percentage": 40.31, "elapsed_time": "1 day, 11:28:44", "remaining_time": "2 days, 4:31:38", "throughput": 27483.1, "total_tokens": 3510275008} +{"current_steps": 11970, "total_steps": 29667, "loss": 0.361, "lr": 3.373376847476615e-05, "epoch": 1.210447808362039, "percentage": 40.35, "elapsed_time": "1 day, 11:30:59", "remaining_time": "2 days, 4:30:34", "throughput": 27476.66, "total_tokens": 3513163136} +{"current_steps": 11980, "total_steps": 29667, "loss": 0.3573, "lr": 3.3726093510847566e-05, "epoch": 1.2114590904781468, "percentage": 40.38, "elapsed_time": "1 day, 11:33:26", "remaining_time": "2 days, 4:29:46", "throughput": 27467.84, "total_tokens": 3516069056} +{"current_steps": 11990, "total_steps": 29667, "loss": 0.361, "lr": 3.371842378307212e-05, "epoch": 1.2124703725942547, "percentage": 40.42, "elapsed_time": "1 day, 11:36:29", "remaining_time": "2 days, 4:29:51", "throughput": 27451.23, "total_tokens": 3518965824} +{"current_steps": 12000, "total_steps": 29667, "loss": 0.3608, "lr": 3.371075928548872e-05, "epoch": 1.2134816547103624, "percentage": 40.45, "elapsed_time": "1 day, 11:39:36", "remaining_time": "2 days, 4:30:02", "throughput": 27434.61, "total_tokens": 3521954816} +{"current_steps": 12010, "total_steps": 29667, "loss": 0.361, "lr": 3.37031000121557e-05, "epoch": 1.2144929368264703, "percentage": 40.48, "elapsed_time": "1 day, 11:42:27", "remaining_time": "2 days, 4:29:49", "throughput": 27420.84, "total_tokens": 3524887424} +{"current_steps": 12020, "total_steps": 29667, "loss": 0.3639, "lr": 3.369544595714088e-05, "epoch": 1.2155042189425782, "percentage": 40.52, "elapsed_time": "1 day, 11:44:57", "remaining_time": "2 days, 4:29:05", "throughput": 27412.04, "total_tokens": 3527854208} +{"current_steps": 12030, "total_steps": 29667, "loss": 0.3607, "lr": 3.368779711452148e-05, "epoch": 
1.2165155010586859, "percentage": 40.55, "elapsed_time": "1 day, 11:46:53", "remaining_time": "2 days, 4:27:31", "throughput": 27409.91, "total_tokens": 3530775040} +{"current_steps": 12040, "total_steps": 29667, "loss": 0.3561, "lr": 3.368015347838413e-05, "epoch": 1.2175267831747938, "percentage": 40.58, "elapsed_time": "1 day, 11:48:38", "remaining_time": "2 days, 4:25:40", "throughput": 27410.38, "total_tokens": 3533694976} +{"current_steps": 12050, "total_steps": 29667, "loss": 0.3617, "lr": 3.3672515042824855e-05, "epoch": 1.2185380652909017, "percentage": 40.62, "elapsed_time": "1 day, 11:50:35", "remaining_time": "2 days, 4:24:08", "throughput": 27408.4, "total_tokens": 3536655744} +{"current_steps": 12060, "total_steps": 29667, "loss": 0.355, "lr": 3.366488180194904e-05, "epoch": 1.2195493474070094, "percentage": 40.65, "elapsed_time": "1 day, 11:52:29", "remaining_time": "2 days, 4:22:31", "throughput": 27406.97, "total_tokens": 3539592320} +{"current_steps": 12070, "total_steps": 29667, "loss": 0.3604, "lr": 3.365725374987143e-05, "epoch": 1.2205606295231173, "percentage": 40.68, "elapsed_time": "1 day, 11:54:20", "remaining_time": "2 days, 4:20:49", "throughput": 27406.41, "total_tokens": 3542553216} +{"current_steps": 12080, "total_steps": 29667, "loss": 0.3586, "lr": 3.36496308807161e-05, "epoch": 1.2215719116392252, "percentage": 40.72, "elapsed_time": "1 day, 11:56:19", "remaining_time": "2 days, 4:19:20", "throughput": 27404.29, "total_tokens": 3545551360} +{"current_steps": 12090, "total_steps": 29667, "loss": 0.3603, "lr": 3.3642013188616426e-05, "epoch": 1.2225831937553329, "percentage": 40.75, "elapsed_time": "1 day, 11:58:12", "remaining_time": "2 days, 4:17:42", "throughput": 27403.08, "total_tokens": 3548490368} +{"current_steps": 12100, "total_steps": 29667, "loss": 0.3551, "lr": 3.3634400667715074e-05, "epoch": 1.2235944758714408, "percentage": 40.79, "elapsed_time": "1 day, 11:59:58", "remaining_time": "2 days, 4:15:53", "throughput": 
27403.24, "total_tokens": 3551424512} +{"current_steps": 12110, "total_steps": 29667, "loss": 0.3644, "lr": 3.3626793312164013e-05, "epoch": 1.2246057579875487, "percentage": 40.82, "elapsed_time": "1 day, 12:01:43", "remaining_time": "2 days, 4:14:02", "throughput": 27403.07, "total_tokens": 3554267392} +{"current_steps": 12120, "total_steps": 29667, "loss": 0.3608, "lr": 3.361919111612443e-05, "epoch": 1.2256170401036564, "percentage": 40.85, "elapsed_time": "1 day, 12:03:29", "remaining_time": "2 days, 4:12:15", "throughput": 27402.87, "total_tokens": 3557161280} +{"current_steps": 12130, "total_steps": 29667, "loss": 0.3572, "lr": 3.361159407376678e-05, "epoch": 1.2266283222197643, "percentage": 40.89, "elapsed_time": "1 day, 12:05:22", "remaining_time": "2 days, 4:10:36", "throughput": 27401.58, "total_tokens": 3560086528} +{"current_steps": 12140, "total_steps": 29667, "loss": 0.358, "lr": 3.3604002179270685e-05, "epoch": 1.2276396043358722, "percentage": 40.92, "elapsed_time": "1 day, 12:07:11", "remaining_time": "2 days, 4:08:51", "throughput": 27401.27, "total_tokens": 3563030912} +{"current_steps": 12150, "total_steps": 29667, "loss": 0.3589, "lr": 3.359641542682504e-05, "epoch": 1.2286508864519798, "percentage": 40.95, "elapsed_time": "1 day, 12:09:01", "remaining_time": "2 days, 4:07:08", "throughput": 27400.9, "total_tokens": 3565983808} +{"current_steps": 12160, "total_steps": 29667, "loss": 0.3578, "lr": 3.3588833810627854e-05, "epoch": 1.2296621685680877, "percentage": 40.99, "elapsed_time": "1 day, 12:11:06", "remaining_time": "2 days, 4:05:47", "throughput": 27397.06, "total_tokens": 3568927104} +{"current_steps": 12170, "total_steps": 29667, "loss": 0.3592, "lr": 3.358125732488632e-05, "epoch": 1.2306734506841956, "percentage": 41.02, "elapsed_time": "1 day, 12:12:57", "remaining_time": "2 days, 4:04:05", "throughput": 27396.27, "total_tokens": 3571860160} +{"current_steps": 12180, "total_steps": 29667, "loss": 0.3621, "lr": 
3.357368596381679e-05, "epoch": 1.2316847328003033, "percentage": 41.06, "elapsed_time": "1 day, 12:14:49", "remaining_time": "2 days, 4:02:25", "throughput": 27395.0, "total_tokens": 3574764288} +{"current_steps": 12190, "total_steps": 29667, "loss": 0.3604, "lr": 3.356611972164471e-05, "epoch": 1.2326960149164112, "percentage": 41.09, "elapsed_time": "1 day, 12:16:45", "remaining_time": "2 days, 4:00:50", "throughput": 27392.88, "total_tokens": 3577651520} +{"current_steps": 12200, "total_steps": 29667, "loss": 0.3576, "lr": 3.355855859260466e-05, "epoch": 1.2337072970325191, "percentage": 41.12, "elapsed_time": "1 day, 12:19:15", "remaining_time": "2 days, 4:00:05", "throughput": 27383.26, "total_tokens": 3580518016} +{"current_steps": 12210, "total_steps": 29667, "loss": 0.3605, "lr": 3.3551002570940285e-05, "epoch": 1.2347185791486268, "percentage": 41.16, "elapsed_time": "1 day, 12:21:22", "remaining_time": "2 days, 3:58:46", "throughput": 27379.65, "total_tokens": 3583507328} +{"current_steps": 12220, "total_steps": 29667, "loss": 0.3594, "lr": 3.354345165090431e-05, "epoch": 1.2357298612647347, "percentage": 41.19, "elapsed_time": "1 day, 12:23:18", "remaining_time": "2 days, 3:57:12", "throughput": 27377.58, "total_tokens": 3586425856} +{"current_steps": 12230, "total_steps": 29667, "loss": 0.3588, "lr": 3.3535905826758515e-05, "epoch": 1.2367411433808426, "percentage": 41.22, "elapsed_time": "1 day, 12:25:18", "remaining_time": "2 days, 3:55:42", "throughput": 27375.13, "total_tokens": 3589381312} +{"current_steps": 12240, "total_steps": 29667, "loss": 0.3568, "lr": 3.352836509277369e-05, "epoch": 1.2377524254969503, "percentage": 41.26, "elapsed_time": "1 day, 12:27:07", "remaining_time": "2 days, 3:53:58", "throughput": 27374.6, "total_tokens": 3592311360} +{"current_steps": 12250, "total_steps": 29667, "loss": 0.3602, "lr": 3.352082944322966e-05, "epoch": 1.2387637076130582, "percentage": 41.29, "elapsed_time": "1 day, 12:28:53", "remaining_time": "2 
days, 3:52:09", "throughput": 27375.17, "total_tokens": 3595268544} +{"current_steps": 12260, "total_steps": 29667, "loss": 0.3583, "lr": 3.351329887241524e-05, "epoch": 1.2397749897291659, "percentage": 41.33, "elapsed_time": "1 day, 12:30:41", "remaining_time": "2 days, 3:50:22", "throughput": 27375.08, "total_tokens": 3598209792} +{"current_steps": 12270, "total_steps": 29667, "loss": 0.3584, "lr": 3.3505773374628225e-05, "epoch": 1.2407862718452738, "percentage": 41.36, "elapsed_time": "1 day, 12:32:31", "remaining_time": "2 days, 3:48:40", "throughput": 27374.36, "total_tokens": 3601148352} +{"current_steps": 12280, "total_steps": 29667, "loss": 0.3605, "lr": 3.3498252944175354e-05, "epoch": 1.2417975539613817, "percentage": 41.39, "elapsed_time": "1 day, 12:34:21", "remaining_time": "2 days, 3:46:56", "throughput": 27373.83, "total_tokens": 3604067584} +{"current_steps": 12290, "total_steps": 29667, "loss": 0.3648, "lr": 3.3490737575372326e-05, "epoch": 1.2428088360774896, "percentage": 41.43, "elapsed_time": "1 day, 12:36:07", "remaining_time": "2 days, 3:45:08", "throughput": 27374.09, "total_tokens": 3607021440} +{"current_steps": 12300, "total_steps": 29667, "loss": 0.3577, "lr": 3.348322726254375e-05, "epoch": 1.2438201181935973, "percentage": 41.46, "elapsed_time": "1 day, 12:37:54", "remaining_time": "2 days, 3:43:20", "throughput": 27374.32, "total_tokens": 3609979328} +{"current_steps": 12310, "total_steps": 29667, "loss": 0.3587, "lr": 3.347572200002315e-05, "epoch": 1.2448314003097052, "percentage": 41.49, "elapsed_time": "1 day, 12:39:40", "remaining_time": "2 days, 3:41:31", "throughput": 27374.55, "total_tokens": 3612906624} +{"current_steps": 12320, "total_steps": 29667, "loss": 0.3492, "lr": 3.3468221782152924e-05, "epoch": 1.2458426824258129, "percentage": 41.53, "elapsed_time": "1 day, 12:41:32", "remaining_time": "2 days, 3:39:51", "throughput": 27373.67, "total_tokens": 3615860352} +{"current_steps": 12330, "total_steps": 29667, "loss": 
0.3636, "lr": 3.346072660328435e-05, "epoch": 1.2468539645419208, "percentage": 41.56, "elapsed_time": "1 day, 12:43:16", "remaining_time": "2 days, 3:37:59", "throughput": 27373.84, "total_tokens": 3618737536} +{"current_steps": 12340, "total_steps": 29667, "loss": 0.3598, "lr": 3.345323645777756e-05, "epoch": 1.2478652466580287, "percentage": 41.6, "elapsed_time": "1 day, 12:45:03", "remaining_time": "2 days, 3:36:11", "throughput": 27374.12, "total_tokens": 3621693312} +{"current_steps": 12350, "total_steps": 29667, "loss": 0.3583, "lr": 3.34457513400015e-05, "epoch": 1.2488765287741366, "percentage": 41.63, "elapsed_time": "1 day, 12:46:58", "remaining_time": "2 days, 3:34:36", "throughput": 27372.46, "total_tokens": 3624633280} +{"current_steps": 12360, "total_steps": 29667, "loss": 0.358, "lr": 3.343827124433396e-05, "epoch": 1.2498878108902443, "percentage": 41.66, "elapsed_time": "1 day, 12:48:52", "remaining_time": "2 days, 3:32:57", "throughput": 27371.08, "total_tokens": 3627558464} +{"current_steps": 12370, "total_steps": 29667, "loss": 0.3525, "lr": 3.343079616516151e-05, "epoch": 1.2508990930063522, "percentage": 41.7, "elapsed_time": "1 day, 12:50:34", "remaining_time": "2 days, 3:31:03", "throughput": 27372.1, "total_tokens": 3630489344} +{"current_steps": 12380, "total_steps": 29667, "loss": 0.3592, "lr": 3.3423326096879495e-05, "epoch": 1.2519103751224598, "percentage": 41.73, "elapsed_time": "1 day, 12:52:22", "remaining_time": "2 days, 3:29:17", "throughput": 27371.7, "total_tokens": 3633399232} +{"current_steps": 12390, "total_steps": 29667, "loss": 0.356, "lr": 3.341586103389203e-05, "epoch": 1.2529216572385677, "percentage": 41.76, "elapsed_time": "1 day, 12:54:06", "remaining_time": "2 days, 3:27:24", "throughput": 27372.38, "total_tokens": 3636314304} +{"current_steps": 12400, "total_steps": 29667, "loss": 0.3531, "lr": 3.3408400970611995e-05, "epoch": 1.2539329393546756, "percentage": 41.8, "elapsed_time": "1 day, 12:55:48", 
"remaining_time": "2 days, 3:25:30", "throughput": 27373.38, "total_tokens": 3639238976} +{"current_steps": 12410, "total_steps": 29667, "loss": 0.3556, "lr": 3.340094590146095e-05, "epoch": 1.2549442214707835, "percentage": 41.83, "elapsed_time": "1 day, 12:57:40", "remaining_time": "2 days, 3:23:50", "throughput": 27372.36, "total_tokens": 3642180864} +{"current_steps": 12420, "total_steps": 29667, "loss": 0.3592, "lr": 3.3393495820869215e-05, "epoch": 1.2559555035868912, "percentage": 41.86, "elapsed_time": "1 day, 12:59:28", "remaining_time": "2 days, 3:22:04", "throughput": 27372.05, "total_tokens": 3645101376} +{"current_steps": 12430, "total_steps": 29667, "loss": 0.3586, "lr": 3.338605072327576e-05, "epoch": 1.2569667857029991, "percentage": 41.9, "elapsed_time": "1 day, 13:01:17", "remaining_time": "2 days, 3:20:19", "throughput": 27371.82, "total_tokens": 3648051840} +{"current_steps": 12440, "total_steps": 29667, "loss": 0.359, "lr": 3.337861060312827e-05, "epoch": 1.2579780678191068, "percentage": 41.93, "elapsed_time": "1 day, 13:03:02", "remaining_time": "2 days, 3:18:29", "throughput": 27371.87, "total_tokens": 3650936960} +{"current_steps": 12450, "total_steps": 29667, "loss": 0.3628, "lr": 3.337117545488306e-05, "epoch": 1.2589893499352147, "percentage": 41.97, "elapsed_time": "1 day, 13:04:45", "remaining_time": "2 days, 3:16:36", "throughput": 27372.61, "total_tokens": 3653851520} +{"current_steps": 12460, "total_steps": 29667, "loss": 0.3585, "lr": 3.33637452730051e-05, "epoch": 1.2600006320513226, "percentage": 42.0, "elapsed_time": "1 day, 13:06:36", "remaining_time": "2 days, 3:14:54", "throughput": 27372.17, "total_tokens": 3656835392} +{"current_steps": 12470, "total_steps": 29667, "loss": 0.3565, "lr": 3.335632005196796e-05, "epoch": 1.2610119141674305, "percentage": 42.03, "elapsed_time": "1 day, 13:08:29", "remaining_time": "2 days, 3:13:14", "throughput": 27371.37, "total_tokens": 3659805248} +{"current_steps": 12480, "total_steps": 
29667, "loss": 0.3585, "lr": 3.334889978625383e-05, "epoch": 1.2620231962835382, "percentage": 42.07, "elapsed_time": "1 day, 13:10:13", "remaining_time": "2 days, 3:11:23", "throughput": 27372.12, "total_tokens": 3662761728} +{"current_steps": 12490, "total_steps": 29667, "loss": 0.3571, "lr": 3.3341484470353515e-05, "epoch": 1.263034478399646, "percentage": 42.1, "elapsed_time": "1 day, 13:12:03", "remaining_time": "2 days, 3:09:39", "throughput": 27371.83, "total_tokens": 3665733888} +{"current_steps": 12500, "total_steps": 29667, "loss": 0.3593, "lr": 3.333407409876635e-05, "epoch": 1.2640457605157538, "percentage": 42.13, "elapsed_time": "1 day, 13:13:47", "remaining_time": "2 days, 3:07:48", "throughput": 27372.42, "total_tokens": 3668658560} +{"current_steps": 12510, "total_steps": 29667, "loss": 0.3613, "lr": 3.332666866600024e-05, "epoch": 1.2650570426318617, "percentage": 42.17, "elapsed_time": "1 day, 13:15:34", "remaining_time": "2 days, 3:06:00", "throughput": 27372.51, "total_tokens": 3671595264} +{"current_steps": 12520, "total_steps": 29667, "loss": 0.3606, "lr": 3.331926816657162e-05, "epoch": 1.2660683247479696, "percentage": 42.2, "elapsed_time": "1 day, 13:17:19", "remaining_time": "2 days, 3:04:10", "throughput": 27372.86, "total_tokens": 3674532032} +{"current_steps": 12530, "total_steps": 29667, "loss": 0.359, "lr": 3.331187259500546e-05, "epoch": 1.2670796068640775, "percentage": 42.24, "elapsed_time": "1 day, 13:19:02", "remaining_time": "2 days, 3:02:17", "throughput": 27373.46, "total_tokens": 3677416128} +{"current_steps": 12540, "total_steps": 29667, "loss": 0.3587, "lr": 3.3304481945835235e-05, "epoch": 1.2680908889801852, "percentage": 42.27, "elapsed_time": "1 day, 13:20:49", "remaining_time": "2 days, 3:00:29", "throughput": 27373.81, "total_tokens": 3680386240} +{"current_steps": 12550, "total_steps": 29667, "loss": 0.3544, "lr": 3.329709621360288e-05, "epoch": 1.269102171096293, "percentage": 42.3, "elapsed_time": "1 day, 
13:22:36", "remaining_time": "2 days, 2:58:41", "throughput": 27373.66, "total_tokens": 3683299584} +{"current_steps": 12560, "total_steps": 29667, "loss": 0.3607, "lr": 3.328971539285882e-05, "epoch": 1.2701134532124008, "percentage": 42.34, "elapsed_time": "1 day, 13:24:21", "remaining_time": "2 days, 2:56:51", "throughput": 27374.18, "total_tokens": 3686242560} +{"current_steps": 12570, "total_steps": 29667, "loss": 0.362, "lr": 3.3282339478161935e-05, "epoch": 1.2711247353285087, "percentage": 42.37, "elapsed_time": "1 day, 13:26:02", "remaining_time": "2 days, 2:54:56", "throughput": 27375.02, "total_tokens": 3689127680} +{"current_steps": 12580, "total_steps": 29667, "loss": 0.3599, "lr": 3.327496846407953e-05, "epoch": 1.2721360174446166, "percentage": 42.4, "elapsed_time": "1 day, 13:27:47", "remaining_time": "2 days, 2:53:06", "throughput": 27375.27, "total_tokens": 3692038784} +{"current_steps": 12590, "total_steps": 29667, "loss": 0.3551, "lr": 3.3267602345187304e-05, "epoch": 1.2731472995607243, "percentage": 42.44, "elapsed_time": "1 day, 13:29:31", "remaining_time": "2 days, 2:51:14", "throughput": 27376.04, "total_tokens": 3694989504} +{"current_steps": 12600, "total_steps": 29667, "loss": 0.3571, "lr": 3.326024111606942e-05, "epoch": 1.2741585816768322, "percentage": 42.47, "elapsed_time": "1 day, 13:31:19", "remaining_time": "2 days, 2:49:28", "throughput": 27376.34, "total_tokens": 3697982848} +{"current_steps": 12610, "total_steps": 29667, "loss": 0.3613, "lr": 3.325288477131839e-05, "epoch": 1.27516986379294, "percentage": 42.51, "elapsed_time": "1 day, 13:33:07", "remaining_time": "2 days, 2:47:41", "throughput": 27376.22, "total_tokens": 3700912256} +{"current_steps": 12620, "total_steps": 29667, "loss": 0.3566, "lr": 3.324553330553507e-05, "epoch": 1.2761811459090477, "percentage": 42.54, "elapsed_time": "1 day, 13:34:52", "remaining_time": "2 days, 2:45:52", "throughput": 27376.52, "total_tokens": 3703845824} +{"current_steps": 12630, 
"total_steps": 29667, "loss": 0.3596, "lr": 3.323818671332871e-05, "epoch": 1.2771924280251556, "percentage": 42.57, "elapsed_time": "1 day, 13:36:38", "remaining_time": "2 days, 2:44:03", "throughput": 27377.15, "total_tokens": 3706838976} +{"current_steps": 12640, "total_steps": 29667, "loss": 0.3593, "lr": 3.323084498931687e-05, "epoch": 1.2782037101412635, "percentage": 42.61, "elapsed_time": "1 day, 13:38:24", "remaining_time": "2 days, 2:42:13", "throughput": 27377.32, "total_tokens": 3709738048} +{"current_steps": 12650, "total_steps": 29667, "loss": 0.3557, "lr": 3.322350812812545e-05, "epoch": 1.2792149922573712, "percentage": 42.64, "elapsed_time": "1 day, 13:40:10", "remaining_time": "2 days, 2:40:25", "throughput": 27377.62, "total_tokens": 3712684416} +{"current_steps": 12660, "total_steps": 29667, "loss": 0.3572, "lr": 3.321617612438862e-05, "epoch": 1.2802262743734791, "percentage": 42.67, "elapsed_time": "1 day, 13:41:56", "remaining_time": "2 days, 2:38:37", "throughput": 27377.84, "total_tokens": 3715635008} +{"current_steps": 12670, "total_steps": 29667, "loss": 0.3593, "lr": 3.320884897274886e-05, "epoch": 1.281237556489587, "percentage": 42.71, "elapsed_time": "1 day, 13:43:43", "remaining_time": "2 days, 2:36:48", "throughput": 27378.38, "total_tokens": 3718614208} +{"current_steps": 12680, "total_steps": 29667, "loss": 0.3551, "lr": 3.320152666785692e-05, "epoch": 1.2822488386056947, "percentage": 42.74, "elapsed_time": "1 day, 13:45:26", "remaining_time": "2 days, 2:34:56", "throughput": 27379.15, "total_tokens": 3721543168} +{"current_steps": 12690, "total_steps": 29667, "loss": 0.3553, "lr": 3.319420920437179e-05, "epoch": 1.2832601207218026, "percentage": 42.77, "elapsed_time": "1 day, 13:47:13", "remaining_time": "2 days, 2:33:09", "throughput": 27379.05, "total_tokens": 3724475584} +{"current_steps": 12700, "total_steps": 29667, "loss": 0.3526, "lr": 3.31868965769607e-05, "epoch": 1.2842714028379105, "percentage": 42.81, "elapsed_time": 
"1 day, 13:49:00", "remaining_time": "2 days, 2:31:22", "throughput": 27378.98, "total_tokens": 3727400960} +{"current_steps": 12710, "total_steps": 29667, "loss": 0.355, "lr": 3.317958878029911e-05, "epoch": 1.2852826849540182, "percentage": 42.84, "elapsed_time": "1 day, 13:50:45", "remaining_time": "2 days, 2:29:31", "throughput": 27379.68, "total_tokens": 3730368960} +{"current_steps": 12720, "total_steps": 29667, "loss": 0.3668, "lr": 3.3172285809070665e-05, "epoch": 1.286293967070126, "percentage": 42.88, "elapsed_time": "1 day, 13:52:43", "remaining_time": "2 days, 2:27:58", "throughput": 27377.61, "total_tokens": 3733309120} +{"current_steps": 12730, "total_steps": 29667, "loss": 0.3588, "lr": 3.3164987657967214e-05, "epoch": 1.2873052491862338, "percentage": 42.91, "elapsed_time": "1 day, 13:54:24", "remaining_time": "2 days, 2:26:03", "throughput": 27378.85, "total_tokens": 3736241216} +{"current_steps": 12740, "total_steps": 29667, "loss": 0.356, "lr": 3.315769432168877e-05, "epoch": 1.2883165313023417, "percentage": 42.94, "elapsed_time": "1 day, 13:56:04", "remaining_time": "2 days, 2:24:06", "throughput": 27379.88, "total_tokens": 3739129984} +{"current_steps": 12750, "total_steps": 29667, "loss": 0.3544, "lr": 3.315040579494349e-05, "epoch": 1.2893278134184496, "percentage": 42.98, "elapsed_time": "1 day, 13:57:50", "remaining_time": "2 days, 2:22:17", "throughput": 27380.11, "total_tokens": 3742052864} +{"current_steps": 12760, "total_steps": 29667, "loss": 0.3591, "lr": 3.31431220724477e-05, "epoch": 1.2903390955345575, "percentage": 43.01, "elapsed_time": "1 day, 13:59:39", "remaining_time": "2 days, 2:20:32", "throughput": 27379.9, "total_tokens": 3745009408} +{"current_steps": 12770, "total_steps": 29667, "loss": 0.36, "lr": 3.3135843148925834e-05, "epoch": 1.2913503776506652, "percentage": 43.04, "elapsed_time": "1 day, 14:01:25", "remaining_time": "2 days, 2:18:43", "throughput": 27380.29, "total_tokens": 3747962048} +{"current_steps": 12780, 
"total_steps": 29667, "loss": 0.3603, "lr": 3.3128569019110414e-05, "epoch": 1.292361659766773, "percentage": 43.08, "elapsed_time": "1 day, 14:03:08", "remaining_time": "2 days, 2:16:51", "throughput": 27380.89, "total_tokens": 3750872896} +{"current_steps": 12790, "total_steps": 29667, "loss": 0.3564, "lr": 3.312129967774207e-05, "epoch": 1.2933729418828808, "percentage": 43.11, "elapsed_time": "1 day, 14:04:48", "remaining_time": "2 days, 2:14:55", "throughput": 27381.72, "total_tokens": 3753732928} +{"current_steps": 12800, "total_steps": 29667, "loss": 0.3526, "lr": 3.311403511956952e-05, "epoch": 1.2943842239989887, "percentage": 43.15, "elapsed_time": "1 day, 14:06:28", "remaining_time": "2 days, 2:12:57", "throughput": 27382.86, "total_tokens": 3756603328} +{"current_steps": 12810, "total_steps": 29667, "loss": 0.3615, "lr": 3.310677533934952e-05, "epoch": 1.2953955061150966, "percentage": 43.18, "elapsed_time": "1 day, 14:08:16", "remaining_time": "2 days, 2:11:11", "throughput": 27383.08, "total_tokens": 3759588928} +{"current_steps": 12820, "total_steps": 29667, "loss": 0.3534, "lr": 3.309952033184686e-05, "epoch": 1.2964067882312045, "percentage": 43.21, "elapsed_time": "1 day, 14:09:57", "remaining_time": "2 days, 2:09:16", "throughput": 27383.89, "total_tokens": 3762484864} +{"current_steps": 12830, "total_steps": 29667, "loss": 0.3581, "lr": 3.309227009183439e-05, "epoch": 1.2974180703473122, "percentage": 43.25, "elapsed_time": "1 day, 14:11:43", "remaining_time": "2 days, 2:07:28", "throughput": 27384.5, "total_tokens": 3765471232} +{"current_steps": 12840, "total_steps": 29667, "loss": 0.3605, "lr": 3.308502461409295e-05, "epoch": 1.29842935246342, "percentage": 43.28, "elapsed_time": "1 day, 14:13:25", "remaining_time": "2 days, 2:05:34", "throughput": 27385.35, "total_tokens": 3768377088} +{"current_steps": 12850, "total_steps": 29667, "loss": 0.3577, "lr": 3.3077783893411386e-05, "epoch": 1.2994406345795277, "percentage": 43.31, "elapsed_time": 
"1 day, 14:15:11", "remaining_time": "2 days, 2:03:45", "throughput": 27385.65, "total_tokens": 3771315904} +{"current_steps": 12860, "total_steps": 29667, "loss": 0.3549, "lr": 3.30705479245865e-05, "epoch": 1.3004519166956356, "percentage": 43.35, "elapsed_time": "1 day, 14:16:53", "remaining_time": "2 days, 2:01:50", "throughput": 27386.62, "total_tokens": 3774238144} +{"current_steps": 12870, "total_steps": 29667, "loss": 0.3587, "lr": 3.3063316702423094e-05, "epoch": 1.3014631988117435, "percentage": 43.38, "elapsed_time": "1 day, 14:18:40", "remaining_time": "2 days, 2:00:04", "throughput": 27386.8, "total_tokens": 3777211840} +{"current_steps": 12880, "total_steps": 29667, "loss": 0.3587, "lr": 3.305609022173388e-05, "epoch": 1.3024744809278515, "percentage": 43.42, "elapsed_time": "1 day, 14:20:25", "remaining_time": "2 days, 1:58:13", "throughput": 27387.15, "total_tokens": 3780125632} +{"current_steps": 12890, "total_steps": 29667, "loss": 0.3565, "lr": 3.304886847733954e-05, "epoch": 1.3034857630439591, "percentage": 43.45, "elapsed_time": "1 day, 14:22:09", "remaining_time": "2 days, 1:56:22", "throughput": 27387.96, "total_tokens": 3783078464} +{"current_steps": 12900, "total_steps": 29667, "loss": 0.3572, "lr": 3.304165146406865e-05, "epoch": 1.304497045160067, "percentage": 43.48, "elapsed_time": "1 day, 14:23:55", "remaining_time": "2 days, 1:54:34", "throughput": 27388.17, "total_tokens": 3786026176} +{"current_steps": 12910, "total_steps": 29667, "loss": 0.3577, "lr": 3.30344391767577e-05, "epoch": 1.3055083272761747, "percentage": 43.52, "elapsed_time": "1 day, 14:25:42", "remaining_time": "2 days, 1:52:46", "throughput": 27388.51, "total_tokens": 3788989952} +{"current_steps": 12920, "total_steps": 29667, "loss": 0.3558, "lr": 3.302723161025104e-05, "epoch": 1.3065196093922826, "percentage": 43.55, "elapsed_time": "1 day, 14:27:27", "remaining_time": "2 days, 1:50:56", "throughput": 27389.13, "total_tokens": 3791948928} +{"current_steps": 12930, 
"total_steps": 29667, "loss": 0.3593, "lr": 3.302002875940093e-05, "epoch": 1.3075308915083905, "percentage": 43.58, "elapsed_time": "1 day, 14:29:11", "remaining_time": "2 days, 1:49:05", "throughput": 27389.74, "total_tokens": 3794883584} +{"current_steps": 12940, "total_steps": 29667, "loss": 0.3578, "lr": 3.3012830619067466e-05, "epoch": 1.3085421736244984, "percentage": 43.62, "elapsed_time": "1 day, 14:30:55", "remaining_time": "2 days, 1:47:13", "throughput": 27390.49, "total_tokens": 3797832832} +{"current_steps": 12950, "total_steps": 29667, "loss": 0.361, "lr": 3.300563718411857e-05, "epoch": 1.309553455740606, "percentage": 43.65, "elapsed_time": "1 day, 14:32:40", "remaining_time": "2 days, 1:45:23", "throughput": 27390.97, "total_tokens": 3800775296} +{"current_steps": 12960, "total_steps": 29667, "loss": 0.3578, "lr": 3.299844844943e-05, "epoch": 1.310564737856714, "percentage": 43.68, "elapsed_time": "1 day, 14:34:28", "remaining_time": "2 days, 1:43:37", "throughput": 27391.04, "total_tokens": 3803741312} +{"current_steps": 12970, "total_steps": 29667, "loss": 0.3563, "lr": 3.299126440988535e-05, "epoch": 1.3115760199728217, "percentage": 43.72, "elapsed_time": "1 day, 14:36:13", "remaining_time": "2 days, 1:41:47", "throughput": 27391.5, "total_tokens": 3806679488} +{"current_steps": 12980, "total_steps": 29667, "loss": 0.3548, "lr": 3.298408506037596e-05, "epoch": 1.3125873020889296, "percentage": 43.75, "elapsed_time": "1 day, 14:37:58", "remaining_time": "2 days, 1:39:58", "throughput": 27392.15, "total_tokens": 3809657472} +{"current_steps": 12990, "total_steps": 29667, "loss": 0.3566, "lr": 3.297691039580097e-05, "epoch": 1.3135985842050375, "percentage": 43.79, "elapsed_time": "1 day, 14:39:38", "remaining_time": "2 days, 1:38:02", "throughput": 27393.33, "total_tokens": 3812567360} +{"current_steps": 13000, "total_steps": 29667, "loss": 0.3546, "lr": 3.29697404110673e-05, "epoch": 1.3146098663211454, "percentage": 43.82, "elapsed_time": "1 
day, 14:41:23", "remaining_time": "2 days, 1:36:12", "throughput": 27393.86, "total_tokens": 3815512768} +{"current_steps": 13010, "total_steps": 29667, "loss": 0.3553, "lr": 3.2962575101089594e-05, "epoch": 1.315621148437253, "percentage": 43.85, "elapsed_time": "1 day, 14:43:08", "remaining_time": "2 days, 1:34:22", "throughput": 27393.9, "total_tokens": 3818406272} +{"current_steps": 13020, "total_steps": 29667, "loss": 0.3606, "lr": 3.295541446079024e-05, "epoch": 1.316632430553361, "percentage": 43.89, "elapsed_time": "1 day, 14:44:53", "remaining_time": "2 days, 1:32:32", "throughput": 27394.29, "total_tokens": 3821317632} +{"current_steps": 13030, "total_steps": 29667, "loss": 0.3582, "lr": 3.2948258485099336e-05, "epoch": 1.3176437126694687, "percentage": 43.92, "elapsed_time": "1 day, 14:46:38", "remaining_time": "2 days, 1:30:42", "throughput": 27394.43, "total_tokens": 3824222976} +{"current_steps": 13040, "total_steps": 29667, "loss": 0.3588, "lr": 3.29411071689547e-05, "epoch": 1.3186549947855766, "percentage": 43.95, "elapsed_time": "1 day, 14:48:22", "remaining_time": "2 days, 1:28:51", "throughput": 27394.99, "total_tokens": 3827143488} +{"current_steps": 13050, "total_steps": 29667, "loss": 0.3586, "lr": 3.2933960507301826e-05, "epoch": 1.3196662769016845, "percentage": 43.99, "elapsed_time": "1 day, 14:50:06", "remaining_time": "2 days, 1:26:59", "throughput": 27395.73, "total_tokens": 3830089216} +{"current_steps": 13060, "total_steps": 29667, "loss": 0.3624, "lr": 3.292681849509387e-05, "epoch": 1.3206775590177924, "percentage": 44.02, "elapsed_time": "1 day, 14:51:52", "remaining_time": "2 days, 1:25:11", "throughput": 27396.09, "total_tokens": 3833055616} +{"current_steps": 13070, "total_steps": 29667, "loss": 0.356, "lr": 3.291968112729166e-05, "epoch": 1.3216888411339, "percentage": 44.06, "elapsed_time": "1 day, 14:53:29", "remaining_time": "2 days, 1:23:11", "throughput": 27397.65, "total_tokens": 3835927296} +{"current_steps": 13080, 
"total_steps": 29667, "loss": 0.3566, "lr": 3.291254839886367e-05, "epoch": 1.322700123250008, "percentage": 44.09, "elapsed_time": "1 day, 14:55:10", "remaining_time": "2 days, 1:21:16", "throughput": 27398.88, "total_tokens": 3838858752} +{"current_steps": 13090, "total_steps": 29667, "loss": 0.3551, "lr": 3.2905420304785995e-05, "epoch": 1.3237114053661156, "percentage": 44.12, "elapsed_time": "1 day, 14:56:52", "remaining_time": "2 days, 1:19:23", "throughput": 27399.81, "total_tokens": 3841800384} +{"current_steps": 13100, "total_steps": 29667, "loss": 0.3539, "lr": 3.289829684004235e-05, "epoch": 1.3247226874822235, "percentage": 44.16, "elapsed_time": "1 day, 14:58:36", "remaining_time": "2 days, 1:17:32", "throughput": 27400.53, "total_tokens": 3844745536} +{"current_steps": 13110, "total_steps": 29667, "loss": 0.3555, "lr": 3.289117799962402e-05, "epoch": 1.3257339695983315, "percentage": 44.19, "elapsed_time": "1 day, 15:00:22", "remaining_time": "2 days, 1:15:43", "throughput": 27400.77, "total_tokens": 3847690496} +{"current_steps": 13120, "total_steps": 29667, "loss": 0.3544, "lr": 3.2884063778529914e-05, "epoch": 1.3267452517144391, "percentage": 44.22, "elapsed_time": "1 day, 15:02:10", "remaining_time": "2 days, 1:13:57", "throughput": 27400.97, "total_tokens": 3850658880} +{"current_steps": 13130, "total_steps": 29667, "loss": 0.3569, "lr": 3.28769541717665e-05, "epoch": 1.327756533830547, "percentage": 44.26, "elapsed_time": "1 day, 15:03:58", "remaining_time": "2 days, 1:12:11", "throughput": 27400.98, "total_tokens": 3853623104} +{"current_steps": 13140, "total_steps": 29667, "loss": 0.3606, "lr": 3.2869849174347775e-05, "epoch": 1.328767815946655, "percentage": 44.29, "elapsed_time": "1 day, 15:05:41", "remaining_time": "2 days, 1:10:19", "throughput": 27401.68, "total_tokens": 3856547200} +{"current_steps": 13150, "total_steps": 29667, "loss": 0.3541, "lr": 3.2862748781295294e-05, "epoch": 1.3297790980627626, "percentage": 44.33, 
"elapsed_time": "1 day, 15:07:26", "remaining_time": "2 days, 1:08:29", "throughput": 27402.01, "total_tokens": 3859479104} +{"current_steps": 13160, "total_steps": 29667, "loss": 0.3573, "lr": 3.2855652987638146e-05, "epoch": 1.3307903801788705, "percentage": 44.36, "elapsed_time": "1 day, 15:09:14", "remaining_time": "2 days, 1:06:43", "throughput": 27402.04, "total_tokens": 3862443840} +{"current_steps": 13170, "total_steps": 29667, "loss": 0.3625, "lr": 3.284856178841291e-05, "epoch": 1.3318016622949784, "percentage": 44.39, "elapsed_time": "1 day, 15:10:54", "remaining_time": "2 days, 1:04:47", "throughput": 27403.29, "total_tokens": 3865358912} +{"current_steps": 13180, "total_steps": 29667, "loss": 0.3561, "lr": 3.284147517866367e-05, "epoch": 1.332812944411086, "percentage": 44.43, "elapsed_time": "1 day, 15:12:40", "remaining_time": "2 days, 1:02:59", "throughput": 27403.53, "total_tokens": 3868299648} +{"current_steps": 13190, "total_steps": 29667, "loss": 0.3581, "lr": 3.2834393153441976e-05, "epoch": 1.333824226527194, "percentage": 44.46, "elapsed_time": "1 day, 15:14:20", "remaining_time": "2 days, 1:01:03", "throughput": 27404.85, "total_tokens": 3871235776} +{"current_steps": 13200, "total_steps": 29667, "loss": 0.3505, "lr": 3.282731570780689e-05, "epoch": 1.334835508643302, "percentage": 44.49, "elapsed_time": "1 day, 15:16:05", "remaining_time": "2 days, 0:59:12", "throughput": 27405.66, "total_tokens": 3874203584} +{"current_steps": 13210, "total_steps": 29667, "loss": 0.3532, "lr": 3.2820242836824875e-05, "epoch": 1.3358467907594096, "percentage": 44.53, "elapsed_time": "1 day, 15:17:50", "remaining_time": "2 days, 0:57:24", "throughput": 27406.28, "total_tokens": 3877185984} +{"current_steps": 13220, "total_steps": 29667, "loss": 0.3574, "lr": 3.2813174535569854e-05, "epoch": 1.3368580728755175, "percentage": 44.56, "elapsed_time": "1 day, 15:19:37", "remaining_time": "2 days, 0:55:37", "throughput": 27406.58, "total_tokens": 3880166592} 
+{"current_steps": 13230, "total_steps": 29667, "loss": 0.3635, "lr": 3.280611079912318e-05, "epoch": 1.3378693549916254, "percentage": 44.6, "elapsed_time": "1 day, 15:21:28", "remaining_time": "2 days, 0:53:54", "throughput": 27406.19, "total_tokens": 3883151232} +{"current_steps": 13240, "total_steps": 29667, "loss": 0.3529, "lr": 3.279905162257358e-05, "epoch": 1.338880637107733, "percentage": 44.63, "elapsed_time": "1 day, 15:23:12", "remaining_time": "2 days, 0:52:03", "throughput": 27407.02, "total_tokens": 3886110336} +{"current_steps": 13250, "total_steps": 29667, "loss": 0.3579, "lr": 3.279199700101723e-05, "epoch": 1.339891919223841, "percentage": 44.66, "elapsed_time": "1 day, 15:24:52", "remaining_time": "2 days, 0:50:07", "throughput": 27408.29, "total_tokens": 3889023936} +{"current_steps": 13260, "total_steps": 29667, "loss": 0.3533, "lr": 3.2784946929557644e-05, "epoch": 1.3409032013399487, "percentage": 44.7, "elapsed_time": "1 day, 15:26:35", "remaining_time": "2 days, 0:48:15", "throughput": 27409.05, "total_tokens": 3891960064} +{"current_steps": 13270, "total_steps": 29667, "loss": 0.3633, "lr": 3.277790140330571e-05, "epoch": 1.3419144834560566, "percentage": 44.73, "elapsed_time": "1 day, 15:28:16", "remaining_time": "2 days, 0:46:21", "throughput": 27410.02, "total_tokens": 3894880192} +{"current_steps": 13280, "total_steps": 29667, "loss": 0.3577, "lr": 3.277086041737968e-05, "epoch": 1.3429257655721645, "percentage": 44.76, "elapsed_time": "1 day, 15:29:59", "remaining_time": "2 days, 0:44:29", "throughput": 27410.51, "total_tokens": 3897774400} +{"current_steps": 13290, "total_steps": 29667, "loss": 0.3582, "lr": 3.276382396690513e-05, "epoch": 1.3439370476882724, "percentage": 44.8, "elapsed_time": "1 day, 15:31:45", "remaining_time": "2 days, 0:42:40", "throughput": 27410.21, "total_tokens": 3900633536} +{"current_steps": 13300, "total_steps": 29667, "loss": 0.3563, "lr": 3.275679204701496e-05, "epoch": 1.34494832980438, "percentage": 
44.83, "elapsed_time": "1 day, 15:33:30", "remaining_time": "2 days, 0:40:51", "throughput": 27410.73, "total_tokens": 3903586816} +{"current_steps": 13310, "total_steps": 29667, "loss": 0.3591, "lr": 3.274976465284939e-05, "epoch": 1.345959611920488, "percentage": 44.86, "elapsed_time": "1 day, 15:35:11", "remaining_time": "2 days, 0:38:56", "throughput": 27411.81, "total_tokens": 3906511168} +{"current_steps": 13320, "total_steps": 29667, "loss": 0.3576, "lr": 3.274274177955593e-05, "epoch": 1.3469708940365956, "percentage": 44.9, "elapsed_time": "1 day, 15:36:57", "remaining_time": "2 days, 0:37:07", "throughput": 27411.97, "total_tokens": 3909429248} +{"current_steps": 13330, "total_steps": 29667, "loss": 0.3577, "lr": 3.273572342228937e-05, "epoch": 1.3479821761527035, "percentage": 44.93, "elapsed_time": "1 day, 15:38:42", "remaining_time": "2 days, 0:35:17", "throughput": 27412.69, "total_tokens": 3912397120} +{"current_steps": 13340, "total_steps": 29667, "loss": 0.3529, "lr": 3.272870957621176e-05, "epoch": 1.3489934582688115, "percentage": 44.97, "elapsed_time": "1 day, 15:40:22", "remaining_time": "2 days, 0:33:22", "throughput": 27413.76, "total_tokens": 3915314176} +{"current_steps": 13350, "total_steps": 29667, "loss": 0.3575, "lr": 3.2721700236492414e-05, "epoch": 1.3500047403849194, "percentage": 45.0, "elapsed_time": "1 day, 15:42:03", "remaining_time": "2 days, 0:31:28", "throughput": 27414.99, "total_tokens": 3918252032} +{"current_steps": 13360, "total_steps": 29667, "loss": 0.3554, "lr": 3.271469539830788e-05, "epoch": 1.351016022501027, "percentage": 45.03, "elapsed_time": "1 day, 15:43:46", "remaining_time": "2 days, 0:29:35", "throughput": 27415.75, "total_tokens": 3921177664} +{"current_steps": 13370, "total_steps": 29667, "loss": 0.3554, "lr": 3.270769505684193e-05, "epoch": 1.352027304617135, "percentage": 45.07, "elapsed_time": "1 day, 15:45:26", "remaining_time": "2 days, 0:27:39", "throughput": 27417.12, "total_tokens": 3924108096} 
+{"current_steps": 13380, "total_steps": 29667, "loss": 0.3595, "lr": 3.2700699207285544e-05, "epoch": 1.3530385867332426, "percentage": 45.1, "elapsed_time": "1 day, 15:47:07", "remaining_time": "2 days, 0:25:45", "throughput": 27418.16, "total_tokens": 3927028032} +{"current_steps": 13390, "total_steps": 29667, "loss": 0.3536, "lr": 3.269370784483691e-05, "epoch": 1.3540498688493505, "percentage": 45.13, "elapsed_time": "1 day, 15:48:45", "remaining_time": "2 days, 0:23:47", "throughput": 27419.35, "total_tokens": 3929895488} +{"current_steps": 13400, "total_steps": 29667, "loss": 0.3582, "lr": 3.268672096470138e-05, "epoch": 1.3550611509654584, "percentage": 45.17, "elapsed_time": "1 day, 15:50:28", "remaining_time": "2 days, 0:21:55", "throughput": 27420.22, "total_tokens": 3932829504} +{"current_steps": 13410, "total_steps": 29667, "loss": 0.3633, "lr": 3.2679738562091506e-05, "epoch": 1.3560724330815663, "percentage": 45.2, "elapsed_time": "1 day, 15:52:06", "remaining_time": "2 days, 0:19:58", "throughput": 27421.46, "total_tokens": 3935714112} +{"current_steps": 13420, "total_steps": 29667, "loss": 0.3582, "lr": 3.2672760632226964e-05, "epoch": 1.357083715197674, "percentage": 45.24, "elapsed_time": "1 day, 15:53:49", "remaining_time": "2 days, 0:18:05", "throughput": 27422.38, "total_tokens": 3938659648} +{"current_steps": 13430, "total_steps": 29667, "loss": 0.3552, "lr": 3.266578717033458e-05, "epoch": 1.358094997313782, "percentage": 45.27, "elapsed_time": "1 day, 15:55:35", "remaining_time": "2 days, 0:16:17", "throughput": 27422.43, "total_tokens": 3941578304} +{"current_steps": 13440, "total_steps": 29667, "loss": 0.3593, "lr": 3.265881817164833e-05, "epoch": 1.3591062794298896, "percentage": 45.3, "elapsed_time": "1 day, 15:57:19", "remaining_time": "2 days, 0:14:26", "throughput": 27423.12, "total_tokens": 3944525696} +{"current_steps": 13450, "total_steps": 29667, "loss": 0.3567, "lr": 3.265185363140928e-05, "epoch": 1.3601175615459975, 
"percentage": 45.34, "elapsed_time": "1 day, 15:59:06", "remaining_time": "2 days, 0:12:39", "throughput": 27423.63, "total_tokens": 3947527488} +{"current_steps": 13460, "total_steps": 29667, "loss": 0.3592, "lr": 3.26448935448656e-05, "epoch": 1.3611288436621054, "percentage": 45.37, "elapsed_time": "1 day, 16:00:46", "remaining_time": "2 days, 0:10:44", "throughput": 27424.84, "total_tokens": 3950456768} +{"current_steps": 13470, "total_steps": 29667, "loss": 0.3582, "lr": 3.263793790727256e-05, "epoch": 1.3621401257782133, "percentage": 45.4, "elapsed_time": "1 day, 16:02:26", "remaining_time": "2 days, 0:08:49", "throughput": 27426.09, "total_tokens": 3953377664} +{"current_steps": 13480, "total_steps": 29667, "loss": 0.3577, "lr": 3.2630986713892495e-05, "epoch": 1.363151407894321, "percentage": 45.44, "elapsed_time": "1 day, 16:04:12", "remaining_time": "2 days, 0:07:00", "throughput": 27426.6, "total_tokens": 3956357888} +{"current_steps": 13490, "total_steps": 29667, "loss": 0.3542, "lr": 3.26240399599948e-05, "epoch": 1.364162690010429, "percentage": 45.47, "elapsed_time": "1 day, 16:05:55", "remaining_time": "2 days, 0:05:09", "throughput": 27427.24, "total_tokens": 3959281536} +{"current_steps": 13500, "total_steps": 29667, "loss": 0.3556, "lr": 3.2617097640855914e-05, "epoch": 1.3651739721265366, "percentage": 45.51, "elapsed_time": "1 day, 16:07:39", "remaining_time": "2 days, 0:03:17", "throughput": 27427.72, "total_tokens": 3962181376} +{"current_steps": 13510, "total_steps": 29667, "loss": 0.3546, "lr": 3.2610159751759314e-05, "epoch": 1.3661852542426445, "percentage": 45.54, "elapsed_time": "1 day, 16:09:23", "remaining_time": "2 days, 0:01:28", "throughput": 27428.42, "total_tokens": 3965156096} +{"current_steps": 13520, "total_steps": 29667, "loss": 0.3509, "lr": 3.26032262879955e-05, "epoch": 1.3671965363587524, "percentage": 45.57, "elapsed_time": "1 day, 16:11:02", "remaining_time": "1 day, 23:59:31", "throughput": 27429.93, "total_tokens": 
3968091008} +{"current_steps": 13530, "total_steps": 29667, "loss": 0.362, "lr": 3.259629724486198e-05, "epoch": 1.3682078184748603, "percentage": 45.61, "elapsed_time": "1 day, 16:12:46", "remaining_time": "1 day, 23:57:40", "throughput": 27430.38, "total_tokens": 3971008512} +{"current_steps": 13540, "total_steps": 29667, "loss": 0.3568, "lr": 3.258937261766323e-05, "epoch": 1.369219100590968, "percentage": 45.64, "elapsed_time": "1 day, 16:14:37", "remaining_time": "1 day, 23:55:57", "throughput": 27429.49, "total_tokens": 3973902656} +{"current_steps": 13550, "total_steps": 29667, "loss": 0.3602, "lr": 3.258245240171074e-05, "epoch": 1.3702303827070759, "percentage": 45.67, "elapsed_time": "1 day, 16:16:47", "remaining_time": "1 day, 23:54:39", "throughput": 27424.63, "total_tokens": 3976785344} +{"current_steps": 13560, "total_steps": 29667, "loss": 0.3591, "lr": 3.2575536592322935e-05, "epoch": 1.3712416648231835, "percentage": 45.71, "elapsed_time": "1 day, 16:18:36", "remaining_time": "1 day, 23:52:53", "throughput": 27424.77, "total_tokens": 3979773696} +{"current_steps": 13570, "total_steps": 29667, "loss": 0.3603, "lr": 3.256862518482523e-05, "epoch": 1.3722529469392915, "percentage": 45.74, "elapsed_time": "1 day, 16:20:15", "remaining_time": "1 day, 23:50:57", "throughput": 27426.05, "total_tokens": 3982685312} +{"current_steps": 13580, "total_steps": 29667, "loss": 0.3563, "lr": 3.256171817454994e-05, "epoch": 1.3732642290553994, "percentage": 45.77, "elapsed_time": "1 day, 16:22:00", "remaining_time": "1 day, 23:49:07", "throughput": 27426.58, "total_tokens": 3985642368} +{"current_steps": 13590, "total_steps": 29667, "loss": 0.361, "lr": 3.255481555683633e-05, "epoch": 1.3742755111715073, "percentage": 45.81, "elapsed_time": "1 day, 16:23:43", "remaining_time": "1 day, 23:47:15", "throughput": 27427.28, "total_tokens": 3988561728} +{"current_steps": 13600, "total_steps": 29667, "loss": 0.3562, "lr": 3.254791732703057e-05, "epoch": 1.375286793287615, 
"percentage": 45.84, "elapsed_time": "1 day, 16:25:23", "remaining_time": "1 day, 23:45:21", "throughput": 27428.43, "total_tokens": 3991489600} +{"current_steps": 13610, "total_steps": 29667, "loss": 0.3555, "lr": 3.254102348048575e-05, "epoch": 1.3762980754037228, "percentage": 45.88, "elapsed_time": "1 day, 16:27:07", "remaining_time": "1 day, 23:43:30", "throughput": 27429.19, "total_tokens": 3994442624} +{"current_steps": 13620, "total_steps": 29667, "loss": 0.3603, "lr": 3.25341340125618e-05, "epoch": 1.3773093575198305, "percentage": 45.91, "elapsed_time": "1 day, 16:28:49", "remaining_time": "1 day, 23:41:37", "throughput": 27430.28, "total_tokens": 3997396864} +{"current_steps": 13630, "total_steps": 29667, "loss": 0.3579, "lr": 3.2527248918625575e-05, "epoch": 1.3783206396359384, "percentage": 45.94, "elapsed_time": "1 day, 16:30:29", "remaining_time": "1 day, 23:39:42", "throughput": 27431.45, "total_tokens": 4000319680} +{"current_steps": 13640, "total_steps": 29667, "loss": 0.36, "lr": 3.252036819405075e-05, "epoch": 1.3793319217520463, "percentage": 45.98, "elapsed_time": "1 day, 16:32:11", "remaining_time": "1 day, 23:37:49", "throughput": 27432.3, "total_tokens": 4003231360} +{"current_steps": 13650, "total_steps": 29667, "loss": 0.3569, "lr": 3.251349183421788e-05, "epoch": 1.380343203868154, "percentage": 46.01, "elapsed_time": "1 day, 16:33:53", "remaining_time": "1 day, 23:35:56", "throughput": 27433.02, "total_tokens": 4006130368} +{"current_steps": 13660, "total_steps": 29667, "loss": 0.3572, "lr": 3.250661983451434e-05, "epoch": 1.381354485984262, "percentage": 46.04, "elapsed_time": "1 day, 16:35:33", "remaining_time": "1 day, 23:34:01", "throughput": 27434.15, "total_tokens": 4009039488} +{"current_steps": 13670, "total_steps": 29667, "loss": 0.3548, "lr": 3.2499752190334326e-05, "epoch": 1.3823657681003698, "percentage": 46.08, "elapsed_time": "1 day, 16:37:11", "remaining_time": "1 day, 23:32:03", "throughput": 27435.58, "total_tokens": 
4011942272} +{"current_steps": 13680, "total_steps": 29667, "loss": 0.3594, "lr": 3.2492888897078834e-05, "epoch": 1.3833770502164775, "percentage": 46.11, "elapsed_time": "1 day, 16:38:55", "remaining_time": "1 day, 23:30:13", "throughput": 27436.13, "total_tokens": 4014874880} +{"current_steps": 13690, "total_steps": 29667, "loss": 0.3585, "lr": 3.248602995015567e-05, "epoch": 1.3843883323325854, "percentage": 46.15, "elapsed_time": "1 day, 16:40:37", "remaining_time": "1 day, 23:28:20", "throughput": 27437.09, "total_tokens": 4017822144} +{"current_steps": 13700, "total_steps": 29667, "loss": 0.3585, "lr": 3.247917534497943e-05, "epoch": 1.3853996144486933, "percentage": 46.18, "elapsed_time": "1 day, 16:42:18", "remaining_time": "1 day, 23:26:27", "throughput": 27438.02, "total_tokens": 4020735808} +{"current_steps": 13710, "total_steps": 29667, "loss": 0.353, "lr": 3.247232507697145e-05, "epoch": 1.386410896564801, "percentage": 46.21, "elapsed_time": "1 day, 16:44:00", "remaining_time": "1 day, 23:24:34", "throughput": 27439.06, "total_tokens": 4023674816} +{"current_steps": 13720, "total_steps": 29667, "loss": 0.3566, "lr": 3.246547914155985e-05, "epoch": 1.387422178680909, "percentage": 46.25, "elapsed_time": "1 day, 16:45:42", "remaining_time": "1 day, 23:22:41", "throughput": 27439.96, "total_tokens": 4026622464} +{"current_steps": 13730, "total_steps": 29667, "loss": 0.3535, "lr": 3.245863753417949e-05, "epoch": 1.3884334607970168, "percentage": 46.28, "elapsed_time": "1 day, 16:47:25", "remaining_time": "1 day, 23:20:50", "throughput": 27441.01, "total_tokens": 4029593728} +{"current_steps": 13740, "total_steps": 29667, "loss": 0.3542, "lr": 3.2451800250271944e-05, "epoch": 1.3894447429131245, "percentage": 46.31, "elapsed_time": "1 day, 16:49:06", "remaining_time": "1 day, 23:18:56", "throughput": 27442.26, "total_tokens": 4032554496} +{"current_steps": 13750, "total_steps": 29667, "loss": 0.355, "lr": 3.244496728528553e-05, "epoch": 
1.3904560250292324, "percentage": 46.35, "elapsed_time": "1 day, 16:50:47", "remaining_time": "1 day, 23:17:01", "throughput": 27443.38, "total_tokens": 4035467072} +{"current_steps": 13760, "total_steps": 29667, "loss": 0.3518, "lr": 3.243813863467525e-05, "epoch": 1.3914673071453403, "percentage": 46.38, "elapsed_time": "1 day, 16:52:31", "remaining_time": "1 day, 23:15:11", "throughput": 27444.05, "total_tokens": 4038432192} +{"current_steps": 13770, "total_steps": 29667, "loss": 0.3552, "lr": 3.243131429390281e-05, "epoch": 1.392478589261448, "percentage": 46.42, "elapsed_time": "1 day, 16:54:15", "remaining_time": "1 day, 23:13:21", "throughput": 27445.08, "total_tokens": 4041429440} +{"current_steps": 13780, "total_steps": 29667, "loss": 0.3542, "lr": 3.2424494258436594e-05, "epoch": 1.3934898713775559, "percentage": 46.45, "elapsed_time": "1 day, 16:55:59", "remaining_time": "1 day, 23:11:31", "throughput": 27445.21, "total_tokens": 4044322432} +{"current_steps": 13790, "total_steps": 29667, "loss": 0.3618, "lr": 3.241767852375166e-05, "epoch": 1.3945011534936635, "percentage": 46.48, "elapsed_time": "1 day, 16:57:38", "remaining_time": "1 day, 23:09:35", "throughput": 27446.73, "total_tokens": 4047252288} +{"current_steps": 13800, "total_steps": 29667, "loss": 0.3502, "lr": 3.241086708532971e-05, "epoch": 1.3955124356097715, "percentage": 46.52, "elapsed_time": "1 day, 16:59:23", "remaining_time": "1 day, 23:07:46", "throughput": 27447.59, "total_tokens": 4050268096} +{"current_steps": 13810, "total_steps": 29667, "loss": 0.3575, "lr": 3.24040599386591e-05, "epoch": 1.3965237177258794, "percentage": 46.55, "elapsed_time": "1 day, 17:01:08", "remaining_time": "1 day, 23:05:56", "throughput": 27448.11, "total_tokens": 4053214720} +{"current_steps": 13820, "total_steps": 29667, "loss": 0.3623, "lr": 3.23972570792348e-05, "epoch": 1.3975349998419873, "percentage": 46.58, "elapsed_time": "1 day, 17:02:51", "remaining_time": "1 day, 23:04:05", "throughput": 
27448.72, "total_tokens": 4056147904} +{"current_steps": 13830, "total_steps": 29667, "loss": 0.358, "lr": 3.239045850255842e-05, "epoch": 1.398546281958095, "percentage": 46.62, "elapsed_time": "1 day, 17:04:29", "remaining_time": "1 day, 23:02:08", "throughput": 27449.92, "total_tokens": 4059015424} +{"current_steps": 13840, "total_steps": 29667, "loss": 0.3546, "lr": 3.238366420413817e-05, "epoch": 1.3995575640742028, "percentage": 46.65, "elapsed_time": "1 day, 17:06:12", "remaining_time": "1 day, 23:00:16", "throughput": 27450.98, "total_tokens": 4061980800} +{"current_steps": 13850, "total_steps": 29667, "loss": 0.3603, "lr": 3.237687417948882e-05, "epoch": 1.4005688461903105, "percentage": 46.68, "elapsed_time": "1 day, 17:07:56", "remaining_time": "1 day, 22:58:27", "throughput": 27451.38, "total_tokens": 4064916416} +{"current_steps": 13860, "total_steps": 29667, "loss": 0.3586, "lr": 3.2370088424131776e-05, "epoch": 1.4015801283064184, "percentage": 46.72, "elapsed_time": "1 day, 17:09:39", "remaining_time": "1 day, 22:56:34", "throughput": 27452.33, "total_tokens": 4067862720} +{"current_steps": 13870, "total_steps": 29667, "loss": 0.3576, "lr": 3.236330693359497e-05, "epoch": 1.4025914104225263, "percentage": 46.75, "elapsed_time": "1 day, 17:11:18", "remaining_time": "1 day, 22:54:38", "throughput": 27453.81, "total_tokens": 4070800128} +{"current_steps": 13880, "total_steps": 29667, "loss": 0.3503, "lr": 3.2356529703412894e-05, "epoch": 1.4036026925386342, "percentage": 46.79, "elapsed_time": "1 day, 17:12:57", "remaining_time": "1 day, 22:52:42", "throughput": 27455.14, "total_tokens": 4073710784} +{"current_steps": 13890, "total_steps": 29667, "loss": 0.3561, "lr": 3.234975672912661e-05, "epoch": 1.404613974654742, "percentage": 46.82, "elapsed_time": "1 day, 17:14:37", "remaining_time": "1 day, 22:50:48", "throughput": 27456.33, "total_tokens": 4076656128} +{"current_steps": 13900, "total_steps": 29667, "loss": 0.3554, "lr": 3.234298800628368e-05, 
"epoch": 1.4056252567708498, "percentage": 46.85, "elapsed_time": "1 day, 17:16:15", "remaining_time": "1 day, 22:48:51", "throughput": 27458.0, "total_tokens": 4079585088} +{"current_steps": 13910, "total_steps": 29667, "loss": 0.3553, "lr": 3.2336223530438195e-05, "epoch": 1.4066365388869575, "percentage": 46.89, "elapsed_time": "1 day, 17:17:55", "remaining_time": "1 day, 22:46:57", "throughput": 27459.19, "total_tokens": 4082509696} +{"current_steps": 13920, "total_steps": 29667, "loss": 0.3556, "lr": 3.232946329715076e-05, "epoch": 1.4076478210030654, "percentage": 46.92, "elapsed_time": "1 day, 17:19:37", "remaining_time": "1 day, 22:45:04", "throughput": 27460.16, "total_tokens": 4085442944} +{"current_steps": 13930, "total_steps": 29667, "loss": 0.3565, "lr": 3.2322707301988456e-05, "epoch": 1.4086591031191733, "percentage": 46.95, "elapsed_time": "1 day, 17:21:19", "remaining_time": "1 day, 22:43:12", "throughput": 27460.8, "total_tokens": 4088354304} +{"current_steps": 13940, "total_steps": 29667, "loss": 0.3547, "lr": 3.231595554052488e-05, "epoch": 1.4096703852352812, "percentage": 46.99, "elapsed_time": "1 day, 17:22:55", "remaining_time": "1 day, 22:41:13", "throughput": 27462.54, "total_tokens": 4091245888} +{"current_steps": 13950, "total_steps": 29667, "loss": 0.3598, "lr": 3.230920800834005e-05, "epoch": 1.410681667351389, "percentage": 47.02, "elapsed_time": "1 day, 17:24:38", "remaining_time": "1 day, 22:39:22", "throughput": 27463.5, "total_tokens": 4094225792} +{"current_steps": 13960, "total_steps": 29667, "loss": 0.3527, "lr": 3.2302464701020486e-05, "epoch": 1.4116929494674968, "percentage": 47.06, "elapsed_time": "1 day, 17:26:19", "remaining_time": "1 day, 22:37:28", "throughput": 27464.7, "total_tokens": 4097167104} +{"current_steps": 13970, "total_steps": 29667, "loss": 0.3589, "lr": 3.2295725614159126e-05, "epoch": 1.4127042315836045, "percentage": 47.09, "elapsed_time": "1 day, 17:28:01", "remaining_time": "1 day, 22:35:36", 
"throughput": 27465.61, "total_tokens": 4100118080} +{"current_steps": 13980, "total_steps": 29667, "loss": 0.3585, "lr": 3.228899074335536e-05, "epoch": 1.4137155136997124, "percentage": 47.12, "elapsed_time": "1 day, 17:29:45", "remaining_time": "1 day, 22:33:45", "throughput": 27466.33, "total_tokens": 4103063872} +{"current_steps": 13990, "total_steps": 29667, "loss": 0.3549, "lr": 3.228226008421498e-05, "epoch": 1.4147267958158203, "percentage": 47.16, "elapsed_time": "1 day, 17:31:32", "remaining_time": "1 day, 22:31:59", "throughput": 27466.46, "total_tokens": 4106041088} +{"current_steps": 14000, "total_steps": 29667, "loss": 0.3593, "lr": 3.2275533632350193e-05, "epoch": 1.4157380779319282, "percentage": 47.19, "elapsed_time": "1 day, 17:33:13", "remaining_time": "1 day, 22:30:05", "throughput": 27467.67, "total_tokens": 4108978688} +{"current_steps": 14010, "total_steps": 29667, "loss": 0.3566, "lr": 3.226881138337963e-05, "epoch": 1.4167493600480359, "percentage": 47.22, "elapsed_time": "1 day, 17:34:54", "remaining_time": "1 day, 22:28:12", "throughput": 27468.88, "total_tokens": 4111929728} +{"current_steps": 14020, "total_steps": 29667, "loss": 0.3551, "lr": 3.2262093332928256e-05, "epoch": 1.4177606421641438, "percentage": 47.26, "elapsed_time": "1 day, 17:36:39", "remaining_time": "1 day, 22:26:22", "throughput": 27469.36, "total_tokens": 4114883712} +{"current_steps": 14030, "total_steps": 29667, "loss": 0.3578, "lr": 3.225537947662746e-05, "epoch": 1.4187719242802515, "percentage": 47.29, "elapsed_time": "1 day, 17:38:22", "remaining_time": "1 day, 22:24:32", "throughput": 27469.93, "total_tokens": 4117807104} +{"current_steps": 14040, "total_steps": 29667, "loss": 0.3551, "lr": 3.224866981011494e-05, "epoch": 1.4197832063963594, "percentage": 47.33, "elapsed_time": "1 day, 17:40:04", "remaining_time": "1 day, 22:22:40", "throughput": 27470.98, "total_tokens": 4120783488} +{"current_steps": 14050, "total_steps": 29667, "loss": 0.3632, "lr": 
3.22419643290348e-05, "epoch": 1.4207944885124673, "percentage": 47.36, "elapsed_time": "1 day, 17:41:47", "remaining_time": "1 day, 22:20:49", "throughput": 27471.85, "total_tokens": 4123733760} +{"current_steps": 14060, "total_steps": 29667, "loss": 0.3601, "lr": 3.2235263029037446e-05, "epoch": 1.4218057706285752, "percentage": 47.39, "elapsed_time": "1 day, 17:43:35", "remaining_time": "1 day, 22:19:03", "throughput": 27471.97, "total_tokens": 4126705152} +{"current_steps": 14070, "total_steps": 29667, "loss": 0.356, "lr": 3.222856590577962e-05, "epoch": 1.4228170527446828, "percentage": 47.43, "elapsed_time": "1 day, 17:45:17", "remaining_time": "1 day, 22:17:11", "throughput": 27472.78, "total_tokens": 4129634112} +{"current_steps": 14080, "total_steps": 29667, "loss": 0.3577, "lr": 3.222187295492436e-05, "epoch": 1.4238283348607907, "percentage": 47.46, "elapsed_time": "1 day, 17:47:00", "remaining_time": "1 day, 22:15:19", "throughput": 27473.62, "total_tokens": 4132589696} +{"current_steps": 14090, "total_steps": 29667, "loss": 0.3564, "lr": 3.221518417214104e-05, "epoch": 1.4248396169768984, "percentage": 47.49, "elapsed_time": "1 day, 17:48:39", "remaining_time": "1 day, 22:13:24", "throughput": 27474.77, "total_tokens": 4135495680} +{"current_steps": 14100, "total_steps": 29667, "loss": 0.3572, "lr": 3.22084995531053e-05, "epoch": 1.4258508990930063, "percentage": 47.53, "elapsed_time": "1 day, 17:50:19", "remaining_time": "1 day, 22:11:30", "throughput": 27476.07, "total_tokens": 4138443584} +{"current_steps": 14110, "total_steps": 29667, "loss": 0.3586, "lr": 3.220181909349907e-05, "epoch": 1.4268621812091142, "percentage": 47.56, "elapsed_time": "1 day, 17:52:05", "remaining_time": "1 day, 22:09:42", "throughput": 27476.75, "total_tokens": 4141446016} +{"current_steps": 14120, "total_steps": 29667, "loss": 0.3581, "lr": 3.219514278901053e-05, "epoch": 1.4278734633252221, "percentage": 47.59, "elapsed_time": "1 day, 17:53:47", "remaining_time": "1 
day, 22:07:49", "throughput": 27477.98, "total_tokens": 4144422080} +{"current_steps": 14130, "total_steps": 29667, "loss": 0.3549, "lr": 3.218847063533413e-05, "epoch": 1.4288847454413298, "percentage": 47.63, "elapsed_time": "1 day, 17:55:25", "remaining_time": "1 day, 22:05:54", "throughput": 27479.37, "total_tokens": 4147347136} +{"current_steps": 14140, "total_steps": 29667, "loss": 0.3486, "lr": 3.218180262817055e-05, "epoch": 1.4298960275574377, "percentage": 47.66, "elapsed_time": "1 day, 17:57:07", "remaining_time": "1 day, 22:04:02", "throughput": 27480.43, "total_tokens": 4150310144} +{"current_steps": 14150, "total_steps": 29667, "loss": 0.3619, "lr": 3.217513876322674e-05, "epoch": 1.4309073096735454, "percentage": 47.7, "elapsed_time": "1 day, 17:58:47", "remaining_time": "1 day, 22:02:07", "throughput": 27481.53, "total_tokens": 4153225728} +{"current_steps": 14160, "total_steps": 29667, "loss": 0.3578, "lr": 3.216847903621581e-05, "epoch": 1.4319185917896533, "percentage": 47.73, "elapsed_time": "1 day, 18:00:31", "remaining_time": "1 day, 22:00:18", "throughput": 27482.37, "total_tokens": 4156209728} +{"current_steps": 14170, "total_steps": 29667, "loss": 0.353, "lr": 3.216182344285713e-05, "epoch": 1.4329298739057612, "percentage": 47.76, "elapsed_time": "1 day, 18:02:13", "remaining_time": "1 day, 21:58:25", "throughput": 27483.38, "total_tokens": 4159153472} +{"current_steps": 14180, "total_steps": 29667, "loss": 0.3593, "lr": 3.215517197887625e-05, "epoch": 1.4339411560218691, "percentage": 47.8, "elapsed_time": "1 day, 18:03:55", "remaining_time": "1 day, 21:56:33", "throughput": 27484.32, "total_tokens": 4162102720} +{"current_steps": 14190, "total_steps": 29667, "loss": 0.3601, "lr": 3.214852464000488e-05, "epoch": 1.4349524381379768, "percentage": 47.83, "elapsed_time": "1 day, 18:05:34", "remaining_time": "1 day, 21:54:37", "throughput": 27485.59, "total_tokens": 4165006720} +{"current_steps": 14200, "total_steps": 29667, "loss": 0.3591, 
"lr": 3.2141881421980945e-05, "epoch": 1.4359637202540847, "percentage": 47.86, "elapsed_time": "1 day, 18:07:17", "remaining_time": "1 day, 21:52:47", "throughput": 27486.27, "total_tokens": 4167947904} +{"current_steps": 14210, "total_steps": 29667, "loss": 0.3566, "lr": 3.213524232054851e-05, "epoch": 1.4369750023701924, "percentage": 47.9, "elapsed_time": "1 day, 18:09:00", "remaining_time": "1 day, 21:50:56", "throughput": 27487.04, "total_tokens": 4170908928} +{"current_steps": 14220, "total_steps": 29667, "loss": 0.3527, "lr": 3.21286073314578e-05, "epoch": 1.4379862844863003, "percentage": 47.93, "elapsed_time": "1 day, 18:10:42", "remaining_time": "1 day, 21:49:04", "throughput": 27488.07, "total_tokens": 4173860032} +{"current_steps": 14230, "total_steps": 29667, "loss": 0.3549, "lr": 3.2121976450465155e-05, "epoch": 1.4389975666024082, "percentage": 47.97, "elapsed_time": "1 day, 18:12:20", "remaining_time": "1 day, 21:47:08", "throughput": 27489.33, "total_tokens": 4176746176} +{"current_steps": 14240, "total_steps": 29667, "loss": 0.3537, "lr": 3.211534967333308e-05, "epoch": 1.4400088487185159, "percentage": 48.0, "elapsed_time": "1 day, 18:14:00", "remaining_time": "1 day, 21:45:14", "throughput": 27490.49, "total_tokens": 4179668608} +{"current_steps": 14250, "total_steps": 29667, "loss": 0.3566, "lr": 3.210872699583019e-05, "epoch": 1.4410201308346238, "percentage": 48.03, "elapsed_time": "1 day, 18:15:42", "remaining_time": "1 day, 21:43:22", "throughput": 27491.46, "total_tokens": 4182620544} +{"current_steps": 14260, "total_steps": 29667, "loss": 0.3549, "lr": 3.210210841373118e-05, "epoch": 1.4420314129507317, "percentage": 48.07, "elapsed_time": "1 day, 18:17:23", "remaining_time": "1 day, 21:41:29", "throughput": 27492.48, "total_tokens": 4185553344} +{"current_steps": 14270, "total_steps": 29667, "loss": 0.3537, "lr": 3.2095493922816855e-05, "epoch": 1.4430426950668394, "percentage": 48.1, "elapsed_time": "1 day, 18:19:04", "remaining_time": 
"1 day, 21:39:35", "throughput": 27493.73, "total_tokens": 4188513088} +{"current_steps": 14280, "total_steps": 29667, "loss": 0.3548, "lr": 3.2088883518874105e-05, "epoch": 1.4440539771829473, "percentage": 48.13, "elapsed_time": "1 day, 18:20:42", "remaining_time": "1 day, 21:37:39", "throughput": 27495.19, "total_tokens": 4191430272} +{"current_steps": 14290, "total_steps": 29667, "loss": 0.3525, "lr": 3.208227719769589e-05, "epoch": 1.4450652592990552, "percentage": 48.17, "elapsed_time": "1 day, 18:22:26", "remaining_time": "1 day, 21:35:49", "throughput": 27495.87, "total_tokens": 4194387456} +{"current_steps": 14300, "total_steps": 29667, "loss": 0.3553, "lr": 3.207567495508124e-05, "epoch": 1.4460765414151628, "percentage": 48.2, "elapsed_time": "1 day, 18:24:10", "remaining_time": "1 day, 21:34:00", "throughput": 27496.48, "total_tokens": 4197358080} +{"current_steps": 14310, "total_steps": 29667, "loss": 0.3539, "lr": 3.2069076786835205e-05, "epoch": 1.4470878235312707, "percentage": 48.24, "elapsed_time": "1 day, 18:25:47", "remaining_time": "1 day, 21:32:03", "throughput": 27498.06, "total_tokens": 4200264896} +{"current_steps": 14320, "total_steps": 29667, "loss": 0.3542, "lr": 3.2062482688768904e-05, "epoch": 1.4480991056473786, "percentage": 48.27, "elapsed_time": "1 day, 18:27:27", "remaining_time": "1 day, 21:30:09", "throughput": 27499.1, "total_tokens": 4203162368} +{"current_steps": 14330, "total_steps": 29667, "loss": 0.3564, "lr": 3.205589265669947e-05, "epoch": 1.4491103877634863, "percentage": 48.3, "elapsed_time": "1 day, 18:29:11", "remaining_time": "1 day, 21:28:19", "throughput": 27499.35, "total_tokens": 4206066560} +{"current_steps": 14340, "total_steps": 29667, "loss": 0.3549, "lr": 3.204930668645005e-05, "epoch": 1.4501216698795942, "percentage": 48.34, "elapsed_time": "1 day, 18:30:52", "remaining_time": "1 day, 21:26:26", "throughput": 27500.0, "total_tokens": 4208947456} +{"current_steps": 14350, "total_steps": 29667, "loss": 
0.3568, "lr": 3.20427247738498e-05, "epoch": 1.4511329519957021, "percentage": 48.37, "elapsed_time": "1 day, 18:32:32", "remaining_time": "1 day, 21:24:33", "throughput": 27501.28, "total_tokens": 4211898112} +{"current_steps": 14360, "total_steps": 29667, "loss": 0.3566, "lr": 3.2036146914733854e-05, "epoch": 1.4521442341118098, "percentage": 48.4, "elapsed_time": "1 day, 18:34:13", "remaining_time": "1 day, 21:22:39", "throughput": 27502.32, "total_tokens": 4214814848} +{"current_steps": 14370, "total_steps": 29667, "loss": 0.3572, "lr": 3.202957310494336e-05, "epoch": 1.4531555162279177, "percentage": 48.44, "elapsed_time": "1 day, 18:35:55", "remaining_time": "1 day, 21:20:48", "throughput": 27503.18, "total_tokens": 4217773824} +{"current_steps": 14380, "total_steps": 29667, "loss": 0.3555, "lr": 3.202300334032542e-05, "epoch": 1.4541667983440254, "percentage": 48.47, "elapsed_time": "1 day, 18:37:35", "remaining_time": "1 day, 21:18:54", "throughput": 27504.51, "total_tokens": 4220726464} +{"current_steps": 14390, "total_steps": 29667, "loss": 0.357, "lr": 3.201643761673308e-05, "epoch": 1.4551780804601333, "percentage": 48.51, "elapsed_time": "1 day, 18:39:13", "remaining_time": "1 day, 21:16:58", "throughput": 27505.7, "total_tokens": 4223590272} +{"current_steps": 14400, "total_steps": 29667, "loss": 0.3613, "lr": 3.200987593002536e-05, "epoch": 1.4561893625762412, "percentage": 48.54, "elapsed_time": "1 day, 18:40:48", "remaining_time": "1 day, 21:14:59", "throughput": 27507.3, "total_tokens": 4226453632} +{"current_steps": 14410, "total_steps": 29667, "loss": 0.3571, "lr": 3.200331827606721e-05, "epoch": 1.4572006446923491, "percentage": 48.57, "elapsed_time": "1 day, 18:42:28", "remaining_time": "1 day, 21:13:05", "throughput": 27508.33, "total_tokens": 4229371904} +{"current_steps": 14420, "total_steps": 29667, "loss": 0.3542, "lr": 3.199676465072951e-05, "epoch": 1.4582119268084568, "percentage": 48.61, "elapsed_time": "1 day, 18:44:11", 
"remaining_time": "1 day, 21:11:15", "throughput": 27508.96, "total_tokens": 4232296832} +{"current_steps": 14430, "total_steps": 29667, "loss": 0.3552, "lr": 3.1990215049889046e-05, "epoch": 1.4592232089245647, "percentage": 48.64, "elapsed_time": "1 day, 18:45:53", "remaining_time": "1 day, 21:09:23", "throughput": 27510.0, "total_tokens": 4235273600} +{"current_steps": 14440, "total_steps": 29667, "loss": 0.3582, "lr": 3.198366946942851e-05, "epoch": 1.4602344910406724, "percentage": 48.67, "elapsed_time": "1 day, 18:47:33", "remaining_time": "1 day, 21:07:29", "throughput": 27511.18, "total_tokens": 4238200128} +{"current_steps": 14450, "total_steps": 29667, "loss": 0.3532, "lr": 3.1977127905236514e-05, "epoch": 1.4612457731567803, "percentage": 48.71, "elapsed_time": "1 day, 18:49:18", "remaining_time": "1 day, 21:05:40", "throughput": 27511.43, "total_tokens": 4241110272} +{"current_steps": 14460, "total_steps": 29667, "loss": 0.3533, "lr": 3.197059035320752e-05, "epoch": 1.4622570552728882, "percentage": 48.74, "elapsed_time": "1 day, 18:50:59", "remaining_time": "1 day, 21:03:48", "throughput": 27512.37, "total_tokens": 4244042816} +{"current_steps": 14470, "total_steps": 29667, "loss": 0.3564, "lr": 3.196405680924189e-05, "epoch": 1.463268337388996, "percentage": 48.77, "elapsed_time": "1 day, 18:52:40", "remaining_time": "1 day, 21:01:55", "throughput": 27513.28, "total_tokens": 4246952256} +{"current_steps": 14480, "total_steps": 29667, "loss": 0.3526, "lr": 3.195752726924582e-05, "epoch": 1.4642796195051038, "percentage": 48.81, "elapsed_time": "1 day, 18:54:22", "remaining_time": "1 day, 21:00:04", "throughput": 27513.94, "total_tokens": 4249872064} +{"current_steps": 14490, "total_steps": 29667, "loss": 0.3526, "lr": 3.195100172913139e-05, "epoch": 1.4652909016212117, "percentage": 48.84, "elapsed_time": "1 day, 18:56:08", "remaining_time": "1 day, 20:58:17", "throughput": 27514.09, "total_tokens": 4252817024} +{"current_steps": 14500, "total_steps": 
29667, "loss": 0.3527, "lr": 3.19444801848165e-05, "epoch": 1.4663021837373194, "percentage": 48.88, "elapsed_time": "1 day, 18:57:56", "remaining_time": "1 day, 20:56:31", "throughput": 27514.06, "total_tokens": 4255773632} +{"current_steps": 14510, "total_steps": 29667, "loss": 0.3564, "lr": 3.1937962632224885e-05, "epoch": 1.4673134658534273, "percentage": 48.91, "elapsed_time": "1 day, 18:59:40", "remaining_time": "1 day, 20:54:42", "throughput": 27514.57, "total_tokens": 4258732736} +{"current_steps": 14520, "total_steps": 29667, "loss": 0.3539, "lr": 3.193144906728609e-05, "epoch": 1.4683247479695352, "percentage": 48.94, "elapsed_time": "1 day, 19:01:21", "remaining_time": "1 day, 20:52:49", "throughput": 27515.61, "total_tokens": 4261670016} +{"current_steps": 14530, "total_steps": 29667, "loss": 0.358, "lr": 3.1924939485935494e-05, "epoch": 1.469336030085643, "percentage": 48.98, "elapsed_time": "1 day, 19:03:04", "remaining_time": "1 day, 20:50:59", "throughput": 27516.29, "total_tokens": 4264610880} +{"current_steps": 14540, "total_steps": 29667, "loss": 0.3563, "lr": 3.1918433884114253e-05, "epoch": 1.4703473122017507, "percentage": 49.01, "elapsed_time": "1 day, 19:04:42", "remaining_time": "1 day, 20:49:03", "throughput": 27517.63, "total_tokens": 4267502272} +{"current_steps": 14550, "total_steps": 29667, "loss": 0.3562, "lr": 3.191193225776931e-05, "epoch": 1.4713585943178586, "percentage": 49.04, "elapsed_time": "1 day, 19:06:27", "remaining_time": "1 day, 20:47:15", "throughput": 27518.16, "total_tokens": 4270480576} +{"current_steps": 14560, "total_steps": 29667, "loss": 0.3538, "lr": 3.190543460285339e-05, "epoch": 1.4723698764339663, "percentage": 49.08, "elapsed_time": "1 day, 19:08:07", "remaining_time": "1 day, 20:45:21", "throughput": 27519.19, "total_tokens": 4273393600} +{"current_steps": 14570, "total_steps": 29667, "loss": 0.3591, "lr": 3.189894091532499e-05, "epoch": 1.4733811585500742, "percentage": 49.11, "elapsed_time": "1 day, 
19:09:47", "remaining_time": "1 day, 20:43:28", "throughput": 27520.35, "total_tokens": 4276323392} +{"current_steps": 14580, "total_steps": 29667, "loss": 0.3543, "lr": 3.1892451191148346e-05, "epoch": 1.4743924406661821, "percentage": 49.15, "elapsed_time": "1 day, 19:11:27", "remaining_time": "1 day, 20:41:34", "throughput": 27521.21, "total_tokens": 4279211456} +{"current_steps": 14590, "total_steps": 29667, "loss": 0.3523, "lr": 3.1885965426293465e-05, "epoch": 1.47540372278229, "percentage": 49.18, "elapsed_time": "1 day, 19:13:07", "remaining_time": "1 day, 20:39:40", "throughput": 27522.29, "total_tokens": 4282124032} +{"current_steps": 14600, "total_steps": 29667, "loss": 0.3565, "lr": 3.187948361673606e-05, "epoch": 1.4764150048983977, "percentage": 49.21, "elapsed_time": "1 day, 19:14:46", "remaining_time": "1 day, 20:37:46", "throughput": 27523.54, "total_tokens": 4285043968} +{"current_steps": 14610, "total_steps": 29667, "loss": 0.3516, "lr": 3.187300575845759e-05, "epoch": 1.4774262870145056, "percentage": 49.25, "elapsed_time": "1 day, 19:16:27", "remaining_time": "1 day, 20:35:53", "throughput": 27524.77, "total_tokens": 4288003968} +{"current_steps": 14620, "total_steps": 29667, "loss": 0.3528, "lr": 3.186653184744521e-05, "epoch": 1.4784375691306133, "percentage": 49.28, "elapsed_time": "1 day, 19:18:10", "remaining_time": "1 day, 20:34:03", "throughput": 27525.4, "total_tokens": 4290934464} +{"current_steps": 14630, "total_steps": 29667, "loss": 0.3557, "lr": 3.18600618796918e-05, "epoch": 1.4794488512467212, "percentage": 49.31, "elapsed_time": "1 day, 19:19:50", "remaining_time": "1 day, 20:32:09", "throughput": 27526.55, "total_tokens": 4293877248} +{"current_steps": 14640, "total_steps": 29667, "loss": 0.3542, "lr": 3.185359585119591e-05, "epoch": 1.4804601333628291, "percentage": 49.35, "elapsed_time": "1 day, 19:21:29", "remaining_time": "1 day, 20:30:15", "throughput": 27527.78, "total_tokens": 4296790528} +{"current_steps": 14650, 
"total_steps": 29667, "loss": 0.3606, "lr": 3.184713375796178e-05, "epoch": 1.481471415478937, "percentage": 49.38, "elapsed_time": "1 day, 19:23:09", "remaining_time": "1 day, 20:28:22", "throughput": 27528.94, "total_tokens": 4299740992} +{"current_steps": 14660, "total_steps": 29667, "loss": 0.3547, "lr": 3.1840675595999344e-05, "epoch": 1.4824826975950447, "percentage": 49.42, "elapsed_time": "1 day, 19:24:50", "remaining_time": "1 day, 20:26:30", "throughput": 27530.16, "total_tokens": 4302713600} +{"current_steps": 14670, "total_steps": 29667, "loss": 0.3561, "lr": 3.1834221361324155e-05, "epoch": 1.4834939797111526, "percentage": 49.45, "elapsed_time": "1 day, 19:26:31", "remaining_time": "1 day, 20:24:38", "throughput": 27531.01, "total_tokens": 4305628800} +{"current_steps": 14680, "total_steps": 29667, "loss": 0.3536, "lr": 3.182777104995744e-05, "epoch": 1.4845052618272603, "percentage": 49.48, "elapsed_time": "1 day, 19:28:11", "remaining_time": "1 day, 20:22:44", "throughput": 27532.17, "total_tokens": 4308554496} +{"current_steps": 14690, "total_steps": 29667, "loss": 0.3605, "lr": 3.182132465792609e-05, "epoch": 1.4855165439433682, "percentage": 49.52, "elapsed_time": "1 day, 19:29:46", "remaining_time": "1 day, 20:20:45", "throughput": 27533.7, "total_tokens": 4311409984} +{"current_steps": 14700, "total_steps": 29667, "loss": 0.3617, "lr": 3.181488218126259e-05, "epoch": 1.486527826059476, "percentage": 49.55, "elapsed_time": "1 day, 19:31:30", "remaining_time": "1 day, 20:18:56", "throughput": 27534.11, "total_tokens": 4314327104} +{"current_steps": 14710, "total_steps": 29667, "loss": 0.3547, "lr": 3.180844361600506e-05, "epoch": 1.487539108175584, "percentage": 49.58, "elapsed_time": "1 day, 19:33:10", "remaining_time": "1 day, 20:17:02", "throughput": 27535.3, "total_tokens": 4317263808} +{"current_steps": 14720, "total_steps": 29667, "loss": 0.3562, "lr": 3.180200895819722e-05, "epoch": 1.4885503902916917, "percentage": 49.62, "elapsed_time": 
"1 day, 19:34:52", "remaining_time": "1 day, 20:15:12", "throughput": 27535.88, "total_tokens": 4320183104} +{"current_steps": 14730, "total_steps": 29667, "loss": 0.3583, "lr": 3.1795578203888424e-05, "epoch": 1.4895616724077996, "percentage": 49.65, "elapsed_time": "1 day, 19:36:32", "remaining_time": "1 day, 20:13:18", "throughput": 27536.65, "total_tokens": 4323041728} +{"current_steps": 14740, "total_steps": 29667, "loss": 0.3535, "lr": 3.178915134913357e-05, "epoch": 1.4905729545239073, "percentage": 49.68, "elapsed_time": "1 day, 19:38:10", "remaining_time": "1 day, 20:11:23", "throughput": 27537.89, "total_tokens": 4325953792} +{"current_steps": 14750, "total_steps": 29667, "loss": 0.3545, "lr": 3.178272838999316e-05, "epoch": 1.4915842366400152, "percentage": 49.72, "elapsed_time": "1 day, 19:39:53", "remaining_time": "1 day, 20:09:33", "throughput": 27538.6, "total_tokens": 4328891008} +{"current_steps": 14760, "total_steps": 29667, "loss": 0.3573, "lr": 3.1776309322533274e-05, "epoch": 1.492595518756123, "percentage": 49.75, "elapsed_time": "1 day, 19:41:34", "remaining_time": "1 day, 20:07:40", "throughput": 27539.68, "total_tokens": 4331837376} +{"current_steps": 14770, "total_steps": 29667, "loss": 0.36, "lr": 3.1769894142825536e-05, "epoch": 1.4936068008722307, "percentage": 49.79, "elapsed_time": "1 day, 19:43:15", "remaining_time": "1 day, 20:05:48", "throughput": 27540.65, "total_tokens": 4334771328} +{"current_steps": 14780, "total_steps": 29667, "loss": 0.3593, "lr": 3.176348284694712e-05, "epoch": 1.4946180829883386, "percentage": 49.82, "elapsed_time": "1 day, 19:44:56", "remaining_time": "1 day, 20:03:56", "throughput": 27541.57, "total_tokens": 4337701632} +{"current_steps": 14790, "total_steps": 29667, "loss": 0.3585, "lr": 3.175707543098075e-05, "epoch": 1.4956293651044466, "percentage": 49.85, "elapsed_time": "1 day, 19:46:34", "remaining_time": "1 day, 20:02:01", "throughput": 27542.88, "total_tokens": 4340605760} +{"current_steps": 
14800, "total_steps": 29667, "loss": 0.3522, "lr": 3.1750671891014653e-05, "epoch": 1.4966406472205542, "percentage": 49.89, "elapsed_time": "1 day, 19:48:18", "remaining_time": "1 day, 20:00:12", "throughput": 27543.46, "total_tokens": 4343555648} +{"current_steps": 14810, "total_steps": 29667, "loss": 0.3552, "lr": 3.174427222314262e-05, "epoch": 1.4976519293366621, "percentage": 49.92, "elapsed_time": "1 day, 19:49:57", "remaining_time": "1 day, 19:58:18", "throughput": 27544.5, "total_tokens": 4346447424} +{"current_steps": 14820, "total_steps": 29667, "loss": 0.358, "lr": 3.173787642346391e-05, "epoch": 1.49866321145277, "percentage": 49.95, "elapsed_time": "1 day, 19:51:34", "remaining_time": "1 day, 19:56:22", "throughput": 27545.99, "total_tokens": 4349371200} +{"current_steps": 14830, "total_steps": 29667, "loss": 0.3518, "lr": 3.173148448808331e-05, "epoch": 1.4996744935688777, "percentage": 49.99, "elapsed_time": "1 day, 19:53:17", "remaining_time": "1 day, 19:54:31", "throughput": 27546.64, "total_tokens": 4352290688} +{"current_steps": 14840, "total_steps": 29667, "loss": 0.354, "lr": 3.172509641311107e-05, "epoch": 1.5006857756849856, "percentage": 50.02, "elapsed_time": "1 day, 19:54:55", "remaining_time": "1 day, 19:52:37", "throughput": 27547.7, "total_tokens": 4355177408} +{"current_steps": 14850, "total_steps": 29667, "loss": 0.3547, "lr": 3.171871219466293e-05, "epoch": 1.5016970578010933, "percentage": 50.06, "elapsed_time": "1 day, 19:56:37", "remaining_time": "1 day, 19:50:46", "throughput": 27548.65, "total_tokens": 4358133696} +{"current_steps": 14860, "total_steps": 29667, "loss": 0.359, "lr": 3.171233182886011e-05, "epoch": 1.5027083399172012, "percentage": 50.09, "elapsed_time": "1 day, 19:58:19", "remaining_time": "1 day, 19:48:54", "throughput": 27549.43, "total_tokens": 4361062784} +{"current_steps": 14870, "total_steps": 29667, "loss": 0.3575, "lr": 3.170595531182928e-05, "epoch": 1.5037196220333091, "percentage": 50.12, 
"elapsed_time": "1 day, 19:59:59", "remaining_time": "1 day, 19:47:02", "throughput": 27550.71, "total_tokens": 4364031872} +{"current_steps": 14880, "total_steps": 29667, "loss": 0.3622, "lr": 3.169958263970256e-05, "epoch": 1.504730904149417, "percentage": 50.16, "elapsed_time": "1 day, 20:01:40", "remaining_time": "1 day, 19:45:09", "throughput": 27551.89, "total_tokens": 4366987392} +{"current_steps": 14890, "total_steps": 29667, "loss": 0.3523, "lr": 3.169321380861751e-05, "epoch": 1.505742186265525, "percentage": 50.19, "elapsed_time": "1 day, 20:03:21", "remaining_time": "1 day, 19:43:18", "throughput": 27552.66, "total_tokens": 4369899712} +{"current_steps": 14900, "total_steps": 29667, "loss": 0.357, "lr": 3.168684881471711e-05, "epoch": 1.5067534683816326, "percentage": 50.22, "elapsed_time": "1 day, 20:05:00", "remaining_time": "1 day, 19:41:23", "throughput": 27554.01, "total_tokens": 4372821120} +{"current_steps": 14910, "total_steps": 29667, "loss": 0.3562, "lr": 3.168048765414979e-05, "epoch": 1.5077647504977403, "percentage": 50.26, "elapsed_time": "1 day, 20:06:35", "remaining_time": "1 day, 19:39:26", "throughput": 27555.53, "total_tokens": 4375702400} +{"current_steps": 14920, "total_steps": 29667, "loss": 0.3544, "lr": 3.167413032306936e-05, "epoch": 1.5087760326138482, "percentage": 50.29, "elapsed_time": "1 day, 20:08:17", "remaining_time": "1 day, 19:37:34", "throughput": 27556.41, "total_tokens": 4378641600} +{"current_steps": 14930, "total_steps": 29667, "loss": 0.357, "lr": 3.166777681763504e-05, "epoch": 1.509787314729956, "percentage": 50.33, "elapsed_time": "1 day, 20:09:55", "remaining_time": "1 day, 19:35:40", "throughput": 27557.64, "total_tokens": 4381549440} +{"current_steps": 14940, "total_steps": 29667, "loss": 0.3532, "lr": 3.166142713401144e-05, "epoch": 1.510798596846064, "percentage": 50.36, "elapsed_time": "1 day, 20:11:38", "remaining_time": "1 day, 19:33:50", "throughput": 27558.2, "total_tokens": 4384473600} 
+{"current_steps": 14950, "total_steps": 29667, "loss": 0.3544, "lr": 3.165508126836857e-05, "epoch": 1.511809878962172, "percentage": 50.39, "elapsed_time": "1 day, 20:13:21", "remaining_time": "1 day, 19:32:00", "throughput": 27558.51, "total_tokens": 4387358848} +{"current_steps": 14960, "total_steps": 29667, "loss": 0.3544, "lr": 3.164873921688177e-05, "epoch": 1.5128211610782796, "percentage": 50.43, "elapsed_time": "1 day, 20:15:13", "remaining_time": "1 day, 19:30:18", "throughput": 27557.69, "total_tokens": 4390299968} +{"current_steps": 14970, "total_steps": 29667, "loss": 0.3521, "lr": 3.164240097573178e-05, "epoch": 1.5138324431943873, "percentage": 50.46, "elapsed_time": "1 day, 20:16:55", "remaining_time": "1 day, 19:28:27", "throughput": 27558.47, "total_tokens": 4393237760} +{"current_steps": 14980, "total_steps": 29667, "loss": 0.3584, "lr": 3.163606654110467e-05, "epoch": 1.5148437253104952, "percentage": 50.49, "elapsed_time": "1 day, 20:18:36", "remaining_time": "1 day, 19:26:36", "throughput": 27559.33, "total_tokens": 4396175296} +{"current_steps": 14990, "total_steps": 29667, "loss": 0.3593, "lr": 3.162973590919187e-05, "epoch": 1.515855007426603, "percentage": 50.53, "elapsed_time": "1 day, 20:20:15", "remaining_time": "1 day, 19:24:43", "throughput": 27560.63, "total_tokens": 4399116800} +{"current_steps": 15000, "total_steps": 29667, "loss": 0.3556, "lr": 3.162340907619012e-05, "epoch": 1.516866289542711, "percentage": 50.56, "elapsed_time": "1 day, 20:21:59", "remaining_time": "1 day, 19:22:53", "throughput": 27561.4, "total_tokens": 4402080256} +{"current_steps": 15000, "total_steps": 29667, "eval_loss": 0.33106303215026855, "epoch": 1.516866289542711, "percentage": 50.56, "elapsed_time": "1 day, 20:22:00", "remaining_time": "1 day, 19:22:55", "throughput": 27561.09, "total_tokens": 4402080256} +{"current_steps": 15010, "total_steps": 29667, "loss": 0.3536, "lr": 3.1617086038301516e-05, "epoch": 1.5178775716588186, "percentage": 50.59, 
"elapsed_time": "1 day, 20:24:19", "remaining_time": "1 day, 19:21:39", "throughput": 27555.91, "total_tokens": 4405059968} +{"current_steps": 15020, "total_steps": 29667, "loss": 0.3558, "lr": 3.161076679173344e-05, "epoch": 1.5188888537749266, "percentage": 50.63, "elapsed_time": "1 day, 20:26:01", "remaining_time": "1 day, 19:19:49", "throughput": 27556.73, "total_tokens": 4408022464} +{"current_steps": 15030, "total_steps": 29667, "loss": 0.3566, "lr": 3.1604451332698575e-05, "epoch": 1.5199001358910342, "percentage": 50.66, "elapsed_time": "1 day, 20:27:37", "remaining_time": "1 day, 19:17:52", "throughput": 27558.3, "total_tokens": 4410906752} +{"current_steps": 15040, "total_steps": 29667, "loss": 0.3575, "lr": 3.1598139657414923e-05, "epoch": 1.5209114180071421, "percentage": 50.7, "elapsed_time": "1 day, 20:29:14", "remaining_time": "1 day, 19:15:56", "throughput": 27559.68, "total_tokens": 4413797248} +{"current_steps": 15050, "total_steps": 29667, "loss": 0.3579, "lr": 3.159183176210574e-05, "epoch": 1.52192270012325, "percentage": 50.73, "elapsed_time": "1 day, 20:30:53", "remaining_time": "1 day, 19:14:03", "throughput": 27560.9, "total_tokens": 4416743360} +{"current_steps": 15060, "total_steps": 29667, "loss": 0.3569, "lr": 3.1585527642999595e-05, "epoch": 1.522933982239358, "percentage": 50.76, "elapsed_time": "1 day, 20:32:32", "remaining_time": "1 day, 19:12:08", "throughput": 27562.18, "total_tokens": 4419655488} +{"current_steps": 15070, "total_steps": 29667, "loss": 0.3581, "lr": 3.1579227296330294e-05, "epoch": 1.5239452643554656, "percentage": 50.8, "elapsed_time": "1 day, 20:34:10", "remaining_time": "1 day, 19:10:14", "throughput": 27563.36, "total_tokens": 4422547328} +{"current_steps": 15080, "total_steps": 29667, "loss": 0.3598, "lr": 3.157293071833691e-05, "epoch": 1.5249565464715735, "percentage": 50.83, "elapsed_time": "1 day, 20:35:48", "remaining_time": "1 day, 19:08:19", "throughput": 27564.75, "total_tokens": 4425484544} 
+{"current_steps": 15090, "total_steps": 29667, "loss": 0.3596, "lr": 3.156663790526375e-05, "epoch": 1.5259678285876812, "percentage": 50.86, "elapsed_time": "1 day, 20:37:31", "remaining_time": "1 day, 19:06:29", "throughput": 27565.54, "total_tokens": 4428436928} +{"current_steps": 15100, "total_steps": 29667, "loss": 0.357, "lr": 3.156034885336039e-05, "epoch": 1.526979110703789, "percentage": 50.9, "elapsed_time": "1 day, 20:39:13", "remaining_time": "1 day, 19:04:39", "throughput": 27566.38, "total_tokens": 4431395200} +{"current_steps": 15110, "total_steps": 29667, "loss": 0.3562, "lr": 3.155406355888161e-05, "epoch": 1.527990392819897, "percentage": 50.93, "elapsed_time": "1 day, 20:40:55", "remaining_time": "1 day, 19:02:48", "throughput": 27566.88, "total_tokens": 4434296000} +{"current_steps": 15120, "total_steps": 29667, "loss": 0.3559, "lr": 3.1547782018087407e-05, "epoch": 1.529001674936005, "percentage": 50.97, "elapsed_time": "1 day, 20:42:38", "remaining_time": "1 day, 19:00:58", "throughput": 27567.83, "total_tokens": 4437273408} +{"current_steps": 15130, "total_steps": 29667, "loss": 0.3573, "lr": 3.154150422724299e-05, "epoch": 1.5300129570521126, "percentage": 51.0, "elapsed_time": "1 day, 20:44:17", "remaining_time": "1 day, 18:59:04", "throughput": 27568.9, "total_tokens": 4440173376} +{"current_steps": 15140, "total_steps": 29667, "loss": 0.3514, "lr": 3.1535230182618783e-05, "epoch": 1.5310242391682205, "percentage": 51.03, "elapsed_time": "1 day, 20:45:58", "remaining_time": "1 day, 18:57:12", "throughput": 27569.97, "total_tokens": 4443121984} +{"current_steps": 15150, "total_steps": 29667, "loss": 0.3548, "lr": 3.1528959880490387e-05, "epoch": 1.5320355212843282, "percentage": 51.07, "elapsed_time": "1 day, 20:47:37", "remaining_time": "1 day, 18:55:20", "throughput": 27571.11, "total_tokens": 4446062400} +{"current_steps": 15160, "total_steps": 29667, "loss": 0.3542, "lr": 3.152269331713859e-05, "epoch": 1.533046803400436, "percentage": 
51.1, "elapsed_time": "1 day, 20:49:17", "remaining_time": "1 day, 18:53:27", "throughput": 27572.44, "total_tokens": 4449025792} +{"current_steps": 15170, "total_steps": 29667, "loss": 0.3517, "lr": 3.151643048884935e-05, "epoch": 1.534058085516544, "percentage": 51.13, "elapsed_time": "1 day, 20:50:56", "remaining_time": "1 day, 18:51:34", "throughput": 27573.44, "total_tokens": 4451921728} +{"current_steps": 15180, "total_steps": 29667, "loss": 0.3552, "lr": 3.151017139191379e-05, "epoch": 1.535069367632652, "percentage": 51.17, "elapsed_time": "1 day, 20:52:38", "remaining_time": "1 day, 18:49:43", "throughput": 27574.17, "total_tokens": 4454842880} +{"current_steps": 15190, "total_steps": 29667, "loss": 0.354, "lr": 3.150391602262818e-05, "epoch": 1.5360806497487596, "percentage": 51.2, "elapsed_time": "1 day, 20:54:20", "remaining_time": "1 day, 18:47:52", "throughput": 27574.86, "total_tokens": 4457773952} +{"current_steps": 15200, "total_steps": 29667, "loss": 0.3537, "lr": 3.149766437729394e-05, "epoch": 1.5370919318648675, "percentage": 51.24, "elapsed_time": "1 day, 20:55:56", "remaining_time": "1 day, 18:45:56", "throughput": 27576.32, "total_tokens": 4460654592} +{"current_steps": 15210, "total_steps": 29667, "loss": 0.3544, "lr": 3.1491416452217635e-05, "epoch": 1.5381032139809752, "percentage": 51.27, "elapsed_time": "1 day, 20:57:38", "remaining_time": "1 day, 18:44:05", "throughput": 27577.4, "total_tokens": 4463642496} +{"current_steps": 15220, "total_steps": 29667, "loss": 0.3562, "lr": 3.1485172243710954e-05, "epoch": 1.539114496097083, "percentage": 51.3, "elapsed_time": "1 day, 20:59:20", "remaining_time": "1 day, 18:42:15", "throughput": 27578.28, "total_tokens": 4466603776} +{"current_steps": 15230, "total_steps": 29667, "loss": 0.3572, "lr": 3.1478931748090676e-05, "epoch": 1.540125778213191, "percentage": 51.34, "elapsed_time": "1 day, 21:01:01", "remaining_time": "1 day, 18:40:23", "throughput": 27579.16, "total_tokens": 4469521792} 
+{"current_steps": 15240, "total_steps": 29667, "loss": 0.3548, "lr": 3.147269496167873e-05, "epoch": 1.5411370603292989, "percentage": 51.37, "elapsed_time": "1 day, 21:02:39", "remaining_time": "1 day, 18:38:28", "throughput": 27580.41, "total_tokens": 4472426752} +{"current_steps": 15250, "total_steps": 29667, "loss": 0.351, "lr": 3.1466461880802105e-05, "epoch": 1.5421483424454066, "percentage": 51.4, "elapsed_time": "1 day, 21:04:24", "remaining_time": "1 day, 18:36:41", "throughput": 27580.93, "total_tokens": 4475404352} +{"current_steps": 15260, "total_steps": 29667, "loss": 0.3516, "lr": 3.146023250179291e-05, "epoch": 1.5431596245615142, "percentage": 51.44, "elapsed_time": "1 day, 21:06:04", "remaining_time": "1 day, 18:34:48", "throughput": 27581.9, "total_tokens": 4478321600} +{"current_steps": 15270, "total_steps": 29667, "loss": 0.3541, "lr": 3.145400682098833e-05, "epoch": 1.5441709066776221, "percentage": 51.47, "elapsed_time": "1 day, 21:07:41", "remaining_time": "1 day, 18:32:53", "throughput": 27583.54, "total_tokens": 4481252224} +{"current_steps": 15280, "total_steps": 29667, "loss": 0.3506, "lr": 3.14477848347306e-05, "epoch": 1.54518218879373, "percentage": 51.51, "elapsed_time": "1 day, 21:09:21", "remaining_time": "1 day, 18:31:01", "throughput": 27584.64, "total_tokens": 4484212544} +{"current_steps": 15290, "total_steps": 29667, "loss": 0.3588, "lr": 3.144156653936703e-05, "epoch": 1.546193470909838, "percentage": 51.54, "elapsed_time": "1 day, 21:11:01", "remaining_time": "1 day, 18:29:08", "throughput": 27585.81, "total_tokens": 4487144576} +{"current_steps": 15300, "total_steps": 29667, "loss": 0.3501, "lr": 3.1435351931250004e-05, "epoch": 1.5472047530259458, "percentage": 51.57, "elapsed_time": "1 day, 21:12:45", "remaining_time": "1 day, 18:27:20", "throughput": 27586.47, "total_tokens": 4490125888} +{"current_steps": 15310, "total_steps": 29667, "loss": 0.3562, "lr": 3.142914100673692e-05, "epoch": 1.5482160351420535, "percentage": 
51.61, "elapsed_time": "1 day, 21:14:20", "remaining_time": "1 day, 18:25:23", "throughput": 27588.21, "total_tokens": 4493042368} +{"current_steps": 15320, "total_steps": 29667, "loss": 0.3622, "lr": 3.1422933762190235e-05, "epoch": 1.5492273172581612, "percentage": 51.64, "elapsed_time": "1 day, 21:16:06", "remaining_time": "1 day, 18:23:36", "throughput": 27588.58, "total_tokens": 4496012352} +{"current_steps": 15330, "total_steps": 29667, "loss": 0.3558, "lr": 3.141673019397741e-05, "epoch": 1.550238599374269, "percentage": 51.67, "elapsed_time": "1 day, 21:17:50", "remaining_time": "1 day, 18:21:47", "throughput": 27589.15, "total_tokens": 4498983488} +{"current_steps": 15340, "total_steps": 29667, "loss": 0.3595, "lr": 3.141053029847095e-05, "epoch": 1.551249881490377, "percentage": 51.71, "elapsed_time": "1 day, 21:19:29", "remaining_time": "1 day, 18:19:54", "throughput": 27590.26, "total_tokens": 4501887552} +{"current_steps": 15350, "total_steps": 29667, "loss": 0.3607, "lr": 3.140433407204835e-05, "epoch": 1.552261163606485, "percentage": 51.74, "elapsed_time": "1 day, 21:21:06", "remaining_time": "1 day, 18:17:59", "throughput": 27591.53, "total_tokens": 4504769280} +{"current_steps": 15360, "total_steps": 29667, "loss": 0.3615, "lr": 3.1398141511092124e-05, "epoch": 1.5532724457225928, "percentage": 51.77, "elapsed_time": "1 day, 21:22:44", "remaining_time": "1 day, 18:16:05", "throughput": 27592.91, "total_tokens": 4507714048} +{"current_steps": 15370, "total_steps": 29667, "loss": 0.3569, "lr": 3.1391952611989736e-05, "epoch": 1.5542837278387005, "percentage": 51.81, "elapsed_time": "1 day, 21:24:22", "remaining_time": "1 day, 18:14:11", "throughput": 27594.08, "total_tokens": 4510606400} +{"current_steps": 15380, "total_steps": 29667, "loss": 0.3565, "lr": 3.138576737113369e-05, "epoch": 1.5552950099548082, "percentage": 51.84, "elapsed_time": "1 day, 21:26:04", "remaining_time": "1 day, 18:12:20", "throughput": 27594.96, "total_tokens": 4513565504} 
+{"current_steps": 15390, "total_steps": 29667, "loss": 0.3544, "lr": 3.137958578492143e-05, "epoch": 1.556306292070916, "percentage": 51.88, "elapsed_time": "1 day, 21:27:45", "remaining_time": "1 day, 18:10:28", "throughput": 27596.23, "total_tokens": 4516541056} +{"current_steps": 15400, "total_steps": 29667, "loss": 0.3536, "lr": 3.137340784975535e-05, "epoch": 1.557317574187024, "percentage": 51.91, "elapsed_time": "1 day, 21:29:26", "remaining_time": "1 day, 18:08:38", "throughput": 27596.95, "total_tokens": 4519466816} +{"current_steps": 15410, "total_steps": 29667, "loss": 0.3588, "lr": 3.136723356204285e-05, "epoch": 1.558328856303132, "percentage": 51.94, "elapsed_time": "1 day, 21:31:05", "remaining_time": "1 day, 18:06:44", "throughput": 27598.19, "total_tokens": 4522395648} +{"current_steps": 15420, "total_steps": 29667, "loss": 0.3538, "lr": 3.136106291819622e-05, "epoch": 1.5593401384192398, "percentage": 51.98, "elapsed_time": "1 day, 21:32:45", "remaining_time": "1 day, 18:04:52", "throughput": 27599.46, "total_tokens": 4525347840} +{"current_steps": 15430, "total_steps": 29667, "loss": 0.3533, "lr": 3.1354895914632736e-05, "epoch": 1.5603514205353475, "percentage": 52.01, "elapsed_time": "1 day, 21:34:34", "remaining_time": "1 day, 18:03:08", "throughput": 27599.09, "total_tokens": 4528301056} +{"current_steps": 15440, "total_steps": 29667, "loss": 0.3569, "lr": 3.1348732547774575e-05, "epoch": 1.5613627026514552, "percentage": 52.04, "elapsed_time": "1 day, 21:36:13", "remaining_time": "1 day, 18:01:15", "throughput": 27600.13, "total_tokens": 4531218048} +{"current_steps": 15450, "total_steps": 29667, "loss": 0.3545, "lr": 3.134257281404883e-05, "epoch": 1.562373984767563, "percentage": 52.08, "elapsed_time": "1 day, 21:37:52", "remaining_time": "1 day, 17:59:22", "throughput": 27601.41, "total_tokens": 4534151168} +{"current_steps": 15460, "total_steps": 29667, "loss": 0.3511, "lr": 3.133641670988755e-05, "epoch": 1.563385266883671, 
"percentage": 52.11, "elapsed_time": "1 day, 21:39:33", "remaining_time": "1 day, 17:57:31", "throughput": 27602.4, "total_tokens": 4537114304} +{"current_steps": 15470, "total_steps": 29667, "loss": 0.3504, "lr": 3.133026423172764e-05, "epoch": 1.5643965489997789, "percentage": 52.15, "elapsed_time": "1 day, 21:41:15", "remaining_time": "1 day, 17:55:41", "throughput": 27603.5, "total_tokens": 4540104896} +{"current_steps": 15480, "total_steps": 29667, "loss": 0.3578, "lr": 3.1324115376010897e-05, "epoch": 1.5654078311158868, "percentage": 52.18, "elapsed_time": "1 day, 21:42:53", "remaining_time": "1 day, 17:53:47", "throughput": 27604.72, "total_tokens": 4543017600} +{"current_steps": 15490, "total_steps": 29667, "loss": 0.3545, "lr": 3.131797013918406e-05, "epoch": 1.5664191132319945, "percentage": 52.21, "elapsed_time": "1 day, 21:44:31", "remaining_time": "1 day, 17:51:53", "throughput": 27606.06, "total_tokens": 4545928704} +{"current_steps": 15500, "total_steps": 29667, "loss": 0.3575, "lr": 3.13118285176987e-05, "epoch": 1.5674303953481021, "percentage": 52.25, "elapsed_time": "1 day, 21:46:16", "remaining_time": "1 day, 17:50:05", "throughput": 27606.5, "total_tokens": 4548908288} +{"current_steps": 15510, "total_steps": 29667, "loss": 0.3551, "lr": 3.130569050801126e-05, "epoch": 1.56844167746421, "percentage": 52.28, "elapsed_time": "1 day, 21:47:58", "remaining_time": "1 day, 17:48:15", "throughput": 27607.45, "total_tokens": 4551886848} +{"current_steps": 15520, "total_steps": 29667, "loss": 0.3556, "lr": 3.129955610658306e-05, "epoch": 1.569452959580318, "percentage": 52.31, "elapsed_time": "1 day, 21:49:36", "remaining_time": "1 day, 17:46:21", "throughput": 27608.88, "total_tokens": 4554813056} +{"current_steps": 15530, "total_steps": 29667, "loss": 0.3635, "lr": 3.129342530988025e-05, "epoch": 1.5704642416964258, "percentage": 52.35, "elapsed_time": "1 day, 21:51:15", "remaining_time": "1 day, 17:44:28", "throughput": 27609.88, "total_tokens": 
4557723712} +{"current_steps": 15540, "total_steps": 29667, "loss": 0.354, "lr": 3.128729811437385e-05, "epoch": 1.5714755238125335, "percentage": 52.38, "elapsed_time": "1 day, 21:52:53", "remaining_time": "1 day, 17:42:34", "throughput": 27611.13, "total_tokens": 4560629056} +{"current_steps": 15550, "total_steps": 29667, "loss": 0.3549, "lr": 3.12811745165397e-05, "epoch": 1.5724868059286414, "percentage": 52.42, "elapsed_time": "1 day, 21:54:30", "remaining_time": "1 day, 17:40:40", "throughput": 27612.32, "total_tokens": 4563507136} +{"current_steps": 15560, "total_steps": 29667, "loss": 0.355, "lr": 3.127505451285846e-05, "epoch": 1.573498088044749, "percentage": 52.45, "elapsed_time": "1 day, 21:56:08", "remaining_time": "1 day, 17:38:46", "throughput": 27613.8, "total_tokens": 4566452160} +{"current_steps": 15570, "total_steps": 29667, "loss": 0.354, "lr": 3.126893809981563e-05, "epoch": 1.574509370160857, "percentage": 52.48, "elapsed_time": "1 day, 21:57:51", "remaining_time": "1 day, 17:36:56", "throughput": 27614.61, "total_tokens": 4569428928} +{"current_steps": 15580, "total_steps": 29667, "loss": 0.3588, "lr": 3.126282527390149e-05, "epoch": 1.575520652276965, "percentage": 52.52, "elapsed_time": "1 day, 21:59:28", "remaining_time": "1 day, 17:35:02", "throughput": 27615.69, "total_tokens": 4572279872} +{"current_steps": 15590, "total_steps": 29667, "loss": 0.3533, "lr": 3.1256716031611146e-05, "epoch": 1.5765319343930728, "percentage": 52.55, "elapsed_time": "1 day, 22:01:09", "remaining_time": "1 day, 17:33:11", "throughput": 27616.79, "total_tokens": 4575261504} +{"current_steps": 15600, "total_steps": 29667, "loss": 0.3527, "lr": 3.1250610369444475e-05, "epoch": 1.5775432165091805, "percentage": 52.58, "elapsed_time": "1 day, 22:02:44", "remaining_time": "1 day, 17:31:14", "throughput": 27618.38, "total_tokens": 4578145984} +{"current_steps": 15610, "total_steps": 29667, "loss": 0.3527, "lr": 3.124450828390616e-05, "epoch": 1.5785544986252884, 
"percentage": 52.62, "elapsed_time": "1 day, 22:04:22", "remaining_time": "1 day, 17:29:21", "throughput": 27619.77, "total_tokens": 4581093056} +{"current_steps": 15620, "total_steps": 29667, "loss": 0.3604, "lr": 3.123840977150566e-05, "epoch": 1.579565780741396, "percentage": 52.65, "elapsed_time": "1 day, 22:06:01", "remaining_time": "1 day, 17:27:28", "throughput": 27621.05, "total_tokens": 4584042240} +{"current_steps": 15630, "total_steps": 29667, "loss": 0.3571, "lr": 3.123231482875717e-05, "epoch": 1.580577062857504, "percentage": 52.68, "elapsed_time": "1 day, 22:07:40", "remaining_time": "1 day, 17:25:35", "throughput": 27622.3, "total_tokens": 4586967168} +{"current_steps": 15640, "total_steps": 29667, "loss": 0.3546, "lr": 3.122622345217967e-05, "epoch": 1.581588344973612, "percentage": 52.72, "elapsed_time": "1 day, 22:09:21", "remaining_time": "1 day, 17:23:44", "throughput": 27623.08, "total_tokens": 4589885120} +{"current_steps": 15650, "total_steps": 29667, "loss": 0.355, "lr": 3.12201356382969e-05, "epoch": 1.5825996270897198, "percentage": 52.75, "elapsed_time": "1 day, 22:10:55", "remaining_time": "1 day, 17:21:47", "throughput": 27624.85, "total_tokens": 4592777728} +{"current_steps": 15660, "total_steps": 29667, "loss": 0.3528, "lr": 3.1214051383637304e-05, "epoch": 1.5836109092058275, "percentage": 52.79, "elapsed_time": "1 day, 22:12:37", "remaining_time": "1 day, 17:19:57", "throughput": 27625.93, "total_tokens": 4595786304} +{"current_steps": 15670, "total_steps": 29667, "loss": 0.3581, "lr": 3.1207970684734104e-05, "epoch": 1.5846221913219354, "percentage": 52.82, "elapsed_time": "1 day, 22:14:14", "remaining_time": "1 day, 17:18:03", "throughput": 27627.19, "total_tokens": 4598670912} +{"current_steps": 15680, "total_steps": 29667, "loss": 0.3579, "lr": 3.120189353812521e-05, "epoch": 1.585633473438043, "percentage": 52.85, "elapsed_time": "1 day, 22:15:53", "remaining_time": "1 day, 17:16:10", "throughput": 27628.2, "total_tokens": 
4601583808} +{"current_steps": 15690, "total_steps": 29667, "loss": 0.3566, "lr": 3.1195819940353294e-05, "epoch": 1.586644755554151, "percentage": 52.89, "elapsed_time": "1 day, 22:17:32", "remaining_time": "1 day, 17:14:17", "throughput": 27629.47, "total_tokens": 4604512256} +{"current_steps": 15700, "total_steps": 29667, "loss": 0.3521, "lr": 3.1189749887965684e-05, "epoch": 1.5876560376702589, "percentage": 52.92, "elapsed_time": "1 day, 22:19:12", "remaining_time": "1 day, 17:12:25", "throughput": 27630.66, "total_tokens": 4607473216} +{"current_steps": 15710, "total_steps": 29667, "loss": 0.3567, "lr": 3.118368337751443e-05, "epoch": 1.5886673197863668, "percentage": 52.95, "elapsed_time": "1 day, 22:20:51", "remaining_time": "1 day, 17:10:33", "throughput": 27631.57, "total_tokens": 4610373120} +{"current_steps": 15720, "total_steps": 29667, "loss": 0.3556, "lr": 3.1177620405556305e-05, "epoch": 1.5896786019024745, "percentage": 52.99, "elapsed_time": "1 day, 22:22:28", "remaining_time": "1 day, 17:08:38", "throughput": 27633.05, "total_tokens": 4613292352} +{"current_steps": 15730, "total_steps": 29667, "loss": 0.3534, "lr": 3.117156096865272e-05, "epoch": 1.5906898840185824, "percentage": 53.02, "elapsed_time": "1 day, 22:24:07", "remaining_time": "1 day, 17:06:46", "throughput": 27634.4, "total_tokens": 4616257152} +{"current_steps": 15740, "total_steps": 29667, "loss": 0.3607, "lr": 3.116550506336979e-05, "epoch": 1.59170116613469, "percentage": 53.06, "elapsed_time": "1 day, 22:25:48", "remaining_time": "1 day, 17:04:55", "throughput": 27635.42, "total_tokens": 4619207552} +{"current_steps": 15750, "total_steps": 29667, "loss": 0.3536, "lr": 3.11594526862783e-05, "epoch": 1.592712448250798, "percentage": 53.09, "elapsed_time": "1 day, 22:27:30", "remaining_time": "1 day, 17:03:06", "throughput": 27636.25, "total_tokens": 4622186560} +{"current_steps": 15760, "total_steps": 29667, "loss": 0.3605, "lr": 3.115340383395367e-05, "epoch": 1.5937237303669058, 
"percentage": 53.12, "elapsed_time": "1 day, 22:29:07", "remaining_time": "1 day, 17:01:11", "throughput": 27637.63, "total_tokens": 4625090496} +{"current_steps": 15770, "total_steps": 29667, "loss": 0.3526, "lr": 3.1147358502975995e-05, "epoch": 1.5947350124830137, "percentage": 53.16, "elapsed_time": "1 day, 22:30:42", "remaining_time": "1 day, 16:59:15", "throughput": 27639.08, "total_tokens": 4627964864} +{"current_steps": 15780, "total_steps": 29667, "loss": 0.3566, "lr": 3.114131668993e-05, "epoch": 1.5957462945991214, "percentage": 53.19, "elapsed_time": "1 day, 22:32:15", "remaining_time": "1 day, 16:57:17", "throughput": 27640.66, "total_tokens": 4630790592} +{"current_steps": 15790, "total_steps": 29667, "loss": 0.3529, "lr": 3.113527839140507e-05, "epoch": 1.5967575767152293, "percentage": 53.22, "elapsed_time": "1 day, 22:33:52", "remaining_time": "1 day, 16:55:23", "throughput": 27641.91, "total_tokens": 4633681088} +{"current_steps": 15800, "total_steps": 29667, "loss": 0.3514, "lr": 3.112924360399517e-05, "epoch": 1.597768858831337, "percentage": 53.26, "elapsed_time": "1 day, 22:35:35", "remaining_time": "1 day, 16:53:34", "throughput": 27642.55, "total_tokens": 4636625088} +{"current_steps": 15810, "total_steps": 29667, "loss": 0.3582, "lr": 3.112321232429894e-05, "epoch": 1.598780140947445, "percentage": 53.29, "elapsed_time": "1 day, 22:37:14", "remaining_time": "1 day, 16:51:41", "throughput": 27643.79, "total_tokens": 4639578880} +{"current_steps": 15820, "total_steps": 29667, "loss": 0.3539, "lr": 3.11171845489196e-05, "epoch": 1.5997914230635528, "percentage": 53.33, "elapsed_time": "1 day, 22:38:55", "remaining_time": "1 day, 16:49:51", "throughput": 27644.8, "total_tokens": 4642542336} +{"current_steps": 15830, "total_steps": 29667, "loss": 0.3537, "lr": 3.1111160274464965e-05, "epoch": 1.6008027051796607, "percentage": 53.36, "elapsed_time": "1 day, 22:40:36", "remaining_time": "1 day, 16:48:00", "throughput": 27645.83, "total_tokens": 
4645516672} +{"current_steps": 15840, "total_steps": 29667, "loss": 0.3489, "lr": 3.1105139497547466e-05, "epoch": 1.6018139872957684, "percentage": 53.39, "elapsed_time": "1 day, 22:42:13", "remaining_time": "1 day, 16:46:06", "throughput": 27647.27, "total_tokens": 4648445312} +{"current_steps": 15850, "total_steps": 29667, "loss": 0.3539, "lr": 3.109912221478411e-05, "epoch": 1.602825269411876, "percentage": 53.43, "elapsed_time": "1 day, 22:43:51", "remaining_time": "1 day, 16:44:13", "throughput": 27648.7, "total_tokens": 4651390784} +{"current_steps": 15860, "total_steps": 29667, "loss": 0.3529, "lr": 3.10931084227965e-05, "epoch": 1.603836551527984, "percentage": 53.46, "elapsed_time": "1 day, 22:45:34", "remaining_time": "1 day, 16:42:24", "throughput": 27649.49, "total_tokens": 4654357696} +{"current_steps": 15870, "total_steps": 29667, "loss": 0.3581, "lr": 3.108709811821079e-05, "epoch": 1.604847833644092, "percentage": 53.49, "elapsed_time": "1 day, 22:47:15", "remaining_time": "1 day, 16:40:33", "throughput": 27650.48, "total_tokens": 4657312192} +{"current_steps": 15880, "total_steps": 29667, "loss": 0.3575, "lr": 3.1081091297657696e-05, "epoch": 1.6058591157601998, "percentage": 53.53, "elapsed_time": "1 day, 22:48:54", "remaining_time": "1 day, 16:38:41", "throughput": 27651.58, "total_tokens": 4660253632} +{"current_steps": 15890, "total_steps": 29667, "loss": 0.3527, "lr": 3.107508795777251e-05, "epoch": 1.6068703978763077, "percentage": 53.56, "elapsed_time": "1 day, 22:50:32", "remaining_time": "1 day, 16:36:48", "throughput": 27652.75, "total_tokens": 4663154176} +{"current_steps": 15900, "total_steps": 29667, "loss": 0.3569, "lr": 3.1069088095195056e-05, "epoch": 1.6078816799924154, "percentage": 53.59, "elapsed_time": "1 day, 22:52:12", "remaining_time": "1 day, 16:34:56", "throughput": 27653.89, "total_tokens": 4666105792} +{"current_steps": 15910, "total_steps": 29667, "loss": 0.3573, "lr": 3.1063091706569703e-05, "epoch": 
1.608892962108523, "percentage": 53.63, "elapsed_time": "1 day, 22:53:53", "remaining_time": "1 day, 16:33:06", "throughput": 27654.76, "total_tokens": 4669061184} +{"current_steps": 15920, "total_steps": 29667, "loss": 0.3543, "lr": 3.105709878854535e-05, "epoch": 1.609904244224631, "percentage": 53.66, "elapsed_time": "1 day, 22:55:34", "remaining_time": "1 day, 16:31:15", "throughput": 27655.8, "total_tokens": 4672022144} +{"current_steps": 15930, "total_steps": 29667, "loss": 0.3564, "lr": 3.105110933777541e-05, "epoch": 1.6109155263407389, "percentage": 53.7, "elapsed_time": "1 day, 22:57:17", "remaining_time": "1 day, 16:29:26", "throughput": 27656.68, "total_tokens": 4675007232} +{"current_steps": 15940, "total_steps": 29667, "loss": 0.3519, "lr": 3.104512335091783e-05, "epoch": 1.6119268084568468, "percentage": 53.73, "elapsed_time": "1 day, 22:58:57", "remaining_time": "1 day, 16:27:35", "throughput": 27657.65, "total_tokens": 4677951360} +{"current_steps": 15950, "total_steps": 29667, "loss": 0.3599, "lr": 3.1039140824635074e-05, "epoch": 1.6129380905729547, "percentage": 53.76, "elapsed_time": "1 day, 23:00:34", "remaining_time": "1 day, 16:25:41", "throughput": 27659.06, "total_tokens": 4680875648} +{"current_steps": 15960, "total_steps": 29667, "loss": 0.3597, "lr": 3.103316175559406e-05, "epoch": 1.6139493726890624, "percentage": 53.8, "elapsed_time": "1 day, 23:02:13", "remaining_time": "1 day, 16:23:49", "throughput": 27660.25, "total_tokens": 4683795328} +{"current_steps": 15970, "total_steps": 29667, "loss": 0.3577, "lr": 3.102718614046624e-05, "epoch": 1.61496065480517, "percentage": 53.83, "elapsed_time": "1 day, 23:03:52", "remaining_time": "1 day, 16:21:56", "throughput": 27661.36, "total_tokens": 4686723520} +{"current_steps": 15980, "total_steps": 29667, "loss": 0.3489, "lr": 3.1021213975927546e-05, "epoch": 1.615971936921278, "percentage": 53.86, "elapsed_time": "1 day, 23:05:31", "remaining_time": "1 day, 16:20:05", "throughput": 27662.47, 
"total_tokens": 4689673792} +{"current_steps": 15990, "total_steps": 29667, "loss": 0.3541, "lr": 3.1015245258658374e-05, "epoch": 1.6169832190373858, "percentage": 53.9, "elapsed_time": "1 day, 23:07:10", "remaining_time": "1 day, 16:18:13", "throughput": 27663.71, "total_tokens": 4692614272} +{"current_steps": 16000, "total_steps": 29667, "loss": 0.3574, "lr": 3.1009279985343606e-05, "epoch": 1.6179945011534937, "percentage": 53.93, "elapsed_time": "1 day, 23:08:48", "remaining_time": "1 day, 16:16:20", "throughput": 27664.84, "total_tokens": 4695520448} +{"current_steps": 16010, "total_steps": 29667, "loss": 0.3535, "lr": 3.100331815267255e-05, "epoch": 1.6190057832696017, "percentage": 53.97, "elapsed_time": "1 day, 23:10:28", "remaining_time": "1 day, 16:14:28", "throughput": 27666.09, "total_tokens": 4698485440} +{"current_steps": 16020, "total_steps": 29667, "loss": 0.3498, "lr": 3.099735975733902e-05, "epoch": 1.6200170653857093, "percentage": 54.0, "elapsed_time": "1 day, 23:12:06", "remaining_time": "1 day, 16:12:35", "throughput": 27667.45, "total_tokens": 4701426368} +{"current_steps": 16030, "total_steps": 29667, "loss": 0.3563, "lr": 3.099140479604123e-05, "epoch": 1.621028347501817, "percentage": 54.03, "elapsed_time": "1 day, 23:13:44", "remaining_time": "1 day, 16:10:43", "throughput": 27668.63, "total_tokens": 4704353536} +{"current_steps": 16040, "total_steps": 29667, "loss": 0.3561, "lr": 3.098545326548186e-05, "epoch": 1.622039629617925, "percentage": 54.07, "elapsed_time": "1 day, 23:15:22", "remaining_time": "1 day, 16:08:49", "throughput": 27669.96, "total_tokens": 4707277184} +{"current_steps": 16050, "total_steps": 29667, "loss": 0.3564, "lr": 3.0979505162368014e-05, "epoch": 1.6230509117340328, "percentage": 54.1, "elapsed_time": "1 day, 23:17:04", "remaining_time": "1 day, 16:07:00", "throughput": 27670.58, "total_tokens": 4710209472} +{"current_steps": 16060, "total_steps": 29667, "loss": 0.3556, "lr": 3.097356048341121e-05, "epoch": 
1.6240621938501407, "percentage": 54.13, "elapsed_time": "1 day, 23:18:39", "remaining_time": "1 day, 16:05:05", "throughput": 27672.04, "total_tokens": 4713097088} +{"current_steps": 16070, "total_steps": 29667, "loss": 0.3575, "lr": 3.0967619225327396e-05, "epoch": 1.6250734759662484, "percentage": 54.17, "elapsed_time": "1 day, 23:20:19", "remaining_time": "1 day, 16:03:13", "throughput": 27673.19, "total_tokens": 4716044096} +{"current_steps": 16080, "total_steps": 29667, "loss": 0.3564, "lr": 3.0961681384836924e-05, "epoch": 1.6260847580823563, "percentage": 54.2, "elapsed_time": "1 day, 23:21:59", "remaining_time": "1 day, 16:01:22", "throughput": 27674.12, "total_tokens": 4718982784} +{"current_steps": 16090, "total_steps": 29667, "loss": 0.3518, "lr": 3.095574695866453e-05, "epoch": 1.627096040198464, "percentage": 54.24, "elapsed_time": "1 day, 23:23:40", "remaining_time": "1 day, 15:59:32", "throughput": 27675.22, "total_tokens": 4721953600} +{"current_steps": 16100, "total_steps": 29667, "loss": 0.358, "lr": 3.0949815943539355e-05, "epoch": 1.628107322314572, "percentage": 54.27, "elapsed_time": "1 day, 23:25:20", "remaining_time": "1 day, 15:57:41", "throughput": 27676.41, "total_tokens": 4724924416} +{"current_steps": 16110, "total_steps": 29667, "loss": 0.3556, "lr": 3.094388833619495e-05, "epoch": 1.6291186044306798, "percentage": 54.3, "elapsed_time": "1 day, 23:27:03", "remaining_time": "1 day, 15:55:52", "throughput": 27677.11, "total_tokens": 4727908736} +{"current_steps": 16120, "total_steps": 29667, "loss": 0.3538, "lr": 3.0937964133369196e-05, "epoch": 1.6301298865467877, "percentage": 54.34, "elapsed_time": "1 day, 23:28:41", "remaining_time": "1 day, 15:53:59", "throughput": 27678.51, "total_tokens": 4730842944} +{"current_steps": 16130, "total_steps": 29667, "loss": 0.3575, "lr": 3.093204333180437e-05, "epoch": 1.6311411686628954, "percentage": 54.37, "elapsed_time": "1 day, 23:30:23", "remaining_time": "1 day, 15:52:10", "throughput": 
27679.09, "total_tokens": 4733782720} +{"current_steps": 16140, "total_steps": 29667, "loss": 0.3564, "lr": 3.0926125928247114e-05, "epoch": 1.6321524507790033, "percentage": 54.4, "elapsed_time": "1 day, 23:32:02", "remaining_time": "1 day, 15:50:18", "throughput": 27680.0, "total_tokens": 4736683904} +{"current_steps": 16150, "total_steps": 29667, "loss": 0.3557, "lr": 3.092021191944842e-05, "epoch": 1.633163732895111, "percentage": 54.44, "elapsed_time": "1 day, 23:33:37", "remaining_time": "1 day, 15:48:23", "throughput": 27681.62, "total_tokens": 4739581888} +{"current_steps": 16160, "total_steps": 29667, "loss": 0.3515, "lr": 3.091430130216363e-05, "epoch": 1.6341750150112189, "percentage": 54.47, "elapsed_time": "1 day, 23:35:18", "remaining_time": "1 day, 15:46:32", "throughput": 27682.57, "total_tokens": 4742535232} +{"current_steps": 16170, "total_steps": 29667, "loss": 0.3544, "lr": 3.090839407315242e-05, "epoch": 1.6351862971273268, "percentage": 54.51, "elapsed_time": "1 day, 23:37:00", "remaining_time": "1 day, 15:44:43", "throughput": 27683.47, "total_tokens": 4745522112} +{"current_steps": 16180, "total_steps": 29667, "loss": 0.3591, "lr": 3.0902490229178794e-05, "epoch": 1.6361975792434347, "percentage": 54.54, "elapsed_time": "1 day, 23:38:41", "remaining_time": "1 day, 15:42:53", "throughput": 27684.39, "total_tokens": 4748475264} +{"current_steps": 16190, "total_steps": 29667, "loss": 0.3528, "lr": 3.0896589767011104e-05, "epoch": 1.6372088613595424, "percentage": 54.57, "elapsed_time": "1 day, 23:40:22", "remaining_time": "1 day, 15:41:03", "throughput": 27685.42, "total_tokens": 4751443392} +{"current_steps": 16200, "total_steps": 29667, "loss": 0.3504, "lr": 3.0890692683421985e-05, "epoch": 1.6382201434756503, "percentage": 54.61, "elapsed_time": "1 day, 23:41:59", "remaining_time": "1 day, 15:39:09", "throughput": 27686.75, "total_tokens": 4754357760} +{"current_steps": 16210, "total_steps": 29667, "loss": 0.3541, "lr": 
3.088479897518843e-05, "epoch": 1.639231425591758, "percentage": 54.64, "elapsed_time": "1 day, 23:43:38", "remaining_time": "1 day, 15:37:18", "throughput": 27687.91, "total_tokens": 4757307456} +{"current_steps": 16220, "total_steps": 29667, "loss": 0.3529, "lr": 3.087890863909168e-05, "epoch": 1.6402427077078658, "percentage": 54.67, "elapsed_time": "1 day, 23:45:17", "remaining_time": "1 day, 15:35:26", "throughput": 27689.19, "total_tokens": 4760251456} +{"current_steps": 16230, "total_steps": 29667, "loss": 0.3571, "lr": 3.087302167191732e-05, "epoch": 1.6412539898239737, "percentage": 54.71, "elapsed_time": "1 day, 23:47:00", "remaining_time": "1 day, 15:33:37", "throughput": 27689.96, "total_tokens": 4763237248} +{"current_steps": 16240, "total_steps": 29667, "loss": 0.3566, "lr": 3.086713807045518e-05, "epoch": 1.6422652719400817, "percentage": 54.74, "elapsed_time": "1 day, 23:48:40", "remaining_time": "1 day, 15:31:46", "throughput": 27690.93, "total_tokens": 4766172672} +{"current_steps": 16250, "total_steps": 29667, "loss": 0.3565, "lr": 3.086125783149941e-05, "epoch": 1.6432765540561893, "percentage": 54.77, "elapsed_time": "1 day, 23:50:21", "remaining_time": "1 day, 15:29:56", "throughput": 27691.87, "total_tokens": 4769135424} +{"current_steps": 16260, "total_steps": 29667, "loss": 0.3555, "lr": 3.0855380951848404e-05, "epoch": 1.6442878361722972, "percentage": 54.81, "elapsed_time": "1 day, 23:52:00", "remaining_time": "1 day, 15:28:05", "throughput": 27692.84, "total_tokens": 4772052928} +{"current_steps": 16270, "total_steps": 29667, "loss": 0.3599, "lr": 3.084950742830484e-05, "epoch": 1.645299118288405, "percentage": 54.84, "elapsed_time": "1 day, 23:53:39", "remaining_time": "1 day, 15:26:13", "throughput": 27693.82, "total_tokens": 4774968704} +{"current_steps": 16280, "total_steps": 29667, "loss": 0.3597, "lr": 3.0843637257675654e-05, "epoch": 1.6463104004045128, "percentage": 54.88, "elapsed_time": "1 day, 23:55:19", "remaining_time": "1 
day, 15:24:22", "throughput": 27694.82, "total_tokens": 4777908032} +{"current_steps": 16290, "total_steps": 29667, "loss": 0.3555, "lr": 3.083777043677202e-05, "epoch": 1.6473216825206207, "percentage": 54.91, "elapsed_time": "1 day, 23:57:02", "remaining_time": "1 day, 15:22:33", "throughput": 27695.36, "total_tokens": 4780829888} +{"current_steps": 16300, "total_steps": 29667, "loss": 0.3548, "lr": 3.083190696240936e-05, "epoch": 1.6483329646367286, "percentage": 54.94, "elapsed_time": "1 day, 23:58:40", "remaining_time": "1 day, 15:20:41", "throughput": 27696.48, "total_tokens": 4783747712} +{"current_steps": 16310, "total_steps": 29667, "loss": 0.3529, "lr": 3.082604683140735e-05, "epoch": 1.6493442467528363, "percentage": 54.98, "elapsed_time": "2 days, 0:00:16", "remaining_time": "1 day, 15:18:47", "throughput": 27698.05, "total_tokens": 4786685952} +{"current_steps": 16320, "total_steps": 29667, "loss": 0.3575, "lr": 3.082019004058987e-05, "epoch": 1.6503555288689442, "percentage": 55.01, "elapsed_time": "2 days, 0:01:53", "remaining_time": "1 day, 15:16:54", "throughput": 27699.24, "total_tokens": 4789580864} +{"current_steps": 16330, "total_steps": 29667, "loss": 0.3555, "lr": 3.081433658678505e-05, "epoch": 1.651366810985052, "percentage": 55.04, "elapsed_time": "2 days, 0:03:34", "remaining_time": "1 day, 15:15:03", "throughput": 27700.1, "total_tokens": 4792516800} +{"current_steps": 16340, "total_steps": 29667, "loss": 0.36, "lr": 3.080848646682521e-05, "epoch": 1.6523780931011598, "percentage": 55.08, "elapsed_time": "2 days, 0:05:13", "remaining_time": "1 day, 15:13:12", "throughput": 27701.12, "total_tokens": 4795431936} +{"current_steps": 16350, "total_steps": 29667, "loss": 0.3583, "lr": 3.080263967754689e-05, "epoch": 1.6533893752172677, "percentage": 55.11, "elapsed_time": "2 days, 0:06:51", "remaining_time": "1 day, 15:11:19", "throughput": 27702.38, "total_tokens": 4798357248} +{"current_steps": 16360, "total_steps": 29667, "loss": 0.3563, 
"lr": 3.079679621579083e-05, "epoch": 1.6544006573333756, "percentage": 55.15, "elapsed_time": "2 days, 0:08:31", "remaining_time": "1 day, 15:09:29", "throughput": 27703.38, "total_tokens": 4801315712} +{"current_steps": 16370, "total_steps": 29667, "loss": 0.3534, "lr": 3.079095607840197e-05, "epoch": 1.6554119394494833, "percentage": 55.18, "elapsed_time": "2 days, 0:10:13", "remaining_time": "1 day, 15:07:40", "throughput": 27703.63, "total_tokens": 4804196160} +{"current_steps": 16380, "total_steps": 29667, "loss": 0.3569, "lr": 3.0785119262229416e-05, "epoch": 1.656423221565591, "percentage": 55.21, "elapsed_time": "2 days, 0:12:02", "remaining_time": "1 day, 15:05:56", "throughput": 27703.23, "total_tokens": 4807135936} +{"current_steps": 16390, "total_steps": 29667, "loss": 0.3574, "lr": 3.0779285764126485e-05, "epoch": 1.6574345036816989, "percentage": 55.25, "elapsed_time": "2 days, 0:13:44", "remaining_time": "1 day, 15:04:07", "throughput": 27703.88, "total_tokens": 4810062144} +{"current_steps": 16400, "total_steps": 29667, "loss": 0.3545, "lr": 3.077345558095064e-05, "epoch": 1.6584457857978068, "percentage": 55.28, "elapsed_time": "2 days, 0:15:22", "remaining_time": "1 day, 15:02:15", "throughput": 27705.1, "total_tokens": 4813002880} +{"current_steps": 16410, "total_steps": 29667, "loss": 0.3596, "lr": 3.076762870956352e-05, "epoch": 1.6594570679139147, "percentage": 55.31, "elapsed_time": "2 days, 0:17:02", "remaining_time": "1 day, 15:00:24", "throughput": 27706.25, "total_tokens": 4815956544} +{"current_steps": 16420, "total_steps": 29667, "loss": 0.3576, "lr": 3.076180514683092e-05, "epoch": 1.6604683500300226, "percentage": 55.35, "elapsed_time": "2 days, 0:18:37", "remaining_time": "1 day, 14:58:29", "throughput": 27707.77, "total_tokens": 4818860416} +{"current_steps": 16430, "total_steps": 29667, "loss": 0.353, "lr": 3.075598488962278e-05, "epoch": 1.6614796321461303, "percentage": 55.38, "elapsed_time": "2 days, 0:20:15", "remaining_time": 
"1 day, 14:56:37", "throughput": 27708.9, "total_tokens": 4821775808} +{"current_steps": 16440, "total_steps": 29667, "loss": 0.3559, "lr": 3.0750167934813207e-05, "epoch": 1.662490914262238, "percentage": 55.42, "elapsed_time": "2 days, 0:21:55", "remaining_time": "1 day, 14:54:46", "throughput": 27710.03, "total_tokens": 4824739904} +{"current_steps": 16450, "total_steps": 29667, "loss": 0.3551, "lr": 3.074435427928041e-05, "epoch": 1.6635021963783458, "percentage": 55.45, "elapsed_time": "2 days, 0:23:32", "remaining_time": "1 day, 14:52:53", "throughput": 27711.35, "total_tokens": 4827664384} +{"current_steps": 16460, "total_steps": 29667, "loss": 0.3581, "lr": 3.073854391990675e-05, "epoch": 1.6645134784944537, "percentage": 55.48, "elapsed_time": "2 days, 0:25:13", "remaining_time": "1 day, 14:51:04", "throughput": 27712.34, "total_tokens": 4830642880} +{"current_steps": 16470, "total_steps": 29667, "loss": 0.3577, "lr": 3.073273685357871e-05, "epoch": 1.6655247606105616, "percentage": 55.52, "elapsed_time": "2 days, 0:26:50", "remaining_time": "1 day, 14:49:11", "throughput": 27713.73, "total_tokens": 4833577344} +{"current_steps": 16480, "total_steps": 29667, "loss": 0.3572, "lr": 3.072693307718689e-05, "epoch": 1.6665360427266696, "percentage": 55.55, "elapsed_time": "2 days, 0:28:32", "remaining_time": "1 day, 14:47:22", "throughput": 27714.5, "total_tokens": 4836538368} +{"current_steps": 16490, "total_steps": 29667, "loss": 0.3561, "lr": 3.0721132587626e-05, "epoch": 1.6675473248427772, "percentage": 55.58, "elapsed_time": "2 days, 0:30:12", "remaining_time": "1 day, 14:45:31", "throughput": 27715.69, "total_tokens": 4839502144} +{"current_steps": 16500, "total_steps": 29667, "loss": 0.3545, "lr": 3.071533538179482e-05, "epoch": 1.668558606958885, "percentage": 55.62, "elapsed_time": "2 days, 0:31:54", "remaining_time": "1 day, 14:43:41", "throughput": 27716.53, "total_tokens": 4842469056} +{"current_steps": 16510, "total_steps": 29667, "loss": 0.3582, 
"lr": 3.070954145659627e-05, "epoch": 1.6695698890749928, "percentage": 55.65, "elapsed_time": "2 days, 0:33:36", "remaining_time": "1 day, 14:41:52", "throughput": 27717.25, "total_tokens": 4845419712} +{"current_steps": 16520, "total_steps": 29667, "loss": 0.3578, "lr": 3.070375080893734e-05, "epoch": 1.6705811711911007, "percentage": 55.68, "elapsed_time": "2 days, 0:35:15", "remaining_time": "1 day, 14:40:01", "throughput": 27718.27, "total_tokens": 4848355264} +{"current_steps": 16530, "total_steps": 29667, "loss": 0.3592, "lr": 3.06979634357291e-05, "epoch": 1.6715924533072086, "percentage": 55.72, "elapsed_time": "2 days, 0:36:54", "remaining_time": "1 day, 14:38:10", "throughput": 27719.25, "total_tokens": 4851259968} +{"current_steps": 16540, "total_steps": 29667, "loss": 0.3568, "lr": 3.0692179333886686e-05, "epoch": 1.6726037354233165, "percentage": 55.75, "elapsed_time": "2 days, 0:38:33", "remaining_time": "1 day, 14:36:19", "throughput": 27720.29, "total_tokens": 4854202688} +{"current_steps": 16550, "total_steps": 29667, "loss": 0.3544, "lr": 3.068639850032933e-05, "epoch": 1.6736150175394242, "percentage": 55.79, "elapsed_time": "2 days, 0:40:15", "remaining_time": "1 day, 14:34:30", "throughput": 27721.01, "total_tokens": 4857149184} +{"current_steps": 16560, "total_steps": 29667, "loss": 0.359, "lr": 3.068062093198028e-05, "epoch": 1.674626299655532, "percentage": 55.82, "elapsed_time": "2 days, 0:41:55", "remaining_time": "1 day, 14:32:39", "throughput": 27722.01, "total_tokens": 4860085696} +{"current_steps": 16570, "total_steps": 29667, "loss": 0.3521, "lr": 3.067484662576687e-05, "epoch": 1.6756375817716398, "percentage": 55.85, "elapsed_time": "2 days, 0:43:33", "remaining_time": "1 day, 14:30:47", "throughput": 27723.22, "total_tokens": 4863027392} +{"current_steps": 16580, "total_steps": 29667, "loss": 0.3528, "lr": 3.066907557862048e-05, "epoch": 1.6766488638877477, "percentage": 55.89, "elapsed_time": "2 days, 0:45:15", "remaining_time": 
"1 day, 14:28:58", "throughput": 27724.11, "total_tokens": 4866001024} +{"current_steps": 16590, "total_steps": 29667, "loss": 0.3564, "lr": 3.066330778747651e-05, "epoch": 1.6776601460038556, "percentage": 55.92, "elapsed_time": "2 days, 0:46:54", "remaining_time": "1 day, 14:27:07", "throughput": 27725.2, "total_tokens": 4868943360} +{"current_steps": 16600, "total_steps": 29667, "loss": 0.3542, "lr": 3.065754324927441e-05, "epoch": 1.6786714281199635, "percentage": 55.95, "elapsed_time": "2 days, 0:48:31", "remaining_time": "1 day, 14:25:14", "throughput": 27726.34, "total_tokens": 4871847040} +{"current_steps": 16610, "total_steps": 29667, "loss": 0.3597, "lr": 3.065178196095765e-05, "epoch": 1.6796827102360712, "percentage": 55.99, "elapsed_time": "2 days, 0:50:11", "remaining_time": "1 day, 14:23:23", "throughput": 27727.37, "total_tokens": 4874780160} +{"current_steps": 16620, "total_steps": 29667, "loss": 0.3495, "lr": 3.064602391947372e-05, "epoch": 1.6806939923521789, "percentage": 56.02, "elapsed_time": "2 days, 0:51:50", "remaining_time": "1 day, 14:21:33", "throughput": 27728.6, "total_tokens": 4877755264} +{"current_steps": 16630, "total_steps": 29667, "loss": 0.3544, "lr": 3.0640269121774126e-05, "epoch": 1.6817052744682868, "percentage": 56.06, "elapsed_time": "2 days, 0:53:32", "remaining_time": "1 day, 14:19:44", "throughput": 27729.35, "total_tokens": 4880720960} +{"current_steps": 16640, "total_steps": 29667, "loss": 0.355, "lr": 3.063451756481437e-05, "epoch": 1.6827165565843947, "percentage": 56.09, "elapsed_time": "2 days, 0:55:07", "remaining_time": "1 day, 14:17:50", "throughput": 27730.7, "total_tokens": 4883595136} +{"current_steps": 16650, "total_steps": 29667, "loss": 0.3508, "lr": 3.062876924555396e-05, "epoch": 1.6837278387005026, "percentage": 56.12, "elapsed_time": "2 days, 0:56:43", "remaining_time": "1 day, 14:15:56", "throughput": 27732.3, "total_tokens": 4886526016} +{"current_steps": 16660, "total_steps": 29667, "loss": 0.3547, 
"lr": 3.06230241609564e-05, "epoch": 1.6847391208166103, "percentage": 56.16, "elapsed_time": "2 days, 0:58:20", "remaining_time": "1 day, 14:14:03", "throughput": 27733.61, "total_tokens": 4889439168} +{"current_steps": 16670, "total_steps": 29667, "loss": 0.3533, "lr": 3.061728230798916e-05, "epoch": 1.6857504029327182, "percentage": 56.19, "elapsed_time": "2 days, 0:59:59", "remaining_time": "1 day, 14:12:12", "throughput": 27734.59, "total_tokens": 4892364160} +{"current_steps": 16680, "total_steps": 29667, "loss": 0.3518, "lr": 3.061154368362373e-05, "epoch": 1.6867616850488258, "percentage": 56.22, "elapsed_time": "2 days, 1:01:38", "remaining_time": "1 day, 14:10:20", "throughput": 27735.66, "total_tokens": 4895293248} +{"current_steps": 16690, "total_steps": 29667, "loss": 0.3576, "lr": 3.060580828483552e-05, "epoch": 1.6877729671649337, "percentage": 56.26, "elapsed_time": "2 days, 1:03:15", "remaining_time": "1 day, 14:08:28", "throughput": 27737.05, "total_tokens": 4898229056} +{"current_steps": 16700, "total_steps": 29667, "loss": 0.3537, "lr": 3.060007610860395e-05, "epoch": 1.6887842492810416, "percentage": 56.29, "elapsed_time": "2 days, 1:04:53", "remaining_time": "1 day, 14:06:36", "throughput": 27738.15, "total_tokens": 4901162048} +{"current_steps": 16710, "total_steps": 29667, "loss": 0.3543, "lr": 3.059434715191236e-05, "epoch": 1.6897955313971496, "percentage": 56.33, "elapsed_time": "2 days, 1:06:33", "remaining_time": "1 day, 14:04:46", "throughput": 27739.21, "total_tokens": 4904119040} +{"current_steps": 16720, "total_steps": 29667, "loss": 0.3538, "lr": 3.0588621411748074e-05, "epoch": 1.6908068135132572, "percentage": 56.36, "elapsed_time": "2 days, 1:08:11", "remaining_time": "1 day, 14:02:54", "throughput": 27740.48, "total_tokens": 4907045888} +{"current_steps": 16730, "total_steps": 29667, "loss": 0.3548, "lr": 3.0582898885102344e-05, "epoch": 1.6918180956293651, "percentage": 56.39, "elapsed_time": "2 days, 1:09:54", 
"remaining_time": "1 day, 14:01:06", "throughput": 27741.24, "total_tokens": 4910045376} +{"current_steps": 16740, "total_steps": 29667, "loss": 0.3531, "lr": 3.0577179568970366e-05, "epoch": 1.6928293777454728, "percentage": 56.43, "elapsed_time": "2 days, 1:11:32", "remaining_time": "1 day, 13:59:14", "throughput": 27742.36, "total_tokens": 4912963712} +{"current_steps": 16750, "total_steps": 29667, "loss": 0.3522, "lr": 3.057146346035127e-05, "epoch": 1.6938406598615807, "percentage": 56.46, "elapsed_time": "2 days, 1:13:10", "remaining_time": "1 day, 13:57:22", "throughput": 27743.46, "total_tokens": 4915869440} +{"current_steps": 16760, "total_steps": 29667, "loss": 0.3556, "lr": 3.056575055624811e-05, "epoch": 1.6948519419776886, "percentage": 56.49, "elapsed_time": "2 days, 1:14:46", "remaining_time": "1 day, 13:55:29", "throughput": 27744.92, "total_tokens": 4918785472} +{"current_steps": 16770, "total_steps": 29667, "loss": 0.3596, "lr": 3.0560040853667846e-05, "epoch": 1.6958632240937965, "percentage": 56.53, "elapsed_time": "2 days, 1:16:26", "remaining_time": "1 day, 13:53:39", "throughput": 27745.89, "total_tokens": 4921743744} +{"current_steps": 16780, "total_steps": 29667, "loss": 0.3529, "lr": 3.0554334349621366e-05, "epoch": 1.6968745062099042, "percentage": 56.56, "elapsed_time": "2 days, 1:18:04", "remaining_time": "1 day, 13:51:47", "throughput": 27747.13, "total_tokens": 4924693568} +{"current_steps": 16790, "total_steps": 29667, "loss": 0.356, "lr": 3.054863104112347e-05, "epoch": 1.6978857883260121, "percentage": 56.59, "elapsed_time": "2 days, 1:19:44", "remaining_time": "1 day, 13:49:57", "throughput": 27748.0, "total_tokens": 4927627648} +{"current_steps": 16800, "total_steps": 29667, "loss": 0.3563, "lr": 3.0542930925192835e-05, "epoch": 1.6988970704421198, "percentage": 56.63, "elapsed_time": "2 days, 1:21:29", "remaining_time": "1 day, 13:48:11", "throughput": 27748.36, "total_tokens": 4930597184} +{"current_steps": 16810, 
"total_steps": 29667, "loss": 0.3514, "lr": 3.053723399885205e-05, "epoch": 1.6999083525582277, "percentage": 56.66, "elapsed_time": "2 days, 1:23:10", "remaining_time": "1 day, 13:46:21", "throughput": 27749.25, "total_tokens": 4933542912} +{"current_steps": 16820, "total_steps": 29667, "loss": 0.3534, "lr": 3.0531540259127565e-05, "epoch": 1.7009196346743356, "percentage": 56.7, "elapsed_time": "2 days, 1:24:49", "remaining_time": "1 day, 13:44:30", "throughput": 27750.27, "total_tokens": 4936469952} +{"current_steps": 16830, "total_steps": 29667, "loss": 0.3566, "lr": 3.052584970304976e-05, "epoch": 1.7019309167904435, "percentage": 56.73, "elapsed_time": "2 days, 1:26:23", "remaining_time": "1 day, 13:42:35", "throughput": 27751.73, "total_tokens": 4939337984} +{"current_steps": 16840, "total_steps": 29667, "loss": 0.3539, "lr": 3.052016232765282e-05, "epoch": 1.7029421989065512, "percentage": 56.76, "elapsed_time": "2 days, 1:28:02", "remaining_time": "1 day, 13:40:45", "throughput": 27752.85, "total_tokens": 4942307712} +{"current_steps": 16850, "total_steps": 29667, "loss": 0.3545, "lr": 3.0514478129974845e-05, "epoch": 1.703953481022659, "percentage": 56.8, "elapsed_time": "2 days, 1:29:40", "remaining_time": "1 day, 13:38:53", "throughput": 27754.16, "total_tokens": 4945243520} +{"current_steps": 16860, "total_steps": 29667, "loss": 0.3477, "lr": 3.0508797107057785e-05, "epoch": 1.7049647631387668, "percentage": 56.83, "elapsed_time": "2 days, 1:31:20", "remaining_time": "1 day, 13:37:03", "throughput": 27755.2, "total_tokens": 4948222208} +{"current_steps": 16870, "total_steps": 29667, "loss": 0.3487, "lr": 3.0503119255947432e-05, "epoch": 1.7059760452548747, "percentage": 56.86, "elapsed_time": "2 days, 1:32:59", "remaining_time": "1 day, 13:35:12", "throughput": 27756.38, "total_tokens": 4951178432} +{"current_steps": 16880, "total_steps": 29667, "loss": 0.3563, "lr": 3.049744457369344e-05, "epoch": 1.7069873273709826, "percentage": 56.9, 
"elapsed_time": "2 days, 1:34:39", "remaining_time": "1 day, 13:33:22", "throughput": 27757.22, "total_tokens": 4954105664} +{"current_steps": 16890, "total_steps": 29667, "loss": 0.3479, "lr": 3.049177305734929e-05, "epoch": 1.7079986094870905, "percentage": 56.93, "elapsed_time": "2 days, 1:36:20", "remaining_time": "1 day, 13:31:33", "throughput": 27758.42, "total_tokens": 4957108288} +{"current_steps": 16900, "total_steps": 29667, "loss": 0.3522, "lr": 3.04861047039723e-05, "epoch": 1.7090098916031982, "percentage": 56.97, "elapsed_time": "2 days, 1:37:58", "remaining_time": "1 day, 13:29:41", "throughput": 27759.53, "total_tokens": 4960041344} +{"current_steps": 16910, "total_steps": 29667, "loss": 0.3542, "lr": 3.0480439510623638e-05, "epoch": 1.7100211737193058, "percentage": 57.0, "elapsed_time": "2 days, 1:39:34", "remaining_time": "1 day, 13:27:48", "throughput": 27760.84, "total_tokens": 4962924672} +{"current_steps": 16920, "total_steps": 29667, "loss": 0.3533, "lr": 3.0474777474368255e-05, "epoch": 1.7110324558354137, "percentage": 57.03, "elapsed_time": "2 days, 1:41:15", "remaining_time": "1 day, 13:25:59", "throughput": 27761.67, "total_tokens": 4965893632} +{"current_steps": 16930, "total_steps": 29667, "loss": 0.3565, "lr": 3.046911859227495e-05, "epoch": 1.7120437379515216, "percentage": 57.07, "elapsed_time": "2 days, 1:42:57", "remaining_time": "1 day, 13:24:10", "throughput": 27762.58, "total_tokens": 4968864768} +{"current_steps": 16940, "total_steps": 29667, "loss": 0.3571, "lr": 3.0463462861416302e-05, "epoch": 1.7130550200676296, "percentage": 57.1, "elapsed_time": "2 days, 1:44:37", "remaining_time": "1 day, 13:22:20", "throughput": 27763.43, "total_tokens": 4971807360} +{"current_steps": 16950, "total_steps": 29667, "loss": 0.3568, "lr": 3.045781027886873e-05, "epoch": 1.7140663021837375, "percentage": 57.13, "elapsed_time": "2 days, 1:46:12", "remaining_time": "1 day, 13:20:26", "throughput": 27764.92, "total_tokens": 4974707456} 
+{"current_steps": 16960, "total_steps": 29667, "loss": 0.3532, "lr": 3.0452160841712408e-05, "epoch": 1.7150775842998451, "percentage": 57.17, "elapsed_time": "2 days, 1:47:50", "remaining_time": "1 day, 13:18:35", "throughput": 27765.83, "total_tokens": 4977589120} +{"current_steps": 16970, "total_steps": 29667, "loss": 0.3524, "lr": 3.044651454703133e-05, "epoch": 1.7160888664159528, "percentage": 57.2, "elapsed_time": "2 days, 1:49:28", "remaining_time": "1 day, 13:16:43", "throughput": 27767.23, "total_tokens": 4980565056} +{"current_steps": 16980, "total_steps": 29667, "loss": 0.3546, "lr": 3.0440871391913257e-05, "epoch": 1.7171001485320607, "percentage": 57.24, "elapsed_time": "2 days, 1:51:07", "remaining_time": "1 day, 13:14:53", "throughput": 27768.19, "total_tokens": 4983500160} +{"current_steps": 16990, "total_steps": 29667, "loss": 0.3524, "lr": 3.043523137344973e-05, "epoch": 1.7181114306481686, "percentage": 57.27, "elapsed_time": "2 days, 1:52:47", "remaining_time": "1 day, 13:13:03", "throughput": 27769.02, "total_tokens": 4986412608} +{"current_steps": 17000, "total_steps": 29667, "loss": 0.353, "lr": 3.0429594488736074e-05, "epoch": 1.7191227127642765, "percentage": 57.3, "elapsed_time": "2 days, 1:54:30", "remaining_time": "1 day, 13:11:15", "throughput": 27769.62, "total_tokens": 4989382656} +{"current_steps": 17010, "total_steps": 29667, "loss": 0.3548, "lr": 3.0423960734871348e-05, "epoch": 1.7201339948803844, "percentage": 57.34, "elapsed_time": "2 days, 1:56:07", "remaining_time": "1 day, 13:09:23", "throughput": 27770.82, "total_tokens": 4992282688} +{"current_steps": 17020, "total_steps": 29667, "loss": 0.3516, "lr": 3.0418330108958404e-05, "epoch": 1.7211452769964921, "percentage": 57.37, "elapsed_time": "2 days, 1:57:41", "remaining_time": "1 day, 13:07:29", "throughput": 27772.32, "total_tokens": 4995170304} +{"current_steps": 17030, "total_steps": 29667, "loss": 0.3549, "lr": 3.0412702608103828e-05, "epoch": 1.7221565591125998, 
"percentage": 57.4, "elapsed_time": "2 days, 1:59:20", "remaining_time": "1 day, 13:05:38", "throughput": 27773.25, "total_tokens": 4998092736} +{"current_steps": 17040, "total_steps": 29667, "loss": 0.3591, "lr": 3.0407078229417944e-05, "epoch": 1.7231678412287077, "percentage": 57.44, "elapsed_time": "2 days, 2:01:00", "remaining_time": "1 day, 13:03:48", "throughput": 27774.3, "total_tokens": 5001042752} +{"current_steps": 17050, "total_steps": 29667, "loss": 0.3555, "lr": 3.0401456970014836e-05, "epoch": 1.7241791233448156, "percentage": 57.47, "elapsed_time": "2 days, 2:02:40", "remaining_time": "1 day, 13:01:58", "throughput": 27775.27, "total_tokens": 5004006976} +{"current_steps": 17060, "total_steps": 29667, "loss": 0.3541, "lr": 3.039583882701231e-05, "epoch": 1.7251904054609235, "percentage": 57.5, "elapsed_time": "2 days, 2:04:23", "remaining_time": "1 day, 13:00:10", "throughput": 27775.97, "total_tokens": 5006981312} +{"current_steps": 17070, "total_steps": 29667, "loss": 0.3488, "lr": 3.0390223797531887e-05, "epoch": 1.7262016875770314, "percentage": 57.54, "elapsed_time": "2 days, 2:05:58", "remaining_time": "1 day, 12:58:17", "throughput": 27777.31, "total_tokens": 5009876864} +{"current_steps": 17080, "total_steps": 29667, "loss": 0.3525, "lr": 3.0384611878698837e-05, "epoch": 1.727212969693139, "percentage": 57.57, "elapsed_time": "2 days, 2:07:32", "remaining_time": "1 day, 12:56:23", "throughput": 27778.87, "total_tokens": 5012766784} +{"current_steps": 17090, "total_steps": 29667, "loss": 0.3526, "lr": 3.0379003067642113e-05, "epoch": 1.7282242518092468, "percentage": 57.61, "elapsed_time": "2 days, 2:09:09", "remaining_time": "1 day, 12:54:31", "throughput": 27780.06, "total_tokens": 5015676288} +{"current_steps": 17100, "total_steps": 29667, "loss": 0.3592, "lr": 3.037339736149441e-05, "epoch": 1.7292355339253547, "percentage": 57.64, "elapsed_time": "2 days, 2:10:46", "remaining_time": "1 day, 12:52:39", "throughput": 27781.36, 
"total_tokens": 5018616704} +{"current_steps": 17110, "total_steps": 29667, "loss": 0.3574, "lr": 3.0367794757392092e-05, "epoch": 1.7302468160414626, "percentage": 57.67, "elapsed_time": "2 days, 2:12:23", "remaining_time": "1 day, 12:50:47", "throughput": 27782.71, "total_tokens": 5021537536} +{"current_steps": 17120, "total_steps": 29667, "loss": 0.351, "lr": 3.0362195252475245e-05, "epoch": 1.7312580981575705, "percentage": 57.71, "elapsed_time": "2 days, 2:14:04", "remaining_time": "1 day, 12:48:58", "throughput": 27783.75, "total_tokens": 5024545024} +{"current_steps": 17130, "total_steps": 29667, "loss": 0.3561, "lr": 3.0356598843887634e-05, "epoch": 1.7322693802736784, "percentage": 57.74, "elapsed_time": "2 days, 2:15:41", "remaining_time": "1 day, 12:47:06", "throughput": 27784.84, "total_tokens": 5027438592} +{"current_steps": 17140, "total_steps": 29667, "loss": 0.3481, "lr": 3.03510055287767e-05, "epoch": 1.733280662389786, "percentage": 57.77, "elapsed_time": "2 days, 2:17:18", "remaining_time": "1 day, 12:45:14", "throughput": 27786.07, "total_tokens": 5030361344} +{"current_steps": 17150, "total_steps": 29667, "loss": 0.3547, "lr": 3.0345415304293578e-05, "epoch": 1.7342919445058937, "percentage": 57.81, "elapsed_time": "2 days, 2:18:55", "remaining_time": "1 day, 12:43:22", "throughput": 27787.39, "total_tokens": 5033278848} +{"current_steps": 17160, "total_steps": 29667, "loss": 0.3552, "lr": 3.0339828167593065e-05, "epoch": 1.7353032266220016, "percentage": 57.84, "elapsed_time": "2 days, 2:20:34", "remaining_time": "1 day, 12:41:32", "throughput": 27788.38, "total_tokens": 5036220480} +{"current_steps": 17170, "total_steps": 29667, "loss": 0.3555, "lr": 3.033424411583363e-05, "epoch": 1.7363145087381096, "percentage": 57.88, "elapsed_time": "2 days, 2:22:15", "remaining_time": "1 day, 12:39:43", "throughput": 27789.2, "total_tokens": 5039175552} +{"current_steps": 17180, "total_steps": 29667, "loss": 0.352, "lr": 3.0328663146177387e-05, "epoch": 
1.7373257908542175, "percentage": 57.91, "elapsed_time": "2 days, 2:23:54", "remaining_time": "1 day, 12:37:52", "throughput": 27790.2, "total_tokens": 5042102592} +{"current_steps": 17190, "total_steps": 29667, "loss": 0.3524, "lr": 3.032308525579013e-05, "epoch": 1.7383370729703251, "percentage": 57.94, "elapsed_time": "2 days, 2:25:37", "remaining_time": "1 day, 12:36:04", "throughput": 27790.89, "total_tokens": 5045081728} +{"current_steps": 17200, "total_steps": 29667, "loss": 0.355, "lr": 3.031751044184127e-05, "epoch": 1.739348355086433, "percentage": 57.98, "elapsed_time": "2 days, 2:27:17", "remaining_time": "1 day, 12:34:15", "throughput": 27791.66, "total_tokens": 5047999104} +{"current_steps": 17210, "total_steps": 29667, "loss": 0.3574, "lr": 3.0311938701503872e-05, "epoch": 1.7403596372025407, "percentage": 58.01, "elapsed_time": "2 days, 2:28:57", "remaining_time": "1 day, 12:32:25", "throughput": 27792.39, "total_tokens": 5050916928} +{"current_steps": 17220, "total_steps": 29667, "loss": 0.3555, "lr": 3.0306370031954646e-05, "epoch": 1.7413709193186486, "percentage": 58.04, "elapsed_time": "2 days, 2:30:38", "remaining_time": "1 day, 12:30:36", "throughput": 27793.32, "total_tokens": 5053889408} +{"current_steps": 17230, "total_steps": 29667, "loss": 0.3554, "lr": 3.030080443037393e-05, "epoch": 1.7423822014347565, "percentage": 58.08, "elapsed_time": "2 days, 2:32:19", "remaining_time": "1 day, 12:28:47", "throughput": 27793.96, "total_tokens": 5056818368} +{"current_steps": 17240, "total_steps": 29667, "loss": 0.3575, "lr": 3.0295241893945663e-05, "epoch": 1.7433934835508644, "percentage": 58.11, "elapsed_time": "2 days, 2:33:54", "remaining_time": "1 day, 12:26:54", "throughput": 27795.42, "total_tokens": 5059732800} +{"current_steps": 17250, "total_steps": 29667, "loss": 0.3552, "lr": 3.028968241985743e-05, "epoch": 1.7444047656669721, "percentage": 58.15, "elapsed_time": "2 days, 2:35:33", "remaining_time": "1 day, 12:25:04", "throughput": 
27796.63, "total_tokens": 5062710720} +{"current_steps": 17260, "total_steps": 29667, "loss": 0.3504, "lr": 3.0284126005300405e-05, "epoch": 1.74541604778308, "percentage": 58.18, "elapsed_time": "2 days, 2:37:12", "remaining_time": "1 day, 12:23:14", "throughput": 27797.58, "total_tokens": 5065623424} +{"current_steps": 17270, "total_steps": 29667, "loss": 0.3568, "lr": 3.0278572647469385e-05, "epoch": 1.7464273298991877, "percentage": 58.21, "elapsed_time": "2 days, 2:38:54", "remaining_time": "1 day, 12:21:25", "throughput": 27798.15, "total_tokens": 5068556224} +{"current_steps": 17280, "total_steps": 29667, "loss": 0.3515, "lr": 3.027302234356275e-05, "epoch": 1.7474386120152956, "percentage": 58.25, "elapsed_time": "2 days, 2:40:31", "remaining_time": "1 day, 12:19:33", "throughput": 27799.38, "total_tokens": 5071472384} +{"current_steps": 17290, "total_steps": 29667, "loss": 0.3515, "lr": 3.0267475090782494e-05, "epoch": 1.7484498941314035, "percentage": 58.28, "elapsed_time": "2 days, 2:42:09", "remaining_time": "1 day, 12:17:43", "throughput": 27800.72, "total_tokens": 5074444032} +{"current_steps": 17300, "total_steps": 29667, "loss": 0.3534, "lr": 3.026193088633418e-05, "epoch": 1.7494611762475114, "percentage": 58.31, "elapsed_time": "2 days, 2:43:50", "remaining_time": "1 day, 12:15:54", "throughput": 27801.54, "total_tokens": 5077410432} +{"current_steps": 17310, "total_steps": 29667, "loss": 0.3551, "lr": 3.0256389727426952e-05, "epoch": 1.750472458363619, "percentage": 58.35, "elapsed_time": "2 days, 2:45:30", "remaining_time": "1 day, 12:14:04", "throughput": 27802.3, "total_tokens": 5080326464} +{"current_steps": 17320, "total_steps": 29667, "loss": 0.36, "lr": 3.0250851611273555e-05, "epoch": 1.751483740479727, "percentage": 58.38, "elapsed_time": "2 days, 2:47:08", "remaining_time": "1 day, 12:12:13", "throughput": 27803.37, "total_tokens": 5083243264} +{"current_steps": 17330, "total_steps": 29667, "loss": 0.3549, "lr": 3.0245316535090273e-05, 
"epoch": 1.7524950225958347, "percentage": 58.42, "elapsed_time": "2 days, 2:48:46", "remaining_time": "1 day, 12:10:22", "throughput": 27804.49, "total_tokens": 5086175872} +{"current_steps": 17340, "total_steps": 29667, "loss": 0.357, "lr": 3.023978449609697e-05, "epoch": 1.7535063047119426, "percentage": 58.45, "elapsed_time": "2 days, 2:50:24", "remaining_time": "1 day, 12:08:32", "throughput": 27805.49, "total_tokens": 5089099008} +{"current_steps": 17350, "total_steps": 29667, "loss": 0.3575, "lr": 3.023425549151707e-05, "epoch": 1.7545175868280505, "percentage": 58.48, "elapsed_time": "2 days, 2:52:08", "remaining_time": "1 day, 12:06:45", "throughput": 27805.93, "total_tokens": 5092055424} +{"current_steps": 17360, "total_steps": 29667, "loss": 0.3524, "lr": 3.022872951857754e-05, "epoch": 1.7555288689441584, "percentage": 58.52, "elapsed_time": "2 days, 2:53:47", "remaining_time": "1 day, 12:04:55", "throughput": 27806.82, "total_tokens": 5094975104} +{"current_steps": 17370, "total_steps": 29667, "loss": 0.3522, "lr": 3.0223206574508904e-05, "epoch": 1.756540151060266, "percentage": 58.55, "elapsed_time": "2 days, 2:55:28", "remaining_time": "1 day, 12:03:06", "throughput": 27807.62, "total_tokens": 5097935040} +{"current_steps": 17380, "total_steps": 29667, "loss": 0.3525, "lr": 3.0217686656545224e-05, "epoch": 1.757551433176374, "percentage": 58.58, "elapsed_time": "2 days, 2:57:05", "remaining_time": "1 day, 12:01:14", "throughput": 27808.97, "total_tokens": 5100867328} +{"current_steps": 17390, "total_steps": 29667, "loss": 0.3512, "lr": 3.0212169761924077e-05, "epoch": 1.7585627152924816, "percentage": 58.62, "elapsed_time": "2 days, 2:58:49", "remaining_time": "1 day, 11:59:28", "throughput": 27809.1, "total_tokens": 5103790144} +{"current_steps": 17400, "total_steps": 29667, "loss": 0.3549, "lr": 3.0206655887886604e-05, "epoch": 1.7595739974085896, "percentage": 58.65, "elapsed_time": "2 days, 3:00:44", "remaining_time": "1 day, 11:57:49", 
"throughput": 27808.0, "total_tokens": 5106788672} +{"current_steps": 17410, "total_steps": 29667, "loss": 0.3543, "lr": 3.0201145031677448e-05, "epoch": 1.7605852795246975, "percentage": 58.68, "elapsed_time": "2 days, 3:02:38", "remaining_time": "1 day, 11:56:09", "throughput": 27806.71, "total_tokens": 5109727936} +{"current_steps": 17420, "total_steps": 29667, "loss": 0.3599, "lr": 3.019563719054477e-05, "epoch": 1.7615965616408054, "percentage": 58.72, "elapsed_time": "2 days, 3:04:24", "remaining_time": "1 day, 11:54:24", "throughput": 27806.55, "total_tokens": 5112646336} +{"current_steps": 17430, "total_steps": 29667, "loss": 0.3484, "lr": 3.019013236174025e-05, "epoch": 1.762607843756913, "percentage": 58.75, "elapsed_time": "2 days, 3:06:15", "remaining_time": "1 day, 11:52:43", "throughput": 27805.71, "total_tokens": 5115579968} +{"current_steps": 17440, "total_steps": 29667, "loss": 0.3564, "lr": 3.018463054251906e-05, "epoch": 1.763619125873021, "percentage": 58.79, "elapsed_time": "2 days, 3:08:06", "remaining_time": "1 day, 11:51:01", "throughput": 27805.15, "total_tokens": 5118551936} +{"current_steps": 17450, "total_steps": 29667, "loss": 0.3548, "lr": 3.017913173013989e-05, "epoch": 1.7646304079891286, "percentage": 58.82, "elapsed_time": "2 days, 3:09:53", "remaining_time": "1 day, 11:49:16", "throughput": 27804.63, "total_tokens": 5121429824} +{"current_steps": 17460, "total_steps": 29667, "loss": 0.3568, "lr": 3.017363592186491e-05, "epoch": 1.7656416901052365, "percentage": 58.85, "elapsed_time": "2 days, 3:11:46", "remaining_time": "1 day, 11:47:35", "throughput": 27803.54, "total_tokens": 5124360640} +{"current_steps": 17470, "total_steps": 29667, "loss": 0.3556, "lr": 3.0168143114959797e-05, "epoch": 1.7666529722213444, "percentage": 58.89, "elapsed_time": "2 days, 3:13:44", "remaining_time": "1 day, 11:45:59", "throughput": 27801.56, "total_tokens": 5127283136} +{"current_steps": 17480, "total_steps": 29667, "loss": 0.3545, "lr": 
3.016265330669369e-05, "epoch": 1.7676642543374523, "percentage": 58.92, "elapsed_time": "2 days, 3:15:28", "remaining_time": "1 day, 11:44:12", "throughput": 27801.5, "total_tokens": 5130175872} +{"current_steps": 17490, "total_steps": 29667, "loss": 0.3602, "lr": 3.0157166494339223e-05, "epoch": 1.76867553645356, "percentage": 58.95, "elapsed_time": "2 days, 3:17:17", "remaining_time": "1 day, 11:42:29", "throughput": 27800.98, "total_tokens": 5133095936} +{"current_steps": 17500, "total_steps": 29667, "loss": 0.352, "lr": 3.0151682675172482e-05, "epoch": 1.7696868185696677, "percentage": 58.99, "elapsed_time": "2 days, 3:19:09", "remaining_time": "1 day, 11:40:48", "throughput": 27800.1, "total_tokens": 5136068736} +{"current_steps": 17510, "total_steps": 29667, "loss": 0.3575, "lr": 3.0146201846473034e-05, "epoch": 1.7706981006857756, "percentage": 59.02, "elapsed_time": "2 days, 3:20:55", "remaining_time": "1 day, 11:39:03", "throughput": 27800.02, "total_tokens": 5138990656} +{"current_steps": 17520, "total_steps": 29667, "loss": 0.3572, "lr": 3.01407240055239e-05, "epoch": 1.7717093828018835, "percentage": 59.06, "elapsed_time": "2 days, 3:22:41", "remaining_time": "1 day, 11:37:18", "throughput": 27799.99, "total_tokens": 5141935424} +{"current_steps": 17530, "total_steps": 29667, "loss": 0.3572, "lr": 3.013524914961157e-05, "epoch": 1.7727206649179914, "percentage": 59.09, "elapsed_time": "2 days, 3:24:33", "remaining_time": "1 day, 11:35:36", "throughput": 27799.22, "total_tokens": 5144904704} +{"current_steps": 17540, "total_steps": 29667, "loss": 0.3493, "lr": 3.012977727602596e-05, "epoch": 1.7737319470340993, "percentage": 59.12, "elapsed_time": "2 days, 3:26:22", "remaining_time": "1 day, 11:33:53", "throughput": 27798.88, "total_tokens": 5147856768} +{"current_steps": 17550, "total_steps": 29667, "loss": 0.3565, "lr": 3.0124308382060446e-05, "epoch": 1.774743229150207, "percentage": 59.16, "elapsed_time": "2 days, 3:28:04", "remaining_time": "1 day, 
11:32:05", "throughput": 27799.1, "total_tokens": 5150736384} +{"current_steps": 17560, "total_steps": 29667, "loss": 0.3561, "lr": 3.011884246501183e-05, "epoch": 1.7757545112663147, "percentage": 59.19, "elapsed_time": "2 days, 3:29:51", "remaining_time": "1 day, 11:30:20", "throughput": 27798.86, "total_tokens": 5153669632} +{"current_steps": 17570, "total_steps": 29667, "loss": 0.3548, "lr": 3.0113379522180363e-05, "epoch": 1.7767657933824226, "percentage": 59.22, "elapsed_time": "2 days, 3:31:34", "remaining_time": "1 day, 11:28:33", "throughput": 27799.17, "total_tokens": 5156594496} +{"current_steps": 17580, "total_steps": 29667, "loss": 0.3518, "lr": 3.0107919550869702e-05, "epoch": 1.7777770754985305, "percentage": 59.26, "elapsed_time": "2 days, 3:33:23", "remaining_time": "1 day, 11:26:50", "throughput": 27798.5, "total_tokens": 5159511552} +{"current_steps": 17590, "total_steps": 29667, "loss": 0.3548, "lr": 3.0102462548386933e-05, "epoch": 1.7787883576146384, "percentage": 59.29, "elapsed_time": "2 days, 3:35:09", "remaining_time": "1 day, 11:25:04", "throughput": 27798.5, "total_tokens": 5162439488} +{"current_steps": 17600, "total_steps": 29667, "loss": 0.3525, "lr": 3.0097008512042572e-05, "epoch": 1.7797996397307463, "percentage": 59.33, "elapsed_time": "2 days, 3:36:56", "remaining_time": "1 day, 11:23:20", "throughput": 27798.33, "total_tokens": 5165381696} +{"current_steps": 17610, "total_steps": 29667, "loss": 0.3576, "lr": 3.009155743915052e-05, "epoch": 1.780810921846854, "percentage": 59.36, "elapsed_time": "2 days, 3:38:43", "remaining_time": "1 day, 11:21:35", "throughput": 27798.05, "total_tokens": 5168307328} +{"current_steps": 17620, "total_steps": 29667, "loss": 0.3547, "lr": 3.00861093270281e-05, "epoch": 1.7818222039629616, "percentage": 59.39, "elapsed_time": "2 days, 3:40:31", "remaining_time": "1 day, 11:19:52", "throughput": 27797.86, "total_tokens": 5171282944} +{"current_steps": 17630, "total_steps": 29667, "loss": 0.3569, 
"lr": 3.008066417299602e-05, "epoch": 1.7828334860790696, "percentage": 59.43, "elapsed_time": "2 days, 3:42:19", "remaining_time": "1 day, 11:18:07", "throughput": 27797.65, "total_tokens": 5174234112} +{"current_steps": 17640, "total_steps": 29667, "loss": 0.3537, "lr": 3.00752219743784e-05, "epoch": 1.7838447681951775, "percentage": 59.46, "elapsed_time": "2 days, 3:44:05", "remaining_time": "1 day, 11:16:22", "throughput": 27797.71, "total_tokens": 5177202688} +{"current_steps": 17650, "total_steps": 29667, "loss": 0.3531, "lr": 3.0069782728502737e-05, "epoch": 1.7848560503112854, "percentage": 59.49, "elapsed_time": "2 days, 3:45:49", "remaining_time": "1 day, 11:14:36", "throughput": 27797.73, "total_tokens": 5180099712} +{"current_steps": 17660, "total_steps": 29667, "loss": 0.3528, "lr": 3.00643464326999e-05, "epoch": 1.7858673324273933, "percentage": 59.53, "elapsed_time": "2 days, 3:47:43", "remaining_time": "1 day, 11:12:56", "throughput": 27797.08, "total_tokens": 5183137408} +{"current_steps": 17670, "total_steps": 29667, "loss": 0.354, "lr": 3.0058913084304146e-05, "epoch": 1.786878614543501, "percentage": 59.56, "elapsed_time": "2 days, 3:49:29", "remaining_time": "1 day, 11:11:11", "throughput": 27797.11, "total_tokens": 5186097600} +{"current_steps": 17680, "total_steps": 29667, "loss": 0.3528, "lr": 3.0053482680653112e-05, "epoch": 1.7878898966596086, "percentage": 59.59, "elapsed_time": "2 days, 3:51:15", "remaining_time": "1 day, 11:09:25", "throughput": 27797.11, "total_tokens": 5189031744} +{"current_steps": 17690, "total_steps": 29667, "loss": 0.3529, "lr": 3.0048055219087777e-05, "epoch": 1.7889011787757165, "percentage": 59.63, "elapsed_time": "2 days, 3:53:02", "remaining_time": "1 day, 11:07:41", "throughput": 27796.93, "total_tokens": 5191992960} +{"current_steps": 17700, "total_steps": 29667, "loss": 0.357, "lr": 3.0042630696952507e-05, "epoch": 1.7899124608918244, "percentage": 59.66, "elapsed_time": "2 days, 3:54:46", 
"remaining_time": "1 day, 11:05:54", "throughput": 27797.15, "total_tokens": 5194922624} +{"current_steps": 17710, "total_steps": 29667, "loss": 0.3511, "lr": 3.0037209111594994e-05, "epoch": 1.7909237430079323, "percentage": 59.7, "elapsed_time": "2 days, 3:56:35", "remaining_time": "1 day, 11:04:10", "throughput": 27796.95, "total_tokens": 5197897984} +{"current_steps": 17720, "total_steps": 29667, "loss": 0.3528, "lr": 3.0031790460366305e-05, "epoch": 1.7919350251240402, "percentage": 59.73, "elapsed_time": "2 days, 3:58:17", "remaining_time": "1 day, 11:02:23", "throughput": 27797.37, "total_tokens": 5200825600} +{"current_steps": 17730, "total_steps": 29667, "loss": 0.3543, "lr": 3.002637474062083e-05, "epoch": 1.792946307240148, "percentage": 59.76, "elapsed_time": "2 days, 4:00:01", "remaining_time": "1 day, 11:00:36", "throughput": 27797.5, "total_tokens": 5203726528} +{"current_steps": 17740, "total_steps": 29667, "loss": 0.3588, "lr": 3.0020961949716325e-05, "epoch": 1.7939575893562556, "percentage": 59.8, "elapsed_time": "2 days, 4:01:45", "remaining_time": "1 day, 10:58:49", "throughput": 27797.89, "total_tokens": 5206694528} +{"current_steps": 17750, "total_steps": 29667, "loss": 0.3526, "lr": 3.0015552085013847e-05, "epoch": 1.7949688714723635, "percentage": 59.83, "elapsed_time": "2 days, 4:03:25", "remaining_time": "1 day, 10:57:00", "throughput": 27798.34, "total_tokens": 5209563136} +{"current_steps": 17760, "total_steps": 29667, "loss": 0.3536, "lr": 3.0010145143877805e-05, "epoch": 1.7959801535884714, "percentage": 59.86, "elapsed_time": "2 days, 4:05:19", "remaining_time": "1 day, 10:55:20", "throughput": 27797.04, "total_tokens": 5212499584} +{"current_steps": 17770, "total_steps": 29667, "loss": 0.3537, "lr": 3.0004741123675907e-05, "epoch": 1.7969914357045793, "percentage": 59.9, "elapsed_time": "2 days, 4:07:34", "remaining_time": "1 day, 10:53:54", "throughput": 27792.68, "total_tokens": 5215419328} +{"current_steps": 17780, "total_steps": 
29667, "loss": 0.3516, "lr": 2.9999340021779205e-05, "epoch": 1.798002717820687, "percentage": 59.93, "elapsed_time": "2 days, 4:10:13", "remaining_time": "1 day, 10:52:44", "throughput": 27784.99, "total_tokens": 5218407040} +{"current_steps": 17790, "total_steps": 29667, "loss": 0.357, "lr": 2.999394183556204e-05, "epoch": 1.799013999936795, "percentage": 59.97, "elapsed_time": "2 days, 4:12:10", "remaining_time": "1 day, 10:51:06", "throughput": 27783.37, "total_tokens": 5221345536} +{"current_steps": 17800, "total_steps": 29667, "loss": 0.3488, "lr": 2.998854656240207e-05, "epoch": 1.8000252820529026, "percentage": 60.0, "elapsed_time": "2 days, 4:13:53", "remaining_time": "1 day, 10:49:19", "throughput": 27783.62, "total_tokens": 5224249856} +{"current_steps": 17810, "total_steps": 29667, "loss": 0.3553, "lr": 2.9983154199680257e-05, "epoch": 1.8010365641690105, "percentage": 60.03, "elapsed_time": "2 days, 4:15:36", "remaining_time": "1 day, 10:47:32", "throughput": 27783.86, "total_tokens": 5227168512} +{"current_steps": 17820, "total_steps": 29667, "loss": 0.3536, "lr": 2.9977764744780845e-05, "epoch": 1.8020478462851184, "percentage": 60.07, "elapsed_time": "2 days, 4:17:20", "remaining_time": "1 day, 10:45:44", "throughput": 27783.98, "total_tokens": 5230067776} +{"current_steps": 17830, "total_steps": 29667, "loss": 0.3558, "lr": 2.9972378195091384e-05, "epoch": 1.8030591284012263, "percentage": 60.1, "elapsed_time": "2 days, 4:19:04", "remaining_time": "1 day, 10:43:58", "throughput": 27784.28, "total_tokens": 5233002688} +{"current_steps": 17840, "total_steps": 29667, "loss": 0.3555, "lr": 2.996699454800269e-05, "epoch": 1.804070410517334, "percentage": 60.13, "elapsed_time": "2 days, 4:20:59", "remaining_time": "1 day, 10:42:19", "throughput": 27782.87, "total_tokens": 5235949696} +{"current_steps": 17850, "total_steps": 29667, "loss": 0.3517, "lr": 2.9961613800908883e-05, "epoch": 1.8050816926334419, "percentage": 60.17, "elapsed_time": "2 days, 
4:22:53", "remaining_time": "1 day, 10:40:38", "throughput": 27781.49, "total_tokens": 5238852352} +{"current_steps": 17860, "total_steps": 29667, "loss": 0.3568, "lr": 2.995623595120733e-05, "epoch": 1.8060929747495496, "percentage": 60.2, "elapsed_time": "2 days, 4:24:39", "remaining_time": "1 day, 10:38:53", "throughput": 27781.5, "total_tokens": 5241806784} +{"current_steps": 17870, "total_steps": 29667, "loss": 0.3598, "lr": 2.995086099629869e-05, "epoch": 1.8071042568656575, "percentage": 60.24, "elapsed_time": "2 days, 4:26:24", "remaining_time": "1 day, 10:37:07", "throughput": 27781.62, "total_tokens": 5244747584} +{"current_steps": 17880, "total_steps": 29667, "loss": 0.3524, "lr": 2.9945488933586867e-05, "epoch": 1.8081155389817654, "percentage": 60.27, "elapsed_time": "2 days, 4:28:11", "remaining_time": "1 day, 10:35:22", "throughput": 27781.31, "total_tokens": 5247662272} +{"current_steps": 17890, "total_steps": 29667, "loss": 0.356, "lr": 2.9940119760479045e-05, "epoch": 1.8091268210978733, "percentage": 60.3, "elapsed_time": "2 days, 4:29:58", "remaining_time": "1 day, 10:33:37", "throughput": 27781.32, "total_tokens": 5250621440} +{"current_steps": 17900, "total_steps": 29667, "loss": 0.3528, "lr": 2.9934753474385635e-05, "epoch": 1.810138103213981, "percentage": 60.34, "elapsed_time": "2 days, 4:31:44", "remaining_time": "1 day, 10:31:52", "throughput": 27781.31, "total_tokens": 5253579584} +{"current_steps": 17910, "total_steps": 29667, "loss": 0.3572, "lr": 2.9929390072720314e-05, "epoch": 1.8111493853300888, "percentage": 60.37, "elapsed_time": "2 days, 4:33:31", "remaining_time": "1 day, 10:30:07", "throughput": 27781.04, "total_tokens": 5256492416} +{"current_steps": 17920, "total_steps": 29667, "loss": 0.3536, "lr": 2.99240295529e-05, "epoch": 1.8121606674461965, "percentage": 60.4, "elapsed_time": "2 days, 4:35:29", "remaining_time": "1 day, 10:28:30", "throughput": 27779.12, "total_tokens": 5259401216} +{"current_steps": 17930, 
"total_steps": 29667, "loss": 0.3515, "lr": 2.991867191234484e-05, "epoch": 1.8131719495623044, "percentage": 60.44, "elapsed_time": "2 days, 4:37:19", "remaining_time": "1 day, 10:26:47", "throughput": 27778.52, "total_tokens": 5262360640} +{"current_steps": 17940, "total_steps": 29667, "loss": 0.3552, "lr": 2.991331714847822e-05, "epoch": 1.8141832316784123, "percentage": 60.47, "elapsed_time": "2 days, 4:39:05", "remaining_time": "1 day, 10:25:02", "throughput": 27778.46, "total_tokens": 5265285888} +{"current_steps": 17950, "total_steps": 29667, "loss": 0.3493, "lr": 2.990796525872675e-05, "epoch": 1.8151945137945202, "percentage": 60.5, "elapsed_time": "2 days, 4:40:48", "remaining_time": "1 day, 10:23:14", "throughput": 27778.67, "total_tokens": 5268177280} +{"current_steps": 17960, "total_steps": 29667, "loss": 0.3507, "lr": 2.990261624052027e-05, "epoch": 1.816205795910628, "percentage": 60.54, "elapsed_time": "2 days, 4:42:32", "remaining_time": "1 day, 10:21:27", "throughput": 27778.67, "total_tokens": 5271061120} +{"current_steps": 17970, "total_steps": 29667, "loss": 0.3534, "lr": 2.989727009129182e-05, "epoch": 1.8172170780267358, "percentage": 60.57, "elapsed_time": "2 days, 4:44:15", "remaining_time": "1 day, 10:19:40", "throughput": 27778.97, "total_tokens": 5273997696} +{"current_steps": 17980, "total_steps": 29667, "loss": 0.3491, "lr": 2.989192680847766e-05, "epoch": 1.8182283601428435, "percentage": 60.61, "elapsed_time": "2 days, 4:46:00", "remaining_time": "1 day, 10:17:54", "throughput": 27779.0, "total_tokens": 5276912192} +{"current_steps": 17990, "total_steps": 29667, "loss": 0.353, "lr": 2.9886586389517267e-05, "epoch": 1.8192396422589514, "percentage": 60.64, "elapsed_time": "2 days, 4:47:49", "remaining_time": "1 day, 10:16:11", "throughput": 27778.43, "total_tokens": 5279840000} +{"current_steps": 18000, "total_steps": 29667, "loss": 0.3536, "lr": 2.98812488318533e-05, "epoch": 1.8202509243750593, "percentage": 60.67, "elapsed_time": 
"2 days, 4:49:34", "remaining_time": "1 day, 10:14:24", "throughput": 27778.75, "total_tokens": 5282813120} +{"current_steps": 18010, "total_steps": 29667, "loss": 0.3569, "lr": 2.987591413293162e-05, "epoch": 1.8212622064911672, "percentage": 60.71, "elapsed_time": "2 days, 4:51:21", "remaining_time": "1 day, 10:12:39", "throughput": 27778.81, "total_tokens": 5285783040} +{"current_steps": 18020, "total_steps": 29667, "loss": 0.3547, "lr": 2.98705822902013e-05, "epoch": 1.822273488607275, "percentage": 60.74, "elapsed_time": "2 days, 4:53:04", "remaining_time": "1 day, 10:10:52", "throughput": 27779.18, "total_tokens": 5288719232} +{"current_steps": 18030, "total_steps": 29667, "loss": 0.3498, "lr": 2.9865253301114553e-05, "epoch": 1.8232847707233826, "percentage": 60.77, "elapsed_time": "2 days, 4:54:50", "remaining_time": "1 day, 10:09:07", "throughput": 27779.31, "total_tokens": 5291700544} +{"current_steps": 18040, "total_steps": 29667, "loss": 0.3549, "lr": 2.985992716312683e-05, "epoch": 1.8242960528394905, "percentage": 60.81, "elapsed_time": "2 days, 4:56:36", "remaining_time": "1 day, 10:07:21", "throughput": 27779.44, "total_tokens": 5294666368} +{"current_steps": 18050, "total_steps": 29667, "loss": 0.3561, "lr": 2.9854603873696703e-05, "epoch": 1.8253073349555984, "percentage": 60.84, "elapsed_time": "2 days, 4:58:17", "remaining_time": "1 day, 10:05:33", "throughput": 27780.12, "total_tokens": 5297598400} +{"current_steps": 18060, "total_steps": 29667, "loss": 0.3567, "lr": 2.9849283430285947e-05, "epoch": 1.8263186170717063, "percentage": 60.88, "elapsed_time": "2 days, 5:00:03", "remaining_time": "1 day, 10:03:48", "throughput": 27779.96, "total_tokens": 5300527296} +{"current_steps": 18070, "total_steps": 29667, "loss": 0.3528, "lr": 2.98439658303595e-05, "epoch": 1.8273298991878142, "percentage": 60.91, "elapsed_time": "2 days, 5:01:57", "remaining_time": "1 day, 10:02:07", "throughput": 27778.87, "total_tokens": 5303465792} +{"current_steps": 
18080, "total_steps": 29667, "loss": 0.3492, "lr": 2.9838651071385442e-05, "epoch": 1.8283411813039219, "percentage": 60.94, "elapsed_time": "2 days, 5:03:38", "remaining_time": "1 day, 10:00:18", "throughput": 27779.56, "total_tokens": 5306414080} +{"current_steps": 18090, "total_steps": 29667, "loss": 0.3551, "lr": 2.9833339150835037e-05, "epoch": 1.8293524634200296, "percentage": 60.98, "elapsed_time": "2 days, 5:05:26", "remaining_time": "1 day, 9:58:34", "throughput": 27779.48, "total_tokens": 5309390464} +{"current_steps": 18100, "total_steps": 29667, "loss": 0.3537, "lr": 2.982803006618267e-05, "epoch": 1.8303637455361375, "percentage": 61.01, "elapsed_time": "2 days, 5:07:06", "remaining_time": "1 day, 9:56:45", "throughput": 27780.13, "total_tokens": 5312308544} +{"current_steps": 18110, "total_steps": 29667, "loss": 0.3546, "lr": 2.982272381490588e-05, "epoch": 1.8313750276522454, "percentage": 61.04, "elapsed_time": "2 days, 5:08:49", "remaining_time": "1 day, 9:54:58", "throughput": 27780.65, "total_tokens": 5315267904} +{"current_steps": 18120, "total_steps": 29667, "loss": 0.3574, "lr": 2.9817420394485363e-05, "epoch": 1.8323863097683533, "percentage": 61.08, "elapsed_time": "2 days, 5:10:36", "remaining_time": "1 day, 9:53:13", "throughput": 27780.53, "total_tokens": 5318214208} +{"current_steps": 18130, "total_steps": 29667, "loss": 0.357, "lr": 2.9812119802404927e-05, "epoch": 1.8333975918844612, "percentage": 61.11, "elapsed_time": "2 days, 5:12:24", "remaining_time": "1 day, 9:51:28", "throughput": 27780.4, "total_tokens": 5321174016} +{"current_steps": 18140, "total_steps": 29667, "loss": 0.3503, "lr": 2.9806822036151523e-05, "epoch": 1.8344088740005688, "percentage": 61.15, "elapsed_time": "2 days, 5:14:09", "remaining_time": "1 day, 9:49:42", "throughput": 27780.45, "total_tokens": 5324098432} +{"current_steps": 18150, "total_steps": 29667, "loss": 0.3528, "lr": 2.980152709321522e-05, "epoch": 1.8354201561166765, "percentage": 61.18, 
"elapsed_time": "2 days, 5:15:54", "remaining_time": "1 day, 9:47:56", "throughput": 27780.59, "total_tokens": 5327050048} +{"current_steps": 18160, "total_steps": 29667, "loss": 0.3555, "lr": 2.9796234971089214e-05, "epoch": 1.8364314382327844, "percentage": 61.21, "elapsed_time": "2 days, 5:17:39", "remaining_time": "1 day, 9:46:11", "throughput": 27780.77, "total_tokens": 5330010816} +{"current_steps": 18170, "total_steps": 29667, "loss": 0.3536, "lr": 2.979094566726981e-05, "epoch": 1.8374427203488923, "percentage": 61.25, "elapsed_time": "2 days, 5:19:29", "remaining_time": "1 day, 9:44:27", "throughput": 27780.5, "total_tokens": 5333004608} +{"current_steps": 18180, "total_steps": 29667, "loss": 0.3534, "lr": 2.9785659179256427e-05, "epoch": 1.8384540024650002, "percentage": 61.28, "elapsed_time": "2 days, 5:21:12", "remaining_time": "1 day, 9:42:40", "throughput": 27780.75, "total_tokens": 5335921216} +{"current_steps": 18190, "total_steps": 29667, "loss": 0.3555, "lr": 2.978037550455159e-05, "epoch": 1.8394652845811081, "percentage": 61.31, "elapsed_time": "2 days, 5:23:01", "remaining_time": "1 day, 9:40:57", "throughput": 27780.23, "total_tokens": 5338851840} +{"current_steps": 18200, "total_steps": 29667, "loss": 0.3496, "lr": 2.977509464066091e-05, "epoch": 1.8404765666972158, "percentage": 61.35, "elapsed_time": "2 days, 5:24:45", "remaining_time": "1 day, 9:39:10", "throughput": 27780.49, "total_tokens": 5341780032} +{"current_steps": 18210, "total_steps": 29667, "loss": 0.3512, "lr": 2.9769816585093126e-05, "epoch": 1.8414878488133235, "percentage": 61.38, "elapsed_time": "2 days, 5:26:31", "remaining_time": "1 day, 9:37:24", "throughput": 27780.52, "total_tokens": 5344724544} +{"current_steps": 18220, "total_steps": 29667, "loss": 0.3527, "lr": 2.9764541335360024e-05, "epoch": 1.8424991309294314, "percentage": 61.42, "elapsed_time": "2 days, 5:28:17", "remaining_time": "1 day, 9:35:39", "throughput": 27780.39, "total_tokens": 5347664000} 
+{"current_steps": 18230, "total_steps": 29667, "loss": 0.3528, "lr": 2.9759268888976505e-05, "epoch": 1.8435104130455393, "percentage": 61.45, "elapsed_time": "2 days, 5:30:01", "remaining_time": "1 day, 9:33:52", "throughput": 27780.68, "total_tokens": 5350593472} +{"current_steps": 18240, "total_steps": 29667, "loss": 0.3554, "lr": 2.9753999243460546e-05, "epoch": 1.8445216951616472, "percentage": 61.48, "elapsed_time": "2 days, 5:31:40", "remaining_time": "1 day, 9:32:03", "throughput": 27781.22, "total_tokens": 5353456832} +{"current_steps": 18250, "total_steps": 29667, "loss": 0.3498, "lr": 2.974873239633319e-05, "epoch": 1.8455329772777551, "percentage": 61.52, "elapsed_time": "2 days, 5:33:24", "remaining_time": "1 day, 9:30:16", "throughput": 27781.45, "total_tokens": 5356385280} +{"current_steps": 18260, "total_steps": 29667, "loss": 0.3581, "lr": 2.9743468345118563e-05, "epoch": 1.8465442593938628, "percentage": 61.55, "elapsed_time": "2 days, 5:35:09", "remaining_time": "1 day, 9:28:30", "throughput": 27781.53, "total_tokens": 5359332672} +{"current_steps": 18270, "total_steps": 29667, "loss": 0.3583, "lr": 2.9738207087343844e-05, "epoch": 1.8475555415099705, "percentage": 61.58, "elapsed_time": "2 days, 5:36:55", "remaining_time": "1 day, 9:26:44", "throughput": 27781.52, "total_tokens": 5362253120} +{"current_steps": 18280, "total_steps": 29667, "loss": 0.3575, "lr": 2.9732948620539287e-05, "epoch": 1.8485668236260784, "percentage": 61.62, "elapsed_time": "2 days, 5:38:41", "remaining_time": "1 day, 9:24:59", "throughput": 27781.34, "total_tokens": 5365165696} +{"current_steps": 18290, "total_steps": 29667, "loss": 0.3518, "lr": 2.9727692942238188e-05, "epoch": 1.8495781057421863, "percentage": 61.65, "elapsed_time": "2 days, 5:40:24", "remaining_time": "1 day, 9:23:12", "throughput": 27781.69, "total_tokens": 5368096192} +{"current_steps": 18300, "total_steps": 29667, "loss": 0.3508, "lr": 2.97224400499769e-05, "epoch": 1.8505893878582942, 
"percentage": 61.68, "elapsed_time": "2 days, 5:42:08", "remaining_time": "1 day, 9:21:25", "throughput": 27781.96, "total_tokens": 5371051904} +{"current_steps": 18310, "total_steps": 29667, "loss": 0.3612, "lr": 2.9717189941294826e-05, "epoch": 1.8516006699744019, "percentage": 61.72, "elapsed_time": "2 days, 5:43:53", "remaining_time": "1 day, 9:19:39", "throughput": 27782.01, "total_tokens": 5373976000} +{"current_steps": 18320, "total_steps": 29667, "loss": 0.3522, "lr": 2.97119426137344e-05, "epoch": 1.8526119520905098, "percentage": 61.75, "elapsed_time": "2 days, 5:45:37", "remaining_time": "1 day, 9:17:52", "throughput": 27782.22, "total_tokens": 5376907008} +{"current_steps": 18330, "total_steps": 29667, "loss": 0.3543, "lr": 2.9706698064841103e-05, "epoch": 1.8536232342066175, "percentage": 61.79, "elapsed_time": "2 days, 5:47:23", "remaining_time": "1 day, 9:16:07", "throughput": 27782.34, "total_tokens": 5379870016} +{"current_steps": 18340, "total_steps": 29667, "loss": 0.3567, "lr": 2.970145629216345e-05, "epoch": 1.8546345163227254, "percentage": 61.82, "elapsed_time": "2 days, 5:49:08", "remaining_time": "1 day, 9:14:21", "throughput": 27782.62, "total_tokens": 5382833536} +{"current_steps": 18350, "total_steps": 29667, "loss": 0.35, "lr": 2.969621729325296e-05, "epoch": 1.8556457984388333, "percentage": 61.85, "elapsed_time": "2 days, 5:50:49", "remaining_time": "1 day, 9:12:32", "throughput": 27783.25, "total_tokens": 5385764992} +{"current_steps": 18360, "total_steps": 29667, "loss": 0.3553, "lr": 2.969098106566421e-05, "epoch": 1.8566570805549412, "percentage": 61.89, "elapsed_time": "2 days, 5:52:38", "remaining_time": "1 day, 9:10:49", "throughput": 27782.89, "total_tokens": 5388731648} +{"current_steps": 18370, "total_steps": 29667, "loss": 0.3532, "lr": 2.968574760695476e-05, "epoch": 1.8576683626710488, "percentage": 61.92, "elapsed_time": "2 days, 5:54:20", "remaining_time": "1 day, 9:09:01", "throughput": 27783.29, "total_tokens": 
5391653376} +{"current_steps": 18380, "total_steps": 29667, "loss": 0.3534, "lr": 2.9680516914685206e-05, "epoch": 1.8586796447871567, "percentage": 61.95, "elapsed_time": "2 days, 5:56:04", "remaining_time": "1 day, 9:07:14", "throughput": 27783.71, "total_tokens": 5394608512} +{"current_steps": 18390, "total_steps": 29667, "loss": 0.351, "lr": 2.9675288986419148e-05, "epoch": 1.8596909269032644, "percentage": 61.99, "elapsed_time": "2 days, 5:57:51", "remaining_time": "1 day, 9:05:29", "throughput": 27783.67, "total_tokens": 5397568512} +{"current_steps": 18400, "total_steps": 29667, "loss": 0.353, "lr": 2.967006381972317e-05, "epoch": 1.8607022090193723, "percentage": 62.02, "elapsed_time": "2 days, 5:59:30", "remaining_time": "1 day, 9:03:39", "throughput": 27784.36, "total_tokens": 5400446912} +{"current_steps": 18410, "total_steps": 29667, "loss": 0.3552, "lr": 2.9664841412166882e-05, "epoch": 1.8617134911354802, "percentage": 62.06, "elapsed_time": "2 days, 6:01:22", "remaining_time": "1 day, 9:01:58", "throughput": 27783.44, "total_tokens": 5403386240} +{"current_steps": 18420, "total_steps": 29667, "loss": 0.3507, "lr": 2.965962176132287e-05, "epoch": 1.8627247732515881, "percentage": 62.09, "elapsed_time": "2 days, 6:03:06", "remaining_time": "1 day, 9:00:11", "throughput": 27783.47, "total_tokens": 5406292544} +{"current_steps": 18430, "total_steps": 29667, "loss": 0.3517, "lr": 2.9654404864766706e-05, "epoch": 1.8637360553676958, "percentage": 62.12, "elapsed_time": "2 days, 6:04:49", "remaining_time": "1 day, 8:58:24", "throughput": 27783.84, "total_tokens": 5409208128} +{"current_steps": 18440, "total_steps": 29667, "loss": 0.3541, "lr": 2.9649190720076962e-05, "epoch": 1.8647473374838037, "percentage": 62.16, "elapsed_time": "2 days, 6:06:32", "remaining_time": "1 day, 8:56:37", "throughput": 27783.93, "total_tokens": 5412112256} +{"current_steps": 18450, "total_steps": 29667, "loss": 0.3539, "lr": 2.9643979324835176e-05, "epoch": 1.8657586195999114, 
"percentage": 62.19, "elapsed_time": "2 days, 6:08:11", "remaining_time": "1 day, 8:54:47", "throughput": 27784.71, "total_tokens": 5414993088} +{"current_steps": 18460, "total_steps": 29667, "loss": 0.3518, "lr": 2.9638770676625866e-05, "epoch": 1.8667699017160193, "percentage": 62.22, "elapsed_time": "2 days, 6:09:55", "remaining_time": "1 day, 8:53:01", "throughput": 27784.81, "total_tokens": 5417914624} +{"current_steps": 18470, "total_steps": 29667, "loss": 0.3568, "lr": 2.9633564773036517e-05, "epoch": 1.8677811838321272, "percentage": 62.26, "elapsed_time": "2 days, 6:11:38", "remaining_time": "1 day, 8:51:13", "throughput": 27785.11, "total_tokens": 5420840064} +{"current_steps": 18480, "total_steps": 29667, "loss": 0.3518, "lr": 2.9628361611657578e-05, "epoch": 1.8687924659482351, "percentage": 62.29, "elapsed_time": "2 days, 6:13:20", "remaining_time": "1 day, 8:49:26", "throughput": 27785.44, "total_tokens": 5423738816} +{"current_steps": 18490, "total_steps": 29667, "loss": 0.3584, "lr": 2.9623161190082472e-05, "epoch": 1.8698037480643428, "percentage": 62.33, "elapsed_time": "2 days, 6:15:04", "remaining_time": "1 day, 8:47:39", "throughput": 27785.82, "total_tokens": 5426694272} +{"current_steps": 18500, "total_steps": 29667, "loss": 0.3541, "lr": 2.9617963505907554e-05, "epoch": 1.8708150301804507, "percentage": 62.36, "elapsed_time": "2 days, 6:16:43", "remaining_time": "1 day, 8:45:49", "throughput": 27786.4, "total_tokens": 5429558272} +{"current_steps": 18510, "total_steps": 29667, "loss": 0.3546, "lr": 2.9612768556732145e-05, "epoch": 1.8718263122965584, "percentage": 62.39, "elapsed_time": "2 days, 6:18:28", "remaining_time": "1 day, 8:44:03", "throughput": 27786.38, "total_tokens": 5432480640} +{"current_steps": 18520, "total_steps": 29667, "loss": 0.3531, "lr": 2.960757634015852e-05, "epoch": 1.8728375944126663, "percentage": 62.43, "elapsed_time": "2 days, 6:20:12", "remaining_time": "1 day, 8:42:17", "throughput": 27786.81, "total_tokens": 
5435444608} +{"current_steps": 18530, "total_steps": 29667, "loss": 0.3524, "lr": 2.9602386853791885e-05, "epoch": 1.8738488765287742, "percentage": 62.46, "elapsed_time": "2 days, 6:21:54", "remaining_time": "1 day, 8:40:29", "throughput": 27787.3, "total_tokens": 5438389312} +{"current_steps": 18540, "total_steps": 29667, "loss": 0.3568, "lr": 2.959720009524038e-05, "epoch": 1.874860158644882, "percentage": 62.49, "elapsed_time": "2 days, 6:23:37", "remaining_time": "1 day, 8:38:42", "throughput": 27787.6, "total_tokens": 5441300608} +{"current_steps": 18550, "total_steps": 29667, "loss": 0.352, "lr": 2.9592016062115085e-05, "epoch": 1.8758714407609898, "percentage": 62.53, "elapsed_time": "2 days, 6:25:27", "remaining_time": "1 day, 8:36:59", "throughput": 27786.67, "total_tokens": 5444178368} +{"current_steps": 18560, "total_steps": 29667, "loss": 0.3521, "lr": 2.9586834752030002e-05, "epoch": 1.8768827228770977, "percentage": 62.56, "elapsed_time": "2 days, 6:27:34", "remaining_time": "1 day, 8:35:26", "throughput": 27783.47, "total_tokens": 5447068096} +{"current_steps": 18570, "total_steps": 29667, "loss": 0.3525, "lr": 2.958165616260206e-05, "epoch": 1.8778940049932054, "percentage": 62.59, "elapsed_time": "2 days, 6:29:28", "remaining_time": "1 day, 8:33:45", "throughput": 27782.21, "total_tokens": 5450003584} +{"current_steps": 18580, "total_steps": 29667, "loss": 0.3497, "lr": 2.9576480291451114e-05, "epoch": 1.8789052871093133, "percentage": 62.63, "elapsed_time": "2 days, 6:31:18", "remaining_time": "1 day, 8:32:02", "throughput": 27781.61, "total_tokens": 5452920000} +{"current_steps": 18590, "total_steps": 29667, "loss": 0.3532, "lr": 2.957130713619991e-05, "epoch": 1.8799165692254212, "percentage": 62.66, "elapsed_time": "2 days, 6:33:07", "remaining_time": "1 day, 8:30:19", "throughput": 27781.14, "total_tokens": 5455875904} +{"current_steps": 18600, "total_steps": 29667, "loss": 0.3541, "lr": 2.9566136694474138e-05, "epoch": 1.880927851341529, 
"percentage": 62.7, "elapsed_time": "2 days, 6:34:56", "remaining_time": "1 day, 8:28:35", "throughput": 27780.66, "total_tokens": 5458797824} +{"current_steps": 18610, "total_steps": 29667, "loss": 0.3516, "lr": 2.9560968963902365e-05, "epoch": 1.8819391334576367, "percentage": 62.73, "elapsed_time": "2 days, 6:36:44", "remaining_time": "1 day, 8:26:50", "throughput": 27780.37, "total_tokens": 5461735616} +{"current_steps": 18620, "total_steps": 29667, "loss": 0.3532, "lr": 2.9555803942116062e-05, "epoch": 1.8829504155737444, "percentage": 62.76, "elapsed_time": "2 days, 6:38:33", "remaining_time": "1 day, 8:25:07", "throughput": 27779.98, "total_tokens": 5464688320} +{"current_steps": 18630, "total_steps": 29667, "loss": 0.351, "lr": 2.955064162674961e-05, "epoch": 1.8839616976898523, "percentage": 62.8, "elapsed_time": "2 days, 6:40:13", "remaining_time": "1 day, 8:23:18", "throughput": 27780.43, "total_tokens": 5467576448} +{"current_steps": 18640, "total_steps": 29667, "loss": 0.356, "lr": 2.9545482015440266e-05, "epoch": 1.8849729798059602, "percentage": 62.83, "elapsed_time": "2 days, 6:42:10", "remaining_time": "1 day, 8:21:39", "throughput": 27778.87, "total_tokens": 5470506624} +{"current_steps": 18650, "total_steps": 29667, "loss": 0.3508, "lr": 2.954032510582819e-05, "epoch": 1.8859842619220681, "percentage": 62.86, "elapsed_time": "2 days, 6:44:01", "remaining_time": "1 day, 8:19:57", "throughput": 27777.88, "total_tokens": 5473405760} +{"current_steps": 18660, "total_steps": 29667, "loss": 0.3554, "lr": 2.95351708955564e-05, "epoch": 1.886995544038176, "percentage": 62.9, "elapsed_time": "2 days, 6:45:50", "remaining_time": "1 day, 8:18:13", "throughput": 27777.58, "total_tokens": 5476357184} +{"current_steps": 18670, "total_steps": 29667, "loss": 0.358, "lr": 2.9530019382270823e-05, "epoch": 1.8880068261542837, "percentage": 62.93, "elapsed_time": "2 days, 6:47:36", "remaining_time": "1 day, 8:16:28", "throughput": 27777.62, "total_tokens": 
5479317248} +{"current_steps": 18680, "total_steps": 29667, "loss": 0.3539, "lr": 2.9524870563620233e-05, "epoch": 1.8890181082703914, "percentage": 62.97, "elapsed_time": "2 days, 6:49:20", "remaining_time": "1 day, 8:14:41", "throughput": 27777.96, "total_tokens": 5482260544} +{"current_steps": 18690, "total_steps": 29667, "loss": 0.3506, "lr": 2.9519724437256287e-05, "epoch": 1.8900293903864993, "percentage": 63.0, "elapsed_time": "2 days, 6:51:06", "remaining_time": "1 day, 8:12:55", "throughput": 27777.89, "total_tokens": 5485205760} +{"current_steps": 18700, "total_steps": 29667, "loss": 0.3573, "lr": 2.9514581000833496e-05, "epoch": 1.8910406725026072, "percentage": 63.03, "elapsed_time": "2 days, 6:52:50", "remaining_time": "1 day, 8:11:09", "throughput": 27778.06, "total_tokens": 5488122048} +{"current_steps": 18710, "total_steps": 29667, "loss": 0.3569, "lr": 2.950944025200924e-05, "epoch": 1.8920519546187151, "percentage": 63.07, "elapsed_time": "2 days, 6:54:37", "remaining_time": "1 day, 8:09:24", "throughput": 27777.86, "total_tokens": 5491059008} +{"current_steps": 18720, "total_steps": 29667, "loss": 0.3555, "lr": 2.950430218844375e-05, "epoch": 1.893063236734823, "percentage": 63.1, "elapsed_time": "2 days, 6:56:27", "remaining_time": "1 day, 8:07:41", "throughput": 27777.48, "total_tokens": 5494029568} +{"current_steps": 18730, "total_steps": 29667, "loss": 0.3547, "lr": 2.9499166807800106e-05, "epoch": 1.8940745188509307, "percentage": 63.13, "elapsed_time": "2 days, 6:58:17", "remaining_time": "1 day, 8:05:58", "throughput": 27776.93, "total_tokens": 5496993216} +{"current_steps": 18740, "total_steps": 29667, "loss": 0.355, "lr": 2.949403410774424e-05, "epoch": 1.8950858009670384, "percentage": 63.17, "elapsed_time": "2 days, 7:00:01", "remaining_time": "1 day, 8:04:11", "throughput": 27777.16, "total_tokens": 5499918208} +{"current_steps": 18750, "total_steps": 29667, "loss": 0.3542, "lr": 2.948890408594492e-05, "epoch": 1.8960970830831463, 
"percentage": 63.2, "elapsed_time": "2 days, 7:01:46", "remaining_time": "1 day, 8:02:25", "throughput": 27777.35, "total_tokens": 5502872640} +{"current_steps": 18760, "total_steps": 29667, "loss": 0.3531, "lr": 2.9483776740073748e-05, "epoch": 1.8971083651992542, "percentage": 63.24, "elapsed_time": "2 days, 7:03:29", "remaining_time": "1 day, 8:00:38", "throughput": 27777.62, "total_tokens": 5505792448} +{"current_steps": 18770, "total_steps": 29667, "loss": 0.3493, "lr": 2.947865206780518e-05, "epoch": 1.898119647315362, "percentage": 63.27, "elapsed_time": "2 days, 7:05:16", "remaining_time": "1 day, 7:58:53", "throughput": 27777.52, "total_tokens": 5508746752} +{"current_steps": 18780, "total_steps": 29667, "loss": 0.3522, "lr": 2.947353006681647e-05, "epoch": 1.89913092943147, "percentage": 63.3, "elapsed_time": "2 days, 7:07:05", "remaining_time": "1 day, 7:57:09", "throughput": 27777.38, "total_tokens": 5511737408} +{"current_steps": 18790, "total_steps": 29667, "loss": 0.3498, "lr": 2.9468410734787717e-05, "epoch": 1.9001422115475777, "percentage": 63.34, "elapsed_time": "2 days, 7:08:51", "remaining_time": "1 day, 7:55:24", "throughput": 27777.13, "total_tokens": 5514641280} +{"current_steps": 18800, "total_steps": 29667, "loss": 0.3535, "lr": 2.9463294069401838e-05, "epoch": 1.9011534936636854, "percentage": 63.37, "elapsed_time": "2 days, 7:10:38", "remaining_time": "1 day, 7:53:39", "throughput": 27777.13, "total_tokens": 5517606912} +{"current_steps": 18810, "total_steps": 29667, "loss": 0.35, "lr": 2.9458180068344555e-05, "epoch": 1.9021647757797933, "percentage": 63.4, "elapsed_time": "2 days, 7:12:24", "remaining_time": "1 day, 7:51:54", "throughput": 27777.11, "total_tokens": 5520553664} +{"current_steps": 18820, "total_steps": 29667, "loss": 0.3557, "lr": 2.9453068729304407e-05, "epoch": 1.9031760578959012, "percentage": 63.44, "elapsed_time": "2 days, 7:14:07", "remaining_time": "1 day, 7:50:06", "throughput": 27777.48, "total_tokens": 
5523492224} +{"current_steps": 18830, "total_steps": 29667, "loss": 0.3555, "lr": 2.944796004997274e-05, "epoch": 1.904187340012009, "percentage": 63.47, "elapsed_time": "2 days, 7:15:53", "remaining_time": "1 day, 7:48:21", "throughput": 27777.49, "total_tokens": 5526418240} +{"current_steps": 18840, "total_steps": 29667, "loss": 0.3525, "lr": 2.94428540280437e-05, "epoch": 1.9051986221281167, "percentage": 63.5, "elapsed_time": "2 days, 7:17:39", "remaining_time": "1 day, 7:46:35", "throughput": 27777.62, "total_tokens": 5529387456} +{"current_steps": 18850, "total_steps": 29667, "loss": 0.3565, "lr": 2.9437750661214242e-05, "epoch": 1.9062099042442247, "percentage": 63.54, "elapsed_time": "2 days, 7:19:23", "remaining_time": "1 day, 7:44:49", "throughput": 27777.87, "total_tokens": 5532340672} +{"current_steps": 18860, "total_steps": 29667, "loss": 0.3488, "lr": 2.9432649947184094e-05, "epoch": 1.9072211863603323, "percentage": 63.57, "elapsed_time": "2 days, 7:21:08", "remaining_time": "1 day, 7:43:03", "throughput": 27777.91, "total_tokens": 5535271680} +{"current_steps": 18870, "total_steps": 29667, "loss": 0.3564, "lr": 2.942755188365579e-05, "epoch": 1.9082324684764402, "percentage": 63.61, "elapsed_time": "2 days, 7:22:55", "remaining_time": "1 day, 7:41:18", "throughput": 27777.71, "total_tokens": 5538206336} +{"current_steps": 18880, "total_steps": 29667, "loss": 0.3528, "lr": 2.9422456468334635e-05, "epoch": 1.9092437505925481, "percentage": 63.64, "elapsed_time": "2 days, 7:24:40", "remaining_time": "1 day, 7:39:32", "throughput": 27777.71, "total_tokens": 5541105984} +{"current_steps": 18890, "total_steps": 29667, "loss": 0.3535, "lr": 2.9417363698928734e-05, "epoch": 1.910255032708656, "percentage": 63.67, "elapsed_time": "2 days, 7:26:28", "remaining_time": "1 day, 7:37:47", "throughput": 27777.53, "total_tokens": 5544071744} +{"current_steps": 18900, "total_steps": 29667, "loss": 0.3537, "lr": 2.9412273573148946e-05, "epoch": 1.9112663148247637, 
"percentage": 63.71, "elapsed_time": "2 days, 7:28:09", "remaining_time": "1 day, 7:35:59", "throughput": 27778.06, "total_tokens": 5546985664} +{"current_steps": 18910, "total_steps": 29667, "loss": 0.3514, "lr": 2.940718608870891e-05, "epoch": 1.9122775969408716, "percentage": 63.74, "elapsed_time": "2 days, 7:29:53", "remaining_time": "1 day, 7:34:12", "throughput": 27778.26, "total_tokens": 5549901632} +{"current_steps": 18920, "total_steps": 29667, "loss": 0.3563, "lr": 2.940210124332504e-05, "epoch": 1.9132888790569793, "percentage": 63.77, "elapsed_time": "2 days, 7:31:39", "remaining_time": "1 day, 7:32:27", "throughput": 27778.29, "total_tokens": 5552851904} +{"current_steps": 18930, "total_steps": 29667, "loss": 0.3471, "lr": 2.9397019034716504e-05, "epoch": 1.9143001611730872, "percentage": 63.81, "elapsed_time": "2 days, 7:33:30", "remaining_time": "1 day, 7:30:44", "throughput": 27777.77, "total_tokens": 5555840832} +{"current_steps": 18940, "total_steps": 29667, "loss": 0.3544, "lr": 2.9391939460605233e-05, "epoch": 1.9153114432891951, "percentage": 63.84, "elapsed_time": "2 days, 7:35:19", "remaining_time": "1 day, 7:29:01", "throughput": 27777.45, "total_tokens": 5558815872} +{"current_steps": 18950, "total_steps": 29667, "loss": 0.3529, "lr": 2.9386862518715914e-05, "epoch": 1.916322725405303, "percentage": 63.88, "elapsed_time": "2 days, 7:37:05", "remaining_time": "1 day, 7:27:15", "throughput": 27777.51, "total_tokens": 5561758272} +{"current_steps": 18960, "total_steps": 29667, "loss": 0.3498, "lr": 2.9381788206775966e-05, "epoch": 1.9173340075214107, "percentage": 63.91, "elapsed_time": "2 days, 7:38:50", "remaining_time": "1 day, 7:25:29", "throughput": 27777.78, "total_tokens": 5564728064} +{"current_steps": 18970, "total_steps": 29667, "loss": 0.3508, "lr": 2.937671652251559e-05, "epoch": 1.9183452896375186, "percentage": 63.94, "elapsed_time": "2 days, 7:40:33", "remaining_time": "1 day, 7:23:42", "throughput": 27778.02, "total_tokens": 
5567640640} +{"current_steps": 18980, "total_steps": 29667, "loss": 0.3563, "lr": 2.9371647463667696e-05, "epoch": 1.9193565717536263, "percentage": 63.98, "elapsed_time": "2 days, 7:42:20", "remaining_time": "1 day, 7:21:57", "throughput": 27777.84, "total_tokens": 5570588864} +{"current_steps": 18990, "total_steps": 29667, "loss": 0.3559, "lr": 2.9366581027967943e-05, "epoch": 1.9203678538697342, "percentage": 64.01, "elapsed_time": "2 days, 7:44:05", "remaining_time": "1 day, 7:20:11", "throughput": 27778.24, "total_tokens": 5573566656} +{"current_steps": 19000, "total_steps": 29667, "loss": 0.346, "lr": 2.9361517213154726e-05, "epoch": 1.921379135985842, "percentage": 64.04, "elapsed_time": "2 days, 7:45:49", "remaining_time": "1 day, 7:18:25", "throughput": 27778.35, "total_tokens": 5576498624} +{"current_steps": 19010, "total_steps": 29667, "loss": 0.3544, "lr": 2.935645601696917e-05, "epoch": 1.92239041810195, "percentage": 64.08, "elapsed_time": "2 days, 7:47:42", "remaining_time": "1 day, 7:16:43", "throughput": 27777.45, "total_tokens": 5579435264} +{"current_steps": 19020, "total_steps": 29667, "loss": 0.3555, "lr": 2.9351397437155114e-05, "epoch": 1.9234017002180577, "percentage": 64.11, "elapsed_time": "2 days, 7:49:31", "remaining_time": "1 day, 7:14:59", "throughput": 27776.99, "total_tokens": 5582393280} +{"current_steps": 19030, "total_steps": 29667, "loss": 0.3531, "lr": 2.934634147145913e-05, "epoch": 1.9244129823341656, "percentage": 64.15, "elapsed_time": "2 days, 7:51:16", "remaining_time": "1 day, 7:13:13", "throughput": 27776.98, "total_tokens": 5585298944} +{"current_steps": 19040, "total_steps": 29667, "loss": 0.3511, "lr": 2.9341288117630495e-05, "epoch": 1.9254242644502733, "percentage": 64.18, "elapsed_time": "2 days, 7:53:04", "remaining_time": "1 day, 7:11:29", "throughput": 27776.75, "total_tokens": 5588248768} +{"current_steps": 19050, "total_steps": 29667, "loss": 0.3541, "lr": 2.933623737342121e-05, "epoch": 1.9264355465663812, 
"percentage": 64.21, "elapsed_time": "2 days, 7:54:49", "remaining_time": "1 day, 7:09:43", "throughput": 27776.83, "total_tokens": 5591180352} +{"current_steps": 19060, "total_steps": 29667, "loss": 0.3548, "lr": 2.9331189236585977e-05, "epoch": 1.927446828682489, "percentage": 64.25, "elapsed_time": "2 days, 7:56:32", "remaining_time": "1 day, 7:07:56", "throughput": 27777.0, "total_tokens": 5594080896} +{"current_steps": 19070, "total_steps": 29667, "loss": 0.3513, "lr": 2.9326143704882192e-05, "epoch": 1.928458110798597, "percentage": 64.28, "elapsed_time": "2 days, 7:58:22", "remaining_time": "1 day, 7:06:12", "throughput": 27776.21, "total_tokens": 5596980736} +{"current_steps": 19080, "total_steps": 29667, "loss": 0.3488, "lr": 2.932110077606997e-05, "epoch": 1.9294693929147047, "percentage": 64.31, "elapsed_time": "2 days, 8:00:16", "remaining_time": "1 day, 7:04:31", "throughput": 27775.05, "total_tokens": 5599916480} +{"current_steps": 19090, "total_steps": 29667, "loss": 0.3552, "lr": 2.931606044791212e-05, "epoch": 1.9304806750308126, "percentage": 64.35, "elapsed_time": "2 days, 8:02:04", "remaining_time": "1 day, 7:02:47", "throughput": 27774.81, "total_tokens": 5602861568} +{"current_steps": 19100, "total_steps": 29667, "loss": 0.3462, "lr": 2.9311022718174114e-05, "epoch": 1.9314919571469202, "percentage": 64.38, "elapsed_time": "2 days, 8:03:59", "remaining_time": "1 day, 7:01:07", "throughput": 27773.5, "total_tokens": 5605798016} +{"current_steps": 19110, "total_steps": 29667, "loss": 0.3529, "lr": 2.930598758462415e-05, "epoch": 1.9325032392630281, "percentage": 64.42, "elapsed_time": "2 days, 8:06:28", "remaining_time": "1 day, 6:59:45", "throughput": 27767.45, "total_tokens": 5608703040} +{"current_steps": 19120, "total_steps": 29667, "loss": 0.3501, "lr": 2.9300955045033072e-05, "epoch": 1.933514521379136, "percentage": 64.45, "elapsed_time": "2 days, 8:08:29", "remaining_time": "1 day, 6:58:08", "throughput": 27765.1, "total_tokens": 
5611594752} +{"current_steps": 19130, "total_steps": 29667, "loss": 0.3546, "lr": 2.9295925097174435e-05, "epoch": 1.934525803495244, "percentage": 64.48, "elapsed_time": "2 days, 8:10:13", "remaining_time": "1 day, 6:56:21", "throughput": 27765.28, "total_tokens": 5614514304} +{"current_steps": 19140, "total_steps": 29667, "loss": 0.3527, "lr": 2.929089773882445e-05, "epoch": 1.9355370856113516, "percentage": 64.52, "elapsed_time": "2 days, 8:11:56", "remaining_time": "1 day, 6:54:34", "throughput": 27765.41, "total_tokens": 5617408896} +{"current_steps": 19150, "total_steps": 29667, "loss": 0.3479, "lr": 2.9285872967762007e-05, "epoch": 1.9365483677274593, "percentage": 64.55, "elapsed_time": "2 days, 8:13:39", "remaining_time": "1 day, 6:52:46", "throughput": 27765.71, "total_tokens": 5620312192} +{"current_steps": 19160, "total_steps": 29667, "loss": 0.3545, "lr": 2.9280850781768638e-05, "epoch": 1.9375596498435672, "percentage": 64.58, "elapsed_time": "2 days, 8:15:27", "remaining_time": "1 day, 6:51:02", "throughput": 27765.45, "total_tokens": 5623269888} +{"current_steps": 19170, "total_steps": 29667, "loss": 0.3532, "lr": 2.9275831178628576e-05, "epoch": 1.9385709319596751, "percentage": 64.62, "elapsed_time": "2 days, 8:17:14", "remaining_time": "1 day, 6:49:17", "throughput": 27765.4, "total_tokens": 5626232192} +{"current_steps": 19180, "total_steps": 29667, "loss": 0.3564, "lr": 2.927081415612869e-05, "epoch": 1.939582214075783, "percentage": 64.65, "elapsed_time": "2 days, 8:19:00", "remaining_time": "1 day, 6:47:31", "throughput": 27765.27, "total_tokens": 5629135104} +{"current_steps": 19190, "total_steps": 29667, "loss": 0.3527, "lr": 2.9265799712058505e-05, "epoch": 1.940593496191891, "percentage": 64.68, "elapsed_time": "2 days, 8:20:50", "remaining_time": "1 day, 6:45:48", "throughput": 27765.04, "total_tokens": 5632139136} +{"current_steps": 19200, "total_steps": 29667, "loss": 0.3542, "lr": 2.926078784421019e-05, "epoch": 1.9416047783079986, 
"percentage": 64.72, "elapsed_time": "2 days, 8:22:38", "remaining_time": "1 day, 6:44:04", "throughput": 27764.99, "total_tokens": 5635145984} +{"current_steps": 19210, "total_steps": 29667, "loss": 0.3604, "lr": 2.9255778550378575e-05, "epoch": 1.9426160604241063, "percentage": 64.75, "elapsed_time": "2 days, 8:24:39", "remaining_time": "1 day, 6:42:26", "throughput": 27763.17, "total_tokens": 5638142848} +{"current_steps": 19220, "total_steps": 29667, "loss": 0.3525, "lr": 2.9250771828361118e-05, "epoch": 1.9436273425402142, "percentage": 64.79, "elapsed_time": "2 days, 8:26:32", "remaining_time": "1 day, 6:40:45", "throughput": 27762.15, "total_tokens": 5641073600} +{"current_steps": 19230, "total_steps": 29667, "loss": 0.3537, "lr": 2.9245767675957923e-05, "epoch": 1.944638624656322, "percentage": 64.82, "elapsed_time": "2 days, 8:28:23", "remaining_time": "1 day, 6:39:01", "throughput": 27761.78, "total_tokens": 5644059328} +{"current_steps": 19240, "total_steps": 29667, "loss": 0.3536, "lr": 2.924076609097172e-05, "epoch": 1.94564990677243, "percentage": 64.85, "elapsed_time": "2 days, 8:30:06", "remaining_time": "1 day, 6:37:14", "throughput": 27762.06, "total_tokens": 5646980224} +{"current_steps": 19250, "total_steps": 29667, "loss": 0.3492, "lr": 2.9235767071207876e-05, "epoch": 1.946661188888538, "percentage": 64.89, "elapsed_time": "2 days, 8:31:50", "remaining_time": "1 day, 6:35:28", "throughput": 27762.3, "total_tokens": 5649924800} +{"current_steps": 19260, "total_steps": 29667, "loss": 0.3574, "lr": 2.9230770614474383e-05, "epoch": 1.9476724710046456, "percentage": 64.92, "elapsed_time": "2 days, 8:33:34", "remaining_time": "1 day, 6:33:41", "throughput": 27762.47, "total_tokens": 5652841088} +{"current_steps": 19270, "total_steps": 29667, "loss": 0.35, "lr": 2.9225776718581842e-05, "epoch": 1.9486837531207533, "percentage": 64.95, "elapsed_time": "2 days, 8:35:19", "remaining_time": "1 day, 6:31:55", "throughput": 27762.63, "total_tokens": 
5655781056} +{"current_steps": 19280, "total_steps": 29667, "loss": 0.3531, "lr": 2.9220785381343495e-05, "epoch": 1.9496950352368612, "percentage": 64.99, "elapsed_time": "2 days, 8:37:00", "remaining_time": "1 day, 6:30:07", "throughput": 27763.13, "total_tokens": 5658685504} +{"current_steps": 19290, "total_steps": 29667, "loss": 0.3514, "lr": 2.9215796600575174e-05, "epoch": 1.950706317352969, "percentage": 65.02, "elapsed_time": "2 days, 8:38:46", "remaining_time": "1 day, 6:28:21", "throughput": 27763.17, "total_tokens": 5661659136} +{"current_steps": 19300, "total_steps": 29667, "loss": 0.3501, "lr": 2.9210810374095332e-05, "epoch": 1.951717599469077, "percentage": 65.06, "elapsed_time": "2 days, 8:40:29", "remaining_time": "1 day, 6:26:34", "throughput": 27763.62, "total_tokens": 5664594112} +{"current_steps": 19310, "total_steps": 29667, "loss": 0.3549, "lr": 2.9205826699725026e-05, "epoch": 1.9527288815851849, "percentage": 65.09, "elapsed_time": "2 days, 8:42:14", "remaining_time": "1 day, 6:24:48", "throughput": 27763.76, "total_tokens": 5667531264} +{"current_steps": 19320, "total_steps": 29667, "loss": 0.3535, "lr": 2.920084557528791e-05, "epoch": 1.9537401637012926, "percentage": 65.12, "elapsed_time": "2 days, 8:43:58", "remaining_time": "1 day, 6:23:01", "throughput": 27764.01, "total_tokens": 5670469568} +{"current_steps": 19330, "total_steps": 29667, "loss": 0.3507, "lr": 2.9195866998610245e-05, "epoch": 1.9547514458174002, "percentage": 65.16, "elapsed_time": "2 days, 8:45:45", "remaining_time": "1 day, 6:21:16", "throughput": 27763.93, "total_tokens": 5673442496} +{"current_steps": 19340, "total_steps": 29667, "loss": 0.3528, "lr": 2.9190890967520878e-05, "epoch": 1.9557627279335081, "percentage": 65.19, "elapsed_time": "2 days, 8:47:30", "remaining_time": "1 day, 6:19:30", "throughput": 27763.96, "total_tokens": 5676349952} +{"current_steps": 19350, "total_steps": 29667, "loss": 0.3533, "lr": 2.9185917479851243e-05, "epoch": 1.956774010049616, 
"percentage": 65.22, "elapsed_time": "2 days, 8:49:20", "remaining_time": "1 day, 6:17:47", "throughput": 27763.3, "total_tokens": 5679282880} +{"current_steps": 19360, "total_steps": 29667, "loss": 0.352, "lr": 2.9180946533435366e-05, "epoch": 1.957785292165724, "percentage": 65.26, "elapsed_time": "2 days, 8:51:19", "remaining_time": "1 day, 6:16:08", "throughput": 27762.03, "total_tokens": 5682330496} +{"current_steps": 19370, "total_steps": 29667, "loss": 0.352, "lr": 2.9175978126109853e-05, "epoch": 1.9587965742818318, "percentage": 65.29, "elapsed_time": "2 days, 8:53:05", "remaining_time": "1 day, 6:14:23", "throughput": 27761.95, "total_tokens": 5685251328} +{"current_steps": 19380, "total_steps": 29667, "loss": 0.3541, "lr": 2.9171012255713885e-05, "epoch": 1.9598078563979395, "percentage": 65.33, "elapsed_time": "2 days, 8:54:52", "remaining_time": "1 day, 6:12:38", "throughput": 27761.91, "total_tokens": 5688220032} +{"current_steps": 19390, "total_steps": 29667, "loss": 0.3529, "lr": 2.9166048920089217e-05, "epoch": 1.9608191385140472, "percentage": 65.36, "elapsed_time": "2 days, 8:56:37", "remaining_time": "1 day, 6:10:51", "throughput": 27762.09, "total_tokens": 5691165312} +{"current_steps": 19400, "total_steps": 29667, "loss": 0.3502, "lr": 2.9161088117080175e-05, "epoch": 1.9618304206301551, "percentage": 65.39, "elapsed_time": "2 days, 8:58:19", "remaining_time": "1 day, 6:09:04", "throughput": 27762.56, "total_tokens": 5694082560} +{"current_steps": 19410, "total_steps": 29667, "loss": 0.3516, "lr": 2.9156129844533658e-05, "epoch": 1.962841702746263, "percentage": 65.43, "elapsed_time": "2 days, 9:00:05", "remaining_time": "1 day, 6:07:18", "throughput": 27762.52, "total_tokens": 5697022272} +{"current_steps": 19420, "total_steps": 29667, "loss": 0.3504, "lr": 2.9151174100299104e-05, "epoch": 1.963852984862371, "percentage": 65.46, "elapsed_time": "2 days, 9:01:46", "remaining_time": "1 day, 6:05:30", "throughput": 27763.16, "total_tokens": 
5699964480} +{"current_steps": 19430, "total_steps": 29667, "loss": 0.3532, "lr": 2.9146220882228535e-05, "epoch": 1.9648642669784786, "percentage": 65.49, "elapsed_time": "2 days, 9:03:31", "remaining_time": "1 day, 6:03:44", "throughput": 27763.29, "total_tokens": 5702909376} +{"current_steps": 19440, "total_steps": 29667, "loss": 0.3511, "lr": 2.914127018817651e-05, "epoch": 1.9658755490945865, "percentage": 65.53, "elapsed_time": "2 days, 9:05:14", "remaining_time": "1 day, 6:01:57", "throughput": 27763.64, "total_tokens": 5705838080} +{"current_steps": 19450, "total_steps": 29667, "loss": 0.3543, "lr": 2.9136322016000152e-05, "epoch": 1.9668868312106942, "percentage": 65.56, "elapsed_time": "2 days, 9:07:02", "remaining_time": "1 day, 6:00:12", "throughput": 27763.27, "total_tokens": 5708743360} +{"current_steps": 19460, "total_steps": 29667, "loss": 0.353, "lr": 2.9131376363559116e-05, "epoch": 1.967898113326802, "percentage": 65.59, "elapsed_time": "2 days, 9:08:54", "remaining_time": "1 day, 5:58:30", "throughput": 27762.26, "total_tokens": 5711667456} +{"current_steps": 19470, "total_steps": 29667, "loss": 0.3493, "lr": 2.9126433228715606e-05, "epoch": 1.96890939544291, "percentage": 65.63, "elapsed_time": "2 days, 9:10:43", "remaining_time": "1 day, 5:56:46", "throughput": 27762.0, "total_tokens": 5714635904} +{"current_steps": 19480, "total_steps": 29667, "loss": 0.3497, "lr": 2.9121492609334354e-05, "epoch": 1.969920677559018, "percentage": 65.66, "elapsed_time": "2 days, 9:12:29", "remaining_time": "1 day, 5:55:00", "throughput": 27762.15, "total_tokens": 5717613440} +{"current_steps": 19490, "total_steps": 29667, "loss": 0.3535, "lr": 2.9116554503282656e-05, "epoch": 1.9709319596751256, "percentage": 65.7, "elapsed_time": "2 days, 9:14:15", "remaining_time": "1 day, 5:53:14", "throughput": 27762.3, "total_tokens": 5720569728} +{"current_steps": 19500, "total_steps": 29667, "loss": 0.3562, "lr": 2.9111618908430303e-05, "epoch": 1.9719432417912335, 
"percentage": 65.73, "elapsed_time": "2 days, 9:16:05", "remaining_time": "1 day, 5:51:31", "throughput": 27761.75, "total_tokens": 5723527680} +{"current_steps": 19510, "total_steps": 29667, "loss": 0.3504, "lr": 2.9106685822649643e-05, "epoch": 1.9729545239073412, "percentage": 65.76, "elapsed_time": "2 days, 9:17:55", "remaining_time": "1 day, 5:49:47", "throughput": 27761.42, "total_tokens": 5726489408} +{"current_steps": 19520, "total_steps": 29667, "loss": 0.3538, "lr": 2.910175524381552e-05, "epoch": 1.973965806023449, "percentage": 65.8, "elapsed_time": "2 days, 9:19:37", "remaining_time": "1 day, 5:48:00", "throughput": 27761.8, "total_tokens": 5729403776} +{"current_steps": 19530, "total_steps": 29667, "loss": 0.351, "lr": 2.9096827169805318e-05, "epoch": 1.974977088139557, "percentage": 65.83, "elapsed_time": "2 days, 9:21:16", "remaining_time": "1 day, 5:46:11", "throughput": 27762.48, "total_tokens": 5732307392} +{"current_steps": 19540, "total_steps": 29667, "loss": 0.3521, "lr": 2.9091901598498923e-05, "epoch": 1.9759883702556649, "percentage": 65.86, "elapsed_time": "2 days, 9:23:00", "remaining_time": "1 day, 5:44:24", "throughput": 27762.81, "total_tokens": 5735246400} +{"current_steps": 19550, "total_steps": 29667, "loss": 0.3513, "lr": 2.9086978527778736e-05, "epoch": 1.9769996523717726, "percentage": 65.9, "elapsed_time": "2 days, 9:24:43", "remaining_time": "1 day, 5:42:37", "throughput": 27763.03, "total_tokens": 5738153984} +{"current_steps": 19560, "total_steps": 29667, "loss": 0.3547, "lr": 2.9082057955529668e-05, "epoch": 1.9780109344878805, "percentage": 65.93, "elapsed_time": "2 days, 9:26:25", "remaining_time": "1 day, 5:40:49", "throughput": 27763.44, "total_tokens": 5741068608} +{"current_steps": 19570, "total_steps": 29667, "loss": 0.3581, "lr": 2.907713987963914e-05, "epoch": 1.9790222166039881, "percentage": 65.97, "elapsed_time": "2 days, 9:28:13", "remaining_time": "1 day, 5:39:05", "throughput": 27763.23, "total_tokens": 
5744043136} +{"current_steps": 19580, "total_steps": 29667, "loss": 0.3555, "lr": 2.9072224297997058e-05, "epoch": 1.980033498720096, "percentage": 66.0, "elapsed_time": "2 days, 9:29:55", "remaining_time": "1 day, 5:37:17", "throughput": 27763.87, "total_tokens": 5746991040} +{"current_steps": 19590, "total_steps": 29667, "loss": 0.3532, "lr": 2.9067311208495834e-05, "epoch": 1.981044780836204, "percentage": 66.03, "elapsed_time": "2 days, 9:31:40", "remaining_time": "1 day, 5:35:31", "throughput": 27763.89, "total_tokens": 5749918656} +{"current_steps": 19600, "total_steps": 29667, "loss": 0.3526, "lr": 2.9062400609030372e-05, "epoch": 1.9820560629523118, "percentage": 66.07, "elapsed_time": "2 days, 9:33:24", "remaining_time": "1 day, 5:33:44", "throughput": 27764.23, "total_tokens": 5752875520} +{"current_steps": 19610, "total_steps": 29667, "loss": 0.3536, "lr": 2.905749249749806e-05, "epoch": 1.9830673450684195, "percentage": 66.1, "elapsed_time": "2 days, 9:35:09", "remaining_time": "1 day, 5:31:58", "throughput": 27764.5, "total_tokens": 5755837440} +{"current_steps": 19620, "total_steps": 29667, "loss": 0.3545, "lr": 2.905258687179878e-05, "epoch": 1.9840786271845274, "percentage": 66.13, "elapsed_time": "2 days, 9:36:54", "remaining_time": "1 day, 5:30:12", "throughput": 27764.57, "total_tokens": 5758761856} +{"current_steps": 19630, "total_steps": 29667, "loss": 0.3504, "lr": 2.904768372983488e-05, "epoch": 1.9850899093006351, "percentage": 66.17, "elapsed_time": "2 days, 9:38:36", "remaining_time": "1 day, 5:28:25", "throughput": 27765.02, "total_tokens": 5761696320} +{"current_steps": 19640, "total_steps": 29667, "loss": 0.3587, "lr": 2.90427830695112e-05, "epoch": 1.986101191416743, "percentage": 66.2, "elapsed_time": "2 days, 9:40:25", "remaining_time": "1 day, 5:26:41", "throughput": 27764.61, "total_tokens": 5764644928} +{"current_steps": 19650, "total_steps": 29667, "loss": 0.3565, "lr": 2.9037884888735044e-05, "epoch": 1.987112473532851, 
"percentage": 66.24, "elapsed_time": "2 days, 9:42:09", "remaining_time": "1 day, 5:24:54", "throughput": 27764.74, "total_tokens": 5767547456} +{"current_steps": 19660, "total_steps": 29667, "loss": 0.3516, "lr": 2.9032989185416194e-05, "epoch": 1.9881237556489588, "percentage": 66.27, "elapsed_time": "2 days, 9:43:57", "remaining_time": "1 day, 5:23:09", "throughput": 27764.77, "total_tokens": 5770550784} +{"current_steps": 19670, "total_steps": 29667, "loss": 0.3582, "lr": 2.9028095957466888e-05, "epoch": 1.9891350377650665, "percentage": 66.3, "elapsed_time": "2 days, 9:45:40", "remaining_time": "1 day, 5:21:22", "throughput": 27765.08, "total_tokens": 5773482304} +{"current_steps": 19680, "total_steps": 29667, "loss": 0.358, "lr": 2.9023205202801833e-05, "epoch": 1.9901463198811742, "percentage": 66.34, "elapsed_time": "2 days, 9:47:20", "remaining_time": "1 day, 5:19:34", "throughput": 27765.85, "total_tokens": 5776413056} +{"current_steps": 19690, "total_steps": 29667, "loss": 0.359, "lr": 2.90183169193382e-05, "epoch": 1.991157601997282, "percentage": 66.37, "elapsed_time": "2 days, 9:49:03", "remaining_time": "1 day, 5:17:47", "throughput": 27766.08, "total_tokens": 5779340160} +{"current_steps": 19700, "total_steps": 29667, "loss": 0.3493, "lr": 2.90134311049956e-05, "epoch": 1.99216888411339, "percentage": 66.4, "elapsed_time": "2 days, 9:50:47", "remaining_time": "1 day, 5:16:00", "throughput": 27766.23, "total_tokens": 5782241856} +{"current_steps": 19710, "total_steps": 29667, "loss": 0.3521, "lr": 2.90085477576961e-05, "epoch": 1.993180166229498, "percentage": 66.44, "elapsed_time": "2 days, 9:52:33", "remaining_time": "1 day, 5:14:14", "throughput": 27766.11, "total_tokens": 5785155584} +{"current_steps": 19720, "total_steps": 29667, "loss": 0.3545, "lr": 2.9003666875364226e-05, "epoch": 1.9941914483456058, "percentage": 66.47, "elapsed_time": "2 days, 9:54:19", "remaining_time": "1 day, 5:12:29", "throughput": 27766.25, "total_tokens": 5788138944} 
+{"current_steps": 19730, "total_steps": 29667, "loss": 0.3537, "lr": 2.899878845592694e-05, "epoch": 1.9952027304617135, "percentage": 66.5, "elapsed_time": "2 days, 9:56:06", "remaining_time": "1 day, 5:10:44", "throughput": 27765.88, "total_tokens": 5791044736} +{"current_steps": 19740, "total_steps": 29667, "loss": 0.3546, "lr": 2.8993912497313636e-05, "epoch": 1.9962140125778212, "percentage": 66.54, "elapsed_time": "2 days, 9:57:57", "remaining_time": "1 day, 5:09:01", "throughput": 27765.17, "total_tokens": 5793979712} +{"current_steps": 19750, "total_steps": 29667, "loss": 0.3549, "lr": 2.8989038997456153e-05, "epoch": 1.997225294693929, "percentage": 66.57, "elapsed_time": "2 days, 9:59:43", "remaining_time": "1 day, 5:07:15", "throughput": 27765.37, "total_tokens": 5796948608} +{"current_steps": 19760, "total_steps": 29667, "loss": 0.3555, "lr": 2.898416795428876e-05, "epoch": 1.998236576810037, "percentage": 66.61, "elapsed_time": "2 days, 10:01:28", "remaining_time": "1 day, 5:05:29", "throughput": 27765.56, "total_tokens": 5799918784} +{"current_steps": 19770, "total_steps": 29667, "loss": 0.354, "lr": 2.897929936574816e-05, "epoch": 1.9992478589261449, "percentage": 66.64, "elapsed_time": "2 days, 10:03:14", "remaining_time": "1 day, 5:03:44", "throughput": 27765.51, "total_tokens": 5802841920} +{"current_steps": 19780, "total_steps": 29667, "loss": 0.3509, "lr": 2.8974433229773478e-05, "epoch": 2.0002022564232216, "percentage": 66.67, "elapsed_time": "2 days, 10:04:56", "remaining_time": "1 day, 5:01:56", "throughput": 27765.16, "total_tokens": 5805589760} +{"current_steps": 19790, "total_steps": 29667, "loss": 0.3422, "lr": 2.896956954430625e-05, "epoch": 2.0012135385393295, "percentage": 66.71, "elapsed_time": "2 days, 10:06:41", "remaining_time": "1 day, 5:00:10", "throughput": 27765.09, "total_tokens": 5808489216} +{"current_steps": 19800, "total_steps": 29667, "loss": 0.3479, "lr": 2.896470830729045e-05, "epoch": 2.0022248206554374, 
"percentage": 66.74, "elapsed_time": "2 days, 10:08:29", "remaining_time": "1 day, 4:58:25", "throughput": 27764.69, "total_tokens": 5811418944} +{"current_steps": 19810, "total_steps": 29667, "loss": 0.3453, "lr": 2.895984951667245e-05, "epoch": 2.003236102771545, "percentage": 66.77, "elapsed_time": "2 days, 10:10:08", "remaining_time": "1 day, 4:56:36", "throughput": 27765.42, "total_tokens": 5814321536} +{"current_steps": 19820, "total_steps": 29667, "loss": 0.3457, "lr": 2.8954993170401047e-05, "epoch": 2.0042473848876527, "percentage": 66.81, "elapsed_time": "2 days, 10:11:49", "remaining_time": "1 day, 4:54:48", "throughput": 27766.07, "total_tokens": 5817265536} +{"current_steps": 19830, "total_steps": 29667, "loss": 0.349, "lr": 2.8950139266427423e-05, "epoch": 2.0052586670037607, "percentage": 66.84, "elapsed_time": "2 days, 10:13:37", "remaining_time": "1 day, 4:53:04", "throughput": 27765.79, "total_tokens": 5820190784} +{"current_steps": 19840, "total_steps": 29667, "loss": 0.3481, "lr": 2.8945287802705186e-05, "epoch": 2.0062699491198686, "percentage": 66.88, "elapsed_time": "2 days, 10:15:33", "remaining_time": "1 day, 4:51:23", "throughput": 27764.48, "total_tokens": 5823142912} +{"current_steps": 19850, "total_steps": 29667, "loss": 0.3418, "lr": 2.8940438777190336e-05, "epoch": 2.0072812312359765, "percentage": 66.91, "elapsed_time": "2 days, 10:17:34", "remaining_time": "1 day, 4:49:45", "throughput": 27762.19, "total_tokens": 5826026560} +{"current_steps": 19860, "total_steps": 29667, "loss": 0.3471, "lr": 2.8935592187841265e-05, "epoch": 2.0082925133520844, "percentage": 66.94, "elapsed_time": "2 days, 10:19:21", "remaining_time": "1 day, 4:48:00", "throughput": 27762.03, "total_tokens": 5828969536} +{"current_steps": 19870, "total_steps": 29667, "loss": 0.349, "lr": 2.893074803261876e-05, "epoch": 2.009303795468192, "percentage": 66.98, "elapsed_time": "2 days, 10:21:10", "remaining_time": "1 day, 4:46:16", "throughput": 27761.6, 
"total_tokens": 5831896384} +{"current_steps": 19880, "total_steps": 29667, "loss": 0.3443, "lr": 2.8925906309485995e-05, "epoch": 2.0103150775842997, "percentage": 67.01, "elapsed_time": "2 days, 10:22:58", "remaining_time": "1 day, 4:44:31", "throughput": 27761.09, "total_tokens": 5834772992} +{"current_steps": 19890, "total_steps": 29667, "loss": 0.3501, "lr": 2.8921067016408532e-05, "epoch": 2.0113263597004076, "percentage": 67.04, "elapsed_time": "2 days, 10:24:44", "remaining_time": "1 day, 4:42:45", "throughput": 27760.95, "total_tokens": 5837688448} +{"current_steps": 19900, "total_steps": 29667, "loss": 0.3392, "lr": 2.8916230151354316e-05, "epoch": 2.0123376418165155, "percentage": 67.08, "elapsed_time": "2 days, 10:26:32", "remaining_time": "1 day, 4:41:01", "throughput": 27760.39, "total_tokens": 5840564800} +{"current_steps": 19910, "total_steps": 29667, "loss": 0.3503, "lr": 2.8911395712293677e-05, "epoch": 2.0133489239326234, "percentage": 67.11, "elapsed_time": "2 days, 10:28:27", "remaining_time": "1 day, 4:39:20", "throughput": 27758.68, "total_tokens": 5843421056} +{"current_steps": 19920, "total_steps": 29667, "loss": 0.3477, "lr": 2.8906563697199294e-05, "epoch": 2.0143602060487313, "percentage": 67.15, "elapsed_time": "2 days, 10:30:14", "remaining_time": "1 day, 4:37:35", "throughput": 27758.62, "total_tokens": 5846364736} +{"current_steps": 19930, "total_steps": 29667, "loss": 0.3455, "lr": 2.8901734104046245e-05, "epoch": 2.015371488164839, "percentage": 67.18, "elapsed_time": "2 days, 10:32:11", "remaining_time": "1 day, 4:35:54", "throughput": 27756.8, "total_tokens": 5849229888} +{"current_steps": 19940, "total_steps": 29667, "loss": 0.3472, "lr": 2.8896906930811964e-05, "epoch": 2.0163827702809467, "percentage": 67.21, "elapsed_time": "2 days, 10:34:10", "remaining_time": "1 day, 4:34:15", "throughput": 27754.92, "total_tokens": 5852128192} +{"current_steps": 19950, "total_steps": 29667, "loss": 0.3459, "lr": 2.8892082175476243e-05, 
"epoch": 2.0173940523970546, "percentage": 67.25, "elapsed_time": "2 days, 10:35:59", "remaining_time": "1 day, 4:32:31", "throughput": 27754.66, "total_tokens": 5855101888} +{"current_steps": 19960, "total_steps": 29667, "loss": 0.3517, "lr": 2.8887259836021246e-05, "epoch": 2.0184053345131625, "percentage": 67.28, "elapsed_time": "2 days, 10:37:47", "remaining_time": "1 day, 4:30:46", "throughput": 27754.4, "total_tokens": 5858037760} +{"current_steps": 19970, "total_steps": 29667, "loss": 0.347, "lr": 2.8882439910431493e-05, "epoch": 2.0194166166292704, "percentage": 67.31, "elapsed_time": "2 days, 10:39:51", "remaining_time": "1 day, 4:29:10", "throughput": 27751.85, "total_tokens": 5860957888} +{"current_steps": 19980, "total_steps": 29667, "loss": 0.344, "lr": 2.8877622396693843e-05, "epoch": 2.0204278987453783, "percentage": 67.35, "elapsed_time": "2 days, 10:41:51", "remaining_time": "1 day, 4:27:30", "throughput": 27749.97, "total_tokens": 5863877760} +{"current_steps": 19990, "total_steps": 29667, "loss": 0.3445, "lr": 2.8872807292797516e-05, "epoch": 2.0214391808614858, "percentage": 67.38, "elapsed_time": "2 days, 10:43:43", "remaining_time": "1 day, 4:25:48", "throughput": 27749.04, "total_tokens": 5866806208} +{"current_steps": 20000, "total_steps": 29667, "loss": 0.3435, "lr": 2.8867994596734084e-05, "epoch": 2.0224504629775937, "percentage": 67.41, "elapsed_time": "2 days, 10:45:44", "remaining_time": "1 day, 4:24:10", "throughput": 27747.31, "total_tokens": 5869796224} +{"current_steps": 20000, "total_steps": 29667, "eval_loss": 0.3307909369468689, "epoch": 2.0224504629775937, "percentage": 67.41, "elapsed_time": "2 days, 10:45:46", "remaining_time": "1 day, 4:24:10", "throughput": 27747.08, "total_tokens": 5869796224} +{"current_steps": 20010, "total_steps": 29667, "loss": 0.3436, "lr": 2.8863184306497437e-05, "epoch": 2.0234617450937016, "percentage": 67.45, "elapsed_time": "2 days, 10:49:30", "remaining_time": "1 day, 4:23:22", "throughput": 
27731.66, "total_tokens": 5872739584} +{"current_steps": 20020, "total_steps": 29667, "loss": 0.3434, "lr": 2.8858376420083848e-05, "epoch": 2.0244730272098095, "percentage": 67.48, "elapsed_time": "2 days, 10:51:32", "remaining_time": "1 day, 4:21:44", "throughput": 27729.21, "total_tokens": 5875615680} +{"current_steps": 20030, "total_steps": 29667, "loss": 0.3394, "lr": 2.8853570935491873e-05, "epoch": 2.0254843093259174, "percentage": 67.52, "elapsed_time": "2 days, 10:53:41", "remaining_time": "1 day, 4:20:09", "throughput": 27726.4, "total_tokens": 5878589888} +{"current_steps": 20040, "total_steps": 29667, "loss": 0.3469, "lr": 2.8848767850722447e-05, "epoch": 2.0264955914420253, "percentage": 67.55, "elapsed_time": "2 days, 10:55:54", "remaining_time": "1 day, 4:18:36", "throughput": 27722.68, "total_tokens": 5881493824} +{"current_steps": 20050, "total_steps": 29667, "loss": 0.3498, "lr": 2.88439671637788e-05, "epoch": 2.0275068735581327, "percentage": 67.58, "elapsed_time": "2 days, 10:57:55", "remaining_time": "1 day, 4:16:57", "throughput": 27720.8, "total_tokens": 5884435264} +{"current_steps": 20060, "total_steps": 29667, "loss": 0.3462, "lr": 2.8839168872666505e-05, "epoch": 2.0285181556742407, "percentage": 67.62, "elapsed_time": "2 days, 10:59:56", "remaining_time": "1 day, 4:15:19", "throughput": 27718.87, "total_tokens": 5887391616} +{"current_steps": 20070, "total_steps": 29667, "loss": 0.351, "lr": 2.8834372975393448e-05, "epoch": 2.0295294377903486, "percentage": 67.65, "elapsed_time": "2 days, 11:01:53", "remaining_time": "1 day, 4:13:39", "throughput": 27717.28, "total_tokens": 5890304384} +{"current_steps": 20080, "total_steps": 29667, "loss": 0.3431, "lr": 2.8829579469969843e-05, "epoch": 2.0305407199064565, "percentage": 67.68, "elapsed_time": "2 days, 11:03:48", "remaining_time": "1 day, 4:11:57", "throughput": 27716.26, "total_tokens": 5893277888} +{"current_steps": 20090, "total_steps": 29667, "loss": 0.3502, "lr": 
2.88247883544082e-05, "epoch": 2.0315520020225644, "percentage": 67.72, "elapsed_time": "2 days, 11:05:37", "remaining_time": "1 day, 4:10:13", "throughput": 27715.93, "total_tokens": 5896232320} +{"current_steps": 20100, "total_steps": 29667, "loss": 0.3497, "lr": 2.8819999626723366e-05, "epoch": 2.0325632841386723, "percentage": 67.75, "elapsed_time": "2 days, 11:07:26", "remaining_time": "1 day, 4:08:28", "throughput": 27715.52, "total_tokens": 5899153856} +{"current_steps": 20110, "total_steps": 29667, "loss": 0.3431, "lr": 2.881521328493248e-05, "epoch": 2.0335745662547797, "percentage": 67.79, "elapsed_time": "2 days, 11:09:22", "remaining_time": "1 day, 4:06:47", "throughput": 27714.09, "total_tokens": 5902059520} +{"current_steps": 20120, "total_steps": 29667, "loss": 0.3493, "lr": 2.881042932705499e-05, "epoch": 2.0345858483708876, "percentage": 67.82, "elapsed_time": "2 days, 11:11:49", "remaining_time": "1 day, 4:05:20", "throughput": 27708.82, "total_tokens": 5905004864} +{"current_steps": 20130, "total_steps": 29667, "loss": 0.3475, "lr": 2.8805647751112635e-05, "epoch": 2.0355971304869955, "percentage": 67.85, "elapsed_time": "2 days, 11:13:53", "remaining_time": "1 day, 4:03:43", "throughput": 27706.48, "total_tokens": 5907959936} +{"current_steps": 20140, "total_steps": 29667, "loss": 0.3496, "lr": 2.8800868555129462e-05, "epoch": 2.0366084126031034, "percentage": 67.89, "elapsed_time": "2 days, 11:16:07", "remaining_time": "1 day, 4:02:11", "throughput": 27703.23, "total_tokens": 5910971200} +{"current_steps": 20150, "total_steps": 29667, "loss": 0.3494, "lr": 2.8796091737131814e-05, "epoch": 2.0376196947192113, "percentage": 67.92, "elapsed_time": "2 days, 11:18:12", "remaining_time": "1 day, 4:00:34", "throughput": 27700.92, "total_tokens": 5913938304} +{"current_steps": 20160, "total_steps": 29667, "loss": 0.3477, "lr": 2.8791317295148322e-05, "epoch": 2.0386309768353192, "percentage": 67.95, "elapsed_time": "2 days, 11:20:13", "remaining_time": 
"1 day, 3:58:55", "throughput": 27699.23, "total_tokens": 5916915776} +{"current_steps": 20170, "total_steps": 29667, "loss": 0.3477, "lr": 2.8786545227209893e-05, "epoch": 2.0396422589514267, "percentage": 67.99, "elapsed_time": "2 days, 11:22:06", "remaining_time": "1 day, 3:57:12", "throughput": 27698.23, "total_tokens": 5919853888} +{"current_steps": 20180, "total_steps": 29667, "loss": 0.3488, "lr": 2.8781775531349742e-05, "epoch": 2.0406535410675346, "percentage": 68.02, "elapsed_time": "2 days, 11:24:02", "remaining_time": "1 day, 3:55:31", "throughput": 27697.21, "total_tokens": 5922832448} +{"current_steps": 20190, "total_steps": 29667, "loss": 0.3488, "lr": 2.8777008205603334e-05, "epoch": 2.0416648231836425, "percentage": 68.06, "elapsed_time": "2 days, 11:26:38", "remaining_time": "1 day, 3:54:09", "throughput": 27690.73, "total_tokens": 5925780096} +{"current_steps": 20200, "total_steps": 29667, "loss": 0.3523, "lr": 2.877224324800844e-05, "epoch": 2.0426761052997504, "percentage": 68.09, "elapsed_time": "2 days, 11:28:55", "remaining_time": "1 day, 3:52:37", "throughput": 27686.61, "total_tokens": 5928686272} +{"current_steps": 20210, "total_steps": 29667, "loss": 0.3436, "lr": 2.8767480656605078e-05, "epoch": 2.0436873874158583, "percentage": 68.12, "elapsed_time": "2 days, 11:31:15", "remaining_time": "1 day, 3:51:07", "throughput": 27682.13, "total_tokens": 5931596160} +{"current_steps": 20220, "total_steps": 29667, "loss": 0.3426, "lr": 2.8762720429435556e-05, "epoch": 2.044698669531966, "percentage": 68.16, "elapsed_time": "2 days, 11:33:22", "remaining_time": "1 day, 3:49:31", "throughput": 27679.67, "total_tokens": 5934603264} +{"current_steps": 20230, "total_steps": 29667, "loss": 0.3489, "lr": 2.8757962564544448e-05, "epoch": 2.0457099516480737, "percentage": 68.19, "elapsed_time": "2 days, 11:35:20", "remaining_time": "1 day, 3:47:50", "throughput": 27678.12, "total_tokens": 5937517632} +{"current_steps": 20240, "total_steps": 29667, "loss": 
0.3457, "lr": 2.8753207059978586e-05, "epoch": 2.0467212337641816, "percentage": 68.22, "elapsed_time": "2 days, 11:37:15", "remaining_time": "1 day, 3:46:08", "throughput": 27676.95, "total_tokens": 5940446272} +{"current_steps": 20250, "total_steps": 29667, "loss": 0.3485, "lr": 2.874845391378706e-05, "epoch": 2.0477325158802895, "percentage": 68.26, "elapsed_time": "2 days, 11:39:05", "remaining_time": "1 day, 3:44:24", "throughput": 27676.47, "total_tokens": 5943387136} +{"current_steps": 20260, "total_steps": 29667, "loss": 0.3491, "lr": 2.874370312402121e-05, "epoch": 2.0487437979963974, "percentage": 68.29, "elapsed_time": "2 days, 11:40:54", "remaining_time": "1 day, 3:42:39", "throughput": 27675.99, "total_tokens": 5946296896} +{"current_steps": 20270, "total_steps": 29667, "loss": 0.3448, "lr": 2.8738954688734647e-05, "epoch": 2.0497550801125053, "percentage": 68.33, "elapsed_time": "2 days, 11:43:08", "remaining_time": "1 day, 3:41:06", "throughput": 27671.98, "total_tokens": 5949158080} +{"current_steps": 20280, "total_steps": 29667, "loss": 0.3491, "lr": 2.8734208605983226e-05, "epoch": 2.0507663622286127, "percentage": 68.36, "elapsed_time": "2 days, 11:45:14", "remaining_time": "1 day, 3:39:30", "throughput": 27669.41, "total_tokens": 5952096832} +{"current_steps": 20290, "total_steps": 29667, "loss": 0.3436, "lr": 2.8729464873825035e-05, "epoch": 2.0517776443447207, "percentage": 68.39, "elapsed_time": "2 days, 11:47:42", "remaining_time": "1 day, 3:38:03", "throughput": 27664.15, "total_tokens": 5955056768} +{"current_steps": 20300, "total_steps": 29667, "loss": 0.3457, "lr": 2.8724723490320427e-05, "epoch": 2.0527889264608286, "percentage": 68.43, "elapsed_time": "2 days, 11:49:49", "remaining_time": "1 day, 3:36:27", "throughput": 27661.56, "total_tokens": 5958022144} +{"current_steps": 20310, "total_steps": 29667, "loss": 0.3467, "lr": 2.8719984453531983e-05, "epoch": 2.0538002085769365, "percentage": 68.46, "elapsed_time": "2 days, 11:51:43", 
"remaining_time": "1 day, 3:34:44", "throughput": 27660.77, "total_tokens": 5960987200} +{"current_steps": 20320, "total_steps": 29667, "loss": 0.3491, "lr": 2.871524776152452e-05, "epoch": 2.0548114906930444, "percentage": 68.49, "elapsed_time": "2 days, 11:53:42", "remaining_time": "1 day, 3:33:04", "throughput": 27658.64, "total_tokens": 5963834304} +{"current_steps": 20330, "total_steps": 29667, "loss": 0.3467, "lr": 2.8710513412365093e-05, "epoch": 2.0558227728091523, "percentage": 68.53, "elapsed_time": "2 days, 11:55:52", "remaining_time": "1 day, 3:31:28", "throughput": 27655.6, "total_tokens": 5966759104} +{"current_steps": 20340, "total_steps": 29667, "loss": 0.345, "lr": 2.8705781404122977e-05, "epoch": 2.0568340549252597, "percentage": 68.56, "elapsed_time": "2 days, 11:57:42", "remaining_time": "1 day, 3:29:44", "throughput": 27655.12, "total_tokens": 5969713216} +{"current_steps": 20350, "total_steps": 29667, "loss": 0.3469, "lr": 2.87010517348697e-05, "epoch": 2.0578453370413676, "percentage": 68.59, "elapsed_time": "2 days, 11:59:37", "remaining_time": "1 day, 3:28:02", "throughput": 27654.14, "total_tokens": 5972662144} +{"current_steps": 20360, "total_steps": 29667, "loss": 0.3475, "lr": 2.8696324402678976e-05, "epoch": 2.0588566191574755, "percentage": 68.63, "elapsed_time": "2 days, 12:01:42", "remaining_time": "1 day, 3:26:25", "throughput": 27651.67, "total_tokens": 5975603712} +{"current_steps": 20370, "total_steps": 29667, "loss": 0.3457, "lr": 2.8691599405626764e-05, "epoch": 2.0598679012735834, "percentage": 68.66, "elapsed_time": "2 days, 12:03:53", "remaining_time": "1 day, 3:24:50", "throughput": 27648.32, "total_tokens": 5978497472} +{"current_steps": 20380, "total_steps": 29667, "loss": 0.3481, "lr": 2.8686876741791234e-05, "epoch": 2.0608791833896913, "percentage": 68.7, "elapsed_time": "2 days, 12:06:29", "remaining_time": "1 day, 3:23:26", "throughput": 27642.01, "total_tokens": 5981437760} +{"current_steps": 20390, "total_steps": 
29667, "loss": 0.3475, "lr": 2.8682156409252775e-05, "epoch": 2.0618904655057992, "percentage": 68.73, "elapsed_time": "2 days, 12:08:31", "remaining_time": "1 day, 3:21:48", "throughput": 27640.06, "total_tokens": 5984395520} +{"current_steps": 20400, "total_steps": 29667, "loss": 0.3494, "lr": 2.8677438406093976e-05, "epoch": 2.0629017476219067, "percentage": 68.76, "elapsed_time": "2 days, 12:10:22", "remaining_time": "1 day, 3:20:03", "throughput": 27639.62, "total_tokens": 5987350784} +{"current_steps": 20410, "total_steps": 29667, "loss": 0.3388, "lr": 2.867272273039964e-05, "epoch": 2.0639130297380146, "percentage": 68.8, "elapsed_time": "2 days, 12:12:08", "remaining_time": "1 day, 3:18:17", "throughput": 27639.41, "total_tokens": 5990261504} +{"current_steps": 20420, "total_steps": 29667, "loss": 0.3498, "lr": 2.8668009380256765e-05, "epoch": 2.0649243118541225, "percentage": 68.83, "elapsed_time": "2 days, 12:13:58", "remaining_time": "1 day, 3:16:33", "throughput": 27638.68, "total_tokens": 5993127552} +{"current_steps": 20430, "total_steps": 29667, "loss": 0.3505, "lr": 2.8663298353754574e-05, "epoch": 2.0659355939702304, "percentage": 68.86, "elapsed_time": "2 days, 12:15:45", "remaining_time": "1 day, 3:14:47", "throughput": 27638.43, "total_tokens": 5996036992} +{"current_steps": 20440, "total_steps": 29667, "loss": 0.3448, "lr": 2.865858964898445e-05, "epoch": 2.0669468760863383, "percentage": 68.9, "elapsed_time": "2 days, 12:17:32", "remaining_time": "1 day, 3:13:01", "throughput": 27638.32, "total_tokens": 5998972096} +{"current_steps": 20450, "total_steps": 29667, "loss": 0.3491, "lr": 2.8653883264040004e-05, "epoch": 2.067958158202446, "percentage": 68.93, "elapsed_time": "2 days, 12:19:22", "remaining_time": "1 day, 3:11:17", "throughput": 27637.98, "total_tokens": 6001939776} +{"current_steps": 20460, "total_steps": 29667, "loss": 0.3509, "lr": 2.8649179197017017e-05, "epoch": 2.0689694403185537, "percentage": 68.97, "elapsed_time": "2 days, 
12:21:12", "remaining_time": "1 day, 3:09:32", "throughput": 27637.57, "total_tokens": 6004885056} +{"current_steps": 20470, "total_steps": 29667, "loss": 0.3459, "lr": 2.864447744601347e-05, "epoch": 2.0699807224346616, "percentage": 69.0, "elapsed_time": "2 days, 12:22:57", "remaining_time": "1 day, 3:07:46", "throughput": 27637.57, "total_tokens": 6007793024} +{"current_steps": 20480, "total_steps": 29667, "loss": 0.3486, "lr": 2.8639778009129507e-05, "epoch": 2.0709920045507695, "percentage": 69.03, "elapsed_time": "2 days, 12:24:47", "remaining_time": "1 day, 3:06:01", "throughput": 27637.28, "total_tokens": 6010769280} +{"current_steps": 20490, "total_steps": 29667, "loss": 0.3415, "lr": 2.8635080884467492e-05, "epoch": 2.0720032866668774, "percentage": 69.07, "elapsed_time": "2 days, 12:26:32", "remaining_time": "1 day, 3:04:14", "throughput": 27637.52, "total_tokens": 6013710208} +{"current_steps": 20500, "total_steps": 29667, "loss": 0.3383, "lr": 2.8630386070131927e-05, "epoch": 2.0730145687829853, "percentage": 69.1, "elapsed_time": "2 days, 12:28:21", "remaining_time": "1 day, 3:02:29", "throughput": 27637.08, "total_tokens": 6016632768} +{"current_steps": 20510, "total_steps": 29667, "loss": 0.3508, "lr": 2.8625693564229507e-05, "epoch": 2.074025850899093, "percentage": 69.13, "elapsed_time": "2 days, 12:30:07", "remaining_time": "1 day, 3:00:43", "throughput": 27636.74, "total_tokens": 6019483648} +{"current_steps": 20520, "total_steps": 29667, "loss": 0.3496, "lr": 2.8621003364869102e-05, "epoch": 2.0750371330152007, "percentage": 69.17, "elapsed_time": "2 days, 12:31:52", "remaining_time": "1 day, 2:58:56", "throughput": 27636.86, "total_tokens": 6022418240} +{"current_steps": 20530, "total_steps": 29667, "loss": 0.3516, "lr": 2.8616315470161738e-05, "epoch": 2.0760484151313086, "percentage": 69.2, "elapsed_time": "2 days, 12:33:39", "remaining_time": "1 day, 2:57:10", "throughput": 27636.74, "total_tokens": 6025352512} +{"current_steps": 20540, 
"total_steps": 29667, "loss": 0.3472, "lr": 2.8611629878220624e-05, "epoch": 2.0770596972474165, "percentage": 69.24, "elapsed_time": "2 days, 12:35:27", "remaining_time": "1 day, 2:55:25", "throughput": 27636.48, "total_tokens": 6028288832} +{"current_steps": 20550, "total_steps": 29667, "loss": 0.3484, "lr": 2.8606946587161116e-05, "epoch": 2.0780709793635244, "percentage": 69.27, "elapsed_time": "2 days, 12:37:16", "remaining_time": "1 day, 2:53:40", "throughput": 27636.14, "total_tokens": 6031222400} +{"current_steps": 20560, "total_steps": 29667, "loss": 0.3477, "lr": 2.860226559510072e-05, "epoch": 2.0790822614796323, "percentage": 69.3, "elapsed_time": "2 days, 12:39:02", "remaining_time": "1 day, 2:51:54", "throughput": 27636.32, "total_tokens": 6034197824} +{"current_steps": 20570, "total_steps": 29667, "loss": 0.347, "lr": 2.859758690015913e-05, "epoch": 2.08009354359574, "percentage": 69.34, "elapsed_time": "2 days, 12:40:49", "remaining_time": "1 day, 2:50:08", "throughput": 27636.35, "total_tokens": 6037153984} +{"current_steps": 20580, "total_steps": 29667, "loss": 0.3437, "lr": 2.8592910500458154e-05, "epoch": 2.0811048257118476, "percentage": 69.37, "elapsed_time": "2 days, 12:42:44", "remaining_time": "1 day, 2:48:25", "throughput": 27635.39, "total_tokens": 6040102080} +{"current_steps": 20590, "total_steps": 29667, "loss": 0.3439, "lr": 2.858823639412178e-05, "epoch": 2.0821161078279555, "percentage": 69.4, "elapsed_time": "2 days, 12:44:38", "remaining_time": "1 day, 2:46:43", "throughput": 27634.35, "total_tokens": 6043027264} +{"current_steps": 20600, "total_steps": 29667, "loss": 0.3496, "lr": 2.858356457927613e-05, "epoch": 2.0831273899440634, "percentage": 69.44, "elapsed_time": "2 days, 12:46:28", "remaining_time": "1 day, 2:44:58", "throughput": 27633.85, "total_tokens": 6045969728} +{"current_steps": 20610, "total_steps": 29667, "loss": 0.3435, "lr": 2.857889505404946e-05, "epoch": 2.0841386720601713, "percentage": 69.47, "elapsed_time": 
"2 days, 12:48:13", "remaining_time": "1 day, 2:43:12", "throughput": 27633.98, "total_tokens": 6048899008} +{"current_steps": 20620, "total_steps": 29667, "loss": 0.3439, "lr": 2.8574227816572184e-05, "epoch": 2.0851499541762792, "percentage": 69.5, "elapsed_time": "2 days, 12:50:02", "remaining_time": "1 day, 2:41:27", "throughput": 27633.71, "total_tokens": 6051861440} +{"current_steps": 20630, "total_steps": 29667, "loss": 0.3492, "lr": 2.856956286497684e-05, "epoch": 2.086161236292387, "percentage": 69.54, "elapsed_time": "2 days, 12:51:50", "remaining_time": "1 day, 2:39:41", "throughput": 27633.61, "total_tokens": 6054806080} +{"current_steps": 20640, "total_steps": 29667, "loss": 0.3506, "lr": 2.85649001973981e-05, "epoch": 2.0871725184084946, "percentage": 69.57, "elapsed_time": "2 days, 12:53:35", "remaining_time": "1 day, 2:37:54", "throughput": 27633.84, "total_tokens": 6057757440} +{"current_steps": 20650, "total_steps": 29667, "loss": 0.3441, "lr": 2.8560239811972754e-05, "epoch": 2.0881838005246025, "percentage": 69.61, "elapsed_time": "2 days, 12:55:24", "remaining_time": "1 day, 2:36:09", "throughput": 27633.76, "total_tokens": 6060749568} +{"current_steps": 20660, "total_steps": 29667, "loss": 0.3408, "lr": 2.855558170683976e-05, "epoch": 2.0891950826407104, "percentage": 69.64, "elapsed_time": "2 days, 12:57:07", "remaining_time": "1 day, 2:34:22", "throughput": 27634.09, "total_tokens": 6063675904} +{"current_steps": 20670, "total_steps": 29667, "loss": 0.3529, "lr": 2.855092588014017e-05, "epoch": 2.0902063647568183, "percentage": 69.67, "elapsed_time": "2 days, 12:58:50", "remaining_time": "1 day, 2:32:34", "throughput": 27634.31, "total_tokens": 6066582400} +{"current_steps": 20680, "total_steps": 29667, "loss": 0.3495, "lr": 2.854627233001715e-05, "epoch": 2.091217646872926, "percentage": 69.71, "elapsed_time": "2 days, 13:00:38", "remaining_time": "1 day, 2:30:49", "throughput": 27633.8, "total_tokens": 6069460608} +{"current_steps": 20690, 
"total_steps": 29667, "loss": 0.3487, "lr": 2.8541621054615992e-05, "epoch": 2.092228928989034, "percentage": 69.74, "elapsed_time": "2 days, 13:02:25", "remaining_time": "1 day, 2:29:03", "throughput": 27633.83, "total_tokens": 6072411456} +{"current_steps": 20700, "total_steps": 29667, "loss": 0.3525, "lr": 2.8536972052084122e-05, "epoch": 2.0932402111051416, "percentage": 69.77, "elapsed_time": "2 days, 13:04:17", "remaining_time": "1 day, 2:27:19", "throughput": 27633.02, "total_tokens": 6075336512} +{"current_steps": 20710, "total_steps": 29667, "loss": 0.35, "lr": 2.853232532057104e-05, "epoch": 2.0942514932212495, "percentage": 69.81, "elapsed_time": "2 days, 13:06:10", "remaining_time": "1 day, 2:25:36", "throughput": 27632.29, "total_tokens": 6078298944} +{"current_steps": 20720, "total_steps": 29667, "loss": 0.3491, "lr": 2.8527680858228395e-05, "epoch": 2.0952627753373574, "percentage": 69.84, "elapsed_time": "2 days, 13:07:52", "remaining_time": "1 day, 2:23:48", "throughput": 27632.92, "total_tokens": 6081240192} +{"current_steps": 20730, "total_steps": 29667, "loss": 0.3508, "lr": 2.8523038663209906e-05, "epoch": 2.0962740574534653, "percentage": 69.88, "elapsed_time": "2 days, 13:09:37", "remaining_time": "1 day, 2:22:01", "throughput": 27632.85, "total_tokens": 6084138112} +{"current_steps": 20740, "total_steps": 29667, "loss": 0.3453, "lr": 2.8518398733671427e-05, "epoch": 2.097285339569573, "percentage": 69.91, "elapsed_time": "2 days, 13:11:19", "remaining_time": "1 day, 2:20:13", "throughput": 27633.52, "total_tokens": 6087089152} +{"current_steps": 20750, "total_steps": 29667, "loss": 0.3489, "lr": 2.8513761067770877e-05, "epoch": 2.098296621685681, "percentage": 69.94, "elapsed_time": "2 days, 13:13:03", "remaining_time": "1 day, 2:18:26", "throughput": 27633.87, "total_tokens": 6090044224} +{"current_steps": 20760, "total_steps": 29667, "loss": 0.347, "lr": 2.85091256636683e-05, "epoch": 2.0993079038017886, "percentage": 69.98, 
"elapsed_time": "2 days, 13:14:43", "remaining_time": "1 day, 2:16:37", "throughput": 27634.67, "total_tokens": 6092981248} +{"current_steps": 20770, "total_steps": 29667, "loss": 0.3477, "lr": 2.850449251952582e-05, "epoch": 2.1003191859178965, "percentage": 70.01, "elapsed_time": "2 days, 13:16:24", "remaining_time": "1 day, 2:14:49", "throughput": 27635.22, "total_tokens": 6095910976} +{"current_steps": 20780, "total_steps": 29667, "loss": 0.3447, "lr": 2.849986163350766e-05, "epoch": 2.1013304680340044, "percentage": 70.04, "elapsed_time": "2 days, 13:18:05", "remaining_time": "1 day, 2:13:00", "throughput": 27635.95, "total_tokens": 6098843648} +{"current_steps": 20790, "total_steps": 29667, "loss": 0.3479, "lr": 2.8495233003780103e-05, "epoch": 2.1023417501501123, "percentage": 70.08, "elapsed_time": "2 days, 13:19:43", "remaining_time": "1 day, 2:11:11", "throughput": 27636.83, "total_tokens": 6101768448} +{"current_steps": 20800, "total_steps": 29667, "loss": 0.3437, "lr": 2.8490606628511557e-05, "epoch": 2.10335303226622, "percentage": 70.11, "elapsed_time": "2 days, 13:21:25", "remaining_time": "1 day, 2:09:23", "throughput": 27637.44, "total_tokens": 6104717696} +{"current_steps": 20810, "total_steps": 29667, "loss": 0.3478, "lr": 2.8485982505872476e-05, "epoch": 2.1043643143823276, "percentage": 70.15, "elapsed_time": "2 days, 13:23:04", "remaining_time": "1 day, 2:07:33", "throughput": 27638.24, "total_tokens": 6107634368} +{"current_steps": 20820, "total_steps": 29667, "loss": 0.3491, "lr": 2.8481360634035415e-05, "epoch": 2.1053755964984355, "percentage": 70.18, "elapsed_time": "2 days, 13:24:48", "remaining_time": "1 day, 2:05:46", "throughput": 27638.55, "total_tokens": 6110556224} +{"current_steps": 20830, "total_steps": 29667, "loss": 0.3475, "lr": 2.847674101117499e-05, "epoch": 2.1063868786145434, "percentage": 70.21, "elapsed_time": "2 days, 13:26:31", "remaining_time": "1 day, 2:03:59", "throughput": 27638.82, "total_tokens": 6113478592} 
+{"current_steps": 20840, "total_steps": 29667, "loss": 0.3443, "lr": 2.8472123635467896e-05, "epoch": 2.1073981607306513, "percentage": 70.25, "elapsed_time": "2 days, 13:28:16", "remaining_time": "1 day, 2:02:12", "throughput": 27638.86, "total_tokens": 6116392896} +{"current_steps": 20850, "total_steps": 29667, "loss": 0.346, "lr": 2.846750850509289e-05, "epoch": 2.1084094428467592, "percentage": 70.28, "elapsed_time": "2 days, 13:29:59", "remaining_time": "1 day, 2:00:24", "throughput": 27639.32, "total_tokens": 6119332032} +{"current_steps": 20860, "total_steps": 29667, "loss": 0.3513, "lr": 2.8462895618230813e-05, "epoch": 2.109420724962867, "percentage": 70.31, "elapsed_time": "2 days, 13:31:42", "remaining_time": "1 day, 1:58:37", "throughput": 27639.68, "total_tokens": 6122267712} +{"current_steps": 20870, "total_steps": 29667, "loss": 0.3473, "lr": 2.845828497306453e-05, "epoch": 2.1104320070789746, "percentage": 70.35, "elapsed_time": "2 days, 13:33:22", "remaining_time": "1 day, 1:56:48", "throughput": 27640.55, "total_tokens": 6125211264} +{"current_steps": 20880, "total_steps": 29667, "loss": 0.3483, "lr": 2.8453676567779018e-05, "epoch": 2.1114432891950825, "percentage": 70.38, "elapsed_time": "2 days, 13:35:01", "remaining_time": "1 day, 1:54:59", "throughput": 27641.45, "total_tokens": 6128144576} +{"current_steps": 20890, "total_steps": 29667, "loss": 0.3494, "lr": 2.8449070400561267e-05, "epoch": 2.1124545713111904, "percentage": 70.41, "elapsed_time": "2 days, 13:36:44", "remaining_time": "1 day, 1:53:11", "throughput": 27641.72, "total_tokens": 6131063232} +{"current_steps": 20900, "total_steps": 29667, "loss": 0.3462, "lr": 2.8444466469600343e-05, "epoch": 2.1134658534272983, "percentage": 70.45, "elapsed_time": "2 days, 13:38:24", "remaining_time": "1 day, 1:51:23", "throughput": 27642.56, "total_tokens": 6134015168} +{"current_steps": 20910, "total_steps": 29667, "loss": 0.3406, "lr": 2.8439864773087354e-05, "epoch": 2.114477135543406, 
"percentage": 70.48, "elapsed_time": "2 days, 13:40:01", "remaining_time": "1 day, 1:49:32", "throughput": 27643.57, "total_tokens": 6136908288} +{"current_steps": 20920, "total_steps": 29667, "loss": 0.3446, "lr": 2.8435265309215465e-05, "epoch": 2.115488417659514, "percentage": 70.52, "elapsed_time": "2 days, 13:41:40", "remaining_time": "1 day, 1:47:43", "throughput": 27644.31, "total_tokens": 6139817216} +{"current_steps": 20930, "total_steps": 29667, "loss": 0.3485, "lr": 2.843066807617987e-05, "epoch": 2.1164996997756216, "percentage": 70.55, "elapsed_time": "2 days, 13:43:22", "remaining_time": "1 day, 1:45:56", "throughput": 27644.75, "total_tokens": 6142742656} +{"current_steps": 20940, "total_steps": 29667, "loss": 0.3479, "lr": 2.8426073072177827e-05, "epoch": 2.1175109818917295, "percentage": 70.58, "elapsed_time": "2 days, 13:45:10", "remaining_time": "1 day, 1:44:10", "throughput": 27644.66, "total_tokens": 6145684672} +{"current_steps": 20950, "total_steps": 29667, "loss": 0.3455, "lr": 2.8421480295408616e-05, "epoch": 2.1185222640078374, "percentage": 70.62, "elapsed_time": "2 days, 13:46:50", "remaining_time": "1 day, 1:42:21", "throughput": 27645.53, "total_tokens": 6148654400} +{"current_steps": 20960, "total_steps": 29667, "loss": 0.349, "lr": 2.841688974407355e-05, "epoch": 2.1195335461239453, "percentage": 70.65, "elapsed_time": "2 days, 13:48:30", "remaining_time": "1 day, 1:40:33", "throughput": 27646.36, "total_tokens": 6151609024} +{"current_steps": 20970, "total_steps": 29667, "loss": 0.3491, "lr": 2.8412301416375984e-05, "epoch": 2.120544828240053, "percentage": 70.68, "elapsed_time": "2 days, 13:50:10", "remaining_time": "1 day, 1:38:44", "throughput": 27647.09, "total_tokens": 6154521728} +{"current_steps": 20980, "total_steps": 29667, "loss": 0.3449, "lr": 2.840771531052131e-05, "epoch": 2.121556110356161, "percentage": 70.72, "elapsed_time": "2 days, 13:51:53", "remaining_time": "1 day, 1:36:57", "throughput": 27647.44, 
"total_tokens": 6157467072} +{"current_steps": 20990, "total_steps": 29667, "loss": 0.3472, "lr": 2.840313142471694e-05, "epoch": 2.1225673924722686, "percentage": 70.75, "elapsed_time": "2 days, 13:53:38", "remaining_time": "1 day, 1:35:10", "throughput": 27647.74, "total_tokens": 6160423296} +{"current_steps": 21000, "total_steps": 29667, "loss": 0.3519, "lr": 2.83985497571723e-05, "epoch": 2.1235786745883765, "percentage": 70.79, "elapsed_time": "2 days, 13:55:22", "remaining_time": "1 day, 1:33:23", "throughput": 27648.06, "total_tokens": 6163384896} +{"current_steps": 21010, "total_steps": 29667, "loss": 0.3488, "lr": 2.8393970306098843e-05, "epoch": 2.1245899567044844, "percentage": 70.82, "elapsed_time": "2 days, 13:57:00", "remaining_time": "1 day, 1:31:33", "throughput": 27649.07, "total_tokens": 6166311488} +{"current_steps": 21020, "total_steps": 29667, "loss": 0.3482, "lr": 2.8389393069710053e-05, "epoch": 2.1256012388205923, "percentage": 70.85, "elapsed_time": "2 days, 13:58:40", "remaining_time": "1 day, 1:29:45", "throughput": 27649.82, "total_tokens": 6169246464} +{"current_steps": 21030, "total_steps": 29667, "loss": 0.348, "lr": 2.8384818046221418e-05, "epoch": 2.1266125209367, "percentage": 70.89, "elapsed_time": "2 days, 14:00:24", "remaining_time": "1 day, 1:27:58", "throughput": 27650.3, "total_tokens": 6172232192} +{"current_steps": 21040, "total_steps": 29667, "loss": 0.3474, "lr": 2.8380245233850434e-05, "epoch": 2.127623803052808, "percentage": 70.92, "elapsed_time": "2 days, 14:02:06", "remaining_time": "1 day, 1:26:10", "throughput": 27650.98, "total_tokens": 6175189312} +{"current_steps": 21050, "total_steps": 29667, "loss": 0.3437, "lr": 2.837567463081662e-05, "epoch": 2.1286350851689155, "percentage": 70.95, "elapsed_time": "2 days, 14:03:49", "remaining_time": "1 day, 1:24:22", "throughput": 27651.4, "total_tokens": 6178139584} +{"current_steps": 21060, "total_steps": 29667, "loss": 0.3492, "lr": 2.8371106235341477e-05, "epoch": 
2.1296463672850234, "percentage": 70.99, "elapsed_time": "2 days, 14:05:33", "remaining_time": "1 day, 1:22:35", "throughput": 27651.83, "total_tokens": 6181117056} +{"current_steps": 21070, "total_steps": 29667, "loss": 0.3464, "lr": 2.836654004564855e-05, "epoch": 2.1306576494011313, "percentage": 71.02, "elapsed_time": "2 days, 14:07:15", "remaining_time": "1 day, 1:20:47", "throughput": 27652.44, "total_tokens": 6184065280} +{"current_steps": 21080, "total_steps": 29667, "loss": 0.3436, "lr": 2.8361976059963348e-05, "epoch": 2.1316689315172392, "percentage": 71.06, "elapsed_time": "2 days, 14:08:56", "remaining_time": "1 day, 1:18:59", "throughput": 27653.1, "total_tokens": 6187012736} +{"current_steps": 21090, "total_steps": 29667, "loss": 0.349, "lr": 2.835741427651339e-05, "epoch": 2.132680213633347, "percentage": 71.09, "elapsed_time": "2 days, 14:10:38", "remaining_time": "1 day, 1:17:11", "throughput": 27653.61, "total_tokens": 6189934976} +{"current_steps": 21100, "total_steps": 29667, "loss": 0.3504, "lr": 2.8352854693528197e-05, "epoch": 2.133691495749455, "percentage": 71.12, "elapsed_time": "2 days, 14:12:23", "remaining_time": "1 day, 1:15:25", "throughput": 27653.81, "total_tokens": 6192892736} +{"current_steps": 21110, "total_steps": 29667, "loss": 0.3509, "lr": 2.8348297309239274e-05, "epoch": 2.1347027778655625, "percentage": 71.16, "elapsed_time": "2 days, 14:14:03", "remaining_time": "1 day, 1:13:36", "throughput": 27654.58, "total_tokens": 6195818560} +{"current_steps": 21120, "total_steps": 29667, "loss": 0.3425, "lr": 2.834374212188012e-05, "epoch": 2.1357140599816704, "percentage": 71.19, "elapsed_time": "2 days, 14:15:44", "remaining_time": "1 day, 1:11:48", "throughput": 27655.15, "total_tokens": 6198738944} +{"current_steps": 21130, "total_steps": 29667, "loss": 0.3435, "lr": 2.833918912968621e-05, "epoch": 2.1367253420977783, "percentage": 71.22, "elapsed_time": "2 days, 14:17:23", "remaining_time": "1 day, 1:09:59", "throughput": 
27655.84, "total_tokens": 6201638848} +{"current_steps": 21140, "total_steps": 29667, "loss": 0.3456, "lr": 2.833463833089502e-05, "epoch": 2.137736624213886, "percentage": 71.26, "elapsed_time": "2 days, 14:19:01", "remaining_time": "1 day, 1:08:10", "throughput": 27656.55, "total_tokens": 6204506688} +{"current_steps": 21150, "total_steps": 29667, "loss": 0.3469, "lr": 2.8330089723745985e-05, "epoch": 2.138747906329994, "percentage": 71.29, "elapsed_time": "2 days, 14:20:41", "remaining_time": "1 day, 1:06:21", "throughput": 27657.24, "total_tokens": 6207426752} +{"current_steps": 21160, "total_steps": 29667, "loss": 0.3468, "lr": 2.8325543306480538e-05, "epoch": 2.139759188446102, "percentage": 71.33, "elapsed_time": "2 days, 14:22:21", "remaining_time": "1 day, 1:04:32", "throughput": 27657.98, "total_tokens": 6210351936} +{"current_steps": 21170, "total_steps": 29667, "loss": 0.3415, "lr": 2.832099907734208e-05, "epoch": 2.1407704705622095, "percentage": 71.36, "elapsed_time": "2 days, 14:24:01", "remaining_time": "1 day, 1:02:44", "throughput": 27658.74, "total_tokens": 6213308544} +{"current_steps": 21180, "total_steps": 29667, "loss": 0.3466, "lr": 2.831645703457598e-05, "epoch": 2.1417817526783174, "percentage": 71.39, "elapsed_time": "2 days, 14:25:43", "remaining_time": "1 day, 1:00:56", "throughput": 27659.27, "total_tokens": 6216240448} +{"current_steps": 21190, "total_steps": 29667, "loss": 0.3501, "lr": 2.8311917176429582e-05, "epoch": 2.1427930347944253, "percentage": 71.43, "elapsed_time": "2 days, 14:27:25", "remaining_time": "1 day, 0:59:09", "throughput": 27659.69, "total_tokens": 6219168960} +{"current_steps": 21200, "total_steps": 29667, "loss": 0.3455, "lr": 2.830737950115218e-05, "epoch": 2.143804316910533, "percentage": 71.46, "elapsed_time": "2 days, 14:29:08", "remaining_time": "1 day, 0:57:21", "throughput": 27660.16, "total_tokens": 6222121536} +{"current_steps": 21210, "total_steps": 29667, "loss": 0.3476, "lr": 2.8302844006995062e-05, 
"epoch": 2.144815599026641, "percentage": 71.49, "elapsed_time": "2 days, 14:30:50", "remaining_time": "1 day, 0:55:33", "throughput": 27660.9, "total_tokens": 6225110144} +{"current_steps": 21220, "total_steps": 29667, "loss": 0.3483, "lr": 2.829831069221145e-05, "epoch": 2.145826881142749, "percentage": 71.53, "elapsed_time": "2 days, 14:32:33", "remaining_time": "1 day, 0:53:46", "throughput": 27661.38, "total_tokens": 6228047360} +{"current_steps": 21230, "total_steps": 29667, "loss": 0.3467, "lr": 2.8293779555056532e-05, "epoch": 2.1468381632588565, "percentage": 71.56, "elapsed_time": "2 days, 14:34:18", "remaining_time": "1 day, 0:51:59", "throughput": 27661.88, "total_tokens": 6231077184} +{"current_steps": 21240, "total_steps": 29667, "loss": 0.3491, "lr": 2.8289250593787454e-05, "epoch": 2.1478494453749644, "percentage": 71.59, "elapsed_time": "2 days, 14:36:00", "remaining_time": "1 day, 0:50:12", "throughput": 27662.5, "total_tokens": 6234045760} +{"current_steps": 21250, "total_steps": 29667, "loss": 0.3465, "lr": 2.8284723806663316e-05, "epoch": 2.1488607274910723, "percentage": 71.63, "elapsed_time": "2 days, 14:37:39", "remaining_time": "1 day, 0:48:23", "throughput": 27663.14, "total_tokens": 6236928320} +{"current_steps": 21260, "total_steps": 29667, "loss": 0.3496, "lr": 2.828019919194515e-05, "epoch": 2.14987200960718, "percentage": 71.66, "elapsed_time": "2 days, 14:39:23", "remaining_time": "1 day, 0:46:36", "throughput": 27663.51, "total_tokens": 6239888320} +{"current_steps": 21270, "total_steps": 29667, "loss": 0.3483, "lr": 2.827567674789597e-05, "epoch": 2.150883291723288, "percentage": 71.7, "elapsed_time": "2 days, 14:41:00", "remaining_time": "1 day, 0:44:46", "throughput": 27664.49, "total_tokens": 6242795776} +{"current_steps": 21280, "total_steps": 29667, "loss": 0.3507, "lr": 2.8271156472780697e-05, "epoch": 2.151894573839396, "percentage": 71.73, "elapsed_time": "2 days, 14:42:45", "remaining_time": "1 day, 0:42:59", "throughput": 
27664.84, "total_tokens": 6245759296} +{"current_steps": 21290, "total_steps": 29667, "loss": 0.3481, "lr": 2.826663836486621e-05, "epoch": 2.1529058559555034, "percentage": 71.76, "elapsed_time": "2 days, 14:44:27", "remaining_time": "1 day, 0:41:12", "throughput": 27665.24, "total_tokens": 6248684352} +{"current_steps": 21300, "total_steps": 29667, "loss": 0.35, "lr": 2.8262122422421326e-05, "epoch": 2.1539171380716113, "percentage": 71.8, "elapsed_time": "2 days, 14:46:11", "remaining_time": "1 day, 0:39:25", "throughput": 27665.62, "total_tokens": 6251635776} +{"current_steps": 21310, "total_steps": 29667, "loss": 0.3495, "lr": 2.8257608643716797e-05, "epoch": 2.1549284201877192, "percentage": 71.83, "elapsed_time": "2 days, 14:47:49", "remaining_time": "1 day, 0:37:36", "throughput": 27666.51, "total_tokens": 6254546176} +{"current_steps": 21320, "total_steps": 29667, "loss": 0.3423, "lr": 2.8253097027025312e-05, "epoch": 2.155939702303827, "percentage": 71.86, "elapsed_time": "2 days, 14:49:27", "remaining_time": "1 day, 0:35:46", "throughput": 27667.36, "total_tokens": 6257456576} +{"current_steps": 21330, "total_steps": 29667, "loss": 0.3475, "lr": 2.8248587570621472e-05, "epoch": 2.156950984419935, "percentage": 71.9, "elapsed_time": "2 days, 14:51:09", "remaining_time": "1 day, 0:33:59", "throughput": 27667.9, "total_tokens": 6260397120} +{"current_steps": 21340, "total_steps": 29667, "loss": 0.3486, "lr": 2.824408027278182e-05, "epoch": 2.1579622665360425, "percentage": 71.93, "elapsed_time": "2 days, 14:52:50", "remaining_time": "1 day, 0:32:11", "throughput": 27668.47, "total_tokens": 6263318144} +{"current_steps": 21350, "total_steps": 29667, "loss": 0.3478, "lr": 2.823957513178483e-05, "epoch": 2.1589735486521504, "percentage": 71.97, "elapsed_time": "2 days, 14:54:29", "remaining_time": "1 day, 0:30:22", "throughput": 27669.3, "total_tokens": 6266250688} +{"current_steps": 21360, "total_steps": 29667, "loss": 0.343, "lr": 2.8235072145910878e-05, 
"epoch": 2.1599848307682583, "percentage": 72.0, "elapsed_time": "2 days, 14:56:15", "remaining_time": "1 day, 0:28:36", "throughput": 27669.38, "total_tokens": 6269197184} +{"current_steps": 21370, "total_steps": 29667, "loss": 0.3423, "lr": 2.8230571313442273e-05, "epoch": 2.160996112884366, "percentage": 72.03, "elapsed_time": "2 days, 14:57:56", "remaining_time": "1 day, 0:26:48", "throughput": 27669.97, "total_tokens": 6272128064} +{"current_steps": 21380, "total_steps": 29667, "loss": 0.3437, "lr": 2.822607263266324e-05, "epoch": 2.162007395000474, "percentage": 72.07, "elapsed_time": "2 days, 14:59:35", "remaining_time": "1 day, 0:24:59", "throughput": 27670.78, "total_tokens": 6275059392} +{"current_steps": 21390, "total_steps": 29667, "loss": 0.3434, "lr": 2.822157610185991e-05, "epoch": 2.163018677116582, "percentage": 72.1, "elapsed_time": "2 days, 15:01:16", "remaining_time": "1 day, 0:23:11", "throughput": 27671.38, "total_tokens": 6277975616} +{"current_steps": 21400, "total_steps": 29667, "loss": 0.3499, "lr": 2.821708171932032e-05, "epoch": 2.16402995923269, "percentage": 72.13, "elapsed_time": "2 days, 15:02:58", "remaining_time": "1 day, 0:21:23", "throughput": 27671.78, "total_tokens": 6280907776} +{"current_steps": 21410, "total_steps": 29667, "loss": 0.3445, "lr": 2.821258948333444e-05, "epoch": 2.1650412413487974, "percentage": 72.17, "elapsed_time": "2 days, 15:04:38", "remaining_time": "1 day, 0:19:35", "throughput": 27672.23, "total_tokens": 6283778048} +{"current_steps": 21420, "total_steps": 29667, "loss": 0.3463, "lr": 2.8208099392194116e-05, "epoch": 2.1660525234649053, "percentage": 72.2, "elapsed_time": "2 days, 15:06:18", "remaining_time": "1 day, 0:17:46", "throughput": 27672.92, "total_tokens": 6286681216} +{"current_steps": 21430, "total_steps": 29667, "loss": 0.3488, "lr": 2.8203611444193113e-05, "epoch": 2.167063805581013, "percentage": 72.24, "elapsed_time": "2 days, 15:07:56", "remaining_time": "1 day, 0:15:57", "throughput": 
27673.96, "total_tokens": 6289640576} +{"current_steps": 21440, "total_steps": 29667, "loss": 0.3444, "lr": 2.8199125637627084e-05, "epoch": 2.168075087697121, "percentage": 72.27, "elapsed_time": "2 days, 15:09:37", "remaining_time": "1 day, 0:14:09", "throughput": 27674.54, "total_tokens": 6292578496} +{"current_steps": 21450, "total_steps": 29667, "loss": 0.3484, "lr": 2.8194641970793593e-05, "epoch": 2.169086369813229, "percentage": 72.3, "elapsed_time": "2 days, 15:11:17", "remaining_time": "1 day, 0:12:21", "throughput": 27675.18, "total_tokens": 6295484416} +{"current_steps": 21460, "total_steps": 29667, "loss": 0.3498, "lr": 2.8190160441992092e-05, "epoch": 2.1700976519293365, "percentage": 72.34, "elapsed_time": "2 days, 15:13:01", "remaining_time": "1 day, 0:10:34", "throughput": 27675.63, "total_tokens": 6298460352} +{"current_steps": 21470, "total_steps": 29667, "loss": 0.3487, "lr": 2.818568104952392e-05, "epoch": 2.1711089340454444, "percentage": 72.37, "elapsed_time": "2 days, 15:14:44", "remaining_time": "1 day, 0:08:47", "throughput": 27676.09, "total_tokens": 6301428032} +{"current_steps": 21480, "total_steps": 29667, "loss": 0.3481, "lr": 2.8181203791692306e-05, "epoch": 2.1721202161615523, "percentage": 72.4, "elapsed_time": "2 days, 15:16:29", "remaining_time": "1 day, 0:07:01", "throughput": 27676.25, "total_tokens": 6304368000} +{"current_steps": 21490, "total_steps": 29667, "loss": 0.3459, "lr": 2.8176728666802375e-05, "epoch": 2.17313149827766, "percentage": 72.44, "elapsed_time": "2 days, 15:18:15", "remaining_time": "1 day, 0:05:14", "throughput": 27676.36, "total_tokens": 6307322560} +{"current_steps": 21500, "total_steps": 29667, "loss": 0.346, "lr": 2.8172255673161124e-05, "epoch": 2.174142780393768, "percentage": 72.47, "elapsed_time": "2 days, 15:20:02", "remaining_time": "1 day, 0:03:28", "throughput": 27676.27, "total_tokens": 6310247360} +{"current_steps": 21510, "total_steps": 29667, "loss": 0.3473, "lr": 2.8167784809077436e-05, 
"epoch": 2.175154062509876, "percentage": 72.5, "elapsed_time": "2 days, 15:21:40", "remaining_time": "1 day, 0:01:40", "throughput": 27676.95, "total_tokens": 6313133248} +{"current_steps": 21520, "total_steps": 29667, "loss": 0.3438, "lr": 2.816331607286207e-05, "epoch": 2.1761653446259834, "percentage": 72.54, "elapsed_time": "2 days, 15:23:22", "remaining_time": "23:59:52", "throughput": 27677.47, "total_tokens": 6316075584} +{"current_steps": 21530, "total_steps": 29667, "loss": 0.3438, "lr": 2.815884946282766e-05, "epoch": 2.1771766267420913, "percentage": 72.57, "elapsed_time": "2 days, 15:25:05", "remaining_time": "23:58:05", "throughput": 27678.01, "total_tokens": 6319054336} +{"current_steps": 21540, "total_steps": 29667, "loss": 0.3449, "lr": 2.815438497728871e-05, "epoch": 2.1781879088581992, "percentage": 72.61, "elapsed_time": "2 days, 15:26:49", "remaining_time": "23:56:18", "throughput": 27678.28, "total_tokens": 6321989696} +{"current_steps": 21550, "total_steps": 29667, "loss": 0.3442, "lr": 2.8149922614561607e-05, "epoch": 2.179199190974307, "percentage": 72.64, "elapsed_time": "2 days, 15:28:30", "remaining_time": "23:54:30", "throughput": 27678.84, "total_tokens": 6324904960} +{"current_steps": 21560, "total_steps": 29667, "loss": 0.3485, "lr": 2.8145462372964588e-05, "epoch": 2.180210473090415, "percentage": 72.67, "elapsed_time": "2 days, 15:30:13", "remaining_time": "23:52:43", "throughput": 27679.41, "total_tokens": 6327892224} +{"current_steps": 21570, "total_steps": 29667, "loss": 0.3482, "lr": 2.814100425081777e-05, "epoch": 2.181221755206523, "percentage": 72.71, "elapsed_time": "2 days, 15:31:57", "remaining_time": "23:50:56", "throughput": 27679.89, "total_tokens": 6330886784} +{"current_steps": 21580, "total_steps": 29667, "loss": 0.3479, "lr": 2.8136548246443117e-05, "epoch": 2.1822330373226304, "percentage": 72.74, "elapsed_time": "2 days, 15:33:38", "remaining_time": "23:49:08", "throughput": 27680.57, "total_tokens": 6333819968} 
+{"current_steps": 21590, "total_steps": 29667, "loss": 0.3471, "lr": 2.8132094358164468e-05, "epoch": 2.1832443194387383, "percentage": 72.77, "elapsed_time": "2 days, 15:35:25", "remaining_time": "23:47:22", "throughput": 27680.4, "total_tokens": 6336749120} +{"current_steps": 21600, "total_steps": 29667, "loss": 0.3513, "lr": 2.8127642584307508e-05, "epoch": 2.184255601554846, "percentage": 72.81, "elapsed_time": "2 days, 15:37:11", "remaining_time": "23:45:36", "throughput": 27680.52, "total_tokens": 6339709568} +{"current_steps": 21610, "total_steps": 29667, "loss": 0.3472, "lr": 2.8123192923199776e-05, "epoch": 2.185266883670954, "percentage": 72.84, "elapsed_time": "2 days, 15:38:50", "remaining_time": "23:43:48", "throughput": 27681.09, "total_tokens": 6342595072} +{"current_steps": 21620, "total_steps": 29667, "loss": 0.3451, "lr": 2.8118745373170667e-05, "epoch": 2.186278165787062, "percentage": 72.88, "elapsed_time": "2 days, 15:40:32", "remaining_time": "23:42:00", "throughput": 27681.73, "total_tokens": 6345544832} +{"current_steps": 21630, "total_steps": 29667, "loss": 0.3462, "lr": 2.8114299932551423e-05, "epoch": 2.18728944790317, "percentage": 72.91, "elapsed_time": "2 days, 15:42:13", "remaining_time": "23:40:12", "throughput": 27682.35, "total_tokens": 6348497344} +{"current_steps": 21640, "total_steps": 29667, "loss": 0.3454, "lr": 2.8109856599675145e-05, "epoch": 2.1883007300192774, "percentage": 72.94, "elapsed_time": "2 days, 15:43:52", "remaining_time": "23:38:24", "throughput": 27683.18, "total_tokens": 6351425728} +{"current_steps": 21650, "total_steps": 29667, "loss": 0.3467, "lr": 2.8105415372876742e-05, "epoch": 2.1893120121353853, "percentage": 72.98, "elapsed_time": "2 days, 15:45:36", "remaining_time": "23:36:37", "throughput": 27683.34, "total_tokens": 6354351808} +{"current_steps": 21660, "total_steps": 29667, "loss": 0.3487, "lr": 2.8100976250493e-05, "epoch": 2.190323294251493, "percentage": 73.01, "elapsed_time": "2 days, 
15:47:22", "remaining_time": "23:34:51", "throughput": 27683.56, "total_tokens": 6357331584} +{"current_steps": 21670, "total_steps": 29667, "loss": 0.3433, "lr": 2.8096539230862527e-05, "epoch": 2.191334576367601, "percentage": 73.04, "elapsed_time": "2 days, 15:49:06", "remaining_time": "23:33:04", "throughput": 27683.97, "total_tokens": 6360294336} +{"current_steps": 21680, "total_steps": 29667, "loss": 0.3469, "lr": 2.809210431232578e-05, "epoch": 2.192345858483709, "percentage": 73.08, "elapsed_time": "2 days, 15:50:47", "remaining_time": "23:31:16", "throughput": 27684.65, "total_tokens": 6363237120} +{"current_steps": 21690, "total_steps": 29667, "loss": 0.3465, "lr": 2.8087671493225025e-05, "epoch": 2.193357140599817, "percentage": 73.11, "elapsed_time": "2 days, 15:52:26", "remaining_time": "23:29:28", "throughput": 27685.49, "total_tokens": 6366185856} +{"current_steps": 21700, "total_steps": 29667, "loss": 0.3472, "lr": 2.808324077190438e-05, "epoch": 2.1943684227159244, "percentage": 73.15, "elapsed_time": "2 days, 15:54:09", "remaining_time": "23:27:41", "throughput": 27686.05, "total_tokens": 6369167680} +{"current_steps": 21710, "total_steps": 29667, "loss": 0.3453, "lr": 2.807881214670978e-05, "epoch": 2.1953797048320323, "percentage": 73.18, "elapsed_time": "2 days, 15:55:54", "remaining_time": "23:25:54", "throughput": 27686.46, "total_tokens": 6372172928} +{"current_steps": 21720, "total_steps": 29667, "loss": 0.3467, "lr": 2.8074385615988996e-05, "epoch": 2.19639098694814, "percentage": 73.21, "elapsed_time": "2 days, 15:57:34", "remaining_time": "23:24:06", "throughput": 27687.17, "total_tokens": 6375083456} +{"current_steps": 21730, "total_steps": 29667, "loss": 0.353, "lr": 2.8069961178091602e-05, "epoch": 2.197402269064248, "percentage": 73.25, "elapsed_time": "2 days, 15:59:13", "remaining_time": "23:22:18", "throughput": 27687.74, "total_tokens": 6377981696} +{"current_steps": 21740, "total_steps": 29667, "loss": 0.3418, "lr": 
2.806553883136901e-05, "epoch": 2.198413551180356, "percentage": 73.28, "elapsed_time": "2 days, 16:00:59", "remaining_time": "23:20:32", "throughput": 27687.79, "total_tokens": 6380927104} +{"current_steps": 21750, "total_steps": 29667, "loss": 0.3489, "lr": 2.806111857417445e-05, "epoch": 2.199424833296464, "percentage": 73.31, "elapsed_time": "2 days, 16:03:01", "remaining_time": "23:18:51", "throughput": 27685.92, "total_tokens": 6383858432} +{"current_steps": 21760, "total_steps": 29667, "loss": 0.3475, "lr": 2.8056700404862957e-05, "epoch": 2.2004361154125713, "percentage": 73.35, "elapsed_time": "2 days, 16:04:48", "remaining_time": "23:17:05", "throughput": 27685.96, "total_tokens": 6386831296} +{"current_steps": 21770, "total_steps": 29667, "loss": 0.3437, "lr": 2.8052284321791383e-05, "epoch": 2.2014473975286792, "percentage": 73.38, "elapsed_time": "2 days, 16:06:26", "remaining_time": "23:15:17", "throughput": 27686.73, "total_tokens": 6389719232} +{"current_steps": 21780, "total_steps": 29667, "loss": 0.3456, "lr": 2.8047870323318382e-05, "epoch": 2.202458679644787, "percentage": 73.41, "elapsed_time": "2 days, 16:08:04", "remaining_time": "23:13:28", "throughput": 27687.59, "total_tokens": 6392628992} +{"current_steps": 21790, "total_steps": 29667, "loss": 0.3489, "lr": 2.8043458407804428e-05, "epoch": 2.203469961760895, "percentage": 73.45, "elapsed_time": "2 days, 16:09:43", "remaining_time": "23:11:39", "throughput": 27688.43, "total_tokens": 6395574720} +{"current_steps": 21800, "total_steps": 29667, "loss": 0.3506, "lr": 2.8039048573611805e-05, "epoch": 2.204481243877003, "percentage": 73.48, "elapsed_time": "2 days, 16:11:22", "remaining_time": "23:09:51", "throughput": 27689.21, "total_tokens": 6398489536} +{"current_steps": 21810, "total_steps": 29667, "loss": 0.3483, "lr": 2.8034640819104574e-05, "epoch": 2.205492525993111, "percentage": 73.52, "elapsed_time": "2 days, 16:13:01", "remaining_time": "23:08:02", "throughput": 27690.1, 
"total_tokens": 6401429248} +{"current_steps": 21820, "total_steps": 29667, "loss": 0.3455, "lr": 2.803023514264861e-05, "epoch": 2.2065038081092183, "percentage": 73.55, "elapsed_time": "2 days, 16:14:38", "remaining_time": "23:06:13", "throughput": 27691.01, "total_tokens": 6404320448} +{"current_steps": 21830, "total_steps": 29667, "loss": 0.35, "lr": 2.8025831542611596e-05, "epoch": 2.207515090225326, "percentage": 73.58, "elapsed_time": "2 days, 16:16:12", "remaining_time": "23:04:23", "throughput": 27691.99, "total_tokens": 6407168512} +{"current_steps": 21840, "total_steps": 29667, "loss": 0.3457, "lr": 2.8021430017362994e-05, "epoch": 2.208526372341434, "percentage": 73.62, "elapsed_time": "2 days, 16:17:58", "remaining_time": "23:02:36", "throughput": 27692.26, "total_tokens": 6410153664} +{"current_steps": 21850, "total_steps": 29667, "loss": 0.3449, "lr": 2.801703056527406e-05, "epoch": 2.209537654457542, "percentage": 73.65, "elapsed_time": "2 days, 16:19:38", "remaining_time": "23:00:48", "throughput": 27693.03, "total_tokens": 6413099712} +{"current_steps": 21860, "total_steps": 29667, "loss": 0.3487, "lr": 2.801263318471784e-05, "epoch": 2.21054893657365, "percentage": 73.68, "elapsed_time": "2 days, 16:21:20", "remaining_time": "22:59:01", "throughput": 27693.64, "total_tokens": 6416090752} +{"current_steps": 21870, "total_steps": 29667, "loss": 0.3456, "lr": 2.800823787406917e-05, "epoch": 2.2115602186897574, "percentage": 73.72, "elapsed_time": "2 days, 16:23:02", "remaining_time": "22:57:14", "throughput": 27694.07, "total_tokens": 6419007424} +{"current_steps": 21880, "total_steps": 29667, "loss": 0.3481, "lr": 2.8003844631704678e-05, "epoch": 2.2125715008058653, "percentage": 73.75, "elapsed_time": "2 days, 16:24:44", "remaining_time": "22:55:26", "throughput": 27694.55, "total_tokens": 6421944768} +{"current_steps": 21890, "total_steps": 29667, "loss": 0.3478, "lr": 2.7999453456002755e-05, "epoch": 2.213582782921973, "percentage": 73.79, 
"elapsed_time": "2 days, 16:26:26", "remaining_time": "22:53:39", "throughput": 27695.11, "total_tokens": 6424892480} +{"current_steps": 21900, "total_steps": 29667, "loss": 0.3491, "lr": 2.799506434534359e-05, "epoch": 2.214594065038081, "percentage": 73.82, "elapsed_time": "2 days, 16:28:09", "remaining_time": "22:51:52", "throughput": 27695.42, "total_tokens": 6427820224} +{"current_steps": 21910, "total_steps": 29667, "loss": 0.3467, "lr": 2.7990677298109136e-05, "epoch": 2.215605347154189, "percentage": 73.85, "elapsed_time": "2 days, 16:29:53", "remaining_time": "22:50:05", "throughput": 27695.74, "total_tokens": 6430768512} +{"current_steps": 21920, "total_steps": 29667, "loss": 0.3487, "lr": 2.7986292312683125e-05, "epoch": 2.216616629270297, "percentage": 73.89, "elapsed_time": "2 days, 16:31:34", "remaining_time": "22:48:17", "throughput": 27696.16, "total_tokens": 6433668672} +{"current_steps": 21930, "total_steps": 29667, "loss": 0.3461, "lr": 2.798190938745106e-05, "epoch": 2.217627911386405, "percentage": 73.92, "elapsed_time": "2 days, 16:33:10", "remaining_time": "22:46:28", "throughput": 27697.23, "total_tokens": 6436570176} +{"current_steps": 21940, "total_steps": 29667, "loss": 0.3493, "lr": 2.7977528520800218e-05, "epoch": 2.2186391935025123, "percentage": 73.95, "elapsed_time": "2 days, 16:34:49", "remaining_time": "22:44:39", "throughput": 27697.89, "total_tokens": 6439469120} +{"current_steps": 21950, "total_steps": 29667, "loss": 0.3422, "lr": 2.7973149711119635e-05, "epoch": 2.21965047561862, "percentage": 73.99, "elapsed_time": "2 days, 16:36:31", "remaining_time": "22:42:52", "throughput": 27698.34, "total_tokens": 6442405248} +{"current_steps": 21960, "total_steps": 29667, "loss": 0.3501, "lr": 2.7968772956800115e-05, "epoch": 2.220661757734728, "percentage": 74.02, "elapsed_time": "2 days, 16:38:16", "remaining_time": "22:41:06", "throughput": 27698.74, "total_tokens": 6445390720} +{"current_steps": 21970, "total_steps": 29667, "loss": 
0.346, "lr": 2.796439825623423e-05, "epoch": 2.221673039850836, "percentage": 74.06, "elapsed_time": "2 days, 16:40:00", "remaining_time": "22:39:19", "throughput": 27698.95, "total_tokens": 6448323328} +{"current_steps": 21980, "total_steps": 29667, "loss": 0.3512, "lr": 2.79600256078163e-05, "epoch": 2.222684321966944, "percentage": 74.09, "elapsed_time": "2 days, 16:41:41", "remaining_time": "22:37:31", "throughput": 27699.37, "total_tokens": 6451217600} +{"current_steps": 21990, "total_steps": 29667, "loss": 0.3531, "lr": 2.7955655009942416e-05, "epoch": 2.2236956040830513, "percentage": 74.12, "elapsed_time": "2 days, 16:43:25", "remaining_time": "22:35:45", "throughput": 27699.65, "total_tokens": 6454180544} +{"current_steps": 22000, "total_steps": 29667, "loss": 0.3473, "lr": 2.79512864610104e-05, "epoch": 2.2247068861991592, "percentage": 74.16, "elapsed_time": "2 days, 16:45:06", "remaining_time": "22:33:57", "throughput": 27700.29, "total_tokens": 6457117760} +{"current_steps": 22010, "total_steps": 29667, "loss": 0.3491, "lr": 2.794691995941986e-05, "epoch": 2.225718168315267, "percentage": 74.19, "elapsed_time": "2 days, 16:46:53", "remaining_time": "22:32:11", "throughput": 27700.21, "total_tokens": 6460060416} +{"current_steps": 22020, "total_steps": 29667, "loss": 0.3427, "lr": 2.7942555503572115e-05, "epoch": 2.226729450431375, "percentage": 74.22, "elapsed_time": "2 days, 16:48:41", "remaining_time": "22:30:26", "throughput": 27700.15, "total_tokens": 6463043712} +{"current_steps": 22030, "total_steps": 29667, "loss": 0.3461, "lr": 2.7938193091870268e-05, "epoch": 2.227740732547483, "percentage": 74.26, "elapsed_time": "2 days, 16:50:22", "remaining_time": "22:28:39", "throughput": 27701.01, "total_tokens": 6466046016} +{"current_steps": 22040, "total_steps": 29667, "loss": 0.3482, "lr": 2.793383272271914e-05, "epoch": 2.228752014663591, "percentage": 74.29, "elapsed_time": "2 days, 16:52:07", "remaining_time": "22:26:52", "throughput": 27701.43, 
"total_tokens": 6469039680} +{"current_steps": 22050, "total_steps": 29667, "loss": 0.3454, "lr": 2.7929474394525307e-05, "epoch": 2.2297632967796983, "percentage": 74.33, "elapsed_time": "2 days, 16:53:51", "remaining_time": "22:25:06", "throughput": 27701.58, "total_tokens": 6471962944} +{"current_steps": 22060, "total_steps": 29667, "loss": 0.3541, "lr": 2.7925118105697078e-05, "epoch": 2.230774578895806, "percentage": 74.36, "elapsed_time": "2 days, 16:55:32", "remaining_time": "22:23:18", "throughput": 27702.37, "total_tokens": 6474946624} +{"current_steps": 22070, "total_steps": 29667, "loss": 0.3468, "lr": 2.792076385464451e-05, "epoch": 2.231785861011914, "percentage": 74.39, "elapsed_time": "2 days, 16:57:16", "remaining_time": "22:21:31", "throughput": 27702.56, "total_tokens": 6477865664} +{"current_steps": 22080, "total_steps": 29667, "loss": 0.3463, "lr": 2.7916411639779383e-05, "epoch": 2.232797143128022, "percentage": 74.43, "elapsed_time": "2 days, 16:59:03", "remaining_time": "22:19:46", "throughput": 27702.59, "total_tokens": 6480846336} +{"current_steps": 22090, "total_steps": 29667, "loss": 0.3471, "lr": 2.7912061459515215e-05, "epoch": 2.23380842524413, "percentage": 74.46, "elapsed_time": "2 days, 17:00:47", "remaining_time": "22:17:59", "throughput": 27702.72, "total_tokens": 6483750592} +{"current_steps": 22100, "total_steps": 29667, "loss": 0.3465, "lr": 2.7907713312267247e-05, "epoch": 2.234819707360238, "percentage": 74.49, "elapsed_time": "2 days, 17:02:26", "remaining_time": "22:16:11", "throughput": 27703.5, "total_tokens": 6486664448} +{"current_steps": 22110, "total_steps": 29667, "loss": 0.3459, "lr": 2.7903367196452457e-05, "epoch": 2.2358309894763453, "percentage": 74.53, "elapsed_time": "2 days, 17:04:06", "remaining_time": "22:14:23", "throughput": 27704.07, "total_tokens": 6489586752} +{"current_steps": 22120, "total_steps": 29667, "loss": 0.3424, "lr": 2.7899023110489554e-05, "epoch": 2.236842271592453, "percentage": 74.56, 
"elapsed_time": "2 days, 17:05:49", "remaining_time": "22:12:36", "throughput": 27704.57, "total_tokens": 6492546944} +{"current_steps": 22130, "total_steps": 29667, "loss": 0.3464, "lr": 2.789468105279895e-05, "epoch": 2.237853553708561, "percentage": 74.59, "elapsed_time": "2 days, 17:07:30", "remaining_time": "22:10:48", "throughput": 27705.22, "total_tokens": 6495503104} +{"current_steps": 22140, "total_steps": 29667, "loss": 0.3475, "lr": 2.7890341021802786e-05, "epoch": 2.238864835824669, "percentage": 74.63, "elapsed_time": "2 days, 17:09:11", "remaining_time": "22:09:01", "throughput": 27705.95, "total_tokens": 6498465152} +{"current_steps": 22150, "total_steps": 29667, "loss": 0.3485, "lr": 2.7886003015924933e-05, "epoch": 2.239876117940777, "percentage": 74.66, "elapsed_time": "2 days, 17:10:54", "remaining_time": "22:07:14", "throughput": 27706.26, "total_tokens": 6501396544} +{"current_steps": 22160, "total_steps": 29667, "loss": 0.3469, "lr": 2.788166703359096e-05, "epoch": 2.240887400056885, "percentage": 74.7, "elapsed_time": "2 days, 17:12:42", "remaining_time": "22:05:28", "throughput": 27706.17, "total_tokens": 6504362176} +{"current_steps": 22170, "total_steps": 29667, "loss": 0.3482, "lr": 2.787733307322816e-05, "epoch": 2.2418986821729923, "percentage": 74.73, "elapsed_time": "2 days, 17:14:24", "remaining_time": "22:03:41", "throughput": 27706.41, "total_tokens": 6507246976} +{"current_steps": 22180, "total_steps": 29667, "loss": 0.3465, "lr": 2.7873001133265518e-05, "epoch": 2.2429099642891, "percentage": 74.76, "elapsed_time": "2 days, 17:16:21", "remaining_time": "22:01:59", "throughput": 27705.04, "total_tokens": 6510177088} +{"current_steps": 22190, "total_steps": 29667, "loss": 0.3497, "lr": 2.7868671212133768e-05, "epoch": 2.243921246405208, "percentage": 74.8, "elapsed_time": "2 days, 17:18:26", "remaining_time": "22:00:19", "throughput": 27702.79, "total_tokens": 6513107776} +{"current_steps": 22200, "total_steps": 29667, "loss": 
0.3471, "lr": 2.7864343308265313e-05, "epoch": 2.244932528521316, "percentage": 74.83, "elapsed_time": "2 days, 17:20:19", "remaining_time": "21:58:36", "throughput": 27702.04, "total_tokens": 6516056512} +{"current_steps": 22210, "total_steps": 29667, "loss": 0.3441, "lr": 2.7860017420094258e-05, "epoch": 2.245943810637424, "percentage": 74.86, "elapsed_time": "2 days, 17:22:18", "remaining_time": "21:56:54", "throughput": 27700.73, "total_tokens": 6519047680} +{"current_steps": 22220, "total_steps": 29667, "loss": 0.3449, "lr": 2.7855693546056445e-05, "epoch": 2.246955092753532, "percentage": 74.9, "elapsed_time": "2 days, 17:24:10", "remaining_time": "21:55:10", "throughput": 27700.31, "total_tokens": 6522040704} +{"current_steps": 22230, "total_steps": 29667, "loss": 0.3402, "lr": 2.785137168458937e-05, "epoch": 2.2479663748696392, "percentage": 74.93, "elapsed_time": "2 days, 17:25:55", "remaining_time": "21:53:24", "throughput": 27700.54, "total_tokens": 6525001792} +{"current_steps": 22240, "total_steps": 29667, "loss": 0.3469, "lr": 2.7847051834132265e-05, "epoch": 2.248977656985747, "percentage": 74.97, "elapsed_time": "2 days, 17:27:36", "remaining_time": "21:51:36", "throughput": 27701.13, "total_tokens": 6527952000} +{"current_steps": 22250, "total_steps": 29667, "loss": 0.3512, "lr": 2.784273399312603e-05, "epoch": 2.249988939101855, "percentage": 75.0, "elapsed_time": "2 days, 17:29:16", "remaining_time": "21:49:49", "throughput": 27701.83, "total_tokens": 6530896640} +{"current_steps": 22260, "total_steps": 29667, "loss": 0.3462, "lr": 2.783841816001326e-05, "epoch": 2.251000221217963, "percentage": 75.03, "elapsed_time": "2 days, 17:30:58", "remaining_time": "21:48:01", "throughput": 27702.28, "total_tokens": 6533813696} +{"current_steps": 22270, "total_steps": 29667, "loss": 0.3446, "lr": 2.7834104333238255e-05, "epoch": 2.252011503334071, "percentage": 75.07, "elapsed_time": "2 days, 17:32:37", "remaining_time": "21:46:13", "throughput": 27702.95, 
"total_tokens": 6536725312} +{"current_steps": 22280, "total_steps": 29667, "loss": 0.3506, "lr": 2.7829792511246987e-05, "epoch": 2.2530227854501783, "percentage": 75.1, "elapsed_time": "2 days, 17:34:17", "remaining_time": "21:44:25", "throughput": 27703.5, "total_tokens": 6539617664} +{"current_steps": 22290, "total_steps": 29667, "loss": 0.3419, "lr": 2.7825482692487114e-05, "epoch": 2.254034067566286, "percentage": 75.13, "elapsed_time": "2 days, 17:36:00", "remaining_time": "21:42:38", "throughput": 27703.76, "total_tokens": 6542537856} +{"current_steps": 22300, "total_steps": 29667, "loss": 0.3492, "lr": 2.7821174875407985e-05, "epoch": 2.255045349682394, "percentage": 75.17, "elapsed_time": "2 days, 17:37:45", "remaining_time": "21:40:52", "throughput": 27703.94, "total_tokens": 6545480192} +{"current_steps": 22310, "total_steps": 29667, "loss": 0.3466, "lr": 2.781686905846062e-05, "epoch": 2.256056631798502, "percentage": 75.2, "elapsed_time": "2 days, 17:39:24", "remaining_time": "21:39:03", "throughput": 27704.61, "total_tokens": 6548373632} +{"current_steps": 22320, "total_steps": 29667, "loss": 0.3463, "lr": 2.7812565240097716e-05, "epoch": 2.25706791391461, "percentage": 75.24, "elapsed_time": "2 days, 17:41:04", "remaining_time": "21:37:16", "throughput": 27705.37, "total_tokens": 6551327424} +{"current_steps": 22330, "total_steps": 29667, "loss": 0.3456, "lr": 2.7808263418773656e-05, "epoch": 2.258079196030718, "percentage": 75.27, "elapsed_time": "2 days, 17:42:46", "remaining_time": "21:35:29", "throughput": 27705.83, "total_tokens": 6554275392} +{"current_steps": 22340, "total_steps": 29667, "loss": 0.346, "lr": 2.7803963592944482e-05, "epoch": 2.2590904781468257, "percentage": 75.3, "elapsed_time": "2 days, 17:44:30", "remaining_time": "21:33:42", "throughput": 27706.2, "total_tokens": 6557251456} +{"current_steps": 22350, "total_steps": 29667, "loss": 0.3488, "lr": 2.779966576106792e-05, "epoch": 2.260101760262933, "percentage": 75.34, 
"elapsed_time": "2 days, 17:46:08", "remaining_time": "21:31:53", "throughput": 27707.11, "total_tokens": 6560158976} +{"current_steps": 22360, "total_steps": 29667, "loss": 0.343, "lr": 2.779536992160336e-05, "epoch": 2.261113042379041, "percentage": 75.37, "elapsed_time": "2 days, 17:47:56", "remaining_time": "21:30:08", "throughput": 27706.87, "total_tokens": 6563119104} +{"current_steps": 22370, "total_steps": 29667, "loss": 0.3455, "lr": 2.7791076073011845e-05, "epoch": 2.262124324495149, "percentage": 75.4, "elapsed_time": "2 days, 17:49:40", "remaining_time": "21:28:22", "throughput": 27707.18, "total_tokens": 6566071872} +{"current_steps": 22380, "total_steps": 29667, "loss": 0.3467, "lr": 2.7786784213756102e-05, "epoch": 2.263135606611257, "percentage": 75.44, "elapsed_time": "2 days, 17:51:25", "remaining_time": "21:26:35", "throughput": 27707.54, "total_tokens": 6569052608} +{"current_steps": 22390, "total_steps": 29667, "loss": 0.3498, "lr": 2.7782494342300502e-05, "epoch": 2.264146888727365, "percentage": 75.47, "elapsed_time": "2 days, 17:53:08", "remaining_time": "21:24:48", "throughput": 27708.04, "total_tokens": 6572027520} +{"current_steps": 22400, "total_steps": 29667, "loss": 0.349, "lr": 2.777820645711109e-05, "epoch": 2.2651581708434723, "percentage": 75.5, "elapsed_time": "2 days, 17:54:42", "remaining_time": "21:22:59", "throughput": 27709.12, "total_tokens": 6574880320} +{"current_steps": 22410, "total_steps": 29667, "loss": 0.3487, "lr": 2.777392055665556e-05, "epoch": 2.26616945295958, "percentage": 75.54, "elapsed_time": "2 days, 17:56:22", "remaining_time": "21:21:11", "throughput": 27709.62, "total_tokens": 6577790912} +{"current_steps": 22420, "total_steps": 29667, "loss": 0.3496, "lr": 2.7769636639403252e-05, "epoch": 2.267180735075688, "percentage": 75.57, "elapsed_time": "2 days, 17:58:10", "remaining_time": "21:19:25", "throughput": 27709.55, "total_tokens": 6580749824} +{"current_steps": 22430, "total_steps": 29667, "loss": 
0.3458, "lr": 2.776535470382518e-05, "epoch": 2.268192017191796, "percentage": 75.61, "elapsed_time": "2 days, 18:00:19", "remaining_time": "21:17:47", "throughput": 27706.93, "total_tokens": 6583706560} +{"current_steps": 22440, "total_steps": 29667, "loss": 0.3446, "lr": 2.776107474839399e-05, "epoch": 2.269203299307904, "percentage": 75.64, "elapsed_time": "2 days, 18:02:06", "remaining_time": "21:16:01", "throughput": 27707.0, "total_tokens": 6586691072} +{"current_steps": 22450, "total_steps": 29667, "loss": 0.3477, "lr": 2.7756796771583976e-05, "epoch": 2.270214581424012, "percentage": 75.67, "elapsed_time": "2 days, 18:03:48", "remaining_time": "21:14:14", "throughput": 27707.5, "total_tokens": 6589624192} +{"current_steps": 22460, "total_steps": 29667, "loss": 0.3529, "lr": 2.775252077187109e-05, "epoch": 2.2712258635401197, "percentage": 75.71, "elapsed_time": "2 days, 18:05:27", "remaining_time": "21:12:26", "throughput": 27708.3, "total_tokens": 6592570368} +{"current_steps": 22470, "total_steps": 29667, "loss": 0.3475, "lr": 2.7748246747732902e-05, "epoch": 2.272237145656227, "percentage": 75.74, "elapsed_time": "2 days, 18:07:12", "remaining_time": "21:10:40", "throughput": 27708.67, "total_tokens": 6595553472} +{"current_steps": 22480, "total_steps": 29667, "loss": 0.342, "lr": 2.774397469764866e-05, "epoch": 2.273248427772335, "percentage": 75.77, "elapsed_time": "2 days, 18:08:55", "remaining_time": "21:08:53", "throughput": 27709.09, "total_tokens": 6598520128} +{"current_steps": 22490, "total_steps": 29667, "loss": 0.3473, "lr": 2.7739704620099226e-05, "epoch": 2.274259709888443, "percentage": 75.81, "elapsed_time": "2 days, 18:10:38", "remaining_time": "21:07:06", "throughput": 27709.56, "total_tokens": 6601485376} +{"current_steps": 22500, "total_steps": 29667, "loss": 0.3474, "lr": 2.7735436513567098e-05, "epoch": 2.275270992004551, "percentage": 75.84, "elapsed_time": "2 days, 18:12:23", "remaining_time": "21:05:20", "throughput": 27709.78, 
"total_tokens": 6604444736} +{"current_steps": 22510, "total_steps": 29667, "loss": 0.3484, "lr": 2.7731170376536402e-05, "epoch": 2.2762822741206588, "percentage": 75.88, "elapsed_time": "2 days, 18:14:07", "remaining_time": "21:03:33", "throughput": 27709.93, "total_tokens": 6607375104} +{"current_steps": 22520, "total_steps": 29667, "loss": 0.3471, "lr": 2.7726906207492925e-05, "epoch": 2.277293556236766, "percentage": 75.91, "elapsed_time": "2 days, 18:15:59", "remaining_time": "21:01:49", "throughput": 27709.3, "total_tokens": 6610320960} +{"current_steps": 22530, "total_steps": 29667, "loss": 0.3468, "lr": 2.7722644004924048e-05, "epoch": 2.278304838352874, "percentage": 75.94, "elapsed_time": "2 days, 18:17:43", "remaining_time": "21:00:03", "throughput": 27709.52, "total_tokens": 6613254464} +{"current_steps": 22540, "total_steps": 29667, "loss": 0.3469, "lr": 2.77183837673188e-05, "epoch": 2.279316120468982, "percentage": 75.98, "elapsed_time": "2 days, 18:19:26", "remaining_time": "20:58:16", "throughput": 27709.86, "total_tokens": 6616194496} +{"current_steps": 22550, "total_steps": 29667, "loss": 0.3448, "lr": 2.7714125493167835e-05, "epoch": 2.28032740258509, "percentage": 76.01, "elapsed_time": "2 days, 18:21:06", "remaining_time": "20:56:28", "throughput": 27710.52, "total_tokens": 6619118784} +{"current_steps": 22560, "total_steps": 29667, "loss": 0.3434, "lr": 2.770986918096342e-05, "epoch": 2.281338684701198, "percentage": 76.04, "elapsed_time": "2 days, 18:22:44", "remaining_time": "20:54:40", "throughput": 27711.29, "total_tokens": 6622004864} +{"current_steps": 22570, "total_steps": 29667, "loss": 0.3462, "lr": 2.7705614829199454e-05, "epoch": 2.2823499668173057, "percentage": 76.08, "elapsed_time": "2 days, 18:24:26", "remaining_time": "20:52:52", "throughput": 27711.8, "total_tokens": 6624952384} +{"current_steps": 22580, "total_steps": 29667, "loss": 0.3413, "lr": 2.7701362436371437e-05, "epoch": 2.2833612489334136, "percentage": 76.11, 
"elapsed_time": "2 days, 18:26:05", "remaining_time": "20:51:04", "throughput": 27712.45, "total_tokens": 6627865152} +{"current_steps": 22590, "total_steps": 29667, "loss": 0.3472, "lr": 2.7697112000976492e-05, "epoch": 2.284372531049521, "percentage": 76.15, "elapsed_time": "2 days, 18:27:39", "remaining_time": "20:49:15", "throughput": 27713.55, "total_tokens": 6630726144} +{"current_steps": 22600, "total_steps": 29667, "loss": 0.3477, "lr": 2.769286352151338e-05, "epoch": 2.285383813165629, "percentage": 76.18, "elapsed_time": "2 days, 18:29:21", "remaining_time": "20:47:28", "throughput": 27714.0, "total_tokens": 6633672448} +{"current_steps": 22610, "total_steps": 29667, "loss": 0.3498, "lr": 2.768861699648243e-05, "epoch": 2.286395095281737, "percentage": 76.21, "elapsed_time": "2 days, 18:31:06", "remaining_time": "20:45:41", "throughput": 27714.24, "total_tokens": 6636631872} +{"current_steps": 22620, "total_steps": 29667, "loss": 0.3493, "lr": 2.7684372424385613e-05, "epoch": 2.287406377397845, "percentage": 76.25, "elapsed_time": "2 days, 18:32:47", "remaining_time": "20:43:54", "throughput": 27714.7, "total_tokens": 6639539072} +{"current_steps": 22630, "total_steps": 29667, "loss": 0.3504, "lr": 2.7680129803726496e-05, "epoch": 2.2884176595139527, "percentage": 76.28, "elapsed_time": "2 days, 18:34:30", "remaining_time": "20:42:07", "throughput": 27715.29, "total_tokens": 6642524864} +{"current_steps": 22640, "total_steps": 29667, "loss": 0.3466, "lr": 2.767588913301025e-05, "epoch": 2.28942894163006, "percentage": 76.31, "elapsed_time": "2 days, 18:36:07", "remaining_time": "20:40:18", "throughput": 27716.22, "total_tokens": 6645438784} +{"current_steps": 22650, "total_steps": 29667, "loss": 0.3426, "lr": 2.767165041074365e-05, "epoch": 2.290440223746168, "percentage": 76.35, "elapsed_time": "2 days, 18:37:48", "remaining_time": "20:38:31", "throughput": 27716.74, "total_tokens": 6648367872} +{"current_steps": 22660, "total_steps": 29667, "loss": 
0.3532, "lr": 2.766741363543507e-05, "epoch": 2.291451505862276, "percentage": 76.38, "elapsed_time": "2 days, 18:39:26", "remaining_time": "20:36:43", "throughput": 27717.73, "total_tokens": 6651327232} +{"current_steps": 22670, "total_steps": 29667, "loss": 0.3417, "lr": 2.7663178805594482e-05, "epoch": 2.292462787978384, "percentage": 76.41, "elapsed_time": "2 days, 18:41:10", "remaining_time": "20:34:56", "throughput": 27718.15, "total_tokens": 6654310016} +{"current_steps": 22680, "total_steps": 29667, "loss": 0.3462, "lr": 2.7658945919733463e-05, "epoch": 2.293474070094492, "percentage": 76.45, "elapsed_time": "2 days, 18:42:53", "remaining_time": "20:33:10", "throughput": 27718.69, "total_tokens": 6657305536} +{"current_steps": 22690, "total_steps": 29667, "loss": 0.3468, "lr": 2.7654714976365164e-05, "epoch": 2.2944853522105997, "percentage": 76.48, "elapsed_time": "2 days, 18:44:34", "remaining_time": "20:31:22", "throughput": 27719.27, "total_tokens": 6660243456} +{"current_steps": 22700, "total_steps": 29667, "loss": 0.3433, "lr": 2.765048597400436e-05, "epoch": 2.295496634326707, "percentage": 76.52, "elapsed_time": "2 days, 18:46:20", "remaining_time": "20:29:36", "throughput": 27719.4, "total_tokens": 6663198720} +{"current_steps": 22710, "total_steps": 29667, "loss": 0.3447, "lr": 2.7646258911167373e-05, "epoch": 2.296507916442815, "percentage": 76.55, "elapsed_time": "2 days, 18:48:02", "remaining_time": "20:27:49", "throughput": 27719.85, "total_tokens": 6666152704} +{"current_steps": 22720, "total_steps": 29667, "loss": 0.3475, "lr": 2.7642033786372145e-05, "epoch": 2.297519198558923, "percentage": 76.58, "elapsed_time": "2 days, 18:49:41", "remaining_time": "20:26:01", "throughput": 27720.56, "total_tokens": 6669050624} +{"current_steps": 22730, "total_steps": 29667, "loss": 0.3513, "lr": 2.7637810598138193e-05, "epoch": 2.298530480675031, "percentage": 76.62, "elapsed_time": "2 days, 18:51:28", "remaining_time": "20:24:15", "throughput": 
27720.58, "total_tokens": 6672014464} +{"current_steps": 22740, "total_steps": 29667, "loss": 0.3498, "lr": 2.7633589344986615e-05, "epoch": 2.2995417627911388, "percentage": 76.65, "elapsed_time": "2 days, 18:53:16", "remaining_time": "20:22:30", "throughput": 27720.42, "total_tokens": 6674991104} +{"current_steps": 22750, "total_steps": 29667, "loss": 0.3424, "lr": 2.7629370025440087e-05, "epoch": 2.3005530449072467, "percentage": 76.68, "elapsed_time": "2 days, 18:54:56", "remaining_time": "20:20:43", "throughput": 27721.29, "total_tokens": 6677950912} +{"current_steps": 22760, "total_steps": 29667, "loss": 0.3449, "lr": 2.762515263802287e-05, "epoch": 2.301564327023354, "percentage": 76.72, "elapsed_time": "2 days, 18:56:35", "remaining_time": "20:18:55", "throughput": 27722.08, "total_tokens": 6680883136} +{"current_steps": 22770, "total_steps": 29667, "loss": 0.346, "lr": 2.762093718126081e-05, "epoch": 2.302575609139462, "percentage": 76.75, "elapsed_time": "2 days, 18:58:12", "remaining_time": "20:17:06", "throughput": 27722.87, "total_tokens": 6683784128} +{"current_steps": 22780, "total_steps": 29667, "loss": 0.3462, "lr": 2.7616723653681298e-05, "epoch": 2.30358689125557, "percentage": 76.79, "elapsed_time": "2 days, 18:59:52", "remaining_time": "20:15:19", "throughput": 27723.44, "total_tokens": 6686697216} +{"current_steps": 22790, "total_steps": 29667, "loss": 0.3432, "lr": 2.761251205381332e-05, "epoch": 2.304598173371678, "percentage": 76.82, "elapsed_time": "2 days, 19:01:33", "remaining_time": "20:13:31", "throughput": 27723.96, "total_tokens": 6689600768} +{"current_steps": 22800, "total_steps": 29667, "loss": 0.3446, "lr": 2.760830238018744e-05, "epoch": 2.3056094554877857, "percentage": 76.85, "elapsed_time": "2 days, 19:03:11", "remaining_time": "20:11:43", "throughput": 27724.69, "total_tokens": 6692511040} +{"current_steps": 22810, "total_steps": 29667, "loss": 0.3487, "lr": 2.760409463133576e-05, "epoch": 2.306620737603893, "percentage": 
76.89, "elapsed_time": "2 days, 19:04:52", "remaining_time": "20:09:55", "throughput": 27725.37, "total_tokens": 6695464768} +{"current_steps": 22820, "total_steps": 29667, "loss": 0.3457, "lr": 2.7599888805791967e-05, "epoch": 2.307632019720001, "percentage": 76.92, "elapsed_time": "2 days, 19:06:32", "remaining_time": "20:08:08", "throughput": 27726.1, "total_tokens": 6698408896} +{"current_steps": 22830, "total_steps": 29667, "loss": 0.3441, "lr": 2.759568490209132e-05, "epoch": 2.308643301836109, "percentage": 76.95, "elapsed_time": "2 days, 19:08:12", "remaining_time": "20:06:20", "throughput": 27726.75, "total_tokens": 6701349184} +{"current_steps": 22840, "total_steps": 29667, "loss": 0.3457, "lr": 2.7591482918770613e-05, "epoch": 2.309654583952217, "percentage": 76.99, "elapsed_time": "2 days, 19:09:52", "remaining_time": "20:04:32", "throughput": 27727.48, "total_tokens": 6704285120} +{"current_steps": 22850, "total_steps": 29667, "loss": 0.3484, "lr": 2.7587282854368222e-05, "epoch": 2.310665866068325, "percentage": 77.02, "elapsed_time": "2 days, 19:11:36", "remaining_time": "20:02:46", "throughput": 27727.74, "total_tokens": 6707229824} +{"current_steps": 22860, "total_steps": 29667, "loss": 0.3442, "lr": 2.7583084707424072e-05, "epoch": 2.3116771481844327, "percentage": 77.06, "elapsed_time": "2 days, 19:13:17", "remaining_time": "20:00:59", "throughput": 27728.11, "total_tokens": 6710146752} +{"current_steps": 22870, "total_steps": 29667, "loss": 0.3491, "lr": 2.7578888476479643e-05, "epoch": 2.3126884303005406, "percentage": 77.09, "elapsed_time": "2 days, 19:15:00", "remaining_time": "19:59:12", "throughput": 27728.35, "total_tokens": 6713045440} +{"current_steps": 22880, "total_steps": 29667, "loss": 0.3482, "lr": 2.7574694160077964e-05, "epoch": 2.313699712416648, "percentage": 77.12, "elapsed_time": "2 days, 19:16:40", "remaining_time": "19:57:25", "throughput": 27728.92, "total_tokens": 6715955712} +{"current_steps": 22890, "total_steps": 29667, 
"loss": 0.3519, "lr": 2.757050175676362e-05, "epoch": 2.314710994532756, "percentage": 77.16, "elapsed_time": "2 days, 19:18:16", "remaining_time": "19:55:36", "throughput": 27729.81, "total_tokens": 6718847296} +{"current_steps": 22900, "total_steps": 29667, "loss": 0.344, "lr": 2.756631126508274e-05, "epoch": 2.315722276648864, "percentage": 77.19, "elapsed_time": "2 days, 19:19:59", "remaining_time": "19:53:49", "throughput": 27730.13, "total_tokens": 6721767424} +{"current_steps": 22910, "total_steps": 29667, "loss": 0.3382, "lr": 2.7562122683583004e-05, "epoch": 2.316733558764972, "percentage": 77.22, "elapsed_time": "2 days, 19:21:39", "remaining_time": "19:52:01", "throughput": 27730.84, "total_tokens": 6724710976} +{"current_steps": 22920, "total_steps": 29667, "loss": 0.3434, "lr": 2.7557936010813634e-05, "epoch": 2.3177448408810797, "percentage": 77.26, "elapsed_time": "2 days, 19:23:20", "remaining_time": "19:50:14", "throughput": 27731.36, "total_tokens": 6727654784} +{"current_steps": 22930, "total_steps": 29667, "loss": 0.3429, "lr": 2.75537512453254e-05, "epoch": 2.318756122997187, "percentage": 77.29, "elapsed_time": "2 days, 19:25:01", "remaining_time": "19:48:27", "throughput": 27732.1, "total_tokens": 6730608448} +{"current_steps": 22940, "total_steps": 29667, "loss": 0.3509, "lr": 2.7549568385670595e-05, "epoch": 2.319767405113295, "percentage": 77.32, "elapsed_time": "2 days, 19:26:43", "remaining_time": "19:46:40", "throughput": 27732.66, "total_tokens": 6733587072} +{"current_steps": 22950, "total_steps": 29667, "loss": 0.3466, "lr": 2.754538743040307e-05, "epoch": 2.320778687229403, "percentage": 77.36, "elapsed_time": "2 days, 19:28:19", "remaining_time": "19:44:51", "throughput": 27733.8, "total_tokens": 6736536192} +{"current_steps": 22960, "total_steps": 29667, "loss": 0.3431, "lr": 2.75412083780782e-05, "epoch": 2.321789969345511, "percentage": 77.39, "elapsed_time": "2 days, 19:29:59", "remaining_time": "19:43:04", "throughput": 
27734.59, "total_tokens": 6739483904} +{"current_steps": 22970, "total_steps": 29667, "loss": 0.3516, "lr": 2.7537031227252898e-05, "epoch": 2.3228012514616188, "percentage": 77.43, "elapsed_time": "2 days, 19:31:38", "remaining_time": "19:41:16", "throughput": 27735.21, "total_tokens": 6742388928} +{"current_steps": 22980, "total_steps": 29667, "loss": 0.3427, "lr": 2.75328559764856e-05, "epoch": 2.3238125335777267, "percentage": 77.46, "elapsed_time": "2 days, 19:33:18", "remaining_time": "19:39:28", "throughput": 27735.93, "total_tokens": 6745327360} +{"current_steps": 22990, "total_steps": 29667, "loss": 0.3501, "lr": 2.752868262433629e-05, "epoch": 2.3248238156938346, "percentage": 77.49, "elapsed_time": "2 days, 19:35:02", "remaining_time": "19:37:42", "throughput": 27736.2, "total_tokens": 6748299712} +{"current_steps": 23000, "total_steps": 29667, "loss": 0.3441, "lr": 2.752451116936646e-05, "epoch": 2.325835097809942, "percentage": 77.53, "elapsed_time": "2 days, 19:36:46", "remaining_time": "19:35:56", "throughput": 27736.61, "total_tokens": 6751261632} +{"current_steps": 23010, "total_steps": 29667, "loss": 0.3458, "lr": 2.752034161013915e-05, "epoch": 2.32684637992605, "percentage": 77.56, "elapsed_time": "2 days, 19:38:27", "remaining_time": "19:34:08", "throughput": 27737.22, "total_tokens": 6754225600} +{"current_steps": 23020, "total_steps": 29667, "loss": 0.3482, "lr": 2.7516173945218888e-05, "epoch": 2.327857662042158, "percentage": 77.59, "elapsed_time": "2 days, 19:40:08", "remaining_time": "19:32:21", "throughput": 27737.78, "total_tokens": 6757165184} +{"current_steps": 23030, "total_steps": 29667, "loss": 0.3468, "lr": 2.751200817317176e-05, "epoch": 2.3288689441582657, "percentage": 77.63, "elapsed_time": "2 days, 19:41:48", "remaining_time": "19:30:34", "throughput": 27738.46, "total_tokens": 6760089472} +{"current_steps": 23040, "total_steps": 29667, "loss": 0.35, "lr": 2.7507844292565354e-05, "epoch": 2.3298802262743736, "percentage": 
77.66, "elapsed_time": "2 days, 19:43:30", "remaining_time": "19:28:47", "throughput": 27738.81, "total_tokens": 6763015232} +{"current_steps": 23050, "total_steps": 29667, "loss": 0.3456, "lr": 2.7503682301968763e-05, "epoch": 2.330891508390481, "percentage": 77.7, "elapsed_time": "2 days, 19:45:08", "remaining_time": "19:26:59", "throughput": 27739.64, "total_tokens": 6765935488} +{"current_steps": 23060, "total_steps": 29667, "loss": 0.3456, "lr": 2.7499522199952627e-05, "epoch": 2.331902790506589, "percentage": 77.73, "elapsed_time": "2 days, 19:46:51", "remaining_time": "19:25:12", "throughput": 27740.12, "total_tokens": 6768915712} +{"current_steps": 23070, "total_steps": 29667, "loss": 0.349, "lr": 2.7495363985089072e-05, "epoch": 2.332914072622697, "percentage": 77.76, "elapsed_time": "2 days, 19:48:34", "remaining_time": "19:23:25", "throughput": 27740.56, "total_tokens": 6771862592} +{"current_steps": 23080, "total_steps": 29667, "loss": 0.3489, "lr": 2.7491207655951745e-05, "epoch": 2.333925354738805, "percentage": 77.8, "elapsed_time": "2 days, 19:50:13", "remaining_time": "19:21:38", "throughput": 27741.27, "total_tokens": 6774799232} +{"current_steps": 23090, "total_steps": 29667, "loss": 0.348, "lr": 2.7487053211115797e-05, "epoch": 2.3349366368549127, "percentage": 77.83, "elapsed_time": "2 days, 19:51:55", "remaining_time": "19:19:51", "throughput": 27741.75, "total_tokens": 6777747136} +{"current_steps": 23100, "total_steps": 29667, "loss": 0.3413, "lr": 2.748290064915789e-05, "epoch": 2.3359479189710206, "percentage": 77.86, "elapsed_time": "2 days, 19:53:39", "remaining_time": "19:18:05", "throughput": 27741.86, "total_tokens": 6780657856} +{"current_steps": 23110, "total_steps": 29667, "loss": 0.3465, "lr": 2.747874996865619e-05, "epoch": 2.3369592010871285, "percentage": 77.9, "elapsed_time": "2 days, 19:55:16", "remaining_time": "19:16:16", "throughput": 27742.76, "total_tokens": 6783556544} +{"current_steps": 23120, "total_steps": 29667, 
"loss": 0.3455, "lr": 2.747460116819037e-05, "epoch": 2.337970483203236, "percentage": 77.93, "elapsed_time": "2 days, 19:56:53", "remaining_time": "19:14:28", "throughput": 27743.59, "total_tokens": 6786445312} +{"current_steps": 23130, "total_steps": 29667, "loss": 0.3504, "lr": 2.7470454246341597e-05, "epoch": 2.338981765319344, "percentage": 77.97, "elapsed_time": "2 days, 19:58:37", "remaining_time": "19:12:41", "throughput": 27743.74, "total_tokens": 6789374272} +{"current_steps": 23140, "total_steps": 29667, "loss": 0.3441, "lr": 2.746630920169254e-05, "epoch": 2.339993047435452, "percentage": 78.0, "elapsed_time": "2 days, 20:00:21", "remaining_time": "19:10:55", "throughput": 27743.8, "total_tokens": 6792279104} +{"current_steps": 23150, "total_steps": 29667, "loss": 0.3456, "lr": 2.7462166032827358e-05, "epoch": 2.3410043295515597, "percentage": 78.03, "elapsed_time": "2 days, 20:02:11", "remaining_time": "19:09:11", "throughput": 27743.29, "total_tokens": 6795203008} +{"current_steps": 23160, "total_steps": 29667, "loss": 0.3445, "lr": 2.745802473833171e-05, "epoch": 2.3420156116676676, "percentage": 78.07, "elapsed_time": "2 days, 20:03:53", "remaining_time": "19:07:24", "throughput": 27743.53, "total_tokens": 6798100672} +{"current_steps": 23170, "total_steps": 29667, "loss": 0.3458, "lr": 2.7453885316792755e-05, "epoch": 2.343026893783775, "percentage": 78.1, "elapsed_time": "2 days, 20:05:34", "remaining_time": "19:05:37", "throughput": 27743.99, "total_tokens": 6801013568} +{"current_steps": 23180, "total_steps": 29667, "loss": 0.3466, "lr": 2.7449747766799135e-05, "epoch": 2.344038175899883, "percentage": 78.13, "elapsed_time": "2 days, 20:07:14", "remaining_time": "19:03:49", "throughput": 27744.61, "total_tokens": 6803933568} +{"current_steps": 23190, "total_steps": 29667, "loss": 0.3455, "lr": 2.744561208694097e-05, "epoch": 2.345049458015991, "percentage": 78.17, "elapsed_time": "2 days, 20:08:57", "remaining_time": "19:02:02", "throughput": 
27745.0, "total_tokens": 6806876288} +{"current_steps": 23200, "total_steps": 29667, "loss": 0.3426, "lr": 2.7441478275809884e-05, "epoch": 2.3460607401320988, "percentage": 78.2, "elapsed_time": "2 days, 20:10:42", "remaining_time": "19:00:17", "throughput": 27745.01, "total_tokens": 6809801088} +{"current_steps": 23210, "total_steps": 29667, "loss": 0.3462, "lr": 2.743734633199898e-05, "epoch": 2.3470720222482067, "percentage": 78.24, "elapsed_time": "2 days, 20:12:25", "remaining_time": "18:58:30", "throughput": 27745.3, "total_tokens": 6812739584} +{"current_steps": 23220, "total_steps": 29667, "loss": 0.3468, "lr": 2.743321625410284e-05, "epoch": 2.3480833043643146, "percentage": 78.27, "elapsed_time": "2 days, 20:14:07", "remaining_time": "18:56:43", "throughput": 27745.58, "total_tokens": 6815644224} +{"current_steps": 23230, "total_steps": 29667, "loss": 0.3488, "lr": 2.7429088040717526e-05, "epoch": 2.349094586480422, "percentage": 78.3, "elapsed_time": "2 days, 20:15:47", "remaining_time": "18:54:56", "throughput": 27746.15, "total_tokens": 6818548352} +{"current_steps": 23240, "total_steps": 29667, "loss": 0.3466, "lr": 2.7424961690440586e-05, "epoch": 2.35010586859653, "percentage": 78.34, "elapsed_time": "2 days, 20:17:27", "remaining_time": "18:53:08", "throughput": 27746.81, "total_tokens": 6821474048} +{"current_steps": 23250, "total_steps": 29667, "loss": 0.3461, "lr": 2.742083720187103e-05, "epoch": 2.351117150712638, "percentage": 78.37, "elapsed_time": "2 days, 20:19:09", "remaining_time": "18:51:22", "throughput": 27747.31, "total_tokens": 6824440832} +{"current_steps": 23260, "total_steps": 29667, "loss": 0.3457, "lr": 2.7416714573609363e-05, "epoch": 2.3521284328287457, "percentage": 78.4, "elapsed_time": "2 days, 20:20:48", "remaining_time": "18:49:34", "throughput": 27748.12, "total_tokens": 6827372096} +{"current_steps": 23270, "total_steps": 29667, "loss": 0.3485, "lr": 2.7412593804257543e-05, "epoch": 2.3531397149448536, "percentage": 
78.44, "elapsed_time": "2 days, 20:22:27", "remaining_time": "18:47:46", "throughput": 27748.73, "total_tokens": 6830288128} +{"current_steps": 23280, "total_steps": 29667, "loss": 0.3473, "lr": 2.740847489241901e-05, "epoch": 2.3541509970609615, "percentage": 78.47, "elapsed_time": "2 days, 20:24:07", "remaining_time": "18:45:59", "throughput": 27749.24, "total_tokens": 6833193536} +{"current_steps": 23290, "total_steps": 29667, "loss": 0.3471, "lr": 2.7404357836698668e-05, "epoch": 2.355162279177069, "percentage": 78.5, "elapsed_time": "2 days, 20:25:45", "remaining_time": "18:44:11", "throughput": 27750.11, "total_tokens": 6836102464} +{"current_steps": 23300, "total_steps": 29667, "loss": 0.3495, "lr": 2.740024263570289e-05, "epoch": 2.356173561293177, "percentage": 78.54, "elapsed_time": "2 days, 20:27:21", "remaining_time": "18:42:23", "throughput": 27750.95, "total_tokens": 6838985664} +{"current_steps": 23310, "total_steps": 29667, "loss": 0.349, "lr": 2.7396129288039503e-05, "epoch": 2.357184843409285, "percentage": 78.57, "elapsed_time": "2 days, 20:28:59", "remaining_time": "18:40:35", "throughput": 27751.72, "total_tokens": 6841892672} +{"current_steps": 23320, "total_steps": 29667, "loss": 0.3439, "lr": 2.739201779231782e-05, "epoch": 2.3581961255253927, "percentage": 78.61, "elapsed_time": "2 days, 20:30:39", "remaining_time": "18:38:47", "throughput": 27752.4, "total_tokens": 6844849024} +{"current_steps": 23330, "total_steps": 29667, "loss": 0.346, "lr": 2.7387908147148587e-05, "epoch": 2.3592074076415006, "percentage": 78.64, "elapsed_time": "2 days, 20:32:24", "remaining_time": "18:37:01", "throughput": 27752.72, "total_tokens": 6847839232} +{"current_steps": 23340, "total_steps": 29667, "loss": 0.3442, "lr": 2.7383800351144027e-05, "epoch": 2.360218689757608, "percentage": 78.67, "elapsed_time": "2 days, 20:34:02", "remaining_time": "18:35:13", "throughput": 27753.39, "total_tokens": 6850709888} +{"current_steps": 23350, "total_steps": 29667, 
"loss": 0.3484, "lr": 2.737969440291782e-05, "epoch": 2.361229971873716, "percentage": 78.71, "elapsed_time": "2 days, 20:35:49", "remaining_time": "18:33:28", "throughput": 27753.17, "total_tokens": 6853624256} +{"current_steps": 23360, "total_steps": 29667, "loss": 0.3436, "lr": 2.7375590301085087e-05, "epoch": 2.362241253989824, "percentage": 78.74, "elapsed_time": "2 days, 20:37:31", "remaining_time": "18:31:41", "throughput": 27753.45, "total_tokens": 6856532352} +{"current_steps": 23370, "total_steps": 29667, "loss": 0.3491, "lr": 2.7371488044262406e-05, "epoch": 2.363252536105932, "percentage": 78.77, "elapsed_time": "2 days, 20:39:16", "remaining_time": "18:29:55", "throughput": 27753.24, "total_tokens": 6859397504} +{"current_steps": 23380, "total_steps": 29667, "loss": 0.3422, "lr": 2.7367387631067816e-05, "epoch": 2.3642638182220397, "percentage": 78.81, "elapsed_time": "2 days, 20:40:55", "remaining_time": "18:28:08", "throughput": 27753.82, "total_tokens": 6862298432} +{"current_steps": 23390, "total_steps": 29667, "loss": 0.3506, "lr": 2.73632890601208e-05, "epoch": 2.3652751003381476, "percentage": 78.84, "elapsed_time": "2 days, 20:42:36", "remaining_time": "18:26:21", "throughput": 27754.29, "total_tokens": 6865192000} +{"current_steps": 23400, "total_steps": 29667, "loss": 0.3502, "lr": 2.7359192330042277e-05, "epoch": 2.3662863824542555, "percentage": 78.88, "elapsed_time": "2 days, 20:44:13", "remaining_time": "18:24:33", "throughput": 27755.09, "total_tokens": 6868092544} +{"current_steps": 23410, "total_steps": 29667, "loss": 0.3469, "lr": 2.7355097439454625e-05, "epoch": 2.367297664570363, "percentage": 78.91, "elapsed_time": "2 days, 20:45:52", "remaining_time": "18:22:45", "throughput": 27755.92, "total_tokens": 6871053504} +{"current_steps": 23420, "total_steps": 29667, "loss": 0.3494, "lr": 2.735100438698166e-05, "epoch": 2.368308946686471, "percentage": 78.94, "elapsed_time": "2 days, 20:47:35", "remaining_time": "18:20:58", 
"throughput": 27756.3, "total_tokens": 6873988160} +{"current_steps": 23430, "total_steps": 29667, "loss": 0.3461, "lr": 2.7346913171248635e-05, "epoch": 2.3693202288025788, "percentage": 78.98, "elapsed_time": "2 days, 20:49:20", "remaining_time": "18:19:13", "throughput": 27756.43, "total_tokens": 6876940352} +{"current_steps": 23440, "total_steps": 29667, "loss": 0.3488, "lr": 2.734282379088225e-05, "epoch": 2.3703315109186867, "percentage": 79.01, "elapsed_time": "2 days, 20:50:58", "remaining_time": "18:17:25", "throughput": 27757.14, "total_tokens": 6879853504} +{"current_steps": 23450, "total_steps": 29667, "loss": 0.3455, "lr": 2.733873624451063e-05, "epoch": 2.3713427930347946, "percentage": 79.04, "elapsed_time": "2 days, 20:52:37", "remaining_time": "18:15:37", "throughput": 27758.04, "total_tokens": 6882801088} +{"current_steps": 23460, "total_steps": 29667, "loss": 0.3535, "lr": 2.733465053076335e-05, "epoch": 2.372354075150902, "percentage": 79.08, "elapsed_time": "2 days, 20:54:19", "remaining_time": "18:13:51", "throughput": 27758.35, "total_tokens": 6885721984} +{"current_steps": 23470, "total_steps": 29667, "loss": 0.3486, "lr": 2.733056664827141e-05, "epoch": 2.37336535726701, "percentage": 79.11, "elapsed_time": "2 days, 20:56:00", "remaining_time": "18:12:04", "throughput": 27759.09, "total_tokens": 6888719552} +{"current_steps": 23480, "total_steps": 29667, "loss": 0.345, "lr": 2.732648459566724e-05, "epoch": 2.374376639383118, "percentage": 79.15, "elapsed_time": "2 days, 20:57:42", "remaining_time": "18:10:17", "throughput": 27759.72, "total_tokens": 6891693696} +{"current_steps": 23490, "total_steps": 29667, "loss": 0.35, "lr": 2.73224043715847e-05, "epoch": 2.3753879214992257, "percentage": 79.18, "elapsed_time": "2 days, 20:59:23", "remaining_time": "18:08:30", "throughput": 27760.26, "total_tokens": 6894641408} +{"current_steps": 23500, "total_steps": 29667, "loss": 0.3462, "lr": 2.731832597465908e-05, "epoch": 2.3763992036153336, 
"percentage": 79.21, "elapsed_time": "2 days, 21:01:03", "remaining_time": "18:06:43", "throughput": 27760.86, "total_tokens": 6897561792} +{"current_steps": 23510, "total_steps": 29667, "loss": 0.3459, "lr": 2.7314249403527097e-05, "epoch": 2.3774104857314415, "percentage": 79.25, "elapsed_time": "2 days, 21:02:42", "remaining_time": "18:04:55", "throughput": 27761.54, "total_tokens": 6900490304} +{"current_steps": 23520, "total_steps": 29667, "loss": 0.3429, "lr": 2.731017465682689e-05, "epoch": 2.3784217678475494, "percentage": 79.28, "elapsed_time": "2 days, 21:04:29", "remaining_time": "18:03:10", "throughput": 27761.54, "total_tokens": 6903460224} +{"current_steps": 23530, "total_steps": 29667, "loss": 0.3474, "lr": 2.730610173319802e-05, "epoch": 2.379433049963657, "percentage": 79.31, "elapsed_time": "2 days, 21:06:08", "remaining_time": "18:01:22", "throughput": 27762.33, "total_tokens": 6906393728} +{"current_steps": 23540, "total_steps": 29667, "loss": 0.3491, "lr": 2.7302030631281454e-05, "epoch": 2.380444332079765, "percentage": 79.35, "elapsed_time": "2 days, 21:07:48", "remaining_time": "17:59:35", "throughput": 27762.92, "total_tokens": 6909311232} +{"current_steps": 23550, "total_steps": 29667, "loss": 0.3455, "lr": 2.7297961349719608e-05, "epoch": 2.3814556141958727, "percentage": 79.38, "elapsed_time": "2 days, 21:09:27", "remaining_time": "17:57:48", "throughput": 27763.68, "total_tokens": 6912255104} +{"current_steps": 23560, "total_steps": 29667, "loss": 0.3484, "lr": 2.729389388715628e-05, "epoch": 2.3824668963119806, "percentage": 79.41, "elapsed_time": "2 days, 21:11:04", "remaining_time": "17:56:00", "throughput": 27764.61, "total_tokens": 6915171392} +{"current_steps": 23570, "total_steps": 29667, "loss": 0.3462, "lr": 2.728982824223671e-05, "epoch": 2.3834781784280885, "percentage": 79.45, "elapsed_time": "2 days, 21:12:43", "remaining_time": "17:54:12", "throughput": 27765.28, "total_tokens": 6918101248} +{"current_steps": 23580, 
"total_steps": 29667, "loss": 0.3496, "lr": 2.7285764413607527e-05, "epoch": 2.384489460544196, "percentage": 79.48, "elapsed_time": "2 days, 21:14:22", "remaining_time": "17:52:25", "throughput": 27765.94, "total_tokens": 6921011904} +{"current_steps": 23590, "total_steps": 29667, "loss": 0.3454, "lr": 2.7281702399916786e-05, "epoch": 2.385500742660304, "percentage": 79.52, "elapsed_time": "2 days, 21:16:01", "remaining_time": "17:50:37", "throughput": 27766.48, "total_tokens": 6923894848} +{"current_steps": 23600, "total_steps": 29667, "loss": 0.3477, "lr": 2.7277642199813954e-05, "epoch": 2.3865120247764118, "percentage": 79.55, "elapsed_time": "2 days, 21:17:39", "remaining_time": "17:48:50", "throughput": 27767.27, "total_tokens": 6926819456} +{"current_steps": 23610, "total_steps": 29667, "loss": 0.3443, "lr": 2.7273583811949882e-05, "epoch": 2.3875233068925197, "percentage": 79.58, "elapsed_time": "2 days, 21:19:24", "remaining_time": "17:47:04", "throughput": 27767.43, "total_tokens": 6929775424} +{"current_steps": 23620, "total_steps": 29667, "loss": 0.3477, "lr": 2.7269527234976844e-05, "epoch": 2.3885345890086276, "percentage": 79.62, "elapsed_time": "2 days, 21:21:08", "remaining_time": "17:45:18", "throughput": 27767.79, "total_tokens": 6932739968} +{"current_steps": 23630, "total_steps": 29667, "loss": 0.3445, "lr": 2.726547246754852e-05, "epoch": 2.3895458711247355, "percentage": 79.65, "elapsed_time": "2 days, 21:22:48", "remaining_time": "17:43:30", "throughput": 27768.48, "total_tokens": 6935684992} +{"current_steps": 23640, "total_steps": 29667, "loss": 0.3425, "lr": 2.726141950831998e-05, "epoch": 2.3905571532408434, "percentage": 79.68, "elapsed_time": "2 days, 21:24:25", "remaining_time": "17:41:42", "throughput": 27769.36, "total_tokens": 6938599232} +{"current_steps": 23650, "total_steps": 29667, "loss": 0.3471, "lr": 2.7257368355947686e-05, "epoch": 2.391568435356951, "percentage": 79.72, "elapsed_time": "2 days, 21:26:05", 
"remaining_time": "17:39:55", "throughput": 27769.91, "total_tokens": 6941513408} +{"current_steps": 23660, "total_steps": 29667, "loss": 0.3481, "lr": 2.7253319009089528e-05, "epoch": 2.3925797174730588, "percentage": 79.75, "elapsed_time": "2 days, 21:27:46", "remaining_time": "17:38:08", "throughput": 27770.5, "total_tokens": 6944460416} +{"current_steps": 23670, "total_steps": 29667, "loss": 0.3474, "lr": 2.7249271466404758e-05, "epoch": 2.3935909995891667, "percentage": 79.79, "elapsed_time": "2 days, 21:29:27", "remaining_time": "17:36:22", "throughput": 27770.96, "total_tokens": 6947385984} +{"current_steps": 23680, "total_steps": 29667, "loss": 0.3422, "lr": 2.724522572655403e-05, "epoch": 2.3946022817052746, "percentage": 79.82, "elapsed_time": "2 days, 21:31:05", "remaining_time": "17:34:34", "throughput": 27771.68, "total_tokens": 6950284800} +{"current_steps": 23690, "total_steps": 29667, "loss": 0.3461, "lr": 2.7241181788199405e-05, "epoch": 2.3956135638213825, "percentage": 79.85, "elapsed_time": "2 days, 21:32:44", "remaining_time": "17:32:47", "throughput": 27772.49, "total_tokens": 6953241024} +{"current_steps": 23700, "total_steps": 29667, "loss": 0.3469, "lr": 2.7237139650004316e-05, "epoch": 2.39662484593749, "percentage": 79.89, "elapsed_time": "2 days, 21:34:26", "remaining_time": "17:31:00", "throughput": 27773.0, "total_tokens": 6956213952} +{"current_steps": 23710, "total_steps": 29667, "loss": 0.3444, "lr": 2.7233099310633598e-05, "epoch": 2.397636128053598, "percentage": 79.92, "elapsed_time": "2 days, 21:36:05", "remaining_time": "17:29:13", "throughput": 27773.67, "total_tokens": 6959128576} +{"current_steps": 23720, "total_steps": 29667, "loss": 0.3443, "lr": 2.722906076875345e-05, "epoch": 2.3986474101697057, "percentage": 79.95, "elapsed_time": "2 days, 21:37:41", "remaining_time": "17:27:24", "throughput": 27774.64, "total_tokens": 6962023168} +{"current_steps": 23730, "total_steps": 29667, "loss": 0.3446, "lr": 
2.7225024023031487e-05, "epoch": 2.3996586922858136, "percentage": 79.99, "elapsed_time": "2 days, 21:39:23", "remaining_time": "17:25:38", "throughput": 27775.2, "total_tokens": 6965020480} +{"current_steps": 23740, "total_steps": 29667, "loss": 0.3465, "lr": 2.7220989072136676e-05, "epoch": 2.4006699744019215, "percentage": 80.02, "elapsed_time": "2 days, 21:40:59", "remaining_time": "17:23:50", "throughput": 27776.18, "total_tokens": 6967909568} +{"current_steps": 23750, "total_steps": 29667, "loss": 0.3466, "lr": 2.7216955914739385e-05, "epoch": 2.4016812565180294, "percentage": 80.06, "elapsed_time": "2 days, 21:42:40", "remaining_time": "17:22:03", "throughput": 27776.66, "total_tokens": 6970852736} +{"current_steps": 23760, "total_steps": 29667, "loss": 0.3487, "lr": 2.7212924549511348e-05, "epoch": 2.402692538634137, "percentage": 80.09, "elapsed_time": "2 days, 21:44:19", "remaining_time": "17:20:16", "throughput": 27777.27, "total_tokens": 6973751552} +{"current_steps": 23770, "total_steps": 29667, "loss": 0.3486, "lr": 2.7208894975125688e-05, "epoch": 2.403703820750245, "percentage": 80.12, "elapsed_time": "2 days, 21:45:58", "remaining_time": "17:18:28", "throughput": 27777.94, "total_tokens": 6976652864} +{"current_steps": 23780, "total_steps": 29667, "loss": 0.3468, "lr": 2.720486719025689e-05, "epoch": 2.4047151028663527, "percentage": 80.16, "elapsed_time": "2 days, 21:47:40", "remaining_time": "17:16:42", "throughput": 27778.4, "total_tokens": 6979613504} +{"current_steps": 23790, "total_steps": 29667, "loss": 0.3457, "lr": 2.7200841193580816e-05, "epoch": 2.4057263849824606, "percentage": 80.19, "elapsed_time": "2 days, 21:49:18", "remaining_time": "17:14:54", "throughput": 27779.18, "total_tokens": 6982538624} +{"current_steps": 23800, "total_steps": 29667, "loss": 0.3429, "lr": 2.7196816983774708e-05, "epoch": 2.4067376670985685, "percentage": 80.22, "elapsed_time": "2 days, 21:50:58", "remaining_time": "17:13:07", "throughput": 27779.91, 
"total_tokens": 6985492608} +{"current_steps": 23810, "total_steps": 29667, "loss": 0.345, "lr": 2.7192794559517166e-05, "epoch": 2.4077489492146764, "percentage": 80.26, "elapsed_time": "2 days, 21:52:36", "remaining_time": "17:11:20", "throughput": 27780.7, "total_tokens": 6988407488} +{"current_steps": 23820, "total_steps": 29667, "loss": 0.3405, "lr": 2.7188773919488165e-05, "epoch": 2.408760231330784, "percentage": 80.29, "elapsed_time": "2 days, 21:54:14", "remaining_time": "17:09:32", "throughput": 27781.47, "total_tokens": 6991330752} +{"current_steps": 23830, "total_steps": 29667, "loss": 0.3474, "lr": 2.7184755062369043e-05, "epoch": 2.4097715134468918, "percentage": 80.32, "elapsed_time": "2 days, 21:55:53", "remaining_time": "17:07:45", "throughput": 27782.2, "total_tokens": 6994259584} +{"current_steps": 23840, "total_steps": 29667, "loss": 0.3493, "lr": 2.7180737986842498e-05, "epoch": 2.4107827955629997, "percentage": 80.36, "elapsed_time": "2 days, 21:57:32", "remaining_time": "17:05:58", "throughput": 27782.95, "total_tokens": 6997201088} +{"current_steps": 23850, "total_steps": 29667, "loss": 0.3492, "lr": 2.71767226915926e-05, "epoch": 2.4117940776791076, "percentage": 80.39, "elapsed_time": "2 days, 21:59:08", "remaining_time": "17:04:10", "throughput": 27783.86, "total_tokens": 7000110144} +{"current_steps": 23860, "total_steps": 29667, "loss": 0.3444, "lr": 2.7172709175304767e-05, "epoch": 2.4128053597952155, "percentage": 80.43, "elapsed_time": "2 days, 22:00:47", "remaining_time": "17:02:22", "throughput": 27784.57, "total_tokens": 7003034048} +{"current_steps": 23870, "total_steps": 29667, "loss": 0.3482, "lr": 2.716869743666579e-05, "epoch": 2.4138166419113234, "percentage": 80.46, "elapsed_time": "2 days, 22:02:30", "remaining_time": "17:00:36", "throughput": 27784.96, "total_tokens": 7005982912} +{"current_steps": 23880, "total_steps": 29667, "loss": 0.351, "lr": 2.7164687474363803e-05, "epoch": 2.414827924027431, "percentage": 80.49, 
"elapsed_time": "2 days, 22:04:08", "remaining_time": "16:58:49", "throughput": 27785.63, "total_tokens": 7008894080} +{"current_steps": 23890, "total_steps": 29667, "loss": 0.3449, "lr": 2.7160679287088307e-05, "epoch": 2.4158392061435388, "percentage": 80.53, "elapsed_time": "2 days, 22:05:46", "remaining_time": "16:57:01", "throughput": 27786.46, "total_tokens": 7011814720} +{"current_steps": 23900, "total_steps": 29667, "loss": 0.3448, "lr": 2.7156672873530147e-05, "epoch": 2.4168504882596467, "percentage": 80.56, "elapsed_time": "2 days, 22:07:22", "remaining_time": "16:55:13", "throughput": 27787.31, "total_tokens": 7014702592} +{"current_steps": 23910, "total_steps": 29667, "loss": 0.3425, "lr": 2.715266823238152e-05, "epoch": 2.4178617703757546, "percentage": 80.59, "elapsed_time": "2 days, 22:09:01", "remaining_time": "16:53:26", "throughput": 27788.0, "total_tokens": 7017616128} +{"current_steps": 23920, "total_steps": 29667, "loss": 0.3469, "lr": 2.714866536233598e-05, "epoch": 2.4188730524918625, "percentage": 80.63, "elapsed_time": "2 days, 22:10:42", "remaining_time": "16:51:39", "throughput": 27788.54, "total_tokens": 7020580288} +{"current_steps": 23930, "total_steps": 29667, "loss": 0.3487, "lr": 2.7144664262088422e-05, "epoch": 2.4198843346079704, "percentage": 80.66, "elapsed_time": "2 days, 22:12:22", "remaining_time": "16:49:52", "throughput": 27789.1, "total_tokens": 7023497472} +{"current_steps": 23940, "total_steps": 29667, "loss": 0.3516, "lr": 2.7140664930335084e-05, "epoch": 2.420895616724078, "percentage": 80.7, "elapsed_time": "2 days, 22:14:07", "remaining_time": "16:48:06", "throughput": 27789.46, "total_tokens": 7026492864} +{"current_steps": 23950, "total_steps": 29667, "loss": 0.3481, "lr": 2.713666736577356e-05, "epoch": 2.4219068988401857, "percentage": 80.73, "elapsed_time": "2 days, 22:15:45", "remaining_time": "16:46:19", "throughput": 27790.27, "total_tokens": 7029418560} +{"current_steps": 23960, "total_steps": 29667, 
"loss": 0.3438, "lr": 2.713267156710278e-05, "epoch": 2.4229181809562936, "percentage": 80.76, "elapsed_time": "2 days, 22:17:28", "remaining_time": "16:44:33", "throughput": 27790.66, "total_tokens": 7032391872} +{"current_steps": 23970, "total_steps": 29667, "loss": 0.3454, "lr": 2.712867753302301e-05, "epoch": 2.4239294630724015, "percentage": 80.8, "elapsed_time": "2 days, 22:19:04", "remaining_time": "16:42:45", "throughput": 27791.72, "total_tokens": 7035330560} +{"current_steps": 23980, "total_steps": 29667, "loss": 0.3432, "lr": 2.7124685262235865e-05, "epoch": 2.4249407451885094, "percentage": 80.83, "elapsed_time": "2 days, 22:20:49", "remaining_time": "16:40:59", "throughput": 27792.08, "total_tokens": 7038322752} +{"current_steps": 23990, "total_steps": 29667, "loss": 0.35, "lr": 2.7120694753444287e-05, "epoch": 2.425952027304617, "percentage": 80.86, "elapsed_time": "2 days, 22:22:31", "remaining_time": "16:39:13", "throughput": 27792.63, "total_tokens": 7041299008} +{"current_steps": 24000, "total_steps": 29667, "loss": 0.3449, "lr": 2.7116706005352547e-05, "epoch": 2.426963309420725, "percentage": 80.9, "elapsed_time": "2 days, 22:24:12", "remaining_time": "16:37:26", "throughput": 27793.15, "total_tokens": 7044234304} +{"current_steps": 24010, "total_steps": 29667, "loss": 0.3458, "lr": 2.7112719016666282e-05, "epoch": 2.4279745915368327, "percentage": 80.93, "elapsed_time": "2 days, 22:25:47", "remaining_time": "16:35:38", "throughput": 27793.99, "total_tokens": 7047108352} +{"current_steps": 24020, "total_steps": 29667, "loss": 0.3477, "lr": 2.7108733786092427e-05, "epoch": 2.4289858736529406, "percentage": 80.97, "elapsed_time": "2 days, 22:27:29", "remaining_time": "16:33:51", "throughput": 27794.48, "total_tokens": 7050063744} +{"current_steps": 24030, "total_steps": 29667, "loss": 0.3416, "lr": 2.7104750312339254e-05, "epoch": 2.4299971557690485, "percentage": 81.0, "elapsed_time": "2 days, 22:29:10", "remaining_time": "16:32:05", 
"throughput": 27795.04, "total_tokens": 7053016704} +{"current_steps": 24040, "total_steps": 29667, "loss": 0.3471, "lr": 2.7100768594116382e-05, "epoch": 2.4310084378851564, "percentage": 81.03, "elapsed_time": "2 days, 22:30:52", "remaining_time": "16:30:18", "throughput": 27795.62, "total_tokens": 7055982848} +{"current_steps": 24050, "total_steps": 29667, "loss": 0.3437, "lr": 2.709678863013473e-05, "epoch": 2.4320197200012643, "percentage": 81.07, "elapsed_time": "2 days, 22:32:27", "remaining_time": "16:28:30", "throughput": 27796.6, "total_tokens": 7058872704} +{"current_steps": 24060, "total_steps": 29667, "loss": 0.3466, "lr": 2.7092810419106562e-05, "epoch": 2.4330310021173718, "percentage": 81.1, "elapsed_time": "2 days, 22:34:03", "remaining_time": "16:26:42", "throughput": 27797.61, "total_tokens": 7061796032} +{"current_steps": 24070, "total_steps": 29667, "loss": 0.3481, "lr": 2.7088833959745457e-05, "epoch": 2.4340422842334797, "percentage": 81.13, "elapsed_time": "2 days, 22:35:39", "remaining_time": "16:24:55", "throughput": 27798.53, "total_tokens": 7064693440} +{"current_steps": 24080, "total_steps": 29667, "loss": 0.3461, "lr": 2.708485925076631e-05, "epoch": 2.4350535663495876, "percentage": 81.17, "elapsed_time": "2 days, 22:37:19", "remaining_time": "16:23:08", "throughput": 27799.4, "total_tokens": 7067693504} +{"current_steps": 24090, "total_steps": 29667, "loss": 0.3434, "lr": 2.708088629088535e-05, "epoch": 2.4360648484656955, "percentage": 81.2, "elapsed_time": "2 days, 22:39:06", "remaining_time": "16:21:22", "throughput": 27799.55, "total_tokens": 7070718720} +{"current_steps": 24100, "total_steps": 29667, "loss": 0.3437, "lr": 2.7076915078820115e-05, "epoch": 2.4370761305818034, "percentage": 81.24, "elapsed_time": "2 days, 22:40:42", "remaining_time": "16:19:35", "throughput": 27800.58, "total_tokens": 7073642880} +{"current_steps": 24110, "total_steps": 29667, "loss": 0.3505, "lr": 2.707294561328945e-05, "epoch": 2.438087412697911, 
"percentage": 81.27, "elapsed_time": "2 days, 22:42:24", "remaining_time": "16:17:48", "throughput": 27801.16, "total_tokens": 7076627456} +{"current_steps": 24120, "total_steps": 29667, "loss": 0.3505, "lr": 2.706897789301353e-05, "epoch": 2.4390986948140188, "percentage": 81.3, "elapsed_time": "2 days, 22:44:02", "remaining_time": "16:16:01", "throughput": 27802.12, "total_tokens": 7079597248} +{"current_steps": 24130, "total_steps": 29667, "loss": 0.3429, "lr": 2.706501191671384e-05, "epoch": 2.4401099769301267, "percentage": 81.34, "elapsed_time": "2 days, 22:45:43", "remaining_time": "16:14:14", "throughput": 27802.67, "total_tokens": 7082539008} +{"current_steps": 24140, "total_steps": 29667, "loss": 0.3482, "lr": 2.7061047683113165e-05, "epoch": 2.4411212590462346, "percentage": 81.37, "elapsed_time": "2 days, 22:47:23", "remaining_time": "16:12:27", "throughput": 27803.15, "total_tokens": 7085445568} +{"current_steps": 24150, "total_steps": 29667, "loss": 0.3445, "lr": 2.705708519093561e-05, "epoch": 2.4421325411623425, "percentage": 81.4, "elapsed_time": "2 days, 22:49:02", "remaining_time": "16:10:40", "throughput": 27803.86, "total_tokens": 7088395072} +{"current_steps": 24160, "total_steps": 29667, "loss": 0.3407, "lr": 2.705312443890658e-05, "epoch": 2.4431438232784504, "percentage": 81.44, "elapsed_time": "2 days, 22:50:44", "remaining_time": "16:08:54", "throughput": 27804.4, "total_tokens": 7091357760} +{"current_steps": 24170, "total_steps": 29667, "loss": 0.351, "lr": 2.70491654257528e-05, "epoch": 2.4441551053945583, "percentage": 81.47, "elapsed_time": "2 days, 22:52:19", "remaining_time": "16:07:06", "throughput": 27805.34, "total_tokens": 7094246272} +{"current_steps": 24180, "total_steps": 29667, "loss": 0.3467, "lr": 2.7045208150202274e-05, "epoch": 2.4451663875106657, "percentage": 81.5, "elapsed_time": "2 days, 22:53:56", "remaining_time": "16:05:19", "throughput": 27806.24, "total_tokens": 7097172672} +{"current_steps": 24190, 
"total_steps": 29667, "loss": 0.3497, "lr": 2.704125261098433e-05, "epoch": 2.4461776696267736, "percentage": 81.54, "elapsed_time": "2 days, 22:55:38", "remaining_time": "16:03:32", "throughput": 27806.73, "total_tokens": 7100120640} +{"current_steps": 24200, "total_steps": 29667, "loss": 0.345, "lr": 2.7037298806829586e-05, "epoch": 2.4471889517428815, "percentage": 81.57, "elapsed_time": "2 days, 22:57:17", "remaining_time": "16:01:45", "throughput": 27807.52, "total_tokens": 7103079296} +{"current_steps": 24210, "total_steps": 29667, "loss": 0.342, "lr": 2.7033346736469967e-05, "epoch": 2.4482002338589894, "percentage": 81.61, "elapsed_time": "2 days, 22:58:59", "remaining_time": "15:59:59", "throughput": 27808.14, "total_tokens": 7106086144} +{"current_steps": 24220, "total_steps": 29667, "loss": 0.3503, "lr": 2.702939639863869e-05, "epoch": 2.4492115159750973, "percentage": 81.64, "elapsed_time": "2 days, 23:00:39", "remaining_time": "15:58:12", "throughput": 27808.72, "total_tokens": 7109014464} +{"current_steps": 24230, "total_steps": 29667, "loss": 0.3451, "lr": 2.7025447792070262e-05, "epoch": 2.450222798091205, "percentage": 81.67, "elapsed_time": "2 days, 23:02:15", "remaining_time": "15:56:24", "throughput": 27809.72, "total_tokens": 7111924672} +{"current_steps": 24240, "total_steps": 29667, "loss": 0.3459, "lr": 2.7021500915500493e-05, "epoch": 2.4512340802073127, "percentage": 81.71, "elapsed_time": "2 days, 23:03:52", "remaining_time": "15:54:37", "throughput": 27810.43, "total_tokens": 7114824512} +{"current_steps": 24250, "total_steps": 29667, "loss": 0.3443, "lr": 2.701755576766648e-05, "epoch": 2.4522453623234206, "percentage": 81.74, "elapsed_time": "2 days, 23:05:33", "remaining_time": "15:52:50", "throughput": 27811.0, "total_tokens": 7117762688} +{"current_steps": 24260, "total_steps": 29667, "loss": 0.3426, "lr": 2.701361234730661e-05, "epoch": 2.4532566444395285, "percentage": 81.77, "elapsed_time": "2 days, 23:07:12", "remaining_time": 
"15:51:03", "throughput": 27811.64, "total_tokens": 7120696384} +{"current_steps": 24270, "total_steps": 29667, "loss": 0.3493, "lr": 2.700967065316056e-05, "epoch": 2.4542679265556364, "percentage": 81.81, "elapsed_time": "2 days, 23:08:51", "remaining_time": "15:49:16", "throughput": 27812.33, "total_tokens": 7123613824} +{"current_steps": 24280, "total_steps": 29667, "loss": 0.3475, "lr": 2.70057306839693e-05, "epoch": 2.4552792086717443, "percentage": 81.84, "elapsed_time": "2 days, 23:10:31", "remaining_time": "15:47:30", "throughput": 27812.93, "total_tokens": 7126557504} +{"current_steps": 24290, "total_steps": 29667, "loss": 0.3471, "lr": 2.7001792438475076e-05, "epoch": 2.456290490787852, "percentage": 81.88, "elapsed_time": "2 days, 23:12:13", "remaining_time": "15:45:43", "throughput": 27813.47, "total_tokens": 7129531584} +{"current_steps": 24300, "total_steps": 29667, "loss": 0.3488, "lr": 2.6997855915421416e-05, "epoch": 2.4573017729039597, "percentage": 81.91, "elapsed_time": "2 days, 23:13:52", "remaining_time": "15:43:56", "throughput": 27814.27, "total_tokens": 7132496064} +{"current_steps": 24310, "total_steps": 29667, "loss": 0.3486, "lr": 2.6993921113553145e-05, "epoch": 2.4583130550200676, "percentage": 81.94, "elapsed_time": "2 days, 23:15:34", "remaining_time": "15:42:10", "throughput": 27814.95, "total_tokens": 7135482752} +{"current_steps": 24320, "total_steps": 29667, "loss": 0.3454, "lr": 2.6989988031616343e-05, "epoch": 2.4593243371361755, "percentage": 81.98, "elapsed_time": "2 days, 23:17:12", "remaining_time": "15:40:23", "throughput": 27815.71, "total_tokens": 7138415616} +{"current_steps": 24330, "total_steps": 29667, "loss": 0.3435, "lr": 2.6986056668358396e-05, "epoch": 2.4603356192522834, "percentage": 82.01, "elapsed_time": "2 days, 23:18:53", "remaining_time": "15:38:36", "throughput": 27816.28, "total_tokens": 7141375104} +{"current_steps": 24340, "total_steps": 29667, "loss": 0.3442, "lr": 2.6982127022527947e-05, "epoch": 
2.4613469013683913, "percentage": 82.04, "elapsed_time": "2 days, 23:20:35", "remaining_time": "15:36:50", "throughput": 27816.7, "total_tokens": 7144304064} +{"current_steps": 24350, "total_steps": 29667, "loss": 0.3461, "lr": 2.697819909287493e-05, "epoch": 2.4623581834844988, "percentage": 82.08, "elapsed_time": "2 days, 23:22:15", "remaining_time": "15:35:03", "throughput": 27817.19, "total_tokens": 7147234432} +{"current_steps": 24360, "total_steps": 29667, "loss": 0.3484, "lr": 2.697427287815053e-05, "epoch": 2.4633694656006067, "percentage": 82.11, "elapsed_time": "2 days, 23:24:02", "remaining_time": "15:33:18", "throughput": 27817.39, "total_tokens": 7150246080} +{"current_steps": 24370, "total_steps": 29667, "loss": 0.3494, "lr": 2.6970348377107236e-05, "epoch": 2.4643807477167146, "percentage": 82.15, "elapsed_time": "2 days, 23:25:41", "remaining_time": "15:31:31", "throughput": 27818.11, "total_tokens": 7153180480} +{"current_steps": 24380, "total_steps": 29667, "loss": 0.3477, "lr": 2.696642558849877e-05, "epoch": 2.4653920298328225, "percentage": 82.18, "elapsed_time": "2 days, 23:27:21", "remaining_time": "15:29:44", "throughput": 27818.68, "total_tokens": 7156119104} +{"current_steps": 24390, "total_steps": 29667, "loss": 0.34, "lr": 2.696250451108016e-05, "epoch": 2.4664033119489304, "percentage": 82.21, "elapsed_time": "2 days, 23:28:55", "remaining_time": "15:27:56", "throughput": 27819.8, "total_tokens": 7159027264} +{"current_steps": 24400, "total_steps": 29667, "loss": 0.3523, "lr": 2.6958585143607662e-05, "epoch": 2.4674145940650383, "percentage": 82.25, "elapsed_time": "2 days, 23:30:39", "remaining_time": "15:26:11", "throughput": 27820.28, "total_tokens": 7162031744} +{"current_steps": 24410, "total_steps": 29667, "loss": 0.3475, "lr": 2.695466748483883e-05, "epoch": 2.4684258761811457, "percentage": 82.28, "elapsed_time": "2 days, 23:32:18", "remaining_time": "15:24:24", "throughput": 27820.87, "total_tokens": 7164940608} 
+{"current_steps": 24420, "total_steps": 29667, "loss": 0.3505, "lr": 2.695075153353247e-05, "epoch": 2.4694371582972536, "percentage": 82.31, "elapsed_time": "2 days, 23:33:57", "remaining_time": "15:22:37", "throughput": 27821.54, "total_tokens": 7167868224} +{"current_steps": 24430, "total_steps": 29667, "loss": 0.3443, "lr": 2.6946837288448646e-05, "epoch": 2.4704484404133615, "percentage": 82.35, "elapsed_time": "2 days, 23:35:37", "remaining_time": "15:20:50", "throughput": 27822.04, "total_tokens": 7170783552} +{"current_steps": 24440, "total_steps": 29667, "loss": 0.3451, "lr": 2.6942924748348684e-05, "epoch": 2.4714597225294694, "percentage": 82.38, "elapsed_time": "2 days, 23:37:21", "remaining_time": "15:19:04", "throughput": 27822.33, "total_tokens": 7173756096} +{"current_steps": 24450, "total_steps": 29667, "loss": 0.3457, "lr": 2.693901391199517e-05, "epoch": 2.4724710046455773, "percentage": 82.41, "elapsed_time": "2 days, 23:39:02", "remaining_time": "15:17:18", "throughput": 27822.91, "total_tokens": 7176697344} +{"current_steps": 24460, "total_steps": 29667, "loss": 0.3467, "lr": 2.6935104778151943e-05, "epoch": 2.4734822867616852, "percentage": 82.45, "elapsed_time": "2 days, 23:40:46", "remaining_time": "15:15:32", "throughput": 27823.32, "total_tokens": 7179703488} +{"current_steps": 24470, "total_steps": 29667, "loss": 0.3432, "lr": 2.6931197345584102e-05, "epoch": 2.4744935688777927, "percentage": 82.48, "elapsed_time": "2 days, 23:42:24", "remaining_time": "15:13:45", "throughput": 27824.12, "total_tokens": 7182642112} +{"current_steps": 24480, "total_steps": 29667, "loss": 0.3451, "lr": 2.6927291613058003e-05, "epoch": 2.4755048509939006, "percentage": 82.52, "elapsed_time": "2 days, 23:44:04", "remaining_time": "15:11:58", "throughput": 27824.68, "total_tokens": 7185576128} +{"current_steps": 24490, "total_steps": 29667, "loss": 0.349, "lr": 2.6923387579341254e-05, "epoch": 2.4765161331100085, "percentage": 82.55, "elapsed_time": "2 days, 
23:45:45", "remaining_time": "15:10:12", "throughput": 27825.32, "total_tokens": 7188541696} +{"current_steps": 24500, "total_steps": 29667, "loss": 0.3451, "lr": 2.6919485243202693e-05, "epoch": 2.4775274152261164, "percentage": 82.58, "elapsed_time": "2 days, 23:47:23", "remaining_time": "15:08:25", "throughput": 27826.08, "total_tokens": 7191471232} +{"current_steps": 24510, "total_steps": 29667, "loss": 0.3472, "lr": 2.6915584603412434e-05, "epoch": 2.4785386973422243, "percentage": 82.62, "elapsed_time": "2 days, 23:49:01", "remaining_time": "15:06:38", "throughput": 27826.92, "total_tokens": 7194419200} +{"current_steps": 24520, "total_steps": 29667, "loss": 0.348, "lr": 2.6911685658741827e-05, "epoch": 2.4795499794583318, "percentage": 82.65, "elapsed_time": "2 days, 23:50:38", "remaining_time": "15:04:50", "throughput": 27827.84, "total_tokens": 7197351744} +{"current_steps": 24530, "total_steps": 29667, "loss": 0.3461, "lr": 2.690778840796346e-05, "epoch": 2.4805612615744397, "percentage": 82.68, "elapsed_time": "2 days, 23:52:17", "remaining_time": "15:03:04", "throughput": 27828.5, "total_tokens": 7200285440} +{"current_steps": 24540, "total_steps": 29667, "loss": 0.3506, "lr": 2.6903892849851175e-05, "epoch": 2.4815725436905476, "percentage": 82.72, "elapsed_time": "2 days, 23:53:58", "remaining_time": "15:01:17", "throughput": 27829.27, "total_tokens": 7203278720} +{"current_steps": 24550, "total_steps": 29667, "loss": 0.3455, "lr": 2.6899998983180057e-05, "epoch": 2.4825838258066555, "percentage": 82.75, "elapsed_time": "2 days, 23:55:39", "remaining_time": "14:59:31", "throughput": 27829.69, "total_tokens": 7206206848} +{"current_steps": 24560, "total_steps": 29667, "loss": 0.3454, "lr": 2.689610680672642e-05, "epoch": 2.4835951079227634, "percentage": 82.79, "elapsed_time": "2 days, 23:57:15", "remaining_time": "14:57:43", "throughput": 27830.48, "total_tokens": 7209092800} +{"current_steps": 24570, "total_steps": 29667, "loss": 0.3457, "lr": 
2.6892216319267843e-05, "epoch": 2.4846063900388713, "percentage": 82.82, "elapsed_time": "2 days, 23:58:52", "remaining_time": "14:55:56", "throughput": 27831.29, "total_tokens": 7211991872} +{"current_steps": 24580, "total_steps": 29667, "loss": 0.3466, "lr": 2.6888327519583107e-05, "epoch": 2.485617672154979, "percentage": 82.85, "elapsed_time": "3 days, 0:00:32", "remaining_time": "14:54:10", "throughput": 27831.86, "total_tokens": 7214936256} +{"current_steps": 24590, "total_steps": 29667, "loss": 0.3486, "lr": 2.688444040645225e-05, "epoch": 2.4866289542710867, "percentage": 82.89, "elapsed_time": "3 days, 0:02:10", "remaining_time": "14:52:22", "throughput": 27832.69, "total_tokens": 7217851136} +{"current_steps": 24600, "total_steps": 29667, "loss": 0.3454, "lr": 2.688055497865654e-05, "epoch": 2.4876402363871946, "percentage": 82.92, "elapsed_time": "3 days, 0:03:49", "remaining_time": "14:50:36", "throughput": 27833.25, "total_tokens": 7220779648} +{"current_steps": 24610, "total_steps": 29667, "loss": 0.3484, "lr": 2.6876671234978483e-05, "epoch": 2.4886515185033025, "percentage": 82.95, "elapsed_time": "3 days, 0:05:26", "remaining_time": "14:48:48", "throughput": 27834.03, "total_tokens": 7223671936} +{"current_steps": 24620, "total_steps": 29667, "loss": 0.343, "lr": 2.6872789174201807e-05, "epoch": 2.4896628006194104, "percentage": 82.99, "elapsed_time": "3 days, 0:07:06", "remaining_time": "14:47:02", "throughput": 27834.66, "total_tokens": 7226623104} +{"current_steps": 24630, "total_steps": 29667, "loss": 0.3484, "lr": 2.686890879511147e-05, "epoch": 2.4906740827355183, "percentage": 83.02, "elapsed_time": "3 days, 0:08:43", "remaining_time": "14:45:15", "throughput": 27835.59, "total_tokens": 7229556608} +{"current_steps": 24640, "total_steps": 29667, "loss": 0.3448, "lr": 2.6865030096493665e-05, "epoch": 2.4916853648516257, "percentage": 83.06, "elapsed_time": "3 days, 0:10:23", "remaining_time": "14:43:28", "throughput": 27836.2, 
"total_tokens": 7232498368} +{"current_steps": 24650, "total_steps": 29667, "loss": 0.3441, "lr": 2.6861153077135815e-05, "epoch": 2.4926966469677336, "percentage": 83.09, "elapsed_time": "3 days, 0:12:03", "remaining_time": "14:41:42", "throughput": 27836.91, "total_tokens": 7235457088} +{"current_steps": 24660, "total_steps": 29667, "loss": 0.3487, "lr": 2.6857277735826545e-05, "epoch": 2.4937079290838415, "percentage": 83.12, "elapsed_time": "3 days, 0:13:44", "remaining_time": "14:39:55", "throughput": 27837.49, "total_tokens": 7238426496} +{"current_steps": 24670, "total_steps": 29667, "loss": 0.3466, "lr": 2.685340407135573e-05, "epoch": 2.4947192111999494, "percentage": 83.16, "elapsed_time": "3 days, 0:15:26", "remaining_time": "14:38:09", "throughput": 27837.88, "total_tokens": 7241357952} +{"current_steps": 24680, "total_steps": 29667, "loss": 0.3531, "lr": 2.6849532082514445e-05, "epoch": 2.4957304933160573, "percentage": 83.19, "elapsed_time": "3 days, 0:17:07", "remaining_time": "14:36:23", "throughput": 27838.35, "total_tokens": 7244291968} +{"current_steps": 24690, "total_steps": 29667, "loss": 0.3479, "lr": 2.6845661768095005e-05, "epoch": 2.4967417754321652, "percentage": 83.22, "elapsed_time": "3 days, 0:18:43", "remaining_time": "14:34:35", "throughput": 27839.19, "total_tokens": 7247206784} +{"current_steps": 24700, "total_steps": 29667, "loss": 0.347, "lr": 2.6841793126890925e-05, "epoch": 2.497753057548273, "percentage": 83.26, "elapsed_time": "3 days, 0:20:19", "remaining_time": "14:32:48", "throughput": 27840.07, "total_tokens": 7250095232} +{"current_steps": 24710, "total_steps": 29667, "loss": 0.3451, "lr": 2.6837926157696946e-05, "epoch": 2.4987643396643806, "percentage": 83.29, "elapsed_time": "3 days, 0:21:57", "remaining_time": "14:31:01", "throughput": 27840.86, "total_tokens": 7253032704} +{"current_steps": 24720, "total_steps": 29667, "loss": 0.3469, "lr": 2.6834060859309018e-05, "epoch": 2.4997756217804885, "percentage": 83.32, 
"elapsed_time": "3 days, 0:23:35", "remaining_time": "14:29:14", "throughput": 27841.62, "total_tokens": 7255947648} +{"current_steps": 24730, "total_steps": 29667, "loss": 0.3486, "lr": 2.6830197230524317e-05, "epoch": 2.5007869038965964, "percentage": 83.36, "elapsed_time": "3 days, 0:25:15", "remaining_time": "14:27:28", "throughput": 27842.22, "total_tokens": 7258907072} +{"current_steps": 24740, "total_steps": 29667, "loss": 0.3497, "lr": 2.6826335270141216e-05, "epoch": 2.5017981860127043, "percentage": 83.39, "elapsed_time": "3 days, 0:26:52", "remaining_time": "14:25:41", "throughput": 27843.01, "total_tokens": 7261814080} +{"current_steps": 24750, "total_steps": 29667, "loss": 0.3471, "lr": 2.6822474976959312e-05, "epoch": 2.502809468128812, "percentage": 83.43, "elapsed_time": "3 days, 0:28:31", "remaining_time": "14:23:54", "throughput": 27843.77, "total_tokens": 7264755840} +{"current_steps": 24760, "total_steps": 29667, "loss": 0.3494, "lr": 2.6818616349779397e-05, "epoch": 2.5038207502449197, "percentage": 83.46, "elapsed_time": "3 days, 0:30:12", "remaining_time": "14:22:08", "throughput": 27844.14, "total_tokens": 7267677568} +{"current_steps": 24770, "total_steps": 29667, "loss": 0.3468, "lr": 2.6814759387403482e-05, "epoch": 2.5048320323610276, "percentage": 83.49, "elapsed_time": "3 days, 0:31:48", "remaining_time": "14:20:20", "throughput": 27845.23, "total_tokens": 7270627328} +{"current_steps": 24780, "total_steps": 29667, "loss": 0.3425, "lr": 2.681090408863477e-05, "epoch": 2.5058433144771355, "percentage": 83.53, "elapsed_time": "3 days, 0:33:27", "remaining_time": "14:18:34", "throughput": 27846.05, "total_tokens": 7273597504} +{"current_steps": 24790, "total_steps": 29667, "loss": 0.3489, "lr": 2.6807050452277694e-05, "epoch": 2.5068545965932434, "percentage": 83.56, "elapsed_time": "3 days, 0:35:12", "remaining_time": "14:16:48", "throughput": 27846.44, "total_tokens": 7276619904} +{"current_steps": 24800, "total_steps": 29667, "loss": 
0.3436, "lr": 2.6803198477137853e-05, "epoch": 2.5078658787093513, "percentage": 83.59, "elapsed_time": "3 days, 0:36:56", "remaining_time": "14:15:02", "throughput": 27846.85, "total_tokens": 7279624448} +{"current_steps": 24810, "total_steps": 29667, "loss": 0.3499, "lr": 2.6799348162022082e-05, "epoch": 2.5088771608254588, "percentage": 83.63, "elapsed_time": "3 days, 0:38:33", "remaining_time": "14:13:15", "throughput": 27847.55, "total_tokens": 7282516736} +{"current_steps": 24820, "total_steps": 29667, "loss": 0.3518, "lr": 2.6795499505738397e-05, "epoch": 2.509888442941567, "percentage": 83.66, "elapsed_time": "3 days, 0:40:15", "remaining_time": "14:11:29", "throughput": 27847.78, "total_tokens": 7285409024} +{"current_steps": 24830, "total_steps": 29667, "loss": 0.3533, "lr": 2.679165250709601e-05, "epoch": 2.5108997250576746, "percentage": 83.7, "elapsed_time": "3 days, 0:41:54", "remaining_time": "14:09:43", "throughput": 27848.37, "total_tokens": 7288317952} +{"current_steps": 24840, "total_steps": 29667, "loss": 0.345, "lr": 2.678780716490533e-05, "epoch": 2.5119110071737825, "percentage": 83.73, "elapsed_time": "3 days, 0:43:33", "remaining_time": "14:07:56", "throughput": 27848.98, "total_tokens": 7291232576} +{"current_steps": 24850, "total_steps": 29667, "loss": 0.3471, "lr": 2.678396347797798e-05, "epoch": 2.5129222892898904, "percentage": 83.76, "elapsed_time": "3 days, 0:45:11", "remaining_time": "14:06:09", "throughput": 27849.63, "total_tokens": 7294149056} +{"current_steps": 24860, "total_steps": 29667, "loss": 0.3442, "lr": 2.6780121445126756e-05, "epoch": 2.5139335714059983, "percentage": 83.8, "elapsed_time": "3 days, 0:46:55", "remaining_time": "14:04:24", "throughput": 27849.93, "total_tokens": 7297112064} +{"current_steps": 24870, "total_steps": 29667, "loss": 0.3448, "lr": 2.6776281065165644e-05, "epoch": 2.514944853522106, "percentage": 83.83, "elapsed_time": "3 days, 0:48:39", "remaining_time": "14:02:38", "throughput": 27850.26, 
"total_tokens": 7300084416} +{"current_steps": 24880, "total_steps": 29667, "loss": 0.3511, "lr": 2.677244233690983e-05, "epoch": 2.5159561356382136, "percentage": 83.86, "elapsed_time": "3 days, 0:50:16", "remaining_time": "14:00:51", "throughput": 27850.96, "total_tokens": 7302970048} +{"current_steps": 24890, "total_steps": 29667, "loss": 0.3459, "lr": 2.6768605259175694e-05, "epoch": 2.5169674177543215, "percentage": 83.9, "elapsed_time": "3 days, 0:51:53", "remaining_time": "13:59:04", "throughput": 27851.71, "total_tokens": 7305886912} +{"current_steps": 24900, "total_steps": 29667, "loss": 0.3528, "lr": 2.6764769830780784e-05, "epoch": 2.5179786998704294, "percentage": 83.93, "elapsed_time": "3 days, 0:53:35", "remaining_time": "13:57:18", "throughput": 27852.31, "total_tokens": 7308883264} +{"current_steps": 24910, "total_steps": 29667, "loss": 0.3424, "lr": 2.6760936050543857e-05, "epoch": 2.5189899819865373, "percentage": 83.97, "elapsed_time": "3 days, 0:55:09", "remaining_time": "13:55:30", "throughput": 27853.4, "total_tokens": 7311776704} +{"current_steps": 24920, "total_steps": 29667, "loss": 0.3433, "lr": 2.675710391728483e-05, "epoch": 2.5200012641026452, "percentage": 84.0, "elapsed_time": "3 days, 0:56:48", "remaining_time": "13:53:44", "throughput": 27853.97, "total_tokens": 7314685696} +{"current_steps": 24930, "total_steps": 29667, "loss": 0.3483, "lr": 2.6753273429824822e-05, "epoch": 2.5210125462187527, "percentage": 84.03, "elapsed_time": "3 days, 0:58:32", "remaining_time": "13:51:58", "throughput": 27854.21, "total_tokens": 7317643648} +{"current_steps": 24940, "total_steps": 29667, "loss": 0.3484, "lr": 2.6749444586986127e-05, "epoch": 2.522023828334861, "percentage": 84.07, "elapsed_time": "3 days, 1:00:09", "remaining_time": "13:50:11", "throughput": 27855.07, "total_tokens": 7320573504} +{"current_steps": 24950, "total_steps": 29667, "loss": 0.3455, "lr": 2.6745617387592214e-05, "epoch": 2.5230351104509685, "percentage": 84.1, 
"elapsed_time": "3 days, 1:01:44", "remaining_time": "13:48:24", "throughput": 27856.05, "total_tokens": 7323470656} +{"current_steps": 24960, "total_steps": 29667, "loss": 0.346, "lr": 2.6741791830467728e-05, "epoch": 2.5240463925670764, "percentage": 84.13, "elapsed_time": "3 days, 1:03:18", "remaining_time": "13:46:36", "throughput": 27857.05, "total_tokens": 7326375552} +{"current_steps": 24970, "total_steps": 29667, "loss": 0.3436, "lr": 2.67379679144385e-05, "epoch": 2.5250576746831843, "percentage": 84.17, "elapsed_time": "3 days, 1:05:02", "remaining_time": "13:44:51", "throughput": 27857.42, "total_tokens": 7329355840} +{"current_steps": 24980, "total_steps": 29667, "loss": 0.3435, "lr": 2.6734145638331536e-05, "epoch": 2.526068956799292, "percentage": 84.2, "elapsed_time": "3 days, 1:06:43", "remaining_time": "13:43:04", "throughput": 27857.92, "total_tokens": 7332303424} +{"current_steps": 24990, "total_steps": 29667, "loss": 0.3483, "lr": 2.673032500097501e-05, "epoch": 2.5270802389154, "percentage": 84.24, "elapsed_time": "3 days, 1:08:23", "remaining_time": "13:41:18", "throughput": 27858.51, "total_tokens": 7335251904} +{"current_steps": 25000, "total_steps": 29667, "loss": 0.3419, "lr": 2.672650600119826e-05, "epoch": 2.5280915210315076, "percentage": 84.27, "elapsed_time": "3 days, 1:09:59", "remaining_time": "13:39:31", "throughput": 27859.39, "total_tokens": 7338149568} +{"current_steps": 25000, "total_steps": 29667, "eval_loss": 0.3296365439891815, "epoch": 2.5280915210315076, "percentage": 84.27, "elapsed_time": "3 days, 1:10:01", "remaining_time": "13:39:31", "throughput": 27859.21, "total_tokens": 7338149568} +{"current_steps": 25010, "total_steps": 29667, "loss": 0.3484, "lr": 2.672268863783181e-05, "epoch": 2.5291028031476155, "percentage": 84.3, "elapsed_time": "3 days, 1:12:46", "remaining_time": "13:37:57", "throughput": 27852.85, "total_tokens": 7341066240} +{"current_steps": 25020, "total_steps": 29667, "loss": 0.3469, "lr": 
2.6718872909707347e-05, "epoch": 2.5301140852637234, "percentage": 84.34, "elapsed_time": "3 days, 1:14:26", "remaining_time": "13:36:11", "throughput": 27853.4, "total_tokens": 7344001984} +{"current_steps": 25030, "total_steps": 29667, "loss": 0.3483, "lr": 2.671505881565772e-05, "epoch": 2.5311253673798313, "percentage": 84.37, "elapsed_time": "3 days, 1:16:06", "remaining_time": "13:34:24", "throughput": 27854.1, "total_tokens": 7346968192} +{"current_steps": 25040, "total_steps": 29667, "loss": 0.3498, "lr": 2.671124635451696e-05, "epoch": 2.532136649495939, "percentage": 84.4, "elapsed_time": "3 days, 1:17:44", "remaining_time": "13:32:38", "throughput": 27854.76, "total_tokens": 7349890304} +{"current_steps": 25050, "total_steps": 29667, "loss": 0.3473, "lr": 2.6707435525120237e-05, "epoch": 2.5331479316120467, "percentage": 84.44, "elapsed_time": "3 days, 1:19:23", "remaining_time": "13:30:51", "throughput": 27855.45, "total_tokens": 7352833664} +{"current_steps": 25060, "total_steps": 29667, "loss": 0.3467, "lr": 2.6703626326303906e-05, "epoch": 2.534159213728155, "percentage": 84.47, "elapsed_time": "3 days, 1:21:06", "remaining_time": "13:29:05", "throughput": 27855.68, "total_tokens": 7355764608} +{"current_steps": 25070, "total_steps": 29667, "loss": 0.3497, "lr": 2.669981875690547e-05, "epoch": 2.5351704958442625, "percentage": 84.5, "elapsed_time": "3 days, 1:22:47", "remaining_time": "13:27:19", "throughput": 27856.15, "total_tokens": 7358691392} +{"current_steps": 25080, "total_steps": 29667, "loss": 0.3455, "lr": 2.6696012815763604e-05, "epoch": 2.5361817779603704, "percentage": 84.54, "elapsed_time": "3 days, 1:24:28", "remaining_time": "13:25:33", "throughput": 27856.73, "total_tokens": 7361655552} +{"current_steps": 25090, "total_steps": 29667, "loss": 0.3466, "lr": 2.669220850171813e-05, "epoch": 2.5371930600764783, "percentage": 84.57, "elapsed_time": "3 days, 1:26:06", "remaining_time": "13:23:46", "throughput": 27857.47, "total_tokens": 
7364576768} +{"current_steps": 25100, "total_steps": 29667, "loss": 0.3486, "lr": 2.668840581361003e-05, "epoch": 2.538204342192586, "percentage": 84.61, "elapsed_time": "3 days, 1:27:49", "remaining_time": "13:22:00", "throughput": 27857.74, "total_tokens": 7367526016} +{"current_steps": 25110, "total_steps": 29667, "loss": 0.3484, "lr": 2.668460475028145e-05, "epoch": 2.539215624308694, "percentage": 84.64, "elapsed_time": "3 days, 1:29:25", "remaining_time": "13:20:13", "throughput": 27858.61, "total_tokens": 7370432448} +{"current_steps": 25120, "total_steps": 29667, "loss": 0.3486, "lr": 2.6680805310575686e-05, "epoch": 2.5402269064248015, "percentage": 84.67, "elapsed_time": "3 days, 1:31:07", "remaining_time": "13:18:27", "throughput": 27859.13, "total_tokens": 7373409984} +{"current_steps": 25130, "total_steps": 29667, "loss": 0.3465, "lr": 2.6677007493337164e-05, "epoch": 2.5412381885409094, "percentage": 84.71, "elapsed_time": "3 days, 1:32:50", "remaining_time": "13:16:42", "throughput": 27859.69, "total_tokens": 7376431808} +{"current_steps": 25140, "total_steps": 29667, "loss": 0.3426, "lr": 2.6673211297411503e-05, "epoch": 2.5422494706570173, "percentage": 84.74, "elapsed_time": "3 days, 1:34:31", "remaining_time": "13:14:55", "throughput": 27860.38, "total_tokens": 7379409856} +{"current_steps": 25150, "total_steps": 29667, "loss": 0.3485, "lr": 2.6669416721645447e-05, "epoch": 2.5432607527731252, "percentage": 84.77, "elapsed_time": "3 days, 1:36:11", "remaining_time": "13:13:09", "throughput": 27860.83, "total_tokens": 7382337984} +{"current_steps": 25160, "total_steps": 29667, "loss": 0.3465, "lr": 2.6665623764886876e-05, "epoch": 2.544272034889233, "percentage": 84.81, "elapsed_time": "3 days, 1:37:49", "remaining_time": "13:11:22", "throughput": 27861.48, "total_tokens": 7385240320} +{"current_steps": 25170, "total_steps": 29667, "loss": 0.3459, "lr": 2.6661832425984847e-05, "epoch": 2.5452833170053406, "percentage": 84.84, "elapsed_time": "3 
days, 1:39:29", "remaining_time": "13:09:36", "throughput": 27862.24, "total_tokens": 7388208192} +{"current_steps": 25180, "total_steps": 29667, "loss": 0.3449, "lr": 2.665804270378953e-05, "epoch": 2.5462945991214485, "percentage": 84.88, "elapsed_time": "3 days, 1:41:04", "remaining_time": "13:07:49", "throughput": 27863.07, "total_tokens": 7391071104} +{"current_steps": 25190, "total_steps": 29667, "loss": 0.3444, "lr": 2.665425459715228e-05, "epoch": 2.5473058812375564, "percentage": 84.91, "elapsed_time": "3 days, 1:42:41", "remaining_time": "13:06:02", "throughput": 27864.01, "total_tokens": 7394026048} +{"current_steps": 25200, "total_steps": 29667, "loss": 0.3472, "lr": 2.6650468104925547e-05, "epoch": 2.5483171633536643, "percentage": 84.94, "elapsed_time": "3 days, 1:44:21", "remaining_time": "13:04:16", "throughput": 27864.64, "total_tokens": 7396974976} +{"current_steps": 25210, "total_steps": 29667, "loss": 0.3466, "lr": 2.664668322596295e-05, "epoch": 2.549328445469772, "percentage": 84.98, "elapsed_time": "3 days, 1:45:58", "remaining_time": "13:02:29", "throughput": 27865.41, "total_tokens": 7399898240} +{"current_steps": 25220, "total_steps": 29667, "loss": 0.3479, "lr": 2.664289995911925e-05, "epoch": 2.55033972758588, "percentage": 85.01, "elapsed_time": "3 days, 1:47:37", "remaining_time": "13:00:42", "throughput": 27866.15, "total_tokens": 7402852160} +{"current_steps": 25230, "total_steps": 29667, "loss": 0.3462, "lr": 2.6639118303250328e-05, "epoch": 2.551351009701988, "percentage": 85.04, "elapsed_time": "3 days, 1:49:24", "remaining_time": "12:58:57", "throughput": 27866.27, "total_tokens": 7405866944} +{"current_steps": 25240, "total_steps": 29667, "loss": 0.3456, "lr": 2.663533825721321e-05, "epoch": 2.5523622918180955, "percentage": 85.08, "elapsed_time": "3 days, 1:51:05", "remaining_time": "12:57:11", "throughput": 27866.64, "total_tokens": 7408778304} +{"current_steps": 25250, "total_steps": 29667, "loss": 0.3535, "lr": 
2.6631559819866065e-05, "epoch": 2.5533735739342034, "percentage": 85.11, "elapsed_time": "3 days, 1:52:47", "remaining_time": "12:55:25", "throughput": 27866.96, "total_tokens": 7411702912} +{"current_steps": 25260, "total_steps": 29667, "loss": 0.3408, "lr": 2.662778299006819e-05, "epoch": 2.5543848560503113, "percentage": 85.15, "elapsed_time": "3 days, 1:54:29", "remaining_time": "12:53:39", "throughput": 27867.39, "total_tokens": 7414649536} +{"current_steps": 25270, "total_steps": 29667, "loss": 0.3425, "lr": 2.6624007766680004e-05, "epoch": 2.555396138166419, "percentage": 85.18, "elapsed_time": "3 days, 1:56:08", "remaining_time": "12:51:53", "throughput": 27868.02, "total_tokens": 7417590784} +{"current_steps": 25280, "total_steps": 29667, "loss": 0.35, "lr": 2.6620234148563066e-05, "epoch": 2.556407420282527, "percentage": 85.21, "elapsed_time": "3 days, 1:57:51", "remaining_time": "12:50:07", "throughput": 27868.17, "total_tokens": 7420493696} +{"current_steps": 25290, "total_steps": 29667, "loss": 0.348, "lr": 2.6616462134580072e-05, "epoch": 2.5574187023986346, "percentage": 85.25, "elapsed_time": "3 days, 1:59:30", "remaining_time": "12:48:21", "throughput": 27868.93, "total_tokens": 7423449664} +{"current_steps": 25300, "total_steps": 29667, "loss": 0.3473, "lr": 2.6612691723594835e-05, "epoch": 2.5584299845147425, "percentage": 85.28, "elapsed_time": "3 days, 2:01:05", "remaining_time": "12:46:34", "throughput": 27869.72, "total_tokens": 7426321536} +{"current_steps": 25310, "total_steps": 29667, "loss": 0.3469, "lr": 2.6608922914472283e-05, "epoch": 2.5594412666308504, "percentage": 85.31, "elapsed_time": "3 days, 2:02:48", "remaining_time": "12:44:48", "throughput": 27870.13, "total_tokens": 7429298048} +{"current_steps": 25320, "total_steps": 29667, "loss": 0.3452, "lr": 2.66051557060785e-05, "epoch": 2.5604525487469583, "percentage": 85.35, "elapsed_time": "3 days, 2:04:30", "remaining_time": "12:43:02", "throughput": 27870.52, "total_tokens": 
7432256128} +{"current_steps": 25330, "total_steps": 29667, "loss": 0.3492, "lr": 2.6601390097280665e-05, "epoch": 2.561463830863066, "percentage": 85.38, "elapsed_time": "3 days, 2:06:08", "remaining_time": "12:41:16", "throughput": 27871.22, "total_tokens": 7435159488} +{"current_steps": 25340, "total_steps": 29667, "loss": 0.3494, "lr": 2.6597626086947097e-05, "epoch": 2.562475112979174, "percentage": 85.41, "elapsed_time": "3 days, 2:07:51", "remaining_time": "12:39:30", "throughput": 27871.68, "total_tokens": 7438160320} +{"current_steps": 25350, "total_steps": 29667, "loss": 0.3478, "lr": 2.659386367394722e-05, "epoch": 2.563486395095282, "percentage": 85.45, "elapsed_time": "3 days, 2:09:28", "remaining_time": "12:37:43", "throughput": 27872.53, "total_tokens": 7441082560} +{"current_steps": 25360, "total_steps": 29667, "loss": 0.3432, "lr": 2.65901028571516e-05, "epoch": 2.5644976772113894, "percentage": 85.48, "elapsed_time": "3 days, 2:11:07", "remaining_time": "12:35:57", "throughput": 27873.11, "total_tokens": 7444014336} +{"current_steps": 25370, "total_steps": 29667, "loss": 0.3454, "lr": 2.6586343635431887e-05, "epoch": 2.5655089593274973, "percentage": 85.52, "elapsed_time": "3 days, 2:12:48", "remaining_time": "12:34:11", "throughput": 27873.75, "total_tokens": 7446978688} +{"current_steps": 25380, "total_steps": 29667, "loss": 0.3504, "lr": 2.658258600766088e-05, "epoch": 2.5665202414436052, "percentage": 85.55, "elapsed_time": "3 days, 2:14:24", "remaining_time": "12:32:24", "throughput": 27874.64, "total_tokens": 7449889984} +{"current_steps": 25390, "total_steps": 29667, "loss": 0.3479, "lr": 2.657882997271247e-05, "epoch": 2.567531523559713, "percentage": 85.58, "elapsed_time": "3 days, 2:16:01", "remaining_time": "12:30:37", "throughput": 27875.39, "total_tokens": 7452813568} +{"current_steps": 25400, "total_steps": 29667, "loss": 0.3452, "lr": 2.6575075529461685e-05, "epoch": 2.568542805675821, "percentage": 85.62, "elapsed_time": "3 days, 
2:17:44", "remaining_time": "12:28:51", "throughput": 27875.74, "total_tokens": 7455771584} +{"current_steps": 25410, "total_steps": 29667, "loss": 0.3439, "lr": 2.657132267678464e-05, "epoch": 2.5695540877919285, "percentage": 85.65, "elapsed_time": "3 days, 2:19:23", "remaining_time": "12:27:05", "throughput": 27876.43, "total_tokens": 7458723776} +{"current_steps": 25420, "total_steps": 29667, "loss": 0.3469, "lr": 2.656757141355857e-05, "epoch": 2.5705653699080364, "percentage": 85.68, "elapsed_time": "3 days, 2:21:06", "remaining_time": "12:25:19", "throughput": 27876.95, "total_tokens": 7461713984} +{"current_steps": 25430, "total_steps": 29667, "loss": 0.3464, "lr": 2.6563821738661833e-05, "epoch": 2.5715766520241443, "percentage": 85.72, "elapsed_time": "3 days, 2:22:47", "remaining_time": "12:23:33", "throughput": 27877.46, "total_tokens": 7464674816} +{"current_steps": 25440, "total_steps": 29667, "loss": 0.3437, "lr": 2.6560073650973873e-05, "epoch": 2.572587934140252, "percentage": 85.75, "elapsed_time": "3 days, 2:24:22", "remaining_time": "12:21:46", "throughput": 27878.39, "total_tokens": 7467571712} +{"current_steps": 25450, "total_steps": 29667, "loss": 0.3468, "lr": 2.655632714937525e-05, "epoch": 2.57359921625636, "percentage": 85.79, "elapsed_time": "3 days, 2:25:58", "remaining_time": "12:20:00", "throughput": 27879.29, "total_tokens": 7470489408} +{"current_steps": 25460, "total_steps": 29667, "loss": 0.3434, "lr": 2.6552582232747637e-05, "epoch": 2.5746104983724676, "percentage": 85.82, "elapsed_time": "3 days, 2:27:38", "remaining_time": "12:18:13", "throughput": 27879.83, "total_tokens": 7473428352} +{"current_steps": 25470, "total_steps": 29667, "loss": 0.3456, "lr": 2.6548838899973794e-05, "epoch": 2.575621780488576, "percentage": 85.85, "elapsed_time": "3 days, 2:29:19", "remaining_time": "12:16:27", "throughput": 27880.38, "total_tokens": 7476381760} +{"current_steps": 25480, "total_steps": 29667, "loss": 0.3461, "lr": 
2.6545097149937598e-05, "epoch": 2.5766330626046834, "percentage": 85.89, "elapsed_time": "3 days, 2:30:54", "remaining_time": "12:14:40", "throughput": 27881.28, "total_tokens": 7479287360} +{"current_steps": 25490, "total_steps": 29667, "loss": 0.3487, "lr": 2.6541356981524018e-05, "epoch": 2.5776443447207913, "percentage": 85.92, "elapsed_time": "3 days, 2:32:29", "remaining_time": "12:12:53", "throughput": 27882.17, "total_tokens": 7482169856} +{"current_steps": 25500, "total_steps": 29667, "loss": 0.3461, "lr": 2.653761839361913e-05, "epoch": 2.578655626836899, "percentage": 85.95, "elapsed_time": "3 days, 2:34:04", "remaining_time": "12:11:07", "throughput": 27883.11, "total_tokens": 7485075008} +{"current_steps": 25510, "total_steps": 29667, "loss": 0.3495, "lr": 2.6533881385110097e-05, "epoch": 2.579666908953007, "percentage": 85.99, "elapsed_time": "3 days, 2:35:40", "remaining_time": "12:09:20", "throughput": 27884.0, "total_tokens": 7487971840} +{"current_steps": 25520, "total_steps": 29667, "loss": 0.3508, "lr": 2.6530145954885187e-05, "epoch": 2.580678191069115, "percentage": 86.02, "elapsed_time": "3 days, 2:37:18", "remaining_time": "12:07:33", "throughput": 27884.64, "total_tokens": 7490889600} +{"current_steps": 25530, "total_steps": 29667, "loss": 0.3481, "lr": 2.6526412101833764e-05, "epoch": 2.5816894731852225, "percentage": 86.06, "elapsed_time": "3 days, 2:38:56", "remaining_time": "12:05:47", "throughput": 27885.24, "total_tokens": 7493786560} +{"current_steps": 25540, "total_steps": 29667, "loss": 0.3458, "lr": 2.6522679824846287e-05, "epoch": 2.5827007553013304, "percentage": 86.09, "elapsed_time": "3 days, 2:40:36", "remaining_time": "12:04:01", "throughput": 27885.73, "total_tokens": 7496710976} +{"current_steps": 25550, "total_steps": 29667, "loss": 0.3472, "lr": 2.6518949122814297e-05, "epoch": 2.5837120374174383, "percentage": 86.12, "elapsed_time": "3 days, 2:42:12", "remaining_time": "12:02:14", "throughput": 27886.52, 
"total_tokens": 7499602880} +{"current_steps": 25560, "total_steps": 29667, "loss": 0.3477, "lr": 2.651521999463043e-05, "epoch": 2.584723319533546, "percentage": 86.16, "elapsed_time": "3 days, 2:43:54", "remaining_time": "12:00:28", "throughput": 27887.09, "total_tokens": 7502579136} +{"current_steps": 25570, "total_steps": 29667, "loss": 0.3448, "lr": 2.651149243918842e-05, "epoch": 2.585734601649654, "percentage": 86.19, "elapsed_time": "3 days, 2:45:31", "remaining_time": "11:58:42", "throughput": 27888.04, "total_tokens": 7505540032} +{"current_steps": 25580, "total_steps": 29667, "loss": 0.3504, "lr": 2.650776645538308e-05, "epoch": 2.5867458837657615, "percentage": 86.22, "elapsed_time": "3 days, 2:47:07", "remaining_time": "11:56:55", "throughput": 27888.89, "total_tokens": 7508448576} +{"current_steps": 25590, "total_steps": 29667, "loss": 0.3481, "lr": 2.650404204211032e-05, "epoch": 2.58775716588187, "percentage": 86.26, "elapsed_time": "3 days, 2:48:48", "remaining_time": "11:55:09", "throughput": 27889.29, "total_tokens": 7511390976} +{"current_steps": 25600, "total_steps": 29667, "loss": 0.3485, "lr": 2.6500319198267126e-05, "epoch": 2.5887684479979773, "percentage": 86.29, "elapsed_time": "3 days, 2:50:29", "remaining_time": "11:53:23", "throughput": 27889.95, "total_tokens": 7514374720} +{"current_steps": 25610, "total_steps": 29667, "loss": 0.3454, "lr": 2.6496597922751572e-05, "epoch": 2.5897797301140852, "percentage": 86.32, "elapsed_time": "3 days, 2:52:09", "remaining_time": "11:51:37", "throughput": 27890.55, "total_tokens": 7517335808} +{"current_steps": 25620, "total_steps": 29667, "loss": 0.343, "lr": 2.6492878214462818e-05, "epoch": 2.590791012230193, "percentage": 86.36, "elapsed_time": "3 days, 2:53:43", "remaining_time": "11:49:50", "throughput": 27891.53, "total_tokens": 7520223808} +{"current_steps": 25630, "total_steps": 29667, "loss": 0.3483, "lr": 2.648916007230109e-05, "epoch": 2.591802294346301, "percentage": 86.39, 
"elapsed_time": "3 days, 2:55:20", "remaining_time": "11:48:03", "throughput": 27892.3, "total_tokens": 7523135168} +{"current_steps": 25640, "total_steps": 29667, "loss": 0.347, "lr": 2.6485443495167722e-05, "epoch": 2.592813576462409, "percentage": 86.43, "elapsed_time": "3 days, 2:56:56", "remaining_time": "11:46:17", "throughput": 27893.2, "total_tokens": 7526055168} +{"current_steps": 25650, "total_steps": 29667, "loss": 0.348, "lr": 2.6481728481965102e-05, "epoch": 2.5938248585785164, "percentage": 86.46, "elapsed_time": "3 days, 2:58:31", "remaining_time": "11:44:30", "throughput": 27894.18, "total_tokens": 7528963264} +{"current_steps": 25660, "total_steps": 29667, "loss": 0.3448, "lr": 2.6478015031596705e-05, "epoch": 2.5948361406946243, "percentage": 86.49, "elapsed_time": "3 days, 3:00:15", "remaining_time": "11:42:44", "throughput": 27894.5, "total_tokens": 7531946176} +{"current_steps": 25670, "total_steps": 29667, "loss": 0.3453, "lr": 2.6474303142967076e-05, "epoch": 2.595847422810732, "percentage": 86.53, "elapsed_time": "3 days, 3:01:53", "remaining_time": "11:40:58", "throughput": 27895.17, "total_tokens": 7534858560} +{"current_steps": 25680, "total_steps": 29667, "loss": 0.3483, "lr": 2.6470592814981852e-05, "epoch": 2.59685870492684, "percentage": 86.56, "elapsed_time": "3 days, 3:03:33", "remaining_time": "11:39:12", "throughput": 27895.75, "total_tokens": 7537812480} +{"current_steps": 25690, "total_steps": 29667, "loss": 0.3471, "lr": 2.6466884046547725e-05, "epoch": 2.597869987042948, "percentage": 86.59, "elapsed_time": "3 days, 3:05:10", "remaining_time": "11:37:26", "throughput": 27896.71, "total_tokens": 7540766464} +{"current_steps": 25700, "total_steps": 29667, "loss": 0.3451, "lr": 2.646317683657247e-05, "epoch": 2.5988812691590555, "percentage": 86.63, "elapsed_time": "3 days, 3:06:51", "remaining_time": "11:35:40", "throughput": 27897.01, "total_tokens": 7543679424} +{"current_steps": 25710, "total_steps": 29667, "loss": 0.3512, 
"lr": 2.645947118396491e-05, "epoch": 2.5998925512751634, "percentage": 86.66, "elapsed_time": "3 days, 3:08:32", "remaining_time": "11:33:54", "throughput": 27897.6, "total_tokens": 7546639744} +{"current_steps": 25720, "total_steps": 29667, "loss": 0.347, "lr": 2.6455767087634982e-05, "epoch": 2.6009038333912713, "percentage": 86.7, "elapsed_time": "3 days, 3:10:14", "remaining_time": "11:32:08", "throughput": 27897.82, "total_tokens": 7549558208} +{"current_steps": 25730, "total_steps": 29667, "loss": 0.3442, "lr": 2.6452064546493642e-05, "epoch": 2.601915115507379, "percentage": 86.73, "elapsed_time": "3 days, 3:11:54", "remaining_time": "11:30:22", "throughput": 27898.41, "total_tokens": 7552509824} +{"current_steps": 25740, "total_steps": 29667, "loss": 0.3455, "lr": 2.644836355945295e-05, "epoch": 2.602926397623487, "percentage": 86.76, "elapsed_time": "3 days, 3:13:30", "remaining_time": "11:28:35", "throughput": 27899.22, "total_tokens": 7555406336} +{"current_steps": 25750, "total_steps": 29667, "loss": 0.3489, "lr": 2.6444664125426012e-05, "epoch": 2.603937679739595, "percentage": 86.8, "elapsed_time": "3 days, 3:15:09", "remaining_time": "11:26:49", "throughput": 27899.9, "total_tokens": 7558345728} +{"current_steps": 25760, "total_steps": 29667, "loss": 0.3441, "lr": 2.6440966243326985e-05, "epoch": 2.604948961855703, "percentage": 86.83, "elapsed_time": "3 days, 3:16:46", "remaining_time": "11:25:03", "throughput": 27900.66, "total_tokens": 7561254528} +{"current_steps": 25770, "total_steps": 29667, "loss": 0.3446, "lr": 2.6437269912071132e-05, "epoch": 2.6059602439718104, "percentage": 86.86, "elapsed_time": "3 days, 3:18:26", "remaining_time": "11:23:17", "throughput": 27901.33, "total_tokens": 7564228608} +{"current_steps": 25780, "total_steps": 29667, "loss": 0.3431, "lr": 2.6433575130574732e-05, "epoch": 2.6069715260879183, "percentage": 86.9, "elapsed_time": "3 days, 3:20:04", "remaining_time": "11:21:31", "throughput": 27902.15, "total_tokens": 
7567189504} +{"current_steps": 25790, "total_steps": 29667, "loss": 0.3438, "lr": 2.6429881897755154e-05, "epoch": 2.607982808204026, "percentage": 86.93, "elapsed_time": "3 days, 3:21:43", "remaining_time": "11:19:44", "throughput": 27902.76, "total_tokens": 7570108672} +{"current_steps": 25800, "total_steps": 29667, "loss": 0.3489, "lr": 2.6426190212530806e-05, "epoch": 2.608994090320134, "percentage": 86.97, "elapsed_time": "3 days, 3:23:21", "remaining_time": "11:17:58", "throughput": 27903.47, "total_tokens": 7573056000} +{"current_steps": 25810, "total_steps": 29667, "loss": 0.3456, "lr": 2.6422500073821168e-05, "epoch": 2.610005372436242, "percentage": 87.0, "elapsed_time": "3 days, 3:25:06", "remaining_time": "11:16:13", "throughput": 27903.77, "total_tokens": 7576050496} +{"current_steps": 25820, "total_steps": 29667, "loss": 0.3375, "lr": 2.6418811480546757e-05, "epoch": 2.6110166545523494, "percentage": 87.03, "elapsed_time": "3 days, 3:26:48", "remaining_time": "11:14:27", "throughput": 27904.1, "total_tokens": 7578982080} +{"current_steps": 25830, "total_steps": 29667, "loss": 0.3443, "lr": 2.641512443162917e-05, "epoch": 2.6120279366684573, "percentage": 87.07, "elapsed_time": "3 days, 3:28:28", "remaining_time": "11:12:41", "throughput": 27904.6, "total_tokens": 7581927424} +{"current_steps": 25840, "total_steps": 29667, "loss": 0.3442, "lr": 2.6411438925991034e-05, "epoch": 2.6130392187845652, "percentage": 87.1, "elapsed_time": "3 days, 3:30:05", "remaining_time": "11:10:55", "throughput": 27905.35, "total_tokens": 7584817088} +{"current_steps": 25850, "total_steps": 29667, "loss": 0.3494, "lr": 2.6407754962556046e-05, "epoch": 2.614050500900673, "percentage": 87.13, "elapsed_time": "3 days, 3:31:45", "remaining_time": "11:09:09", "throughput": 27905.84, "total_tokens": 7587760960} +{"current_steps": 25860, "total_steps": 29667, "loss": 0.341, "lr": 2.640407254024894e-05, "epoch": 2.615061783016781, "percentage": 87.17, "elapsed_time": "3 days, 
3:33:22", "remaining_time": "11:07:23", "throughput": 27906.69, "total_tokens": 7590694784} +{"current_steps": 25870, "total_steps": 29667, "loss": 0.343, "lr": 2.640039165799551e-05, "epoch": 2.616073065132889, "percentage": 87.2, "elapsed_time": "3 days, 3:35:06", "remaining_time": "11:05:37", "throughput": 27906.93, "total_tokens": 7593659328} +{"current_steps": 25880, "total_steps": 29667, "loss": 0.3477, "lr": 2.6396712314722586e-05, "epoch": 2.617084347248997, "percentage": 87.23, "elapsed_time": "3 days, 3:36:41", "remaining_time": "11:03:51", "throughput": 27907.8, "total_tokens": 7596550400} +{"current_steps": 25890, "total_steps": 29667, "loss": 0.3442, "lr": 2.6393034509358054e-05, "epoch": 2.6180956293651043, "percentage": 87.27, "elapsed_time": "3 days, 3:38:20", "remaining_time": "11:02:05", "throughput": 27908.47, "total_tokens": 7599499776} +{"current_steps": 25900, "total_steps": 29667, "loss": 0.344, "lr": 2.6389358240830854e-05, "epoch": 2.619106911481212, "percentage": 87.3, "elapsed_time": "3 days, 3:39:55", "remaining_time": "11:00:18", "throughput": 27909.46, "total_tokens": 7602397888} +{"current_steps": 25910, "total_steps": 29667, "loss": 0.3411, "lr": 2.6385683508070942e-05, "epoch": 2.62011819359732, "percentage": 87.34, "elapsed_time": "3 days, 3:41:33", "remaining_time": "10:58:32", "throughput": 27910.01, "total_tokens": 7605305472} +{"current_steps": 25920, "total_steps": 29667, "loss": 0.3475, "lr": 2.6382010310009335e-05, "epoch": 2.621129475713428, "percentage": 87.37, "elapsed_time": "3 days, 3:43:13", "remaining_time": "10:56:46", "throughput": 27910.6, "total_tokens": 7608251648} +{"current_steps": 25930, "total_steps": 29667, "loss": 0.3544, "lr": 2.63783386455781e-05, "epoch": 2.622140757829536, "percentage": 87.4, "elapsed_time": "3 days, 3:44:51", "remaining_time": "10:55:00", "throughput": 27911.18, "total_tokens": 7611151808} +{"current_steps": 25940, "total_steps": 29667, "loss": 0.3439, "lr": 2.637466851371032e-05, 
"epoch": 2.6231520399456434, "percentage": 87.44, "elapsed_time": "3 days, 3:46:34", "remaining_time": "10:53:14", "throughput": 27911.72, "total_tokens": 7614151680} +{"current_steps": 25950, "total_steps": 29667, "loss": 0.3488, "lr": 2.637099991334015e-05, "epoch": 2.6241633220617513, "percentage": 87.47, "elapsed_time": "3 days, 3:48:08", "remaining_time": "10:51:27", "throughput": 27912.71, "total_tokens": 7617064448} +{"current_steps": 25960, "total_steps": 29667, "loss": 0.3399, "lr": 2.636733284340275e-05, "epoch": 2.625174604177859, "percentage": 87.5, "elapsed_time": "3 days, 3:49:46", "remaining_time": "10:49:41", "throughput": 27913.42, "total_tokens": 7619998784} +{"current_steps": 25970, "total_steps": 29667, "loss": 0.3497, "lr": 2.6363667302834326e-05, "epoch": 2.626185886293967, "percentage": 87.54, "elapsed_time": "3 days, 3:51:27", "remaining_time": "10:47:55", "throughput": 27913.93, "total_tokens": 7622952128} +{"current_steps": 25980, "total_steps": 29667, "loss": 0.3482, "lr": 2.636000329057214e-05, "epoch": 2.627197168410075, "percentage": 87.57, "elapsed_time": "3 days, 3:53:09", "remaining_time": "10:46:10", "throughput": 27914.27, "total_tokens": 7625885120} +{"current_steps": 25990, "total_steps": 29667, "loss": 0.3482, "lr": 2.6356340805554452e-05, "epoch": 2.6282084505261825, "percentage": 87.61, "elapsed_time": "3 days, 3:54:50", "remaining_time": "10:44:24", "throughput": 27914.8, "total_tokens": 7628850560} +{"current_steps": 26000, "total_steps": 29667, "loss": 0.3456, "lr": 2.635267984672058e-05, "epoch": 2.629219732642291, "percentage": 87.64, "elapsed_time": "3 days, 3:56:28", "remaining_time": "10:42:38", "throughput": 27915.52, "total_tokens": 7631775296} +{"current_steps": 26010, "total_steps": 29667, "loss": 0.3473, "lr": 2.6349020413010862e-05, "epoch": 2.6302310147583983, "percentage": 87.67, "elapsed_time": "3 days, 3:58:08", "remaining_time": "10:40:52", "throughput": 27916.08, "total_tokens": 7634717888} 
+{"current_steps": 26020, "total_steps": 29667, "loss": 0.3469, "lr": 2.6345362503366676e-05, "epoch": 2.631242296874506, "percentage": 87.71, "elapsed_time": "3 days, 3:59:44", "remaining_time": "10:39:06", "throughput": 27916.91, "total_tokens": 7637640960} +{"current_steps": 26030, "total_steps": 29667, "loss": 0.3496, "lr": 2.634170611673042e-05, "epoch": 2.632253578990614, "percentage": 87.74, "elapsed_time": "3 days, 4:01:24", "remaining_time": "10:37:20", "throughput": 27917.5, "total_tokens": 7640580864} +{"current_steps": 26040, "total_steps": 29667, "loss": 0.3453, "lr": 2.6338051252045516e-05, "epoch": 2.633264861106722, "percentage": 87.77, "elapsed_time": "3 days, 4:03:00", "remaining_time": "10:35:33", "throughput": 27918.35, "total_tokens": 7643508480} +{"current_steps": 26050, "total_steps": 29667, "loss": 0.3423, "lr": 2.6334397908256412e-05, "epoch": 2.63427614322283, "percentage": 87.81, "elapsed_time": "3 days, 4:04:43", "remaining_time": "10:33:48", "throughput": 27918.78, "total_tokens": 7646487296} +{"current_steps": 26060, "total_steps": 29667, "loss": 0.3482, "lr": 2.63307460843086e-05, "epoch": 2.6352874253389373, "percentage": 87.84, "elapsed_time": "3 days, 4:06:20", "remaining_time": "10:32:02", "throughput": 27919.46, "total_tokens": 7649399552} +{"current_steps": 26070, "total_steps": 29667, "loss": 0.3488, "lr": 2.6327095779148576e-05, "epoch": 2.6362987074550452, "percentage": 87.88, "elapsed_time": "3 days, 4:08:00", "remaining_time": "10:30:16", "throughput": 27920.17, "total_tokens": 7652381056} +{"current_steps": 26080, "total_steps": 29667, "loss": 0.3515, "lr": 2.6323446991723856e-05, "epoch": 2.637309989571153, "percentage": 87.91, "elapsed_time": "3 days, 4:09:41", "remaining_time": "10:28:30", "throughput": 27920.68, "total_tokens": 7655324992} +{"current_steps": 26090, "total_steps": 29667, "loss": 0.3434, "lr": 2.6319799720982985e-05, "epoch": 2.638321271687261, "percentage": 87.94, "elapsed_time": "3 days, 4:11:19", 
"remaining_time": "10:26:44", "throughput": 27921.44, "total_tokens": 7658267648} +{"current_steps": 26100, "total_steps": 29667, "loss": 0.3463, "lr": 2.6316153965875527e-05, "epoch": 2.639332553803369, "percentage": 87.98, "elapsed_time": "3 days, 4:12:56", "remaining_time": "10:24:58", "throughput": 27922.05, "total_tokens": 7661155456} +{"current_steps": 26110, "total_steps": 29667, "loss": 0.341, "lr": 2.6312509725352074e-05, "epoch": 2.6403438359194764, "percentage": 88.01, "elapsed_time": "3 days, 4:14:38", "remaining_time": "10:23:12", "throughput": 27922.61, "total_tokens": 7664145472} +{"current_steps": 26120, "total_steps": 29667, "loss": 0.3483, "lr": 2.6308866998364208e-05, "epoch": 2.6413551180355848, "percentage": 88.04, "elapsed_time": "3 days, 4:16:16", "remaining_time": "10:21:26", "throughput": 27923.37, "total_tokens": 7667107136} +{"current_steps": 26130, "total_steps": 29667, "loss": 0.3468, "lr": 2.6305225783864556e-05, "epoch": 2.642366400151692, "percentage": 88.08, "elapsed_time": "3 days, 4:17:56", "remaining_time": "10:19:40", "throughput": 27924.01, "total_tokens": 7670060224} +{"current_steps": 26140, "total_steps": 29667, "loss": 0.344, "lr": 2.6301586080806734e-05, "epoch": 2.6433776822678, "percentage": 88.11, "elapsed_time": "3 days, 4:19:36", "remaining_time": "10:17:54", "throughput": 27924.65, "total_tokens": 7673047872} +{"current_steps": 26150, "total_steps": 29667, "loss": 0.3443, "lr": 2.6297947888145395e-05, "epoch": 2.644388964383908, "percentage": 88.15, "elapsed_time": "3 days, 4:21:19", "remaining_time": "10:16:09", "throughput": 27924.88, "total_tokens": 7675978816} +{"current_steps": 26160, "total_steps": 29667, "loss": 0.3445, "lr": 2.6294311204836185e-05, "epoch": 2.645400246500016, "percentage": 88.18, "elapsed_time": "3 days, 4:23:05", "remaining_time": "10:14:24", "throughput": 27924.92, "total_tokens": 7678935488} +{"current_steps": 26170, "total_steps": 29667, "loss": 0.3472, "lr": 2.6290676029835777e-05, 
"epoch": 2.646411528616124, "percentage": 88.21, "elapsed_time": "3 days, 4:24:42", "remaining_time": "10:12:38", "throughput": 27925.78, "total_tokens": 7681883840} +{"current_steps": 26180, "total_steps": 29667, "loss": 0.3461, "lr": 2.6287042362101834e-05, "epoch": 2.6474228107322313, "percentage": 88.25, "elapsed_time": "3 days, 4:26:17", "remaining_time": "10:10:51", "throughput": 27926.59, "total_tokens": 7684758848} +{"current_steps": 26190, "total_steps": 29667, "loss": 0.3485, "lr": 2.628341020059304e-05, "epoch": 2.648434092848339, "percentage": 88.28, "elapsed_time": "3 days, 4:27:54", "remaining_time": "10:09:05", "throughput": 27927.22, "total_tokens": 7687652992} +{"current_steps": 26200, "total_steps": 29667, "loss": 0.3497, "lr": 2.627977954426909e-05, "epoch": 2.649445374964447, "percentage": 88.31, "elapsed_time": "3 days, 4:29:33", "remaining_time": "10:07:19", "throughput": 27927.7, "total_tokens": 7690547264} +{"current_steps": 26210, "total_steps": 29667, "loss": 0.3522, "lr": 2.627615039209067e-05, "epoch": 2.650456657080555, "percentage": 88.35, "elapsed_time": "3 days, 4:31:09", "remaining_time": "10:05:33", "throughput": 27928.54, "total_tokens": 7693471616} +{"current_steps": 26220, "total_steps": 29667, "loss": 0.3462, "lr": 2.6272522743019483e-05, "epoch": 2.651467939196663, "percentage": 88.38, "elapsed_time": "3 days, 4:32:46", "remaining_time": "10:03:47", "throughput": 27929.3, "total_tokens": 7696388160} +{"current_steps": 26230, "total_steps": 29667, "loss": 0.3476, "lr": 2.6268896596018234e-05, "epoch": 2.6524792213127704, "percentage": 88.41, "elapsed_time": "3 days, 4:34:26", "remaining_time": "10:02:01", "throughput": 27929.8, "total_tokens": 7699298432} +{"current_steps": 26240, "total_steps": 29667, "loss": 0.3463, "lr": 2.6265271950050624e-05, "epoch": 2.6534905034288783, "percentage": 88.45, "elapsed_time": "3 days, 4:36:04", "remaining_time": "10:00:15", "throughput": 27930.45, "total_tokens": 7702230144} 
+{"current_steps": 26250, "total_steps": 29667, "loss": 0.3463, "lr": 2.626164880408136e-05, "epoch": 2.654501785544986, "percentage": 88.48, "elapsed_time": "3 days, 4:37:38", "remaining_time": "9:58:28", "throughput": 27931.32, "total_tokens": 7705102720} +{"current_steps": 26260, "total_steps": 29667, "loss": 0.3499, "lr": 2.6258027157076137e-05, "epoch": 2.655513067661094, "percentage": 88.52, "elapsed_time": "3 days, 4:39:16", "remaining_time": "9:56:42", "throughput": 27931.93, "total_tokens": 7707993280} +{"current_steps": 26270, "total_steps": 29667, "loss": 0.3449, "lr": 2.625440700800167e-05, "epoch": 2.656524349777202, "percentage": 88.55, "elapsed_time": "3 days, 4:40:58", "remaining_time": "9:54:57", "throughput": 27932.26, "total_tokens": 7710939584} +{"current_steps": 26280, "total_steps": 29667, "loss": 0.3427, "lr": 2.6250788355825646e-05, "epoch": 2.65753563189331, "percentage": 88.58, "elapsed_time": "3 days, 4:42:41", "remaining_time": "9:53:12", "throughput": 27932.57, "total_tokens": 7713908352} +{"current_steps": 26290, "total_steps": 29667, "loss": 0.3468, "lr": 2.6247171199516767e-05, "epoch": 2.658546914009418, "percentage": 88.62, "elapsed_time": "3 days, 4:44:14", "remaining_time": "9:51:25", "throughput": 27933.59, "total_tokens": 7716792448} +{"current_steps": 26300, "total_steps": 29667, "loss": 0.3486, "lr": 2.6243555538044717e-05, "epoch": 2.6595581961255252, "percentage": 88.65, "elapsed_time": "3 days, 4:45:54", "remaining_time": "9:49:39", "throughput": 27934.06, "total_tokens": 7719708032} +{"current_steps": 26310, "total_steps": 29667, "loss": 0.3489, "lr": 2.6239941370380184e-05, "epoch": 2.660569478241633, "percentage": 88.68, "elapsed_time": "3 days, 4:47:29", "remaining_time": "9:47:53", "throughput": 27935.02, "total_tokens": 7722622016} +{"current_steps": 26320, "total_steps": 29667, "loss": 0.3491, "lr": 2.6236328695494834e-05, "epoch": 2.661580760357741, "percentage": 88.72, "elapsed_time": "3 days, 4:49:09", 
"remaining_time": "9:46:07", "throughput": 27935.64, "total_tokens": 7725590528} +{"current_steps": 26330, "total_steps": 29667, "loss": 0.3454, "lr": 2.6232717512361343e-05, "epoch": 2.662592042473849, "percentage": 88.75, "elapsed_time": "3 days, 4:50:47", "remaining_time": "9:44:21", "throughput": 27936.18, "total_tokens": 7728471168} +{"current_steps": 26340, "total_steps": 29667, "loss": 0.3455, "lr": 2.6229107819953357e-05, "epoch": 2.663603324589957, "percentage": 88.79, "elapsed_time": "3 days, 4:52:23", "remaining_time": "9:42:35", "throughput": 27937.06, "total_tokens": 7731392000} +{"current_steps": 26350, "total_steps": 29667, "loss": 0.3478, "lr": 2.6225499617245525e-05, "epoch": 2.6646146067060643, "percentage": 88.82, "elapsed_time": "3 days, 4:54:09", "remaining_time": "9:40:50", "throughput": 27937.12, "total_tokens": 7734369792} +{"current_steps": 26360, "total_steps": 29667, "loss": 0.3474, "lr": 2.6221892903213473e-05, "epoch": 2.665625888822172, "percentage": 88.85, "elapsed_time": "3 days, 4:55:45", "remaining_time": "9:39:04", "throughput": 27937.9, "total_tokens": 7737288064} +{"current_steps": 26370, "total_steps": 29667, "loss": 0.3463, "lr": 2.621828767683382e-05, "epoch": 2.66663717093828, "percentage": 88.89, "elapsed_time": "3 days, 4:57:24", "remaining_time": "9:37:18", "throughput": 27938.37, "total_tokens": 7740169792} +{"current_steps": 26380, "total_steps": 29667, "loss": 0.3498, "lr": 2.6214683937084162e-05, "epoch": 2.667648453054388, "percentage": 88.92, "elapsed_time": "3 days, 4:59:04", "remaining_time": "9:35:32", "throughput": 27938.83, "total_tokens": 7743087552} +{"current_steps": 26390, "total_steps": 29667, "loss": 0.3431, "lr": 2.621108168294309e-05, "epoch": 2.668659735170496, "percentage": 88.95, "elapsed_time": "3 days, 5:00:42", "remaining_time": "9:33:46", "throughput": 27939.57, "total_tokens": 7746024064} +{"current_steps": 26400, "total_steps": 29667, "loss": 0.3466, "lr": 2.620748091339016e-05, "epoch": 
2.669671017286604, "percentage": 88.99, "elapsed_time": "3 days, 5:02:19", "remaining_time": "9:32:00", "throughput": 27940.27, "total_tokens": 7748943616} +{"current_steps": 26410, "total_steps": 29667, "loss": 0.3489, "lr": 2.620388162740593e-05, "epoch": 2.6706822994027117, "percentage": 89.02, "elapsed_time": "3 days, 5:05:39", "remaining_time": "9:30:27", "throughput": 27930.95, "total_tokens": 7751931200} +{"current_steps": 26420, "total_steps": 29667, "loss": 0.3476, "lr": 2.620028382397192e-05, "epoch": 2.671693581518819, "percentage": 89.06, "elapsed_time": "3 days, 5:09:05", "remaining_time": "9:28:54", "throughput": 27920.69, "total_tokens": 7754843648} +{"current_steps": 26430, "total_steps": 29667, "loss": 0.3488, "lr": 2.6196687502070645e-05, "epoch": 2.672704863634927, "percentage": 89.09, "elapsed_time": "3 days, 5:12:18", "remaining_time": "9:27:20", "throughput": 27911.81, "total_tokens": 7757759808} +{"current_steps": 26440, "total_steps": 29667, "loss": 0.3449, "lr": 2.6193092660685577e-05, "epoch": 2.673716145751035, "percentage": 89.12, "elapsed_time": "3 days, 5:16:40", "remaining_time": "9:25:54", "throughput": 27896.03, "total_tokens": 7760694272} +{"current_steps": 26450, "total_steps": 29667, "loss": 0.3449, "lr": 2.618949929880118e-05, "epoch": 2.674727427867143, "percentage": 89.16, "elapsed_time": "3 days, 5:20:15", "remaining_time": "9:24:22", "throughput": 27885.2, "total_tokens": 7763670080} +{"current_steps": 26460, "total_steps": 29667, "loss": 0.3439, "lr": 2.618590741540289e-05, "epoch": 2.675738709983251, "percentage": 89.19, "elapsed_time": "3 days, 5:22:52", "remaining_time": "9:22:43", "throughput": 27879.89, "total_tokens": 7766561408} +{"current_steps": 26470, "total_steps": 29667, "loss": 0.3496, "lr": 2.6182317009477104e-05, "epoch": 2.6767499920993583, "percentage": 89.22, "elapsed_time": "3 days, 5:25:36", "remaining_time": "9:21:05", "throughput": 27873.94, "total_tokens": 7769488768} +{"current_steps": 26480, 
"total_steps": 29667, "loss": 0.3482, "lr": 2.617872808001122e-05, "epoch": 2.677761274215466, "percentage": 89.26, "elapsed_time": "3 days, 5:27:51", "remaining_time": "9:19:23", "throughput": 27871.11, "total_tokens": 7772454464} +{"current_steps": 26490, "total_steps": 29667, "loss": 0.3437, "lr": 2.6175140625993583e-05, "epoch": 2.678772556331574, "percentage": 89.29, "elapsed_time": "3 days, 5:31:03", "remaining_time": "9:17:48", "throughput": 27862.57, "total_tokens": 7775422144} +{"current_steps": 26500, "total_steps": 29667, "loss": 0.3448, "lr": 2.6171554646413508e-05, "epoch": 2.679783838447682, "percentage": 89.32, "elapsed_time": "3 days, 5:34:37", "remaining_time": "9:16:16", "throughput": 27851.75, "total_tokens": 7778369664} +{"current_steps": 26510, "total_steps": 29667, "loss": 0.344, "lr": 2.61679701402613e-05, "epoch": 2.68079512056379, "percentage": 89.36, "elapsed_time": "3 days, 5:38:12", "remaining_time": "9:14:43", "throughput": 27840.72, "total_tokens": 7781279488} +{"current_steps": 26520, "total_steps": 29667, "loss": 0.3506, "lr": 2.6164387106528197e-05, "epoch": 2.6818064026798973, "percentage": 89.39, "elapsed_time": "3 days, 5:41:08", "remaining_time": "9:13:06", "throughput": 27833.74, "total_tokens": 7784225920} +{"current_steps": 26530, "total_steps": 29667, "loss": 0.3465, "lr": 2.6160805544206447e-05, "epoch": 2.6828176847960057, "percentage": 89.43, "elapsed_time": "3 days, 5:43:49", "remaining_time": "9:11:27", "throughput": 27828.37, "total_tokens": 7787186432} +{"current_steps": 26540, "total_steps": 29667, "loss": 0.3478, "lr": 2.6157225452289223e-05, "epoch": 2.683828966912113, "percentage": 89.46, "elapsed_time": "3 days, 5:46:16", "remaining_time": "9:09:47", "throughput": 27824.11, "total_tokens": 7790094464} +{"current_steps": 26550, "total_steps": 29667, "loss": 0.3468, "lr": 2.6153646829770696e-05, "epoch": 2.684840249028221, "percentage": 89.49, "elapsed_time": "3 days, 5:48:43", "remaining_time": "9:08:06", 
"throughput": 27820.16, "total_tokens": 7793078272} +{"current_steps": 26560, "total_steps": 29667, "loss": 0.3493, "lr": 2.6150069675645972e-05, "epoch": 2.685851531144329, "percentage": 89.53, "elapsed_time": "3 days, 5:51:13", "remaining_time": "9:06:26", "throughput": 27815.72, "total_tokens": 7796021632} +{"current_steps": 26570, "total_steps": 29667, "loss": 0.3462, "lr": 2.6146493988911137e-05, "epoch": 2.686862813260437, "percentage": 89.56, "elapsed_time": "3 days, 5:53:29", "remaining_time": "9:04:44", "throughput": 27812.59, "total_tokens": 7798905216} +{"current_steps": 26580, "total_steps": 29667, "loss": 0.3497, "lr": 2.6142919768563224e-05, "epoch": 2.6878740953765448, "percentage": 89.59, "elapsed_time": "3 days, 5:55:52", "remaining_time": "9:03:03", "throughput": 27808.75, "total_tokens": 7801813120} +{"current_steps": 26590, "total_steps": 29667, "loss": 0.3485, "lr": 2.613934701360024e-05, "epoch": 2.688885377492652, "percentage": 89.63, "elapsed_time": "3 days, 5:57:54", "remaining_time": "9:01:19", "throughput": 27806.94, "total_tokens": 7804699840} +{"current_steps": 26600, "total_steps": 29667, "loss": 0.3444, "lr": 2.6135775723021143e-05, "epoch": 2.68989665960876, "percentage": 89.66, "elapsed_time": "3 days, 6:00:07", "remaining_time": "8:59:37", "throughput": 27804.27, "total_tokens": 7807646272} +{"current_steps": 26610, "total_steps": 29667, "loss": 0.3474, "lr": 2.613220589582585e-05, "epoch": 2.690907941724868, "percentage": 89.7, "elapsed_time": "3 days, 6:02:17", "remaining_time": "8:57:54", "throughput": 27801.76, "total_tokens": 7810548032} +{"current_steps": 26620, "total_steps": 29667, "loss": 0.3449, "lr": 2.612863753101522e-05, "epoch": 2.691919223840976, "percentage": 89.73, "elapsed_time": "3 days, 6:04:25", "remaining_time": "8:56:11", "throughput": 27799.53, "total_tokens": 7813487168} +{"current_steps": 26630, "total_steps": 29667, "loss": 0.35, "lr": 2.612507062759109e-05, "epoch": 2.692930505957084, "percentage": 
89.76, "elapsed_time": "3 days, 6:06:36", "remaining_time": "8:54:28", "throughput": 27797.07, "total_tokens": 7816431680} +{"current_steps": 26640, "total_steps": 29667, "loss": 0.3497, "lr": 2.612150518455625e-05, "epoch": 2.6939417880731913, "percentage": 89.8, "elapsed_time": "3 days, 6:08:42", "remaining_time": "8:52:45", "throughput": 27794.98, "total_tokens": 7819362688} +{"current_steps": 26650, "total_steps": 29667, "loss": 0.3409, "lr": 2.6117941200914407e-05, "epoch": 2.6949530701892996, "percentage": 89.83, "elapsed_time": "3 days, 6:10:54", "remaining_time": "8:51:02", "throughput": 27792.48, "total_tokens": 7822307136} +{"current_steps": 26660, "total_steps": 29667, "loss": 0.3445, "lr": 2.6114378675670266e-05, "epoch": 2.695964352305407, "percentage": 89.86, "elapsed_time": "3 days, 6:13:00", "remaining_time": "8:49:19", "throughput": 27790.39, "total_tokens": 7825243264} +{"current_steps": 26670, "total_steps": 29667, "loss": 0.3499, "lr": 2.611081760782944e-05, "epoch": 2.696975634421515, "percentage": 89.9, "elapsed_time": "3 days, 6:15:08", "remaining_time": "8:47:36", "throughput": 27788.22, "total_tokens": 7828185088} +{"current_steps": 26680, "total_steps": 29667, "loss": 0.3436, "lr": 2.6107257996398533e-05, "epoch": 2.697986916537623, "percentage": 89.93, "elapsed_time": "3 days, 6:17:19", "remaining_time": "8:45:53", "throughput": 27785.8, "total_tokens": 7831138944} +{"current_steps": 26690, "total_steps": 29667, "loss": 0.3478, "lr": 2.610369984038506e-05, "epoch": 2.698998198653731, "percentage": 89.97, "elapsed_time": "3 days, 6:19:28", "remaining_time": "8:44:10", "throughput": 27783.35, "total_tokens": 7834033472} +{"current_steps": 26700, "total_steps": 29667, "loss": 0.3447, "lr": 2.6100143138797508e-05, "epoch": 2.7000094807698387, "percentage": 90.0, "elapsed_time": "3 days, 6:21:43", "remaining_time": "8:42:28", "throughput": 27780.49, "total_tokens": 7836959872} +{"current_steps": 26710, "total_steps": 29667, "loss": 0.3499, 
"lr": 2.6096587890645286e-05, "epoch": 2.701020762885946, "percentage": 90.03, "elapsed_time": "3 days, 6:24:26", "remaining_time": "8:40:49", "throughput": 27774.66, "total_tokens": 7839867776} +{"current_steps": 26720, "total_steps": 29667, "loss": 0.3485, "lr": 2.6093034094938772e-05, "epoch": 2.702032045002054, "percentage": 90.07, "elapsed_time": "3 days, 6:26:57", "remaining_time": "8:39:08", "throughput": 27770.16, "total_tokens": 7842768896} +{"current_steps": 26730, "total_steps": 29667, "loss": 0.3498, "lr": 2.608948175068927e-05, "epoch": 2.703043327118162, "percentage": 90.1, "elapsed_time": "3 days, 6:29:35", "remaining_time": "8:37:28", "throughput": 27765.04, "total_tokens": 7845707456} +{"current_steps": 26740, "total_steps": 29667, "loss": 0.3447, "lr": 2.6085930856909035e-05, "epoch": 2.70405460923427, "percentage": 90.13, "elapsed_time": "3 days, 6:31:55", "remaining_time": "8:35:46", "throughput": 27761.54, "total_tokens": 7848621696} +{"current_steps": 26750, "total_steps": 29667, "loss": 0.349, "lr": 2.608238141261126e-05, "epoch": 2.705065891350378, "percentage": 90.17, "elapsed_time": "3 days, 6:34:15", "remaining_time": "8:34:04", "throughput": 27758.08, "total_tokens": 7851520896} +{"current_steps": 26760, "total_steps": 29667, "loss": 0.3431, "lr": 2.6078833416810072e-05, "epoch": 2.7060771734664852, "percentage": 90.2, "elapsed_time": "3 days, 6:36:55", "remaining_time": "8:32:24", "throughput": 27752.64, "total_tokens": 7854427200} +{"current_steps": 26770, "total_steps": 29667, "loss": 0.3451, "lr": 2.6075286868520543e-05, "epoch": 2.707088455582593, "percentage": 90.23, "elapsed_time": "3 days, 6:39:13", "remaining_time": "8:30:42", "throughput": 27749.33, "total_tokens": 7857325440} +{"current_steps": 26780, "total_steps": 29667, "loss": 0.3483, "lr": 2.6071741766758678e-05, "epoch": 2.708099737698701, "percentage": 90.27, "elapsed_time": "3 days, 6:41:24", "remaining_time": "8:28:59", "throughput": 27746.65, "total_tokens": 
7860192960} +{"current_steps": 26790, "total_steps": 29667, "loss": 0.3449, "lr": 2.6068198110541432e-05, "epoch": 2.709111019814809, "percentage": 90.3, "elapsed_time": "3 days, 6:43:25", "remaining_time": "8:27:15", "throughput": 27745.22, "total_tokens": 7863146432} +{"current_steps": 26800, "total_steps": 29667, "loss": 0.3431, "lr": 2.606465589888667e-05, "epoch": 2.710122301930917, "percentage": 90.34, "elapsed_time": "3 days, 6:45:29", "remaining_time": "8:25:31", "throughput": 27743.47, "total_tokens": 7866088384} +{"current_steps": 26810, "total_steps": 29667, "loss": 0.3468, "lr": 2.606111513081321e-05, "epoch": 2.7111335840470248, "percentage": 90.37, "elapsed_time": "3 days, 6:47:37", "remaining_time": "8:23:47", "throughput": 27741.06, "total_tokens": 7868958400} +{"current_steps": 26820, "total_steps": 29667, "loss": 0.3492, "lr": 2.60575758053408e-05, "epoch": 2.7121448661631327, "percentage": 90.4, "elapsed_time": "3 days, 6:49:47", "remaining_time": "8:22:04", "throughput": 27738.76, "total_tokens": 7871918848} +{"current_steps": 26830, "total_steps": 29667, "loss": 0.3485, "lr": 2.605403792149012e-05, "epoch": 2.71315614827924, "percentage": 90.44, "elapsed_time": "3 days, 6:52:14", "remaining_time": "8:20:23", "throughput": 27734.74, "total_tokens": 7874839424} +{"current_steps": 26840, "total_steps": 29667, "loss": 0.3464, "lr": 2.6050501478282775e-05, "epoch": 2.714167430395348, "percentage": 90.47, "elapsed_time": "3 days, 6:55:09", "remaining_time": "8:18:44", "throughput": 27728.07, "total_tokens": 7877802240} +{"current_steps": 26850, "total_steps": 29667, "loss": 0.3514, "lr": 2.6046966474741293e-05, "epoch": 2.715178712511456, "percentage": 90.5, "elapsed_time": "3 days, 6:57:32", "remaining_time": "8:17:02", "throughput": 27724.19, "total_tokens": 7880685376} +{"current_steps": 26860, "total_steps": 29667, "loss": 0.3473, "lr": 2.6043432909889148e-05, "epoch": 2.716189994627564, "percentage": 90.54, "elapsed_time": "3 days, 6:59:32", 
"remaining_time": "8:15:18", "throughput": 27722.89, "total_tokens": 7883622912} +{"current_steps": 26870, "total_steps": 29667, "loss": 0.3487, "lr": 2.6039900782750737e-05, "epoch": 2.7172012767436717, "percentage": 90.57, "elapsed_time": "3 days, 7:01:38", "remaining_time": "8:13:34", "throughput": 27720.97, "total_tokens": 7886575488} +{"current_steps": 26880, "total_steps": 29667, "loss": 0.3412, "lr": 2.6036370092351377e-05, "epoch": 2.718212558859779, "percentage": 90.61, "elapsed_time": "3 days, 7:03:48", "remaining_time": "8:11:51", "throughput": 27718.55, "total_tokens": 7889488000} +{"current_steps": 26890, "total_steps": 29667, "loss": 0.3455, "lr": 2.6032840837717298e-05, "epoch": 2.719223840975887, "percentage": 90.64, "elapsed_time": "3 days, 7:05:57", "remaining_time": "8:10:07", "throughput": 27716.5, "total_tokens": 7892470080} +{"current_steps": 26900, "total_steps": 29667, "loss": 0.3475, "lr": 2.6029313017875682e-05, "epoch": 2.720235123091995, "percentage": 90.67, "elapsed_time": "3 days, 7:07:58", "remaining_time": "8:08:23", "throughput": 27715.15, "total_tokens": 7895443456} +{"current_steps": 26910, "total_steps": 29667, "loss": 0.344, "lr": 2.602578663185461e-05, "epoch": 2.721246405208103, "percentage": 90.71, "elapsed_time": "3 days, 7:10:13", "remaining_time": "8:06:40", "throughput": 27712.28, "total_tokens": 7898376384} +{"current_steps": 26920, "total_steps": 29667, "loss": 0.3457, "lr": 2.6022261678683102e-05, "epoch": 2.722257687324211, "percentage": 90.74, "elapsed_time": "3 days, 7:12:22", "remaining_time": "8:04:56", "throughput": 27709.93, "total_tokens": 7901285824} +{"current_steps": 26930, "total_steps": 29667, "loss": 0.3479, "lr": 2.601873815739108e-05, "epoch": 2.7232689694403187, "percentage": 90.77, "elapsed_time": "3 days, 7:14:29", "remaining_time": "8:03:13", "throughput": 27707.92, "total_tokens": 7904226496} +{"current_steps": 26940, "total_steps": 29667, "loss": 0.3545, "lr": 2.6015216067009395e-05, "epoch": 
2.7242802515564266, "percentage": 90.81, "elapsed_time": "3 days, 7:16:39", "remaining_time": "8:01:29", "throughput": 27705.46, "total_tokens": 7907123840} +{"current_steps": 26950, "total_steps": 29667, "loss": 0.3427, "lr": 2.6011695406569824e-05, "epoch": 2.725291533672534, "percentage": 90.84, "elapsed_time": "3 days, 7:19:10", "remaining_time": "7:59:48", "throughput": 27701.34, "total_tokens": 7910129408} +{"current_steps": 26960, "total_steps": 29667, "loss": 0.3456, "lr": 2.6008176175105048e-05, "epoch": 2.726302815788642, "percentage": 90.88, "elapsed_time": "3 days, 7:21:35", "remaining_time": "7:58:06", "throughput": 27697.42, "total_tokens": 7913038720} +{"current_steps": 26970, "total_steps": 29667, "loss": 0.346, "lr": 2.6004658371648672e-05, "epoch": 2.72731409790475, "percentage": 90.91, "elapsed_time": "3 days, 7:23:44", "remaining_time": "7:56:22", "throughput": 27695.08, "total_tokens": 7915936384} +{"current_steps": 26980, "total_steps": 29667, "loss": 0.3494, "lr": 2.6001141995235195e-05, "epoch": 2.728325380020858, "percentage": 90.94, "elapsed_time": "3 days, 7:25:50", "remaining_time": "7:54:38", "throughput": 27693.05, "total_tokens": 7918845888} +{"current_steps": 26990, "total_steps": 29667, "loss": 0.3446, "lr": 2.599762704490007e-05, "epoch": 2.7293366621369657, "percentage": 90.98, "elapsed_time": "3 days, 7:28:14", "remaining_time": "7:52:56", "throughput": 27689.44, "total_tokens": 7921789504} +{"current_steps": 27000, "total_steps": 29667, "loss": 0.3474, "lr": 2.599411351967963e-05, "epoch": 2.730347944253073, "percentage": 91.01, "elapsed_time": "3 days, 7:30:17", "remaining_time": "7:51:11", "throughput": 27687.8, "total_tokens": 7924722688} +{"current_steps": 27010, "total_steps": 29667, "loss": 0.3474, "lr": 2.5990601418611127e-05, "epoch": 2.731359226369181, "percentage": 91.04, "elapsed_time": "3 days, 7:32:33", "remaining_time": "7:49:28", "throughput": 27684.76, "total_tokens": 7927630976} +{"current_steps": 27020, 
"total_steps": 29667, "loss": 0.3495, "lr": 2.598709074073272e-05, "epoch": 2.732370508485289, "percentage": 91.08, "elapsed_time": "3 days, 7:34:41", "remaining_time": "7:47:45", "throughput": 27682.53, "total_tokens": 7930537152} +{"current_steps": 27030, "total_steps": 29667, "loss": 0.3486, "lr": 2.5983581485083498e-05, "epoch": 2.733381790601397, "percentage": 91.11, "elapsed_time": "3 days, 7:37:18", "remaining_time": "7:46:03", "throughput": 27677.55, "total_tokens": 7933453120} +{"current_steps": 27040, "total_steps": 29667, "loss": 0.3466, "lr": 2.598007365070343e-05, "epoch": 2.7343930727175048, "percentage": 91.15, "elapsed_time": "3 days, 7:39:47", "remaining_time": "7:44:22", "throughput": 27673.32, "total_tokens": 7936350272} +{"current_steps": 27050, "total_steps": 29667, "loss": 0.3468, "lr": 2.5976567236633403e-05, "epoch": 2.735404354833612, "percentage": 91.18, "elapsed_time": "3 days, 7:42:08", "remaining_time": "7:42:39", "throughput": 27670.08, "total_tokens": 7939331776} +{"current_steps": 27060, "total_steps": 29667, "loss": 0.348, "lr": 2.5973062241915225e-05, "epoch": 2.7364156369497206, "percentage": 91.21, "elapsed_time": "3 days, 7:44:23", "remaining_time": "7:40:56", "throughput": 27667.41, "total_tokens": 7942300480} +{"current_steps": 27070, "total_steps": 29667, "loss": 0.3504, "lr": 2.5969558665591576e-05, "epoch": 2.737426919065828, "percentage": 91.25, "elapsed_time": "3 days, 7:46:24", "remaining_time": "7:39:11", "throughput": 27666.04, "total_tokens": 7945250112} +{"current_steps": 27080, "total_steps": 29667, "loss": 0.3483, "lr": 2.5966056506706078e-05, "epoch": 2.738438201181936, "percentage": 91.28, "elapsed_time": "3 days, 7:48:34", "remaining_time": "7:37:27", "throughput": 27663.75, "total_tokens": 7948208832} +{"current_steps": 27090, "total_steps": 29667, "loss": 0.3458, "lr": 2.596255576430322e-05, "epoch": 2.739449483298044, "percentage": 91.31, "elapsed_time": "3 days, 7:51:10", "remaining_time": "7:35:46", 
"throughput": 27659.14, "total_tokens": 7951175680} +{"current_steps": 27100, "total_steps": 29667, "loss": 0.3462, "lr": 2.5959056437428414e-05, "epoch": 2.7404607654141517, "percentage": 91.35, "elapsed_time": "3 days, 7:53:56", "remaining_time": "7:34:05", "throughput": 27653.21, "total_tokens": 7954086464} +{"current_steps": 27110, "total_steps": 29667, "loss": 0.344, "lr": 2.5955558525127977e-05, "epoch": 2.7414720475302596, "percentage": 91.38, "elapsed_time": "3 days, 7:56:20", "remaining_time": "7:32:23", "throughput": 27649.4, "total_tokens": 7956969088} +{"current_steps": 27120, "total_steps": 29667, "loss": 0.3501, "lr": 2.5952062026449096e-05, "epoch": 2.742483329646367, "percentage": 91.41, "elapsed_time": "3 days, 7:59:07", "remaining_time": "7:30:42", "throughput": 27643.68, "total_tokens": 7959935680} +{"current_steps": 27130, "total_steps": 29667, "loss": 0.3424, "lr": 2.59485669404399e-05, "epoch": 2.743494611762475, "percentage": 91.45, "elapsed_time": "3 days, 8:01:42", "remaining_time": "7:29:01", "throughput": 27638.88, "total_tokens": 7962824000} +{"current_steps": 27140, "total_steps": 29667, "loss": 0.3446, "lr": 2.5945073266149366e-05, "epoch": 2.744505893878583, "percentage": 91.48, "elapsed_time": "3 days, 8:04:06", "remaining_time": "7:27:18", "throughput": 27635.31, "total_tokens": 7965788032} +{"current_steps": 27150, "total_steps": 29667, "loss": 0.3421, "lr": 2.594158100262741e-05, "epoch": 2.745517175994691, "percentage": 91.52, "elapsed_time": "3 days, 8:06:43", "remaining_time": "7:25:37", "throughput": 27630.66, "total_tokens": 7968769472} +{"current_steps": 27160, "total_steps": 29667, "loss": 0.3466, "lr": 2.5938090148924815e-05, "epoch": 2.7465284581107987, "percentage": 91.55, "elapsed_time": "3 days, 8:08:47", "remaining_time": "7:23:52", "throughput": 27628.93, "total_tokens": 7971713792} +{"current_steps": 27170, "total_steps": 29667, "loss": 0.3445, "lr": 2.5934600704093282e-05, "epoch": 2.747539740226906, "percentage": 
91.58, "elapsed_time": "3 days, 8:10:41", "remaining_time": "7:22:06", "throughput": 27628.14, "total_tokens": 7974636032} +{"current_steps": 27180, "total_steps": 29667, "loss": 0.3503, "lr": 2.5931112667185365e-05, "epoch": 2.7485510223430145, "percentage": 91.62, "elapsed_time": "3 days, 8:12:37", "remaining_time": "7:20:21", "throughput": 27627.21, "total_tokens": 7977570432} +{"current_steps": 27190, "total_steps": 29667, "loss": 0.3441, "lr": 2.592762603725456e-05, "epoch": 2.749562304459122, "percentage": 91.65, "elapsed_time": "3 days, 8:14:44", "remaining_time": "7:18:37", "throughput": 27625.24, "total_tokens": 7980511296} +{"current_steps": 27200, "total_steps": 29667, "loss": 0.3475, "lr": 2.592414081335522e-05, "epoch": 2.75057358657523, "percentage": 91.68, "elapsed_time": "3 days, 8:16:56", "remaining_time": "7:16:53", "throughput": 27622.83, "total_tokens": 7983459712} +{"current_steps": 27210, "total_steps": 29667, "loss": 0.3463, "lr": 2.592065699454259e-05, "epoch": 2.751584868691338, "percentage": 91.72, "elapsed_time": "3 days, 8:18:53", "remaining_time": "7:15:08", "throughput": 27621.94, "total_tokens": 7986420800} +{"current_steps": 27220, "total_steps": 29667, "loss": 0.3466, "lr": 2.5917174579872815e-05, "epoch": 2.7525961508074457, "percentage": 91.75, "elapsed_time": "3 days, 8:21:20", "remaining_time": "7:13:25", "throughput": 27618.09, "total_tokens": 7989382336} +{"current_steps": 27230, "total_steps": 29667, "loss": 0.3522, "lr": 2.5913693568402926e-05, "epoch": 2.7536074329235536, "percentage": 91.79, "elapsed_time": "3 days, 8:23:30", "remaining_time": "7:11:41", "throughput": 27615.86, "total_tokens": 7992311808} +{"current_steps": 27240, "total_steps": 29667, "loss": 0.3444, "lr": 2.5910213959190833e-05, "epoch": 2.754618715039661, "percentage": 91.82, "elapsed_time": "3 days, 8:26:00", "remaining_time": "7:09:58", "throughput": 27611.71, "total_tokens": 7995245888} +{"current_steps": 27250, "total_steps": 29667, "loss": 0.345, 
"lr": 2.590673575129534e-05, "epoch": 2.755629997155769, "percentage": 91.85, "elapsed_time": "3 days, 8:28:41", "remaining_time": "7:08:17", "throughput": 27606.5, "total_tokens": 7998193792} +{"current_steps": 27260, "total_steps": 29667, "loss": 0.343, "lr": 2.5903258943776116e-05, "epoch": 2.756641279271877, "percentage": 91.89, "elapsed_time": "3 days, 8:30:42", "remaining_time": "7:06:32", "throughput": 27605.24, "total_tokens": 8001180096} +{"current_steps": 27270, "total_steps": 29667, "loss": 0.3489, "lr": 2.5899783535693745e-05, "epoch": 2.7576525613879848, "percentage": 91.92, "elapsed_time": "3 days, 8:32:48", "remaining_time": "7:04:47", "throughput": 27603.37, "total_tokens": 8004106432} +{"current_steps": 27280, "total_steps": 29667, "loss": 0.3406, "lr": 2.5896309526109663e-05, "epoch": 2.7586638435040927, "percentage": 91.95, "elapsed_time": "3 days, 8:34:55", "remaining_time": "7:03:03", "throughput": 27601.31, "total_tokens": 8007015552} +{"current_steps": 27290, "total_steps": 29667, "loss": 0.346, "lr": 2.589283691408621e-05, "epoch": 2.7596751256202, "percentage": 91.99, "elapsed_time": "3 days, 8:37:17", "remaining_time": "7:01:20", "throughput": 27597.89, "total_tokens": 8009937472} +{"current_steps": 27300, "total_steps": 29667, "loss": 0.3434, "lr": 2.588936569868658e-05, "epoch": 2.760686407736308, "percentage": 92.02, "elapsed_time": "3 days, 8:39:31", "remaining_time": "6:59:36", "throughput": 27595.31, "total_tokens": 8012888896} +{"current_steps": 27310, "total_steps": 29667, "loss": 0.3508, "lr": 2.5885895878974877e-05, "epoch": 2.761697689852416, "percentage": 92.06, "elapsed_time": "3 days, 8:41:38", "remaining_time": "6:57:51", "throughput": 27593.42, "total_tokens": 8015840512} +{"current_steps": 27320, "total_steps": 29667, "loss": 0.3425, "lr": 2.5882427454016055e-05, "epoch": 2.762708971968524, "percentage": 92.09, "elapsed_time": "3 days, 8:43:41", "remaining_time": "6:56:06", "throughput": 27591.91, "total_tokens": 
8018796096} +{"current_steps": 27330, "total_steps": 29667, "loss": 0.3517, "lr": 2.587896042287596e-05, "epoch": 2.7637202540846317, "percentage": 92.12, "elapsed_time": "3 days, 8:45:45", "remaining_time": "6:54:21", "throughput": 27590.21, "total_tokens": 8021720896} +{"current_steps": 27340, "total_steps": 29667, "loss": 0.3427, "lr": 2.5875494784621317e-05, "epoch": 2.7647315362007396, "percentage": 92.16, "elapsed_time": "3 days, 8:47:43", "remaining_time": "6:52:36", "throughput": 27588.92, "total_tokens": 8024617280} +{"current_steps": 27350, "total_steps": 29667, "loss": 0.3454, "lr": 2.587203053831971e-05, "epoch": 2.7657428183168475, "percentage": 92.19, "elapsed_time": "3 days, 8:49:54", "remaining_time": "6:50:52", "throughput": 27586.61, "total_tokens": 8027549696} +{"current_steps": 27360, "total_steps": 29667, "loss": 0.3463, "lr": 2.586856768303961e-05, "epoch": 2.766754100432955, "percentage": 92.22, "elapsed_time": "3 days, 8:52:28", "remaining_time": "6:49:09", "throughput": 27582.0, "total_tokens": 8030465024} +{"current_steps": 27370, "total_steps": 29667, "loss": 0.3447, "lr": 2.586510621785036e-05, "epoch": 2.767765382549063, "percentage": 92.26, "elapsed_time": "3 days, 8:54:48", "remaining_time": "6:47:26", "throughput": 27578.85, "total_tokens": 8033412480} +{"current_steps": 27380, "total_steps": 29667, "loss": 0.3466, "lr": 2.5861646141822164e-05, "epoch": 2.768776664665171, "percentage": 92.29, "elapsed_time": "3 days, 8:57:17", "remaining_time": "6:45:43", "throughput": 27574.92, "total_tokens": 8036358912} +{"current_steps": 27390, "total_steps": 29667, "loss": 0.3463, "lr": 2.5858187454026106e-05, "epoch": 2.7697879467812787, "percentage": 92.32, "elapsed_time": "3 days, 8:59:30", "remaining_time": "6:43:58", "throughput": 27572.52, "total_tokens": 8039330112} +{"current_steps": 27400, "total_steps": 29667, "loss": 0.3499, "lr": 2.5854730153534134e-05, "epoch": 2.7707992288973866, "percentage": 92.36, "elapsed_time": "3 days, 
9:01:59", "remaining_time": "6:42:16", "throughput": 27568.33, "total_tokens": 8042225664} +{"current_steps": 27410, "total_steps": 29667, "loss": 0.3466, "lr": 2.585127423941907e-05, "epoch": 2.771810511013494, "percentage": 92.39, "elapsed_time": "3 days, 9:04:29", "remaining_time": "6:40:33", "throughput": 27564.41, "total_tokens": 8045202688} +{"current_steps": 27420, "total_steps": 29667, "loss": 0.341, "lr": 2.58478197107546e-05, "epoch": 2.772821793129602, "percentage": 92.43, "elapsed_time": "3 days, 9:07:07", "remaining_time": "6:38:50", "throughput": 27559.71, "total_tokens": 8048196544} +{"current_steps": 27430, "total_steps": 29667, "loss": 0.3468, "lr": 2.5844366566615273e-05, "epoch": 2.77383307524571, "percentage": 92.46, "elapsed_time": "3 days, 9:09:17", "remaining_time": "6:37:06", "throughput": 27557.65, "total_tokens": 8051176704} +{"current_steps": 27440, "total_steps": 29667, "loss": 0.3457, "lr": 2.584091480607651e-05, "epoch": 2.774844357361818, "percentage": 92.49, "elapsed_time": "3 days, 9:11:29", "remaining_time": "6:35:21", "throughput": 27555.3, "total_tokens": 8054113280} +{"current_steps": 27450, "total_steps": 29667, "loss": 0.3456, "lr": 2.5837464428214592e-05, "epoch": 2.7758556394779257, "percentage": 92.53, "elapsed_time": "3 days, 9:13:35", "remaining_time": "6:33:36", "throughput": 27553.45, "total_tokens": 8057050176} +{"current_steps": 27460, "total_steps": 29667, "loss": 0.3474, "lr": 2.5834015432106666e-05, "epoch": 2.7768669215940336, "percentage": 92.56, "elapsed_time": "3 days, 9:15:38", "remaining_time": "6:31:51", "throughput": 27551.91, "total_tokens": 8059996160} +{"current_steps": 27470, "total_steps": 29667, "loss": 0.3472, "lr": 2.5830567816830737e-05, "epoch": 2.7778782037101415, "percentage": 92.59, "elapsed_time": "3 days, 9:17:48", "remaining_time": "6:30:07", "throughput": 27549.7, "total_tokens": 8062943232} +{"current_steps": 27480, "total_steps": 29667, "loss": 0.3483, "lr": 2.5827121581465668e-05, 
"epoch": 2.778889485826249, "percentage": 92.63, "elapsed_time": "3 days, 9:19:55", "remaining_time": "6:28:22", "throughput": 27547.73, "total_tokens": 8065864704} +{"current_steps": 27490, "total_steps": 29667, "loss": 0.3457, "lr": 2.5823676725091193e-05, "epoch": 2.779900767942357, "percentage": 92.66, "elapsed_time": "3 days, 9:22:29", "remaining_time": "6:26:39", "throughput": 27543.35, "total_tokens": 8068807872} +{"current_steps": 27500, "total_steps": 29667, "loss": 0.3462, "lr": 2.5820233246787902e-05, "epoch": 2.7809120500584648, "percentage": 92.7, "elapsed_time": "3 days, 9:24:44", "remaining_time": "6:24:55", "throughput": 27540.82, "total_tokens": 8071790848} +{"current_steps": 27510, "total_steps": 29667, "loss": 0.3465, "lr": 2.581679114563723e-05, "epoch": 2.7819233321745727, "percentage": 92.73, "elapsed_time": "3 days, 9:26:41", "remaining_time": "6:23:09", "throughput": 27539.72, "total_tokens": 8074686976} +{"current_steps": 27520, "total_steps": 29667, "loss": 0.349, "lr": 2.5813350420721488e-05, "epoch": 2.7829346142906806, "percentage": 92.76, "elapsed_time": "3 days, 9:28:40", "remaining_time": "6:21:23", "throughput": 27538.62, "total_tokens": 8077630720} +{"current_steps": 27530, "total_steps": 29667, "loss": 0.3504, "lr": 2.5809911071123834e-05, "epoch": 2.783945896406788, "percentage": 92.8, "elapsed_time": "3 days, 9:30:48", "remaining_time": "6:19:38", "throughput": 27536.61, "total_tokens": 8080577792} +{"current_steps": 27540, "total_steps": 29667, "loss": 0.3436, "lr": 2.5806473095928274e-05, "epoch": 2.784957178522896, "percentage": 92.83, "elapsed_time": "3 days, 9:32:49", "remaining_time": "6:17:53", "throughput": 27535.48, "total_tokens": 8083564160} +{"current_steps": 27550, "total_steps": 29667, "loss": 0.3478, "lr": 2.5803036494219678e-05, "epoch": 2.785968460639004, "percentage": 92.86, "elapsed_time": "3 days, 9:34:43", "remaining_time": "6:16:07", "throughput": 27534.93, "total_tokens": 8086553792} +{"current_steps": 
27560, "total_steps": 29667, "loss": 0.3466, "lr": 2.5799601265083767e-05, "epoch": 2.7869797427551117, "percentage": 92.9, "elapsed_time": "3 days, 9:36:40", "remaining_time": "6:14:21", "throughput": 27533.87, "total_tokens": 8089464576} +{"current_steps": 27570, "total_steps": 29667, "loss": 0.3548, "lr": 2.5796167407607113e-05, "epoch": 2.7879910248712196, "percentage": 92.93, "elapsed_time": "3 days, 9:38:39", "remaining_time": "6:12:35", "throughput": 27532.74, "total_tokens": 8092411264} +{"current_steps": 27580, "total_steps": 29667, "loss": 0.3431, "lr": 2.5792734920877138e-05, "epoch": 2.789002306987327, "percentage": 92.97, "elapsed_time": "3 days, 9:40:43", "remaining_time": "6:10:50", "throughput": 27531.13, "total_tokens": 8095361280} +{"current_steps": 27590, "total_steps": 29667, "loss": 0.3432, "lr": 2.5789303803982114e-05, "epoch": 2.7900135891034354, "percentage": 93.0, "elapsed_time": "3 days, 9:42:50", "remaining_time": "6:09:05", "throughput": 27529.12, "total_tokens": 8098266560} +{"current_steps": 27600, "total_steps": 29667, "loss": 0.3409, "lr": 2.578587405601115e-05, "epoch": 2.791024871219543, "percentage": 93.03, "elapsed_time": "3 days, 9:45:03", "remaining_time": "6:07:20", "throughput": 27526.73, "total_tokens": 8101202432} +{"current_steps": 27610, "total_steps": 29667, "loss": 0.3473, "lr": 2.5782445676054233e-05, "epoch": 2.792036153335651, "percentage": 93.07, "elapsed_time": "3 days, 9:47:10", "remaining_time": "6:05:35", "throughput": 27524.81, "total_tokens": 8104153664} +{"current_steps": 27620, "total_steps": 29667, "loss": 0.3478, "lr": 2.577901866320217e-05, "epoch": 2.7930474354517587, "percentage": 93.1, "elapsed_time": "3 days, 9:49:08", "remaining_time": "6:03:49", "throughput": 27523.78, "total_tokens": 8107087040} +{"current_steps": 27630, "total_steps": 29667, "loss": 0.3461, "lr": 2.5775593016546618e-05, "epoch": 2.7940587175678666, "percentage": 93.13, "elapsed_time": "3 days, 9:50:57", "remaining_time": 
"6:02:03", "throughput": 27523.38, "total_tokens": 8109956608} +{"current_steps": 27640, "total_steps": 29667, "loss": 0.3454, "lr": 2.5772168735180084e-05, "epoch": 2.7950699996839745, "percentage": 93.17, "elapsed_time": "3 days, 9:52:48", "remaining_time": "6:00:17", "throughput": 27522.91, "total_tokens": 8112874944} +{"current_steps": 27650, "total_steps": 29667, "loss": 0.3463, "lr": 2.5768745818195927e-05, "epoch": 2.796081281800082, "percentage": 93.2, "elapsed_time": "3 days, 9:54:38", "remaining_time": "5:58:30", "throughput": 27522.6, "total_tokens": 8115830976} +{"current_steps": 27660, "total_steps": 29667, "loss": 0.3453, "lr": 2.5765324264688327e-05, "epoch": 2.79709256391619, "percentage": 93.23, "elapsed_time": "3 days, 9:56:40", "remaining_time": "5:56:45", "throughput": 27521.26, "total_tokens": 8118780352} +{"current_steps": 27670, "total_steps": 29667, "loss": 0.3481, "lr": 2.5761904073752323e-05, "epoch": 2.798103846032298, "percentage": 93.27, "elapsed_time": "3 days, 9:58:37", "remaining_time": "5:54:59", "throughput": 27520.11, "total_tokens": 8121666176} +{"current_steps": 27680, "total_steps": 29667, "loss": 0.3424, "lr": 2.5758485244483788e-05, "epoch": 2.7991151281484057, "percentage": 93.3, "elapsed_time": "3 days, 10:00:33", "remaining_time": "5:53:13", "throughput": 27519.26, "total_tokens": 8124622080} +{"current_steps": 27690, "total_steps": 29667, "loss": 0.3466, "lr": 2.5755067775979443e-05, "epoch": 2.8001264102645136, "percentage": 93.34, "elapsed_time": "3 days, 10:02:31", "remaining_time": "5:51:27", "throughput": 27518.05, "total_tokens": 8127487104} +{"current_steps": 27700, "total_steps": 29667, "loss": 0.3483, "lr": 2.5751651667336824e-05, "epoch": 2.801137692380621, "percentage": 93.37, "elapsed_time": "3 days, 10:04:31", "remaining_time": "5:49:41", "throughput": 27516.79, "total_tokens": 8130430784} +{"current_steps": 27710, "total_steps": 29667, "loss": 0.3453, "lr": 2.5748236917654333e-05, "epoch": 
2.8021489744967294, "percentage": 93.4, "elapsed_time": "3 days, 10:06:30", "remaining_time": "5:47:55", "throughput": 27515.7, "total_tokens": 8133392384} +{"current_steps": 27720, "total_steps": 29667, "loss": 0.3466, "lr": 2.5744823526031202e-05, "epoch": 2.803160256612837, "percentage": 93.44, "elapsed_time": "3 days, 10:08:31", "remaining_time": "5:46:10", "throughput": 27514.43, "total_tokens": 8136342912} +{"current_steps": 27730, "total_steps": 29667, "loss": 0.3438, "lr": 2.5741411491567484e-05, "epoch": 2.8041715387289448, "percentage": 93.47, "elapsed_time": "3 days, 10:10:23", "remaining_time": "5:44:23", "throughput": 27513.97, "total_tokens": 8139285120} +{"current_steps": 27740, "total_steps": 29667, "loss": 0.336, "lr": 2.573800081336408e-05, "epoch": 2.8051828208450527, "percentage": 93.5, "elapsed_time": "3 days, 10:12:25", "remaining_time": "5:42:38", "throughput": 27512.58, "total_tokens": 8142233088} +{"current_steps": 27750, "total_steps": 29667, "loss": 0.3471, "lr": 2.573459149052272e-05, "epoch": 2.8061941029611606, "percentage": 93.54, "elapsed_time": "3 days, 10:14:20", "remaining_time": "5:40:52", "throughput": 27511.82, "total_tokens": 8145167616} +{"current_steps": 27760, "total_steps": 29667, "loss": 0.3443, "lr": 2.5731183522145968e-05, "epoch": 2.8072053850772685, "percentage": 93.57, "elapsed_time": "3 days, 10:16:17", "remaining_time": "5:39:06", "throughput": 27510.82, "total_tokens": 8148074304} +{"current_steps": 27770, "total_steps": 29667, "loss": 0.3472, "lr": 2.5727776907337226e-05, "epoch": 2.808216667193376, "percentage": 93.61, "elapsed_time": "3 days, 10:18:20", "remaining_time": "5:37:20", "throughput": 27509.36, "total_tokens": 8151047872} +{"current_steps": 27780, "total_steps": 29667, "loss": 0.3423, "lr": 2.5724371645200708e-05, "epoch": 2.809227949309484, "percentage": 93.64, "elapsed_time": "3 days, 10:20:15", "remaining_time": "5:35:34", "throughput": 27508.6, "total_tokens": 8153985216} +{"current_steps": 
27790, "total_steps": 29667, "loss": 0.3457, "lr": 2.572096773484147e-05, "epoch": 2.8102392314255917, "percentage": 93.67, "elapsed_time": "3 days, 10:22:05", "remaining_time": "5:33:48", "throughput": 27508.16, "total_tokens": 8156881024} +{"current_steps": 27800, "total_steps": 29667, "loss": 0.3482, "lr": 2.5717565175365416e-05, "epoch": 2.8112505135416996, "percentage": 93.71, "elapsed_time": "3 days, 10:24:02", "remaining_time": "5:32:02", "throughput": 27507.36, "total_tokens": 8159860928} +{"current_steps": 27810, "total_steps": 29667, "loss": 0.3463, "lr": 2.571416396587924e-05, "epoch": 2.8122617956578075, "percentage": 93.74, "elapsed_time": "3 days, 10:25:54", "remaining_time": "5:30:15", "throughput": 27506.92, "total_tokens": 8162814656} +{"current_steps": 27820, "total_steps": 29667, "loss": 0.3491, "lr": 2.5710764105490486e-05, "epoch": 2.813273077773915, "percentage": 93.77, "elapsed_time": "3 days, 10:27:47", "remaining_time": "5:28:29", "throughput": 27506.4, "total_tokens": 8165769664} +{"current_steps": 27830, "total_steps": 29667, "loss": 0.345, "lr": 2.570736559330752e-05, "epoch": 2.8142843598900233, "percentage": 93.81, "elapsed_time": "3 days, 10:29:46", "remaining_time": "5:26:43", "throughput": 27505.41, "total_tokens": 8168733440} +{"current_steps": 27840, "total_steps": 29667, "loss": 0.3489, "lr": 2.570396842843953e-05, "epoch": 2.815295642006131, "percentage": 93.84, "elapsed_time": "3 days, 10:31:39", "remaining_time": "5:24:57", "throughput": 27504.82, "total_tokens": 8171675200} +{"current_steps": 27850, "total_steps": 29667, "loss": 0.3447, "lr": 2.5700572609996526e-05, "epoch": 2.8163069241222387, "percentage": 93.88, "elapsed_time": "3 days, 10:33:42", "remaining_time": "5:23:11", "throughput": 27503.29, "total_tokens": 8174590912} +{"current_steps": 27860, "total_steps": 29667, "loss": 0.3519, "lr": 2.5697178137089357e-05, "epoch": 2.8173182062383466, "percentage": 93.91, "elapsed_time": "3 days, 10:35:37", "remaining_time": 
"5:21:25", "throughput": 27502.33, "total_tokens": 8177470912} +{"current_steps": 27870, "total_steps": 29667, "loss": 0.3444, "lr": 2.569378500882966e-05, "epoch": 2.8183294883544545, "percentage": 93.94, "elapsed_time": "3 days, 10:37:20", "remaining_time": "5:19:38", "throughput": 27502.41, "total_tokens": 8180325248} +{"current_steps": 27880, "total_steps": 29667, "loss": 0.3468, "lr": 2.569039322432994e-05, "epoch": 2.8193407704705624, "percentage": 93.98, "elapsed_time": "3 days, 10:38:59", "remaining_time": "5:17:51", "throughput": 27502.83, "total_tokens": 8183188288} +{"current_steps": 27890, "total_steps": 29667, "loss": 0.3448, "lr": 2.5687002782703474e-05, "epoch": 2.82035205258667, "percentage": 94.01, "elapsed_time": "3 days, 10:40:48", "remaining_time": "5:16:04", "throughput": 27502.58, "total_tokens": 8186101824} +{"current_steps": 27900, "total_steps": 29667, "loss": 0.3499, "lr": 2.568361368306439e-05, "epoch": 2.821363334702778, "percentage": 94.04, "elapsed_time": "3 days, 10:42:40", "remaining_time": "5:14:18", "throughput": 27502.08, "total_tokens": 8189029376} +{"current_steps": 27910, "total_steps": 29667, "loss": 0.3472, "lr": 2.5680225924527623e-05, "epoch": 2.8223746168188857, "percentage": 94.08, "elapsed_time": "3 days, 10:44:29", "remaining_time": "5:12:31", "throughput": 27501.89, "total_tokens": 8191961792} +{"current_steps": 27920, "total_steps": 29667, "loss": 0.3424, "lr": 2.5676839506208927e-05, "epoch": 2.8233858989349936, "percentage": 94.11, "elapsed_time": "3 days, 10:46:28", "remaining_time": "5:10:45", "throughput": 27500.81, "total_tokens": 8194913600} +{"current_steps": 27930, "total_steps": 29667, "loss": 0.3455, "lr": 2.567345442722487e-05, "epoch": 2.8243971810511015, "percentage": 94.15, "elapsed_time": "3 days, 10:48:16", "remaining_time": "5:08:58", "throughput": 27500.66, "total_tokens": 8197837696} +{"current_steps": 27940, "total_steps": 29667, "loss": 0.3478, "lr": 2.567007068669283e-05, "epoch": 
2.825408463167209, "percentage": 94.18, "elapsed_time": "3 days, 10:50:03", "remaining_time": "5:07:12", "throughput": 27500.44, "total_tokens": 8200730112} +{"current_steps": 27950, "total_steps": 29667, "loss": 0.3454, "lr": 2.5666688283731016e-05, "epoch": 2.826419745283317, "percentage": 94.21, "elapsed_time": "3 days, 10:51:50", "remaining_time": "5:05:25", "throughput": 27500.36, "total_tokens": 8203643392} +{"current_steps": 27960, "total_steps": 29667, "loss": 0.3452, "lr": 2.5663307217458428e-05, "epoch": 2.8274310273994248, "percentage": 94.25, "elapsed_time": "3 days, 10:53:44", "remaining_time": "5:03:39", "throughput": 27499.77, "total_tokens": 8206617216} +{"current_steps": 27970, "total_steps": 29667, "loss": 0.3476, "lr": 2.5659927486994893e-05, "epoch": 2.8284423095155327, "percentage": 94.28, "elapsed_time": "3 days, 10:55:33", "remaining_time": "5:01:52", "throughput": 27499.45, "total_tokens": 8209503744} +{"current_steps": 27980, "total_steps": 29667, "loss": 0.3512, "lr": 2.565654909146105e-05, "epoch": 2.8294535916316406, "percentage": 94.31, "elapsed_time": "3 days, 10:57:23", "remaining_time": "5:00:06", "throughput": 27498.91, "total_tokens": 8212363648} +{"current_steps": 27990, "total_steps": 29667, "loss": 0.3497, "lr": 2.5653172029978346e-05, "epoch": 2.8304648737477485, "percentage": 94.35, "elapsed_time": "3 days, 10:59:10", "remaining_time": "4:58:19", "throughput": 27498.74, "total_tokens": 8215252096} +{"current_steps": 28000, "total_steps": 29667, "loss": 0.3447, "lr": 2.5649796301669014e-05, "epoch": 2.8314761558638564, "percentage": 94.38, "elapsed_time": "3 days, 11:01:01", "remaining_time": "4:56:32", "throughput": 27498.41, "total_tokens": 8218225024} +{"current_steps": 28010, "total_steps": 29667, "loss": 0.3502, "lr": 2.5646421905656148e-05, "epoch": 2.832487437979964, "percentage": 94.41, "elapsed_time": "3 days, 11:02:54", "remaining_time": "4:54:46", "throughput": 27497.84, "total_tokens": 8221140992} +{"current_steps": 
28020, "total_steps": 29667, "loss": 0.3444, "lr": 2.5643048841063587e-05, "epoch": 2.8334987200960717, "percentage": 94.45, "elapsed_time": "3 days, 11:04:45", "remaining_time": "4:53:00", "throughput": 27497.5, "total_tokens": 8224114240} +{"current_steps": 28030, "total_steps": 29667, "loss": 0.3456, "lr": 2.563967710701603e-05, "epoch": 2.8345100022121796, "percentage": 94.48, "elapsed_time": "3 days, 11:06:36", "remaining_time": "4:51:13", "throughput": 27497.2, "total_tokens": 8227060224} +{"current_steps": 28040, "total_steps": 29667, "loss": 0.3447, "lr": 2.5636306702638946e-05, "epoch": 2.8355212843282875, "percentage": 94.52, "elapsed_time": "3 days, 11:08:24", "remaining_time": "4:49:26", "throughput": 27497.06, "total_tokens": 8229980288} +{"current_steps": 28050, "total_steps": 29667, "loss": 0.3478, "lr": 2.5632937627058624e-05, "epoch": 2.8365325664443954, "percentage": 94.55, "elapsed_time": "3 days, 11:10:08", "remaining_time": "4:47:40", "throughput": 27497.13, "total_tokens": 8232876352} +{"current_steps": 28060, "total_steps": 29667, "loss": 0.3474, "lr": 2.562956987940216e-05, "epoch": 2.837543848560503, "percentage": 94.58, "elapsed_time": "3 days, 11:11:55", "remaining_time": "4:45:53", "throughput": 27497.06, "total_tokens": 8235797184} +{"current_steps": 28070, "total_steps": 29667, "loss": 0.3469, "lr": 2.5626203458797432e-05, "epoch": 2.838555130676611, "percentage": 94.62, "elapsed_time": "3 days, 11:13:42", "remaining_time": "4:44:06", "throughput": 27497.04, "total_tokens": 8238723520} +{"current_steps": 28080, "total_steps": 29667, "loss": 0.3444, "lr": 2.562283836437315e-05, "epoch": 2.8395664127927187, "percentage": 94.65, "elapsed_time": "3 days, 11:15:31", "remaining_time": "4:42:19", "throughput": 27496.87, "total_tokens": 8241676096} +{"current_steps": 28090, "total_steps": 29667, "loss": 0.3479, "lr": 2.561947459525879e-05, "epoch": 2.8405776949088266, "percentage": 94.68, "elapsed_time": "3 days, 11:17:17", "remaining_time": 
"4:40:33", "throughput": 27496.84, "total_tokens": 8244572992} +{"current_steps": 28100, "total_steps": 29667, "loss": 0.3498, "lr": 2.561611215058466e-05, "epoch": 2.8415889770249345, "percentage": 94.72, "elapsed_time": "3 days, 11:19:17", "remaining_time": "4:38:47", "throughput": 27495.7, "total_tokens": 8247540928} +{"current_steps": 28110, "total_steps": 29667, "loss": 0.3412, "lr": 2.5612751029481845e-05, "epoch": 2.8426002591410424, "percentage": 94.75, "elapsed_time": "3 days, 11:21:07", "remaining_time": "4:37:00", "throughput": 27495.34, "total_tokens": 8250455104} +{"current_steps": 28120, "total_steps": 29667, "loss": 0.3459, "lr": 2.560939123108225e-05, "epoch": 2.8436115412571503, "percentage": 94.79, "elapsed_time": "3 days, 11:22:59", "remaining_time": "4:35:14", "throughput": 27495.0, "total_tokens": 8253437760} +{"current_steps": 28130, "total_steps": 29667, "loss": 0.3459, "lr": 2.560603275451855e-05, "epoch": 2.844622823373258, "percentage": 94.82, "elapsed_time": "3 days, 11:24:49", "remaining_time": "4:33:27", "throughput": 27494.61, "total_tokens": 8256344576} +{"current_steps": 28140, "total_steps": 29667, "loss": 0.3496, "lr": 2.5602675598924227e-05, "epoch": 2.8456341054893657, "percentage": 94.85, "elapsed_time": "3 days, 11:26:35", "remaining_time": "4:31:40", "throughput": 27494.61, "total_tokens": 8259246592} +{"current_steps": 28150, "total_steps": 29667, "loss": 0.348, "lr": 2.5599319763433566e-05, "epoch": 2.8466453876054736, "percentage": 94.89, "elapsed_time": "3 days, 11:28:22", "remaining_time": "4:29:54", "throughput": 27494.57, "total_tokens": 8262197632} +{"current_steps": 28160, "total_steps": 29667, "loss": 0.3462, "lr": 2.559596524718164e-05, "epoch": 2.8476566697215815, "percentage": 94.92, "elapsed_time": "3 days, 11:30:12", "remaining_time": "4:28:07", "throughput": 27494.28, "total_tokens": 8265115520} +{"current_steps": 28170, "total_steps": 29667, "loss": 0.3439, "lr": 2.559261204930431e-05, "epoch": 
2.8486679518376894, "percentage": 94.95, "elapsed_time": "3 days, 11:32:03", "remaining_time": "4:26:20", "throughput": 27493.92, "total_tokens": 8268059584} +{"current_steps": 28180, "total_steps": 29667, "loss": 0.3478, "lr": 2.558926016893824e-05, "epoch": 2.849679233953797, "percentage": 94.99, "elapsed_time": "3 days, 11:33:49", "remaining_time": "4:24:34", "throughput": 27494.01, "total_tokens": 8271018304} +{"current_steps": 28190, "total_steps": 29667, "loss": 0.349, "lr": 2.5585909605220877e-05, "epoch": 2.8506905160699048, "percentage": 95.02, "elapsed_time": "3 days, 11:35:34", "remaining_time": "4:22:47", "throughput": 27493.99, "total_tokens": 8273903808} +{"current_steps": 28200, "total_steps": 29667, "loss": 0.3486, "lr": 2.558256035729046e-05, "epoch": 2.8517017981860127, "percentage": 95.06, "elapsed_time": "3 days, 11:37:26", "remaining_time": "4:21:00", "throughput": 27493.52, "total_tokens": 8276829824} +{"current_steps": 28210, "total_steps": 29667, "loss": 0.3482, "lr": 2.557921242428602e-05, "epoch": 2.8527130803021206, "percentage": 95.09, "elapsed_time": "3 days, 11:39:14", "remaining_time": "4:19:14", "throughput": 27493.29, "total_tokens": 8279725760} +{"current_steps": 28220, "total_steps": 29667, "loss": 0.3507, "lr": 2.557586580534737e-05, "epoch": 2.8537243624182285, "percentage": 95.12, "elapsed_time": "3 days, 11:41:07", "remaining_time": "4:17:27", "throughput": 27492.87, "total_tokens": 8282705984} +{"current_steps": 28230, "total_steps": 29667, "loss": 0.3471, "lr": 2.5572520499615127e-05, "epoch": 2.854735644534336, "percentage": 95.16, "elapsed_time": "3 days, 11:43:00", "remaining_time": "4:15:41", "throughput": 27492.29, "total_tokens": 8285630848} +{"current_steps": 28240, "total_steps": 29667, "loss": 0.3484, "lr": 2.5569176506230667e-05, "epoch": 2.8557469266504443, "percentage": 95.19, "elapsed_time": "3 days, 11:45:09", "remaining_time": "4:13:55", "throughput": 27490.22, "total_tokens": 8288569792} +{"current_steps": 
28250, "total_steps": 29667, "loss": 0.3499, "lr": 2.5565833824336183e-05, "epoch": 2.8567582087665517, "percentage": 95.22, "elapsed_time": "3 days, 11:47:05", "remaining_time": "4:12:09", "throughput": 27489.43, "total_tokens": 8291512256} +{"current_steps": 28260, "total_steps": 29667, "loss": 0.3464, "lr": 2.5562492453074633e-05, "epoch": 2.8577694908826596, "percentage": 95.26, "elapsed_time": "3 days, 11:49:07", "remaining_time": "4:10:23", "throughput": 27488.24, "total_tokens": 8294510528} +{"current_steps": 28270, "total_steps": 29667, "loss": 0.3501, "lr": 2.555915239158976e-05, "epoch": 2.8587807729987675, "percentage": 95.29, "elapsed_time": "3 days, 11:50:58", "remaining_time": "4:08:36", "throughput": 27487.75, "total_tokens": 8297405760} +{"current_steps": 28280, "total_steps": 29667, "loss": 0.3541, "lr": 2.5555813639026093e-05, "epoch": 2.8597920551148754, "percentage": 95.32, "elapsed_time": "3 days, 11:52:44", "remaining_time": "4:06:49", "throughput": 27487.71, "total_tokens": 8300316160} +{"current_steps": 28290, "total_steps": 29667, "loss": 0.3462, "lr": 2.5552476194528947e-05, "epoch": 2.8608033372309833, "percentage": 95.36, "elapsed_time": "3 days, 11:54:30", "remaining_time": "4:05:03", "throughput": 27487.76, "total_tokens": 8303244096} +{"current_steps": 28300, "total_steps": 29667, "loss": 0.344, "lr": 2.5549140057244413e-05, "epoch": 2.861814619347091, "percentage": 95.39, "elapsed_time": "3 days, 11:56:24", "remaining_time": "4:03:16", "throughput": 27487.08, "total_tokens": 8306170816} +{"current_steps": 28310, "total_steps": 29667, "loss": 0.347, "lr": 2.5545805226319362e-05, "epoch": 2.8628259014631987, "percentage": 95.43, "elapsed_time": "3 days, 11:58:11", "remaining_time": "4:01:29", "throughput": 27487.04, "total_tokens": 8309094848} +{"current_steps": 28320, "total_steps": 29667, "loss": 0.347, "lr": 2.5542471700901453e-05, "epoch": 2.8638371835793066, "percentage": 95.46, "elapsed_time": "3 days, 12:00:06", 
"remaining_time": "3:59:43", "throughput": 27486.06, "total_tokens": 8311975296} +{"current_steps": 28330, "total_steps": 29667, "loss": 0.347, "lr": 2.5539139480139113e-05, "epoch": 2.8648484656954145, "percentage": 95.49, "elapsed_time": "3 days, 12:01:56", "remaining_time": "3:57:56", "throughput": 27485.76, "total_tokens": 8314884736} +{"current_steps": 28340, "total_steps": 29667, "loss": 0.3461, "lr": 2.5535808563181546e-05, "epoch": 2.8658597478115224, "percentage": 95.53, "elapsed_time": "3 days, 12:03:49", "remaining_time": "3:56:10", "throughput": 27485.23, "total_tokens": 8317839424} +{"current_steps": 28350, "total_steps": 29667, "loss": 0.3479, "lr": 2.553247894917874e-05, "epoch": 2.86687102992763, "percentage": 95.56, "elapsed_time": "3 days, 12:05:39", "remaining_time": "3:54:23", "throughput": 27484.78, "total_tokens": 8320728192} +{"current_steps": 28360, "total_steps": 29667, "loss": 0.3479, "lr": 2.5529150637281453e-05, "epoch": 2.8678823120437382, "percentage": 95.59, "elapsed_time": "3 days, 12:07:27", "remaining_time": "3:52:37", "throughput": 27484.61, "total_tokens": 8323644864} +{"current_steps": 28370, "total_steps": 29667, "loss": 0.3445, "lr": 2.552582362664122e-05, "epoch": 2.8688935941598457, "percentage": 95.63, "elapsed_time": "3 days, 12:09:18", "remaining_time": "3:50:50", "throughput": 27484.37, "total_tokens": 8326616128} +{"current_steps": 28380, "total_steps": 29667, "loss": 0.3425, "lr": 2.5522497916410353e-05, "epoch": 2.8699048762759536, "percentage": 95.66, "elapsed_time": "3 days, 12:11:11", "remaining_time": "3:49:03", "throughput": 27483.76, "total_tokens": 8329552000} +{"current_steps": 28390, "total_steps": 29667, "loss": 0.345, "lr": 2.5519173505741933e-05, "epoch": 2.8709161583920615, "percentage": 95.7, "elapsed_time": "3 days, 12:13:00", "remaining_time": "3:47:17", "throughput": 27483.65, "total_tokens": 8332513664} +{"current_steps": 28400, "total_steps": 29667, "loss": 0.3448, "lr": 2.551585039378981e-05, 
"epoch": 2.8719274405081694, "percentage": 95.73, "elapsed_time": "3 days, 12:14:51", "remaining_time": "3:45:30", "throughput": 27483.23, "total_tokens": 8335440384} +{"current_steps": 28410, "total_steps": 29667, "loss": 0.3448, "lr": 2.551252857970861e-05, "epoch": 2.8729387226242773, "percentage": 95.76, "elapsed_time": "3 days, 12:16:45", "remaining_time": "3:43:44", "throughput": 27482.8, "total_tokens": 8338419456} +{"current_steps": 28420, "total_steps": 29667, "loss": 0.3448, "lr": 2.5509208062653734e-05, "epoch": 2.8739500047403848, "percentage": 95.8, "elapsed_time": "3 days, 12:18:37", "remaining_time": "3:41:57", "throughput": 27482.34, "total_tokens": 8341363584} +{"current_steps": 28430, "total_steps": 29667, "loss": 0.3447, "lr": 2.5505888841781333e-05, "epoch": 2.8749612868564927, "percentage": 95.83, "elapsed_time": "3 days, 12:20:24", "remaining_time": "3:40:10", "throughput": 27482.39, "total_tokens": 8344313088} +{"current_steps": 28440, "total_steps": 29667, "loss": 0.346, "lr": 2.5502570916248353e-05, "epoch": 2.8759725689726006, "percentage": 95.86, "elapsed_time": "3 days, 12:22:16", "remaining_time": "3:38:24", "throughput": 27481.84, "total_tokens": 8347239936} +{"current_steps": 28450, "total_steps": 29667, "loss": 0.3474, "lr": 2.5499254285212486e-05, "epoch": 2.8769838510887085, "percentage": 95.9, "elapsed_time": "3 days, 12:24:14", "remaining_time": "3:36:37", "throughput": 27480.72, "total_tokens": 8350151232} +{"current_steps": 28460, "total_steps": 29667, "loss": 0.3451, "lr": 2.5495938947832204e-05, "epoch": 2.8779951332048164, "percentage": 95.93, "elapsed_time": "3 days, 12:26:12", "remaining_time": "3:34:51", "throughput": 27479.71, "total_tokens": 8353074944} +{"current_steps": 28470, "total_steps": 29667, "loss": 0.3479, "lr": 2.5492624903266732e-05, "epoch": 2.879006415320924, "percentage": 95.97, "elapsed_time": "3 days, 12:28:03", "remaining_time": "3:33:04", "throughput": 27479.13, "total_tokens": 8355945728} 
+{"current_steps": 28480, "total_steps": 29667, "loss": 0.3446, "lr": 2.548931215067607e-05, "epoch": 2.8800176974370317, "percentage": 96.0, "elapsed_time": "3 days, 12:29:55", "remaining_time": "3:31:18", "throughput": 27478.76, "total_tokens": 8358908928} +{"current_steps": 28490, "total_steps": 29667, "loss": 0.346, "lr": 2.5486000689220985e-05, "epoch": 2.8810289795531396, "percentage": 96.03, "elapsed_time": "3 days, 12:31:48", "remaining_time": "3:29:31", "throughput": 27478.3, "total_tokens": 8361888896} +{"current_steps": 28500, "total_steps": 29667, "loss": 0.3481, "lr": 2.5482690518062994e-05, "epoch": 2.8820402616692475, "percentage": 96.07, "elapsed_time": "3 days, 12:33:33", "remaining_time": "3:27:44", "throughput": 27478.29, "total_tokens": 8364768192} +{"current_steps": 28510, "total_steps": 29667, "loss": 0.3508, "lr": 2.547938163636439e-05, "epoch": 2.8830515437853554, "percentage": 96.1, "elapsed_time": "3 days, 12:35:22", "remaining_time": "3:25:58", "throughput": 27478.14, "total_tokens": 8367698560} +{"current_steps": 28520, "total_steps": 29667, "loss": 0.3485, "lr": 2.5476074043288212e-05, "epoch": 2.8840628259014633, "percentage": 96.13, "elapsed_time": "3 days, 12:37:07", "remaining_time": "3:24:11", "throughput": 27478.17, "total_tokens": 8370602240} +{"current_steps": 28530, "total_steps": 29667, "loss": 0.3413, "lr": 2.547276773799827e-05, "epoch": 2.8850741080175712, "percentage": 96.17, "elapsed_time": "3 days, 12:38:52", "remaining_time": "3:22:24", "throughput": 27478.51, "total_tokens": 8373582400} +{"current_steps": 28540, "total_steps": 29667, "loss": 0.3449, "lr": 2.5469462719659138e-05, "epoch": 2.8860853901336787, "percentage": 96.2, "elapsed_time": "3 days, 12:40:44", "remaining_time": "3:20:37", "throughput": 27478.05, "total_tokens": 8376518912} +{"current_steps": 28550, "total_steps": 29667, "loss": 0.3472, "lr": 2.5466158987436135e-05, "epoch": 2.8870966722497866, "percentage": 96.23, "elapsed_time": "3 days, 12:42:34", 
"remaining_time": "3:18:51", "throughput": 27477.64, "total_tokens": 8379431488} +{"current_steps": 28560, "total_steps": 29667, "loss": 0.3451, "lr": 2.5462856540495345e-05, "epoch": 2.8881079543658945, "percentage": 96.27, "elapsed_time": "3 days, 12:44:24", "remaining_time": "3:17:04", "throughput": 27477.35, "total_tokens": 8382378944} +{"current_steps": 28570, "total_steps": 29667, "loss": 0.3452, "lr": 2.5459555378003607e-05, "epoch": 2.8891192364820024, "percentage": 96.3, "elapsed_time": "3 days, 12:46:09", "remaining_time": "3:15:17", "throughput": 27477.59, "total_tokens": 8385308800} +{"current_steps": 28580, "total_steps": 29667, "loss": 0.3456, "lr": 2.545625549912853e-05, "epoch": 2.8901305185981103, "percentage": 96.34, "elapsed_time": "3 days, 12:47:53", "remaining_time": "3:13:30", "throughput": 27477.61, "total_tokens": 8388186944} +{"current_steps": 28590, "total_steps": 29667, "loss": 0.3446, "lr": 2.5452956903038445e-05, "epoch": 2.891141800714218, "percentage": 96.37, "elapsed_time": "3 days, 12:49:39", "remaining_time": "3:11:43", "throughput": 27477.64, "total_tokens": 8391120960} +{"current_steps": 28600, "total_steps": 29667, "loss": 0.3455, "lr": 2.5449659588902468e-05, "epoch": 2.8921530828303257, "percentage": 96.4, "elapsed_time": "3 days, 12:51:31", "remaining_time": "3:09:57", "throughput": 27477.32, "total_tokens": 8394084032} +{"current_steps": 28610, "total_steps": 29667, "loss": 0.3476, "lr": 2.5446363555890464e-05, "epoch": 2.8931643649464336, "percentage": 96.44, "elapsed_time": "3 days, 12:53:18", "remaining_time": "3:08:10", "throughput": 27477.26, "total_tokens": 8397009088} +{"current_steps": 28620, "total_steps": 29667, "loss": 0.3459, "lr": 2.5443068803173025e-05, "epoch": 2.8941756470625415, "percentage": 96.47, "elapsed_time": "3 days, 12:55:09", "remaining_time": "3:06:23", "throughput": 27476.84, "total_tokens": 8399929472} +{"current_steps": 28630, "total_steps": 29667, "loss": 0.3427, "lr": 2.5439775329921533e-05, 
"epoch": 2.8951869291786494, "percentage": 96.5, "elapsed_time": "3 days, 12:57:03", "remaining_time": "3:04:37", "throughput": 27476.32, "total_tokens": 8402897408} +{"current_steps": 28640, "total_steps": 29667, "loss": 0.3413, "lr": 2.5436483135308092e-05, "epoch": 2.8961982112947573, "percentage": 96.54, "elapsed_time": "3 days, 12:58:58", "remaining_time": "3:02:50", "throughput": 27475.63, "total_tokens": 8405858816} +{"current_steps": 28650, "total_steps": 29667, "loss": 0.344, "lr": 2.543319221850557e-05, "epoch": 2.897209493410865, "percentage": 96.57, "elapsed_time": "3 days, 13:00:52", "remaining_time": "3:01:04", "throughput": 27475.0, "total_tokens": 8408782592} +{"current_steps": 28660, "total_steps": 29667, "loss": 0.35, "lr": 2.542990257868757e-05, "epoch": 2.8982207755269727, "percentage": 96.61, "elapsed_time": "3 days, 13:02:44", "remaining_time": "2:59:17", "throughput": 27474.55, "total_tokens": 8411734272} +{"current_steps": 28670, "total_steps": 29667, "loss": 0.3452, "lr": 2.542661421502846e-05, "epoch": 2.8992320576430806, "percentage": 96.64, "elapsed_time": "3 days, 13:04:33", "remaining_time": "2:57:30", "throughput": 27474.37, "total_tokens": 8414684224} +{"current_steps": 28680, "total_steps": 29667, "loss": 0.3473, "lr": 2.5423327126703344e-05, "epoch": 2.9002433397591885, "percentage": 96.67, "elapsed_time": "3 days, 13:06:24", "remaining_time": "2:55:44", "throughput": 27474.12, "total_tokens": 8417659584} +{"current_steps": 28690, "total_steps": 29667, "loss": 0.3513, "lr": 2.5420041312888078e-05, "epoch": 2.9012546218752964, "percentage": 96.71, "elapsed_time": "3 days, 13:08:16", "remaining_time": "2:53:57", "throughput": 27473.56, "total_tokens": 8420552256} +{"current_steps": 28700, "total_steps": 29667, "loss": 0.3475, "lr": 2.5416756772759254e-05, "epoch": 2.9022659039914043, "percentage": 96.74, "elapsed_time": "3 days, 13:10:22", "remaining_time": "2:52:11", "throughput": 27472.14, "total_tokens": 8423567168} 
+{"current_steps": 28710, "total_steps": 29667, "loss": 0.348, "lr": 2.5413473505494222e-05, "epoch": 2.9032771861075117, "percentage": 96.77, "elapsed_time": "3 days, 13:12:11", "remaining_time": "2:50:24", "throughput": 27472.0, "total_tokens": 8426530176} +{"current_steps": 28720, "total_steps": 29667, "loss": 0.3456, "lr": 2.5410191510271063e-05, "epoch": 2.9042884682236196, "percentage": 96.81, "elapsed_time": "3 days, 13:14:00", "remaining_time": "2:48:37", "throughput": 27472.01, "total_tokens": 8429524096} +{"current_steps": 28730, "total_steps": 29667, "loss": 0.3435, "lr": 2.5406910786268613e-05, "epoch": 2.9052997503397275, "percentage": 96.84, "elapsed_time": "3 days, 13:15:48", "remaining_time": "2:46:50", "throughput": 27472.04, "total_tokens": 8432510912} +{"current_steps": 28740, "total_steps": 29667, "loss": 0.3465, "lr": 2.5403631332666444e-05, "epoch": 2.9063110324558354, "percentage": 96.88, "elapsed_time": "3 days, 13:17:36", "remaining_time": "2:45:04", "throughput": 27471.93, "total_tokens": 8435442624} +{"current_steps": 28750, "total_steps": 29667, "loss": 0.3495, "lr": 2.5400353148644863e-05, "epoch": 2.9073223145719433, "percentage": 96.91, "elapsed_time": "3 days, 13:19:23", "remaining_time": "2:43:17", "throughput": 27471.87, "total_tokens": 8438352256} +{"current_steps": 28760, "total_steps": 29667, "loss": 0.3444, "lr": 2.5397076233384925e-05, "epoch": 2.908333596688051, "percentage": 96.94, "elapsed_time": "3 days, 13:21:08", "remaining_time": "2:41:30", "throughput": 27471.98, "total_tokens": 8441280704} +{"current_steps": 28770, "total_steps": 29667, "loss": 0.3493, "lr": 2.539380058606843e-05, "epoch": 2.909344878804159, "percentage": 96.98, "elapsed_time": "3 days, 13:22:55", "remaining_time": "2:39:43", "throughput": 27471.96, "total_tokens": 8444219264} +{"current_steps": 28780, "total_steps": 29667, "loss": 0.3445, "lr": 2.5390526205877895e-05, "epoch": 2.9103561609202666, "percentage": 97.01, "elapsed_time": "3 days, 
13:24:43", "remaining_time": "2:37:56", "throughput": 27471.88, "total_tokens": 8447137600} +{"current_steps": 28790, "total_steps": 29667, "loss": 0.3445, "lr": 2.53872530919966e-05, "epoch": 2.9113674430363745, "percentage": 97.04, "elapsed_time": "3 days, 13:26:29", "remaining_time": "2:36:09", "throughput": 27471.84, "total_tokens": 8450062016} +{"current_steps": 28800, "total_steps": 29667, "loss": 0.3427, "lr": 2.5383981243608547e-05, "epoch": 2.9123787251524824, "percentage": 97.08, "elapsed_time": "3 days, 13:28:17", "remaining_time": "2:34:22", "throughput": 27471.8, "total_tokens": 8453018240} +{"current_steps": 28810, "total_steps": 29667, "loss": 0.3443, "lr": 2.5380710659898476e-05, "epoch": 2.9133900072685903, "percentage": 97.11, "elapsed_time": "3 days, 13:30:03", "remaining_time": "2:32:36", "throughput": 27471.81, "total_tokens": 8455925952} +{"current_steps": 28820, "total_steps": 29667, "loss": 0.3436, "lr": 2.537744134005187e-05, "epoch": 2.9144012893846982, "percentage": 97.14, "elapsed_time": "3 days, 13:31:49", "remaining_time": "2:30:49", "throughput": 27471.89, "total_tokens": 8458850112} +{"current_steps": 28830, "total_steps": 29667, "loss": 0.3427, "lr": 2.537417328325493e-05, "epoch": 2.9154125715008057, "percentage": 97.18, "elapsed_time": "3 days, 13:33:40", "remaining_time": "2:29:02", "throughput": 27471.66, "total_tokens": 8461833600} +{"current_steps": 28840, "total_steps": 29667, "loss": 0.354, "lr": 2.5370906488694606e-05, "epoch": 2.9164238536169136, "percentage": 97.21, "elapsed_time": "3 days, 13:35:25", "remaining_time": "2:27:15", "throughput": 27471.8, "total_tokens": 8464754496} +{"current_steps": 28850, "total_steps": 29667, "loss": 0.3521, "lr": 2.536764095555857e-05, "epoch": 2.9174351357330215, "percentage": 97.25, "elapsed_time": "3 days, 13:37:12", "remaining_time": "2:25:28", "throughput": 27471.8, "total_tokens": 8467697088} +{"current_steps": 28860, "total_steps": 29667, "loss": 0.3457, "lr": 
2.536437668303524e-05, "epoch": 2.9184464178491294, "percentage": 97.28, "elapsed_time": "3 days, 13:39:03", "remaining_time": "2:23:42", "throughput": 27471.46, "total_tokens": 8470642816} +{"current_steps": 28870, "total_steps": 29667, "loss": 0.3476, "lr": 2.5361113670313745e-05, "epoch": 2.9194576999652373, "percentage": 97.31, "elapsed_time": "3 days, 13:40:50", "remaining_time": "2:21:55", "throughput": 27471.38, "total_tokens": 8473550336} +{"current_steps": 28880, "total_steps": 29667, "loss": 0.3473, "lr": 2.5357851916583964e-05, "epoch": 2.9204689820813448, "percentage": 97.35, "elapsed_time": "3 days, 13:42:40", "remaining_time": "2:20:08", "throughput": 27470.94, "total_tokens": 8476460480} +{"current_steps": 28890, "total_steps": 29667, "loss": 0.3503, "lr": 2.5354591421036485e-05, "epoch": 2.921480264197453, "percentage": 97.38, "elapsed_time": "3 days, 13:44:26", "remaining_time": "2:18:21", "throughput": 27470.98, "total_tokens": 8479365888} +{"current_steps": 28900, "total_steps": 29667, "loss": 0.3436, "lr": 2.5351332182862643e-05, "epoch": 2.9224915463135606, "percentage": 97.41, "elapsed_time": "3 days, 13:46:17", "remaining_time": "2:16:34", "throughput": 27470.77, "total_tokens": 8482357504} +{"current_steps": 28910, "total_steps": 29667, "loss": 0.3415, "lr": 2.5348074201254484e-05, "epoch": 2.9235028284296685, "percentage": 97.45, "elapsed_time": "3 days, 13:48:06", "remaining_time": "2:14:48", "throughput": 27470.56, "total_tokens": 8485273088} +{"current_steps": 28920, "total_steps": 29667, "loss": 0.3495, "lr": 2.53448174754048e-05, "epoch": 2.9245141105457764, "percentage": 97.48, "elapsed_time": "3 days, 13:49:49", "remaining_time": "2:13:01", "throughput": 27470.84, "total_tokens": 8488208576} +{"current_steps": 28930, "total_steps": 29667, "loss": 0.3462, "lr": 2.5341562004507087e-05, "epoch": 2.9255253926618843, "percentage": 97.52, "elapsed_time": "3 days, 13:51:33", "remaining_time": "2:11:14", "throughput": 27471.01, 
"total_tokens": 8491100224} +{"current_steps": 28940, "total_steps": 29667, "loss": 0.3436, "lr": 2.5338307787755583e-05, "epoch": 2.926536674777992, "percentage": 97.55, "elapsed_time": "3 days, 13:53:22", "remaining_time": "2:09:27", "throughput": 27470.91, "total_tokens": 8494064064} +{"current_steps": 28950, "total_steps": 29667, "loss": 0.3486, "lr": 2.533505482434524e-05, "epoch": 2.9275479568940996, "percentage": 97.58, "elapsed_time": "3 days, 13:55:11", "remaining_time": "2:07:40", "throughput": 27470.88, "total_tokens": 8497046528} +{"current_steps": 28960, "total_steps": 29667, "loss": 0.3465, "lr": 2.533180311347174e-05, "epoch": 2.9285592390102075, "percentage": 97.62, "elapsed_time": "3 days, 13:56:54", "remaining_time": "2:05:53", "throughput": 27471.14, "total_tokens": 8499967808} +{"current_steps": 28970, "total_steps": 29667, "loss": 0.3453, "lr": 2.532855265433149e-05, "epoch": 2.9295705211263154, "percentage": 97.65, "elapsed_time": "3 days, 13:58:42", "remaining_time": "2:04:06", "throughput": 27471.03, "total_tokens": 8502899584} +{"current_steps": 28980, "total_steps": 29667, "loss": 0.3409, "lr": 2.5325303446121602e-05, "epoch": 2.9305818032424233, "percentage": 97.68, "elapsed_time": "3 days, 14:00:47", "remaining_time": "2:02:20", "throughput": 27469.46, "total_tokens": 8505863616} +{"current_steps": 28990, "total_steps": 29667, "loss": 0.3476, "lr": 2.532205548803992e-05, "epoch": 2.9315930853585312, "percentage": 97.72, "elapsed_time": "3 days, 14:02:29", "remaining_time": "2:00:33", "throughput": 27469.86, "total_tokens": 8508775104} +{"current_steps": 29000, "total_steps": 29667, "loss": 0.3465, "lr": 2.531880877928502e-05, "epoch": 2.9326043674746387, "percentage": 97.75, "elapsed_time": "3 days, 14:04:15", "remaining_time": "1:58:46", "throughput": 27470.03, "total_tokens": 8511740352} +{"current_steps": 29010, "total_steps": 29667, "loss": 0.3407, "lr": 2.5315563319056173e-05, "epoch": 2.9336156495907466, "percentage": 97.79, 
"elapsed_time": "3 days, 14:05:57", "remaining_time": "1:56:59", "throughput": 27470.38, "total_tokens": 8514647232} +{"current_steps": 29020, "total_steps": 29667, "loss": 0.3465, "lr": 2.5312319106553384e-05, "epoch": 2.9346269317068545, "percentage": 97.82, "elapsed_time": "3 days, 14:07:46", "remaining_time": "1:55:12", "throughput": 27470.28, "total_tokens": 8517602432} +{"current_steps": 29030, "total_steps": 29667, "loss": 0.3441, "lr": 2.5309076140977378e-05, "epoch": 2.9356382138229624, "percentage": 97.85, "elapsed_time": "3 days, 14:09:39", "remaining_time": "1:53:26", "throughput": 27469.58, "total_tokens": 8520502336} +{"current_steps": 29040, "total_steps": 29667, "loss": 0.3463, "lr": 2.530583442152958e-05, "epoch": 2.9366494959390703, "percentage": 97.89, "elapsed_time": "3 days, 14:11:31", "remaining_time": "1:51:39", "throughput": 27469.32, "total_tokens": 8523483200} +{"current_steps": 29050, "total_steps": 29667, "loss": 0.3439, "lr": 2.5302593947412147e-05, "epoch": 2.9376607780551782, "percentage": 97.92, "elapsed_time": "3 days, 14:13:20", "remaining_time": "1:49:52", "throughput": 27469.22, "total_tokens": 8526464960} +{"current_steps": 29060, "total_steps": 29667, "loss": 0.3469, "lr": 2.529935471782794e-05, "epoch": 2.938672060171286, "percentage": 97.95, "elapsed_time": "3 days, 14:15:11", "remaining_time": "1:48:05", "throughput": 27468.92, "total_tokens": 8529420416} +{"current_steps": 29070, "total_steps": 29667, "loss": 0.3441, "lr": 2.5296116731980547e-05, "epoch": 2.9396833422873936, "percentage": 97.99, "elapsed_time": "3 days, 14:17:00", "remaining_time": "1:46:19", "throughput": 27468.83, "total_tokens": 8532392768} +{"current_steps": 29080, "total_steps": 29667, "loss": 0.3437, "lr": 2.529287998907426e-05, "epoch": 2.9406946244035015, "percentage": 98.02, "elapsed_time": "3 days, 14:18:44", "remaining_time": "1:44:32", "throughput": 27469.01, "total_tokens": 8535290688} +{"current_steps": 29090, "total_steps": 29667, "loss": 
0.3469, "lr": 2.528964448831408e-05, "epoch": 2.9417059065196094, "percentage": 98.06, "elapsed_time": "3 days, 14:20:59", "remaining_time": "1:42:45", "throughput": 27466.58, "total_tokens": 8538251328} +{"current_steps": 29100, "total_steps": 29667, "loss": 0.3501, "lr": 2.5286410228905727e-05, "epoch": 2.9427171886357173, "percentage": 98.09, "elapsed_time": "3 days, 14:22:52", "remaining_time": "1:40:59", "throughput": 27466.02, "total_tokens": 8541171968} +{"current_steps": 29110, "total_steps": 29667, "loss": 0.3487, "lr": 2.5283177210055632e-05, "epoch": 2.943728470751825, "percentage": 98.12, "elapsed_time": "3 days, 14:24:47", "remaining_time": "1:39:12", "throughput": 27465.37, "total_tokens": 8544136832} +{"current_steps": 29120, "total_steps": 29667, "loss": 0.3449, "lr": 2.527994543097093e-05, "epoch": 2.9447397528679327, "percentage": 98.16, "elapsed_time": "3 days, 14:26:30", "remaining_time": "1:37:25", "throughput": 27465.51, "total_tokens": 8547011968} +{"current_steps": 29130, "total_steps": 29667, "loss": 0.3432, "lr": 2.5276714890859472e-05, "epoch": 2.9457510349840406, "percentage": 98.19, "elapsed_time": "3 days, 14:28:32", "remaining_time": "1:35:38", "throughput": 27464.06, "total_tokens": 8549909312} +{"current_steps": 29140, "total_steps": 29667, "loss": 0.3433, "lr": 2.527348558892981e-05, "epoch": 2.9467623171001485, "percentage": 98.22, "elapsed_time": "3 days, 14:30:29", "remaining_time": "1:33:52", "throughput": 27463.4, "total_tokens": 8552911552} +{"current_steps": 29150, "total_steps": 29667, "loss": 0.3442, "lr": 2.5270257524391223e-05, "epoch": 2.9477735992162564, "percentage": 98.26, "elapsed_time": "3 days, 14:32:32", "remaining_time": "1:32:05", "throughput": 27462.16, "total_tokens": 8555896128} +{"current_steps": 29160, "total_steps": 29667, "loss": 0.349, "lr": 2.526703069645366e-05, "epoch": 2.9487848813323643, "percentage": 98.29, "elapsed_time": "3 days, 14:34:35", "remaining_time": "1:30:19", "throughput": 27460.82, 
"total_tokens": 8558853184} +{"current_steps": 29170, "total_steps": 29667, "loss": 0.3444, "lr": 2.5263805104327815e-05, "epoch": 2.949796163448472, "percentage": 98.32, "elapsed_time": "3 days, 14:36:29", "remaining_time": "1:28:32", "throughput": 27460.26, "total_tokens": 8561824512} +{"current_steps": 29180, "total_steps": 29667, "loss": 0.3451, "lr": 2.526058074722506e-05, "epoch": 2.95080744556458, "percentage": 98.36, "elapsed_time": "3 days, 14:38:14", "remaining_time": "1:26:45", "throughput": 27460.35, "total_tokens": 8564742976} +{"current_steps": 29190, "total_steps": 29667, "loss": 0.348, "lr": 2.5257357624357485e-05, "epoch": 2.9518187276806875, "percentage": 98.39, "elapsed_time": "3 days, 14:40:17", "remaining_time": "1:24:58", "throughput": 27458.97, "total_tokens": 8567686144} +{"current_steps": 29200, "total_steps": 29667, "loss": 0.3446, "lr": 2.525413573493788e-05, "epoch": 2.9528300097967954, "percentage": 98.43, "elapsed_time": "3 days, 14:42:00", "remaining_time": "1:23:11", "throughput": 27459.32, "total_tokens": 8570609216} +{"current_steps": 29210, "total_steps": 29667, "loss": 0.3479, "lr": 2.525091507817974e-05, "epoch": 2.9538412919129033, "percentage": 98.46, "elapsed_time": "3 days, 14:43:49", "remaining_time": "1:21:24", "throughput": 27459.3, "total_tokens": 8573595904} +{"current_steps": 29220, "total_steps": 29667, "loss": 0.3454, "lr": 2.524769565329725e-05, "epoch": 2.9548525740290112, "percentage": 98.49, "elapsed_time": "3 days, 14:45:34", "remaining_time": "1:19:38", "throughput": 27459.42, "total_tokens": 8576518656} +{"current_steps": 29230, "total_steps": 29667, "loss": 0.3493, "lr": 2.5244477459505317e-05, "epoch": 2.955863856145119, "percentage": 98.53, "elapsed_time": "3 days, 14:47:29", "remaining_time": "1:17:51", "throughput": 27458.72, "total_tokens": 8579475328} +{"current_steps": 29240, "total_steps": 29667, "loss": 0.3442, "lr": 2.524126049601953e-05, "epoch": 2.9568751382612266, "percentage": 98.56, 
"elapsed_time": "3 days, 14:49:17", "remaining_time": "1:16:04", "throughput": 27458.75, "total_tokens": 8582426688} +{"current_steps": 29250, "total_steps": 29667, "loss": 0.3458, "lr": 2.523804476205619e-05, "epoch": 2.9578864203773345, "percentage": 98.59, "elapsed_time": "3 days, 14:51:04", "remaining_time": "1:14:17", "throughput": 27458.57, "total_tokens": 8585314048} +{"current_steps": 29260, "total_steps": 29667, "loss": 0.3426, "lr": 2.5234830256832292e-05, "epoch": 2.9588977024934424, "percentage": 98.63, "elapsed_time": "3 days, 14:52:54", "remaining_time": "1:12:30", "throughput": 27458.18, "total_tokens": 8588218176} +{"current_steps": 29270, "total_steps": 29667, "loss": 0.3456, "lr": 2.523161697956552e-05, "epoch": 2.9599089846095503, "percentage": 98.66, "elapsed_time": "3 days, 14:55:03", "remaining_time": "1:10:44", "throughput": 27456.26, "total_tokens": 8591152000} +{"current_steps": 29280, "total_steps": 29667, "loss": 0.349, "lr": 2.522840492947427e-05, "epoch": 2.9609202667256582, "percentage": 98.7, "elapsed_time": "3 days, 14:56:59", "remaining_time": "1:08:57", "throughput": 27455.51, "total_tokens": 8594098880} +{"current_steps": 29290, "total_steps": 29667, "loss": 0.3449, "lr": 2.5225194105777628e-05, "epoch": 2.9619315488417657, "percentage": 98.73, "elapsed_time": "3 days, 14:58:51", "remaining_time": "1:07:10", "throughput": 27455.09, "total_tokens": 8597043136} +{"current_steps": 29300, "total_steps": 29667, "loss": 0.3419, "lr": 2.5221984507695367e-05, "epoch": 2.962942830957874, "percentage": 98.76, "elapsed_time": "3 days, 15:01:01", "remaining_time": "1:05:23", "throughput": 27452.89, "total_tokens": 8599941696} +{"current_steps": 29310, "total_steps": 29667, "loss": 0.3399, "lr": 2.5218776134447975e-05, "epoch": 2.9639541130739815, "percentage": 98.8, "elapsed_time": "3 days, 15:02:47", "remaining_time": "1:03:36", "throughput": 27452.89, "total_tokens": 8602856320} +{"current_steps": 29320, "total_steps": 29667, "loss": 
0.3462, "lr": 2.5215568985256617e-05, "epoch": 2.9649653951900894, "percentage": 98.83, "elapsed_time": "3 days, 15:04:33", "remaining_time": "1:01:49", "throughput": 27452.91, "total_tokens": 8605750272} +{"current_steps": 29330, "total_steps": 29667, "loss": 0.3456, "lr": 2.5212363059343154e-05, "epoch": 2.9659766773061973, "percentage": 98.86, "elapsed_time": "3 days, 15:06:17", "remaining_time": "1:00:02", "throughput": 27453.02, "total_tokens": 8608653952} +{"current_steps": 29340, "total_steps": 29667, "loss": 0.3488, "lr": 2.520915835593014e-05, "epoch": 2.966987959422305, "percentage": 98.9, "elapsed_time": "3 days, 15:08:06", "remaining_time": "0:58:16", "throughput": 27452.88, "total_tokens": 8611585728} +{"current_steps": 29350, "total_steps": 29667, "loss": 0.3483, "lr": 2.5205954874240828e-05, "epoch": 2.967999241538413, "percentage": 98.93, "elapsed_time": "3 days, 15:09:51", "remaining_time": "0:56:29", "throughput": 27452.91, "total_tokens": 8614496192} +{"current_steps": 29360, "total_steps": 29667, "loss": 0.3493, "lr": 2.5202752613499154e-05, "epoch": 2.9690105236545206, "percentage": 98.97, "elapsed_time": "3 days, 15:11:33", "remaining_time": "0:54:42", "throughput": 27453.42, "total_tokens": 8617441600} +{"current_steps": 29370, "total_steps": 29667, "loss": 0.3459, "lr": 2.5199551572929743e-05, "epoch": 2.9700218057706285, "percentage": 99.0, "elapsed_time": "3 days, 15:13:20", "remaining_time": "0:52:55", "throughput": 27453.41, "total_tokens": 8620379136} +{"current_steps": 29380, "total_steps": 29667, "loss": 0.3492, "lr": 2.5196351751757913e-05, "epoch": 2.9710330878867364, "percentage": 99.03, "elapsed_time": "3 days, 15:15:05", "remaining_time": "0:51:08", "throughput": 27453.65, "total_tokens": 8623332608} +{"current_steps": 29390, "total_steps": 29667, "loss": 0.3489, "lr": 2.5193153149209664e-05, "epoch": 2.9720443700028443, "percentage": 99.07, "elapsed_time": "3 days, 15:16:49", "remaining_time": "0:49:21", "throughput": 27453.88, 
"total_tokens": 8626271744} +{"current_steps": 29400, "total_steps": 29667, "loss": 0.3468, "lr": 2.5189955764511702e-05, "epoch": 2.973055652118952, "percentage": 99.1, "elapsed_time": "3 days, 15:18:32", "remaining_time": "0:47:34", "throughput": 27454.14, "total_tokens": 8629168128} +{"current_steps": 29410, "total_steps": 29667, "loss": 0.3474, "lr": 2.5186759596891398e-05, "epoch": 2.9740669342350596, "percentage": 99.13, "elapsed_time": "3 days, 15:20:31", "remaining_time": "0:45:47", "throughput": 27453.1, "total_tokens": 8632125504} +{"current_steps": 29420, "total_steps": 29667, "loss": 0.3442, "lr": 2.518356464557682e-05, "epoch": 2.975078216351168, "percentage": 99.17, "elapsed_time": "3 days, 15:22:32", "remaining_time": "0:44:00", "throughput": 27451.9, "total_tokens": 8635061696} +{"current_steps": 29430, "total_steps": 29667, "loss": 0.3479, "lr": 2.5180370909796718e-05, "epoch": 2.9760894984672754, "percentage": 99.2, "elapsed_time": "3 days, 15:24:25", "remaining_time": "0:42:14", "throughput": 27451.3, "total_tokens": 8637976448} +{"current_steps": 29440, "total_steps": 29667, "loss": 0.345, "lr": 2.5177178388780527e-05, "epoch": 2.9771007805833833, "percentage": 99.23, "elapsed_time": "3 days, 15:26:13", "remaining_time": "0:40:27", "throughput": 27451.22, "total_tokens": 8640928512} +{"current_steps": 29450, "total_steps": 29667, "loss": 0.3469, "lr": 2.5173987081758372e-05, "epoch": 2.9781120626994912, "percentage": 99.27, "elapsed_time": "3 days, 15:28:00", "remaining_time": "0:38:40", "throughput": 27451.23, "total_tokens": 8643867648} +{"current_steps": 29460, "total_steps": 29667, "loss": 0.3442, "lr": 2.5170796987961044e-05, "epoch": 2.979123344815599, "percentage": 99.3, "elapsed_time": "3 days, 15:29:41", "remaining_time": "0:36:53", "throughput": 27451.66, "total_tokens": 8646772544} +{"current_steps": 29470, "total_steps": 29667, "loss": 0.3438, "lr": 2.516760810662004e-05, "epoch": 2.980134626931707, "percentage": 99.34, 
"elapsed_time": "3 days, 15:31:30", "remaining_time": "0:35:06", "throughput": 27451.59, "total_tokens": 8649738432} +{"current_steps": 29480, "total_steps": 29667, "loss": 0.3477, "lr": 2.5164420436967517e-05, "epoch": 2.9811459090478145, "percentage": 99.37, "elapsed_time": "3 days, 15:33:17", "remaining_time": "0:33:19", "throughput": 27451.59, "total_tokens": 8652664640} +{"current_steps": 29490, "total_steps": 29667, "loss": 0.3415, "lr": 2.516123397823632e-05, "epoch": 2.9821571911639224, "percentage": 99.4, "elapsed_time": "3 days, 15:34:58", "remaining_time": "0:31:32", "throughput": 27451.96, "total_tokens": 8655560704} +{"current_steps": 29500, "total_steps": 29667, "loss": 0.3482, "lr": 2.5158048729659988e-05, "epoch": 2.9831684732800303, "percentage": 99.44, "elapsed_time": "3 days, 15:36:40", "remaining_time": "0:29:45", "throughput": 27452.3, "total_tokens": 8658469824} +{"current_steps": 29510, "total_steps": 29667, "loss": 0.3482, "lr": 2.5154864690472714e-05, "epoch": 2.9841797553961382, "percentage": 99.47, "elapsed_time": "3 days, 15:38:25", "remaining_time": "0:27:58", "throughput": 27452.4, "total_tokens": 8661390592} +{"current_steps": 29520, "total_steps": 29667, "loss": 0.3409, "lr": 2.5151681859909383e-05, "epoch": 2.985191037512246, "percentage": 99.5, "elapsed_time": "3 days, 15:40:27", "remaining_time": "0:26:11", "throughput": 27451.13, "total_tokens": 8664322688} +{"current_steps": 29530, "total_steps": 29667, "loss": 0.3454, "lr": 2.5148500237205564e-05, "epoch": 2.9862023196283536, "percentage": 99.54, "elapsed_time": "3 days, 15:42:12", "remaining_time": "0:24:24", "throughput": 27451.24, "total_tokens": 8667237376} +{"current_steps": 29540, "total_steps": 29667, "loss": 0.3412, "lr": 2.514531982159748e-05, "epoch": 2.9872136017444615, "percentage": 99.57, "elapsed_time": "3 days, 15:44:00", "remaining_time": "0:22:37", "throughput": 27451.16, "total_tokens": 8670181184} +{"current_steps": 29550, "total_steps": 29667, "loss": 
0.3491, "lr": 2.5142140612322056e-05, "epoch": 2.9882248838605694, "percentage": 99.61, "elapsed_time": "3 days, 15:45:47", "remaining_time": "0:20:50", "throughput": 27451.11, "total_tokens": 8673103936} +{"current_steps": 29560, "total_steps": 29667, "loss": 0.3493, "lr": 2.5138962608616883e-05, "epoch": 2.9892361659766773, "percentage": 99.64, "elapsed_time": "3 days, 15:47:49", "remaining_time": "0:19:04", "throughput": 27449.97, "total_tokens": 8676101376} +{"current_steps": 29570, "total_steps": 29667, "loss": 0.3426, "lr": 2.513578580972022e-05, "epoch": 2.990247448092785, "percentage": 99.67, "elapsed_time": "3 days, 15:49:32", "remaining_time": "0:17:17", "throughput": 27450.25, "total_tokens": 8679025088} +{"current_steps": 29580, "total_steps": 29667, "loss": 0.3439, "lr": 2.5132610214871e-05, "epoch": 2.991258730208893, "percentage": 99.71, "elapsed_time": "3 days, 15:51:21", "remaining_time": "0:15:30", "throughput": 27450.26, "total_tokens": 8681999424} +{"current_steps": 29590, "total_steps": 29667, "loss": 0.3475, "lr": 2.5129435823308835e-05, "epoch": 2.992270012325001, "percentage": 99.74, "elapsed_time": "3 days, 15:53:11", "remaining_time": "0:13:43", "throughput": 27450.19, "total_tokens": 8684998528} +{"current_steps": 29600, "total_steps": 29667, "loss": 0.3474, "lr": 2.5126262634274012e-05, "epoch": 2.9932812944411085, "percentage": 99.77, "elapsed_time": "3 days, 15:54:55", "remaining_time": "0:11:56", "throughput": 27450.44, "total_tokens": 8687948800} +{"current_steps": 29610, "total_steps": 29667, "loss": 0.3433, "lr": 2.512309064700748e-05, "epoch": 2.9942925765572164, "percentage": 99.81, "elapsed_time": "3 days, 15:56:40", "remaining_time": "0:10:09", "throughput": 27450.74, "total_tokens": 8690925760} +{"current_steps": 29620, "total_steps": 29667, "loss": 0.344, "lr": 2.511991986075086e-05, "epoch": 2.9953038586733243, "percentage": 99.84, "elapsed_time": "3 days, 15:58:23", "remaining_time": "0:08:22", "throughput": 27451.01, 
"total_tokens": 8693817152} +{"current_steps": 29630, "total_steps": 29667, "loss": 0.3455, "lr": 2.511675027474645e-05, "epoch": 2.996315140789432, "percentage": 99.88, "elapsed_time": "3 days, 16:00:24", "remaining_time": "0:06:35", "throughput": 27449.64, "total_tokens": 8696710336} +{"current_steps": 29640, "total_steps": 29667, "loss": 0.3538, "lr": 2.5113581888237215e-05, "epoch": 2.99732642290554, "percentage": 99.91, "elapsed_time": "3 days, 16:02:15", "remaining_time": "0:04:48", "throughput": 27449.27, "total_tokens": 8699653696} +{"current_steps": 29650, "total_steps": 29667, "loss": 0.3465, "lr": 2.5110414700466782e-05, "epoch": 2.9983377050216475, "percentage": 99.94, "elapsed_time": "3 days, 16:04:07", "remaining_time": "0:03:01", "throughput": 27449.1, "total_tokens": 8702661504} +{"current_steps": 29660, "total_steps": 29667, "loss": 0.3465, "lr": 2.5107248710679447e-05, "epoch": 2.9993489871377554, "percentage": 99.98, "elapsed_time": "3 days, 16:05:50", "remaining_time": "0:01:14", "throughput": 27449.43, "total_tokens": 8705599040} +{"current_steps": 29667, "total_steps": 29667, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "3 days, 16:11:32", "remaining_time": "0:00:00", "throughput": 27425.75, "total_tokens": 8707477248}