From 9a661f888b20a30b609b49da850a599de0bfb31e Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 1 Jun 2026 06:55:12 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: laion/exp-uns-r2egym-33_6x_glm_4_7_traces_jupiter Source: Original Platform --- .gitattributes | 56 + README.md | 61 + added_tokens.json | 28 + all_results.json | 16 + chat_template.jinja | 89 + config.json | 68 + configuration.json | 1 + generation_config.json | 12 + merges.txt | 3 + model-00001-of-00004.safetensors | 3 + model-00002-of-00004.safetensors | 3 + model-00003-of-00004.safetensors | 3 + model-00004-of-00004.safetensors | 3 + model.safetensors.index.json | 407 ++ run_summary.json | 12 + special_tokens_map.json | 31 + tokenizer.json | 3 + tokenizer_config.json | 240 + train_results.json | 12 + trainer_log.jsonl | 895 +++ trainer_state.json | 9866 ++++++++++++++++++++++++++++++ training_args.bin | 3 + training_loss.png | Bin 0 -> 41142 bytes vocab.json | 3 + 24 files changed, 11818 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 all_results.json create mode 100644 chat_template.jinja create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 merges.txt create mode 100644 model-00001-of-00004.safetensors create mode 100644 model-00002-of-00004.safetensors create mode 100644 model-00003-of-00004.safetensors create mode 100644 model-00004-of-00004.safetensors create mode 100644 model.safetensors.index.json create mode 100644 run_summary.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_loss.png create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..2bf8722 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,56 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text + + +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text + +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +vocab.json filter=lfs diff=lfs merge=lfs -text +model-00003-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +model-00004-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text +training_args.bin filter=lfs diff=lfs merge=lfs -text +merges.txt filter=lfs diff=lfs merge=lfs -text +model-00002-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +model-00001-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..4e59e04 --- /dev/null +++ b/README.md @@ -0,0 +1,61 @@ +--- +library_name: transformers +license: apache-2.0 +base_model: Qwen/Qwen3-8B +tags: +- llama-factory +- full +- generated_from_trainer +model-index: +- name: exp-uns-r2egym-33_6x_glm_4_7_traces_jupiter + results: [] +--- + + + +# exp-uns-r2egym-33_6x_glm_4_7_traces_jupiter + +This model is a fine-tuned version of [Qwen/Qwen3-8B](https://huggingface.co/Qwen/Qwen3-8B) on the /data/cat/ws/befe330h-befe330h-otagent/huggingface/hub/datasets--DCAgent--exp-uns-r2egym-33_6x_glm_4.7_traces_jupiter/snapshots/9f6fd69f6fa50425609d375c4f7198b192f4a61b_thinking_preprocessed dataset. + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 4e-05 +- train_batch_size: 1 +- eval_batch_size: 8 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 8 +- gradient_accumulation_steps: 2 +- total_train_batch_size: 16 +- total_eval_batch_size: 64 +- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.98) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 7.0 + +### Training results + + + +### Framework versions + +- Transformers 4.57.6 +- Pytorch 2.9.0+cu128 +- Datasets 4.4.1 +- Tokenizers 0.22.2 diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..b54f913 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,28 @@ +{ + "": 151668, + "": 151658, + "": 151666, + "": 151667, + "": 151657, + "": 151665, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..c09233d --- /dev/null +++ b/all_results.json @@ -0,0 +1,16 @@ +{ + "achieved_tflops_per_gpu": 112208.80647067179, + "achieved_tflops_per_gpu_theoretical": 4692081.812186509, + "epoch": 7.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21058475971221924, + "mfu_percent": 11345.6831618475, + "mfu_percent_theoretical": 474426.8768641567, + "total_flos": 2.8947179058078024e+18, + "train_loss": 0.0, + "train_runtime": 3.2247, + "train_samples_per_second": 22141.844, + "train_steps_per_second": 1384.951, + "valid_targets_mean": 4636.9, + "valid_targets_min": 581 +} \ No newline at end of file diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..01be9b3 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,89 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0].role == 'system' %} + {{- messages[0].content + '\n\n' }} + {%- endif %} + {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within XML tags:\n" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n\n\nFor each function call, return a json object with function name and arguments within XML tags:\n\n{\"name\": , \"arguments\": }\n<|im_end|>\n" }} +{%- else %} + {%- if messages[0].role == 'system' %} + {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %} +{%- for message in messages[::-1] %} + {%- set index = (messages|length - 1) - loop.index0 %} + {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('') and message.content.endswith('')) %} + {%- set ns.multi_step_tool = false %} + {%- set ns.last_query_index = index %} + {%- endif %} +{%- endfor %} +{%- for message in messages %} + {%- if message.content is string %} + {%- set content = message.content %} + {%- else %} + {%- set content = '' %} + {%- endif %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) %} + {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {%- set reasoning_content = '' %} + {%- if message.reasoning_content is string %} + {%- set reasoning_content = message.reasoning_content %} + {%- else %} + {%- if '' in content %} + {%- set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} + {%- endif %} + {%- if loop.index0 > ns.last_query_index %} + {%- if loop.last or (not loop.last and reasoning_content) %} + {{- '<|im_start|>' + message.role + '\n\n' + reasoning_content.strip('\n') + '\n\n\n' + content.lstrip('\n') }} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- if message.tool_calls %} + {%- for tool_call in message.tool_calls %} + {%- if (loop.first and content) or (not loop.first) %} + {{- '\n' }} + {%- endif %} + {%- if tool_call.function %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {%- if tool_call.arguments is string %} + {{- tool_call.arguments }} + {%- else %} + {{- tool_call.arguments | tojson }} + {%- endif %} + {{- '}\n' }} + {%- endfor %} + {%- endif %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n\n' }} + {{- content }} + {{- '\n' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} + {%- if enable_thinking is defined and enable_thinking is false %} + {{- '\n\n\n\n' }} + {%- endif %} +{%- endif %} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..59b4193 --- /dev/null +++ b/config.json @@ -0,0 +1,68 @@ +{ + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "eos_token_id": 151645, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 12288, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 36, + "model_type": "qwen3", + "num_attention_heads": 32, + "num_hidden_layers": 36, + "num_key_value_heads": 8, + "pad_token_id": 151643, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": false, + "transformers_version": "4.57.6", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..159097f --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "others", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..9adbb28 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,12 @@ +{ + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "temperature": 0.6, + "top_k": 20, + "top_p": 0.95, + "transformers_version": "4.57.6" +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model-00001-of-00004.safetensors b/model-00001-of-00004.safetensors new file mode 100644 index 0000000..3877a14 --- /dev/null +++ b/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde3830db517d17751a7249864fce3ba4285564bc14f2e3bca4423045032e973 +size 4902257696 diff --git a/model-00002-of-00004.safetensors b/model-00002-of-00004.safetensors new file mode 100644 index 0000000..544705a --- /dev/null +++ b/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ad4f7a6a40e03beb64e43f12f4c797692280dfccc7999ea6a6d4212cb49340f +size 4915960368 diff --git a/model-00003-of-00004.safetensors b/model-00003-of-00004.safetensors new file mode 100644 index 0000000..ebe1b85 --- /dev/null +++ b/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5cd8085ea96cfa58e2dfb03bfd40378266dc08dd8accebac9963f2883bcae5 +size 4983068496 diff --git a/model-00004-of-00004.safetensors b/model-00004-of-00004.safetensors new file mode 100644 index 0000000..a292543 --- /dev/null +++ b/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ff4dea9549815240c7d98c50dd6508713bca5bba9292cb272625bd32aa7929 +size 1580230264 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..ba886c0 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,407 @@ +{ + "metadata": { + "total_parameters": 308224, + "total_size": 16381470720 + }, + "weight_map": { + "lm_head.weight": "model-00004-of-00004.safetensors", + "model.embed_tokens.weight": "model-00001-of-00004.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.20.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.23.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.30.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.input_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.down_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.gate_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.up_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.k_norm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.q_norm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.norm.weight": "model-00004-of-00004.safetensors" + } +} diff --git a/run_summary.json b/run_summary.json new file mode 100644 index 0000000..4aa1a38 --- /dev/null +++ b/run_summary.json @@ -0,0 +1,12 @@ +{ + "agent_name": "9f6fd69f6fa50425609d375c4f7198b192f4a61b_thinking_preprocessed", + "training_start": "2026-02-20T19:25:24Z", + "training_end": null, + "created_by": "DCAgent", + "base_model_name": "Qwen/Qwen3-8B", + "dataset_name": "/data/cat/ws/befe330h-befe330h-otagent/huggingface/hub/datasets--DCAgent--exp-uns-r2egym-33_6x_glm_4.7_traces_jupiter/snapshots/9f6fd69f6fa50425609d375c4f7198b192f4a61b_thinking_preprocessed", + "training_type": "SFT", + "training_parameters": "https://huggingface.co/laion/exp-uns-r2egym-33_6x_glm_4_7_traces_jupiter/blob/main/config.json", + "wandb_link": "https://wandb.ai/dogml/OpenThoughts-Agent/runs/sft_exp-uns-r2egym-33_6x_glm_4-7_traces_jupiter_Qwen3-8B", + "traces_location_s3": null +} \ No newline at end of file diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..ac23c0a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..cd71f61 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..e9dc937 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,240 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151665": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151666": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151667": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151668": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 32768, + "pad_token": "<|endoftext|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..50552ae --- /dev/null +++ b/train_results.json @@ -0,0 +1,12 @@ +{ + "achieved_tflops_per_gpu": 112208.80647067179, + "achieved_tflops_per_gpu_theoretical": 4692081.812186509, + "epoch": 7.0, + "mfu_percent": 11345.6831618475, + "mfu_percent_theoretical": 474426.8768641567, + "total_flos": 2.8947179058078024e+18, + "train_loss": 0.0, + "train_runtime": 3.2247, + "train_samples_per_second": 22141.844, + "train_steps_per_second": 1384.951 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..6a4be83 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,895 @@ +{"current_steps": 5, "total_steps": 4466, "loss": 0.8602, "lr": 3.579418344519016e-07, "epoch": 0.00784313725490196, "percentage": 0.11, "elapsed_time": "0:01:29", "remaining_time": "22:04:44"} +{"current_steps": 10, "total_steps": 4466, "loss": 0.8507, "lr": 8.053691275167786e-07, "epoch": 0.01568627450980392, "percentage": 0.22, "elapsed_time": "0:02:42", "remaining_time": "20:05:27"} +{"current_steps": 15, "total_steps": 4466, "loss": 0.8156, "lr": 1.2527964205816557e-06, "epoch": 0.023529411764705882, "percentage": 0.34, "elapsed_time": "0:03:58", "remaining_time": "19:37:17"} +{"current_steps": 20, "total_steps": 4466, "loss": 0.7847, "lr": 1.7002237136465326e-06, "epoch": 0.03137254901960784, "percentage": 0.45, "elapsed_time": "0:05:18", "remaining_time": "19:40:07"} +{"current_steps": 25, "total_steps": 4466, "loss": 0.7347, "lr": 2.1476510067114096e-06, "epoch": 0.0392156862745098, "percentage": 0.56, "elapsed_time": "0:06:35", "remaining_time": "19:31:53"} +{"current_steps": 30, "total_steps": 4466, "loss": 0.6663, "lr": 2.5950782997762863e-06, "epoch": 0.047058823529411764, "percentage": 0.67, "elapsed_time": "0:07:54", "remaining_time": "19:29:30"} +{"current_steps": 35, "total_steps": 4466, "loss": 0.627, "lr": 3.0425055928411635e-06, "epoch": 0.054901960784313725, "percentage": 0.78, "elapsed_time": "0:09:15", "remaining_time": "19:31:52"} +{"current_steps": 40, "total_steps": 4466, "loss": 0.6072, "lr": 3.4899328859060407e-06, "epoch": 0.06274509803921569, "percentage": 0.9, "elapsed_time": "0:10:29", "remaining_time": "19:21:26"} +{"current_steps": 45, "total_steps": 4466, "loss": 0.5814, "lr": 3.937360178970917e-06, "epoch": 0.07058823529411765, "percentage": 1.01, "elapsed_time": "0:11:44", "remaining_time": "19:13:45"} +{"current_steps": 50, "total_steps": 4466, "loss": 0.5545, "lr": 4.384787472035795e-06, "epoch": 0.0784313725490196, "percentage": 1.12, "elapsed_time": "0:13:03", "remaining_time": "19:13:26"} +{"current_steps": 55, "total_steps": 4466, "loss": 0.5497, "lr": 4.832214765100672e-06, "epoch": 0.08627450980392157, "percentage": 1.23, "elapsed_time": "0:14:24", "remaining_time": "19:15:20"} +{"current_steps": 60, "total_steps": 4466, "loss": 0.5404, "lr": 5.2796420581655485e-06, "epoch": 0.09411764705882353, "percentage": 1.34, "elapsed_time": "0:15:41", "remaining_time": "19:12:02"} +{"current_steps": 65, "total_steps": 4466, "loss": 0.5087, "lr": 5.727069351230425e-06, "epoch": 0.10196078431372549, "percentage": 1.46, "elapsed_time": "0:16:58", "remaining_time": "19:09:45"} +{"current_steps": 70, "total_steps": 4466, "loss": 0.5017, "lr": 6.174496644295303e-06, "epoch": 0.10980392156862745, "percentage": 1.57, "elapsed_time": "0:18:20", "remaining_time": "19:11:34"} +{"current_steps": 75, "total_steps": 4466, "loss": 0.4841, "lr": 6.6219239373601796e-06, "epoch": 0.11764705882352941, "percentage": 1.68, "elapsed_time": "0:19:40", "remaining_time": "19:11:29"} +{"current_steps": 80, "total_steps": 4466, "loss": 0.4621, "lr": 7.069351230425056e-06, "epoch": 0.12549019607843137, "percentage": 1.79, "elapsed_time": "0:21:02", "remaining_time": "19:13:29"} +{"current_steps": 85, "total_steps": 4466, "loss": 0.4707, "lr": 7.516778523489934e-06, "epoch": 0.13333333333333333, "percentage": 1.9, "elapsed_time": "0:22:20", "remaining_time": "19:11:53"} +{"current_steps": 90, "total_steps": 4466, "loss": 0.435, "lr": 7.96420581655481e-06, "epoch": 0.1411764705882353, "percentage": 2.02, "elapsed_time": "0:23:37", "remaining_time": "19:08:32"} +{"current_steps": 95, "total_steps": 4466, "loss": 0.4323, "lr": 8.411633109619688e-06, "epoch": 0.14901960784313725, "percentage": 2.13, "elapsed_time": "0:25:00", "remaining_time": "19:10:27"} +{"current_steps": 100, "total_steps": 4466, "loss": 0.4226, "lr": 8.859060402684566e-06, "epoch": 0.1568627450980392, "percentage": 2.24, "elapsed_time": "0:26:16", "remaining_time": "19:07:03"} +{"current_steps": 105, "total_steps": 4466, "loss": 0.4028, "lr": 9.306487695749442e-06, "epoch": 0.16470588235294117, "percentage": 2.35, "elapsed_time": "0:27:32", "remaining_time": "19:03:34"} +{"current_steps": 110, "total_steps": 4466, "loss": 0.4017, "lr": 9.753914988814318e-06, "epoch": 0.17254901960784313, "percentage": 2.46, "elapsed_time": "0:28:52", "remaining_time": "19:03:30"} +{"current_steps": 115, "total_steps": 4466, "loss": 0.4107, "lr": 1.0201342281879197e-05, "epoch": 0.1803921568627451, "percentage": 2.58, "elapsed_time": "0:30:10", "remaining_time": "19:01:35"} +{"current_steps": 120, "total_steps": 4466, "loss": 0.4116, "lr": 1.0648769574944073e-05, "epoch": 0.18823529411764706, "percentage": 2.69, "elapsed_time": "0:31:28", "remaining_time": "18:59:38"} +{"current_steps": 125, "total_steps": 4466, "loss": 0.4072, "lr": 1.109619686800895e-05, "epoch": 0.19607843137254902, "percentage": 2.8, "elapsed_time": "0:32:51", "remaining_time": "19:01:05"} +{"current_steps": 130, "total_steps": 4466, "loss": 0.3932, "lr": 1.1543624161073828e-05, "epoch": 0.20392156862745098, "percentage": 2.91, "elapsed_time": "0:34:05", "remaining_time": "18:57:10"} +{"current_steps": 135, "total_steps": 4466, "loss": 0.3848, "lr": 1.1991051454138702e-05, "epoch": 0.21176470588235294, "percentage": 3.02, "elapsed_time": "0:35:25", "remaining_time": "18:56:34"} +{"current_steps": 140, "total_steps": 4466, "loss": 0.3761, "lr": 1.243847874720358e-05, "epoch": 0.2196078431372549, "percentage": 3.13, "elapsed_time": "0:36:44", "remaining_time": "18:55:12"} +{"current_steps": 145, "total_steps": 4466, "loss": 0.3835, "lr": 1.2885906040268457e-05, "epoch": 0.22745098039215686, "percentage": 3.25, "elapsed_time": "0:38:02", "remaining_time": "18:53:29"} +{"current_steps": 150, "total_steps": 4466, "loss": 0.3903, "lr": 1.3333333333333333e-05, "epoch": 0.23529411764705882, "percentage": 3.36, "elapsed_time": "0:39:19", "remaining_time": "18:51:27"} +{"current_steps": 155, "total_steps": 4466, "loss": 0.3831, "lr": 1.3780760626398211e-05, "epoch": 0.24313725490196078, "percentage": 3.47, "elapsed_time": "0:40:39", "remaining_time": "18:50:52"} +{"current_steps": 160, "total_steps": 4466, "loss": 0.3841, "lr": 1.4228187919463088e-05, "epoch": 0.25098039215686274, "percentage": 3.58, "elapsed_time": "0:41:57", "remaining_time": "18:49:11"} +{"current_steps": 165, "total_steps": 4466, "loss": 0.369, "lr": 1.4675615212527964e-05, "epoch": 0.25882352941176473, "percentage": 3.69, "elapsed_time": "0:43:17", "remaining_time": "18:48:28"} +{"current_steps": 170, "total_steps": 4466, "loss": 0.3851, "lr": 1.5123042505592842e-05, "epoch": 0.26666666666666666, "percentage": 3.81, "elapsed_time": "0:44:37", "remaining_time": "18:47:31"} +{"current_steps": 175, "total_steps": 4466, "loss": 0.3728, "lr": 1.5570469798657718e-05, "epoch": 0.27450980392156865, "percentage": 3.92, "elapsed_time": "0:45:51", "remaining_time": "18:44:24"} +{"current_steps": 180, "total_steps": 4466, "loss": 0.3871, "lr": 1.6017897091722595e-05, "epoch": 0.2823529411764706, "percentage": 4.03, "elapsed_time": "0:47:06", "remaining_time": "18:41:46"} +{"current_steps": 185, "total_steps": 4466, "loss": 0.3489, "lr": 1.6465324384787473e-05, "epoch": 0.2901960784313726, "percentage": 4.14, "elapsed_time": "0:48:19", "remaining_time": "18:38:23"} +{"current_steps": 190, "total_steps": 4466, "loss": 0.3599, "lr": 1.691275167785235e-05, "epoch": 0.2980392156862745, "percentage": 4.25, "elapsed_time": "0:49:39", "remaining_time": "18:37:45"} +{"current_steps": 195, "total_steps": 4466, "loss": 0.3725, "lr": 1.7360178970917228e-05, "epoch": 0.3058823529411765, "percentage": 4.37, "elapsed_time": "0:51:01", "remaining_time": "18:37:38"} +{"current_steps": 200, "total_steps": 4466, "loss": 0.3568, "lr": 1.7807606263982106e-05, "epoch": 0.3137254901960784, "percentage": 4.48, "elapsed_time": "0:52:21", "remaining_time": "18:36:44"} +{"current_steps": 205, "total_steps": 4466, "loss": 0.366, "lr": 1.825503355704698e-05, "epoch": 0.3215686274509804, "percentage": 4.59, "elapsed_time": "0:53:36", "remaining_time": "18:34:20"} +{"current_steps": 210, "total_steps": 4466, "loss": 0.3633, "lr": 1.8702460850111858e-05, "epoch": 0.32941176470588235, "percentage": 4.7, "elapsed_time": "0:54:54", "remaining_time": "18:32:43"} +{"current_steps": 215, "total_steps": 4466, "loss": 0.3486, "lr": 1.9149888143176735e-05, "epoch": 0.33725490196078434, "percentage": 4.81, "elapsed_time": "0:56:09", "remaining_time": "18:30:24"} +{"current_steps": 220, "total_steps": 4466, "loss": 0.3448, "lr": 1.9597315436241613e-05, "epoch": 0.34509803921568627, "percentage": 4.93, "elapsed_time": "0:57:24", "remaining_time": "18:28:07"} +{"current_steps": 225, "total_steps": 4466, "loss": 0.3386, "lr": 2.004474272930649e-05, "epoch": 0.35294117647058826, "percentage": 5.04, "elapsed_time": "0:58:41", "remaining_time": "18:26:14"} +{"current_steps": 230, "total_steps": 4466, "loss": 0.3484, "lr": 2.0492170022371365e-05, "epoch": 0.3607843137254902, "percentage": 5.15, "elapsed_time": "1:00:03", "remaining_time": "18:26:00"} +{"current_steps": 235, "total_steps": 4466, "loss": 0.366, "lr": 2.0939597315436246e-05, "epoch": 0.3686274509803922, "percentage": 5.26, "elapsed_time": "1:01:23", "remaining_time": "18:25:21"} +{"current_steps": 240, "total_steps": 4466, "loss": 0.3349, "lr": 2.138702460850112e-05, "epoch": 0.3764705882352941, "percentage": 5.37, "elapsed_time": "1:02:38", "remaining_time": "18:22:54"} +{"current_steps": 245, "total_steps": 4466, "loss": 0.3293, "lr": 2.1834451901565997e-05, "epoch": 0.3843137254901961, "percentage": 5.49, "elapsed_time": "1:03:55", "remaining_time": "18:21:18"} +{"current_steps": 250, "total_steps": 4466, "loss": 0.3454, "lr": 2.228187919463087e-05, "epoch": 0.39215686274509803, "percentage": 5.6, "elapsed_time": "1:05:14", "remaining_time": "18:20:18"} +{"current_steps": 255, "total_steps": 4466, "loss": 0.3224, "lr": 2.2729306487695753e-05, "epoch": 0.4, "percentage": 5.71, "elapsed_time": "1:06:35", "remaining_time": "18:19:39"} +{"current_steps": 260, "total_steps": 4466, "loss": 0.3281, "lr": 2.3176733780760627e-05, "epoch": 0.40784313725490196, "percentage": 5.82, "elapsed_time": "1:07:51", "remaining_time": "18:17:52"} +{"current_steps": 265, "total_steps": 4466, "loss": 0.3438, "lr": 2.3624161073825508e-05, "epoch": 0.41568627450980394, "percentage": 5.93, "elapsed_time": "1:09:10", "remaining_time": "18:16:30"} +{"current_steps": 270, "total_steps": 4466, "loss": 0.3292, "lr": 2.4071588366890382e-05, "epoch": 0.4235294117647059, "percentage": 6.05, "elapsed_time": "1:10:27", "remaining_time": "18:14:59"} +{"current_steps": 275, "total_steps": 4466, "loss": 0.3302, "lr": 2.451901565995526e-05, "epoch": 0.43137254901960786, "percentage": 6.16, "elapsed_time": "1:11:40", "remaining_time": "18:12:12"} +{"current_steps": 280, "total_steps": 4466, "loss": 0.3341, "lr": 2.4966442953020137e-05, "epoch": 0.4392156862745098, "percentage": 6.27, "elapsed_time": "1:12:59", "remaining_time": "18:11:06"} +{"current_steps": 285, "total_steps": 4466, "loss": 0.3259, "lr": 2.5413870246085015e-05, "epoch": 0.4470588235294118, "percentage": 6.38, "elapsed_time": "1:14:13", "remaining_time": "18:08:52"} +{"current_steps": 290, "total_steps": 4466, "loss": 0.3408, "lr": 2.586129753914989e-05, "epoch": 0.4549019607843137, "percentage": 6.49, "elapsed_time": "1:15:34", "remaining_time": "18:08:16"} +{"current_steps": 295, "total_steps": 4466, "loss": 0.3429, "lr": 2.630872483221477e-05, "epoch": 0.4627450980392157, "percentage": 6.61, "elapsed_time": "1:16:48", "remaining_time": "18:05:57"} +{"current_steps": 300, "total_steps": 4466, "loss": 0.3306, "lr": 2.6756152125279644e-05, "epoch": 0.47058823529411764, "percentage": 6.72, "elapsed_time": "1:18:08", "remaining_time": "18:05:04"} +{"current_steps": 305, "total_steps": 4466, "loss": 0.3164, "lr": 2.7203579418344522e-05, "epoch": 0.47843137254901963, "percentage": 6.83, "elapsed_time": "1:19:21", "remaining_time": "18:02:35"} +{"current_steps": 310, "total_steps": 4466, "loss": 0.311, "lr": 2.76510067114094e-05, "epoch": 0.48627450980392156, "percentage": 6.94, "elapsed_time": "1:20:38", "remaining_time": "18:01:08"} +{"current_steps": 315, "total_steps": 4466, "loss": 0.3149, "lr": 2.8098434004474274e-05, "epoch": 0.49411764705882355, "percentage": 7.05, "elapsed_time": "1:21:52", "remaining_time": "17:58:49"} +{"current_steps": 320, "total_steps": 4466, "loss": 0.3198, "lr": 2.854586129753915e-05, "epoch": 0.5019607843137255, "percentage": 7.17, "elapsed_time": "1:23:06", "remaining_time": "17:56:42"} +{"current_steps": 325, "total_steps": 4466, "loss": 0.3218, "lr": 2.899328859060403e-05, "epoch": 0.5098039215686274, "percentage": 7.28, "elapsed_time": "1:24:24", "remaining_time": "17:55:31"} +{"current_steps": 330, "total_steps": 4466, "loss": 0.3307, "lr": 2.9440715883668906e-05, "epoch": 0.5176470588235295, "percentage": 7.39, "elapsed_time": "1:25:38", "remaining_time": "17:53:21"} +{"current_steps": 335, "total_steps": 4466, "loss": 0.3338, "lr": 2.988814317673378e-05, "epoch": 0.5254901960784314, "percentage": 7.5, "elapsed_time": "1:26:54", "remaining_time": "17:51:47"} +{"current_steps": 340, "total_steps": 4466, "loss": 0.3265, "lr": 3.033557046979866e-05, "epoch": 0.5333333333333333, "percentage": 7.61, "elapsed_time": "1:28:16", "remaining_time": "17:51:14"} +{"current_steps": 345, "total_steps": 4466, "loss": 0.3232, "lr": 3.078299776286353e-05, "epoch": 0.5411764705882353, "percentage": 7.73, "elapsed_time": "1:29:31", "remaining_time": "17:49:26"} +{"current_steps": 350, "total_steps": 4466, "loss": 0.3263, "lr": 3.123042505592841e-05, "epoch": 0.5490196078431373, "percentage": 7.84, "elapsed_time": "1:30:49", "remaining_time": "17:48:07"} +{"current_steps": 355, "total_steps": 4466, "loss": 0.3295, "lr": 3.167785234899329e-05, "epoch": 0.5568627450980392, "percentage": 7.95, "elapsed_time": "1:32:09", "remaining_time": "17:47:15"} +{"current_steps": 360, "total_steps": 4466, "loss": 0.3262, "lr": 3.212527964205817e-05, "epoch": 0.5647058823529412, "percentage": 8.06, "elapsed_time": "1:33:21", "remaining_time": "17:44:50"} +{"current_steps": 365, "total_steps": 4466, "loss": 0.3133, "lr": 3.257270693512304e-05, "epoch": 0.5725490196078431, "percentage": 8.17, "elapsed_time": "1:34:40", "remaining_time": "17:43:42"} +{"current_steps": 370, "total_steps": 4466, "loss": 0.3319, "lr": 3.3020134228187924e-05, "epoch": 0.5803921568627451, "percentage": 8.28, "elapsed_time": "1:35:59", "remaining_time": "17:42:37"} +{"current_steps": 375, "total_steps": 4466, "loss": 0.3156, "lr": 3.34675615212528e-05, "epoch": 0.5882352941176471, "percentage": 8.4, "elapsed_time": "1:37:17", "remaining_time": "17:41:27"} +{"current_steps": 380, "total_steps": 4466, "loss": 0.3068, "lr": 3.391498881431768e-05, "epoch": 0.596078431372549, "percentage": 8.51, "elapsed_time": "1:38:33", "remaining_time": "17:39:46"} +{"current_steps": 385, "total_steps": 4466, "loss": 0.3132, "lr": 3.436241610738255e-05, "epoch": 0.6039215686274509, "percentage": 8.62, "elapsed_time": "1:39:51", "remaining_time": "17:38:26"} +{"current_steps": 390, "total_steps": 4466, "loss": 0.3201, "lr": 3.4809843400447434e-05, "epoch": 0.611764705882353, "percentage": 8.73, "elapsed_time": "1:41:08", "remaining_time": "17:37:05"} +{"current_steps": 395, "total_steps": 4466, "loss": 0.3079, "lr": 3.525727069351231e-05, "epoch": 0.6196078431372549, "percentage": 8.84, "elapsed_time": "1:42:27", "remaining_time": "17:35:54"} +{"current_steps": 400, "total_steps": 4466, "loss": 0.3348, "lr": 3.570469798657719e-05, "epoch": 0.6274509803921569, "percentage": 8.96, "elapsed_time": "1:43:43", "remaining_time": "17:34:16"} +{"current_steps": 405, "total_steps": 4466, "loss": 0.3244, "lr": 3.6152125279642063e-05, "epoch": 0.6352941176470588, "percentage": 9.07, "elapsed_time": "1:45:03", "remaining_time": "17:33:28"} +{"current_steps": 410, "total_steps": 4466, "loss": 0.3058, "lr": 3.659955257270694e-05, "epoch": 0.6431372549019608, "percentage": 9.18, "elapsed_time": "1:46:16", "remaining_time": "17:31:20"} +{"current_steps": 415, "total_steps": 4466, "loss": 0.3151, "lr": 3.704697986577181e-05, "epoch": 0.6509803921568628, "percentage": 9.29, "elapsed_time": "1:47:33", "remaining_time": "17:30:00"} +{"current_steps": 420, "total_steps": 4466, "loss": 0.319, "lr": 3.749440715883669e-05, "epoch": 0.6588235294117647, "percentage": 9.4, "elapsed_time": "1:48:54", "remaining_time": "17:29:04"} +{"current_steps": 425, "total_steps": 4466, "loss": 0.3148, "lr": 3.794183445190157e-05, "epoch": 0.6666666666666666, "percentage": 9.52, "elapsed_time": "1:50:11", "remaining_time": "17:27:47"} +{"current_steps": 430, "total_steps": 4466, "loss": 0.3206, "lr": 3.838926174496644e-05, "epoch": 0.6745098039215687, "percentage": 9.63, "elapsed_time": "1:51:29", "remaining_time": "17:26:31"} +{"current_steps": 435, "total_steps": 4466, "loss": 0.3121, "lr": 3.883668903803132e-05, "epoch": 0.6823529411764706, "percentage": 9.74, "elapsed_time": "1:52:46", "remaining_time": "17:25:05"} +{"current_steps": 440, "total_steps": 4466, "loss": 0.3011, "lr": 3.9284116331096196e-05, "epoch": 0.6901960784313725, "percentage": 9.85, "elapsed_time": "1:53:59", "remaining_time": "17:23:05"} +{"current_steps": 445, "total_steps": 4466, "loss": 0.3118, "lr": 3.973154362416108e-05, "epoch": 0.6980392156862745, "percentage": 9.96, "elapsed_time": "1:55:14", "remaining_time": "17:21:15"} +{"current_steps": 450, "total_steps": 4466, "loss": 0.3123, "lr": 3.999997555873748e-05, "epoch": 0.7058823529411765, "percentage": 10.08, "elapsed_time": "1:56:32", "remaining_time": "17:20:06"} +{"current_steps": 455, "total_steps": 4466, "loss": 0.3045, "lr": 3.999970059522009e-05, "epoch": 0.7137254901960784, "percentage": 10.19, "elapsed_time": "1:57:48", "remaining_time": "17:18:31"} +{"current_steps": 460, "total_steps": 4466, "loss": 0.3248, "lr": 3.9999120120821446e-05, "epoch": 0.7215686274509804, "percentage": 10.3, "elapsed_time": "1:59:09", "remaining_time": "17:17:44"} +{"current_steps": 465, "total_steps": 4466, "loss": 0.3182, "lr": 3.999823414440874e-05, "epoch": 0.7294117647058823, "percentage": 10.41, "elapsed_time": "2:00:25", "remaining_time": "17:16:09"} +{"current_steps": 470, "total_steps": 4466, "loss": 0.2902, "lr": 3.999704267951594e-05, "epoch": 0.7372549019607844, "percentage": 10.52, "elapsed_time": "2:01:41", "remaining_time": "17:14:40"} +{"current_steps": 475, "total_steps": 4466, "loss": 0.3129, "lr": 3.999554574434359e-05, "epoch": 0.7450980392156863, "percentage": 10.64, "elapsed_time": "2:02:59", "remaining_time": "17:13:23"} +{"current_steps": 480, "total_steps": 4466, "loss": 0.3007, "lr": 3.999374336175854e-05, "epoch": 0.7529411764705882, "percentage": 10.75, "elapsed_time": "2:04:07", "remaining_time": "17:10:44"} +{"current_steps": 485, "total_steps": 4466, "loss": 0.3131, "lr": 3.999163555929357e-05, "epoch": 0.7607843137254902, "percentage": 10.86, "elapsed_time": "2:05:22", "remaining_time": "17:09:10"} +{"current_steps": 490, "total_steps": 4466, "loss": 0.3053, "lr": 3.9989222369147e-05, "epoch": 0.7686274509803922, "percentage": 10.97, "elapsed_time": "2:06:43", "remaining_time": "17:08:16"} +{"current_steps": 495, "total_steps": 4466, "loss": 0.3109, "lr": 3.998650382818217e-05, "epoch": 0.7764705882352941, "percentage": 11.08, "elapsed_time": "2:08:02", "remaining_time": "17:07:10"} +{"current_steps": 500, "total_steps": 4466, "loss": 0.3061, "lr": 3.998347997792689e-05, "epoch": 0.7843137254901961, "percentage": 11.2, "elapsed_time": "2:09:17", "remaining_time": "17:05:34"} +{"current_steps": 505, "total_steps": 4466, "loss": 0.3066, "lr": 3.9980150864572815e-05, "epoch": 0.792156862745098, "percentage": 11.31, "elapsed_time": "2:10:34", "remaining_time": "17:04:10"} +{"current_steps": 510, "total_steps": 4466, "loss": 0.2985, "lr": 3.997651653897472e-05, "epoch": 0.8, "percentage": 11.42, "elapsed_time": "2:11:54", "remaining_time": "17:03:08"} +{"current_steps": 515, "total_steps": 4466, "loss": 0.2894, "lr": 3.997257705664974e-05, "epoch": 0.807843137254902, "percentage": 11.53, "elapsed_time": "2:13:14", "remaining_time": "17:02:10"} +{"current_steps": 520, "total_steps": 4466, "loss": 0.307, "lr": 3.9968332477776505e-05, "epoch": 0.8156862745098039, "percentage": 11.64, "elapsed_time": "2:14:29", "remaining_time": "17:00:37"} +{"current_steps": 525, "total_steps": 4466, "loss": 0.2935, "lr": 3.996378286719425e-05, "epoch": 0.8235294117647058, "percentage": 11.76, "elapsed_time": "2:15:47", "remaining_time": "16:59:20"} +{"current_steps": 530, "total_steps": 4466, "loss": 0.3036, "lr": 3.995892829440178e-05, "epoch": 0.8313725490196079, "percentage": 11.87, "elapsed_time": "2:17:08", "remaining_time": "16:58:26"} +{"current_steps": 535, "total_steps": 4466, "loss": 0.2963, "lr": 3.995376883355645e-05, "epoch": 0.8392156862745098, "percentage": 11.98, "elapsed_time": "2:18:26", "remaining_time": "16:57:14"} +{"current_steps": 540, "total_steps": 4466, "loss": 0.312, "lr": 3.994830456347302e-05, "epoch": 0.8470588235294118, "percentage": 12.09, "elapsed_time": "2:19:42", "remaining_time": "16:55:45"} +{"current_steps": 545, "total_steps": 4466, "loss": 0.301, "lr": 3.994253556762243e-05, "epoch": 0.8549019607843137, "percentage": 12.2, "elapsed_time": "2:20:53", "remaining_time": "16:53:40"} +{"current_steps": 550, "total_steps": 4466, "loss": 0.3165, "lr": 3.993646193413053e-05, "epoch": 0.8627450980392157, "percentage": 12.32, "elapsed_time": "2:22:09", "remaining_time": "16:52:07"} +{"current_steps": 555, "total_steps": 4466, "loss": 0.2937, "lr": 3.99300837557768e-05, "epoch": 0.8705882352941177, "percentage": 12.43, "elapsed_time": "2:23:20", "remaining_time": "16:50:03"} +{"current_steps": 560, "total_steps": 4466, "loss": 0.322, "lr": 3.9923401129992826e-05, "epoch": 0.8784313725490196, "percentage": 12.54, "elapsed_time": "2:24:38", "remaining_time": "16:48:49"} +{"current_steps": 565, "total_steps": 4466, "loss": 0.2903, "lr": 3.991641415886089e-05, "epoch": 0.8862745098039215, "percentage": 12.65, "elapsed_time": "2:25:53", "remaining_time": "16:47:20"} +{"current_steps": 570, "total_steps": 4466, "loss": 0.2932, "lr": 3.990912294911236e-05, "epoch": 0.8941176470588236, "percentage": 12.76, "elapsed_time": "2:27:10", "remaining_time": "16:45:58"} +{"current_steps": 575, "total_steps": 4466, "loss": 0.3083, "lr": 3.99015276121261e-05, "epoch": 0.9019607843137255, "percentage": 12.88, "elapsed_time": "2:28:28", "remaining_time": "16:44:44"} +{"current_steps": 580, "total_steps": 4466, "loss": 0.3084, "lr": 3.989362826392676e-05, "epoch": 0.9098039215686274, "percentage": 12.99, "elapsed_time": "2:29:39", "remaining_time": "16:42:40"} +{"current_steps": 585, "total_steps": 4466, "loss": 0.2851, "lr": 3.9885425025183e-05, "epoch": 0.9176470588235294, "percentage": 13.1, "elapsed_time": "2:30:55", "remaining_time": "16:41:14"} +{"current_steps": 590, "total_steps": 4466, "loss": 0.2879, "lr": 3.9876918021205606e-05, "epoch": 0.9254901960784314, "percentage": 13.21, "elapsed_time": "2:32:05", "remaining_time": "16:39:12"} +{"current_steps": 595, "total_steps": 4466, "loss": 0.2882, "lr": 3.9868107381945646e-05, "epoch": 0.9333333333333333, "percentage": 13.32, "elapsed_time": "2:33:24", "remaining_time": "16:38:06"} +{"current_steps": 600, "total_steps": 4466, "loss": 0.3047, "lr": 3.9858993241992454e-05, "epoch": 0.9411764705882353, "percentage": 13.43, "elapsed_time": "2:34:44", "remaining_time": "16:37:03"} +{"current_steps": 605, "total_steps": 4466, "loss": 0.3062, "lr": 3.984957574057155e-05, "epoch": 0.9490196078431372, "percentage": 13.55, "elapsed_time": "2:35:52", "remaining_time": "16:34:45"} +{"current_steps": 610, "total_steps": 4466, "loss": 0.2913, "lr": 3.983985502154254e-05, "epoch": 0.9568627450980393, "percentage": 13.66, "elapsed_time": "2:37:08", "remaining_time": "16:33:22"} +{"current_steps": 615, "total_steps": 4466, "loss": 0.2949, "lr": 3.982983123339694e-05, "epoch": 0.9647058823529412, "percentage": 13.77, "elapsed_time": "2:38:24", "remaining_time": "16:31:53"} +{"current_steps": 620, "total_steps": 4466, "loss": 0.3078, "lr": 3.9819504529255836e-05, "epoch": 0.9725490196078431, "percentage": 13.88, "elapsed_time": "2:39:45", "remaining_time": "16:31:00"} +{"current_steps": 625, "total_steps": 4466, "loss": 0.2901, "lr": 3.980887506686763e-05, "epoch": 0.9803921568627451, "percentage": 13.99, "elapsed_time": "2:41:00", "remaining_time": "16:29:32"} +{"current_steps": 630, "total_steps": 4466, "loss": 0.2913, "lr": 3.9797943008605575e-05, "epoch": 0.9882352941176471, "percentage": 14.11, "elapsed_time": "2:42:19", "remaining_time": "16:28:22"} +{"current_steps": 635, "total_steps": 4466, "loss": 0.2889, "lr": 3.978670852146529e-05, "epoch": 0.996078431372549, "percentage": 14.22, "elapsed_time": "2:43:29", "remaining_time": "16:26:21"} +{"current_steps": 640, "total_steps": 4466, "loss": 0.2951, "lr": 3.977517177706226e-05, "epoch": 1.0031372549019608, "percentage": 14.33, "elapsed_time": "2:44:42", "remaining_time": "16:24:39"} +{"current_steps": 645, "total_steps": 4466, "loss": 0.2754, "lr": 3.976333295162918e-05, "epoch": 1.0109803921568628, "percentage": 14.44, "elapsed_time": "2:45:51", "remaining_time": "16:22:31"} +{"current_steps": 650, "total_steps": 4466, "loss": 0.2758, "lr": 3.975119222601323e-05, "epoch": 1.0188235294117647, "percentage": 14.55, "elapsed_time": "2:47:03", "remaining_time": "16:20:46"} +{"current_steps": 655, "total_steps": 4466, "loss": 0.2882, "lr": 3.9738749785673406e-05, "epoch": 1.0266666666666666, "percentage": 14.67, "elapsed_time": "2:48:24", "remaining_time": "16:19:50"} +{"current_steps": 660, "total_steps": 4466, "loss": 0.2869, "lr": 3.972600582067758e-05, "epoch": 1.0345098039215685, "percentage": 14.78, "elapsed_time": "2:49:43", "remaining_time": "16:18:47"} +{"current_steps": 665, "total_steps": 4466, "loss": 0.2863, "lr": 3.971296052569967e-05, "epoch": 1.0423529411764705, "percentage": 14.89, "elapsed_time": "2:50:57", "remaining_time": "16:17:09"} +{"current_steps": 670, "total_steps": 4466, "loss": 0.2789, "lr": 3.9699614100016634e-05, "epoch": 1.0501960784313726, "percentage": 15.0, "elapsed_time": "2:52:13", "remaining_time": "16:15:48"} +{"current_steps": 675, "total_steps": 4466, "loss": 0.2856, "lr": 3.968596674750545e-05, "epoch": 1.0580392156862746, "percentage": 15.11, "elapsed_time": "2:53:28", "remaining_time": "16:14:19"} +{"current_steps": 680, "total_steps": 4466, "loss": 0.2853, "lr": 3.967201867663996e-05, "epoch": 1.0658823529411765, "percentage": 15.23, "elapsed_time": "2:54:44", "remaining_time": "16:12:54"} +{"current_steps": 685, "total_steps": 4466, "loss": 0.2778, "lr": 3.9657770100487736e-05, "epoch": 1.0737254901960784, "percentage": 15.34, "elapsed_time": "2:55:59", "remaining_time": "16:11:22"} +{"current_steps": 690, "total_steps": 4466, "loss": 0.2792, "lr": 3.964322123670678e-05, "epoch": 1.0815686274509804, "percentage": 15.45, "elapsed_time": "2:57:10", "remaining_time": "16:09:37"} +{"current_steps": 695, "total_steps": 4466, "loss": 0.2957, "lr": 3.9628372307542225e-05, "epoch": 1.0894117647058823, "percentage": 15.56, "elapsed_time": "2:58:29", "remaining_time": "16:08:30"} +{"current_steps": 700, "total_steps": 4466, "loss": 0.2925, "lr": 3.961322353982295e-05, "epoch": 1.0972549019607842, "percentage": 15.67, "elapsed_time": "2:59:47", "remaining_time": "16:07:17"} +{"current_steps": 705, "total_steps": 4466, "loss": 0.2984, "lr": 3.959777516495809e-05, "epoch": 1.1050980392156862, "percentage": 15.79, "elapsed_time": "3:01:04", "remaining_time": "16:06:00"} +{"current_steps": 710, "total_steps": 4466, "loss": 0.2898, "lr": 3.95820274189335e-05, "epoch": 1.1129411764705883, "percentage": 15.9, "elapsed_time": "3:02:19", "remaining_time": "16:04:30"} +{"current_steps": 715, "total_steps": 4466, "loss": 0.2954, "lr": 3.956598054230816e-05, "epoch": 1.1207843137254903, "percentage": 16.01, "elapsed_time": "3:03:37", "remaining_time": "16:03:20"} +{"current_steps": 720, "total_steps": 4466, "loss": 0.2879, "lr": 3.9549634780210536e-05, "epoch": 1.1286274509803922, "percentage": 16.12, "elapsed_time": "3:04:47", "remaining_time": "16:01:27"} +{"current_steps": 725, "total_steps": 4466, "loss": 0.2806, "lr": 3.953299038233476e-05, "epoch": 1.1364705882352941, "percentage": 16.23, "elapsed_time": "3:06:05", "remaining_time": "16:00:13"} +{"current_steps": 730, "total_steps": 4466, "loss": 0.2894, "lr": 3.9516047602936864e-05, "epoch": 1.144313725490196, "percentage": 16.35, "elapsed_time": "3:07:22", "remaining_time": "15:58:59"} +{"current_steps": 735, "total_steps": 4466, "loss": 0.2887, "lr": 3.949880670083091e-05, "epoch": 1.152156862745098, "percentage": 16.46, "elapsed_time": "3:08:35", "remaining_time": "15:57:18"} +{"current_steps": 740, "total_steps": 4466, "loss": 0.3061, "lr": 3.9481267939385e-05, "epoch": 1.16, "percentage": 16.57, "elapsed_time": "3:09:56", "remaining_time": "15:56:21"} +{"current_steps": 745, "total_steps": 4466, "loss": 0.2872, "lr": 3.946343158651725e-05, "epoch": 1.167843137254902, "percentage": 16.68, "elapsed_time": "3:11:11", "remaining_time": "15:54:58"} +{"current_steps": 750, "total_steps": 4466, "loss": 0.2888, "lr": 3.944529791469175e-05, "epoch": 1.175686274509804, "percentage": 16.79, "elapsed_time": "3:12:27", "remaining_time": "15:53:31"} +{"current_steps": 755, "total_steps": 4466, "loss": 0.285, "lr": 3.9426867200914355e-05, "epoch": 1.183529411764706, "percentage": 16.91, "elapsed_time": "3:13:46", "remaining_time": "15:52:29"} +{"current_steps": 760, "total_steps": 4466, "loss": 0.2866, "lr": 3.9408139726728444e-05, "epoch": 1.1913725490196079, "percentage": 17.02, "elapsed_time": "3:15:05", "remaining_time": "15:51:20"} +{"current_steps": 765, "total_steps": 4466, "loss": 0.2765, "lr": 3.9389115778210666e-05, "epoch": 1.1992156862745098, "percentage": 17.13, "elapsed_time": "3:16:18", "remaining_time": "15:49:44"} +{"current_steps": 770, "total_steps": 4466, "loss": 0.2842, "lr": 3.936979564596653e-05, "epoch": 1.2070588235294117, "percentage": 17.24, "elapsed_time": "3:17:33", "remaining_time": "15:48:14"} +{"current_steps": 775, "total_steps": 4466, "loss": 0.2814, "lr": 3.935017962512599e-05, "epoch": 1.2149019607843137, "percentage": 17.35, "elapsed_time": "3:18:46", "remaining_time": "15:46:40"} +{"current_steps": 780, "total_steps": 4466, "loss": 0.298, "lr": 3.933026801533893e-05, "epoch": 1.2227450980392156, "percentage": 17.47, "elapsed_time": "3:20:07", "remaining_time": "15:45:45"} +{"current_steps": 785, "total_steps": 4466, "loss": 0.2795, "lr": 3.9310061120770556e-05, "epoch": 1.2305882352941175, "percentage": 17.58, "elapsed_time": "3:21:24", "remaining_time": "15:44:27"} +{"current_steps": 790, "total_steps": 4466, "loss": 0.2605, "lr": 3.928955925009682e-05, "epoch": 1.2384313725490197, "percentage": 17.69, "elapsed_time": "3:22:39", "remaining_time": "15:42:58"} +{"current_steps": 795, "total_steps": 4466, "loss": 0.2693, "lr": 3.9268762716499615e-05, "epoch": 1.2462745098039216, "percentage": 17.8, "elapsed_time": "3:23:55", "remaining_time": "15:41:37"} +{"current_steps": 800, "total_steps": 4466, "loss": 0.2917, "lr": 3.924767183766208e-05, "epoch": 1.2541176470588236, "percentage": 17.91, "elapsed_time": "3:25:16", "remaining_time": "15:40:38"} +{"current_steps": 805, "total_steps": 4466, "loss": 0.2773, "lr": 3.922628693576369e-05, "epoch": 1.2619607843137255, "percentage": 18.03, "elapsed_time": "3:26:36", "remaining_time": "15:39:38"} +{"current_steps": 810, "total_steps": 4466, "loss": 0.2754, "lr": 3.9204608337475323e-05, "epoch": 1.2698039215686274, "percentage": 18.14, "elapsed_time": "3:27:56", "remaining_time": "15:38:34"} +{"current_steps": 815, "total_steps": 4466, "loss": 0.2918, "lr": 3.9182636373954345e-05, "epoch": 1.2776470588235294, "percentage": 18.25, "elapsed_time": "3:29:13", "remaining_time": "15:37:15"} +{"current_steps": 820, "total_steps": 4466, "loss": 0.2836, "lr": 3.916037138083947e-05, "epoch": 1.2854901960784313, "percentage": 18.36, "elapsed_time": "3:30:29", "remaining_time": "15:35:56"} +{"current_steps": 825, "total_steps": 4466, "loss": 0.275, "lr": 3.913781369824567e-05, "epoch": 1.2933333333333334, "percentage": 18.47, "elapsed_time": "3:31:49", "remaining_time": "15:34:52"} +{"current_steps": 830, "total_steps": 4466, "loss": 0.2935, "lr": 3.911496367075897e-05, "epoch": 1.3011764705882354, "percentage": 18.58, "elapsed_time": "3:33:10", "remaining_time": "15:33:53"} +{"current_steps": 835, "total_steps": 4466, "loss": 0.2821, "lr": 3.909182164743122e-05, "epoch": 1.3090196078431373, "percentage": 18.7, "elapsed_time": "3:34:31", "remaining_time": "15:32:51"} +{"current_steps": 840, "total_steps": 4466, "loss": 0.2772, "lr": 3.906838798177469e-05, "epoch": 1.3168627450980392, "percentage": 18.81, "elapsed_time": "3:35:46", "remaining_time": "15:31:26"} +{"current_steps": 845, "total_steps": 4466, "loss": 0.2993, "lr": 3.904466303175674e-05, "epoch": 1.3247058823529412, "percentage": 18.92, "elapsed_time": "3:37:00", "remaining_time": "15:29:56"} +{"current_steps": 850, "total_steps": 4466, "loss": 0.267, "lr": 3.90206471597943e-05, "epoch": 1.332549019607843, "percentage": 19.03, "elapsed_time": "3:38:17", "remaining_time": "15:28:38"} +{"current_steps": 855, "total_steps": 4466, "loss": 0.2832, "lr": 3.8996340732748396e-05, "epoch": 1.340392156862745, "percentage": 19.14, "elapsed_time": "3:39:34", "remaining_time": "15:27:20"} +{"current_steps": 860, "total_steps": 4466, "loss": 0.2852, "lr": 3.8971744121918465e-05, "epoch": 1.348235294117647, "percentage": 19.26, "elapsed_time": "3:40:51", "remaining_time": "15:26:03"} +{"current_steps": 865, "total_steps": 4466, "loss": 0.2831, "lr": 3.894685770303675e-05, "epoch": 1.356078431372549, "percentage": 19.37, "elapsed_time": "3:42:04", "remaining_time": "15:24:30"} +{"current_steps": 870, "total_steps": 4466, "loss": 0.2845, "lr": 3.8921681856262535e-05, "epoch": 1.3639215686274508, "percentage": 19.48, "elapsed_time": "3:43:23", "remaining_time": "15:23:22"} +{"current_steps": 875, "total_steps": 4466, "loss": 0.2694, "lr": 3.889621696617633e-05, "epoch": 1.371764705882353, "percentage": 19.59, "elapsed_time": "3:44:40", "remaining_time": "15:22:05"} +{"current_steps": 880, "total_steps": 4466, "loss": 0.2886, "lr": 3.887046342177401e-05, "epoch": 1.379607843137255, "percentage": 19.7, "elapsed_time": "3:45:51", "remaining_time": "15:20:22"} +{"current_steps": 885, "total_steps": 4466, "loss": 0.2835, "lr": 3.884442161646086e-05, "epoch": 1.3874509803921569, "percentage": 19.82, "elapsed_time": "3:47:10", "remaining_time": "15:19:11"} +{"current_steps": 890, "total_steps": 4466, "loss": 0.2719, "lr": 3.881809194804559e-05, "epoch": 1.3952941176470588, "percentage": 19.93, "elapsed_time": "3:48:18", "remaining_time": "15:17:18"} +{"current_steps": 895, "total_steps": 4466, "loss": 0.2761, "lr": 3.879147481873423e-05, "epoch": 1.4031372549019607, "percentage": 20.04, "elapsed_time": "3:49:35", "remaining_time": "15:16:05"} +{"current_steps": 900, "total_steps": 4466, "loss": 0.2814, "lr": 3.876457063512399e-05, "epoch": 1.4109803921568629, "percentage": 20.15, "elapsed_time": "3:50:47", "remaining_time": "15:14:28"} +{"current_steps": 905, "total_steps": 4466, "loss": 0.284, "lr": 3.873737980819707e-05, "epoch": 1.4188235294117648, "percentage": 20.26, "elapsed_time": "3:52:05", "remaining_time": "15:13:13"} +{"current_steps": 910, "total_steps": 4466, "loss": 0.2862, "lr": 3.870990275331437e-05, "epoch": 1.4266666666666667, "percentage": 20.38, "elapsed_time": "3:53:19", "remaining_time": "15:11:47"} +{"current_steps": 915, "total_steps": 4466, "loss": 0.2786, "lr": 3.8682139890209124e-05, "epoch": 1.4345098039215687, "percentage": 20.49, "elapsed_time": "3:54:37", "remaining_time": "15:10:34"} +{"current_steps": 920, "total_steps": 4466, "loss": 0.2878, "lr": 3.865409164298052e-05, "epoch": 1.4423529411764706, "percentage": 20.6, "elapsed_time": "3:55:52", "remaining_time": "15:09:09"} +{"current_steps": 925, "total_steps": 4466, "loss": 0.2768, "lr": 3.8625758440087213e-05, "epoch": 1.4501960784313725, "percentage": 20.71, "elapsed_time": "3:57:08", "remaining_time": "15:07:49"} +{"current_steps": 930, "total_steps": 4466, "loss": 0.2755, "lr": 3.859714071434078e-05, "epoch": 1.4580392156862745, "percentage": 20.82, "elapsed_time": "3:58:19", "remaining_time": "15:06:10"} +{"current_steps": 935, "total_steps": 4466, "loss": 0.2711, "lr": 3.8568238902899085e-05, "epoch": 1.4658823529411764, "percentage": 20.94, "elapsed_time": "3:59:41", "remaining_time": "15:05:10"} +{"current_steps": 940, "total_steps": 4466, "loss": 0.2908, "lr": 3.853905344725963e-05, "epoch": 1.4737254901960783, "percentage": 21.05, "elapsed_time": "4:00:59", "remaining_time": "15:03:57"} +{"current_steps": 945, "total_steps": 4466, "loss": 0.2809, "lr": 3.850958479325281e-05, "epoch": 1.4815686274509803, "percentage": 21.16, "elapsed_time": "4:02:17", "remaining_time": "15:02:47"} +{"current_steps": 950, "total_steps": 4466, "loss": 0.2699, "lr": 3.8479833391035085e-05, "epoch": 1.4894117647058824, "percentage": 21.27, "elapsed_time": "4:03:31", "remaining_time": "15:01:17"} +{"current_steps": 955, "total_steps": 4466, "loss": 0.2878, "lr": 3.844979969508211e-05, "epoch": 1.4972549019607844, "percentage": 21.38, "elapsed_time": "4:04:45", "remaining_time": "14:59:50"} +{"current_steps": 960, "total_steps": 4466, "loss": 0.2809, "lr": 3.84194841641818e-05, "epoch": 1.5050980392156863, "percentage": 21.5, "elapsed_time": "4:06:04", "remaining_time": "14:58:41"} +{"current_steps": 965, "total_steps": 4466, "loss": 0.2725, "lr": 3.838888726142732e-05, "epoch": 1.5129411764705882, "percentage": 21.61, "elapsed_time": "4:07:23", "remaining_time": "14:57:33"} +{"current_steps": 970, "total_steps": 4466, "loss": 0.282, "lr": 3.8358009454210006e-05, "epoch": 1.5207843137254902, "percentage": 21.72, "elapsed_time": "4:08:44", "remaining_time": "14:56:30"} +{"current_steps": 975, "total_steps": 4466, "loss": 0.2704, "lr": 3.8326851214212206e-05, "epoch": 1.5286274509803923, "percentage": 21.83, "elapsed_time": "4:09:52", "remaining_time": "14:54:40"} +{"current_steps": 980, "total_steps": 4466, "loss": 0.2584, "lr": 3.829541301740014e-05, "epoch": 1.5364705882352943, "percentage": 21.94, "elapsed_time": "4:11:11", "remaining_time": "14:53:30"} +{"current_steps": 985, "total_steps": 4466, "loss": 0.2769, "lr": 3.826369534401653e-05, "epoch": 1.5443137254901962, "percentage": 22.06, "elapsed_time": "4:12:28", "remaining_time": "14:52:15"} +{"current_steps": 990, "total_steps": 4466, "loss": 0.2739, "lr": 3.823169867857337e-05, "epoch": 1.5521568627450981, "percentage": 22.17, "elapsed_time": "4:13:46", "remaining_time": "14:51:01"} +{"current_steps": 995, "total_steps": 4466, "loss": 0.2828, "lr": 3.819942350984444e-05, "epoch": 1.56, "percentage": 22.28, "elapsed_time": "4:15:00", "remaining_time": "14:49:36"} +{"current_steps": 1000, "total_steps": 4466, "loss": 0.271, "lr": 3.816687033085788e-05, "epoch": 1.567843137254902, "percentage": 22.39, "elapsed_time": "4:16:17", "remaining_time": "14:48:19"} +{"current_steps": 1005, "total_steps": 4466, "loss": 0.2767, "lr": 3.813403963888866e-05, "epoch": 1.575686274509804, "percentage": 22.5, "elapsed_time": "4:17:36", "remaining_time": "14:47:07"} +{"current_steps": 1010, "total_steps": 4466, "loss": 0.2663, "lr": 3.810093193545097e-05, "epoch": 1.5835294117647059, "percentage": 22.62, "elapsed_time": "4:18:47", "remaining_time": "14:45:32"} +{"current_steps": 1015, "total_steps": 4466, "loss": 0.279, "lr": 3.806754772629055e-05, "epoch": 1.5913725490196078, "percentage": 22.73, "elapsed_time": "4:20:08", "remaining_time": "14:44:28"} +{"current_steps": 1020, "total_steps": 4466, "loss": 0.2671, "lr": 3.8033887521377015e-05, "epoch": 1.5992156862745097, "percentage": 22.84, "elapsed_time": "4:21:22", "remaining_time": "14:43:03"} +{"current_steps": 1025, "total_steps": 4466, "loss": 0.2792, "lr": 3.799995183489599e-05, "epoch": 1.6070588235294117, "percentage": 22.95, "elapsed_time": "4:22:38", "remaining_time": "14:41:44"} +{"current_steps": 1030, "total_steps": 4466, "loss": 0.2795, "lr": 3.796574118524131e-05, "epoch": 1.6149019607843136, "percentage": 23.06, "elapsed_time": "4:23:57", "remaining_time": "14:40:33"} +{"current_steps": 1035, "total_steps": 4466, "loss": 0.2853, "lr": 3.793125609500709e-05, "epoch": 1.6227450980392157, "percentage": 23.18, "elapsed_time": "4:25:14", "remaining_time": "14:39:17"} +{"current_steps": 1040, "total_steps": 4466, "loss": 0.2813, "lr": 3.789649709097973e-05, "epoch": 1.6305882352941177, "percentage": 23.29, "elapsed_time": "4:26:32", "remaining_time": "14:38:04"} +{"current_steps": 1045, "total_steps": 4466, "loss": 0.2718, "lr": 3.786146470412988e-05, "epoch": 1.6384313725490196, "percentage": 23.4, "elapsed_time": "4:27:50", "remaining_time": "14:36:50"} +{"current_steps": 1050, "total_steps": 4466, "loss": 0.2782, "lr": 3.782615946960432e-05, "epoch": 1.6462745098039215, "percentage": 23.51, "elapsed_time": "4:29:10", "remaining_time": "14:35:43"} +{"current_steps": 1055, "total_steps": 4466, "loss": 0.2877, "lr": 3.779058192671777e-05, "epoch": 1.6541176470588237, "percentage": 23.62, "elapsed_time": "4:30:28", "remaining_time": "14:34:28"} +{"current_steps": 1060, "total_steps": 4466, "loss": 0.2699, "lr": 3.775473261894472e-05, "epoch": 1.6619607843137256, "percentage": 23.73, "elapsed_time": "4:31:43", "remaining_time": "14:33:07"} +{"current_steps": 1065, "total_steps": 4466, "loss": 0.267, "lr": 3.771861209391103e-05, "epoch": 1.6698039215686276, "percentage": 23.85, "elapsed_time": "4:32:55", "remaining_time": "14:31:32"} +{"current_steps": 1070, "total_steps": 4466, "loss": 0.2901, "lr": 3.768222090338564e-05, "epoch": 1.6776470588235295, "percentage": 23.96, "elapsed_time": "4:34:09", "remaining_time": "14:30:08"} +{"current_steps": 1075, "total_steps": 4466, "loss": 0.2759, "lr": 3.7645559603272104e-05, "epoch": 1.6854901960784314, "percentage": 24.07, "elapsed_time": "4:35:24", "remaining_time": "14:28:46"} +{"current_steps": 1080, "total_steps": 4466, "loss": 0.2739, "lr": 3.76086287536001e-05, "epoch": 1.6933333333333334, "percentage": 24.18, "elapsed_time": "4:36:40", "remaining_time": "14:27:26"} +{"current_steps": 1085, "total_steps": 4466, "loss": 0.2641, "lr": 3.757142891851691e-05, "epoch": 1.7011764705882353, "percentage": 24.29, "elapsed_time": "4:37:56", "remaining_time": "14:26:05"} +{"current_steps": 1090, "total_steps": 4466, "loss": 0.2825, "lr": 3.753396066627876e-05, "epoch": 1.7090196078431372, "percentage": 24.41, "elapsed_time": "4:39:14", "remaining_time": "14:24:52"} +{"current_steps": 1095, "total_steps": 4466, "loss": 0.2755, "lr": 3.749622456924215e-05, "epoch": 1.7168627450980392, "percentage": 24.52, "elapsed_time": "4:40:32", "remaining_time": "14:23:40"} +{"current_steps": 1100, "total_steps": 4466, "loss": 0.2903, "lr": 3.745822120385512e-05, "epoch": 1.724705882352941, "percentage": 24.63, "elapsed_time": "4:41:53", "remaining_time": "14:22:34"} +{"current_steps": 1105, "total_steps": 4466, "loss": 0.2671, "lr": 3.7419951150648445e-05, "epoch": 1.732549019607843, "percentage": 24.74, "elapsed_time": "4:43:06", "remaining_time": "14:21:07"} +{"current_steps": 1110, "total_steps": 4466, "loss": 0.2733, "lr": 3.738141499422677e-05, "epoch": 1.740392156862745, "percentage": 24.85, "elapsed_time": "4:44:23", "remaining_time": "14:19:51"} +{"current_steps": 1115, "total_steps": 4466, "loss": 0.2792, "lr": 3.7342613323259654e-05, "epoch": 1.748235294117647, "percentage": 24.97, "elapsed_time": "4:45:38", "remaining_time": "14:18:26"} +{"current_steps": 1120, "total_steps": 4466, "loss": 0.269, "lr": 3.7303546730472607e-05, "epoch": 1.756078431372549, "percentage": 25.08, "elapsed_time": "4:46:49", "remaining_time": "14:16:52"} +{"current_steps": 1125, "total_steps": 4466, "loss": 0.2689, "lr": 3.726421581263802e-05, "epoch": 1.763921568627451, "percentage": 25.19, "elapsed_time": "4:48:09", "remaining_time": "14:15:45"} +{"current_steps": 1130, "total_steps": 4466, "loss": 0.2718, "lr": 3.722462117056607e-05, "epoch": 1.771764705882353, "percentage": 25.3, "elapsed_time": "4:49:27", "remaining_time": "14:14:33"} +{"current_steps": 1135, "total_steps": 4466, "loss": 0.2682, "lr": 3.718476340909548e-05, "epoch": 1.779607843137255, "percentage": 25.41, "elapsed_time": "4:50:45", "remaining_time": "14:13:19"} +{"current_steps": 1140, "total_steps": 4466, "loss": 0.2711, "lr": 3.714464313708439e-05, "epoch": 1.787450980392157, "percentage": 25.53, "elapsed_time": "4:52:06", "remaining_time": "14:12:13"} +{"current_steps": 1145, "total_steps": 4466, "loss": 0.2845, "lr": 3.710426096740094e-05, "epoch": 1.795294117647059, "percentage": 25.64, "elapsed_time": "4:53:19", "remaining_time": "14:10:46"} +{"current_steps": 1150, "total_steps": 4466, "loss": 0.263, "lr": 3.7063617516913974e-05, "epoch": 1.8031372549019609, "percentage": 25.75, "elapsed_time": "4:54:40", "remaining_time": "14:09:40"} +{"current_steps": 1155, "total_steps": 4466, "loss": 0.2636, "lr": 3.7022713406483626e-05, "epoch": 1.8109803921568628, "percentage": 25.86, "elapsed_time": "4:55:59", "remaining_time": "14:08:30"} +{"current_steps": 1160, "total_steps": 4466, "loss": 0.2773, "lr": 3.698154926095177e-05, "epoch": 1.8188235294117647, "percentage": 25.97, "elapsed_time": "4:57:17", "remaining_time": "14:07:15"} +{"current_steps": 1165, "total_steps": 4466, "loss": 0.2694, "lr": 3.694012570913254e-05, "epoch": 1.8266666666666667, "percentage": 26.09, "elapsed_time": "4:58:30", "remaining_time": "14:05:48"} +{"current_steps": 1170, "total_steps": 4466, "loss": 0.276, "lr": 3.689844338380271e-05, "epoch": 1.8345098039215686, "percentage": 26.2, "elapsed_time": "4:59:46", "remaining_time": "14:04:29"} +{"current_steps": 1175, "total_steps": 4466, "loss": 0.2801, "lr": 3.6856502921692004e-05, "epoch": 1.8423529411764705, "percentage": 26.31, "elapsed_time": "5:01:02", "remaining_time": "14:03:10"} +{"current_steps": 1180, "total_steps": 4466, "loss": 0.2756, "lr": 3.681430496347339e-05, "epoch": 1.8501960784313725, "percentage": 26.42, "elapsed_time": "5:02:17", "remaining_time": "14:01:47"} +{"current_steps": 1185, "total_steps": 4466, "loss": 0.2796, "lr": 3.677185015375329e-05, "epoch": 1.8580392156862744, "percentage": 26.53, "elapsed_time": "5:03:27", "remaining_time": "14:00:12"} +{"current_steps": 1190, "total_steps": 4466, "loss": 0.2759, "lr": 3.672913914106173e-05, "epoch": 1.8658823529411763, "percentage": 26.65, "elapsed_time": "5:04:47", "remaining_time": "13:59:04"} +{"current_steps": 1195, "total_steps": 4466, "loss": 0.2817, "lr": 3.6686172577842425e-05, "epoch": 1.8737254901960785, "percentage": 26.76, "elapsed_time": "5:06:01", "remaining_time": "13:57:40"} +{"current_steps": 1200, "total_steps": 4466, "loss": 0.2835, "lr": 3.6642951120442834e-05, "epoch": 1.8815686274509804, "percentage": 26.87, "elapsed_time": "5:07:22", "remaining_time": "13:56:34"} +{"current_steps": 1205, "total_steps": 4466, "loss": 0.2921, "lr": 3.6599475429104125e-05, "epoch": 1.8894117647058823, "percentage": 26.98, "elapsed_time": "5:08:38", "remaining_time": "13:55:14"} +{"current_steps": 1210, "total_steps": 4466, "loss": 0.2602, "lr": 3.655574616795108e-05, "epoch": 1.8972549019607843, "percentage": 27.09, "elapsed_time": "5:09:47", "remaining_time": "13:53:38"} +{"current_steps": 1215, "total_steps": 4466, "loss": 0.2724, "lr": 3.651176400498194e-05, "epoch": 1.9050980392156864, "percentage": 27.21, "elapsed_time": "5:11:01", "remaining_time": "13:52:14"} +{"current_steps": 1220, "total_steps": 4466, "loss": 0.2895, "lr": 3.646752961205825e-05, "epoch": 1.9129411764705884, "percentage": 27.32, "elapsed_time": "5:12:21", "remaining_time": "13:51:04"} +{"current_steps": 1225, "total_steps": 4466, "loss": 0.2759, "lr": 3.642304366489453e-05, "epoch": 1.9207843137254903, "percentage": 27.43, "elapsed_time": "5:13:39", "remaining_time": "13:49:51"} +{"current_steps": 1230, "total_steps": 4466, "loss": 0.27, "lr": 3.6378306843047996e-05, "epoch": 1.9286274509803922, "percentage": 27.54, "elapsed_time": "5:14:57", "remaining_time": "13:48:37"} +{"current_steps": 1235, "total_steps": 4466, "loss": 0.2731, "lr": 3.6333319829908196e-05, "epoch": 1.9364705882352942, "percentage": 27.65, "elapsed_time": "5:16:12", "remaining_time": "13:47:15"} +{"current_steps": 1240, "total_steps": 4466, "loss": 0.2752, "lr": 3.628808331268649e-05, "epoch": 1.944313725490196, "percentage": 27.77, "elapsed_time": "5:17:26", "remaining_time": "13:45:51"} +{"current_steps": 1245, "total_steps": 4466, "loss": 0.28, "lr": 3.624259798240565e-05, "epoch": 1.952156862745098, "percentage": 27.88, "elapsed_time": "5:18:40", "remaining_time": "13:44:28"} +{"current_steps": 1250, "total_steps": 4466, "loss": 0.2576, "lr": 3.6196864533889245e-05, "epoch": 1.96, "percentage": 27.99, "elapsed_time": "5:19:56", "remaining_time": "13:43:07"} +{"current_steps": 1255, "total_steps": 4466, "loss": 0.2722, "lr": 3.615088366575104e-05, "epoch": 1.967843137254902, "percentage": 28.1, "elapsed_time": "5:21:11", "remaining_time": "13:41:47"} +{"current_steps": 1260, "total_steps": 4466, "loss": 0.2709, "lr": 3.610465608038432e-05, "epoch": 1.9756862745098038, "percentage": 28.21, "elapsed_time": "5:22:25", "remaining_time": "13:40:24"} +{"current_steps": 1265, "total_steps": 4466, "loss": 0.2745, "lr": 3.605818248395118e-05, "epoch": 1.9835294117647058, "percentage": 28.33, "elapsed_time": "5:23:45", "remaining_time": "13:39:14"} +{"current_steps": 1270, "total_steps": 4466, "loss": 0.2661, "lr": 3.6011463586371715e-05, "epoch": 1.9913725490196077, "percentage": 28.44, "elapsed_time": "5:24:59", "remaining_time": "13:37:51"} +{"current_steps": 1275, "total_steps": 4466, "loss": 0.2708, "lr": 3.596450010131319e-05, "epoch": 1.9992156862745099, "percentage": 28.55, "elapsed_time": "5:26:15", "remaining_time": "13:36:31"} +{"current_steps": 1280, "total_steps": 4466, "loss": 0.2561, "lr": 3.5917292746179134e-05, "epoch": 2.0062745098039216, "percentage": 28.66, "elapsed_time": "5:27:19", "remaining_time": "13:34:43"} +{"current_steps": 1285, "total_steps": 4466, "loss": 0.2479, "lr": 3.586984224209837e-05, "epoch": 2.0141176470588236, "percentage": 28.77, "elapsed_time": "5:28:29", "remaining_time": "13:33:09"} +{"current_steps": 1290, "total_steps": 4466, "loss": 0.264, "lr": 3.582214931391402e-05, "epoch": 2.0219607843137255, "percentage": 28.88, "elapsed_time": "5:29:44", "remaining_time": "13:31:48"} +{"current_steps": 1295, "total_steps": 4466, "loss": 0.2724, "lr": 3.5774214690172405e-05, "epoch": 2.0298039215686274, "percentage": 29.0, "elapsed_time": "5:30:59", "remaining_time": "13:30:29"} +{"current_steps": 1300, "total_steps": 4466, "loss": 0.2521, "lr": 3.572603910311196e-05, "epoch": 2.0376470588235294, "percentage": 29.11, "elapsed_time": "5:32:11", "remaining_time": "13:29:02"} +{"current_steps": 1305, "total_steps": 4466, "loss": 0.2648, "lr": 3.5677623288652e-05, "epoch": 2.0454901960784313, "percentage": 29.22, "elapsed_time": "5:33:25", "remaining_time": "13:27:38"} +{"current_steps": 1310, "total_steps": 4466, "loss": 0.2682, "lr": 3.5628967986381485e-05, "epoch": 2.0533333333333332, "percentage": 29.33, "elapsed_time": "5:34:36", "remaining_time": "13:26:08"} +{"current_steps": 1315, "total_steps": 4466, "loss": 0.2536, "lr": 3.558007393954778e-05, "epoch": 2.061176470588235, "percentage": 29.44, "elapsed_time": "5:35:52", "remaining_time": "13:24:49"} +{"current_steps": 1320, "total_steps": 4466, "loss": 0.2586, "lr": 3.553094189504522e-05, "epoch": 2.069019607843137, "percentage": 29.56, "elapsed_time": "5:37:07", "remaining_time": "13:23:29"} +{"current_steps": 1325, "total_steps": 4466, "loss": 0.2478, "lr": 3.548157260340376e-05, "epoch": 2.076862745098039, "percentage": 29.67, "elapsed_time": "5:38:19", "remaining_time": "13:22:02"} +{"current_steps": 1330, "total_steps": 4466, "loss": 0.2627, "lr": 3.5431966818777476e-05, "epoch": 2.084705882352941, "percentage": 29.78, "elapsed_time": "5:39:32", "remaining_time": "13:20:35"} +{"current_steps": 1335, "total_steps": 4466, "loss": 0.2621, "lr": 3.5382125298933055e-05, "epoch": 2.0925490196078433, "percentage": 29.89, "elapsed_time": "5:40:51", "remaining_time": "13:19:25"} +{"current_steps": 1340, "total_steps": 4466, "loss": 0.2572, "lr": 3.533204880523823e-05, "epoch": 2.1003921568627453, "percentage": 30.0, "elapsed_time": "5:42:12", "remaining_time": "13:18:17"} +{"current_steps": 1345, "total_steps": 4466, "loss": 0.2727, "lr": 3.528173810265015e-05, "epoch": 2.108235294117647, "percentage": 30.12, "elapsed_time": "5:43:26", "remaining_time": "13:16:55"} +{"current_steps": 1350, "total_steps": 4466, "loss": 0.2589, "lr": 3.5231193959703654e-05, "epoch": 2.116078431372549, "percentage": 30.23, "elapsed_time": "5:44:42", "remaining_time": "13:15:37"} +{"current_steps": 1355, "total_steps": 4466, "loss": 0.2755, "lr": 3.51804171484996e-05, "epoch": 2.123921568627451, "percentage": 30.34, "elapsed_time": "5:46:03", "remaining_time": "13:14:32"} +{"current_steps": 1360, "total_steps": 4466, "loss": 0.2681, "lr": 3.5129408444693014e-05, "epoch": 2.131764705882353, "percentage": 30.45, "elapsed_time": "5:47:22", "remaining_time": "13:13:21"} +{"current_steps": 1365, "total_steps": 4466, "loss": 0.2552, "lr": 3.507816862748126e-05, "epoch": 2.139607843137255, "percentage": 30.56, "elapsed_time": "5:48:37", "remaining_time": "13:12:01"} +{"current_steps": 1370, "total_steps": 4466, "loss": 0.2397, "lr": 3.502669847959213e-05, "epoch": 2.147450980392157, "percentage": 30.68, "elapsed_time": "5:49:57", "remaining_time": "13:10:51"} +{"current_steps": 1375, "total_steps": 4466, "loss": 0.2621, "lr": 3.497499878727193e-05, "epoch": 2.155294117647059, "percentage": 30.79, "elapsed_time": "5:51:14", "remaining_time": "13:09:34"} +{"current_steps": 1380, "total_steps": 4466, "loss": 0.2691, "lr": 3.49230703402734e-05, "epoch": 2.1631372549019607, "percentage": 30.9, "elapsed_time": "5:52:30", "remaining_time": "13:08:17"} +{"current_steps": 1385, "total_steps": 4466, "loss": 0.2609, "lr": 3.487091393184369e-05, "epoch": 2.1709803921568627, "percentage": 31.01, "elapsed_time": "5:53:41", "remaining_time": "13:06:48"} +{"current_steps": 1390, "total_steps": 4466, "loss": 0.2628, "lr": 3.481853035871224e-05, "epoch": 2.1788235294117646, "percentage": 31.12, "elapsed_time": "5:54:59", "remaining_time": "13:05:35"} +{"current_steps": 1395, "total_steps": 4466, "loss": 0.2552, "lr": 3.476592042107862e-05, "epoch": 2.1866666666666665, "percentage": 31.24, "elapsed_time": "5:56:13", "remaining_time": "13:04:12"} +{"current_steps": 1400, "total_steps": 4466, "loss": 0.2522, "lr": 3.4713084922600274e-05, "epoch": 2.1945098039215685, "percentage": 31.35, "elapsed_time": "5:57:32", "remaining_time": "13:03:00"} +{"current_steps": 1405, "total_steps": 4466, "loss": 0.2608, "lr": 3.466002467038028e-05, "epoch": 2.2023529411764704, "percentage": 31.46, "elapsed_time": "5:58:45", "remaining_time": "13:01:36"} +{"current_steps": 1410, "total_steps": 4466, "loss": 0.2705, "lr": 3.460674047495497e-05, "epoch": 2.2101960784313723, "percentage": 31.57, "elapsed_time": "6:00:00", "remaining_time": "13:00:17"} +{"current_steps": 1415, "total_steps": 4466, "loss": 0.2496, "lr": 3.455323315028164e-05, "epoch": 2.2180392156862747, "percentage": 31.68, "elapsed_time": "6:01:18", "remaining_time": "12:59:03"} +{"current_steps": 1420, "total_steps": 4466, "loss": 0.2733, "lr": 3.449950351372599e-05, "epoch": 2.2258823529411766, "percentage": 31.8, "elapsed_time": "6:02:35", "remaining_time": "12:57:47"} +{"current_steps": 1425, "total_steps": 4466, "loss": 0.2675, "lr": 3.444555238604974e-05, "epoch": 2.2337254901960786, "percentage": 31.91, "elapsed_time": "6:03:51", "remaining_time": "12:56:29"} +{"current_steps": 1430, "total_steps": 4466, "loss": 0.2486, "lr": 3.439138059139808e-05, "epoch": 2.2415686274509805, "percentage": 32.02, "elapsed_time": "6:05:08", "remaining_time": "12:55:13"} +{"current_steps": 1435, "total_steps": 4466, "loss": 0.2546, "lr": 3.433698895728701e-05, "epoch": 2.2494117647058824, "percentage": 32.13, "elapsed_time": "6:06:19", "remaining_time": "12:53:45"} +{"current_steps": 1440, "total_steps": 4466, "loss": 0.2642, "lr": 3.428237831459078e-05, "epoch": 2.2572549019607844, "percentage": 32.24, "elapsed_time": "6:07:39", "remaining_time": "12:52:35"} +{"current_steps": 1445, "total_steps": 4466, "loss": 0.2606, "lr": 3.422754949752917e-05, "epoch": 2.2650980392156863, "percentage": 32.36, "elapsed_time": "6:08:54", "remaining_time": "12:51:15"} +{"current_steps": 1450, "total_steps": 4466, "loss": 0.2553, "lr": 3.41725033436547e-05, "epoch": 2.2729411764705882, "percentage": 32.47, "elapsed_time": "6:10:11", "remaining_time": "12:49:59"} +{"current_steps": 1455, "total_steps": 4466, "loss": 0.2618, "lr": 3.411724069383993e-05, "epoch": 2.28078431372549, "percentage": 32.58, "elapsed_time": "6:11:27", "remaining_time": "12:48:42"} +{"current_steps": 1460, "total_steps": 4466, "loss": 0.2619, "lr": 3.4061762392264545e-05, "epoch": 2.288627450980392, "percentage": 32.69, "elapsed_time": "6:12:48", "remaining_time": "12:47:35"} +{"current_steps": 1465, "total_steps": 4466, "loss": 0.2599, "lr": 3.400606928640245e-05, "epoch": 2.296470588235294, "percentage": 32.8, "elapsed_time": "6:14:05", "remaining_time": "12:46:19"} +{"current_steps": 1470, "total_steps": 4466, "loss": 0.2601, "lr": 3.3950162227008884e-05, "epoch": 2.304313725490196, "percentage": 32.92, "elapsed_time": "6:15:22", "remaining_time": "12:45:03"} +{"current_steps": 1475, "total_steps": 4466, "loss": 0.2603, "lr": 3.389404206810739e-05, "epoch": 2.312156862745098, "percentage": 33.03, "elapsed_time": "6:16:43", "remaining_time": "12:43:55"} +{"current_steps": 1480, "total_steps": 4466, "loss": 0.269, "lr": 3.383770966697675e-05, "epoch": 2.32, "percentage": 33.14, "elapsed_time": "6:18:04", "remaining_time": "12:42:46"} +{"current_steps": 1485, "total_steps": 4466, "loss": 0.2752, "lr": 3.378116588413792e-05, "epoch": 2.3278431372549018, "percentage": 33.25, "elapsed_time": "6:19:21", "remaining_time": "12:41:32"} +{"current_steps": 1490, "total_steps": 4466, "loss": 0.2725, "lr": 3.372441158334089e-05, "epoch": 2.335686274509804, "percentage": 33.36, "elapsed_time": "6:20:42", "remaining_time": "12:40:22"} +{"current_steps": 1495, "total_steps": 4466, "loss": 0.2557, "lr": 3.3667447631551456e-05, "epoch": 2.343529411764706, "percentage": 33.48, "elapsed_time": "6:21:55", "remaining_time": "12:39:00"} +{"current_steps": 1500, "total_steps": 4466, "loss": 0.2493, "lr": 3.361027489893799e-05, "epoch": 2.351372549019608, "percentage": 33.59, "elapsed_time": "6:23:11", "remaining_time": "12:37:41"} +{"current_steps": 1505, "total_steps": 4466, "loss": 0.2489, "lr": 3.3552894258858173e-05, "epoch": 2.35921568627451, "percentage": 33.7, "elapsed_time": "6:25:05", "remaining_time": "12:37:38"} +{"current_steps": 1510, "total_steps": 4466, "loss": 0.249, "lr": 3.3495306587845616e-05, "epoch": 2.367058823529412, "percentage": 33.81, "elapsed_time": "6:26:18", "remaining_time": "12:36:13"} +{"current_steps": 1515, "total_steps": 4466, "loss": 0.2516, "lr": 3.343751276559651e-05, "epoch": 2.374901960784314, "percentage": 33.92, "elapsed_time": "6:27:30", "remaining_time": "12:34:49"} +{"current_steps": 1520, "total_steps": 4466, "loss": 0.2685, "lr": 3.3379513674956134e-05, "epoch": 2.3827450980392157, "percentage": 34.03, "elapsed_time": "6:28:47", "remaining_time": "12:33:32"} +{"current_steps": 1525, "total_steps": 4466, "loss": 0.2478, "lr": 3.332131020190542e-05, "epoch": 2.3905882352941177, "percentage": 34.15, "elapsed_time": "6:30:00", "remaining_time": "12:32:07"} +{"current_steps": 1530, "total_steps": 4466, "loss": 0.2599, "lr": 3.326290323554739e-05, "epoch": 2.3984313725490196, "percentage": 34.26, "elapsed_time": "6:31:17", "remaining_time": "12:30:53"} +{"current_steps": 1535, "total_steps": 4466, "loss": 0.255, "lr": 3.320429366809361e-05, "epoch": 2.4062745098039215, "percentage": 34.37, "elapsed_time": "6:32:25", "remaining_time": "12:29:19"} +{"current_steps": 1540, "total_steps": 4466, "loss": 0.2544, "lr": 3.314548239485048e-05, "epoch": 2.4141176470588235, "percentage": 34.48, "elapsed_time": "6:33:45", "remaining_time": "12:28:07"} +{"current_steps": 1545, "total_steps": 4466, "loss": 0.2706, "lr": 3.308647031420567e-05, "epoch": 2.4219607843137254, "percentage": 34.59, "elapsed_time": "6:34:59", "remaining_time": "12:26:47"} +{"current_steps": 1550, "total_steps": 4466, "loss": 0.2559, "lr": 3.3027258327614305e-05, "epoch": 2.4298039215686273, "percentage": 34.71, "elapsed_time": "6:36:13", "remaining_time": "12:25:25"} +{"current_steps": 1555, "total_steps": 4466, "loss": 0.2617, "lr": 3.296784733958524e-05, "epoch": 2.4376470588235293, "percentage": 34.82, "elapsed_time": "6:37:32", "remaining_time": "12:24:13"} +{"current_steps": 1560, "total_steps": 4466, "loss": 0.2602, "lr": 3.2908238257667214e-05, "epoch": 2.445490196078431, "percentage": 34.93, "elapsed_time": "6:38:53", "remaining_time": "12:23:03"} +{"current_steps": 1565, "total_steps": 4466, "loss": 0.2633, "lr": 3.2848431992435037e-05, "epoch": 2.453333333333333, "percentage": 35.04, "elapsed_time": "6:40:10", "remaining_time": "12:21:48"} +{"current_steps": 1570, "total_steps": 4466, "loss": 0.2675, "lr": 3.278842945747561e-05, "epoch": 2.461176470588235, "percentage": 35.15, "elapsed_time": "6:41:28", "remaining_time": "12:20:32"} +{"current_steps": 1575, "total_steps": 4466, "loss": 0.2734, "lr": 3.272823156937403e-05, "epoch": 2.469019607843137, "percentage": 35.27, "elapsed_time": "6:42:47", "remaining_time": "12:19:21"} +{"current_steps": 1580, "total_steps": 4466, "loss": 0.2734, "lr": 3.266783924769954e-05, "epoch": 2.4768627450980394, "percentage": 35.38, "elapsed_time": "6:44:08", "remaining_time": "12:18:11"} +{"current_steps": 1585, "total_steps": 4466, "loss": 0.2491, "lr": 3.2607253414991534e-05, "epoch": 2.4847058823529413, "percentage": 35.49, "elapsed_time": "6:45:22", "remaining_time": "12:16:50"} +{"current_steps": 1590, "total_steps": 4466, "loss": 0.2517, "lr": 3.2546474996745424e-05, "epoch": 2.4925490196078433, "percentage": 35.6, "elapsed_time": "6:46:38", "remaining_time": "12:15:32"} +{"current_steps": 1595, "total_steps": 4466, "loss": 0.259, "lr": 3.248550492139851e-05, "epoch": 2.500392156862745, "percentage": 35.71, "elapsed_time": "6:47:55", "remaining_time": "12:14:15"} +{"current_steps": 1600, "total_steps": 4466, "loss": 0.2633, "lr": 3.242434412031581e-05, "epoch": 2.508235294117647, "percentage": 35.83, "elapsed_time": "6:49:10", "remaining_time": "12:12:56"} +{"current_steps": 1605, "total_steps": 4466, "loss": 0.2558, "lr": 3.236299352777583e-05, "epoch": 2.516078431372549, "percentage": 35.94, "elapsed_time": "6:50:28", "remaining_time": "12:11:42"} +{"current_steps": 1610, "total_steps": 4466, "loss": 0.2622, "lr": 3.230145408095626e-05, "epoch": 2.523921568627451, "percentage": 36.05, "elapsed_time": "6:51:44", "remaining_time": "12:10:24"} +{"current_steps": 1615, "total_steps": 4466, "loss": 0.2635, "lr": 3.223972671991972e-05, "epoch": 2.531764705882353, "percentage": 36.16, "elapsed_time": "6:52:59", "remaining_time": "12:09:04"} +{"current_steps": 1620, "total_steps": 4466, "loss": 0.2565, "lr": 3.217781238759935e-05, "epoch": 2.539607843137255, "percentage": 36.27, "elapsed_time": "6:54:12", "remaining_time": "12:07:41"} +{"current_steps": 1625, "total_steps": 4466, "loss": 0.2698, "lr": 3.211571202978442e-05, "epoch": 2.547450980392157, "percentage": 36.39, "elapsed_time": "6:55:30", "remaining_time": "12:06:25"} +{"current_steps": 1630, "total_steps": 4466, "loss": 0.25, "lr": 3.2053426595105865e-05, "epoch": 2.5552941176470587, "percentage": 36.5, "elapsed_time": "6:56:45", "remaining_time": "12:05:06"} +{"current_steps": 1635, "total_steps": 4466, "loss": 0.2626, "lr": 3.199095703502185e-05, "epoch": 2.5631372549019606, "percentage": 36.61, "elapsed_time": "6:58:05", "remaining_time": "12:03:55"} +{"current_steps": 1640, "total_steps": 4466, "loss": 0.2528, "lr": 3.1928304303803174e-05, "epoch": 2.5709803921568626, "percentage": 36.72, "elapsed_time": "6:59:20", "remaining_time": "12:02:35"} +{"current_steps": 1645, "total_steps": 4466, "loss": 0.2492, "lr": 3.1865469358518726e-05, "epoch": 2.578823529411765, "percentage": 36.83, "elapsed_time": "7:00:35", "remaining_time": "12:01:15"} +{"current_steps": 1650, "total_steps": 4466, "loss": 0.2451, "lr": 3.180245315902084e-05, "epoch": 2.586666666666667, "percentage": 36.95, "elapsed_time": "7:01:47", "remaining_time": "11:59:50"} +{"current_steps": 1655, "total_steps": 4466, "loss": 0.2504, "lr": 3.173925666793065e-05, "epoch": 2.594509803921569, "percentage": 37.06, "elapsed_time": "7:03:07", "remaining_time": "11:58:39"} +{"current_steps": 1660, "total_steps": 4466, "loss": 0.2755, "lr": 3.1675880850623416e-05, "epoch": 2.6023529411764708, "percentage": 37.17, "elapsed_time": "7:04:22", "remaining_time": "11:57:20"} +{"current_steps": 1665, "total_steps": 4466, "loss": 0.2557, "lr": 3.1612326675213717e-05, "epoch": 2.6101960784313727, "percentage": 37.28, "elapsed_time": "7:05:42", "remaining_time": "11:56:09"} +{"current_steps": 1670, "total_steps": 4466, "loss": 0.2672, "lr": 3.154859511254067e-05, "epoch": 2.6180392156862746, "percentage": 37.39, "elapsed_time": "7:06:58", "remaining_time": "11:54:52"} +{"current_steps": 1675, "total_steps": 4466, "loss": 0.2617, "lr": 3.148468713615318e-05, "epoch": 2.6258823529411766, "percentage": 37.51, "elapsed_time": "7:08:16", "remaining_time": "11:53:36"} +{"current_steps": 1680, "total_steps": 4466, "loss": 0.2561, "lr": 3.1420603722294935e-05, "epoch": 2.6337254901960785, "percentage": 37.62, "elapsed_time": "7:09:30", "remaining_time": "11:52:16"} +{"current_steps": 1685, "total_steps": 4466, "loss": 0.2612, "lr": 3.135634584988962e-05, "epoch": 2.6415686274509804, "percentage": 37.73, "elapsed_time": "7:10:48", "remaining_time": "11:51:02"} +{"current_steps": 1690, "total_steps": 4466, "loss": 0.238, "lr": 3.1291914500525886e-05, "epoch": 2.6494117647058824, "percentage": 37.84, "elapsed_time": "7:12:05", "remaining_time": "11:49:45"} +{"current_steps": 1695, "total_steps": 4466, "loss": 0.2796, "lr": 3.1227310658442395e-05, "epoch": 2.6572549019607843, "percentage": 37.95, "elapsed_time": "7:13:26", "remaining_time": "11:48:36"} +{"current_steps": 1700, "total_steps": 4466, "loss": 0.2619, "lr": 3.1162535310512745e-05, "epoch": 2.665098039215686, "percentage": 38.07, "elapsed_time": "7:14:42", "remaining_time": "11:47:17"} +{"current_steps": 1705, "total_steps": 4466, "loss": 0.2512, "lr": 3.109758944623042e-05, "epoch": 2.672941176470588, "percentage": 38.18, "elapsed_time": "7:16:00", "remaining_time": "11:46:02"} +{"current_steps": 1710, "total_steps": 4466, "loss": 0.2544, "lr": 3.103247405769372e-05, "epoch": 2.68078431372549, "percentage": 38.29, "elapsed_time": "7:17:17", "remaining_time": "11:44:47"} +{"current_steps": 1715, "total_steps": 4466, "loss": 0.2545, "lr": 3.0967190139590484e-05, "epoch": 2.688627450980392, "percentage": 38.4, "elapsed_time": "7:18:31", "remaining_time": "11:43:25"} +{"current_steps": 1720, "total_steps": 4466, "loss": 0.2568, "lr": 3.090173868918303e-05, "epoch": 2.696470588235294, "percentage": 38.51, "elapsed_time": "7:19:47", "remaining_time": "11:42:07"} +{"current_steps": 1725, "total_steps": 4466, "loss": 0.2653, "lr": 3.083612070629283e-05, "epoch": 2.704313725490196, "percentage": 38.63, "elapsed_time": "7:21:04", "remaining_time": "11:40:52"} +{"current_steps": 1730, "total_steps": 4466, "loss": 0.2504, "lr": 3.077033719328529e-05, "epoch": 2.712156862745098, "percentage": 38.74, "elapsed_time": "7:22:21", "remaining_time": "11:39:35"} +{"current_steps": 1735, "total_steps": 4466, "loss": 0.2467, "lr": 3.070438915505439e-05, "epoch": 2.7199999999999998, "percentage": 38.85, "elapsed_time": "7:23:39", "remaining_time": "11:38:20"} +{"current_steps": 1740, "total_steps": 4466, "loss": 0.2606, "lr": 3.063827759900739e-05, "epoch": 2.7278431372549017, "percentage": 38.96, "elapsed_time": "7:24:54", "remaining_time": "11:37:01"} +{"current_steps": 1745, "total_steps": 4466, "loss": 0.2667, "lr": 3.057200353504938e-05, "epoch": 2.735686274509804, "percentage": 39.07, "elapsed_time": "7:26:12", "remaining_time": "11:35:46"} +{"current_steps": 1750, "total_steps": 4466, "loss": 0.2551, "lr": 3.0505567975567915e-05, "epoch": 2.743529411764706, "percentage": 39.18, "elapsed_time": "7:27:28", "remaining_time": "11:34:28"} +{"current_steps": 1755, "total_steps": 4466, "loss": 0.2663, "lr": 3.04389719354175e-05, "epoch": 2.751372549019608, "percentage": 39.3, "elapsed_time": "7:28:45", "remaining_time": "11:33:12"} +{"current_steps": 1760, "total_steps": 4466, "loss": 0.2523, "lr": 3.0372216431904103e-05, "epoch": 2.75921568627451, "percentage": 39.41, "elapsed_time": "7:30:02", "remaining_time": "11:31:56"} +{"current_steps": 1765, "total_steps": 4466, "loss": 0.2479, "lr": 3.030530248476963e-05, "epoch": 2.767058823529412, "percentage": 39.52, "elapsed_time": "7:31:20", "remaining_time": "11:30:41"} +{"current_steps": 1770, "total_steps": 4466, "loss": 0.2612, "lr": 3.0238231116176338e-05, "epoch": 2.7749019607843137, "percentage": 39.63, "elapsed_time": "7:32:30", "remaining_time": "11:29:15"} +{"current_steps": 1775, "total_steps": 4466, "loss": 0.2681, "lr": 3.0171003350691194e-05, "epoch": 2.7827450980392157, "percentage": 39.74, "elapsed_time": "7:33:47", "remaining_time": "11:27:57"} +{"current_steps": 1780, "total_steps": 4466, "loss": 0.2609, "lr": 3.0103620215270285e-05, "epoch": 2.7905882352941176, "percentage": 39.86, "elapsed_time": "7:34:56", "remaining_time": "11:26:30"} +{"current_steps": 1785, "total_steps": 4466, "loss": 0.2507, "lr": 3.0036082739243064e-05, "epoch": 2.7984313725490195, "percentage": 39.97, "elapsed_time": "7:36:15", "remaining_time": "11:25:17"} +{"current_steps": 1790, "total_steps": 4466, "loss": 0.2667, "lr": 2.996839195429667e-05, "epoch": 2.8062745098039215, "percentage": 40.08, "elapsed_time": "7:37:36", "remaining_time": "11:24:06"} +{"current_steps": 1795, "total_steps": 4466, "loss": 0.2575, "lr": 2.9900548894460146e-05, "epoch": 2.8141176470588234, "percentage": 40.19, "elapsed_time": "7:38:51", "remaining_time": "11:22:47"} +{"current_steps": 1800, "total_steps": 4466, "loss": 0.2476, "lr": 2.9832554596088653e-05, "epoch": 2.8219607843137258, "percentage": 40.3, "elapsed_time": "7:40:11", "remaining_time": "11:21:35"} +{"current_steps": 1805, "total_steps": 4466, "loss": 0.2663, "lr": 2.9764410097847657e-05, "epoch": 2.8298039215686277, "percentage": 40.42, "elapsed_time": "7:41:30", "remaining_time": "11:20:22"} +{"current_steps": 1810, "total_steps": 4466, "loss": 0.2689, "lr": 2.9696116440697008e-05, "epoch": 2.8376470588235296, "percentage": 40.53, "elapsed_time": "7:42:48", "remaining_time": "11:19:07"} +{"current_steps": 1815, "total_steps": 4466, "loss": 0.2649, "lr": 2.9627674667875104e-05, "epoch": 2.8454901960784316, "percentage": 40.64, "elapsed_time": "7:44:07", "remaining_time": "11:17:54"} +{"current_steps": 1820, "total_steps": 4466, "loss": 0.2558, "lr": 2.9559085824882916e-05, "epoch": 2.8533333333333335, "percentage": 40.75, "elapsed_time": "7:45:25", "remaining_time": "11:16:39"} +{"current_steps": 1825, "total_steps": 4466, "loss": 0.2641, "lr": 2.9490350959468014e-05, "epoch": 2.8611764705882354, "percentage": 40.86, "elapsed_time": "7:46:45", "remaining_time": "11:15:27"} +{"current_steps": 1830, "total_steps": 4466, "loss": 0.2587, "lr": 2.9421471121608588e-05, "epoch": 2.8690196078431374, "percentage": 40.98, "elapsed_time": "7:47:58", "remaining_time": "11:14:05"} +{"current_steps": 1835, "total_steps": 4466, "loss": 0.2444, "lr": 2.9352447363497378e-05, "epoch": 2.8768627450980393, "percentage": 41.09, "elapsed_time": "7:49:15", "remaining_time": "11:12:48"} +{"current_steps": 1840, "total_steps": 4466, "loss": 0.2526, "lr": 2.928328073952564e-05, "epoch": 2.8847058823529412, "percentage": 41.2, "elapsed_time": "7:50:31", "remaining_time": "11:11:31"} +{"current_steps": 1845, "total_steps": 4466, "loss": 0.251, "lr": 2.921397230626699e-05, "epoch": 2.892549019607843, "percentage": 41.31, "elapsed_time": "7:51:47", "remaining_time": "11:10:13"} +{"current_steps": 1850, "total_steps": 4466, "loss": 0.2597, "lr": 2.914452312246131e-05, "epoch": 2.900392156862745, "percentage": 41.42, "elapsed_time": "7:53:01", "remaining_time": "11:08:53"} +{"current_steps": 1855, "total_steps": 4466, "loss": 0.2661, "lr": 2.9074934248998557e-05, "epoch": 2.908235294117647, "percentage": 41.54, "elapsed_time": "7:54:17", "remaining_time": "11:07:34"} +{"current_steps": 1860, "total_steps": 4466, "loss": 0.2632, "lr": 2.9005206748902538e-05, "epoch": 2.916078431372549, "percentage": 41.65, "elapsed_time": "7:55:32", "remaining_time": "11:06:15"} +{"current_steps": 1865, "total_steps": 4466, "loss": 0.2526, "lr": 2.8935341687314703e-05, "epoch": 2.923921568627451, "percentage": 41.76, "elapsed_time": "7:56:50", "remaining_time": "11:05:01"} +{"current_steps": 1870, "total_steps": 4466, "loss": 0.2554, "lr": 2.8865340131477846e-05, "epoch": 2.931764705882353, "percentage": 41.87, "elapsed_time": "7:58:08", "remaining_time": "11:03:46"} +{"current_steps": 1875, "total_steps": 4466, "loss": 0.2574, "lr": 2.8795203150719836e-05, "epoch": 2.9396078431372548, "percentage": 41.98, "elapsed_time": "7:59:27", "remaining_time": "11:02:33"} +{"current_steps": 1880, "total_steps": 4466, "loss": 0.2502, "lr": 2.8724931816437255e-05, "epoch": 2.9474509803921567, "percentage": 42.1, "elapsed_time": "8:00:41", "remaining_time": "11:01:12"} +{"current_steps": 1885, "total_steps": 4466, "loss": 0.2641, "lr": 2.8654527202079027e-05, "epoch": 2.9552941176470586, "percentage": 42.21, "elapsed_time": "8:01:58", "remaining_time": "10:59:55"} +{"current_steps": 1890, "total_steps": 4466, "loss": 0.2524, "lr": 2.8583990383130043e-05, "epoch": 2.9631372549019606, "percentage": 42.32, "elapsed_time": "8:03:14", "remaining_time": "10:58:38"} +{"current_steps": 1895, "total_steps": 4466, "loss": 0.247, "lr": 2.8513322437094727e-05, "epoch": 2.9709803921568625, "percentage": 42.43, "elapsed_time": "8:04:30", "remaining_time": "10:57:20"} +{"current_steps": 1900, "total_steps": 4466, "loss": 0.2522, "lr": 2.844252444348055e-05, "epoch": 2.978823529411765, "percentage": 42.54, "elapsed_time": "8:05:51", "remaining_time": "10:56:09"} +{"current_steps": 1905, "total_steps": 4466, "loss": 0.2529, "lr": 2.8371597483781577e-05, "epoch": 2.986666666666667, "percentage": 42.66, "elapsed_time": "8:07:04", "remaining_time": "10:54:47"} +{"current_steps": 1910, "total_steps": 4466, "loss": 0.2564, "lr": 2.8300542641461937e-05, "epoch": 2.9945098039215687, "percentage": 42.77, "elapsed_time": "8:08:21", "remaining_time": "10:53:31"} +{"current_steps": 1915, "total_steps": 4466, "loss": 0.2776, "lr": 2.822936100193924e-05, "epoch": 3.0015686274509803, "percentage": 42.88, "elapsed_time": "8:09:27", "remaining_time": "10:52:00"} +{"current_steps": 1920, "total_steps": 4466, "loss": 0.2491, "lr": 2.8158053652568046e-05, "epoch": 3.0094117647058822, "percentage": 42.99, "elapsed_time": "8:10:42", "remaining_time": "10:50:41"} +{"current_steps": 1925, "total_steps": 4466, "loss": 0.2411, "lr": 2.808662168262321e-05, "epoch": 3.017254901960784, "percentage": 43.1, "elapsed_time": "8:11:57", "remaining_time": "10:49:22"} +{"current_steps": 1930, "total_steps": 4466, "loss": 0.2519, "lr": 2.8015066183283272e-05, "epoch": 3.025098039215686, "percentage": 43.22, "elapsed_time": "8:13:11", "remaining_time": "10:48:03"} +{"current_steps": 1935, "total_steps": 4466, "loss": 0.2366, "lr": 2.7943388247613787e-05, "epoch": 3.032941176470588, "percentage": 43.33, "elapsed_time": "8:14:27", "remaining_time": "10:46:45"} +{"current_steps": 1940, "total_steps": 4466, "loss": 0.255, "lr": 2.787158897055061e-05, "epoch": 3.0407843137254904, "percentage": 43.44, "elapsed_time": "8:15:45", "remaining_time": "10:45:30"} +{"current_steps": 1945, "total_steps": 4466, "loss": 0.2406, "lr": 2.7799669448883165e-05, "epoch": 3.0486274509803923, "percentage": 43.55, "elapsed_time": "8:16:57", "remaining_time": "10:44:07"} +{"current_steps": 1950, "total_steps": 4466, "loss": 0.2433, "lr": 2.7727630781237743e-05, "epoch": 3.0564705882352943, "percentage": 43.66, "elapsed_time": "8:18:11", "remaining_time": "10:42:47"} +{"current_steps": 1955, "total_steps": 4466, "loss": 0.2493, "lr": 2.7655474068060644e-05, "epoch": 3.064313725490196, "percentage": 43.78, "elapsed_time": "8:19:29", "remaining_time": "10:41:32"} +{"current_steps": 1960, "total_steps": 4466, "loss": 0.2317, "lr": 2.7583200411601424e-05, "epoch": 3.072156862745098, "percentage": 43.89, "elapsed_time": "8:20:46", "remaining_time": "10:40:16"} +{"current_steps": 1965, "total_steps": 4466, "loss": 0.2406, "lr": 2.7510810915896043e-05, "epoch": 3.08, "percentage": 44.0, "elapsed_time": "8:21:58", "remaining_time": "10:38:54"} +{"current_steps": 1970, "total_steps": 4466, "loss": 0.233, "lr": 2.7438306686749978e-05, "epoch": 3.087843137254902, "percentage": 44.11, "elapsed_time": "8:23:15", "remaining_time": "10:37:37"} +{"current_steps": 1975, "total_steps": 4466, "loss": 0.2392, "lr": 2.7365688831721358e-05, "epoch": 3.095686274509804, "percentage": 44.22, "elapsed_time": "8:24:30", "remaining_time": "10:36:19"} +{"current_steps": 1980, "total_steps": 4466, "loss": 0.2504, "lr": 2.7292958460104027e-05, "epoch": 3.103529411764706, "percentage": 44.33, "elapsed_time": "8:25:49", "remaining_time": "10:35:05"} +{"current_steps": 1985, "total_steps": 4466, "loss": 0.2519, "lr": 2.7220116682910628e-05, "epoch": 3.111372549019608, "percentage": 44.45, "elapsed_time": "8:27:00", "remaining_time": "10:33:41"} +{"current_steps": 1990, "total_steps": 4466, "loss": 0.2453, "lr": 2.714716461285559e-05, "epoch": 3.1192156862745097, "percentage": 44.56, "elapsed_time": "8:28:15", "remaining_time": "10:32:23"} +{"current_steps": 1995, "total_steps": 4466, "loss": 0.2406, "lr": 2.7074103364338155e-05, "epoch": 3.1270588235294117, "percentage": 44.67, "elapsed_time": "8:29:35", "remaining_time": "10:31:10"} +{"current_steps": 2000, "total_steps": 4466, "loss": 0.248, "lr": 2.7000934053425347e-05, "epoch": 3.1349019607843136, "percentage": 44.78, "elapsed_time": "8:30:49", "remaining_time": "10:29:51"} +{"current_steps": 2005, "total_steps": 4466, "loss": 0.2402, "lr": 2.692765779783494e-05, "epoch": 3.1427450980392155, "percentage": 44.89, "elapsed_time": "8:32:08", "remaining_time": "10:28:37"} +{"current_steps": 2010, "total_steps": 4466, "loss": 0.253, "lr": 2.6854275716918352e-05, "epoch": 3.1505882352941175, "percentage": 45.01, "elapsed_time": "8:33:24", "remaining_time": "10:27:19"} +{"current_steps": 2015, "total_steps": 4466, "loss": 0.2434, "lr": 2.678078893164359e-05, "epoch": 3.1584313725490194, "percentage": 45.12, "elapsed_time": "8:34:42", "remaining_time": "10:26:04"} +{"current_steps": 2020, "total_steps": 4466, "loss": 0.2362, "lr": 2.6707198564578066e-05, "epoch": 3.1662745098039213, "percentage": 45.23, "elapsed_time": "8:36:00", "remaining_time": "10:24:50"} +{"current_steps": 2025, "total_steps": 4466, "loss": 0.2461, "lr": 2.663350573987152e-05, "epoch": 3.1741176470588237, "percentage": 45.34, "elapsed_time": "8:37:19", "remaining_time": "10:23:35"} +{"current_steps": 2030, "total_steps": 4466, "loss": 0.231, "lr": 2.655971158323879e-05, "epoch": 3.1819607843137256, "percentage": 45.45, "elapsed_time": "8:38:34", "remaining_time": "10:22:17"} +{"current_steps": 2035, "total_steps": 4466, "loss": 0.2465, "lr": 2.648581722194264e-05, "epoch": 3.1898039215686276, "percentage": 45.57, "elapsed_time": "8:39:54", "remaining_time": "10:21:04"} +{"current_steps": 2040, "total_steps": 4466, "loss": 0.2353, "lr": 2.6411823784776537e-05, "epoch": 3.1976470588235295, "percentage": 45.68, "elapsed_time": "8:41:06", "remaining_time": "10:19:42"} +{"current_steps": 2045, "total_steps": 4466, "loss": 0.2309, "lr": 2.6337732402047422e-05, "epoch": 3.2054901960784314, "percentage": 45.79, "elapsed_time": "8:42:25", "remaining_time": "10:18:28"} +{"current_steps": 2050, "total_steps": 4466, "loss": 0.2422, "lr": 2.626354420555841e-05, "epoch": 3.2133333333333334, "percentage": 45.9, "elapsed_time": "8:43:43", "remaining_time": "10:17:13"} +{"current_steps": 2055, "total_steps": 4466, "loss": 0.2461, "lr": 2.618926032859154e-05, "epoch": 3.2211764705882353, "percentage": 46.01, "elapsed_time": "8:44:59", "remaining_time": "10:15:56"} +{"current_steps": 2060, "total_steps": 4466, "loss": 0.2498, "lr": 2.611488190589043e-05, "epoch": 3.2290196078431372, "percentage": 46.13, "elapsed_time": "8:46:15", "remaining_time": "10:14:39"} +{"current_steps": 2065, "total_steps": 4466, "loss": 0.2573, "lr": 2.6040410073642965e-05, "epoch": 3.236862745098039, "percentage": 46.24, "elapsed_time": "8:47:33", "remaining_time": "10:13:23"} +{"current_steps": 2070, "total_steps": 4466, "loss": 0.249, "lr": 2.596584596946392e-05, "epoch": 3.244705882352941, "percentage": 46.35, "elapsed_time": "8:48:51", "remaining_time": "10:12:08"} +{"current_steps": 2075, "total_steps": 4466, "loss": 0.2485, "lr": 2.589119073237762e-05, "epoch": 3.252549019607843, "percentage": 46.46, "elapsed_time": "8:50:10", "remaining_time": "10:10:55"} +{"current_steps": 2080, "total_steps": 4466, "loss": 0.2467, "lr": 2.5816445502800494e-05, "epoch": 3.260392156862745, "percentage": 46.57, "elapsed_time": "8:51:28", "remaining_time": "10:09:39"} +{"current_steps": 2085, "total_steps": 4466, "loss": 0.2363, "lr": 2.5741611422523684e-05, "epoch": 3.268235294117647, "percentage": 46.69, "elapsed_time": "8:52:45", "remaining_time": "10:08:23"} +{"current_steps": 2090, "total_steps": 4466, "loss": 0.2534, "lr": 2.566668963469559e-05, "epoch": 3.276078431372549, "percentage": 46.8, "elapsed_time": "8:54:03", "remaining_time": "10:07:08"} +{"current_steps": 2095, "total_steps": 4466, "loss": 0.2451, "lr": 2.5591681283804426e-05, "epoch": 3.283921568627451, "percentage": 46.91, "elapsed_time": "8:55:18", "remaining_time": "10:05:49"} +{"current_steps": 2100, "total_steps": 4466, "loss": 0.2448, "lr": 2.5516587515660706e-05, "epoch": 3.291764705882353, "percentage": 47.02, "elapsed_time": "8:56:32", "remaining_time": "10:04:29"} +{"current_steps": 2105, "total_steps": 4466, "loss": 0.2531, "lr": 2.5441409477379764e-05, "epoch": 3.299607843137255, "percentage": 47.13, "elapsed_time": "8:57:49", "remaining_time": "10:03:14"} +{"current_steps": 2110, "total_steps": 4466, "loss": 0.2383, "lr": 2.5366148317364237e-05, "epoch": 3.307450980392157, "percentage": 47.25, "elapsed_time": "8:59:01", "remaining_time": "10:01:51"} +{"current_steps": 2115, "total_steps": 4466, "loss": 0.2358, "lr": 2.5290805185286494e-05, "epoch": 3.315294117647059, "percentage": 47.36, "elapsed_time": "9:00:17", "remaining_time": "10:00:34"} +{"current_steps": 2120, "total_steps": 4466, "loss": 0.244, "lr": 2.521538123207111e-05, "epoch": 3.323137254901961, "percentage": 47.47, "elapsed_time": "9:01:32", "remaining_time": "9:59:16"} +{"current_steps": 2125, "total_steps": 4466, "loss": 0.2586, "lr": 2.5139877609877244e-05, "epoch": 3.330980392156863, "percentage": 47.58, "elapsed_time": "9:02:48", "remaining_time": "9:57:59"} +{"current_steps": 2130, "total_steps": 4466, "loss": 0.2442, "lr": 2.506429547208107e-05, "epoch": 3.3388235294117647, "percentage": 47.69, "elapsed_time": "9:04:07", "remaining_time": "9:56:45"} +{"current_steps": 2135, "total_steps": 4466, "loss": 0.2447, "lr": 2.498863597325815e-05, "epoch": 3.3466666666666667, "percentage": 47.81, "elapsed_time": "9:05:23", "remaining_time": "9:55:27"} +{"current_steps": 2140, "total_steps": 4466, "loss": 0.2392, "lr": 2.4912900269165797e-05, "epoch": 3.3545098039215686, "percentage": 47.92, "elapsed_time": "9:06:39", "remaining_time": "9:54:10"} +{"current_steps": 2145, "total_steps": 4466, "loss": 0.2453, "lr": 2.483708951672541e-05, "epoch": 3.3623529411764705, "percentage": 48.03, "elapsed_time": "9:07:56", "remaining_time": "9:52:54"} +{"current_steps": 2150, "total_steps": 4466, "loss": 0.2361, "lr": 2.4761204874004818e-05, "epoch": 3.3701960784313725, "percentage": 48.14, "elapsed_time": "9:09:13", "remaining_time": "9:51:38"} +{"current_steps": 2155, "total_steps": 4466, "loss": 0.2367, "lr": 2.4685247500200583e-05, "epoch": 3.3780392156862744, "percentage": 48.25, "elapsed_time": "9:10:29", "remaining_time": "9:50:20"} +{"current_steps": 2160, "total_steps": 4466, "loss": 0.2494, "lr": 2.4609218555620275e-05, "epoch": 3.3858823529411763, "percentage": 48.37, "elapsed_time": "9:11:47", "remaining_time": "9:49:05"} +{"current_steps": 2165, "total_steps": 4466, "loss": 0.2504, "lr": 2.4533119201664785e-05, "epoch": 3.3937254901960783, "percentage": 48.48, "elapsed_time": "9:13:04", "remaining_time": "9:47:49"} +{"current_steps": 2170, "total_steps": 4466, "loss": 0.2416, "lr": 2.4456950600810542e-05, "epoch": 3.40156862745098, "percentage": 48.59, "elapsed_time": "9:14:19", "remaining_time": "9:46:30"} +{"current_steps": 2175, "total_steps": 4466, "loss": 0.243, "lr": 2.4380713916591785e-05, "epoch": 3.409411764705882, "percentage": 48.7, "elapsed_time": "9:15:29", "remaining_time": "9:45:07"} +{"current_steps": 2180, "total_steps": 4466, "loss": 0.2604, "lr": 2.4304410313582776e-05, "epoch": 3.417254901960784, "percentage": 48.81, "elapsed_time": "9:16:45", "remaining_time": "9:43:49"} +{"current_steps": 2185, "total_steps": 4466, "loss": 0.2497, "lr": 2.422804095738002e-05, "epoch": 3.4250980392156865, "percentage": 48.93, "elapsed_time": "9:18:00", "remaining_time": "9:42:31"} +{"current_steps": 2190, "total_steps": 4466, "loss": 0.2534, "lr": 2.4151607014584437e-05, "epoch": 3.4329411764705884, "percentage": 49.04, "elapsed_time": "9:19:20", "remaining_time": "9:41:18"} +{"current_steps": 2195, "total_steps": 4466, "loss": 0.2599, "lr": 2.4075109652783573e-05, "epoch": 3.4407843137254903, "percentage": 49.15, "elapsed_time": "9:20:34", "remaining_time": "9:39:59"} +{"current_steps": 2200, "total_steps": 4466, "loss": 0.2602, "lr": 2.3998550040533743e-05, "epoch": 3.4486274509803923, "percentage": 49.26, "elapsed_time": "9:21:53", "remaining_time": "9:38:44"} +{"current_steps": 2205, "total_steps": 4466, "loss": 0.2466, "lr": 2.392192934734219e-05, "epoch": 3.456470588235294, "percentage": 49.37, "elapsed_time": "9:23:10", "remaining_time": "9:37:28"} +{"current_steps": 2210, "total_steps": 4466, "loss": 0.2353, "lr": 2.3845248743649196e-05, "epoch": 3.464313725490196, "percentage": 49.48, "elapsed_time": "9:24:26", "remaining_time": "9:36:11"} +{"current_steps": 2215, "total_steps": 4466, "loss": 0.2518, "lr": 2.376850940081025e-05, "epoch": 3.472156862745098, "percentage": 49.6, "elapsed_time": "9:25:46", "remaining_time": "9:34:58"} +{"current_steps": 2220, "total_steps": 4466, "loss": 0.2456, "lr": 2.3691712491078107e-05, "epoch": 3.48, "percentage": 49.71, "elapsed_time": "9:26:59", "remaining_time": "9:33:38"} +{"current_steps": 2225, "total_steps": 4466, "loss": 0.2494, "lr": 2.3614859187584914e-05, "epoch": 3.487843137254902, "percentage": 49.82, "elapsed_time": "9:28:13", "remaining_time": "9:32:19"} +{"current_steps": 2230, "total_steps": 4466, "loss": 0.2498, "lr": 2.353795066432427e-05, "epoch": 3.495686274509804, "percentage": 49.93, "elapsed_time": "9:29:33", "remaining_time": "9:31:05"} +{"current_steps": 2235, "total_steps": 4466, "loss": 0.2499, "lr": 2.3460988096133284e-05, "epoch": 3.503529411764706, "percentage": 50.04, "elapsed_time": "9:30:53", "remaining_time": "9:29:52"} +{"current_steps": 2240, "total_steps": 4466, "loss": 0.2526, "lr": 2.338397265867468e-05, "epoch": 3.5113725490196077, "percentage": 50.16, "elapsed_time": "9:32:10", "remaining_time": "9:28:35"} +{"current_steps": 2245, "total_steps": 4466, "loss": 0.2488, "lr": 2.3306905528418762e-05, "epoch": 3.5192156862745096, "percentage": 50.27, "elapsed_time": "9:33:30", "remaining_time": "9:27:23"} +{"current_steps": 2250, "total_steps": 4466, "loss": 0.2439, "lr": 2.3229787882625496e-05, "epoch": 3.527058823529412, "percentage": 50.38, "elapsed_time": "9:34:45", "remaining_time": "9:26:04"} +{"current_steps": 2255, "total_steps": 4466, "loss": 0.2594, "lr": 2.315262089932653e-05, "epoch": 3.534901960784314, "percentage": 50.49, "elapsed_time": "9:36:01", "remaining_time": "9:24:47"} +{"current_steps": 2260, "total_steps": 4466, "loss": 0.2528, "lr": 2.3075405757307147e-05, "epoch": 3.542745098039216, "percentage": 50.6, "elapsed_time": "9:37:09", "remaining_time": "9:23:22"} +{"current_steps": 2265, "total_steps": 4466, "loss": 0.243, "lr": 2.2998143636088323e-05, "epoch": 3.550588235294118, "percentage": 50.72, "elapsed_time": "9:38:26", "remaining_time": "9:22:05"} +{"current_steps": 2270, "total_steps": 4466, "loss": 0.2404, "lr": 2.2920835715908654e-05, "epoch": 3.5584313725490198, "percentage": 50.83, "elapsed_time": "9:39:43", "remaining_time": "9:20:49"} +{"current_steps": 2275, "total_steps": 4466, "loss": 0.2461, "lr": 2.2843483177706363e-05, "epoch": 3.5662745098039217, "percentage": 50.94, "elapsed_time": "9:41:01", "remaining_time": "9:19:34"} +{"current_steps": 2280, "total_steps": 4466, "loss": 0.2502, "lr": 2.2766087203101245e-05, "epoch": 3.5741176470588236, "percentage": 51.05, "elapsed_time": "9:42:22", "remaining_time": "9:18:21"} +{"current_steps": 2285, "total_steps": 4466, "loss": 0.2293, "lr": 2.2688648974376622e-05, "epoch": 3.5819607843137256, "percentage": 51.16, "elapsed_time": "9:43:35", "remaining_time": "9:17:01"} +{"current_steps": 2290, "total_steps": 4466, "loss": 0.2375, "lr": 2.261116967446127e-05, "epoch": 3.5898039215686275, "percentage": 51.28, "elapsed_time": "9:44:53", "remaining_time": "9:15:46"} +{"current_steps": 2295, "total_steps": 4466, "loss": 0.2399, "lr": 2.2533650486911375e-05, "epoch": 3.5976470588235294, "percentage": 51.39, "elapsed_time": "9:46:05", "remaining_time": "9:14:25"} +{"current_steps": 2300, "total_steps": 4466, "loss": 0.2454, "lr": 2.245609259589243e-05, "epoch": 3.6054901960784314, "percentage": 51.5, "elapsed_time": "9:47:19", "remaining_time": "9:13:06"} +{"current_steps": 2305, "total_steps": 4466, "loss": 0.2472, "lr": 2.2378497186161146e-05, "epoch": 3.6133333333333333, "percentage": 51.61, "elapsed_time": "9:48:36", "remaining_time": "9:11:50"} +{"current_steps": 2310, "total_steps": 4466, "loss": 0.2509, "lr": 2.230086544304737e-05, "epoch": 3.621176470588235, "percentage": 51.72, "elapsed_time": "9:49:53", "remaining_time": "9:10:33"} +{"current_steps": 2315, "total_steps": 4466, "loss": 0.2427, "lr": 2.222319855243597e-05, "epoch": 3.629019607843137, "percentage": 51.84, "elapsed_time": "9:51:09", "remaining_time": "9:09:16"} +{"current_steps": 2320, "total_steps": 4466, "loss": 0.256, "lr": 2.2145497700748723e-05, "epoch": 3.636862745098039, "percentage": 51.95, "elapsed_time": "9:52:23", "remaining_time": "9:07:57"} +{"current_steps": 2325, "total_steps": 4466, "loss": 0.2468, "lr": 2.2067764074926163e-05, "epoch": 3.644705882352941, "percentage": 52.06, "elapsed_time": "9:53:42", "remaining_time": "9:06:43"} +{"current_steps": 2330, "total_steps": 4466, "loss": 0.2423, "lr": 2.198999886240951e-05, "epoch": 3.652549019607843, "percentage": 52.17, "elapsed_time": "9:54:57", "remaining_time": "9:05:25"} +{"current_steps": 2335, "total_steps": 4466, "loss": 0.243, "lr": 2.1912203251122475e-05, "epoch": 3.660392156862745, "percentage": 52.28, "elapsed_time": "9:56:18", "remaining_time": "9:04:12"} +{"current_steps": 2340, "total_steps": 4466, "loss": 0.2393, "lr": 2.1834378429453133e-05, "epoch": 3.668235294117647, "percentage": 52.4, "elapsed_time": "9:57:35", "remaining_time": "9:02:56"} +{"current_steps": 2345, "total_steps": 4466, "loss": 0.2447, "lr": 2.175652558623577e-05, "epoch": 3.6760784313725487, "percentage": 52.51, "elapsed_time": "9:58:52", "remaining_time": "9:01:40"} +{"current_steps": 2350, "total_steps": 4466, "loss": 0.2492, "lr": 2.1678645910732734e-05, "epoch": 3.683921568627451, "percentage": 52.62, "elapsed_time": "10:00:11", "remaining_time": "9:00:25"} +{"current_steps": 2355, "total_steps": 4466, "loss": 0.252, "lr": 2.1600740592616245e-05, "epoch": 3.691764705882353, "percentage": 52.73, "elapsed_time": "10:01:27", "remaining_time": "8:59:08"} +{"current_steps": 2360, "total_steps": 4466, "loss": 0.2372, "lr": 2.152281082195024e-05, "epoch": 3.699607843137255, "percentage": 52.84, "elapsed_time": "10:02:41", "remaining_time": "8:57:49"} +{"current_steps": 2365, "total_steps": 4466, "loss": 0.2421, "lr": 2.1444857789172185e-05, "epoch": 3.707450980392157, "percentage": 52.96, "elapsed_time": "10:03:58", "remaining_time": "8:56:33"} +{"current_steps": 2370, "total_steps": 4466, "loss": 0.2538, "lr": 2.1366882685074892e-05, "epoch": 3.715294117647059, "percentage": 53.07, "elapsed_time": "10:05:16", "remaining_time": "8:55:17"} +{"current_steps": 2375, "total_steps": 4466, "loss": 0.2389, "lr": 2.1288886700788335e-05, "epoch": 3.723137254901961, "percentage": 53.18, "elapsed_time": "10:06:34", "remaining_time": "8:54:02"} +{"current_steps": 2380, "total_steps": 4466, "loss": 0.2618, "lr": 2.1210871027761438e-05, "epoch": 3.7309803921568627, "percentage": 53.29, "elapsed_time": "10:07:53", "remaining_time": "8:52:48"} +{"current_steps": 2385, "total_steps": 4466, "loss": 0.2359, "lr": 2.1132836857743903e-05, "epoch": 3.7388235294117647, "percentage": 53.4, "elapsed_time": "10:09:07", "remaining_time": "8:51:29"} +{"current_steps": 2390, "total_steps": 4466, "loss": 0.2378, "lr": 2.105478538276797e-05, "epoch": 3.7466666666666666, "percentage": 53.52, "elapsed_time": "10:10:23", "remaining_time": "8:50:11"} +{"current_steps": 2395, "total_steps": 4466, "loss": 0.2362, "lr": 2.0976717795130233e-05, "epoch": 3.7545098039215685, "percentage": 53.63, "elapsed_time": "10:11:37", "remaining_time": "8:48:52"} +{"current_steps": 2400, "total_steps": 4466, "loss": 0.2544, "lr": 2.0898635287373423e-05, "epoch": 3.7623529411764705, "percentage": 53.74, "elapsed_time": "10:12:55", "remaining_time": "8:47:37"} +{"current_steps": 2405, "total_steps": 4466, "loss": 0.2373, "lr": 2.0820539052268186e-05, "epoch": 3.7701960784313724, "percentage": 53.85, "elapsed_time": "10:14:08", "remaining_time": "8:46:17"} +{"current_steps": 2410, "total_steps": 4466, "loss": 0.2308, "lr": 2.0742430282794857e-05, "epoch": 3.7780392156862748, "percentage": 53.96, "elapsed_time": "10:15:23", "remaining_time": "8:44:59"} +{"current_steps": 2415, "total_steps": 4466, "loss": 0.2518, "lr": 2.0664310172125242e-05, "epoch": 3.7858823529411767, "percentage": 54.08, "elapsed_time": "10:16:40", "remaining_time": "8:43:43"} +{"current_steps": 2420, "total_steps": 4466, "loss": 0.2391, "lr": 2.0586179913604413e-05, "epoch": 3.7937254901960786, "percentage": 54.19, "elapsed_time": "10:17:48", "remaining_time": "8:42:19"} +{"current_steps": 2425, "total_steps": 4466, "loss": 0.247, "lr": 2.0508040700732438e-05, "epoch": 3.8015686274509806, "percentage": 54.3, "elapsed_time": "10:19:06", "remaining_time": "8:41:04"} +{"current_steps": 2430, "total_steps": 4466, "loss": 0.2416, "lr": 2.0429893727146167e-05, "epoch": 3.8094117647058825, "percentage": 54.41, "elapsed_time": "10:20:24", "remaining_time": "8:39:49"} +{"current_steps": 2435, "total_steps": 4466, "loss": 0.2564, "lr": 2.0351740186601012e-05, "epoch": 3.8172549019607844, "percentage": 54.52, "elapsed_time": "10:21:40", "remaining_time": "8:38:31"} +{"current_steps": 2440, "total_steps": 4466, "loss": 0.2528, "lr": 2.0273581272952708e-05, "epoch": 3.8250980392156864, "percentage": 54.64, "elapsed_time": "10:22:53", "remaining_time": "8:37:11"} +{"current_steps": 2445, "total_steps": 4466, "loss": 0.2385, "lr": 2.0195418180139055e-05, "epoch": 3.8329411764705883, "percentage": 54.75, "elapsed_time": "10:24:05", "remaining_time": "8:35:51"} +{"current_steps": 2450, "total_steps": 4466, "loss": 0.2499, "lr": 2.0117252102161687e-05, "epoch": 3.8407843137254902, "percentage": 54.86, "elapsed_time": "10:25:20", "remaining_time": "8:34:34"} +{"current_steps": 2455, "total_steps": 4466, "loss": 0.2417, "lr": 2.0039084233067853e-05, "epoch": 3.848627450980392, "percentage": 54.97, "elapsed_time": "10:26:35", "remaining_time": "8:33:15"} +{"current_steps": 2460, "total_steps": 4466, "loss": 0.2549, "lr": 1.9960915766932153e-05, "epoch": 3.856470588235294, "percentage": 55.08, "elapsed_time": "10:27:53", "remaining_time": "8:32:00"} +{"current_steps": 2465, "total_steps": 4466, "loss": 0.239, "lr": 1.988274789783832e-05, "epoch": 3.864313725490196, "percentage": 55.19, "elapsed_time": "10:29:04", "remaining_time": "8:30:39"} +{"current_steps": 2470, "total_steps": 4466, "loss": 0.2343, "lr": 1.9804581819860952e-05, "epoch": 3.872156862745098, "percentage": 55.31, "elapsed_time": "10:30:20", "remaining_time": "8:29:22"} +{"current_steps": 2475, "total_steps": 4466, "loss": 0.26, "lr": 1.9726418727047295e-05, "epoch": 3.88, "percentage": 55.42, "elapsed_time": "10:31:36", "remaining_time": "8:28:05"} +{"current_steps": 2480, "total_steps": 4466, "loss": 0.2448, "lr": 1.9648259813398987e-05, "epoch": 3.887843137254902, "percentage": 55.53, "elapsed_time": "10:32:56", "remaining_time": "8:26:52"} +{"current_steps": 2485, "total_steps": 4466, "loss": 0.2365, "lr": 1.957010627285384e-05, "epoch": 3.8956862745098038, "percentage": 55.64, "elapsed_time": "10:34:08", "remaining_time": "8:25:31"} +{"current_steps": 2490, "total_steps": 4466, "loss": 0.2309, "lr": 1.9491959299267572e-05, "epoch": 3.9035294117647057, "percentage": 55.75, "elapsed_time": "10:35:23", "remaining_time": "8:24:13"} +{"current_steps": 2495, "total_steps": 4466, "loss": 0.2422, "lr": 1.941382008639559e-05, "epoch": 3.9113725490196076, "percentage": 55.87, "elapsed_time": "10:36:41", "remaining_time": "8:22:58"} +{"current_steps": 2500, "total_steps": 4466, "loss": 0.248, "lr": 1.933568982787476e-05, "epoch": 3.9192156862745096, "percentage": 55.98, "elapsed_time": "10:37:59", "remaining_time": "8:21:42"} +{"current_steps": 2505, "total_steps": 4466, "loss": 0.2445, "lr": 1.9257569717205153e-05, "epoch": 3.9270588235294115, "percentage": 56.09, "elapsed_time": "10:39:19", "remaining_time": "8:20:29"} +{"current_steps": 2510, "total_steps": 4466, "loss": 0.2365, "lr": 1.9179460947731824e-05, "epoch": 3.934901960784314, "percentage": 56.2, "elapsed_time": "10:40:35", "remaining_time": "8:19:12"} +{"current_steps": 2515, "total_steps": 4466, "loss": 0.2354, "lr": 1.9101364712626577e-05, "epoch": 3.942745098039216, "percentage": 56.31, "elapsed_time": "10:41:47", "remaining_time": "8:17:52"} +{"current_steps": 2520, "total_steps": 4466, "loss": 0.2474, "lr": 1.9023282204869767e-05, "epoch": 3.9505882352941177, "percentage": 56.43, "elapsed_time": "10:43:04", "remaining_time": "8:16:36"} +{"current_steps": 2525, "total_steps": 4466, "loss": 0.2516, "lr": 1.8945214617232036e-05, "epoch": 3.9584313725490197, "percentage": 56.54, "elapsed_time": "10:44:22", "remaining_time": "8:15:20"} +{"current_steps": 2530, "total_steps": 4466, "loss": 0.2496, "lr": 1.88671631422561e-05, "epoch": 3.9662745098039216, "percentage": 56.65, "elapsed_time": "10:45:41", "remaining_time": "8:14:05"} +{"current_steps": 2535, "total_steps": 4466, "loss": 0.2444, "lr": 1.8789128972238565e-05, "epoch": 3.9741176470588235, "percentage": 56.76, "elapsed_time": "10:46:58", "remaining_time": "8:12:49"} +{"current_steps": 2540, "total_steps": 4466, "loss": 0.2472, "lr": 1.8711113299211675e-05, "epoch": 3.9819607843137255, "percentage": 56.87, "elapsed_time": "10:48:13", "remaining_time": "8:11:31"} +{"current_steps": 2545, "total_steps": 4466, "loss": 0.2436, "lr": 1.8633117314925118e-05, "epoch": 3.9898039215686274, "percentage": 56.99, "elapsed_time": "10:49:27", "remaining_time": "8:10:13"} +{"current_steps": 2550, "total_steps": 4466, "loss": 0.2375, "lr": 1.855514221082782e-05, "epoch": 3.9976470588235293, "percentage": 57.1, "elapsed_time": "10:50:43", "remaining_time": "8:08:56"} +{"current_steps": 2555, "total_steps": 4466, "loss": 0.2473, "lr": 1.8477189178049764e-05, "epoch": 4.004705882352941, "percentage": 57.21, "elapsed_time": "10:51:52", "remaining_time": "8:07:34"} +{"current_steps": 2560, "total_steps": 4466, "loss": 0.237, "lr": 1.839925940738376e-05, "epoch": 4.012549019607843, "percentage": 57.32, "elapsed_time": "10:53:10", "remaining_time": "8:06:18"} +{"current_steps": 2565, "total_steps": 4466, "loss": 0.236, "lr": 1.8321354089267272e-05, "epoch": 4.020392156862745, "percentage": 57.43, "elapsed_time": "10:54:31", "remaining_time": "8:05:04"} +{"current_steps": 2570, "total_steps": 4466, "loss": 0.2386, "lr": 1.8243474413764236e-05, "epoch": 4.028235294117647, "percentage": 57.55, "elapsed_time": "10:55:49", "remaining_time": "8:03:50"} +{"current_steps": 2575, "total_steps": 4466, "loss": 0.2272, "lr": 1.8165621570546874e-05, "epoch": 4.036078431372549, "percentage": 57.66, "elapsed_time": "10:57:07", "remaining_time": "8:02:34"} +{"current_steps": 2580, "total_steps": 4466, "loss": 0.2429, "lr": 1.808779674887753e-05, "epoch": 4.043921568627451, "percentage": 57.77, "elapsed_time": "10:58:28", "remaining_time": "8:01:21"} +{"current_steps": 2585, "total_steps": 4466, "loss": 0.2481, "lr": 1.801000113759049e-05, "epoch": 4.051764705882353, "percentage": 57.88, "elapsed_time": "10:59:45", "remaining_time": "8:00:04"} +{"current_steps": 2590, "total_steps": 4466, "loss": 0.2298, "lr": 1.7932235925073836e-05, "epoch": 4.059607843137255, "percentage": 57.99, "elapsed_time": "11:01:02", "remaining_time": "7:58:48"} +{"current_steps": 2595, "total_steps": 4466, "loss": 0.2241, "lr": 1.7854502299251284e-05, "epoch": 4.067450980392157, "percentage": 58.11, "elapsed_time": "11:02:11", "remaining_time": "7:57:26"} +{"current_steps": 2600, "total_steps": 4466, "loss": 0.2394, "lr": 1.7776801447564032e-05, "epoch": 4.075294117647059, "percentage": 58.22, "elapsed_time": "11:03:26", "remaining_time": "7:56:08"} +{"current_steps": 2605, "total_steps": 4466, "loss": 0.2286, "lr": 1.7699134556952634e-05, "epoch": 4.083137254901961, "percentage": 58.33, "elapsed_time": "11:04:39", "remaining_time": "7:54:49"} +{"current_steps": 2610, "total_steps": 4466, "loss": 0.2334, "lr": 1.7621502813838864e-05, "epoch": 4.090980392156863, "percentage": 58.44, "elapsed_time": "11:05:55", "remaining_time": "7:53:32"} +{"current_steps": 2615, "total_steps": 4466, "loss": 0.2361, "lr": 1.754390740410758e-05, "epoch": 4.0988235294117645, "percentage": 58.55, "elapsed_time": "11:07:08", "remaining_time": "7:52:13"} +{"current_steps": 2620, "total_steps": 4466, "loss": 0.2419, "lr": 1.7466349513088636e-05, "epoch": 4.1066666666666665, "percentage": 58.67, "elapsed_time": "11:08:22", "remaining_time": "7:50:55"} +{"current_steps": 2625, "total_steps": 4466, "loss": 0.2263, "lr": 1.738883032553873e-05, "epoch": 4.114509803921568, "percentage": 58.78, "elapsed_time": "11:09:40", "remaining_time": "7:49:40"} +{"current_steps": 2630, "total_steps": 4466, "loss": 0.2296, "lr": 1.7311351025623385e-05, "epoch": 4.12235294117647, "percentage": 58.89, "elapsed_time": "11:10:55", "remaining_time": "7:48:22"} +{"current_steps": 2635, "total_steps": 4466, "loss": 0.2435, "lr": 1.723391279689876e-05, "epoch": 4.130196078431372, "percentage": 59.0, "elapsed_time": "11:12:10", "remaining_time": "7:47:04"} +{"current_steps": 2640, "total_steps": 4466, "loss": 0.223, "lr": 1.7156516822293644e-05, "epoch": 4.138039215686274, "percentage": 59.11, "elapsed_time": "11:13:18", "remaining_time": "7:45:42"} +{"current_steps": 2645, "total_steps": 4466, "loss": 0.2274, "lr": 1.7079164284091353e-05, "epoch": 4.145882352941176, "percentage": 59.23, "elapsed_time": "11:14:35", "remaining_time": "7:44:26"} +{"current_steps": 2650, "total_steps": 4466, "loss": 0.2312, "lr": 1.7001856363911687e-05, "epoch": 4.153725490196078, "percentage": 59.34, "elapsed_time": "11:15:53", "remaining_time": "7:43:10"} +{"current_steps": 2655, "total_steps": 4466, "loss": 0.2326, "lr": 1.692459424269286e-05, "epoch": 4.16156862745098, "percentage": 59.45, "elapsed_time": "11:16:59", "remaining_time": "7:41:47"} +{"current_steps": 2660, "total_steps": 4466, "loss": 0.2337, "lr": 1.6847379100673474e-05, "epoch": 4.169411764705882, "percentage": 59.56, "elapsed_time": "11:18:12", "remaining_time": "7:40:28"} +{"current_steps": 2665, "total_steps": 4466, "loss": 0.229, "lr": 1.6770212117374504e-05, "epoch": 4.177254901960785, "percentage": 59.67, "elapsed_time": "11:19:30", "remaining_time": "7:39:12"} +{"current_steps": 2670, "total_steps": 4466, "loss": 0.2205, "lr": 1.6693094471581244e-05, "epoch": 4.185098039215687, "percentage": 59.79, "elapsed_time": "11:20:44", "remaining_time": "7:37:54"} +{"current_steps": 2675, "total_steps": 4466, "loss": 0.2293, "lr": 1.6616027341325328e-05, "epoch": 4.192941176470589, "percentage": 59.9, "elapsed_time": "11:21:55", "remaining_time": "7:36:34"} +{"current_steps": 2680, "total_steps": 4466, "loss": 0.2288, "lr": 1.653901190386672e-05, "epoch": 4.2007843137254905, "percentage": 60.01, "elapsed_time": "11:23:07", "remaining_time": "7:35:15"} +{"current_steps": 2685, "total_steps": 4466, "loss": 0.2377, "lr": 1.646204933567574e-05, "epoch": 4.2086274509803925, "percentage": 60.12, "elapsed_time": "11:24:22", "remaining_time": "7:33:57"} +{"current_steps": 2690, "total_steps": 4466, "loss": 0.2358, "lr": 1.638514081241509e-05, "epoch": 4.216470588235294, "percentage": 60.23, "elapsed_time": "11:25:39", "remaining_time": "7:32:41"} +{"current_steps": 2695, "total_steps": 4466, "loss": 0.2452, "lr": 1.6308287508921893e-05, "epoch": 4.224313725490196, "percentage": 60.34, "elapsed_time": "11:26:56", "remaining_time": "7:31:24"} +{"current_steps": 2700, "total_steps": 4466, "loss": 0.2295, "lr": 1.6231490599189753e-05, "epoch": 4.232156862745098, "percentage": 60.46, "elapsed_time": "11:28:13", "remaining_time": "7:30:08"} +{"current_steps": 2705, "total_steps": 4466, "loss": 0.2274, "lr": 1.615475125635081e-05, "epoch": 4.24, "percentage": 60.57, "elapsed_time": "11:29:29", "remaining_time": "7:28:52"} +{"current_steps": 2710, "total_steps": 4466, "loss": 0.2334, "lr": 1.607807065265782e-05, "epoch": 4.247843137254902, "percentage": 60.68, "elapsed_time": "11:30:44", "remaining_time": "7:27:34"} +{"current_steps": 2715, "total_steps": 4466, "loss": 0.2368, "lr": 1.600144995946626e-05, "epoch": 4.255686274509804, "percentage": 60.79, "elapsed_time": "11:32:00", "remaining_time": "7:26:17"} +{"current_steps": 2720, "total_steps": 4466, "loss": 0.2317, "lr": 1.5924890347216433e-05, "epoch": 4.263529411764706, "percentage": 60.9, "elapsed_time": "11:33:14", "remaining_time": "7:24:59"} +{"current_steps": 2725, "total_steps": 4466, "loss": 0.2358, "lr": 1.5848392985415573e-05, "epoch": 4.271372549019608, "percentage": 61.02, "elapsed_time": "11:34:34", "remaining_time": "7:23:45"} +{"current_steps": 2730, "total_steps": 4466, "loss": 0.2304, "lr": 1.5771959042619983e-05, "epoch": 4.27921568627451, "percentage": 61.13, "elapsed_time": "11:35:52", "remaining_time": "7:22:30"} +{"current_steps": 2735, "total_steps": 4466, "loss": 0.2313, "lr": 1.5695589686417224e-05, "epoch": 4.287058823529412, "percentage": 61.24, "elapsed_time": "11:37:12", "remaining_time": "7:21:16"} +{"current_steps": 2740, "total_steps": 4466, "loss": 0.2407, "lr": 1.561928608340822e-05, "epoch": 4.294901960784314, "percentage": 61.35, "elapsed_time": "11:38:25", "remaining_time": "7:19:57"} +{"current_steps": 2745, "total_steps": 4466, "loss": 0.2363, "lr": 1.554304939918946e-05, "epoch": 4.302745098039216, "percentage": 61.46, "elapsed_time": "11:39:40", "remaining_time": "7:18:39"} +{"current_steps": 2750, "total_steps": 4466, "loss": 0.2279, "lr": 1.5466880798335222e-05, "epoch": 4.310588235294118, "percentage": 61.58, "elapsed_time": "11:40:59", "remaining_time": "7:17:24"} +{"current_steps": 2755, "total_steps": 4466, "loss": 0.2358, "lr": 1.539078144437973e-05, "epoch": 4.3184313725490195, "percentage": 61.69, "elapsed_time": "11:42:12", "remaining_time": "7:16:06"} +{"current_steps": 2760, "total_steps": 4466, "loss": 0.2328, "lr": 1.5314752499799427e-05, "epoch": 4.3262745098039215, "percentage": 61.8, "elapsed_time": "11:43:28", "remaining_time": "7:14:49"} +{"current_steps": 2765, "total_steps": 4466, "loss": 0.2405, "lr": 1.5238795125995189e-05, "epoch": 4.334117647058823, "percentage": 61.91, "elapsed_time": "11:44:38", "remaining_time": "7:13:29"} +{"current_steps": 2770, "total_steps": 4466, "loss": 0.2287, "lr": 1.5162910483274593e-05, "epoch": 4.341960784313725, "percentage": 62.02, "elapsed_time": "11:45:46", "remaining_time": "7:12:07"} +{"current_steps": 2775, "total_steps": 4466, "loss": 0.2493, "lr": 1.5087099730834207e-05, "epoch": 4.349803921568627, "percentage": 62.14, "elapsed_time": "11:47:02", "remaining_time": "7:10:50"} +{"current_steps": 2780, "total_steps": 4466, "loss": 0.2426, "lr": 1.5011364026741855e-05, "epoch": 4.357647058823529, "percentage": 62.25, "elapsed_time": "11:48:20", "remaining_time": "7:09:35"} +{"current_steps": 2785, "total_steps": 4466, "loss": 0.2469, "lr": 1.4935704527918937e-05, "epoch": 4.365490196078431, "percentage": 62.36, "elapsed_time": "11:49:38", "remaining_time": "7:08:20"} +{"current_steps": 2790, "total_steps": 4466, "loss": 0.228, "lr": 1.4860122390122764e-05, "epoch": 4.373333333333333, "percentage": 62.47, "elapsed_time": "11:50:48", "remaining_time": "7:06:59"} +{"current_steps": 2795, "total_steps": 4466, "loss": 0.2334, "lr": 1.4784618767928898e-05, "epoch": 4.381176470588235, "percentage": 62.58, "elapsed_time": "11:52:05", "remaining_time": "7:05:43"} +{"current_steps": 2800, "total_steps": 4466, "loss": 0.2356, "lr": 1.4709194814713507e-05, "epoch": 4.389019607843137, "percentage": 62.7, "elapsed_time": "11:53:21", "remaining_time": "7:04:26"} +{"current_steps": 2805, "total_steps": 4466, "loss": 0.2363, "lr": 1.4633851682635766e-05, "epoch": 4.396862745098039, "percentage": 62.81, "elapsed_time": "11:54:41", "remaining_time": "7:03:12"} +{"current_steps": 2810, "total_steps": 4466, "loss": 0.2378, "lr": 1.4558590522620239e-05, "epoch": 4.404705882352941, "percentage": 62.92, "elapsed_time": "11:55:59", "remaining_time": "7:01:56"} +{"current_steps": 2815, "total_steps": 4466, "loss": 0.2344, "lr": 1.4483412484339301e-05, "epoch": 4.412549019607843, "percentage": 63.03, "elapsed_time": "11:57:15", "remaining_time": "7:00:40"} +{"current_steps": 2820, "total_steps": 4466, "loss": 0.2325, "lr": 1.4408318716195581e-05, "epoch": 4.420392156862745, "percentage": 63.14, "elapsed_time": "11:58:31", "remaining_time": "6:59:23"} +{"current_steps": 2825, "total_steps": 4466, "loss": 0.2309, "lr": 1.4333310365304413e-05, "epoch": 4.428235294117647, "percentage": 63.26, "elapsed_time": "11:59:48", "remaining_time": "6:58:07"} +{"current_steps": 2830, "total_steps": 4466, "loss": 0.2373, "lr": 1.4258388577476322e-05, "epoch": 4.436078431372549, "percentage": 63.37, "elapsed_time": "12:01:04", "remaining_time": "6:56:51"} +{"current_steps": 2835, "total_steps": 4466, "loss": 0.2393, "lr": 1.4183554497199514e-05, "epoch": 4.443921568627451, "percentage": 63.48, "elapsed_time": "12:02:21", "remaining_time": "6:55:34"} +{"current_steps": 2840, "total_steps": 4466, "loss": 0.2336, "lr": 1.4108809267622381e-05, "epoch": 4.451764705882353, "percentage": 63.59, "elapsed_time": "12:03:41", "remaining_time": "6:54:20"} +{"current_steps": 2845, "total_steps": 4466, "loss": 0.2357, "lr": 1.4034154030536083e-05, "epoch": 4.459607843137255, "percentage": 63.7, "elapsed_time": "12:04:58", "remaining_time": "6:53:04"} +{"current_steps": 2850, "total_steps": 4466, "loss": 0.2435, "lr": 1.3959589926357042e-05, "epoch": 4.467450980392157, "percentage": 63.82, "elapsed_time": "12:06:15", "remaining_time": "6:51:47"} +{"current_steps": 2855, "total_steps": 4466, "loss": 0.2209, "lr": 1.3885118094109575e-05, "epoch": 4.475294117647059, "percentage": 63.93, "elapsed_time": "12:07:24", "remaining_time": "6:50:27"} +{"current_steps": 2860, "total_steps": 4466, "loss": 0.2409, "lr": 1.3810739671408467e-05, "epoch": 4.483137254901961, "percentage": 64.04, "elapsed_time": "12:08:39", "remaining_time": "6:49:10"} +{"current_steps": 2865, "total_steps": 4466, "loss": 0.2323, "lr": 1.3736455794441596e-05, "epoch": 4.490980392156863, "percentage": 64.15, "elapsed_time": "12:09:54", "remaining_time": "6:47:52"} +{"current_steps": 2870, "total_steps": 4466, "loss": 0.2285, "lr": 1.3662267597952588e-05, "epoch": 4.498823529411765, "percentage": 64.26, "elapsed_time": "12:11:09", "remaining_time": "6:46:35"} +{"current_steps": 2875, "total_steps": 4466, "loss": 0.2376, "lr": 1.3588176215223463e-05, "epoch": 4.506666666666667, "percentage": 64.38, "elapsed_time": "12:12:23", "remaining_time": "6:45:17"} +{"current_steps": 2880, "total_steps": 4466, "loss": 0.2331, "lr": 1.3514182778057365e-05, "epoch": 4.514509803921569, "percentage": 64.49, "elapsed_time": "12:13:39", "remaining_time": "6:44:01"} +{"current_steps": 2885, "total_steps": 4466, "loss": 0.2279, "lr": 1.3440288416761216e-05, "epoch": 4.522352941176471, "percentage": 64.6, "elapsed_time": "12:14:53", "remaining_time": "6:42:43"} +{"current_steps": 2890, "total_steps": 4466, "loss": 0.2332, "lr": 1.3366494260128484e-05, "epoch": 4.530196078431373, "percentage": 64.71, "elapsed_time": "12:16:11", "remaining_time": "6:41:27"} +{"current_steps": 2895, "total_steps": 4466, "loss": 0.2312, "lr": 1.3292801435421935e-05, "epoch": 4.5380392156862746, "percentage": 64.82, "elapsed_time": "12:17:32", "remaining_time": "6:40:14"} +{"current_steps": 2900, "total_steps": 4466, "loss": 0.2367, "lr": 1.3219211068356418e-05, "epoch": 4.5458823529411765, "percentage": 64.94, "elapsed_time": "12:18:45", "remaining_time": "6:38:55"} +{"current_steps": 2905, "total_steps": 4466, "loss": 0.2322, "lr": 1.3145724283081651e-05, "epoch": 4.553725490196078, "percentage": 65.05, "elapsed_time": "12:20:00", "remaining_time": "6:37:38"} +{"current_steps": 2910, "total_steps": 4466, "loss": 0.2309, "lr": 1.3072342202165069e-05, "epoch": 4.56156862745098, "percentage": 65.16, "elapsed_time": "12:21:18", "remaining_time": "6:36:23"} +{"current_steps": 2915, "total_steps": 4466, "loss": 0.2282, "lr": 1.2999065946574656e-05, "epoch": 4.569411764705882, "percentage": 65.27, "elapsed_time": "12:22:35", "remaining_time": "6:35:06"} +{"current_steps": 2920, "total_steps": 4466, "loss": 0.2446, "lr": 1.2925896635661852e-05, "epoch": 4.577254901960784, "percentage": 65.38, "elapsed_time": "12:23:55", "remaining_time": "6:33:52"} +{"current_steps": 2925, "total_steps": 4466, "loss": 0.2403, "lr": 1.2852835387144414e-05, "epoch": 4.585098039215686, "percentage": 65.49, "elapsed_time": "12:25:15", "remaining_time": "6:32:37"} +{"current_steps": 2930, "total_steps": 4466, "loss": 0.2398, "lr": 1.2779883317089374e-05, "epoch": 4.592941176470588, "percentage": 65.61, "elapsed_time": "12:26:31", "remaining_time": "6:31:21"} +{"current_steps": 2935, "total_steps": 4466, "loss": 0.2389, "lr": 1.2707041539895974e-05, "epoch": 4.60078431372549, "percentage": 65.72, "elapsed_time": "12:27:51", "remaining_time": "6:30:06"} +{"current_steps": 2940, "total_steps": 4466, "loss": 0.2253, "lr": 1.2634311168278652e-05, "epoch": 4.608627450980392, "percentage": 65.83, "elapsed_time": "12:29:03", "remaining_time": "6:28:47"} +{"current_steps": 2945, "total_steps": 4466, "loss": 0.2257, "lr": 1.2561693313250034e-05, "epoch": 4.616470588235294, "percentage": 65.94, "elapsed_time": "12:30:18", "remaining_time": "6:27:30"} +{"current_steps": 2950, "total_steps": 4466, "loss": 0.2418, "lr": 1.248918908410396e-05, "epoch": 4.624313725490196, "percentage": 66.05, "elapsed_time": "12:31:38", "remaining_time": "6:26:15"} +{"current_steps": 2955, "total_steps": 4466, "loss": 0.2209, "lr": 1.2416799588398576e-05, "epoch": 4.632156862745098, "percentage": 66.17, "elapsed_time": "12:32:51", "remaining_time": "6:24:57"} +{"current_steps": 2960, "total_steps": 4466, "loss": 0.235, "lr": 1.2344525931939359e-05, "epoch": 4.64, "percentage": 66.28, "elapsed_time": "12:34:07", "remaining_time": "6:23:41"} +{"current_steps": 2965, "total_steps": 4466, "loss": 0.2365, "lr": 1.2272369218762266e-05, "epoch": 4.647843137254902, "percentage": 66.39, "elapsed_time": "12:35:25", "remaining_time": "6:22:25"} +{"current_steps": 2970, "total_steps": 4466, "loss": 0.2249, "lr": 1.2200330551116838e-05, "epoch": 4.6556862745098035, "percentage": 66.5, "elapsed_time": "12:36:38", "remaining_time": "6:21:07"} +{"current_steps": 2975, "total_steps": 4466, "loss": 0.2407, "lr": 1.2128411029449403e-05, "epoch": 4.663529411764706, "percentage": 66.61, "elapsed_time": "12:37:59", "remaining_time": "6:19:53"} +{"current_steps": 2980, "total_steps": 4466, "loss": 0.2302, "lr": 1.205661175238622e-05, "epoch": 4.671372549019608, "percentage": 66.73, "elapsed_time": "12:39:14", "remaining_time": "6:18:36"} +{"current_steps": 2985, "total_steps": 4466, "loss": 0.2355, "lr": 1.1984933816716726e-05, "epoch": 4.67921568627451, "percentage": 66.84, "elapsed_time": "12:40:35", "remaining_time": "6:17:21"} +{"current_steps": 2990, "total_steps": 4466, "loss": 0.2378, "lr": 1.1913378317376796e-05, "epoch": 4.687058823529412, "percentage": 66.95, "elapsed_time": "12:41:47", "remaining_time": "6:16:03"} +{"current_steps": 2995, "total_steps": 4466, "loss": 0.2237, "lr": 1.1841946347431961e-05, "epoch": 4.694901960784314, "percentage": 67.06, "elapsed_time": "12:42:55", "remaining_time": "6:14:42"} +{"current_steps": 3000, "total_steps": 4466, "loss": 0.2299, "lr": 1.1770638998060764e-05, "epoch": 4.702745098039216, "percentage": 67.17, "elapsed_time": "12:44:08", "remaining_time": "6:13:24"} +{"current_steps": 3005, "total_steps": 4466, "loss": 0.2401, "lr": 1.1699457358538072e-05, "epoch": 4.710588235294118, "percentage": 67.29, "elapsed_time": "12:46:04", "remaining_time": "6:12:27"} +{"current_steps": 3010, "total_steps": 4466, "loss": 0.2314, "lr": 1.1628402516218432e-05, "epoch": 4.71843137254902, "percentage": 67.4, "elapsed_time": "12:47:19", "remaining_time": "6:11:10"} +{"current_steps": 3015, "total_steps": 4466, "loss": 0.2285, "lr": 1.1557475556519461e-05, "epoch": 4.726274509803922, "percentage": 67.51, "elapsed_time": "12:48:35", "remaining_time": "6:09:53"} +{"current_steps": 3020, "total_steps": 4466, "loss": 0.2271, "lr": 1.1486677562905281e-05, "epoch": 4.734117647058824, "percentage": 67.62, "elapsed_time": "12:49:49", "remaining_time": "6:08:35"} +{"current_steps": 3025, "total_steps": 4466, "loss": 0.235, "lr": 1.1416009616869959e-05, "epoch": 4.741960784313726, "percentage": 67.73, "elapsed_time": "12:51:09", "remaining_time": "6:07:21"} +{"current_steps": 3030, "total_steps": 4466, "loss": 0.2352, "lr": 1.134547279792098e-05, "epoch": 4.749803921568628, "percentage": 67.85, "elapsed_time": "12:52:27", "remaining_time": "6:06:05"} +{"current_steps": 3035, "total_steps": 4466, "loss": 0.2345, "lr": 1.1275068183562747e-05, "epoch": 4.75764705882353, "percentage": 67.96, "elapsed_time": "12:53:46", "remaining_time": "6:04:50"} +{"current_steps": 3040, "total_steps": 4466, "loss": 0.2436, "lr": 1.1204796849280167e-05, "epoch": 4.7654901960784315, "percentage": 68.07, "elapsed_time": "12:55:01", "remaining_time": "6:03:32"} +{"current_steps": 3045, "total_steps": 4466, "loss": 0.2396, "lr": 1.1134659868522158e-05, "epoch": 4.773333333333333, "percentage": 68.18, "elapsed_time": "12:56:19", "remaining_time": "6:02:17"} +{"current_steps": 3050, "total_steps": 4466, "loss": 0.2344, "lr": 1.106465831268531e-05, "epoch": 4.781176470588235, "percentage": 68.29, "elapsed_time": "12:57:33", "remaining_time": "6:00:59"} +{"current_steps": 3055, "total_steps": 4466, "loss": 0.2329, "lr": 1.0994793251097468e-05, "epoch": 4.789019607843137, "percentage": 68.41, "elapsed_time": "12:58:50", "remaining_time": "5:59:43"} +{"current_steps": 3060, "total_steps": 4466, "loss": 0.2316, "lr": 1.0925065751001445e-05, "epoch": 4.796862745098039, "percentage": 68.52, "elapsed_time": "13:00:09", "remaining_time": "5:58:27"} +{"current_steps": 3065, "total_steps": 4466, "loss": 0.2328, "lr": 1.0855476877538687e-05, "epoch": 4.804705882352941, "percentage": 68.63, "elapsed_time": "13:01:24", "remaining_time": "5:57:10"} +{"current_steps": 3070, "total_steps": 4466, "loss": 0.2281, "lr": 1.0786027693733015e-05, "epoch": 4.812549019607843, "percentage": 68.74, "elapsed_time": "13:02:39", "remaining_time": "5:55:53"} +{"current_steps": 3075, "total_steps": 4466, "loss": 0.2284, "lr": 1.0716719260474365e-05, "epoch": 4.820392156862745, "percentage": 68.85, "elapsed_time": "13:03:55", "remaining_time": "5:54:36"} +{"current_steps": 3080, "total_steps": 4466, "loss": 0.2468, "lr": 1.0647552636502629e-05, "epoch": 4.828235294117647, "percentage": 68.97, "elapsed_time": "13:05:14", "remaining_time": "5:53:21"} +{"current_steps": 3085, "total_steps": 4466, "loss": 0.2258, "lr": 1.0578528878391419e-05, "epoch": 4.836078431372549, "percentage": 69.08, "elapsed_time": "13:06:23", "remaining_time": "5:52:01"} +{"current_steps": 3090, "total_steps": 4466, "loss": 0.2262, "lr": 1.0509649040531994e-05, "epoch": 4.843921568627451, "percentage": 69.19, "elapsed_time": "13:07:39", "remaining_time": "5:50:44"} +{"current_steps": 3095, "total_steps": 4466, "loss": 0.2413, "lr": 1.044091417511709e-05, "epoch": 4.851764705882353, "percentage": 69.3, "elapsed_time": "13:08:53", "remaining_time": "5:49:27"} +{"current_steps": 3100, "total_steps": 4466, "loss": 0.2271, "lr": 1.0372325332124896e-05, "epoch": 4.859607843137255, "percentage": 69.41, "elapsed_time": "13:10:10", "remaining_time": "5:48:11"} +{"current_steps": 3105, "total_steps": 4466, "loss": 0.2254, "lr": 1.0303883559302999e-05, "epoch": 4.867450980392157, "percentage": 69.53, "elapsed_time": "13:11:26", "remaining_time": "5:46:54"} +{"current_steps": 3110, "total_steps": 4466, "loss": 0.2363, "lr": 1.0235589902152351e-05, "epoch": 4.875294117647059, "percentage": 69.64, "elapsed_time": "13:12:40", "remaining_time": "5:45:37"} +{"current_steps": 3115, "total_steps": 4466, "loss": 0.2406, "lr": 1.0167445403911356e-05, "epoch": 4.8831372549019605, "percentage": 69.75, "elapsed_time": "13:13:55", "remaining_time": "5:44:19"} +{"current_steps": 3120, "total_steps": 4466, "loss": 0.2334, "lr": 1.0099451105539866e-05, "epoch": 4.890980392156862, "percentage": 69.86, "elapsed_time": "13:15:14", "remaining_time": "5:43:04"} +{"current_steps": 3125, "total_steps": 4466, "loss": 0.2429, "lr": 1.0031608045703347e-05, "epoch": 4.898823529411764, "percentage": 69.97, "elapsed_time": "13:16:31", "remaining_time": "5:41:48"} +{"current_steps": 3130, "total_steps": 4466, "loss": 0.2351, "lr": 9.963917260756937e-06, "epoch": 4.906666666666666, "percentage": 70.09, "elapsed_time": "13:17:48", "remaining_time": "5:40:32"} +{"current_steps": 3135, "total_steps": 4466, "loss": 0.2357, "lr": 9.89637978472972e-06, "epoch": 4.914509803921568, "percentage": 70.2, "elapsed_time": "13:19:01", "remaining_time": "5:39:14"} +{"current_steps": 3140, "total_steps": 4466, "loss": 0.2447, "lr": 9.828996649308804e-06, "epoch": 4.92235294117647, "percentage": 70.31, "elapsed_time": "13:20:20", "remaining_time": "5:37:58"} +{"current_steps": 3145, "total_steps": 4466, "loss": 0.2469, "lr": 9.76176888382367e-06, "epoch": 4.930196078431372, "percentage": 70.42, "elapsed_time": "13:21:39", "remaining_time": "5:36:43"} +{"current_steps": 3150, "total_steps": 4466, "loss": 0.232, "lr": 9.694697515230371e-06, "epoch": 4.938039215686274, "percentage": 70.53, "elapsed_time": "13:22:54", "remaining_time": "5:35:26"} +{"current_steps": 3155, "total_steps": 4466, "loss": 0.236, "lr": 9.627783568095905e-06, "epoch": 4.945882352941177, "percentage": 70.64, "elapsed_time": "13:24:14", "remaining_time": "5:34:11"} +{"current_steps": 3160, "total_steps": 4466, "loss": 0.2336, "lr": 9.561028064582507e-06, "epoch": 4.953725490196079, "percentage": 70.76, "elapsed_time": "13:25:34", "remaining_time": "5:32:56"} +{"current_steps": 3165, "total_steps": 4466, "loss": 0.2264, "lr": 9.494432024432087e-06, "epoch": 4.961568627450981, "percentage": 70.87, "elapsed_time": "13:26:49", "remaining_time": "5:31:38"} +{"current_steps": 3170, "total_steps": 4466, "loss": 0.2391, "lr": 9.42799646495062e-06, "epoch": 4.969411764705883, "percentage": 70.98, "elapsed_time": "13:28:09", "remaining_time": "5:30:24"} +{"current_steps": 3175, "total_steps": 4466, "loss": 0.2249, "lr": 9.361722400992618e-06, "epoch": 4.977254901960785, "percentage": 71.09, "elapsed_time": "13:29:26", "remaining_time": "5:29:07"} +{"current_steps": 3180, "total_steps": 4466, "loss": 0.2286, "lr": 9.295610844945613e-06, "epoch": 4.9850980392156865, "percentage": 71.2, "elapsed_time": "13:30:36", "remaining_time": "5:27:48"} +{"current_steps": 3185, "total_steps": 4466, "loss": 0.2291, "lr": 9.229662806714721e-06, "epoch": 4.992941176470588, "percentage": 71.32, "elapsed_time": "13:31:51", "remaining_time": "5:26:31"} +{"current_steps": 3190, "total_steps": 4466, "loss": 0.2424, "lr": 9.163879293707172e-06, "epoch": 5.0, "percentage": 71.43, "elapsed_time": "13:33:03", "remaining_time": "5:25:13"} +{"current_steps": 3195, "total_steps": 4466, "loss": 0.2235, "lr": 9.09826131081698e-06, "epoch": 5.007843137254902, "percentage": 71.54, "elapsed_time": "13:34:23", "remaining_time": "5:23:58"} +{"current_steps": 3200, "total_steps": 4466, "loss": 0.2257, "lr": 9.03280986040952e-06, "epoch": 5.015686274509804, "percentage": 71.65, "elapsed_time": "13:35:40", "remaining_time": "5:22:42"} +{"current_steps": 3205, "total_steps": 4466, "loss": 0.2333, "lr": 8.967525942306285e-06, "epoch": 5.023529411764706, "percentage": 71.76, "elapsed_time": "13:36:56", "remaining_time": "5:21:25"} +{"current_steps": 3210, "total_steps": 4466, "loss": 0.2202, "lr": 8.902410553769575e-06, "epoch": 5.031372549019608, "percentage": 71.88, "elapsed_time": "13:38:15", "remaining_time": "5:20:09"} +{"current_steps": 3215, "total_steps": 4466, "loss": 0.2238, "lr": 8.837464689487261e-06, "epoch": 5.03921568627451, "percentage": 71.99, "elapsed_time": "13:39:26", "remaining_time": "5:18:51"} +{"current_steps": 3220, "total_steps": 4466, "loss": 0.2199, "lr": 8.772689341557611e-06, "epoch": 5.047058823529412, "percentage": 72.1, "elapsed_time": "13:40:41", "remaining_time": "5:17:34"} +{"current_steps": 3225, "total_steps": 4466, "loss": 0.2298, "lr": 8.708085499474112e-06, "epoch": 5.0549019607843135, "percentage": 72.21, "elapsed_time": "13:42:01", "remaining_time": "5:16:19"} +{"current_steps": 3230, "total_steps": 4466, "loss": 0.2297, "lr": 8.643654150110387e-06, "epoch": 5.0627450980392155, "percentage": 72.32, "elapsed_time": "13:43:15", "remaining_time": "5:15:01"} +{"current_steps": 3235, "total_steps": 4466, "loss": 0.2333, "lr": 8.579396277705071e-06, "epoch": 5.070588235294117, "percentage": 72.44, "elapsed_time": "13:44:28", "remaining_time": "5:13:43"} +{"current_steps": 3240, "total_steps": 4466, "loss": 0.2218, "lr": 8.51531286384683e-06, "epoch": 5.078431372549019, "percentage": 72.55, "elapsed_time": "13:45:42", "remaining_time": "5:12:26"} +{"current_steps": 3245, "total_steps": 4466, "loss": 0.2206, "lr": 8.451404887459325e-06, "epoch": 5.086274509803921, "percentage": 72.66, "elapsed_time": "13:46:57", "remaining_time": "5:11:09"} +{"current_steps": 3250, "total_steps": 4466, "loss": 0.2203, "lr": 8.387673324786292e-06, "epoch": 5.094117647058823, "percentage": 72.77, "elapsed_time": "13:48:15", "remaining_time": "5:09:53"} +{"current_steps": 3255, "total_steps": 4466, "loss": 0.2236, "lr": 8.324119149376584e-06, "epoch": 5.101960784313725, "percentage": 72.88, "elapsed_time": "13:49:30", "remaining_time": "5:08:36"} +{"current_steps": 3260, "total_steps": 4466, "loss": 0.2258, "lr": 8.260743332069355e-06, "epoch": 5.109803921568627, "percentage": 73.0, "elapsed_time": "13:50:46", "remaining_time": "5:07:20"} +{"current_steps": 3265, "total_steps": 4466, "loss": 0.225, "lr": 8.197546840979172e-06, "epoch": 5.117647058823529, "percentage": 73.11, "elapsed_time": "13:52:02", "remaining_time": "5:06:03"} +{"current_steps": 3270, "total_steps": 4466, "loss": 0.2261, "lr": 8.134530641481289e-06, "epoch": 5.125490196078431, "percentage": 73.22, "elapsed_time": "13:53:13", "remaining_time": "5:04:45"} +{"current_steps": 3275, "total_steps": 4466, "loss": 0.2333, "lr": 8.071695696196824e-06, "epoch": 5.133333333333334, "percentage": 73.33, "elapsed_time": "13:54:32", "remaining_time": "5:03:29"} +{"current_steps": 3280, "total_steps": 4466, "loss": 0.2178, "lr": 8.00904296497815e-06, "epoch": 5.141176470588236, "percentage": 73.44, "elapsed_time": "13:55:49", "remaining_time": "5:02:13"} +{"current_steps": 3285, "total_steps": 4466, "loss": 0.2238, "lr": 7.946573404894133e-06, "epoch": 5.149019607843138, "percentage": 73.56, "elapsed_time": "13:56:58", "remaining_time": "5:00:54"} +{"current_steps": 3290, "total_steps": 4466, "loss": 0.2398, "lr": 7.88428797021559e-06, "epoch": 5.1568627450980395, "percentage": 73.67, "elapsed_time": "13:58:15", "remaining_time": "4:59:38"} +{"current_steps": 3295, "total_steps": 4466, "loss": 0.2341, "lr": 7.82218761240065e-06, "epoch": 5.1647058823529415, "percentage": 73.78, "elapsed_time": "13:59:34", "remaining_time": "4:58:22"} +{"current_steps": 3300, "total_steps": 4466, "loss": 0.2275, "lr": 7.760273280080282e-06, "epoch": 5.172549019607843, "percentage": 73.89, "elapsed_time": "14:00:50", "remaining_time": "4:57:05"} +{"current_steps": 3305, "total_steps": 4466, "loss": 0.2368, "lr": 7.69854591904374e-06, "epoch": 5.180392156862745, "percentage": 74.0, "elapsed_time": "14:02:02", "remaining_time": "4:55:47"} +{"current_steps": 3310, "total_steps": 4466, "loss": 0.2228, "lr": 7.637006472224173e-06, "epoch": 5.188235294117647, "percentage": 74.12, "elapsed_time": "14:03:20", "remaining_time": "4:54:31"} +{"current_steps": 3315, "total_steps": 4466, "loss": 0.2219, "lr": 7.575655879684192e-06, "epoch": 5.196078431372549, "percentage": 74.23, "elapsed_time": "14:04:24", "remaining_time": "4:53:11"} +{"current_steps": 3320, "total_steps": 4466, "loss": 0.2197, "lr": 7.514495078601492e-06, "epoch": 5.203921568627451, "percentage": 74.34, "elapsed_time": "14:05:39", "remaining_time": "4:51:54"} +{"current_steps": 3325, "total_steps": 4466, "loss": 0.2265, "lr": 7.453525003254585e-06, "epoch": 5.211764705882353, "percentage": 74.45, "elapsed_time": "14:06:53", "remaining_time": "4:50:36"} +{"current_steps": 3330, "total_steps": 4466, "loss": 0.2251, "lr": 7.39274658500847e-06, "epoch": 5.219607843137255, "percentage": 74.56, "elapsed_time": "14:08:12", "remaining_time": "4:49:21"} +{"current_steps": 3335, "total_steps": 4466, "loss": 0.2207, "lr": 7.33216075230047e-06, "epoch": 5.227450980392157, "percentage": 74.68, "elapsed_time": "14:09:21", "remaining_time": "4:48:02"} +{"current_steps": 3340, "total_steps": 4466, "loss": 0.2272, "lr": 7.271768430625983e-06, "epoch": 5.235294117647059, "percentage": 74.79, "elapsed_time": "14:10:40", "remaining_time": "4:46:47"} +{"current_steps": 3345, "total_steps": 4466, "loss": 0.2238, "lr": 7.2115705425243996e-06, "epoch": 5.243137254901961, "percentage": 74.9, "elapsed_time": "14:11:58", "remaining_time": "4:45:31"} +{"current_steps": 3350, "total_steps": 4466, "loss": 0.218, "lr": 7.151568007564962e-06, "epoch": 5.250980392156863, "percentage": 75.01, "elapsed_time": "14:13:14", "remaining_time": "4:44:14"} +{"current_steps": 3355, "total_steps": 4466, "loss": 0.2223, "lr": 7.091761742332786e-06, "epoch": 5.258823529411765, "percentage": 75.12, "elapsed_time": "14:14:35", "remaining_time": "4:42:59"} +{"current_steps": 3360, "total_steps": 4466, "loss": 0.2285, "lr": 7.032152660414764e-06, "epoch": 5.266666666666667, "percentage": 75.24, "elapsed_time": "14:15:52", "remaining_time": "4:41:43"} +{"current_steps": 3365, "total_steps": 4466, "loss": 0.2339, "lr": 6.972741672385699e-06, "epoch": 5.2745098039215685, "percentage": 75.35, "elapsed_time": "14:17:02", "remaining_time": "4:40:24"} +{"current_steps": 3370, "total_steps": 4466, "loss": 0.2234, "lr": 6.913529685794333e-06, "epoch": 5.2823529411764705, "percentage": 75.46, "elapsed_time": "14:18:15", "remaining_time": "4:39:07"} +{"current_steps": 3375, "total_steps": 4466, "loss": 0.2147, "lr": 6.854517605149526e-06, "epoch": 5.290196078431372, "percentage": 75.57, "elapsed_time": "14:19:35", "remaining_time": "4:37:52"} +{"current_steps": 3380, "total_steps": 4466, "loss": 0.2321, "lr": 6.795706331906402e-06, "epoch": 5.298039215686274, "percentage": 75.68, "elapsed_time": "14:20:51", "remaining_time": "4:36:35"} +{"current_steps": 3385, "total_steps": 4466, "loss": 0.2349, "lr": 6.737096764452609e-06, "epoch": 5.305882352941176, "percentage": 75.79, "elapsed_time": "14:22:11", "remaining_time": "4:35:20"} +{"current_steps": 3390, "total_steps": 4466, "loss": 0.2248, "lr": 6.678689798094582e-06, "epoch": 5.313725490196078, "percentage": 75.91, "elapsed_time": "14:23:25", "remaining_time": "4:34:03"} +{"current_steps": 3395, "total_steps": 4466, "loss": 0.2248, "lr": 6.620486325043871e-06, "epoch": 5.32156862745098, "percentage": 76.02, "elapsed_time": "14:24:43", "remaining_time": "4:32:47"} +{"current_steps": 3400, "total_steps": 4466, "loss": 0.228, "lr": 6.562487234403492e-06, "epoch": 5.329411764705882, "percentage": 76.13, "elapsed_time": "14:26:00", "remaining_time": "4:31:31"} +{"current_steps": 3405, "total_steps": 4466, "loss": 0.2233, "lr": 6.504693412154384e-06, "epoch": 5.337254901960784, "percentage": 76.24, "elapsed_time": "14:27:16", "remaining_time": "4:30:14"} +{"current_steps": 3410, "total_steps": 4466, "loss": 0.2364, "lr": 6.447105741141828e-06, "epoch": 5.345098039215686, "percentage": 76.35, "elapsed_time": "14:28:35", "remaining_time": "4:28:58"} +{"current_steps": 3415, "total_steps": 4466, "loss": 0.2361, "lr": 6.389725101062017e-06, "epoch": 5.352941176470588, "percentage": 76.47, "elapsed_time": "14:29:48", "remaining_time": "4:27:41"} +{"current_steps": 3420, "total_steps": 4466, "loss": 0.2189, "lr": 6.332552368448552e-06, "epoch": 5.36078431372549, "percentage": 76.58, "elapsed_time": "14:31:03", "remaining_time": "4:26:24"} +{"current_steps": 3425, "total_steps": 4466, "loss": 0.2348, "lr": 6.275588416659111e-06, "epoch": 5.368627450980393, "percentage": 76.69, "elapsed_time": "14:32:18", "remaining_time": "4:25:07"} +{"current_steps": 3430, "total_steps": 4466, "loss": 0.2253, "lr": 6.218834115862082e-06, "epoch": 5.376470588235295, "percentage": 76.8, "elapsed_time": "14:33:35", "remaining_time": "4:23:51"} +{"current_steps": 3435, "total_steps": 4466, "loss": 0.2477, "lr": 6.162290333023255e-06, "epoch": 5.3843137254901965, "percentage": 76.91, "elapsed_time": "14:34:52", "remaining_time": "4:22:35"} +{"current_steps": 3440, "total_steps": 4466, "loss": 0.2278, "lr": 6.105957931892619e-06, "epoch": 5.392156862745098, "percentage": 77.03, "elapsed_time": "14:36:08", "remaining_time": "4:21:18"} +{"current_steps": 3445, "total_steps": 4466, "loss": 0.2301, "lr": 6.049837772991119e-06, "epoch": 5.4, "percentage": 77.14, "elapsed_time": "14:37:25", "remaining_time": "4:20:02"} +{"current_steps": 3450, "total_steps": 4466, "loss": 0.222, "lr": 5.99393071359756e-06, "epoch": 5.407843137254902, "percentage": 77.25, "elapsed_time": "14:38:44", "remaining_time": "4:18:47"} +{"current_steps": 3455, "total_steps": 4466, "loss": 0.2266, "lr": 5.93823760773546e-06, "epoch": 5.415686274509804, "percentage": 77.36, "elapsed_time": "14:40:04", "remaining_time": "4:17:31"} +{"current_steps": 3460, "total_steps": 4466, "loss": 0.2222, "lr": 5.882759306160071e-06, "epoch": 5.423529411764706, "percentage": 77.47, "elapsed_time": "14:41:18", "remaining_time": "4:16:14"} +{"current_steps": 3465, "total_steps": 4466, "loss": 0.2322, "lr": 5.827496656345299e-06, "epoch": 5.431372549019608, "percentage": 77.59, "elapsed_time": "14:42:34", "remaining_time": "4:14:58"} +{"current_steps": 3470, "total_steps": 4466, "loss": 0.2217, "lr": 5.772450502470841e-06, "epoch": 5.43921568627451, "percentage": 77.7, "elapsed_time": "14:43:46", "remaining_time": "4:13:40"} +{"current_steps": 3475, "total_steps": 4466, "loss": 0.2317, "lr": 5.71762168540922e-06, "epoch": 5.447058823529412, "percentage": 77.81, "elapsed_time": "14:45:04", "remaining_time": "4:12:24"} +{"current_steps": 3480, "total_steps": 4466, "loss": 0.2238, "lr": 5.663011042712996e-06, "epoch": 5.454901960784314, "percentage": 77.92, "elapsed_time": "14:46:17", "remaining_time": "4:11:06"} +{"current_steps": 3485, "total_steps": 4466, "loss": 0.2315, "lr": 5.608619408601925e-06, "epoch": 5.462745098039216, "percentage": 78.03, "elapsed_time": "14:47:34", "remaining_time": "4:09:50"} +{"current_steps": 3490, "total_steps": 4466, "loss": 0.228, "lr": 5.554447613950262e-06, "epoch": 5.470588235294118, "percentage": 78.15, "elapsed_time": "14:48:53", "remaining_time": "4:08:35"} +{"current_steps": 3495, "total_steps": 4466, "loss": 0.2307, "lr": 5.500496486274014e-06, "epoch": 5.47843137254902, "percentage": 78.26, "elapsed_time": "14:50:10", "remaining_time": "4:07:18"} +{"current_steps": 3500, "total_steps": 4466, "loss": 0.2346, "lr": 5.446766849718368e-06, "epoch": 5.486274509803922, "percentage": 78.37, "elapsed_time": "14:51:19", "remaining_time": "4:06:00"} +{"current_steps": 3505, "total_steps": 4466, "loss": 0.2253, "lr": 5.393259525045025e-06, "epoch": 5.4941176470588236, "percentage": 78.48, "elapsed_time": "14:52:35", "remaining_time": "4:04:43"} +{"current_steps": 3510, "total_steps": 4466, "loss": 0.2274, "lr": 5.3399753296197286e-06, "epoch": 5.5019607843137255, "percentage": 78.59, "elapsed_time": "14:53:56", "remaining_time": "4:03:28"} +{"current_steps": 3515, "total_steps": 4466, "loss": 0.2354, "lr": 5.286915077399728e-06, "epoch": 5.509803921568627, "percentage": 78.71, "elapsed_time": "14:55:08", "remaining_time": "4:02:11"} +{"current_steps": 3520, "total_steps": 4466, "loss": 0.2262, "lr": 5.2340795789213896e-06, "epoch": 5.517647058823529, "percentage": 78.82, "elapsed_time": "14:56:25", "remaining_time": "4:00:54"} +{"current_steps": 3525, "total_steps": 4466, "loss": 0.2154, "lr": 5.1814696412877665e-06, "epoch": 5.525490196078431, "percentage": 78.93, "elapsed_time": "14:57:30", "remaining_time": "3:59:35"} +{"current_steps": 3530, "total_steps": 4466, "loss": 0.2265, "lr": 5.1290860681563195e-06, "epoch": 5.533333333333333, "percentage": 79.04, "elapsed_time": "14:58:48", "remaining_time": "3:58:19"} +{"current_steps": 3535, "total_steps": 4466, "loss": 0.2262, "lr": 5.0769296597266126e-06, "epoch": 5.541176470588235, "percentage": 79.15, "elapsed_time": "15:00:03", "remaining_time": "3:57:02"} +{"current_steps": 3540, "total_steps": 4466, "loss": 0.2242, "lr": 5.0250012127280755e-06, "epoch": 5.549019607843137, "percentage": 79.27, "elapsed_time": "15:01:19", "remaining_time": "3:55:46"} +{"current_steps": 3545, "total_steps": 4466, "loss": 0.23, "lr": 4.973301520407874e-06, "epoch": 5.556862745098039, "percentage": 79.38, "elapsed_time": "15:02:30", "remaining_time": "3:54:28"} +{"current_steps": 3550, "total_steps": 4466, "loss": 0.2299, "lr": 4.921831372518751e-06, "epoch": 5.564705882352941, "percentage": 79.49, "elapsed_time": "15:03:46", "remaining_time": "3:53:12"} +{"current_steps": 3555, "total_steps": 4466, "loss": 0.2182, "lr": 4.870591555306996e-06, "epoch": 5.572549019607843, "percentage": 79.6, "elapsed_time": "15:04:56", "remaining_time": "3:51:54"} +{"current_steps": 3560, "total_steps": 4466, "loss": 0.226, "lr": 4.819582851500406e-06, "epoch": 5.580392156862745, "percentage": 79.71, "elapsed_time": "15:06:12", "remaining_time": "3:50:37"} +{"current_steps": 3565, "total_steps": 4466, "loss": 0.2199, "lr": 4.768806040296348e-06, "epoch": 5.588235294117647, "percentage": 79.83, "elapsed_time": "15:07:31", "remaining_time": "3:49:21"} +{"current_steps": 3570, "total_steps": 4466, "loss": 0.211, "lr": 4.718261897349856e-06, "epoch": 5.596078431372549, "percentage": 79.94, "elapsed_time": "15:08:43", "remaining_time": "3:48:04"} +{"current_steps": 3575, "total_steps": 4466, "loss": 0.2346, "lr": 4.667951194761773e-06, "epoch": 5.603921568627451, "percentage": 80.05, "elapsed_time": "15:09:56", "remaining_time": "3:46:47"} +{"current_steps": 3580, "total_steps": 4466, "loss": 0.2274, "lr": 4.6178747010669485e-06, "epoch": 5.6117647058823525, "percentage": 80.16, "elapsed_time": "15:11:14", "remaining_time": "3:45:31"} +{"current_steps": 3585, "total_steps": 4466, "loss": 0.2199, "lr": 4.5680331812225335e-06, "epoch": 5.6196078431372545, "percentage": 80.27, "elapsed_time": "15:12:33", "remaining_time": "3:44:15"} +{"current_steps": 3590, "total_steps": 4466, "loss": 0.2202, "lr": 4.518427396596246e-06, "epoch": 5.627450980392156, "percentage": 80.39, "elapsed_time": "15:13:51", "remaining_time": "3:42:59"} +{"current_steps": 3595, "total_steps": 4466, "loss": 0.2193, "lr": 4.469058104954786e-06, "epoch": 5.635294117647058, "percentage": 80.5, "elapsed_time": "15:15:06", "remaining_time": "3:41:42"} +{"current_steps": 3600, "total_steps": 4466, "loss": 0.23, "lr": 4.4199260604522266e-06, "epoch": 5.643137254901961, "percentage": 80.61, "elapsed_time": "15:16:27", "remaining_time": "3:40:27"} +{"current_steps": 3605, "total_steps": 4466, "loss": 0.2379, "lr": 4.371032013618519e-06, "epoch": 5.650980392156863, "percentage": 80.72, "elapsed_time": "15:17:44", "remaining_time": "3:39:11"} +{"current_steps": 3610, "total_steps": 4466, "loss": 0.2254, "lr": 4.322376711348009e-06, "epoch": 5.658823529411765, "percentage": 80.83, "elapsed_time": "15:19:00", "remaining_time": "3:37:54"} +{"current_steps": 3615, "total_steps": 4466, "loss": 0.2285, "lr": 4.273960896888045e-06, "epoch": 5.666666666666667, "percentage": 80.94, "elapsed_time": "15:20:21", "remaining_time": "3:36:39"} +{"current_steps": 3620, "total_steps": 4466, "loss": 0.2353, "lr": 4.225785309827595e-06, "epoch": 5.674509803921569, "percentage": 81.06, "elapsed_time": "15:21:36", "remaining_time": "3:35:22"} +{"current_steps": 3625, "total_steps": 4466, "loss": 0.2374, "lr": 4.177850686085987e-06, "epoch": 5.682352941176471, "percentage": 81.17, "elapsed_time": "15:22:56", "remaining_time": "3:34:07"} +{"current_steps": 3630, "total_steps": 4466, "loss": 0.2259, "lr": 4.130157757901632e-06, "epoch": 5.690196078431373, "percentage": 81.28, "elapsed_time": "15:24:17", "remaining_time": "3:32:51"} +{"current_steps": 3635, "total_steps": 4466, "loss": 0.2193, "lr": 4.0827072538208705e-06, "epoch": 5.698039215686275, "percentage": 81.39, "elapsed_time": "15:25:32", "remaining_time": "3:31:35"} +{"current_steps": 3640, "total_steps": 4466, "loss": 0.2254, "lr": 4.03549989868681e-06, "epoch": 5.705882352941177, "percentage": 81.5, "elapsed_time": "15:26:46", "remaining_time": "3:30:18"} +{"current_steps": 3645, "total_steps": 4466, "loss": 0.224, "lr": 3.988536413628286e-06, "epoch": 5.713725490196079, "percentage": 81.62, "elapsed_time": "15:28:02", "remaining_time": "3:29:01"} +{"current_steps": 3650, "total_steps": 4466, "loss": 0.2246, "lr": 3.941817516048827e-06, "epoch": 5.7215686274509805, "percentage": 81.73, "elapsed_time": "15:29:13", "remaining_time": "3:27:44"} +{"current_steps": 3655, "total_steps": 4466, "loss": 0.2256, "lr": 3.895343919615686e-06, "epoch": 5.729411764705882, "percentage": 81.84, "elapsed_time": "15:30:30", "remaining_time": "3:26:28"} +{"current_steps": 3660, "total_steps": 4466, "loss": 0.2269, "lr": 3.849116334248972e-06, "epoch": 5.737254901960784, "percentage": 81.95, "elapsed_time": "15:31:48", "remaining_time": "3:25:12"} +{"current_steps": 3665, "total_steps": 4466, "loss": 0.2287, "lr": 3.803135466110761e-06, "epoch": 5.745098039215686, "percentage": 82.06, "elapsed_time": "15:33:08", "remaining_time": "3:23:56"} +{"current_steps": 3670, "total_steps": 4466, "loss": 0.2411, "lr": 3.7574020175943514e-06, "epoch": 5.752941176470588, "percentage": 82.18, "elapsed_time": "15:34:25", "remaining_time": "3:22:40"} +{"current_steps": 3675, "total_steps": 4466, "loss": 0.2223, "lr": 3.7119166873135102e-06, "epoch": 5.76078431372549, "percentage": 82.29, "elapsed_time": "15:35:41", "remaining_time": "3:21:23"} +{"current_steps": 3680, "total_steps": 4466, "loss": 0.2391, "lr": 3.666680170091812e-06, "epoch": 5.768627450980392, "percentage": 82.4, "elapsed_time": "15:36:59", "remaining_time": "3:20:07"} +{"current_steps": 3685, "total_steps": 4466, "loss": 0.226, "lr": 3.6216931569519995e-06, "epoch": 5.776470588235294, "percentage": 82.51, "elapsed_time": "15:38:18", "remaining_time": "3:18:51"} +{"current_steps": 3690, "total_steps": 4466, "loss": 0.2321, "lr": 3.576956335105477e-06, "epoch": 5.784313725490196, "percentage": 82.62, "elapsed_time": "15:39:34", "remaining_time": "3:17:35"} +{"current_steps": 3695, "total_steps": 4466, "loss": 0.2273, "lr": 3.5324703879417553e-06, "epoch": 5.792156862745098, "percentage": 82.74, "elapsed_time": "15:40:52", "remaining_time": "3:16:19"} +{"current_steps": 3700, "total_steps": 4466, "loss": 0.2216, "lr": 3.488235995018063e-06, "epoch": 5.8, "percentage": 82.85, "elapsed_time": "15:42:10", "remaining_time": "3:15:03"} +{"current_steps": 3705, "total_steps": 4466, "loss": 0.2279, "lr": 3.444253832048925e-06, "epoch": 5.807843137254902, "percentage": 82.96, "elapsed_time": "15:43:26", "remaining_time": "3:13:46"} +{"current_steps": 3710, "total_steps": 4466, "loss": 0.2193, "lr": 3.4005245708958757e-06, "epoch": 5.815686274509804, "percentage": 83.07, "elapsed_time": "15:44:47", "remaining_time": "3:12:31"} +{"current_steps": 3715, "total_steps": 4466, "loss": 0.2201, "lr": 3.3570488795571653e-06, "epoch": 5.823529411764706, "percentage": 83.18, "elapsed_time": "15:45:58", "remaining_time": "3:11:13"} +{"current_steps": 3720, "total_steps": 4466, "loss": 0.2166, "lr": 3.313827422157583e-06, "epoch": 5.8313725490196076, "percentage": 83.3, "elapsed_time": "15:47:09", "remaining_time": "3:09:56"} +{"current_steps": 3725, "total_steps": 4466, "loss": 0.2326, "lr": 3.2708608589382783e-06, "epoch": 5.8392156862745095, "percentage": 83.41, "elapsed_time": "15:48:23", "remaining_time": "3:08:39"} +{"current_steps": 3730, "total_steps": 4466, "loss": 0.2251, "lr": 3.2281498462467177e-06, "epoch": 5.847058823529411, "percentage": 83.52, "elapsed_time": "15:49:37", "remaining_time": "3:07:22"} +{"current_steps": 3735, "total_steps": 4466, "loss": 0.2206, "lr": 3.185695036526615e-06, "epoch": 5.854901960784313, "percentage": 83.63, "elapsed_time": "15:50:48", "remaining_time": "3:06:05"} +{"current_steps": 3740, "total_steps": 4466, "loss": 0.2166, "lr": 3.1434970783080043e-06, "epoch": 5.862745098039216, "percentage": 83.74, "elapsed_time": "15:51:57", "remaining_time": "3:04:47"} +{"current_steps": 3745, "total_steps": 4466, "loss": 0.2208, "lr": 3.1015566161972967e-06, "epoch": 5.870588235294118, "percentage": 83.86, "elapsed_time": "15:53:14", "remaining_time": "3:03:31"} +{"current_steps": 3750, "total_steps": 4466, "loss": 0.219, "lr": 3.059874290867464e-06, "epoch": 5.87843137254902, "percentage": 83.97, "elapsed_time": "15:54:31", "remaining_time": "3:02:15"} +{"current_steps": 3755, "total_steps": 4466, "loss": 0.2269, "lr": 3.01845073904824e-06, "epoch": 5.886274509803922, "percentage": 84.08, "elapsed_time": "15:55:44", "remaining_time": "3:00:57"} +{"current_steps": 3760, "total_steps": 4466, "loss": 0.2295, "lr": 2.977286593516382e-06, "epoch": 5.894117647058824, "percentage": 84.19, "elapsed_time": "15:57:02", "remaining_time": "2:59:42"} +{"current_steps": 3765, "total_steps": 4466, "loss": 0.2216, "lr": 2.936382483086022e-06, "epoch": 5.901960784313726, "percentage": 84.3, "elapsed_time": "15:58:15", "remaining_time": "2:58:25"} +{"current_steps": 3770, "total_steps": 4466, "loss": 0.2129, "lr": 2.895739032599065e-06, "epoch": 5.909803921568628, "percentage": 84.42, "elapsed_time": "15:59:26", "remaining_time": "2:57:07"} +{"current_steps": 3775, "total_steps": 4466, "loss": 0.2261, "lr": 2.8553568629156124e-06, "epoch": 5.91764705882353, "percentage": 84.53, "elapsed_time": "16:00:44", "remaining_time": "2:55:51"} +{"current_steps": 3780, "total_steps": 4466, "loss": 0.2175, "lr": 2.815236590904522e-06, "epoch": 5.925490196078432, "percentage": 84.64, "elapsed_time": "16:01:56", "remaining_time": "2:54:34"} +{"current_steps": 3785, "total_steps": 4466, "loss": 0.2344, "lr": 2.7753788294339412e-06, "epoch": 5.933333333333334, "percentage": 84.75, "elapsed_time": "16:03:14", "remaining_time": "2:53:18"} +{"current_steps": 3790, "total_steps": 4466, "loss": 0.2271, "lr": 2.7357841873619804e-06, "epoch": 5.9411764705882355, "percentage": 84.86, "elapsed_time": "16:04:29", "remaining_time": "2:52:01"} +{"current_steps": 3795, "total_steps": 4466, "loss": 0.2208, "lr": 2.6964532695273993e-06, "epoch": 5.949019607843137, "percentage": 84.98, "elapsed_time": "16:05:44", "remaining_time": "2:50:45"} +{"current_steps": 3800, "total_steps": 4466, "loss": 0.2167, "lr": 2.65738667674035e-06, "epoch": 5.956862745098039, "percentage": 85.09, "elapsed_time": "16:07:02", "remaining_time": "2:49:29"} +{"current_steps": 3805, "total_steps": 4466, "loss": 0.2279, "lr": 2.6185850057732377e-06, "epoch": 5.964705882352941, "percentage": 85.2, "elapsed_time": "16:08:22", "remaining_time": "2:48:13"} +{"current_steps": 3810, "total_steps": 4466, "loss": 0.2268, "lr": 2.5800488493515576e-06, "epoch": 5.972549019607843, "percentage": 85.31, "elapsed_time": "16:09:40", "remaining_time": "2:46:57"} +{"current_steps": 3815, "total_steps": 4466, "loss": 0.2281, "lr": 2.5417787961448893e-06, "epoch": 5.980392156862745, "percentage": 85.42, "elapsed_time": "16:10:57", "remaining_time": "2:45:41"} +{"current_steps": 3820, "total_steps": 4466, "loss": 0.2214, "lr": 2.5037754307578553e-06, "epoch": 5.988235294117647, "percentage": 85.54, "elapsed_time": "16:12:13", "remaining_time": "2:44:24"} +{"current_steps": 3825, "total_steps": 4466, "loss": 0.2287, "lr": 2.466039333721246e-06, "epoch": 5.996078431372549, "percentage": 85.65, "elapsed_time": "16:13:28", "remaining_time": "2:43:08"} +{"current_steps": 3830, "total_steps": 4466, "loss": 0.2229, "lr": 2.4285710814830908e-06, "epoch": 6.003137254901961, "percentage": 85.76, "elapsed_time": "16:14:40", "remaining_time": "2:41:51"} +{"current_steps": 3835, "total_steps": 4466, "loss": 0.2227, "lr": 2.3913712463999026e-06, "epoch": 6.0109803921568625, "percentage": 85.87, "elapsed_time": "16:15:55", "remaining_time": "2:40:34"} +{"current_steps": 3840, "total_steps": 4466, "loss": 0.2276, "lr": 2.354440396727902e-06, "epoch": 6.0188235294117645, "percentage": 85.98, "elapsed_time": "16:17:14", "remaining_time": "2:39:18"} +{"current_steps": 3845, "total_steps": 4466, "loss": 0.2102, "lr": 2.3177790966143653e-06, "epoch": 6.026666666666666, "percentage": 86.09, "elapsed_time": "16:18:26", "remaining_time": "2:38:01"} +{"current_steps": 3850, "total_steps": 4466, "loss": 0.2172, "lr": 2.28138790608897e-06, "epoch": 6.034509803921568, "percentage": 86.21, "elapsed_time": "16:19:40", "remaining_time": "2:36:44"} +{"current_steps": 3855, "total_steps": 4466, "loss": 0.2233, "lr": 2.2452673810552783e-06, "epoch": 6.04235294117647, "percentage": 86.32, "elapsed_time": "16:20:56", "remaining_time": "2:35:28"} +{"current_steps": 3860, "total_steps": 4466, "loss": 0.2239, "lr": 2.2094180732822235e-06, "epoch": 6.050196078431372, "percentage": 86.43, "elapsed_time": "16:22:07", "remaining_time": "2:34:11"} +{"current_steps": 3865, "total_steps": 4466, "loss": 0.2277, "lr": 2.1738405303956877e-06, "epoch": 6.058039215686274, "percentage": 86.54, "elapsed_time": "16:23:20", "remaining_time": "2:32:54"} +{"current_steps": 3870, "total_steps": 4466, "loss": 0.2156, "lr": 2.138535295870121e-06, "epoch": 6.065882352941176, "percentage": 86.65, "elapsed_time": "16:24:35", "remaining_time": "2:31:37"} +{"current_steps": 3875, "total_steps": 4466, "loss": 0.2295, "lr": 2.1035029090202717e-06, "epoch": 6.073725490196079, "percentage": 86.77, "elapsed_time": "16:25:55", "remaining_time": "2:30:22"} +{"current_steps": 3880, "total_steps": 4466, "loss": 0.2234, "lr": 2.0687439049929113e-06, "epoch": 6.081568627450981, "percentage": 86.88, "elapsed_time": "16:27:14", "remaining_time": "2:29:06"} +{"current_steps": 3885, "total_steps": 4466, "loss": 0.233, "lr": 2.034258814758696e-06, "epoch": 6.089411764705883, "percentage": 86.99, "elapsed_time": "16:28:34", "remaining_time": "2:27:50"} +{"current_steps": 3890, "total_steps": 4466, "loss": 0.2196, "lr": 2.0000481651040182e-06, "epoch": 6.097254901960785, "percentage": 87.1, "elapsed_time": "16:29:50", "remaining_time": "2:26:34"} +{"current_steps": 3895, "total_steps": 4466, "loss": 0.222, "lr": 1.96611247862299e-06, "epoch": 6.105098039215687, "percentage": 87.21, "elapsed_time": "16:31:07", "remaining_time": "2:25:17"} +{"current_steps": 3900, "total_steps": 4466, "loss": 0.217, "lr": 1.932452273709453e-06, "epoch": 6.1129411764705885, "percentage": 87.33, "elapsed_time": "16:32:24", "remaining_time": "2:24:01"} +{"current_steps": 3905, "total_steps": 4466, "loss": 0.2236, "lr": 1.8990680645490389e-06, "epoch": 6.1207843137254905, "percentage": 87.44, "elapsed_time": "16:33:44", "remaining_time": "2:22:45"} +{"current_steps": 3910, "total_steps": 4466, "loss": 0.2124, "lr": 1.8659603611113475e-06, "epoch": 6.128627450980392, "percentage": 87.55, "elapsed_time": "16:35:03", "remaining_time": "2:21:29"} +{"current_steps": 3915, "total_steps": 4466, "loss": 0.2246, "lr": 1.833129669142124e-06, "epoch": 6.136470588235294, "percentage": 87.66, "elapsed_time": "16:36:18", "remaining_time": "2:20:13"} +{"current_steps": 3920, "total_steps": 4466, "loss": 0.2137, "lr": 1.8005764901555678e-06, "epoch": 6.144313725490196, "percentage": 87.77, "elapsed_time": "16:37:32", "remaining_time": "2:18:56"} +{"current_steps": 3925, "total_steps": 4466, "loss": 0.227, "lr": 1.7683013214266354e-06, "epoch": 6.152156862745098, "percentage": 87.89, "elapsed_time": "16:38:52", "remaining_time": "2:17:40"} +{"current_steps": 3930, "total_steps": 4466, "loss": 0.2276, "lr": 1.7363046559834718e-06, "epoch": 6.16, "percentage": 88.0, "elapsed_time": "16:40:08", "remaining_time": "2:16:24"} +{"current_steps": 3935, "total_steps": 4466, "loss": 0.2156, "lr": 1.7045869825998674e-06, "epoch": 6.167843137254902, "percentage": 88.11, "elapsed_time": "16:41:22", "remaining_time": "2:15:07"} +{"current_steps": 3940, "total_steps": 4466, "loss": 0.2331, "lr": 1.6731487857877971e-06, "epoch": 6.175686274509804, "percentage": 88.22, "elapsed_time": "16:42:37", "remaining_time": "2:13:51"} +{"current_steps": 3945, "total_steps": 4466, "loss": 0.2176, "lr": 1.641990545790002e-06, "epoch": 6.183529411764706, "percentage": 88.33, "elapsed_time": "16:43:53", "remaining_time": "2:12:34"} +{"current_steps": 3950, "total_steps": 4466, "loss": 0.2285, "lr": 1.6111127385726844e-06, "epoch": 6.191372549019608, "percentage": 88.45, "elapsed_time": "16:45:11", "remaining_time": "2:11:18"} +{"current_steps": 3955, "total_steps": 4466, "loss": 0.2238, "lr": 1.5805158358182039e-06, "epoch": 6.19921568627451, "percentage": 88.56, "elapsed_time": "16:46:28", "remaining_time": "2:10:02"} +{"current_steps": 3960, "total_steps": 4466, "loss": 0.2247, "lr": 1.550200304917897e-06, "epoch": 6.207058823529412, "percentage": 88.67, "elapsed_time": "16:47:43", "remaining_time": "2:08:45"} +{"current_steps": 3965, "total_steps": 4466, "loss": 0.2196, "lr": 1.5201666089649193e-06, "epoch": 6.214901960784314, "percentage": 88.78, "elapsed_time": "16:48:58", "remaining_time": "2:07:29"} +{"current_steps": 3970, "total_steps": 4466, "loss": 0.2184, "lr": 1.4904152067471932e-06, "epoch": 6.222745098039216, "percentage": 88.89, "elapsed_time": "16:50:11", "remaining_time": "2:06:12"} +{"current_steps": 3975, "total_steps": 4466, "loss": 0.227, "lr": 1.4609465527403722e-06, "epoch": 6.2305882352941175, "percentage": 89.01, "elapsed_time": "16:51:26", "remaining_time": "2:04:56"} +{"current_steps": 3980, "total_steps": 4466, "loss": 0.2213, "lr": 1.431761097100921e-06, "epoch": 6.2384313725490195, "percentage": 89.12, "elapsed_time": "16:52:38", "remaining_time": "2:03:39"} +{"current_steps": 3985, "total_steps": 4466, "loss": 0.2206, "lr": 1.4028592856592239e-06, "epoch": 6.246274509803921, "percentage": 89.23, "elapsed_time": "16:53:55", "remaining_time": "2:02:23"} +{"current_steps": 3990, "total_steps": 4466, "loss": 0.211, "lr": 1.374241559912788e-06, "epoch": 6.254117647058823, "percentage": 89.34, "elapsed_time": "16:55:11", "remaining_time": "2:01:06"} +{"current_steps": 3995, "total_steps": 4466, "loss": 0.2076, "lr": 1.345908357019483e-06, "epoch": 6.261960784313725, "percentage": 89.45, "elapsed_time": "16:56:22", "remaining_time": "1:59:49"} +{"current_steps": 4000, "total_steps": 4466, "loss": 0.2187, "lr": 1.3178601097908827e-06, "epoch": 6.269803921568627, "percentage": 89.57, "elapsed_time": "16:57:39", "remaining_time": "1:58:33"} +{"current_steps": 4005, "total_steps": 4466, "loss": 0.2141, "lr": 1.2900972466856377e-06, "epoch": 6.277647058823529, "percentage": 89.68, "elapsed_time": "16:58:54", "remaining_time": "1:57:16"} +{"current_steps": 4010, "total_steps": 4466, "loss": 0.2193, "lr": 1.2626201918029301e-06, "epoch": 6.285490196078431, "percentage": 89.79, "elapsed_time": "17:00:13", "remaining_time": "1:56:00"} +{"current_steps": 4015, "total_steps": 4466, "loss": 0.2166, "lr": 1.235429364876015e-06, "epoch": 6.293333333333333, "percentage": 89.9, "elapsed_time": "17:01:28", "remaining_time": "1:54:44"} +{"current_steps": 4020, "total_steps": 4466, "loss": 0.2246, "lr": 1.2085251812657762e-06, "epoch": 6.301176470588235, "percentage": 90.01, "elapsed_time": "17:02:45", "remaining_time": "1:53:28"} +{"current_steps": 4025, "total_steps": 4466, "loss": 0.2213, "lr": 1.1819080519544123e-06, "epoch": 6.309019607843137, "percentage": 90.13, "elapsed_time": "17:04:02", "remaining_time": "1:52:11"} +{"current_steps": 4030, "total_steps": 4466, "loss": 0.2207, "lr": 1.155578383539142e-06, "epoch": 6.316862745098039, "percentage": 90.24, "elapsed_time": "17:05:16", "remaining_time": "1:50:55"} +{"current_steps": 4035, "total_steps": 4466, "loss": 0.2231, "lr": 1.1295365782259982e-06, "epoch": 6.324705882352941, "percentage": 90.35, "elapsed_time": "17:06:34", "remaining_time": "1:49:39"} +{"current_steps": 4040, "total_steps": 4466, "loss": 0.2315, "lr": 1.103783033823671e-06, "epoch": 6.332549019607843, "percentage": 90.46, "elapsed_time": "17:07:52", "remaining_time": "1:48:23"} +{"current_steps": 4045, "total_steps": 4466, "loss": 0.221, "lr": 1.0783181437374669e-06, "epoch": 6.3403921568627455, "percentage": 90.57, "elapsed_time": "17:09:11", "remaining_time": "1:47:07"} +{"current_steps": 4050, "total_steps": 4466, "loss": 0.2343, "lr": 1.05314229696325e-06, "epoch": 6.348235294117647, "percentage": 90.69, "elapsed_time": "17:10:32", "remaining_time": "1:45:51"} +{"current_steps": 4055, "total_steps": 4466, "loss": 0.2306, "lr": 1.0282558780815411e-06, "epoch": 6.356078431372549, "percentage": 90.8, "elapsed_time": "17:11:51", "remaining_time": "1:44:35"} +{"current_steps": 4060, "total_steps": 4466, "loss": 0.2159, "lr": 1.0036592672516088e-06, "epoch": 6.363921568627451, "percentage": 90.91, "elapsed_time": "17:13:10", "remaining_time": "1:43:19"} +{"current_steps": 4065, "total_steps": 4466, "loss": 0.2175, "lr": 9.79352840205703e-07, "epoch": 6.371764705882353, "percentage": 91.02, "elapsed_time": "17:14:24", "remaining_time": "1:42:02"} +{"current_steps": 4070, "total_steps": 4466, "loss": 0.2286, "lr": 9.55336968243268e-07, "epoch": 6.379607843137255, "percentage": 91.13, "elapsed_time": "17:15:43", "remaining_time": "1:40:46"} +{"current_steps": 4075, "total_steps": 4466, "loss": 0.2111, "lr": 9.316120182253141e-07, "epoch": 6.387450980392157, "percentage": 91.24, "elapsed_time": "17:17:02", "remaining_time": "1:39:30"} +{"current_steps": 4080, "total_steps": 4466, "loss": 0.2226, "lr": 9.081783525687826e-07, "epoch": 6.395294117647059, "percentage": 91.36, "elapsed_time": "17:18:22", "remaining_time": "1:38:14"} +{"current_steps": 4085, "total_steps": 4466, "loss": 0.2243, "lr": 8.850363292410269e-07, "epoch": 6.403137254901961, "percentage": 91.47, "elapsed_time": "17:19:40", "remaining_time": "1:36:58"} +{"current_steps": 4090, "total_steps": 4466, "loss": 0.2134, "lr": 8.621863017543353e-07, "epoch": 6.410980392156863, "percentage": 91.58, "elapsed_time": "17:20:58", "remaining_time": "1:35:41"} +{"current_steps": 4095, "total_steps": 4466, "loss": 0.2393, "lr": 8.396286191605352e-07, "epoch": 6.418823529411765, "percentage": 91.69, "elapsed_time": "17:22:18", "remaining_time": "1:34:25"} +{"current_steps": 4100, "total_steps": 4466, "loss": 0.2185, "lr": 8.173636260456575e-07, "epoch": 6.426666666666667, "percentage": 91.8, "elapsed_time": "17:23:26", "remaining_time": "1:33:08"} +{"current_steps": 4105, "total_steps": 4466, "loss": 0.2154, "lr": 7.953916625246804e-07, "epoch": 6.434509803921569, "percentage": 91.92, "elapsed_time": "17:24:37", "remaining_time": "1:31:51"} +{"current_steps": 4110, "total_steps": 4466, "loss": 0.2188, "lr": 7.737130642363211e-07, "epoch": 6.442352941176471, "percentage": 92.03, "elapsed_time": "17:25:49", "remaining_time": "1:30:35"} +{"current_steps": 4115, "total_steps": 4466, "loss": 0.2199, "lr": 7.52328162337923e-07, "epoch": 6.4501960784313725, "percentage": 92.14, "elapsed_time": "17:27:08", "remaining_time": "1:29:19"} +{"current_steps": 4120, "total_steps": 4466, "loss": 0.213, "lr": 7.3123728350039e-07, "epoch": 6.4580392156862745, "percentage": 92.25, "elapsed_time": "17:28:26", "remaining_time": "1:28:02"} +{"current_steps": 4125, "total_steps": 4466, "loss": 0.2205, "lr": 7.104407499031896e-07, "epoch": 6.465882352941176, "percentage": 92.36, "elapsed_time": "17:29:42", "remaining_time": "1:26:46"} +{"current_steps": 4130, "total_steps": 4466, "loss": 0.2273, "lr": 6.899388792294482e-07, "epoch": 6.473725490196078, "percentage": 92.48, "elapsed_time": "17:30:54", "remaining_time": "1:25:29"} +{"current_steps": 4135, "total_steps": 4466, "loss": 0.2275, "lr": 6.697319846610772e-07, "epoch": 6.48156862745098, "percentage": 92.59, "elapsed_time": "17:32:13", "remaining_time": "1:24:13"} +{"current_steps": 4140, "total_steps": 4466, "loss": 0.2172, "lr": 6.498203748740106e-07, "epoch": 6.489411764705882, "percentage": 92.7, "elapsed_time": "17:33:30", "remaining_time": "1:22:57"} +{"current_steps": 4145, "total_steps": 4466, "loss": 0.2247, "lr": 6.302043540334701e-07, "epoch": 6.497254901960784, "percentage": 92.81, "elapsed_time": "17:34:47", "remaining_time": "1:21:41"} +{"current_steps": 4150, "total_steps": 4466, "loss": 0.2287, "lr": 6.108842217893384e-07, "epoch": 6.505098039215686, "percentage": 92.92, "elapsed_time": "17:36:03", "remaining_time": "1:20:24"} +{"current_steps": 4155, "total_steps": 4466, "loss": 0.2206, "lr": 5.918602732715583e-07, "epoch": 6.512941176470588, "percentage": 93.04, "elapsed_time": "17:37:19", "remaining_time": "1:19:08"} +{"current_steps": 4160, "total_steps": 4466, "loss": 0.2282, "lr": 5.731327990856517e-07, "epoch": 6.52078431372549, "percentage": 93.15, "elapsed_time": "17:38:35", "remaining_time": "1:17:52"} +{"current_steps": 4165, "total_steps": 4466, "loss": 0.2177, "lr": 5.547020853082497e-07, "epoch": 6.528627450980392, "percentage": 93.26, "elapsed_time": "17:39:53", "remaining_time": "1:16:35"} +{"current_steps": 4170, "total_steps": 4466, "loss": 0.2301, "lr": 5.365684134827542e-07, "epoch": 6.536470588235294, "percentage": 93.37, "elapsed_time": "17:41:11", "remaining_time": "1:15:19"} +{"current_steps": 4175, "total_steps": 4466, "loss": 0.2316, "lr": 5.187320606150103e-07, "epoch": 6.544313725490196, "percentage": 93.48, "elapsed_time": "17:42:27", "remaining_time": "1:14:03"} +{"current_steps": 4180, "total_steps": 4466, "loss": 0.2263, "lr": 5.011932991690959e-07, "epoch": 6.552156862745098, "percentage": 93.6, "elapsed_time": "17:43:44", "remaining_time": "1:12:46"} +{"current_steps": 4185, "total_steps": 4466, "loss": 0.2187, "lr": 4.839523970631387e-07, "epoch": 6.5600000000000005, "percentage": 93.71, "elapsed_time": "17:44:59", "remaining_time": "1:11:30"} +{"current_steps": 4190, "total_steps": 4466, "loss": 0.2168, "lr": 4.6700961766524833e-07, "epoch": 6.567843137254902, "percentage": 93.82, "elapsed_time": "17:46:13", "remaining_time": "1:10:13"} +{"current_steps": 4195, "total_steps": 4466, "loss": 0.2184, "lr": 4.503652197894681e-07, "epoch": 6.575686274509804, "percentage": 93.93, "elapsed_time": "17:47:27", "remaining_time": "1:08:57"} +{"current_steps": 4200, "total_steps": 4466, "loss": 0.2247, "lr": 4.3401945769183884e-07, "epoch": 6.583529411764706, "percentage": 94.04, "elapsed_time": "17:48:34", "remaining_time": "1:07:40"} +{"current_steps": 4205, "total_steps": 4466, "loss": 0.2146, "lr": 4.1797258106650804e-07, "epoch": 6.591372549019608, "percentage": 94.16, "elapsed_time": "17:49:48", "remaining_time": "1:06:24"} +{"current_steps": 4210, "total_steps": 4466, "loss": 0.2145, "lr": 4.0222483504191556e-07, "epoch": 6.59921568627451, "percentage": 94.27, "elapsed_time": "17:51:05", "remaining_time": "1:05:07"} +{"current_steps": 4215, "total_steps": 4466, "loss": 0.2295, "lr": 3.8677646017704963e-07, "epoch": 6.607058823529412, "percentage": 94.38, "elapsed_time": "17:52:26", "remaining_time": "1:03:51"} +{"current_steps": 4220, "total_steps": 4466, "loss": 0.2322, "lr": 3.716276924577744e-07, "epoch": 6.614901960784314, "percentage": 94.49, "elapsed_time": "17:53:40", "remaining_time": "1:02:35"} +{"current_steps": 4225, "total_steps": 4466, "loss": 0.2174, "lr": 3.5677876329322624e-07, "epoch": 6.622745098039216, "percentage": 94.6, "elapsed_time": "17:54:59", "remaining_time": "1:01:19"} +{"current_steps": 4230, "total_steps": 4466, "loss": 0.24, "lr": 3.422298995122675e-07, "epoch": 6.630588235294118, "percentage": 94.72, "elapsed_time": "17:56:13", "remaining_time": "1:00:02"} +{"current_steps": 4235, "total_steps": 4466, "loss": 0.2078, "lr": 3.279813233600404e-07, "epoch": 6.63843137254902, "percentage": 94.83, "elapsed_time": "17:57:30", "remaining_time": "0:58:46"} +{"current_steps": 4240, "total_steps": 4466, "loss": 0.2205, "lr": 3.140332524945522e-07, "epoch": 6.646274509803922, "percentage": 94.94, "elapsed_time": "17:58:45", "remaining_time": "0:57:30"} +{"current_steps": 4245, "total_steps": 4466, "loss": 0.2232, "lr": 3.0038589998336423e-07, "epoch": 6.654117647058824, "percentage": 95.05, "elapsed_time": "18:00:06", "remaining_time": "0:56:13"} +{"current_steps": 4250, "total_steps": 4466, "loss": 0.2076, "lr": 2.8703947430033465e-07, "epoch": 6.661960784313726, "percentage": 95.16, "elapsed_time": "18:01:26", "remaining_time": "0:54:57"} +{"current_steps": 4255, "total_steps": 4466, "loss": 0.2296, "lr": 2.7399417932242325e-07, "epoch": 6.669803921568628, "percentage": 95.28, "elapsed_time": "18:02:42", "remaining_time": "0:53:41"} +{"current_steps": 4260, "total_steps": 4466, "loss": 0.2176, "lr": 2.6125021432659824e-07, "epoch": 6.6776470588235295, "percentage": 95.39, "elapsed_time": "18:04:01", "remaining_time": "0:52:25"} +{"current_steps": 4265, "total_steps": 4466, "loss": 0.2426, "lr": 2.4880777398677e-07, "epoch": 6.685490196078431, "percentage": 95.5, "elapsed_time": "18:05:20", "remaining_time": "0:51:08"} +{"current_steps": 4270, "total_steps": 4466, "loss": 0.211, "lr": 2.3666704837082888e-07, "epoch": 6.693333333333333, "percentage": 95.61, "elapsed_time": "18:06:36", "remaining_time": "0:49:52"} +{"current_steps": 4275, "total_steps": 4466, "loss": 0.2268, "lr": 2.2482822293774297e-07, "epoch": 6.701176470588235, "percentage": 95.72, "elapsed_time": "18:07:55", "remaining_time": "0:48:36"} +{"current_steps": 4280, "total_steps": 4466, "loss": 0.2195, "lr": 2.13291478534714e-07, "epoch": 6.709019607843137, "percentage": 95.84, "elapsed_time": "18:09:09", "remaining_time": "0:47:19"} +{"current_steps": 4285, "total_steps": 4466, "loss": 0.2247, "lr": 2.020569913944348e-07, "epoch": 6.716862745098039, "percentage": 95.95, "elapsed_time": "18:10:25", "remaining_time": "0:46:03"} +{"current_steps": 4290, "total_steps": 4466, "loss": 0.2271, "lr": 1.9112493313236947e-07, "epoch": 6.724705882352941, "percentage": 96.06, "elapsed_time": "18:11:46", "remaining_time": "0:44:47"} +{"current_steps": 4295, "total_steps": 4466, "loss": 0.2254, "lr": 1.8049547074416195e-07, "epoch": 6.732549019607843, "percentage": 96.17, "elapsed_time": "18:13:06", "remaining_time": "0:43:31"} +{"current_steps": 4300, "total_steps": 4466, "loss": 0.2177, "lr": 1.701687666030627e-07, "epoch": 6.740392156862745, "percentage": 96.28, "elapsed_time": "18:14:22", "remaining_time": "0:42:14"} +{"current_steps": 4305, "total_steps": 4466, "loss": 0.2213, "lr": 1.6014497845745715e-07, "epoch": 6.748235294117647, "percentage": 96.39, "elapsed_time": "18:15:37", "remaining_time": "0:40:58"} +{"current_steps": 4310, "total_steps": 4466, "loss": 0.2229, "lr": 1.504242594284544e-07, "epoch": 6.756078431372549, "percentage": 96.51, "elapsed_time": "18:16:52", "remaining_time": "0:39:42"} +{"current_steps": 4315, "total_steps": 4466, "loss": 0.2197, "lr": 1.4100675800754914e-07, "epoch": 6.763921568627451, "percentage": 96.62, "elapsed_time": "18:18:11", "remaining_time": "0:38:25"} +{"current_steps": 4320, "total_steps": 4466, "loss": 0.2228, "lr": 1.318926180543545e-07, "epoch": 6.771764705882353, "percentage": 96.73, "elapsed_time": "18:19:26", "remaining_time": "0:37:09"} +{"current_steps": 4325, "total_steps": 4466, "loss": 0.2298, "lr": 1.2308197879439932e-07, "epoch": 6.779607843137255, "percentage": 96.84, "elapsed_time": "18:20:38", "remaining_time": "0:35:52"} +{"current_steps": 4330, "total_steps": 4466, "loss": 0.2277, "lr": 1.1457497481700775e-07, "epoch": 6.7874509803921566, "percentage": 96.95, "elapsed_time": "18:21:54", "remaining_time": "0:34:36"} +{"current_steps": 4335, "total_steps": 4466, "loss": 0.2232, "lr": 1.0637173607323859e-07, "epoch": 6.7952941176470585, "percentage": 97.07, "elapsed_time": "18:23:12", "remaining_time": "0:33:20"} +{"current_steps": 4340, "total_steps": 4466, "loss": 0.2281, "lr": 9.847238787390246e-08, "epoch": 6.80313725490196, "percentage": 97.18, "elapsed_time": "18:24:25", "remaining_time": "0:32:03"} +{"current_steps": 4345, "total_steps": 4466, "loss": 0.2216, "lr": 9.087705088764997e-08, "epoch": 6.810980392156862, "percentage": 97.29, "elapsed_time": "18:25:44", "remaining_time": "0:30:47"} +{"current_steps": 4350, "total_steps": 4466, "loss": 0.217, "lr": 8.358584113911994e-08, "epoch": 6.818823529411764, "percentage": 97.4, "elapsed_time": "18:27:00", "remaining_time": "0:29:31"} +{"current_steps": 4355, "total_steps": 4466, "loss": 0.2129, "lr": 7.659887000717403e-08, "epoch": 6.826666666666666, "percentage": 97.51, "elapsed_time": "18:28:18", "remaining_time": "0:28:14"} +{"current_steps": 4360, "total_steps": 4466, "loss": 0.2209, "lr": 6.991624422320042e-08, "epoch": 6.834509803921568, "percentage": 97.63, "elapsed_time": "18:29:37", "remaining_time": "0:26:58"} +{"current_steps": 4365, "total_steps": 4466, "loss": 0.2146, "lr": 6.353806586946842e-08, "epoch": 6.842352941176471, "percentage": 97.74, "elapsed_time": "18:30:51", "remaining_time": "0:25:42"} +{"current_steps": 4370, "total_steps": 4466, "loss": 0.2188, "lr": 5.7464432377580814e-08, "epoch": 6.850196078431373, "percentage": 97.85, "elapsed_time": "18:32:08", "remaining_time": "0:24:25"} +{"current_steps": 4375, "total_steps": 4466, "loss": 0.2192, "lr": 5.169543652698617e-08, "epoch": 6.858039215686275, "percentage": 97.96, "elapsed_time": "18:33:24", "remaining_time": "0:23:09"} +{"current_steps": 4380, "total_steps": 4466, "loss": 0.2146, "lr": 4.623116644354886e-08, "epoch": 6.865882352941177, "percentage": 98.07, "elapsed_time": "18:34:38", "remaining_time": "0:21:53"} +{"current_steps": 4385, "total_steps": 4466, "loss": 0.2152, "lr": 4.107170559822127e-08, "epoch": 6.873725490196079, "percentage": 98.19, "elapsed_time": "18:35:48", "remaining_time": "0:20:36"} +{"current_steps": 4390, "total_steps": 4466, "loss": 0.231, "lr": 3.621713280575367e-08, "epoch": 6.881568627450981, "percentage": 98.3, "elapsed_time": "18:37:02", "remaining_time": "0:19:20"} +{"current_steps": 4395, "total_steps": 4466, "loss": 0.2224, "lr": 3.166752222349523e-08, "epoch": 6.889411764705883, "percentage": 98.41, "elapsed_time": "18:38:20", "remaining_time": "0:18:03"} +{"current_steps": 4400, "total_steps": 4466, "loss": 0.2254, "lr": 2.7422943350263743e-08, "epoch": 6.8972549019607845, "percentage": 98.52, "elapsed_time": "18:39:37", "remaining_time": "0:16:47"} +{"current_steps": 4405, "total_steps": 4466, "loss": 0.2247, "lr": 2.3483461025282094e-08, "epoch": 6.905098039215686, "percentage": 98.63, "elapsed_time": "18:40:52", "remaining_time": "0:15:31"} +{"current_steps": 4410, "total_steps": 4466, "loss": 0.2261, "lr": 1.9849135427187916e-08, "epoch": 6.912941176470588, "percentage": 98.75, "elapsed_time": "18:42:09", "remaining_time": "0:14:14"} +{"current_steps": 4415, "total_steps": 4466, "loss": 0.2269, "lr": 1.6520022073112098e-08, "epoch": 6.92078431372549, "percentage": 98.86, "elapsed_time": "18:43:25", "remaining_time": "0:12:58"} +{"current_steps": 4420, "total_steps": 4466, "loss": 0.2291, "lr": 1.3496171817832804e-08, "epoch": 6.928627450980392, "percentage": 98.97, "elapsed_time": "18:44:46", "remaining_time": "0:11:42"} +{"current_steps": 4425, "total_steps": 4466, "loss": 0.2329, "lr": 1.0777630853000543e-08, "epoch": 6.936470588235294, "percentage": 99.08, "elapsed_time": "18:46:03", "remaining_time": "0:10:26"} +{"current_steps": 4430, "total_steps": 4466, "loss": 0.2242, "lr": 8.364440706429833e-09, "epoch": 6.944313725490196, "percentage": 99.19, "elapsed_time": "18:47:21", "remaining_time": "0:09:09"} +{"current_steps": 4435, "total_steps": 4466, "loss": 0.2264, "lr": 6.2566382414641635e-09, "epoch": 6.952156862745098, "percentage": 99.31, "elapsed_time": "18:48:34", "remaining_time": "0:07:53"} +{"current_steps": 4440, "total_steps": 4466, "loss": 0.2178, "lr": 4.454255656414219e-09, "epoch": 6.96, "percentage": 99.42, "elapsed_time": "18:49:49", "remaining_time": "0:06:36"} +{"current_steps": 4445, "total_steps": 4466, "loss": 0.2123, "lr": 2.957320484067161e-09, "epoch": 6.967843137254902, "percentage": 99.53, "elapsed_time": "18:51:07", "remaining_time": "0:05:20"} +{"current_steps": 4450, "total_steps": 4466, "loss": 0.2191, "lr": 1.7658555912647423e-09, "epoch": 6.975686274509804, "percentage": 99.64, "elapsed_time": "18:52:19", "remaining_time": "0:04:04"} +{"current_steps": 4455, "total_steps": 4466, "loss": 0.2156, "lr": 8.79879178554699e-10, "epoch": 6.983529411764706, "percentage": 99.75, "elapsed_time": "18:53:35", "remaining_time": "0:02:47"} +{"current_steps": 4460, "total_steps": 4466, "loss": 0.2156, "lr": 2.9940477991097227e-10, "epoch": 6.991372549019608, "percentage": 99.87, "elapsed_time": "18:54:50", "remaining_time": "0:01:31"} +{"current_steps": 4465, "total_steps": 4466, "loss": 0.2094, "lr": 2.4441262527208355e-11, "epoch": 6.99921568627451, "percentage": 99.98, "elapsed_time": "18:56:00", "remaining_time": "0:00:15"} +{"current_steps": 4466, "total_steps": 4466, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "18:56:52", "remaining_time": "0:00:00"} +{"current_steps": 4466, "total_steps": 4466, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..3e51ab2 --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,9866 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 7.0, + "eval_steps": 500, + "global_step": 4466, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.00784313725490196, + "grad_norm": 23.298347338390826, + "learning_rate": 3.579418344519016e-07, + "loss": 0.8602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.43839943408966064, + "step": 5, + "valid_targets_mean": 6052.9, + "valid_targets_min": 4026 + }, + { + "epoch": 0.01568627450980392, + "grad_norm": 22.291211448466854, + "learning_rate": 8.053691275167786e-07, + "loss": 0.8507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3826303482055664, + "step": 10, + "valid_targets_mean": 4323.8, + "valid_targets_min": 757 + }, + { + "epoch": 0.023529411764705882, + "grad_norm": 19.59349405942615, + "learning_rate": 1.2527964205816557e-06, + "loss": 0.8156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.39852985739707947, + "step": 15, + "valid_targets_mean": 5580.4, + "valid_targets_min": 3518 + }, + { + "epoch": 0.03137254901960784, + "grad_norm": 15.074355357417764, + "learning_rate": 1.7002237136465326e-06, + "loss": 0.7847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3531936705112457, + "step": 20, + "valid_targets_mean": 4555.9, + "valid_targets_min": 757 + }, + { + "epoch": 0.0392156862745098, + "grad_norm": 8.503476256842038, + "learning_rate": 2.1476510067114096e-06, + "loss": 0.7347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3691006302833557, + "step": 25, + "valid_targets_mean": 5543.6, + "valid_targets_min": 1224 + }, + { + "epoch": 0.047058823529411764, + "grad_norm": 4.791441092709092, + "learning_rate": 2.5950782997762863e-06, + "loss": 0.6663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.313259482383728, + "step": 30, + "valid_targets_mean": 4514.2, + "valid_targets_min": 3605 + }, + { + "epoch": 0.054901960784313725, + "grad_norm": 2.5079670106002365, + "learning_rate": 3.0425055928411635e-06, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3332233428955078, + "step": 35, + "valid_targets_mean": 5949.8, + "valid_targets_min": 3442 + }, + { + "epoch": 0.06274509803921569, + "grad_norm": 1.773502389142227, + "learning_rate": 3.4899328859060407e-06, + "loss": 0.6072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2549877166748047, + "step": 40, + "valid_targets_mean": 4407.0, + "valid_targets_min": 3418 + }, + { + "epoch": 0.07058823529411765, + "grad_norm": 1.6073737125855354, + "learning_rate": 3.937360178970917e-06, + "loss": 0.5814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27978047728538513, + "step": 45, + "valid_targets_mean": 4382.0, + "valid_targets_min": 850 + }, + { + "epoch": 0.0784313725490196, + "grad_norm": 1.2925467378333404, + "learning_rate": 4.384787472035795e-06, + "loss": 0.5545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26093819737434387, + "step": 50, + "valid_targets_mean": 5089.8, + "valid_targets_min": 3683 + }, + { + "epoch": 0.08627450980392157, + "grad_norm": 1.0921764137166408, + "learning_rate": 4.832214765100672e-06, + "loss": 0.5497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2828206419944763, + "step": 55, + "valid_targets_mean": 4860.9, + "valid_targets_min": 3327 + }, + { + "epoch": 0.09411764705882353, + "grad_norm": 0.9105078282562821, + "learning_rate": 5.2796420581655485e-06, + "loss": 0.5404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2650872468948364, + "step": 60, + "valid_targets_mean": 4219.0, + "valid_targets_min": 960 + }, + { + "epoch": 0.10196078431372549, + "grad_norm": 0.8176291712197993, + "learning_rate": 5.727069351230425e-06, + "loss": 0.5087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2280701994895935, + "step": 65, + "valid_targets_mean": 4217.8, + "valid_targets_min": 612 + }, + { + "epoch": 0.10980392156862745, + "grad_norm": 0.7305215048778408, + "learning_rate": 6.174496644295303e-06, + "loss": 0.5017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25523003935813904, + "step": 70, + "valid_targets_mean": 5386.5, + "valid_targets_min": 3532 + }, + { + "epoch": 0.11764705882352941, + "grad_norm": 0.6691013259217359, + "learning_rate": 6.6219239373601796e-06, + "loss": 0.4841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24713614583015442, + "step": 75, + "valid_targets_mean": 4911.4, + "valid_targets_min": 3582 + }, + { + "epoch": 0.12549019607843137, + "grad_norm": 0.609679353765235, + "learning_rate": 7.069351230425056e-06, + "loss": 0.4621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23147262632846832, + "step": 80, + "valid_targets_mean": 4827.0, + "valid_targets_min": 4254 + }, + { + "epoch": 0.13333333333333333, + "grad_norm": 0.6087171040956587, + "learning_rate": 7.516778523489934e-06, + "loss": 0.4707, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24862024188041687, + "step": 85, + "valid_targets_mean": 6231.5, + "valid_targets_min": 4574 + }, + { + "epoch": 0.1411764705882353, + "grad_norm": 0.6145120711271943, + "learning_rate": 7.96420581655481e-06, + "loss": 0.435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22450268268585205, + "step": 90, + "valid_targets_mean": 4949.2, + "valid_targets_min": 3877 + }, + { + "epoch": 0.14901960784313725, + "grad_norm": 0.5603079041349106, + "learning_rate": 8.411633109619688e-06, + "loss": 0.4323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18175888061523438, + "step": 95, + "valid_targets_mean": 4763.6, + "valid_targets_min": 626 + }, + { + "epoch": 0.1568627450980392, + "grad_norm": 0.6890920617581278, + "learning_rate": 8.859060402684566e-06, + "loss": 0.4226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21500495076179504, + "step": 100, + "valid_targets_mean": 5103.5, + "valid_targets_min": 636 + }, + { + "epoch": 0.16470588235294117, + "grad_norm": 0.7055026012162536, + "learning_rate": 9.306487695749442e-06, + "loss": 0.4028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.216325581073761, + "step": 105, + "valid_targets_mean": 4637.9, + "valid_targets_min": 943 + }, + { + "epoch": 0.17254901960784313, + "grad_norm": 0.5643953971819364, + "learning_rate": 9.753914988814318e-06, + "loss": 0.4017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19290407001972198, + "step": 110, + "valid_targets_mean": 4680.8, + "valid_targets_min": 3445 + }, + { + "epoch": 0.1803921568627451, + "grad_norm": 0.7330275863785135, + "learning_rate": 1.0201342281879197e-05, + "loss": 0.4107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16619446873664856, + "step": 115, + "valid_targets_mean": 3789.8, + "valid_targets_min": 621 + }, + { + "epoch": 0.18823529411764706, + "grad_norm": 0.618524578115423, + "learning_rate": 1.0648769574944073e-05, + "loss": 0.4116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21853846311569214, + "step": 120, + "valid_targets_mean": 5809.2, + "valid_targets_min": 2354 + }, + { + "epoch": 0.19607843137254902, + "grad_norm": 0.5780165322055293, + "learning_rate": 1.109619686800895e-05, + "loss": 0.4072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1631530225276947, + "step": 125, + "valid_targets_mean": 4298.9, + "valid_targets_min": 907 + }, + { + "epoch": 0.20392156862745098, + "grad_norm": 0.5547050817776145, + "learning_rate": 1.1543624161073828e-05, + "loss": 0.3932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1529003232717514, + "step": 130, + "valid_targets_mean": 4122.0, + "valid_targets_min": 995 + }, + { + "epoch": 0.21176470588235294, + "grad_norm": 0.5810478350386387, + "learning_rate": 1.1991051454138702e-05, + "loss": 0.3848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.216994971036911, + "step": 135, + "valid_targets_mean": 5638.5, + "valid_targets_min": 3599 + }, + { + "epoch": 0.2196078431372549, + "grad_norm": 0.5922588085332883, + "learning_rate": 1.243847874720358e-05, + "loss": 0.3761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18506886065006256, + "step": 140, + "valid_targets_mean": 4467.4, + "valid_targets_min": 3917 + }, + { + "epoch": 0.22745098039215686, + "grad_norm": 0.6014684802309681, + "learning_rate": 1.2885906040268457e-05, + "loss": 0.3835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14172306656837463, + "step": 145, + "valid_targets_mean": 4013.1, + "valid_targets_min": 600 + }, + { + "epoch": 0.23529411764705882, + "grad_norm": 0.6097819527541619, + "learning_rate": 1.3333333333333333e-05, + "loss": 0.3903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1689232587814331, + "step": 150, + "valid_targets_mean": 4505.0, + "valid_targets_min": 4012 + }, + { + "epoch": 0.24313725490196078, + "grad_norm": 0.554747015726934, + "learning_rate": 1.3780760626398211e-05, + "loss": 0.3831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27534186840057373, + "step": 155, + "valid_targets_mean": 6673.6, + "valid_targets_min": 2505 + }, + { + "epoch": 0.25098039215686274, + "grad_norm": 0.8259973561073648, + "learning_rate": 1.4228187919463088e-05, + "loss": 0.3841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1627364158630371, + "step": 160, + "valid_targets_mean": 4557.5, + "valid_targets_min": 2179 + }, + { + "epoch": 0.25882352941176473, + "grad_norm": 0.5575267126622169, + "learning_rate": 1.4675615212527964e-05, + "loss": 0.369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1631404161453247, + "step": 165, + "valid_targets_mean": 4479.1, + "valid_targets_min": 782 + }, + { + "epoch": 0.26666666666666666, + "grad_norm": 0.5975170110533272, + "learning_rate": 1.5123042505592842e-05, + "loss": 0.3851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17251205444335938, + "step": 170, + "valid_targets_mean": 4417.2, + "valid_targets_min": 724 + }, + { + "epoch": 0.27450980392156865, + "grad_norm": 0.5366892107887073, + "learning_rate": 1.5570469798657718e-05, + "loss": 0.3728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19492444396018982, + "step": 175, + "valid_targets_mean": 5861.2, + "valid_targets_min": 3404 + }, + { + "epoch": 0.2823529411764706, + "grad_norm": 0.6754136526395924, + "learning_rate": 1.6017897091722595e-05, + "loss": 0.3871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17513027787208557, + "step": 180, + "valid_targets_mean": 3518.5, + "valid_targets_min": 620 + }, + { + "epoch": 0.2901960784313726, + "grad_norm": 0.9443788799610068, + "learning_rate": 1.6465324384787473e-05, + "loss": 0.3489, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18656358122825623, + "step": 185, + "valid_targets_mean": 5753.5, + "valid_targets_min": 4620 + }, + { + "epoch": 0.2980392156862745, + "grad_norm": 0.5451311543234643, + "learning_rate": 1.691275167785235e-05, + "loss": 0.3599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21605977416038513, + "step": 190, + "valid_targets_mean": 6037.1, + "valid_targets_min": 3270 + }, + { + "epoch": 0.3058823529411765, + "grad_norm": 0.5096399052054448, + "learning_rate": 1.7360178970917228e-05, + "loss": 0.3725, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20450440049171448, + "step": 195, + "valid_targets_mean": 6507.9, + "valid_targets_min": 3275 + }, + { + "epoch": 0.3137254901960784, + "grad_norm": 0.5993350633001354, + "learning_rate": 1.7807606263982106e-05, + "loss": 0.3568, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15169182419776917, + "step": 200, + "valid_targets_mean": 4578.1, + "valid_targets_min": 4111 + }, + { + "epoch": 0.3215686274509804, + "grad_norm": 0.6205306419609562, + "learning_rate": 1.825503355704698e-05, + "loss": 0.366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17773106694221497, + "step": 205, + "valid_targets_mean": 4392.1, + "valid_targets_min": 1069 + }, + { + "epoch": 0.32941176470588235, + "grad_norm": 0.62482187351153, + "learning_rate": 1.8702460850111858e-05, + "loss": 0.3633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1388782262802124, + "step": 210, + "valid_targets_mean": 4299.2, + "valid_targets_min": 3375 + }, + { + "epoch": 0.33725490196078434, + "grad_norm": 0.6208166759487009, + "learning_rate": 1.9149888143176735e-05, + "loss": 0.3486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20655155181884766, + "step": 215, + "valid_targets_mean": 5151.0, + "valid_targets_min": 3970 + }, + { + "epoch": 0.34509803921568627, + "grad_norm": 0.6173058180465927, + "learning_rate": 1.9597315436241613e-05, + "loss": 0.3448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23730814456939697, + "step": 220, + "valid_targets_mean": 5458.9, + "valid_targets_min": 806 + }, + { + "epoch": 0.35294117647058826, + "grad_norm": 0.8313308037805428, + "learning_rate": 2.004474272930649e-05, + "loss": 0.3386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20326246321201324, + "step": 225, + "valid_targets_mean": 5639.2, + "valid_targets_min": 1312 + }, + { + "epoch": 0.3607843137254902, + "grad_norm": 0.5802044604297666, + "learning_rate": 2.0492170022371365e-05, + "loss": 0.3484, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1663266271352768, + "step": 230, + "valid_targets_mean": 5272.0, + "valid_targets_min": 4070 + }, + { + "epoch": 0.3686274509803922, + "grad_norm": 0.5500195062926332, + "learning_rate": 2.0939597315436246e-05, + "loss": 0.366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2033405900001526, + "step": 235, + "valid_targets_mean": 6574.4, + "valid_targets_min": 4332 + }, + { + "epoch": 0.3764705882352941, + "grad_norm": 0.6230935555119714, + "learning_rate": 2.138702460850112e-05, + "loss": 0.3349, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13374356925487518, + "step": 240, + "valid_targets_mean": 3771.4, + "valid_targets_min": 856 + }, + { + "epoch": 0.3843137254901961, + "grad_norm": 0.5902118918894713, + "learning_rate": 2.1834451901565997e-05, + "loss": 0.3293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15112121403217316, + "step": 245, + "valid_targets_mean": 3938.1, + "valid_targets_min": 806 + }, + { + "epoch": 0.39215686274509803, + "grad_norm": 0.5856848973492705, + "learning_rate": 2.228187919463087e-05, + "loss": 0.3454, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17914924025535583, + "step": 250, + "valid_targets_mean": 5226.8, + "valid_targets_min": 949 + }, + { + "epoch": 0.4, + "grad_norm": 0.5808064932029918, + "learning_rate": 2.2729306487695753e-05, + "loss": 0.3224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.168888121843338, + "step": 255, + "valid_targets_mean": 5211.1, + "valid_targets_min": 2843 + }, + { + "epoch": 0.40784313725490196, + "grad_norm": 0.608614659511003, + "learning_rate": 2.3176733780760627e-05, + "loss": 0.3281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16316288709640503, + "step": 260, + "valid_targets_mean": 4988.6, + "valid_targets_min": 794 + }, + { + "epoch": 0.41568627450980394, + "grad_norm": 0.6482303863343926, + "learning_rate": 2.3624161073825508e-05, + "loss": 0.3438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17435654997825623, + "step": 265, + "valid_targets_mean": 4630.8, + "valid_targets_min": 904 + }, + { + "epoch": 0.4235294117647059, + "grad_norm": 0.7427445144818828, + "learning_rate": 2.4071588366890382e-05, + "loss": 0.3292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14953133463859558, + "step": 270, + "valid_targets_mean": 4994.5, + "valid_targets_min": 3067 + }, + { + "epoch": 0.43137254901960786, + "grad_norm": 0.5724650392644556, + "learning_rate": 2.451901565995526e-05, + "loss": 0.3302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17354685068130493, + "step": 275, + "valid_targets_mean": 5621.2, + "valid_targets_min": 3628 + }, + { + "epoch": 0.4392156862745098, + "grad_norm": 0.5950700951789527, + "learning_rate": 2.4966442953020137e-05, + "loss": 0.3341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1778419315814972, + "step": 280, + "valid_targets_mean": 5702.2, + "valid_targets_min": 995 + }, + { + "epoch": 0.4470588235294118, + "grad_norm": 0.6345193957231828, + "learning_rate": 2.5413870246085015e-05, + "loss": 0.3259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20228183269500732, + "step": 285, + "valid_targets_mean": 4570.2, + "valid_targets_min": 782 + }, + { + "epoch": 0.4549019607843137, + "grad_norm": 0.6094068416813229, + "learning_rate": 2.586129753914989e-05, + "loss": 0.3408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13829955458641052, + "step": 290, + "valid_targets_mean": 4302.2, + "valid_targets_min": 2734 + }, + { + "epoch": 0.4627450980392157, + "grad_norm": 0.5825911888294858, + "learning_rate": 2.630872483221477e-05, + "loss": 0.3429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13955016434192657, + "step": 295, + "valid_targets_mean": 4808.9, + "valid_targets_min": 3739 + }, + { + "epoch": 0.47058823529411764, + "grad_norm": 0.6437990917169216, + "learning_rate": 2.6756152125279644e-05, + "loss": 0.3306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18308787047863007, + "step": 300, + "valid_targets_mean": 4868.2, + "valid_targets_min": 681 + }, + { + "epoch": 0.47843137254901963, + "grad_norm": 0.6714443312074112, + "learning_rate": 2.7203579418344522e-05, + "loss": 0.3164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16416051983833313, + "step": 305, + "valid_targets_mean": 4578.1, + "valid_targets_min": 3890 + }, + { + "epoch": 0.48627450980392156, + "grad_norm": 0.5771009814027651, + "learning_rate": 2.76510067114094e-05, + "loss": 0.311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1598922163248062, + "step": 310, + "valid_targets_mean": 5190.5, + "valid_targets_min": 3797 + }, + { + "epoch": 0.49411764705882355, + "grad_norm": 0.5690495376174819, + "learning_rate": 2.8098434004474274e-05, + "loss": 0.3149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19397258758544922, + "step": 315, + "valid_targets_mean": 5327.6, + "valid_targets_min": 3876 + }, + { + "epoch": 0.5019607843137255, + "grad_norm": 0.550480153370413, + "learning_rate": 2.854586129753915e-05, + "loss": 0.3198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15099109709262848, + "step": 320, + "valid_targets_mean": 5396.5, + "valid_targets_min": 4033 + }, + { + "epoch": 0.5098039215686274, + "grad_norm": 0.583247357916581, + "learning_rate": 2.899328859060403e-05, + "loss": 0.3218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11765319854021072, + "step": 325, + "valid_targets_mean": 4748.0, + "valid_targets_min": 3230 + }, + { + "epoch": 0.5176470588235295, + "grad_norm": 0.64154390330704, + "learning_rate": 2.9440715883668906e-05, + "loss": 0.3307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15749859809875488, + "step": 330, + "valid_targets_mean": 4616.2, + "valid_targets_min": 730 + }, + { + "epoch": 0.5254901960784314, + "grad_norm": 0.615191724266002, + "learning_rate": 2.988814317673378e-05, + "loss": 0.3338, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16712582111358643, + "step": 335, + "valid_targets_mean": 4441.6, + "valid_targets_min": 2253 + }, + { + "epoch": 0.5333333333333333, + "grad_norm": 0.5891783226631264, + "learning_rate": 3.033557046979866e-05, + "loss": 0.3265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17673718929290771, + "step": 340, + "valid_targets_mean": 4994.9, + "valid_targets_min": 768 + }, + { + "epoch": 0.5411764705882353, + "grad_norm": 0.5602456880109379, + "learning_rate": 3.078299776286353e-05, + "loss": 0.3232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12272541970014572, + "step": 345, + "valid_targets_mean": 4047.5, + "valid_targets_min": 407 + }, + { + "epoch": 0.5490196078431373, + "grad_norm": 0.5463989570288924, + "learning_rate": 3.123042505592841e-05, + "loss": 0.3263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16012008488178253, + "step": 350, + "valid_targets_mean": 5549.2, + "valid_targets_min": 2882 + }, + { + "epoch": 0.5568627450980392, + "grad_norm": 0.5817982029983223, + "learning_rate": 3.167785234899329e-05, + "loss": 0.3295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17968128621578217, + "step": 355, + "valid_targets_mean": 5364.1, + "valid_targets_min": 685 + }, + { + "epoch": 0.5647058823529412, + "grad_norm": 0.5606408079082489, + "learning_rate": 3.212527964205817e-05, + "loss": 0.3262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18859368562698364, + "step": 360, + "valid_targets_mean": 5831.8, + "valid_targets_min": 3932 + }, + { + "epoch": 0.5725490196078431, + "grad_norm": 0.6040131290277008, + "learning_rate": 3.257270693512304e-05, + "loss": 0.3133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17811569571495056, + "step": 365, + "valid_targets_mean": 5092.4, + "valid_targets_min": 2456 + }, + { + "epoch": 0.5803921568627451, + "grad_norm": 0.5323257843878618, + "learning_rate": 3.3020134228187924e-05, + "loss": 0.3319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1304280161857605, + "step": 370, + "valid_targets_mean": 4231.9, + "valid_targets_min": 504 + }, + { + "epoch": 0.5882352941176471, + "grad_norm": 0.5501225667538716, + "learning_rate": 3.34675615212528e-05, + "loss": 0.3156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15985777974128723, + "step": 375, + "valid_targets_mean": 4744.2, + "valid_targets_min": 907 + }, + { + "epoch": 0.596078431372549, + "grad_norm": 0.6070915816256318, + "learning_rate": 3.391498881431768e-05, + "loss": 0.3068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14768286049365997, + "step": 380, + "valid_targets_mean": 4678.5, + "valid_targets_min": 780 + }, + { + "epoch": 0.6039215686274509, + "grad_norm": 0.5676478206539363, + "learning_rate": 3.436241610738255e-05, + "loss": 0.3132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18851745128631592, + "step": 385, + "valid_targets_mean": 5673.2, + "valid_targets_min": 4270 + }, + { + "epoch": 0.611764705882353, + "grad_norm": 0.6294438971771676, + "learning_rate": 3.4809843400447434e-05, + "loss": 0.3201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16219162940979004, + "step": 390, + "valid_targets_mean": 4658.5, + "valid_targets_min": 3482 + }, + { + "epoch": 0.6196078431372549, + "grad_norm": 0.5517350373337631, + "learning_rate": 3.525727069351231e-05, + "loss": 0.3079, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15507352352142334, + "step": 395, + "valid_targets_mean": 5542.0, + "valid_targets_min": 3454 + }, + { + "epoch": 0.6274509803921569, + "grad_norm": 0.5402705972646643, + "learning_rate": 3.570469798657719e-05, + "loss": 0.3348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2057492733001709, + "step": 400, + "valid_targets_mean": 6888.8, + "valid_targets_min": 3784 + }, + { + "epoch": 0.6352941176470588, + "grad_norm": 0.5745876216369237, + "learning_rate": 3.6152125279642063e-05, + "loss": 0.3244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13152286410331726, + "step": 405, + "valid_targets_mean": 4793.1, + "valid_targets_min": 4053 + }, + { + "epoch": 0.6431372549019608, + "grad_norm": 0.6031541334068352, + "learning_rate": 3.659955257270694e-05, + "loss": 0.3058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18968364596366882, + "step": 410, + "valid_targets_mean": 5629.0, + "valid_targets_min": 4213 + }, + { + "epoch": 0.6509803921568628, + "grad_norm": 0.6164309927080983, + "learning_rate": 3.704697986577181e-05, + "loss": 0.3151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16448290646076202, + "step": 415, + "valid_targets_mean": 4735.1, + "valid_targets_min": 765 + }, + { + "epoch": 0.6588235294117647, + "grad_norm": 0.5359492226720084, + "learning_rate": 3.749440715883669e-05, + "loss": 0.319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19872182607650757, + "step": 420, + "valid_targets_mean": 5724.0, + "valid_targets_min": 648 + }, + { + "epoch": 0.6666666666666666, + "grad_norm": 0.5819044959604062, + "learning_rate": 3.794183445190157e-05, + "loss": 0.3148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14885927736759186, + "step": 425, + "valid_targets_mean": 5043.6, + "valid_targets_min": 812 + }, + { + "epoch": 0.6745098039215687, + "grad_norm": 0.5752622619650046, + "learning_rate": 3.838926174496644e-05, + "loss": 0.3206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14092881977558136, + "step": 430, + "valid_targets_mean": 4815.8, + "valid_targets_min": 632 + }, + { + "epoch": 0.6823529411764706, + "grad_norm": 0.49132427520732735, + "learning_rate": 3.883668903803132e-05, + "loss": 0.3121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14789029955863953, + "step": 435, + "valid_targets_mean": 5252.1, + "valid_targets_min": 3838 + }, + { + "epoch": 0.6901960784313725, + "grad_norm": 0.48093782694535336, + "learning_rate": 3.9284116331096196e-05, + "loss": 0.3011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13488665223121643, + "step": 440, + "valid_targets_mean": 5491.2, + "valid_targets_min": 3145 + }, + { + "epoch": 0.6980392156862745, + "grad_norm": 0.5571196071755746, + "learning_rate": 3.973154362416108e-05, + "loss": 0.3118, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19611987471580505, + "step": 445, + "valid_targets_mean": 5789.0, + "valid_targets_min": 3587 + }, + { + "epoch": 0.7058823529411765, + "grad_norm": 0.6046907322781063, + "learning_rate": 3.999997555873748e-05, + "loss": 0.3123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14690479636192322, + "step": 450, + "valid_targets_mean": 5491.9, + "valid_targets_min": 3758 + }, + { + "epoch": 0.7137254901960784, + "grad_norm": 0.5492823367274015, + "learning_rate": 3.999970059522009e-05, + "loss": 0.3045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14941585063934326, + "step": 455, + "valid_targets_mean": 4707.6, + "valid_targets_min": 3849 + }, + { + "epoch": 0.7215686274509804, + "grad_norm": 0.5380082427998023, + "learning_rate": 3.9999120120821446e-05, + "loss": 0.3248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24840714037418365, + "step": 460, + "valid_targets_mean": 6441.1, + "valid_targets_min": 745 + }, + { + "epoch": 0.7294117647058823, + "grad_norm": 0.5596379062224002, + "learning_rate": 3.999823414440874e-05, + "loss": 0.3182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13548262417316437, + "step": 465, + "valid_targets_mean": 4467.9, + "valid_targets_min": 2927 + }, + { + "epoch": 0.7372549019607844, + "grad_norm": 0.5356703634829085, + "learning_rate": 3.999704267951594e-05, + "loss": 0.2902, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15319597721099854, + "step": 470, + "valid_targets_mean": 4402.6, + "valid_targets_min": 820 + }, + { + "epoch": 0.7450980392156863, + "grad_norm": 0.600066524630049, + "learning_rate": 3.999554574434359e-05, + "loss": 0.3129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11718227714300156, + "step": 475, + "valid_targets_mean": 3519.2, + "valid_targets_min": 590 + }, + { + "epoch": 0.7529411764705882, + "grad_norm": 0.6098828990516277, + "learning_rate": 3.999374336175854e-05, + "loss": 0.3007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1625547856092453, + "step": 480, + "valid_targets_mean": 4139.1, + "valid_targets_min": 664 + }, + { + "epoch": 0.7607843137254902, + "grad_norm": 0.5371084402168345, + "learning_rate": 3.999163555929357e-05, + "loss": 0.3131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14883488416671753, + "step": 485, + "valid_targets_mean": 4719.6, + "valid_targets_min": 928 + }, + { + "epoch": 0.7686274509803922, + "grad_norm": 0.5528904483847205, + "learning_rate": 3.9989222369147e-05, + "loss": 0.3053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.149824321269989, + "step": 490, + "valid_targets_mean": 5001.2, + "valid_targets_min": 3946 + }, + { + "epoch": 0.7764705882352941, + "grad_norm": 0.6173104751559979, + "learning_rate": 3.998650382818217e-05, + "loss": 0.3109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23142695426940918, + "step": 495, + "valid_targets_mean": 5869.8, + "valid_targets_min": 3481 + }, + { + "epoch": 0.7843137254901961, + "grad_norm": 0.5310347193247758, + "learning_rate": 3.998347997792689e-05, + "loss": 0.3061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1767919659614563, + "step": 500, + "valid_targets_mean": 5104.8, + "valid_targets_min": 477 + }, + { + "epoch": 0.792156862745098, + "grad_norm": 0.5225823121767637, + "learning_rate": 3.9980150864572815e-05, + "loss": 0.3066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1493397206068039, + "step": 505, + "valid_targets_mean": 5159.4, + "valid_targets_min": 739 + }, + { + "epoch": 0.8, + "grad_norm": 0.5473700973149909, + "learning_rate": 3.997651653897472e-05, + "loss": 0.2985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1430482566356659, + "step": 510, + "valid_targets_mean": 4216.4, + "valid_targets_min": 636 + }, + { + "epoch": 0.807843137254902, + "grad_norm": 0.5527704785980678, + "learning_rate": 3.997257705664974e-05, + "loss": 0.2894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1335963010787964, + "step": 515, + "valid_targets_mean": 4604.4, + "valid_targets_min": 3499 + }, + { + "epoch": 0.8156862745098039, + "grad_norm": 0.5146849440416694, + "learning_rate": 3.9968332477776505e-05, + "loss": 0.307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11378350108861923, + "step": 520, + "valid_targets_mean": 4262.4, + "valid_targets_min": 3479 + }, + { + "epoch": 0.8235294117647058, + "grad_norm": 0.5786673735607119, + "learning_rate": 3.996378286719425e-05, + "loss": 0.2935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1584271490573883, + "step": 525, + "valid_targets_mean": 4425.1, + "valid_targets_min": 904 + }, + { + "epoch": 0.8313725490196079, + "grad_norm": 0.48691241061943, + "learning_rate": 3.995892829440178e-05, + "loss": 0.3036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14986231923103333, + "step": 530, + "valid_targets_mean": 5350.5, + "valid_targets_min": 3222 + }, + { + "epoch": 0.8392156862745098, + "grad_norm": 0.6882772998345945, + "learning_rate": 3.995376883355645e-05, + "loss": 0.2963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16301119327545166, + "step": 535, + "valid_targets_mean": 5388.0, + "valid_targets_min": 3841 + }, + { + "epoch": 0.8470588235294118, + "grad_norm": 0.5504142868498775, + "learning_rate": 3.994830456347302e-05, + "loss": 0.312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13605545461177826, + "step": 540, + "valid_targets_mean": 4475.0, + "valid_targets_min": 249 + }, + { + "epoch": 0.8549019607843137, + "grad_norm": 0.552541153109021, + "learning_rate": 3.994253556762243e-05, + "loss": 0.301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1425020694732666, + "step": 545, + "valid_targets_mean": 4783.4, + "valid_targets_min": 4019 + }, + { + "epoch": 0.8627450980392157, + "grad_norm": 0.516174073782907, + "learning_rate": 3.993646193413053e-05, + "loss": 0.3165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12146864831447601, + "step": 550, + "valid_targets_mean": 4630.2, + "valid_targets_min": 1989 + }, + { + "epoch": 0.8705882352941177, + "grad_norm": 0.5114622919919676, + "learning_rate": 3.99300837557768e-05, + "loss": 0.2937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.129593163728714, + "step": 555, + "valid_targets_mean": 4601.2, + "valid_targets_min": 3465 + }, + { + "epoch": 0.8784313725490196, + "grad_norm": 0.6180845077447936, + "learning_rate": 3.9923401129992826e-05, + "loss": 0.322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22494003176689148, + "step": 560, + "valid_targets_mean": 4843.1, + "valid_targets_min": 443 + }, + { + "epoch": 0.8862745098039215, + "grad_norm": 0.5938338606255534, + "learning_rate": 3.991641415886089e-05, + "loss": 0.2903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13986267149448395, + "step": 565, + "valid_targets_mean": 4873.4, + "valid_targets_min": 3458 + }, + { + "epoch": 0.8941176470588236, + "grad_norm": 0.5131012574265683, + "learning_rate": 3.990912294911236e-05, + "loss": 0.2932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.141075998544693, + "step": 570, + "valid_targets_mean": 5001.8, + "valid_targets_min": 3638 + }, + { + "epoch": 0.9019607843137255, + "grad_norm": 0.5218539338715148, + "learning_rate": 3.99015276121261e-05, + "loss": 0.3083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18449991941452026, + "step": 575, + "valid_targets_mean": 7555.2, + "valid_targets_min": 4641 + }, + { + "epoch": 0.9098039215686274, + "grad_norm": 0.5584481822366371, + "learning_rate": 3.989362826392676e-05, + "loss": 0.3084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15493915975093842, + "step": 580, + "valid_targets_mean": 5178.5, + "valid_targets_min": 3262 + }, + { + "epoch": 0.9176470588235294, + "grad_norm": 0.5330193946594204, + "learning_rate": 3.9885425025183e-05, + "loss": 0.2851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12677499651908875, + "step": 585, + "valid_targets_mean": 4999.5, + "valid_targets_min": 3634 + }, + { + "epoch": 0.9254901960784314, + "grad_norm": 0.555409429804303, + "learning_rate": 3.9876918021205606e-05, + "loss": 0.2879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16259485483169556, + "step": 590, + "valid_targets_mean": 4657.9, + "valid_targets_min": 766 + }, + { + "epoch": 0.9333333333333333, + "grad_norm": 0.5413694736991173, + "learning_rate": 3.9868107381945646e-05, + "loss": 0.2882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14090581238269806, + "step": 595, + "valid_targets_mean": 4137.2, + "valid_targets_min": 805 + }, + { + "epoch": 0.9411764705882353, + "grad_norm": 0.5097233576500176, + "learning_rate": 3.9858993241992454e-05, + "loss": 0.3047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16496001183986664, + "step": 600, + "valid_targets_mean": 5535.8, + "valid_targets_min": 3537 + }, + { + "epoch": 0.9490196078431372, + "grad_norm": 0.565606495791218, + "learning_rate": 3.984957574057155e-05, + "loss": 0.3062, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1719355583190918, + "step": 605, + "valid_targets_mean": 5035.8, + "valid_targets_min": 3531 + }, + { + "epoch": 0.9568627450980393, + "grad_norm": 0.5662622685590348, + "learning_rate": 3.983985502154254e-05, + "loss": 0.2913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1330733746290207, + "step": 610, + "valid_targets_mean": 4509.8, + "valid_targets_min": 690 + }, + { + "epoch": 0.9647058823529412, + "grad_norm": 0.650042780936349, + "learning_rate": 3.982983123339694e-05, + "loss": 0.2949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16050265729427338, + "step": 615, + "valid_targets_mean": 4618.6, + "valid_targets_min": 3628 + }, + { + "epoch": 0.9725490196078431, + "grad_norm": 0.4789311071288452, + "learning_rate": 3.9819504529255836e-05, + "loss": 0.3078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1295998990535736, + "step": 620, + "valid_targets_mean": 5019.6, + "valid_targets_min": 604 + }, + { + "epoch": 0.9803921568627451, + "grad_norm": 0.5185497844397633, + "learning_rate": 3.980887506686763e-05, + "loss": 0.2901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11702439188957214, + "step": 625, + "valid_targets_mean": 4191.5, + "valid_targets_min": 991 + }, + { + "epoch": 0.9882352941176471, + "grad_norm": 0.5290223238660421, + "learning_rate": 3.9797943008605575e-05, + "loss": 0.2913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14580155909061432, + "step": 630, + "valid_targets_mean": 4653.8, + "valid_targets_min": 906 + }, + { + "epoch": 0.996078431372549, + "grad_norm": 0.5266373986466892, + "learning_rate": 3.978670852146529e-05, + "loss": 0.2889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13359291851520538, + "step": 635, + "valid_targets_mean": 4390.6, + "valid_targets_min": 3725 + }, + { + "epoch": 1.0031372549019608, + "grad_norm": 0.47547522888568966, + "learning_rate": 3.977517177706226e-05, + "loss": 0.2951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12808755040168762, + "step": 640, + "valid_targets_mean": 5032.6, + "valid_targets_min": 558 + }, + { + "epoch": 1.0109803921568628, + "grad_norm": 0.5103283050856352, + "learning_rate": 3.976333295162918e-05, + "loss": 0.2754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15815523266792297, + "step": 645, + "valid_targets_mean": 4782.9, + "valid_targets_min": 3797 + }, + { + "epoch": 1.0188235294117647, + "grad_norm": 0.5437229569859977, + "learning_rate": 3.975119222601323e-05, + "loss": 0.2758, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1376689076423645, + "step": 650, + "valid_targets_mean": 4856.1, + "valid_targets_min": 2930 + }, + { + "epoch": 1.0266666666666666, + "grad_norm": 0.47980311335397074, + "learning_rate": 3.9738749785673406e-05, + "loss": 0.2882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15655337274074554, + "step": 655, + "valid_targets_mean": 4985.4, + "valid_targets_min": 3526 + }, + { + "epoch": 1.0345098039215685, + "grad_norm": 0.6311205327783157, + "learning_rate": 3.972600582067758e-05, + "loss": 0.2869, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1531863808631897, + "step": 660, + "valid_targets_mean": 4498.0, + "valid_targets_min": 496 + }, + { + "epoch": 1.0423529411764705, + "grad_norm": 0.5716799603731424, + "learning_rate": 3.971296052569967e-05, + "loss": 0.2863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1194576546549797, + "step": 665, + "valid_targets_mean": 4117.6, + "valid_targets_min": 3617 + }, + { + "epoch": 1.0501960784313726, + "grad_norm": 0.4684618466869646, + "learning_rate": 3.9699614100016634e-05, + "loss": 0.2789, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16516944766044617, + "step": 670, + "valid_targets_mean": 5447.8, + "valid_targets_min": 4101 + }, + { + "epoch": 1.0580392156862746, + "grad_norm": 0.49367470728777396, + "learning_rate": 3.968596674750545e-05, + "loss": 0.2856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14375250041484833, + "step": 675, + "valid_targets_mean": 5414.5, + "valid_targets_min": 3837 + }, + { + "epoch": 1.0658823529411765, + "grad_norm": 0.46044503507781187, + "learning_rate": 3.967201867663996e-05, + "loss": 0.2853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16253119707107544, + "step": 680, + "valid_targets_mean": 6025.1, + "valid_targets_min": 392 + }, + { + "epoch": 1.0737254901960784, + "grad_norm": 0.6024045182349768, + "learning_rate": 3.9657770100487736e-05, + "loss": 0.2778, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13948144018650055, + "step": 685, + "valid_targets_mean": 5004.2, + "valid_targets_min": 3757 + }, + { + "epoch": 1.0815686274509804, + "grad_norm": 0.5157512027527342, + "learning_rate": 3.964322123670678e-05, + "loss": 0.2792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1478308141231537, + "step": 690, + "valid_targets_mean": 4180.2, + "valid_targets_min": 654 + }, + { + "epoch": 1.0894117647058823, + "grad_norm": 0.5002569272875327, + "learning_rate": 3.9628372307542225e-05, + "loss": 0.2957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1788061261177063, + "step": 695, + "valid_targets_mean": 5319.0, + "valid_targets_min": 2231 + }, + { + "epoch": 1.0972549019607842, + "grad_norm": 0.5100097718835788, + "learning_rate": 3.961322353982295e-05, + "loss": 0.2925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1128082424402237, + "step": 700, + "valid_targets_mean": 4365.6, + "valid_targets_min": 3235 + }, + { + "epoch": 1.1050980392156862, + "grad_norm": 0.5109172456711149, + "learning_rate": 3.959777516495809e-05, + "loss": 0.2984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1364116221666336, + "step": 705, + "valid_targets_mean": 3845.6, + "valid_targets_min": 836 + }, + { + "epoch": 1.1129411764705883, + "grad_norm": 0.49047092157775113, + "learning_rate": 3.95820274189335e-05, + "loss": 0.2898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17177531123161316, + "step": 710, + "valid_targets_mean": 5469.4, + "valid_targets_min": 4127 + }, + { + "epoch": 1.1207843137254903, + "grad_norm": 0.4843667352820801, + "learning_rate": 3.956598054230816e-05, + "loss": 0.2954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13446100056171417, + "step": 715, + "valid_targets_mean": 4805.4, + "valid_targets_min": 3414 + }, + { + "epoch": 1.1286274509803922, + "grad_norm": 0.5326626591489633, + "learning_rate": 3.9549634780210536e-05, + "loss": 0.2879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15380431711673737, + "step": 720, + "valid_targets_mean": 5294.5, + "valid_targets_min": 3954 + }, + { + "epoch": 1.1364705882352941, + "grad_norm": 0.506684867506722, + "learning_rate": 3.953299038233476e-05, + "loss": 0.2806, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16172771155834198, + "step": 725, + "valid_targets_mean": 6202.2, + "valid_targets_min": 4193 + }, + { + "epoch": 1.144313725490196, + "grad_norm": 0.49900322782201706, + "learning_rate": 3.9516047602936864e-05, + "loss": 0.2894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1386362463235855, + "step": 730, + "valid_targets_mean": 5224.0, + "valid_targets_min": 3954 + }, + { + "epoch": 1.152156862745098, + "grad_norm": 0.5485013506223598, + "learning_rate": 3.949880670083091e-05, + "loss": 0.2887, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1538248062133789, + "step": 735, + "valid_targets_mean": 4433.6, + "valid_targets_min": 882 + }, + { + "epoch": 1.16, + "grad_norm": 0.5114165877370134, + "learning_rate": 3.9481267939385e-05, + "loss": 0.3061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17208515107631683, + "step": 740, + "valid_targets_mean": 4607.8, + "valid_targets_min": 1044 + }, + { + "epoch": 1.167843137254902, + "grad_norm": 0.5140897776212602, + "learning_rate": 3.946343158651725e-05, + "loss": 0.2872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19184085726737976, + "step": 745, + "valid_targets_mean": 6692.2, + "valid_targets_min": 4235 + }, + { + "epoch": 1.175686274509804, + "grad_norm": 0.510349829135783, + "learning_rate": 3.944529791469175e-05, + "loss": 0.2888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15706050395965576, + "step": 750, + "valid_targets_mean": 5801.4, + "valid_targets_min": 2930 + }, + { + "epoch": 1.183529411764706, + "grad_norm": 0.5139210232913193, + "learning_rate": 3.9426867200914355e-05, + "loss": 0.285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11696702986955643, + "step": 755, + "valid_targets_mean": 4200.5, + "valid_targets_min": 580 + }, + { + "epoch": 1.1913725490196079, + "grad_norm": 0.6138467891844176, + "learning_rate": 3.9408139726728444e-05, + "loss": 0.2866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13788250088691711, + "step": 760, + "valid_targets_mean": 4887.9, + "valid_targets_min": 3979 + }, + { + "epoch": 1.1992156862745098, + "grad_norm": 0.5274585474600504, + "learning_rate": 3.9389115778210666e-05, + "loss": 0.2765, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15761765837669373, + "step": 765, + "valid_targets_mean": 5229.5, + "valid_targets_min": 558 + }, + { + "epoch": 1.2070588235294117, + "grad_norm": 0.5045239215906021, + "learning_rate": 3.936979564596653e-05, + "loss": 0.2842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14591068029403687, + "step": 770, + "valid_targets_mean": 4233.5, + "valid_targets_min": 919 + }, + { + "epoch": 1.2149019607843137, + "grad_norm": 0.5278256503203437, + "learning_rate": 3.935017962512599e-05, + "loss": 0.2814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11342287063598633, + "step": 775, + "valid_targets_mean": 4776.5, + "valid_targets_min": 3375 + }, + { + "epoch": 1.2227450980392156, + "grad_norm": 0.47582043807758717, + "learning_rate": 3.933026801533893e-05, + "loss": 0.298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15707777440547943, + "step": 780, + "valid_targets_mean": 5618.9, + "valid_targets_min": 4369 + }, + { + "epoch": 1.2305882352941175, + "grad_norm": 0.45934059705023184, + "learning_rate": 3.9310061120770556e-05, + "loss": 0.2795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13776640594005585, + "step": 785, + "valid_targets_mean": 5107.0, + "valid_targets_min": 4087 + }, + { + "epoch": 1.2384313725490197, + "grad_norm": 0.46414624555908107, + "learning_rate": 3.928955925009682e-05, + "loss": 0.2605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1537836790084839, + "step": 790, + "valid_targets_mean": 4994.2, + "valid_targets_min": 3250 + }, + { + "epoch": 1.2462745098039216, + "grad_norm": 0.4408619533536079, + "learning_rate": 3.9268762716499615e-05, + "loss": 0.2693, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13994896411895752, + "step": 795, + "valid_targets_mean": 6135.1, + "valid_targets_min": 3933 + }, + { + "epoch": 1.2541176470588236, + "grad_norm": 0.4736658560562933, + "learning_rate": 3.924767183766208e-05, + "loss": 0.2917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12094531208276749, + "step": 800, + "valid_targets_mean": 4518.0, + "valid_targets_min": 1112 + }, + { + "epoch": 1.2619607843137255, + "grad_norm": 0.5874137322174587, + "learning_rate": 3.922628693576369e-05, + "loss": 0.2773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14845438301563263, + "step": 805, + "valid_targets_mean": 4616.0, + "valid_targets_min": 1066 + }, + { + "epoch": 1.2698039215686274, + "grad_norm": 0.47373845837495127, + "learning_rate": 3.9204608337475323e-05, + "loss": 0.2754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1442110240459442, + "step": 810, + "valid_targets_mean": 5869.6, + "valid_targets_min": 4108 + }, + { + "epoch": 1.2776470588235294, + "grad_norm": 0.5594446464578944, + "learning_rate": 3.9182636373954345e-05, + "loss": 0.2918, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18353107571601868, + "step": 815, + "valid_targets_mean": 5140.8, + "valid_targets_min": 275 + }, + { + "epoch": 1.2854901960784313, + "grad_norm": 0.4574990179860623, + "learning_rate": 3.916037138083947e-05, + "loss": 0.2836, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12598153948783875, + "step": 820, + "valid_targets_mean": 5185.1, + "valid_targets_min": 3440 + }, + { + "epoch": 1.2933333333333334, + "grad_norm": 0.40740564941785307, + "learning_rate": 3.913781369824567e-05, + "loss": 0.275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14568153023719788, + "step": 825, + "valid_targets_mean": 6277.1, + "valid_targets_min": 3898 + }, + { + "epoch": 1.3011764705882354, + "grad_norm": 0.44929897069661345, + "learning_rate": 3.911496367075897e-05, + "loss": 0.2935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08832447975873947, + "step": 830, + "valid_targets_mean": 4550.4, + "valid_targets_min": 3266 + }, + { + "epoch": 1.3090196078431373, + "grad_norm": 0.4838672180760848, + "learning_rate": 3.909182164743122e-05, + "loss": 0.2821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1226353794336319, + "step": 835, + "valid_targets_mean": 5036.8, + "valid_targets_min": 1606 + }, + { + "epoch": 1.3168627450980392, + "grad_norm": 0.5483780903684279, + "learning_rate": 3.906838798177469e-05, + "loss": 0.2772, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13118325173854828, + "step": 840, + "valid_targets_mean": 4114.9, + "valid_targets_min": 776 + }, + { + "epoch": 1.3247058823529412, + "grad_norm": 0.46795419074341116, + "learning_rate": 3.904466303175674e-05, + "loss": 0.2993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13329827785491943, + "step": 845, + "valid_targets_mean": 5061.5, + "valid_targets_min": 605 + }, + { + "epoch": 1.332549019607843, + "grad_norm": 0.5731984387593678, + "learning_rate": 3.90206471597943e-05, + "loss": 0.267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1332540065050125, + "step": 850, + "valid_targets_mean": 4545.1, + "valid_targets_min": 3721 + }, + { + "epoch": 1.340392156862745, + "grad_norm": 0.493596072249093, + "learning_rate": 3.8996340732748396e-05, + "loss": 0.2832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15036369860172272, + "step": 855, + "valid_targets_mean": 5181.5, + "valid_targets_min": 449 + }, + { + "epoch": 1.348235294117647, + "grad_norm": 0.5153894528113263, + "learning_rate": 3.8971744121918465e-05, + "loss": 0.2852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13004739582538605, + "step": 860, + "valid_targets_mean": 5174.0, + "valid_targets_min": 4119 + }, + { + "epoch": 1.356078431372549, + "grad_norm": 0.531726998826914, + "learning_rate": 3.894685770303675e-05, + "loss": 0.2831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16023707389831543, + "step": 865, + "valid_targets_mean": 4943.9, + "valid_targets_min": 1176 + }, + { + "epoch": 1.3639215686274508, + "grad_norm": 0.4984274476423372, + "learning_rate": 3.8921681856262535e-05, + "loss": 0.2845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15315961837768555, + "step": 870, + "valid_targets_mean": 5614.4, + "valid_targets_min": 3721 + }, + { + "epoch": 1.371764705882353, + "grad_norm": 0.4524127448562263, + "learning_rate": 3.889621696617633e-05, + "loss": 0.2694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1313284933567047, + "step": 875, + "valid_targets_mean": 4431.6, + "valid_targets_min": 710 + }, + { + "epoch": 1.379607843137255, + "grad_norm": 0.578828012700717, + "learning_rate": 3.887046342177401e-05, + "loss": 0.2886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15103895962238312, + "step": 880, + "valid_targets_mean": 3760.1, + "valid_targets_min": 928 + }, + { + "epoch": 1.3874509803921569, + "grad_norm": 0.47108002593851134, + "learning_rate": 3.884442161646086e-05, + "loss": 0.2835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1282312572002411, + "step": 885, + "valid_targets_mean": 4732.4, + "valid_targets_min": 881 + }, + { + "epoch": 1.3952941176470588, + "grad_norm": 0.46403908903025914, + "learning_rate": 3.881809194804559e-05, + "loss": 0.2719, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14507359266281128, + "step": 890, + "valid_targets_mean": 5339.4, + "valid_targets_min": 3849 + }, + { + "epoch": 1.4031372549019607, + "grad_norm": 0.5164491186153499, + "learning_rate": 3.879147481873423e-05, + "loss": 0.2761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14479577541351318, + "step": 895, + "valid_targets_mean": 4245.0, + "valid_targets_min": 1211 + }, + { + "epoch": 1.4109803921568629, + "grad_norm": 0.47262134352541796, + "learning_rate": 3.876457063512399e-05, + "loss": 0.2814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14927907288074493, + "step": 900, + "valid_targets_mean": 5170.5, + "valid_targets_min": 3806 + }, + { + "epoch": 1.4188235294117648, + "grad_norm": 0.48030885275086166, + "learning_rate": 3.873737980819707e-05, + "loss": 0.284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1346939206123352, + "step": 905, + "valid_targets_mean": 4743.6, + "valid_targets_min": 2538 + }, + { + "epoch": 1.4266666666666667, + "grad_norm": 0.5198341770217074, + "learning_rate": 3.870990275331437e-05, + "loss": 0.2862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17289170622825623, + "step": 910, + "valid_targets_mean": 4804.0, + "valid_targets_min": 808 + }, + { + "epoch": 1.4345098039215687, + "grad_norm": 0.45328710388368715, + "learning_rate": 3.8682139890209124e-05, + "loss": 0.2786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17157664895057678, + "step": 915, + "valid_targets_mean": 6150.1, + "valid_targets_min": 3749 + }, + { + "epoch": 1.4423529411764706, + "grad_norm": 0.5085841911130472, + "learning_rate": 3.865409164298052e-05, + "loss": 0.2878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13336902856826782, + "step": 920, + "valid_targets_mean": 4057.1, + "valid_targets_min": 731 + }, + { + "epoch": 1.4501960784313725, + "grad_norm": 0.4994287763598936, + "learning_rate": 3.8625758440087213e-05, + "loss": 0.2768, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16101914644241333, + "step": 925, + "valid_targets_mean": 4822.4, + "valid_targets_min": 3827 + }, + { + "epoch": 1.4580392156862745, + "grad_norm": 0.4941923929879018, + "learning_rate": 3.859714071434078e-05, + "loss": 0.2755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16710661351680756, + "step": 930, + "valid_targets_mean": 5267.9, + "valid_targets_min": 882 + }, + { + "epoch": 1.4658823529411764, + "grad_norm": 0.48327572840974614, + "learning_rate": 3.8568238902899085e-05, + "loss": 0.2711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1417180448770523, + "step": 935, + "valid_targets_mean": 4978.8, + "valid_targets_min": 778 + }, + { + "epoch": 1.4737254901960783, + "grad_norm": 0.44695203493729635, + "learning_rate": 3.853905344725963e-05, + "loss": 0.2908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13325612246990204, + "step": 940, + "valid_targets_mean": 5665.6, + "valid_targets_min": 3905 + }, + { + "epoch": 1.4815686274509803, + "grad_norm": 0.5099534725059365, + "learning_rate": 3.850958479325281e-05, + "loss": 0.2809, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12173628807067871, + "step": 945, + "valid_targets_mean": 4427.0, + "valid_targets_min": 1989 + }, + { + "epoch": 1.4894117647058824, + "grad_norm": 0.5134884915273966, + "learning_rate": 3.8479833391035085e-05, + "loss": 0.2699, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11635063588619232, + "step": 950, + "valid_targets_mean": 4344.9, + "valid_targets_min": 443 + }, + { + "epoch": 1.4972549019607844, + "grad_norm": 0.480513750698937, + "learning_rate": 3.844979969508211e-05, + "loss": 0.2878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17787393927574158, + "step": 955, + "valid_targets_mean": 5552.0, + "valid_targets_min": 695 + }, + { + "epoch": 1.5050980392156863, + "grad_norm": 0.4766337557657441, + "learning_rate": 3.84194841641818e-05, + "loss": 0.2809, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1378069669008255, + "step": 960, + "valid_targets_mean": 4584.0, + "valid_targets_min": 897 + }, + { + "epoch": 1.5129411764705882, + "grad_norm": 0.44495383748209494, + "learning_rate": 3.838888726142732e-05, + "loss": 0.2725, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1239204853773117, + "step": 965, + "valid_targets_mean": 4935.8, + "valid_targets_min": 3706 + }, + { + "epoch": 1.5207843137254902, + "grad_norm": 0.4861707300267207, + "learning_rate": 3.8358009454210006e-05, + "loss": 0.282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1610291451215744, + "step": 970, + "valid_targets_mean": 5325.9, + "valid_targets_min": 2552 + }, + { + "epoch": 1.5286274509803923, + "grad_norm": 0.46843425756768353, + "learning_rate": 3.8326851214212206e-05, + "loss": 0.2704, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10426193475723267, + "step": 975, + "valid_targets_mean": 3031.6, + "valid_targets_min": 677 + }, + { + "epoch": 1.5364705882352943, + "grad_norm": 0.4787661485970747, + "learning_rate": 3.829541301740014e-05, + "loss": 0.2584, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11571415513753891, + "step": 980, + "valid_targets_mean": 4581.1, + "valid_targets_min": 1164 + }, + { + "epoch": 1.5443137254901962, + "grad_norm": 0.4798542433376364, + "learning_rate": 3.826369534401653e-05, + "loss": 0.2769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12648630142211914, + "step": 985, + "valid_targets_mean": 4808.4, + "valid_targets_min": 3196 + }, + { + "epoch": 1.5521568627450981, + "grad_norm": 0.4524354796896961, + "learning_rate": 3.823169867857337e-05, + "loss": 0.2739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11299093067646027, + "step": 990, + "valid_targets_mean": 4355.0, + "valid_targets_min": 3430 + }, + { + "epoch": 1.56, + "grad_norm": 0.48021380766661625, + "learning_rate": 3.819942350984444e-05, + "loss": 0.2828, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11084786802530289, + "step": 995, + "valid_targets_mean": 4540.6, + "valid_targets_min": 4192 + }, + { + "epoch": 1.567843137254902, + "grad_norm": 0.45077386317800505, + "learning_rate": 3.816687033085788e-05, + "loss": 0.271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14281418919563293, + "step": 1000, + "valid_targets_mean": 4483.5, + "valid_targets_min": 973 + }, + { + "epoch": 1.575686274509804, + "grad_norm": 0.49805538601357824, + "learning_rate": 3.813403963888866e-05, + "loss": 0.2767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10800270736217499, + "step": 1005, + "valid_targets_mean": 4369.6, + "valid_targets_min": 1821 + }, + { + "epoch": 1.5835294117647059, + "grad_norm": 0.4505476380153165, + "learning_rate": 3.810093193545097e-05, + "loss": 0.2663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17713075876235962, + "step": 1010, + "valid_targets_mean": 5999.9, + "valid_targets_min": 904 + }, + { + "epoch": 1.5913725490196078, + "grad_norm": 0.4575194505901327, + "learning_rate": 3.806754772629055e-05, + "loss": 0.279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14325906336307526, + "step": 1015, + "valid_targets_mean": 4706.1, + "valid_targets_min": 464 + }, + { + "epoch": 1.5992156862745097, + "grad_norm": 0.45014150592540364, + "learning_rate": 3.8033887521377015e-05, + "loss": 0.2671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14992156624794006, + "step": 1020, + "valid_targets_mean": 5189.2, + "valid_targets_min": 3654 + }, + { + "epoch": 1.6070588235294117, + "grad_norm": 0.4491623171932943, + "learning_rate": 3.799995183489599e-05, + "loss": 0.2792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17521008849143982, + "step": 1025, + "valid_targets_mean": 6152.9, + "valid_targets_min": 4129 + }, + { + "epoch": 1.6149019607843136, + "grad_norm": 0.4964276596194231, + "learning_rate": 3.796574118524131e-05, + "loss": 0.2795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12860007584095, + "step": 1030, + "valid_targets_mean": 4406.8, + "valid_targets_min": 3784 + }, + { + "epoch": 1.6227450980392157, + "grad_norm": 0.45560423944040035, + "learning_rate": 3.793125609500709e-05, + "loss": 0.2853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1591438204050064, + "step": 1035, + "valid_targets_mean": 6584.6, + "valid_targets_min": 3599 + }, + { + "epoch": 1.6305882352941177, + "grad_norm": 0.4408094419647726, + "learning_rate": 3.789649709097973e-05, + "loss": 0.2813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1180456355214119, + "step": 1040, + "valid_targets_mean": 4745.6, + "valid_targets_min": 2823 + }, + { + "epoch": 1.6384313725490196, + "grad_norm": 0.48261746494460517, + "learning_rate": 3.786146470412988e-05, + "loss": 0.2718, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13682833313941956, + "step": 1045, + "valid_targets_mean": 4307.1, + "valid_targets_min": 784 + }, + { + "epoch": 1.6462745098039215, + "grad_norm": 0.5081155036574729, + "learning_rate": 3.782615946960432e-05, + "loss": 0.2782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12664803862571716, + "step": 1050, + "valid_targets_mean": 5285.6, + "valid_targets_min": 696 + }, + { + "epoch": 1.6541176470588237, + "grad_norm": 0.4195569376421684, + "learning_rate": 3.779058192671777e-05, + "loss": 0.2877, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1745804250240326, + "step": 1055, + "valid_targets_mean": 6423.2, + "valid_targets_min": 3217 + }, + { + "epoch": 1.6619607843137256, + "grad_norm": 0.4698726821958353, + "learning_rate": 3.775473261894472e-05, + "loss": 0.2699, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16999664902687073, + "step": 1060, + "valid_targets_mean": 6138.6, + "valid_targets_min": 3941 + }, + { + "epoch": 1.6698039215686276, + "grad_norm": 0.41817128576043927, + "learning_rate": 3.771861209391103e-05, + "loss": 0.267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1361289620399475, + "step": 1065, + "valid_targets_mean": 5478.5, + "valid_targets_min": 3265 + }, + { + "epoch": 1.6776470588235295, + "grad_norm": 0.5313533412781013, + "learning_rate": 3.768222090338564e-05, + "loss": 0.2901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13523992896080017, + "step": 1070, + "valid_targets_mean": 3810.9, + "valid_targets_min": 668 + }, + { + "epoch": 1.6854901960784314, + "grad_norm": 0.44784161225326163, + "learning_rate": 3.7645559603272104e-05, + "loss": 0.2759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14014381170272827, + "step": 1075, + "valid_targets_mean": 5192.9, + "valid_targets_min": 701 + }, + { + "epoch": 1.6933333333333334, + "grad_norm": 0.4745633540456, + "learning_rate": 3.76086287536001e-05, + "loss": 0.2739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13647784292697906, + "step": 1080, + "valid_targets_mean": 4379.9, + "valid_targets_min": 786 + }, + { + "epoch": 1.7011764705882353, + "grad_norm": 0.4406930109228543, + "learning_rate": 3.757142891851691e-05, + "loss": 0.2641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11379043757915497, + "step": 1085, + "valid_targets_mean": 4284.6, + "valid_targets_min": 2690 + }, + { + "epoch": 1.7090196078431372, + "grad_norm": 0.4381588247078304, + "learning_rate": 3.753396066627876e-05, + "loss": 0.2825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13208818435668945, + "step": 1090, + "valid_targets_mean": 4889.5, + "valid_targets_min": 3500 + }, + { + "epoch": 1.7168627450980392, + "grad_norm": 0.4494074671045861, + "learning_rate": 3.749622456924215e-05, + "loss": 0.2755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12918317317962646, + "step": 1095, + "valid_targets_mean": 5156.4, + "valid_targets_min": 3659 + }, + { + "epoch": 1.724705882352941, + "grad_norm": 0.459960762817952, + "learning_rate": 3.745822120385512e-05, + "loss": 0.2903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11129502952098846, + "step": 1100, + "valid_targets_mean": 4385.8, + "valid_targets_min": 736 + }, + { + "epoch": 1.732549019607843, + "grad_norm": 0.47940383452188756, + "learning_rate": 3.7419951150648445e-05, + "loss": 0.2671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10941147804260254, + "step": 1105, + "valid_targets_mean": 3149.5, + "valid_targets_min": 808 + }, + { + "epoch": 1.740392156862745, + "grad_norm": 0.4821955655374367, + "learning_rate": 3.738141499422677e-05, + "loss": 0.2733, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13078473508358002, + "step": 1110, + "valid_targets_mean": 4533.4, + "valid_targets_min": 1115 + }, + { + "epoch": 1.748235294117647, + "grad_norm": 0.5819716977898828, + "learning_rate": 3.7342613323259654e-05, + "loss": 0.2792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11359615623950958, + "step": 1115, + "valid_targets_mean": 4173.2, + "valid_targets_min": 757 + }, + { + "epoch": 1.756078431372549, + "grad_norm": 0.4021276805738122, + "learning_rate": 3.7303546730472607e-05, + "loss": 0.269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14241759479045868, + "step": 1120, + "valid_targets_mean": 5989.4, + "valid_targets_min": 4148 + }, + { + "epoch": 1.763921568627451, + "grad_norm": 0.4882268950005422, + "learning_rate": 3.726421581263802e-05, + "loss": 0.2689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1279492974281311, + "step": 1125, + "valid_targets_mean": 4249.0, + "valid_targets_min": 604 + }, + { + "epoch": 1.771764705882353, + "grad_norm": 0.4391268851806516, + "learning_rate": 3.722462117056607e-05, + "loss": 0.2718, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17066633701324463, + "step": 1130, + "valid_targets_mean": 5343.8, + "valid_targets_min": 3800 + }, + { + "epoch": 1.779607843137255, + "grad_norm": 0.41715519290088876, + "learning_rate": 3.718476340909548e-05, + "loss": 0.2682, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12390994280576706, + "step": 1135, + "valid_targets_mean": 5063.4, + "valid_targets_min": 3835 + }, + { + "epoch": 1.787450980392157, + "grad_norm": 0.43055363176019373, + "learning_rate": 3.714464313708439e-05, + "loss": 0.2711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12827664613723755, + "step": 1140, + "valid_targets_mean": 5404.1, + "valid_targets_min": 3878 + }, + { + "epoch": 1.795294117647059, + "grad_norm": 0.4467983247147168, + "learning_rate": 3.710426096740094e-05, + "loss": 0.2845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11275273561477661, + "step": 1145, + "valid_targets_mean": 5128.1, + "valid_targets_min": 3606 + }, + { + "epoch": 1.8031372549019609, + "grad_norm": 0.4532080165298866, + "learning_rate": 3.7063617516913974e-05, + "loss": 0.263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10102865099906921, + "step": 1150, + "valid_targets_mean": 3786.1, + "valid_targets_min": 601 + }, + { + "epoch": 1.8109803921568628, + "grad_norm": 0.45477210640708865, + "learning_rate": 3.7022713406483626e-05, + "loss": 0.2636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12230783700942993, + "step": 1155, + "valid_targets_mean": 4558.8, + "valid_targets_min": 2708 + }, + { + "epoch": 1.8188235294117647, + "grad_norm": 0.4331370541967343, + "learning_rate": 3.698154926095177e-05, + "loss": 0.2773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12535810470581055, + "step": 1160, + "valid_targets_mean": 5213.6, + "valid_targets_min": 3787 + }, + { + "epoch": 1.8266666666666667, + "grad_norm": 0.4121000726174262, + "learning_rate": 3.694012570913254e-05, + "loss": 0.2694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1354580819606781, + "step": 1165, + "valid_targets_mean": 5838.6, + "valid_targets_min": 4390 + }, + { + "epoch": 1.8345098039215686, + "grad_norm": 0.41764883679327386, + "learning_rate": 3.689844338380271e-05, + "loss": 0.276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16744661331176758, + "step": 1170, + "valid_targets_mean": 6286.6, + "valid_targets_min": 3685 + }, + { + "epoch": 1.8423529411764705, + "grad_norm": 0.4777235188577736, + "learning_rate": 3.6856502921692004e-05, + "loss": 0.2801, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14872866868972778, + "step": 1175, + "valid_targets_mean": 4034.6, + "valid_targets_min": 501 + }, + { + "epoch": 1.8501960784313725, + "grad_norm": 0.4537327724299662, + "learning_rate": 3.681430496347339e-05, + "loss": 0.2756, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12654449045658112, + "step": 1180, + "valid_targets_mean": 4453.2, + "valid_targets_min": 1911 + }, + { + "epoch": 1.8580392156862744, + "grad_norm": 0.4725361478945017, + "learning_rate": 3.677185015375329e-05, + "loss": 0.2796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11899863183498383, + "step": 1185, + "valid_targets_mean": 3511.9, + "valid_targets_min": 637 + }, + { + "epoch": 1.8658823529411763, + "grad_norm": 0.43676745421678775, + "learning_rate": 3.672913914106173e-05, + "loss": 0.2759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11573658138513565, + "step": 1190, + "valid_targets_mean": 4290.5, + "valid_targets_min": 1293 + }, + { + "epoch": 1.8737254901960785, + "grad_norm": 0.4929717954552796, + "learning_rate": 3.6686172577842425e-05, + "loss": 0.2817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13691729307174683, + "step": 1195, + "valid_targets_mean": 4568.4, + "valid_targets_min": 659 + }, + { + "epoch": 1.8815686274509804, + "grad_norm": 0.4405003687632648, + "learning_rate": 3.6642951120442834e-05, + "loss": 0.2835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1263415813446045, + "step": 1200, + "valid_targets_mean": 5306.5, + "valid_targets_min": 4122 + }, + { + "epoch": 1.8894117647058823, + "grad_norm": 0.44460183123100777, + "learning_rate": 3.6599475429104125e-05, + "loss": 0.2921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20764252543449402, + "step": 1205, + "valid_targets_mean": 7194.6, + "valid_targets_min": 3276 + }, + { + "epoch": 1.8972549019607843, + "grad_norm": 0.44478346536222496, + "learning_rate": 3.655574616795108e-05, + "loss": 0.2602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14065058529376984, + "step": 1210, + "valid_targets_mean": 5352.9, + "valid_targets_min": 3593 + }, + { + "epoch": 1.9050980392156864, + "grad_norm": 0.4419280017991199, + "learning_rate": 3.651176400498194e-05, + "loss": 0.2724, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16233976185321808, + "step": 1215, + "valid_targets_mean": 5459.9, + "valid_targets_min": 4407 + }, + { + "epoch": 1.9129411764705884, + "grad_norm": 0.46390239048982107, + "learning_rate": 3.646752961205825e-05, + "loss": 0.2895, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17894771695137024, + "step": 1220, + "valid_targets_mean": 5047.5, + "valid_targets_min": 833 + }, + { + "epoch": 1.9207843137254903, + "grad_norm": 0.4438782966995154, + "learning_rate": 3.642304366489453e-05, + "loss": 0.2759, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1729862093925476, + "step": 1225, + "valid_targets_mean": 6348.2, + "valid_targets_min": 4423 + }, + { + "epoch": 1.9286274509803922, + "grad_norm": 0.47402141722773866, + "learning_rate": 3.6378306843047996e-05, + "loss": 0.27, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10692477226257324, + "step": 1230, + "valid_targets_mean": 4371.1, + "valid_targets_min": 3719 + }, + { + "epoch": 1.9364705882352942, + "grad_norm": 0.43266903488313885, + "learning_rate": 3.6333319829908196e-05, + "loss": 0.2731, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1654496192932129, + "step": 1235, + "valid_targets_mean": 6174.9, + "valid_targets_min": 3664 + }, + { + "epoch": 1.944313725490196, + "grad_norm": 0.49592255861334467, + "learning_rate": 3.628808331268649e-05, + "loss": 0.2752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1314307451248169, + "step": 1240, + "valid_targets_mean": 4144.4, + "valid_targets_min": 407 + }, + { + "epoch": 1.952156862745098, + "grad_norm": 0.435538874680241, + "learning_rate": 3.624259798240565e-05, + "loss": 0.28, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15344339609146118, + "step": 1245, + "valid_targets_mean": 5449.9, + "valid_targets_min": 3396 + }, + { + "epoch": 1.96, + "grad_norm": 0.5094650203239252, + "learning_rate": 3.6196864533889245e-05, + "loss": 0.2576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12815450131893158, + "step": 1250, + "valid_targets_mean": 4447.8, + "valid_targets_min": 722 + }, + { + "epoch": 1.967843137254902, + "grad_norm": 0.45177257568112905, + "learning_rate": 3.615088366575104e-05, + "loss": 0.2722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13006862998008728, + "step": 1255, + "valid_targets_mean": 4545.5, + "valid_targets_min": 3821 + }, + { + "epoch": 1.9756862745098038, + "grad_norm": 0.4682992295938859, + "learning_rate": 3.610465608038432e-05, + "loss": 0.2709, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1345278024673462, + "step": 1260, + "valid_targets_mean": 4651.2, + "valid_targets_min": 3695 + }, + { + "epoch": 1.9835294117647058, + "grad_norm": 0.46672262150503485, + "learning_rate": 3.605818248395118e-05, + "loss": 0.2745, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12447239458560944, + "step": 1265, + "valid_targets_mean": 3983.6, + "valid_targets_min": 675 + }, + { + "epoch": 1.9913725490196077, + "grad_norm": 0.4299468455762349, + "learning_rate": 3.6011463586371715e-05, + "loss": 0.2661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11944080144166946, + "step": 1270, + "valid_targets_mean": 5400.0, + "valid_targets_min": 3763 + }, + { + "epoch": 1.9992156862745099, + "grad_norm": 0.43099766066618245, + "learning_rate": 3.596450010131319e-05, + "loss": 0.2708, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10978048294782639, + "step": 1275, + "valid_targets_mean": 4126.8, + "valid_targets_min": 785 + }, + { + "epoch": 2.0062745098039216, + "grad_norm": 0.4576887974176139, + "learning_rate": 3.5917292746179134e-05, + "loss": 0.2561, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14465484023094177, + "step": 1280, + "valid_targets_mean": 5874.0, + "valid_targets_min": 4065 + }, + { + "epoch": 2.0141176470588236, + "grad_norm": 0.45200663585781176, + "learning_rate": 3.586984224209837e-05, + "loss": 0.2479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11500234156847, + "step": 1285, + "valid_targets_mean": 4390.4, + "valid_targets_min": 3582 + }, + { + "epoch": 2.0219607843137255, + "grad_norm": 0.45078823865058354, + "learning_rate": 3.582214931391402e-05, + "loss": 0.264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13320954144001007, + "step": 1290, + "valid_targets_mean": 4999.0, + "valid_targets_min": 3822 + }, + { + "epoch": 2.0298039215686274, + "grad_norm": 0.48915435190703266, + "learning_rate": 3.5774214690172405e-05, + "loss": 0.2724, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15321773290634155, + "step": 1295, + "valid_targets_mean": 5010.4, + "valid_targets_min": 952 + }, + { + "epoch": 2.0376470588235294, + "grad_norm": 0.43119415423933033, + "learning_rate": 3.572603910311196e-05, + "loss": 0.2521, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14951878786087036, + "step": 1300, + "valid_targets_mean": 5940.9, + "valid_targets_min": 4218 + }, + { + "epoch": 2.0454901960784313, + "grad_norm": 0.453774158368299, + "learning_rate": 3.5677623288652e-05, + "loss": 0.2648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12337134033441544, + "step": 1305, + "valid_targets_mean": 4268.1, + "valid_targets_min": 669 + }, + { + "epoch": 2.0533333333333332, + "grad_norm": 0.43873462102134814, + "learning_rate": 3.5628967986381485e-05, + "loss": 0.2682, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12993843853473663, + "step": 1310, + "valid_targets_mean": 5040.6, + "valid_targets_min": 3270 + }, + { + "epoch": 2.061176470588235, + "grad_norm": 0.48445761598277753, + "learning_rate": 3.558007393954778e-05, + "loss": 0.2536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1226993054151535, + "step": 1315, + "valid_targets_mean": 4753.5, + "valid_targets_min": 3988 + }, + { + "epoch": 2.069019607843137, + "grad_norm": 0.4431437458469214, + "learning_rate": 3.553094189504522e-05, + "loss": 0.2586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12933582067489624, + "step": 1320, + "valid_targets_mean": 5278.0, + "valid_targets_min": 3530 + }, + { + "epoch": 2.076862745098039, + "grad_norm": 0.4925639699972867, + "learning_rate": 3.548157260340376e-05, + "loss": 0.2478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12065766751766205, + "step": 1325, + "valid_targets_mean": 4327.9, + "valid_targets_min": 928 + }, + { + "epoch": 2.084705882352941, + "grad_norm": 0.4748173687132383, + "learning_rate": 3.5431966818777476e-05, + "loss": 0.2627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14784438908100128, + "step": 1330, + "valid_targets_mean": 4556.0, + "valid_targets_min": 677 + }, + { + "epoch": 2.0925490196078433, + "grad_norm": 0.46446365306399356, + "learning_rate": 3.5382125298933055e-05, + "loss": 0.2621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13218021392822266, + "step": 1335, + "valid_targets_mean": 4969.9, + "valid_targets_min": 3886 + }, + { + "epoch": 2.1003921568627453, + "grad_norm": 0.4024430729199942, + "learning_rate": 3.533204880523823e-05, + "loss": 0.2572, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12806639075279236, + "step": 1340, + "valid_targets_mean": 6134.9, + "valid_targets_min": 3973 + }, + { + "epoch": 2.108235294117647, + "grad_norm": 0.49039396114872347, + "learning_rate": 3.528173810265015e-05, + "loss": 0.2727, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13579592108726501, + "step": 1345, + "valid_targets_mean": 4923.4, + "valid_targets_min": 3575 + }, + { + "epoch": 2.116078431372549, + "grad_norm": 0.4547559535366543, + "learning_rate": 3.5231193959703654e-05, + "loss": 0.2589, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17610886693000793, + "step": 1350, + "valid_targets_mean": 5835.4, + "valid_targets_min": 780 + }, + { + "epoch": 2.123921568627451, + "grad_norm": 0.4335357581518014, + "learning_rate": 3.51804171484996e-05, + "loss": 0.2755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15231119096279144, + "step": 1355, + "valid_targets_mean": 6393.4, + "valid_targets_min": 4455 + }, + { + "epoch": 2.131764705882353, + "grad_norm": 0.4262901053655905, + "learning_rate": 3.5129408444693014e-05, + "loss": 0.2681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15080666542053223, + "step": 1360, + "valid_targets_mean": 5871.1, + "valid_targets_min": 3873 + }, + { + "epoch": 2.139607843137255, + "grad_norm": 0.41157978357484015, + "learning_rate": 3.507816862748126e-05, + "loss": 0.2552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11613994836807251, + "step": 1365, + "valid_targets_mean": 4608.5, + "valid_targets_min": 817 + }, + { + "epoch": 2.147450980392157, + "grad_norm": 0.4393084572770216, + "learning_rate": 3.502669847959213e-05, + "loss": 0.2397, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12773963809013367, + "step": 1370, + "valid_targets_mean": 5043.8, + "valid_targets_min": 3797 + }, + { + "epoch": 2.155294117647059, + "grad_norm": 0.43224899587658944, + "learning_rate": 3.497499878727193e-05, + "loss": 0.2621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14609867334365845, + "step": 1375, + "valid_targets_mean": 7183.4, + "valid_targets_min": 3707 + }, + { + "epoch": 2.1631372549019607, + "grad_norm": 0.44993852844779975, + "learning_rate": 3.49230703402734e-05, + "loss": 0.2691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15001554787158966, + "step": 1380, + "valid_targets_mean": 5360.2, + "valid_targets_min": 3605 + }, + { + "epoch": 2.1709803921568627, + "grad_norm": 0.45145932766055635, + "learning_rate": 3.487091393184369e-05, + "loss": 0.2609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10081503540277481, + "step": 1385, + "valid_targets_mean": 3932.6, + "valid_targets_min": 580 + }, + { + "epoch": 2.1788235294117646, + "grad_norm": 0.4630111233196212, + "learning_rate": 3.481853035871224e-05, + "loss": 0.2628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15715688467025757, + "step": 1390, + "valid_targets_mean": 5147.0, + "valid_targets_min": 816 + }, + { + "epoch": 2.1866666666666665, + "grad_norm": 0.42476980988232227, + "learning_rate": 3.476592042107862e-05, + "loss": 0.2552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1355331540107727, + "step": 1395, + "valid_targets_mean": 5580.8, + "valid_targets_min": 3203 + }, + { + "epoch": 2.1945098039215685, + "grad_norm": 0.46012280923366145, + "learning_rate": 3.4713084922600274e-05, + "loss": 0.2522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09466949850320816, + "step": 1400, + "valid_targets_mean": 3824.4, + "valid_targets_min": 897 + }, + { + "epoch": 2.2023529411764704, + "grad_norm": 0.45613351517254874, + "learning_rate": 3.466002467038028e-05, + "loss": 0.2608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14354060590267181, + "step": 1405, + "valid_targets_mean": 5275.2, + "valid_targets_min": 3251 + }, + { + "epoch": 2.2101960784313723, + "grad_norm": 0.45134079789119325, + "learning_rate": 3.460674047495497e-05, + "loss": 0.2705, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09967637807130814, + "step": 1410, + "valid_targets_mean": 3815.8, + "valid_targets_min": 796 + }, + { + "epoch": 2.2180392156862747, + "grad_norm": 0.4423793190213438, + "learning_rate": 3.455323315028164e-05, + "loss": 0.2496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12513357400894165, + "step": 1415, + "valid_targets_mean": 5017.8, + "valid_targets_min": 3620 + }, + { + "epoch": 2.2258823529411766, + "grad_norm": 0.48405737331229126, + "learning_rate": 3.449950351372599e-05, + "loss": 0.2733, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12709875404834747, + "step": 1420, + "valid_targets_mean": 3627.4, + "valid_targets_min": 578 + }, + { + "epoch": 2.2337254901960786, + "grad_norm": 0.44207806562612784, + "learning_rate": 3.444555238604974e-05, + "loss": 0.2675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11383885145187378, + "step": 1425, + "valid_targets_mean": 4074.1, + "valid_targets_min": 983 + }, + { + "epoch": 2.2415686274509805, + "grad_norm": 0.45288162146105243, + "learning_rate": 3.439138059139808e-05, + "loss": 0.2486, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13188298046588898, + "step": 1430, + "valid_targets_mean": 5178.9, + "valid_targets_min": 3668 + }, + { + "epoch": 2.2494117647058824, + "grad_norm": 0.41893172335481055, + "learning_rate": 3.433698895728701e-05, + "loss": 0.2546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11395653337240219, + "step": 1435, + "valid_targets_mean": 5147.2, + "valid_targets_min": 3650 + }, + { + "epoch": 2.2572549019607844, + "grad_norm": 0.4463833706314381, + "learning_rate": 3.428237831459078e-05, + "loss": 0.2642, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1425066888332367, + "step": 1440, + "valid_targets_mean": 5160.4, + "valid_targets_min": 3250 + }, + { + "epoch": 2.2650980392156863, + "grad_norm": 0.4628208133465244, + "learning_rate": 3.422754949752917e-05, + "loss": 0.2606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1350829303264618, + "step": 1445, + "valid_targets_mean": 5317.6, + "valid_targets_min": 3540 + }, + { + "epoch": 2.2729411764705882, + "grad_norm": 0.41564615419434575, + "learning_rate": 3.41725033436547e-05, + "loss": 0.2553, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.126197949051857, + "step": 1450, + "valid_targets_mean": 4831.5, + "valid_targets_min": 665 + }, + { + "epoch": 2.28078431372549, + "grad_norm": 0.4340917177276431, + "learning_rate": 3.411724069383993e-05, + "loss": 0.2618, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1303197741508484, + "step": 1455, + "valid_targets_mean": 5435.0, + "valid_targets_min": 3797 + }, + { + "epoch": 2.288627450980392, + "grad_norm": 0.47085411749146966, + "learning_rate": 3.4061762392264545e-05, + "loss": 0.2619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12932007014751434, + "step": 1460, + "valid_targets_mean": 4807.9, + "valid_targets_min": 869 + }, + { + "epoch": 2.296470588235294, + "grad_norm": 0.4517811739999653, + "learning_rate": 3.400606928640245e-05, + "loss": 0.2599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14722979068756104, + "step": 1465, + "valid_targets_mean": 6255.8, + "valid_targets_min": 685 + }, + { + "epoch": 2.304313725490196, + "grad_norm": 0.4287736838496608, + "learning_rate": 3.3950162227008884e-05, + "loss": 0.2601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11872623860836029, + "step": 1470, + "valid_targets_mean": 4925.6, + "valid_targets_min": 3386 + }, + { + "epoch": 2.312156862745098, + "grad_norm": 0.4087067393977361, + "learning_rate": 3.389404206810739e-05, + "loss": 0.2603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12659403681755066, + "step": 1475, + "valid_targets_mean": 5264.6, + "valid_targets_min": 3238 + }, + { + "epoch": 2.32, + "grad_norm": 0.42539754197954616, + "learning_rate": 3.383770966697675e-05, + "loss": 0.269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11696159094572067, + "step": 1480, + "valid_targets_mean": 5793.8, + "valid_targets_min": 3558 + }, + { + "epoch": 2.3278431372549018, + "grad_norm": 0.45919977036236226, + "learning_rate": 3.378116588413792e-05, + "loss": 0.2752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2455115169286728, + "step": 1485, + "valid_targets_mean": 7003.0, + "valid_targets_min": 3702 + }, + { + "epoch": 2.335686274509804, + "grad_norm": 0.47012118225391586, + "learning_rate": 3.372441158334089e-05, + "loss": 0.2725, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12278923392295837, + "step": 1490, + "valid_targets_mean": 4004.5, + "valid_targets_min": 705 + }, + { + "epoch": 2.343529411764706, + "grad_norm": 0.45097229914655057, + "learning_rate": 3.3667447631551456e-05, + "loss": 0.2557, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11797159165143967, + "step": 1495, + "valid_targets_mean": 4820.8, + "valid_targets_min": 3175 + }, + { + "epoch": 2.351372549019608, + "grad_norm": 0.44937463916849063, + "learning_rate": 3.361027489893799e-05, + "loss": 0.2493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1273888796567917, + "step": 1500, + "valid_targets_mean": 4960.4, + "valid_targets_min": 3482 + }, + { + "epoch": 2.35921568627451, + "grad_norm": 0.4297668418247861, + "learning_rate": 3.3552894258858173e-05, + "loss": 0.2489, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1481958031654358, + "step": 1505, + "valid_targets_mean": 5842.0, + "valid_targets_min": 3544 + }, + { + "epoch": 2.367058823529412, + "grad_norm": 0.4960961983896037, + "learning_rate": 3.3495306587845616e-05, + "loss": 0.249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13040918111801147, + "step": 1510, + "valid_targets_mean": 3905.0, + "valid_targets_min": 635 + }, + { + "epoch": 2.374901960784314, + "grad_norm": 0.4282759611457031, + "learning_rate": 3.343751276559651e-05, + "loss": 0.2516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11184579879045486, + "step": 1515, + "valid_targets_mean": 4647.2, + "valid_targets_min": 660 + }, + { + "epoch": 2.3827450980392157, + "grad_norm": 0.45579365401838495, + "learning_rate": 3.3379513674956134e-05, + "loss": 0.2685, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12589934468269348, + "step": 1520, + "valid_targets_mean": 5245.9, + "valid_targets_min": 1678 + }, + { + "epoch": 2.3905882352941177, + "grad_norm": 0.45709101945433256, + "learning_rate": 3.332131020190542e-05, + "loss": 0.2478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11196628212928772, + "step": 1525, + "valid_targets_mean": 4238.2, + "valid_targets_min": 3391 + }, + { + "epoch": 2.3984313725490196, + "grad_norm": 0.4591799991741506, + "learning_rate": 3.326290323554739e-05, + "loss": 0.2599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1280558705329895, + "step": 1530, + "valid_targets_mean": 3959.6, + "valid_targets_min": 681 + }, + { + "epoch": 2.4062745098039215, + "grad_norm": 0.4615942164142822, + "learning_rate": 3.320429366809361e-05, + "loss": 0.255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11446023732423782, + "step": 1535, + "valid_targets_mean": 4679.1, + "valid_targets_min": 3561 + }, + { + "epoch": 2.4141176470588235, + "grad_norm": 0.42097481544627646, + "learning_rate": 3.314548239485048e-05, + "loss": 0.2544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12864826619625092, + "step": 1540, + "valid_targets_mean": 5744.0, + "valid_targets_min": 4080 + }, + { + "epoch": 2.4219607843137254, + "grad_norm": 0.4698739773554904, + "learning_rate": 3.308647031420567e-05, + "loss": 0.2706, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10772387683391571, + "step": 1545, + "valid_targets_mean": 3619.2, + "valid_targets_min": 420 + }, + { + "epoch": 2.4298039215686273, + "grad_norm": 0.46570283043841393, + "learning_rate": 3.3027258327614305e-05, + "loss": 0.2559, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13037823140621185, + "step": 1550, + "valid_targets_mean": 4860.4, + "valid_targets_min": 392 + }, + { + "epoch": 2.4376470588235293, + "grad_norm": 0.42593711692675135, + "learning_rate": 3.296784733958524e-05, + "loss": 0.2617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11170825362205505, + "step": 1555, + "valid_targets_mean": 5222.6, + "valid_targets_min": 3930 + }, + { + "epoch": 2.445490196078431, + "grad_norm": 0.4503559079527785, + "learning_rate": 3.2908238257667214e-05, + "loss": 0.2602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11901139467954636, + "step": 1560, + "valid_targets_mean": 4362.2, + "valid_targets_min": 618 + }, + { + "epoch": 2.453333333333333, + "grad_norm": 0.4536297330372539, + "learning_rate": 3.2848431992435037e-05, + "loss": 0.2633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1577979326248169, + "step": 1565, + "valid_targets_mean": 5607.9, + "valid_targets_min": 664 + }, + { + "epoch": 2.461176470588235, + "grad_norm": 0.4578552551635253, + "learning_rate": 3.278842945747561e-05, + "loss": 0.2675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13507062196731567, + "step": 1570, + "valid_targets_mean": 4755.2, + "valid_targets_min": 4177 + }, + { + "epoch": 2.469019607843137, + "grad_norm": 0.405225958138305, + "learning_rate": 3.272823156937403e-05, + "loss": 0.2734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12951521575450897, + "step": 1575, + "valid_targets_mean": 5787.6, + "valid_targets_min": 3621 + }, + { + "epoch": 2.4768627450980394, + "grad_norm": 0.47001834465815556, + "learning_rate": 3.266783924769954e-05, + "loss": 0.2734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15250499546527863, + "step": 1580, + "valid_targets_mean": 4942.0, + "valid_targets_min": 958 + }, + { + "epoch": 2.4847058823529413, + "grad_norm": 0.4443067921781512, + "learning_rate": 3.2607253414991534e-05, + "loss": 0.2491, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11628343164920807, + "step": 1585, + "valid_targets_mean": 4674.5, + "valid_targets_min": 1464 + }, + { + "epoch": 2.4925490196078433, + "grad_norm": 0.434437602942818, + "learning_rate": 3.2546474996745424e-05, + "loss": 0.2517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13555780053138733, + "step": 1590, + "valid_targets_mean": 5046.5, + "valid_targets_min": 730 + }, + { + "epoch": 2.500392156862745, + "grad_norm": 0.4208723935905886, + "learning_rate": 3.248550492139851e-05, + "loss": 0.259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13717062771320343, + "step": 1595, + "valid_targets_mean": 5657.9, + "valid_targets_min": 727 + }, + { + "epoch": 2.508235294117647, + "grad_norm": 0.4156063186715286, + "learning_rate": 3.242434412031581e-05, + "loss": 0.2633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12002235651016235, + "step": 1600, + "valid_targets_mean": 4616.9, + "valid_targets_min": 3414 + }, + { + "epoch": 2.516078431372549, + "grad_norm": 0.4532735568961372, + "learning_rate": 3.236299352777583e-05, + "loss": 0.2558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11414999514818192, + "step": 1605, + "valid_targets_mean": 4527.4, + "valid_targets_min": 3291 + }, + { + "epoch": 2.523921568627451, + "grad_norm": 0.45229568900269806, + "learning_rate": 3.230145408095626e-05, + "loss": 0.2622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16222326457500458, + "step": 1610, + "valid_targets_mean": 6180.2, + "valid_targets_min": 4221 + }, + { + "epoch": 2.531764705882353, + "grad_norm": 0.9265934257142856, + "learning_rate": 3.223972671991972e-05, + "loss": 0.2635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11284160614013672, + "step": 1615, + "valid_targets_mean": 4565.6, + "valid_targets_min": 2368 + }, + { + "epoch": 2.539607843137255, + "grad_norm": 0.4676815700857632, + "learning_rate": 3.217781238759935e-05, + "loss": 0.2565, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13243766129016876, + "step": 1620, + "valid_targets_mean": 4217.1, + "valid_targets_min": 768 + }, + { + "epoch": 2.547450980392157, + "grad_norm": 0.46955739866786866, + "learning_rate": 3.211571202978442e-05, + "loss": 0.2698, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14136609435081482, + "step": 1625, + "valid_targets_mean": 3918.2, + "valid_targets_min": 744 + }, + { + "epoch": 2.5552941176470587, + "grad_norm": 0.4096516881386851, + "learning_rate": 3.2053426595105865e-05, + "loss": 0.25, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1313982754945755, + "step": 1630, + "valid_targets_mean": 5967.1, + "valid_targets_min": 3776 + }, + { + "epoch": 2.5631372549019606, + "grad_norm": 0.40846410459043553, + "learning_rate": 3.199095703502185e-05, + "loss": 0.2626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12226898968219757, + "step": 1635, + "valid_targets_mean": 5342.9, + "valid_targets_min": 3797 + }, + { + "epoch": 2.5709803921568626, + "grad_norm": 0.4673050459428165, + "learning_rate": 3.1928304303803174e-05, + "loss": 0.2528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15106196701526642, + "step": 1640, + "valid_targets_mean": 5145.8, + "valid_targets_min": 3736 + }, + { + "epoch": 2.578823529411765, + "grad_norm": 0.4221808109207067, + "learning_rate": 3.1865469358518726e-05, + "loss": 0.2492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12939462065696716, + "step": 1645, + "valid_targets_mean": 5564.0, + "valid_targets_min": 3317 + }, + { + "epoch": 2.586666666666667, + "grad_norm": 0.4770970150351554, + "learning_rate": 3.180245315902084e-05, + "loss": 0.2451, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13009631633758545, + "step": 1650, + "valid_targets_mean": 4264.9, + "valid_targets_min": 3863 + }, + { + "epoch": 2.594509803921569, + "grad_norm": 0.4658297511693963, + "learning_rate": 3.173925666793065e-05, + "loss": 0.2504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11663345992565155, + "step": 1655, + "valid_targets_mean": 4386.8, + "valid_targets_min": 806 + }, + { + "epoch": 2.6023529411764708, + "grad_norm": 0.42932723171267134, + "learning_rate": 3.1675880850623416e-05, + "loss": 0.2755, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1144811138510704, + "step": 1660, + "valid_targets_mean": 4374.2, + "valid_targets_min": 3576 + }, + { + "epoch": 2.6101960784313727, + "grad_norm": 0.44524167780109175, + "learning_rate": 3.1612326675213717e-05, + "loss": 0.2557, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13575562834739685, + "step": 1665, + "valid_targets_mean": 5264.5, + "valid_targets_min": 3536 + }, + { + "epoch": 2.6180392156862746, + "grad_norm": 0.40667869411716223, + "learning_rate": 3.154859511254067e-05, + "loss": 0.2672, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14803528785705566, + "step": 1670, + "valid_targets_mean": 5660.6, + "valid_targets_min": 3556 + }, + { + "epoch": 2.6258823529411766, + "grad_norm": 0.46647343522628637, + "learning_rate": 3.148468713615318e-05, + "loss": 0.2617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17942845821380615, + "step": 1675, + "valid_targets_mean": 5058.1, + "valid_targets_min": 882 + }, + { + "epoch": 2.6337254901960785, + "grad_norm": 0.42492816146492085, + "learning_rate": 3.1420603722294935e-05, + "loss": 0.2561, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0995701402425766, + "step": 1680, + "valid_targets_mean": 4293.0, + "valid_targets_min": 868 + }, + { + "epoch": 2.6415686274509804, + "grad_norm": 0.4643952663623767, + "learning_rate": 3.135634584988962e-05, + "loss": 0.2612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15429197251796722, + "step": 1685, + "valid_targets_mean": 5230.4, + "valid_targets_min": 671 + }, + { + "epoch": 2.6494117647058824, + "grad_norm": 0.4307747516160081, + "learning_rate": 3.1291914500525886e-05, + "loss": 0.238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12061157077550888, + "step": 1690, + "valid_targets_mean": 4799.1, + "valid_targets_min": 876 + }, + { + "epoch": 2.6572549019607843, + "grad_norm": 0.45228484652654455, + "learning_rate": 3.1227310658442395e-05, + "loss": 0.2796, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1393534541130066, + "step": 1695, + "valid_targets_mean": 5052.2, + "valid_targets_min": 924 + }, + { + "epoch": 2.665098039215686, + "grad_norm": 0.4168826045733845, + "learning_rate": 3.1162535310512745e-05, + "loss": 0.2619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18650421500205994, + "step": 1700, + "valid_targets_mean": 6966.9, + "valid_targets_min": 601 + }, + { + "epoch": 2.672941176470588, + "grad_norm": 0.40084673503347185, + "learning_rate": 3.109758944623042e-05, + "loss": 0.2512, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14108054339885712, + "step": 1705, + "valid_targets_mean": 5895.4, + "valid_targets_min": 4538 + }, + { + "epoch": 2.68078431372549, + "grad_norm": 0.3955665597655761, + "learning_rate": 3.103247405769372e-05, + "loss": 0.2544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14262932538986206, + "step": 1710, + "valid_targets_mean": 6712.8, + "valid_targets_min": 3756 + }, + { + "epoch": 2.688627450980392, + "grad_norm": 0.44285839167263197, + "learning_rate": 3.0967190139590484e-05, + "loss": 0.2545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11949534714221954, + "step": 1715, + "valid_targets_mean": 4721.9, + "valid_targets_min": 3757 + }, + { + "epoch": 2.696470588235294, + "grad_norm": 0.4382594154360303, + "learning_rate": 3.090173868918303e-05, + "loss": 0.2568, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13688015937805176, + "step": 1720, + "valid_targets_mean": 5184.2, + "valid_targets_min": 3311 + }, + { + "epoch": 2.704313725490196, + "grad_norm": 0.44947431591051146, + "learning_rate": 3.083612070629283e-05, + "loss": 0.2653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13894183933734894, + "step": 1725, + "valid_targets_mean": 5535.2, + "valid_targets_min": 3820 + }, + { + "epoch": 2.712156862745098, + "grad_norm": 0.4183405331712526, + "learning_rate": 3.077033719328529e-05, + "loss": 0.2504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1369009017944336, + "step": 1730, + "valid_targets_mean": 6275.8, + "valid_targets_min": 4239 + }, + { + "epoch": 2.7199999999999998, + "grad_norm": 0.4573204986274018, + "learning_rate": 3.070438915505439e-05, + "loss": 0.2467, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1038956418633461, + "step": 1735, + "valid_targets_mean": 4946.8, + "valid_targets_min": 3587 + }, + { + "epoch": 2.7278431372549017, + "grad_norm": 0.40878178498619927, + "learning_rate": 3.063827759900739e-05, + "loss": 0.2606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17439252138137817, + "step": 1740, + "valid_targets_mean": 6192.5, + "valid_targets_min": 723 + }, + { + "epoch": 2.735686274509804, + "grad_norm": 0.44085339250166117, + "learning_rate": 3.057200353504938e-05, + "loss": 0.2667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16376739740371704, + "step": 1745, + "valid_targets_mean": 5451.5, + "valid_targets_min": 3356 + }, + { + "epoch": 2.743529411764706, + "grad_norm": 0.461953369271599, + "learning_rate": 3.0505567975567915e-05, + "loss": 0.2551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1565898358821869, + "step": 1750, + "valid_targets_mean": 5895.6, + "valid_targets_min": 3764 + }, + { + "epoch": 2.751372549019608, + "grad_norm": 0.4281409420363027, + "learning_rate": 3.04389719354175e-05, + "loss": 0.2663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13279592990875244, + "step": 1755, + "valid_targets_mean": 3907.8, + "valid_targets_min": 678 + }, + { + "epoch": 2.75921568627451, + "grad_norm": 0.43238889821769466, + "learning_rate": 3.0372216431904103e-05, + "loss": 0.2523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10412300378084183, + "step": 1760, + "valid_targets_mean": 4064.8, + "valid_targets_min": 995 + }, + { + "epoch": 2.767058823529412, + "grad_norm": 0.44339678774004454, + "learning_rate": 3.030530248476963e-05, + "loss": 0.2479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1417621672153473, + "step": 1765, + "valid_targets_mean": 4940.9, + "valid_targets_min": 808 + }, + { + "epoch": 2.7749019607843137, + "grad_norm": 0.7531055888351225, + "learning_rate": 3.0238231116176338e-05, + "loss": 0.2612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1466093808412552, + "step": 1770, + "valid_targets_mean": 5570.1, + "valid_targets_min": 1116 + }, + { + "epoch": 2.7827450980392157, + "grad_norm": 0.44515977292919706, + "learning_rate": 3.0171003350691194e-05, + "loss": 0.2681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11763986945152283, + "step": 1775, + "valid_targets_mean": 4642.2, + "valid_targets_min": 3477 + }, + { + "epoch": 2.7905882352941176, + "grad_norm": 0.4681887303349638, + "learning_rate": 3.0103620215270285e-05, + "loss": 0.2609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14247599244117737, + "step": 1780, + "valid_targets_mean": 4720.1, + "valid_targets_min": 4152 + }, + { + "epoch": 2.7984313725490195, + "grad_norm": 0.4368899815968614, + "learning_rate": 3.0036082739243064e-05, + "loss": 0.2507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11585693061351776, + "step": 1785, + "valid_targets_mean": 4842.4, + "valid_targets_min": 3042 + }, + { + "epoch": 2.8062745098039215, + "grad_norm": 0.4139493135985029, + "learning_rate": 2.996839195429667e-05, + "loss": 0.2667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13053040206432343, + "step": 1790, + "valid_targets_mean": 4798.0, + "valid_targets_min": 820 + }, + { + "epoch": 2.8141176470588234, + "grad_norm": 0.4339471630530843, + "learning_rate": 2.9900548894460146e-05, + "loss": 0.2575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11310513317584991, + "step": 1795, + "valid_targets_mean": 4532.4, + "valid_targets_min": 3948 + }, + { + "epoch": 2.8219607843137258, + "grad_norm": 0.4146149344392902, + "learning_rate": 2.9832554596088653e-05, + "loss": 0.2476, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11644154787063599, + "step": 1800, + "valid_targets_mean": 4799.2, + "valid_targets_min": 3593 + }, + { + "epoch": 2.8298039215686277, + "grad_norm": 0.399208547371692, + "learning_rate": 2.9764410097847657e-05, + "loss": 0.2663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1448148936033249, + "step": 1805, + "valid_targets_mean": 5765.4, + "valid_targets_min": 4453 + }, + { + "epoch": 2.8376470588235296, + "grad_norm": 0.42365842351647104, + "learning_rate": 2.9696116440697008e-05, + "loss": 0.2689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12039990723133087, + "step": 1810, + "valid_targets_mean": 4533.0, + "valid_targets_min": 699 + }, + { + "epoch": 2.8454901960784316, + "grad_norm": 0.41829893935454315, + "learning_rate": 2.9627674667875104e-05, + "loss": 0.2649, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1044776663184166, + "step": 1815, + "valid_targets_mean": 4577.5, + "valid_targets_min": 633 + }, + { + "epoch": 2.8533333333333335, + "grad_norm": 0.5098614371498988, + "learning_rate": 2.9559085824882916e-05, + "loss": 0.2558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1291094571352005, + "step": 1820, + "valid_targets_mean": 5700.8, + "valid_targets_min": 3426 + }, + { + "epoch": 2.8611764705882354, + "grad_norm": 0.3886315178037877, + "learning_rate": 2.9490350959468014e-05, + "loss": 0.2641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10714983940124512, + "step": 1825, + "valid_targets_mean": 5307.0, + "valid_targets_min": 3690 + }, + { + "epoch": 2.8690196078431374, + "grad_norm": 0.4434985699129623, + "learning_rate": 2.9421471121608588e-05, + "loss": 0.2587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.112812839448452, + "step": 1830, + "valid_targets_mean": 4190.8, + "valid_targets_min": 747 + }, + { + "epoch": 2.8768627450980393, + "grad_norm": 0.40331633099392356, + "learning_rate": 2.9352447363497378e-05, + "loss": 0.2444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16460323333740234, + "step": 1835, + "valid_targets_mean": 6978.6, + "valid_targets_min": 3874 + }, + { + "epoch": 2.8847058823529412, + "grad_norm": 0.3931483141522423, + "learning_rate": 2.928328073952564e-05, + "loss": 0.2526, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1279119849205017, + "step": 1840, + "valid_targets_mean": 5583.5, + "valid_targets_min": 3800 + }, + { + "epoch": 2.892549019607843, + "grad_norm": 0.44537855883298005, + "learning_rate": 2.921397230626699e-05, + "loss": 0.251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14499521255493164, + "step": 1845, + "valid_targets_mean": 5594.1, + "valid_targets_min": 3706 + }, + { + "epoch": 2.900392156862745, + "grad_norm": 0.4291966772375491, + "learning_rate": 2.914452312246131e-05, + "loss": 0.2597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1422233134508133, + "step": 1850, + "valid_targets_mean": 5994.2, + "valid_targets_min": 4215 + }, + { + "epoch": 2.908235294117647, + "grad_norm": 0.5524116065305122, + "learning_rate": 2.9074934248998557e-05, + "loss": 0.2661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13530707359313965, + "step": 1855, + "valid_targets_mean": 5521.1, + "valid_targets_min": 2581 + }, + { + "epoch": 2.916078431372549, + "grad_norm": 0.4208152215051117, + "learning_rate": 2.9005206748902538e-05, + "loss": 0.2632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15862345695495605, + "step": 1860, + "valid_targets_mean": 6273.5, + "valid_targets_min": 3548 + }, + { + "epoch": 2.923921568627451, + "grad_norm": 0.42119458482360816, + "learning_rate": 2.8935341687314703e-05, + "loss": 0.2526, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1609993726015091, + "step": 1865, + "valid_targets_mean": 6337.6, + "valid_targets_min": 4558 + }, + { + "epoch": 2.931764705882353, + "grad_norm": 0.429911645514168, + "learning_rate": 2.8865340131477846e-05, + "loss": 0.2554, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10718243569135666, + "step": 1870, + "valid_targets_mean": 3961.9, + "valid_targets_min": 967 + }, + { + "epoch": 2.9396078431372548, + "grad_norm": 0.3991529710863121, + "learning_rate": 2.8795203150719836e-05, + "loss": 0.2574, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12177126109600067, + "step": 1875, + "valid_targets_mean": 4913.1, + "valid_targets_min": 3659 + }, + { + "epoch": 2.9474509803921567, + "grad_norm": 0.3941443481025059, + "learning_rate": 2.8724931816437255e-05, + "loss": 0.2502, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10472463071346283, + "step": 1880, + "valid_targets_mean": 5183.1, + "valid_targets_min": 3549 + }, + { + "epoch": 2.9552941176470586, + "grad_norm": 0.4413921768424274, + "learning_rate": 2.8654527202079027e-05, + "loss": 0.2641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14560449123382568, + "step": 1885, + "valid_targets_mean": 4850.9, + "valid_targets_min": 2118 + }, + { + "epoch": 2.9631372549019606, + "grad_norm": 0.4475101418982669, + "learning_rate": 2.8583990383130043e-05, + "loss": 0.2524, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12408129125833511, + "step": 1890, + "valid_targets_mean": 4401.6, + "valid_targets_min": 636 + }, + { + "epoch": 2.9709803921568625, + "grad_norm": 0.42161930668028813, + "learning_rate": 2.8513322437094727e-05, + "loss": 0.247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12770900130271912, + "step": 1895, + "valid_targets_mean": 5884.8, + "valid_targets_min": 734 + }, + { + "epoch": 2.978823529411765, + "grad_norm": 0.47301335801935585, + "learning_rate": 2.844252444348055e-05, + "loss": 0.2522, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12068523466587067, + "step": 1900, + "valid_targets_mean": 4397.2, + "valid_targets_min": 593 + }, + { + "epoch": 2.986666666666667, + "grad_norm": 0.4152297852271275, + "learning_rate": 2.8371597483781577e-05, + "loss": 0.2529, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09066110849380493, + "step": 1905, + "valid_targets_mean": 4132.5, + "valid_targets_min": 277 + }, + { + "epoch": 2.9945098039215687, + "grad_norm": 0.4058706264549092, + "learning_rate": 2.8300542641461937e-05, + "loss": 0.2564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13444828987121582, + "step": 1910, + "valid_targets_mean": 6010.4, + "valid_targets_min": 4250 + }, + { + "epoch": 3.0015686274509803, + "grad_norm": 0.447309349141732, + "learning_rate": 2.822936100193924e-05, + "loss": 0.2776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11755850911140442, + "step": 1915, + "valid_targets_mean": 4557.0, + "valid_targets_min": 3016 + }, + { + "epoch": 3.0094117647058822, + "grad_norm": 0.4062062188090626, + "learning_rate": 2.8158053652568046e-05, + "loss": 0.2491, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13184432685375214, + "step": 1920, + "valid_targets_mean": 6199.8, + "valid_targets_min": 4235 + }, + { + "epoch": 3.017254901960784, + "grad_norm": 0.44070499727258766, + "learning_rate": 2.808662168262321e-05, + "loss": 0.2411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11080098152160645, + "step": 1925, + "valid_targets_mean": 4623.4, + "valid_targets_min": 3713 + }, + { + "epoch": 3.025098039215686, + "grad_norm": 0.4763670171149257, + "learning_rate": 2.8015066183283272e-05, + "loss": 0.2519, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1113940179347992, + "step": 1930, + "valid_targets_mean": 4373.8, + "valid_targets_min": 460 + }, + { + "epoch": 3.032941176470588, + "grad_norm": 0.4355243760620159, + "learning_rate": 2.7943388247613787e-05, + "loss": 0.2366, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14149567484855652, + "step": 1935, + "valid_targets_mean": 5609.1, + "valid_targets_min": 4401 + }, + { + "epoch": 3.0407843137254904, + "grad_norm": 0.42356997296686133, + "learning_rate": 2.787158897055061e-05, + "loss": 0.255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1346980333328247, + "step": 1940, + "valid_targets_mean": 5785.2, + "valid_targets_min": 4146 + }, + { + "epoch": 3.0486274509803923, + "grad_norm": 0.465176695347723, + "learning_rate": 2.7799669448883165e-05, + "loss": 0.2406, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12955603003501892, + "step": 1945, + "valid_targets_mean": 3767.0, + "valid_targets_min": 770 + }, + { + "epoch": 3.0564705882352943, + "grad_norm": 0.46121709494870516, + "learning_rate": 2.7727630781237743e-05, + "loss": 0.2433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1162000298500061, + "step": 1950, + "valid_targets_mean": 4428.5, + "valid_targets_min": 783 + }, + { + "epoch": 3.064313725490196, + "grad_norm": 0.429787541213453, + "learning_rate": 2.7655474068060644e-05, + "loss": 0.2493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11739633232355118, + "step": 1955, + "valid_targets_mean": 4955.6, + "valid_targets_min": 516 + }, + { + "epoch": 3.072156862745098, + "grad_norm": 0.46328820902774925, + "learning_rate": 2.7583200411601424e-05, + "loss": 0.2317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11228733509778976, + "step": 1960, + "valid_targets_mean": 5139.6, + "valid_targets_min": 2463 + }, + { + "epoch": 3.08, + "grad_norm": 0.5328657014424273, + "learning_rate": 2.7510810915896043e-05, + "loss": 0.2406, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13428783416748047, + "step": 1965, + "valid_targets_mean": 4627.1, + "valid_targets_min": 3925 + }, + { + "epoch": 3.087843137254902, + "grad_norm": 0.45050168223411524, + "learning_rate": 2.7438306686749978e-05, + "loss": 0.233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10249172151088715, + "step": 1970, + "valid_targets_mean": 4340.6, + "valid_targets_min": 3457 + }, + { + "epoch": 3.095686274509804, + "grad_norm": 0.4319070860395141, + "learning_rate": 2.7365688831721358e-05, + "loss": 0.2392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13910704851150513, + "step": 1975, + "valid_targets_mean": 5662.8, + "valid_targets_min": 4784 + }, + { + "epoch": 3.103529411764706, + "grad_norm": 0.42886398818721116, + "learning_rate": 2.7292958460104027e-05, + "loss": 0.2504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12069983780384064, + "step": 1980, + "valid_targets_mean": 5236.9, + "valid_targets_min": 782 + }, + { + "epoch": 3.111372549019608, + "grad_norm": 0.4611108403825653, + "learning_rate": 2.7220116682910628e-05, + "loss": 0.2519, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13484933972358704, + "step": 1985, + "valid_targets_mean": 5587.2, + "valid_targets_min": 821 + }, + { + "epoch": 3.1192156862745097, + "grad_norm": 0.4451396832224761, + "learning_rate": 2.714716461285559e-05, + "loss": 0.2453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11066186428070068, + "step": 1990, + "valid_targets_mean": 5059.9, + "valid_targets_min": 4067 + }, + { + "epoch": 3.1270588235294117, + "grad_norm": 0.38821312176893963, + "learning_rate": 2.7074103364338155e-05, + "loss": 0.2406, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14021679759025574, + "step": 1995, + "valid_targets_mean": 7066.0, + "valid_targets_min": 4159 + }, + { + "epoch": 3.1349019607843136, + "grad_norm": 0.4183193977456837, + "learning_rate": 2.7000934053425347e-05, + "loss": 0.248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12177550047636032, + "step": 2000, + "valid_targets_mean": 5553.2, + "valid_targets_min": 3258 + }, + { + "epoch": 3.1427450980392155, + "grad_norm": 0.43765474174948893, + "learning_rate": 2.692765779783494e-05, + "loss": 0.2402, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11270841956138611, + "step": 2005, + "valid_targets_mean": 4834.6, + "valid_targets_min": 3572 + }, + { + "epoch": 3.1505882352941175, + "grad_norm": 0.426633457560378, + "learning_rate": 2.6854275716918352e-05, + "loss": 0.253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14287523925304413, + "step": 2010, + "valid_targets_mean": 5455.9, + "valid_targets_min": 841 + }, + { + "epoch": 3.1584313725490194, + "grad_norm": 0.4078425097510185, + "learning_rate": 2.678078893164359e-05, + "loss": 0.2434, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11538930237293243, + "step": 2015, + "valid_targets_mean": 5689.1, + "valid_targets_min": 3770 + }, + { + "epoch": 3.1662745098039213, + "grad_norm": 0.44439178115633443, + "learning_rate": 2.6707198564578066e-05, + "loss": 0.2362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11317244172096252, + "step": 2020, + "valid_targets_mean": 4206.0, + "valid_targets_min": 2551 + }, + { + "epoch": 3.1741176470588237, + "grad_norm": 0.456212200285294, + "learning_rate": 2.663350573987152e-05, + "loss": 0.2461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11523454636335373, + "step": 2025, + "valid_targets_mean": 4083.5, + "valid_targets_min": 626 + }, + { + "epoch": 3.1819607843137256, + "grad_norm": 0.4599279892597807, + "learning_rate": 2.655971158323879e-05, + "loss": 0.231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11775343865156174, + "step": 2030, + "valid_targets_mean": 4272.1, + "valid_targets_min": 3329 + }, + { + "epoch": 3.1898039215686276, + "grad_norm": 0.40566259798749416, + "learning_rate": 2.648581722194264e-05, + "loss": 0.2465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12668456137180328, + "step": 2035, + "valid_targets_mean": 5694.6, + "valid_targets_min": 4027 + }, + { + "epoch": 3.1976470588235295, + "grad_norm": 0.4725635952751264, + "learning_rate": 2.6411823784776537e-05, + "loss": 0.2353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10355997085571289, + "step": 2040, + "valid_targets_mean": 4016.1, + "valid_targets_min": 792 + }, + { + "epoch": 3.2054901960784314, + "grad_norm": 0.44696073096110805, + "learning_rate": 2.6337732402047422e-05, + "loss": 0.2309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08200616389513016, + "step": 2045, + "valid_targets_mean": 4368.2, + "valid_targets_min": 3319 + }, + { + "epoch": 3.2133333333333334, + "grad_norm": 0.4046751507104614, + "learning_rate": 2.626354420555841e-05, + "loss": 0.2422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10652727633714676, + "step": 2050, + "valid_targets_mean": 5266.0, + "valid_targets_min": 4091 + }, + { + "epoch": 3.2211764705882353, + "grad_norm": 0.43847046907302706, + "learning_rate": 2.618926032859154e-05, + "loss": 0.2461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10782967507839203, + "step": 2055, + "valid_targets_mean": 4211.2, + "valid_targets_min": 789 + }, + { + "epoch": 3.2290196078431372, + "grad_norm": 0.4329089155848683, + "learning_rate": 2.611488190589043e-05, + "loss": 0.2498, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12138757854700089, + "step": 2060, + "valid_targets_mean": 4696.2, + "valid_targets_min": 4053 + }, + { + "epoch": 3.236862745098039, + "grad_norm": 0.42953762620876, + "learning_rate": 2.6040410073642965e-05, + "loss": 0.2573, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10514818876981735, + "step": 2065, + "valid_targets_mean": 4275.8, + "valid_targets_min": 888 + }, + { + "epoch": 3.244705882352941, + "grad_norm": 0.4701217543316149, + "learning_rate": 2.596584596946392e-05, + "loss": 0.249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11655449122190475, + "step": 2070, + "valid_targets_mean": 4477.5, + "valid_targets_min": 609 + }, + { + "epoch": 3.252549019607843, + "grad_norm": 0.4448673683099468, + "learning_rate": 2.589119073237762e-05, + "loss": 0.2485, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1493644416332245, + "step": 2075, + "valid_targets_mean": 5425.0, + "valid_targets_min": 876 + }, + { + "epoch": 3.260392156862745, + "grad_norm": 0.4529303538983212, + "learning_rate": 2.5816445502800494e-05, + "loss": 0.2467, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1310499757528305, + "step": 2080, + "valid_targets_mean": 4829.0, + "valid_targets_min": 731 + }, + { + "epoch": 3.268235294117647, + "grad_norm": 0.42516319618073034, + "learning_rate": 2.5741611422523684e-05, + "loss": 0.2363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10771302878856659, + "step": 2085, + "valid_targets_mean": 4812.5, + "valid_targets_min": 3609 + }, + { + "epoch": 3.276078431372549, + "grad_norm": 0.4202683026835801, + "learning_rate": 2.566668963469559e-05, + "loss": 0.2534, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13373664021492004, + "step": 2090, + "valid_targets_mean": 5934.4, + "valid_targets_min": 3554 + }, + { + "epoch": 3.283921568627451, + "grad_norm": 0.46645395477484847, + "learning_rate": 2.5591681283804426e-05, + "loss": 0.2451, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1471448540687561, + "step": 2095, + "valid_targets_mean": 6183.4, + "valid_targets_min": 3574 + }, + { + "epoch": 3.291764705882353, + "grad_norm": 0.414522147212614, + "learning_rate": 2.5516587515660706e-05, + "loss": 0.2448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12761680781841278, + "step": 2100, + "valid_targets_mean": 5796.4, + "valid_targets_min": 3701 + }, + { + "epoch": 3.299607843137255, + "grad_norm": 0.42790819400186036, + "learning_rate": 2.5441409477379764e-05, + "loss": 0.2531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09236972033977509, + "step": 2105, + "valid_targets_mean": 4362.0, + "valid_targets_min": 881 + }, + { + "epoch": 3.307450980392157, + "grad_norm": 0.46013772293585553, + "learning_rate": 2.5366148317364237e-05, + "loss": 0.2383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10060383379459381, + "step": 2110, + "valid_targets_mean": 3963.4, + "valid_targets_min": 799 + }, + { + "epoch": 3.315294117647059, + "grad_norm": 0.41304440348713223, + "learning_rate": 2.5290805185286494e-05, + "loss": 0.2358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10279671102762222, + "step": 2115, + "valid_targets_mean": 4324.1, + "valid_targets_min": 909 + }, + { + "epoch": 3.323137254901961, + "grad_norm": 0.39225623307144264, + "learning_rate": 2.521538123207111e-05, + "loss": 0.244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1322818249464035, + "step": 2120, + "valid_targets_mean": 5806.5, + "valid_targets_min": 897 + }, + { + "epoch": 3.330980392156863, + "grad_norm": 0.4904865566407993, + "learning_rate": 2.5139877609877244e-05, + "loss": 0.2586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13356977701187134, + "step": 2125, + "valid_targets_mean": 5983.1, + "valid_targets_min": 3689 + }, + { + "epoch": 3.3388235294117647, + "grad_norm": 0.4198231556106936, + "learning_rate": 2.506429547208107e-05, + "loss": 0.2442, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10872642695903778, + "step": 2130, + "valid_targets_mean": 4768.0, + "valid_targets_min": 4005 + }, + { + "epoch": 3.3466666666666667, + "grad_norm": 0.45380194517033634, + "learning_rate": 2.498863597325815e-05, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11521173268556595, + "step": 2135, + "valid_targets_mean": 5030.1, + "valid_targets_min": 808 + }, + { + "epoch": 3.3545098039215686, + "grad_norm": 0.43347927756835075, + "learning_rate": 2.4912900269165797e-05, + "loss": 0.2392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13011592626571655, + "step": 2140, + "valid_targets_mean": 6122.5, + "valid_targets_min": 3536 + }, + { + "epoch": 3.3623529411764705, + "grad_norm": 0.4271739715689149, + "learning_rate": 2.483708951672541e-05, + "loss": 0.2453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1262693703174591, + "step": 2145, + "valid_targets_mean": 5268.2, + "valid_targets_min": 3765 + }, + { + "epoch": 3.3701960784313725, + "grad_norm": 0.4025912834365145, + "learning_rate": 2.4761204874004818e-05, + "loss": 0.2361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12437351047992706, + "step": 2150, + "valid_targets_mean": 5548.9, + "valid_targets_min": 3340 + }, + { + "epoch": 3.3780392156862744, + "grad_norm": 0.45364220463006383, + "learning_rate": 2.4685247500200583e-05, + "loss": 0.2367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10871313512325287, + "step": 2155, + "valid_targets_mean": 4770.6, + "valid_targets_min": 578 + }, + { + "epoch": 3.3858823529411763, + "grad_norm": 0.44490191755890435, + "learning_rate": 2.4609218555620275e-05, + "loss": 0.2494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12509560585021973, + "step": 2160, + "valid_targets_mean": 5227.4, + "valid_targets_min": 4045 + }, + { + "epoch": 3.3937254901960783, + "grad_norm": 0.40037646667924837, + "learning_rate": 2.4533119201664785e-05, + "loss": 0.2504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10177329182624817, + "step": 2165, + "valid_targets_mean": 4978.2, + "valid_targets_min": 3524 + }, + { + "epoch": 3.40156862745098, + "grad_norm": 0.4155901937269117, + "learning_rate": 2.4456950600810542e-05, + "loss": 0.2416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15294963121414185, + "step": 2170, + "valid_targets_mean": 6141.0, + "valid_targets_min": 3708 + }, + { + "epoch": 3.409411764705882, + "grad_norm": 0.4641026797448153, + "learning_rate": 2.4380713916591785e-05, + "loss": 0.243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12357586622238159, + "step": 2175, + "valid_targets_mean": 4147.4, + "valid_targets_min": 1039 + }, + { + "epoch": 3.417254901960784, + "grad_norm": 0.4171810410522086, + "learning_rate": 2.4304410313582776e-05, + "loss": 0.2604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12325207889080048, + "step": 2180, + "valid_targets_mean": 5426.9, + "valid_targets_min": 537 + }, + { + "epoch": 3.4250980392156865, + "grad_norm": 0.46416076819498153, + "learning_rate": 2.422804095738002e-05, + "loss": 0.2497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08827514946460724, + "step": 2185, + "valid_targets_mean": 3166.9, + "valid_targets_min": 535 + }, + { + "epoch": 3.4329411764705884, + "grad_norm": 0.4532483257717387, + "learning_rate": 2.4151607014584437e-05, + "loss": 0.2534, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15844324231147766, + "step": 2190, + "valid_targets_mean": 7008.6, + "valid_targets_min": 4008 + }, + { + "epoch": 3.4407843137254903, + "grad_norm": 0.44426263058425547, + "learning_rate": 2.4075109652783573e-05, + "loss": 0.2599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11195256561040878, + "step": 2195, + "valid_targets_mean": 4449.6, + "valid_targets_min": 827 + }, + { + "epoch": 3.4486274509803923, + "grad_norm": 0.4782397885162491, + "learning_rate": 2.3998550040533743e-05, + "loss": 0.2602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13909482955932617, + "step": 2200, + "valid_targets_mean": 4378.5, + "valid_targets_min": 1104 + }, + { + "epoch": 3.456470588235294, + "grad_norm": 0.4702721164139716, + "learning_rate": 2.392192934734219e-05, + "loss": 0.2466, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13552600145339966, + "step": 2205, + "valid_targets_mean": 4721.4, + "valid_targets_min": 3900 + }, + { + "epoch": 3.464313725490196, + "grad_norm": 0.43475168828785626, + "learning_rate": 2.3845248743649196e-05, + "loss": 0.2353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1300785392522812, + "step": 2210, + "valid_targets_mean": 5198.1, + "valid_targets_min": 3612 + }, + { + "epoch": 3.472156862745098, + "grad_norm": 0.43867207693018295, + "learning_rate": 2.376850940081025e-05, + "loss": 0.2518, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14244931936264038, + "step": 2215, + "valid_targets_mean": 5360.0, + "valid_targets_min": 3791 + }, + { + "epoch": 3.48, + "grad_norm": 0.44063741886627417, + "learning_rate": 2.3691712491078107e-05, + "loss": 0.2456, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09964333474636078, + "step": 2220, + "valid_targets_mean": 4041.4, + "valid_targets_min": 811 + }, + { + "epoch": 3.487843137254902, + "grad_norm": 0.42522725919593213, + "learning_rate": 2.3614859187584914e-05, + "loss": 0.2494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13847005367279053, + "step": 2225, + "valid_targets_mean": 4862.5, + "valid_targets_min": 1989 + }, + { + "epoch": 3.495686274509804, + "grad_norm": 0.6390226843494196, + "learning_rate": 2.353795066432427e-05, + "loss": 0.2498, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1294592320919037, + "step": 2230, + "valid_targets_mean": 6039.2, + "valid_targets_min": 4011 + }, + { + "epoch": 3.503529411764706, + "grad_norm": 0.4288414756464652, + "learning_rate": 2.3460988096133284e-05, + "loss": 0.2499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12420792132616043, + "step": 2235, + "valid_targets_mean": 5175.9, + "valid_targets_min": 3530 + }, + { + "epoch": 3.5113725490196077, + "grad_norm": 0.43668336523298357, + "learning_rate": 2.338397265867468e-05, + "loss": 0.2526, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11191526055335999, + "step": 2240, + "valid_targets_mean": 4937.1, + "valid_targets_min": 4136 + }, + { + "epoch": 3.5192156862745096, + "grad_norm": 0.4668546590697348, + "learning_rate": 2.3306905528418762e-05, + "loss": 0.2488, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14170069992542267, + "step": 2245, + "valid_targets_mean": 5523.1, + "valid_targets_min": 3314 + }, + { + "epoch": 3.527058823529412, + "grad_norm": 0.4235869993667335, + "learning_rate": 2.3229787882625496e-05, + "loss": 0.2439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12099191546440125, + "step": 2250, + "valid_targets_mean": 4769.6, + "valid_targets_min": 3255 + }, + { + "epoch": 3.534901960784314, + "grad_norm": 0.43656476223885277, + "learning_rate": 2.315262089932653e-05, + "loss": 0.2594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12198434770107269, + "step": 2255, + "valid_targets_mean": 5176.5, + "valid_targets_min": 4087 + }, + { + "epoch": 3.542745098039216, + "grad_norm": 0.4152031042873841, + "learning_rate": 2.3075405757307147e-05, + "loss": 0.2528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12806783616542816, + "step": 2260, + "valid_targets_mean": 6016.6, + "valid_targets_min": 3494 + }, + { + "epoch": 3.550588235294118, + "grad_norm": 0.43654785463193213, + "learning_rate": 2.2998143636088323e-05, + "loss": 0.243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11978089809417725, + "step": 2265, + "valid_targets_mean": 5109.9, + "valid_targets_min": 3790 + }, + { + "epoch": 3.5584313725490198, + "grad_norm": 0.45198424570474105, + "learning_rate": 2.2920835715908654e-05, + "loss": 0.2404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13197702169418335, + "step": 2270, + "valid_targets_mean": 4443.2, + "valid_targets_min": 840 + }, + { + "epoch": 3.5662745098039217, + "grad_norm": 0.4250985223444925, + "learning_rate": 2.2843483177706363e-05, + "loss": 0.2461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.149743914604187, + "step": 2275, + "valid_targets_mean": 6065.6, + "valid_targets_min": 3785 + }, + { + "epoch": 3.5741176470588236, + "grad_norm": 0.4173987075467208, + "learning_rate": 2.2766087203101245e-05, + "loss": 0.2502, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1250050663948059, + "step": 2280, + "valid_targets_mean": 5207.5, + "valid_targets_min": 3569 + }, + { + "epoch": 3.5819607843137256, + "grad_norm": 0.45314085836943274, + "learning_rate": 2.2688648974376622e-05, + "loss": 0.2293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10489747673273087, + "step": 2285, + "valid_targets_mean": 3719.0, + "valid_targets_min": 691 + }, + { + "epoch": 3.5898039215686275, + "grad_norm": 0.44051637331745386, + "learning_rate": 2.261116967446127e-05, + "loss": 0.2375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1355193555355072, + "step": 2290, + "valid_targets_mean": 4599.1, + "valid_targets_min": 4026 + }, + { + "epoch": 3.5976470588235294, + "grad_norm": 0.4728518002937475, + "learning_rate": 2.2533650486911375e-05, + "loss": 0.2399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13677480816841125, + "step": 2295, + "valid_targets_mean": 4525.0, + "valid_targets_min": 593 + }, + { + "epoch": 3.6054901960784314, + "grad_norm": 0.4008279926262856, + "learning_rate": 2.245609259589243e-05, + "loss": 0.2454, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10138443112373352, + "step": 2300, + "valid_targets_mean": 5378.1, + "valid_targets_min": 3568 + }, + { + "epoch": 3.6133333333333333, + "grad_norm": 0.4265027129685831, + "learning_rate": 2.2378497186161146e-05, + "loss": 0.2472, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1514357626438141, + "step": 2305, + "valid_targets_mean": 6498.0, + "valid_targets_min": 634 + }, + { + "epoch": 3.621176470588235, + "grad_norm": 0.4746697315873271, + "learning_rate": 2.230086544304737e-05, + "loss": 0.2509, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1213865876197815, + "step": 2310, + "valid_targets_mean": 4269.1, + "valid_targets_min": 612 + }, + { + "epoch": 3.629019607843137, + "grad_norm": 0.464244944957954, + "learning_rate": 2.222319855243597e-05, + "loss": 0.2427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11628014594316483, + "step": 2315, + "valid_targets_mean": 4143.0, + "valid_targets_min": 1031 + }, + { + "epoch": 3.636862745098039, + "grad_norm": 0.4020090060829787, + "learning_rate": 2.2145497700748723e-05, + "loss": 0.256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11320920288562775, + "step": 2320, + "valid_targets_mean": 5850.8, + "valid_targets_min": 3387 + }, + { + "epoch": 3.644705882352941, + "grad_norm": 0.4007527110243504, + "learning_rate": 2.2067764074926163e-05, + "loss": 0.2468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13083413243293762, + "step": 2325, + "valid_targets_mean": 5778.8, + "valid_targets_min": 3775 + }, + { + "epoch": 3.652549019607843, + "grad_norm": 0.4347470779889978, + "learning_rate": 2.198999886240951e-05, + "loss": 0.2423, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10197200626134872, + "step": 2330, + "valid_targets_mean": 4524.2, + "valid_targets_min": 747 + }, + { + "epoch": 3.660392156862745, + "grad_norm": 0.4345175758531176, + "learning_rate": 2.1912203251122475e-05, + "loss": 0.243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11358082294464111, + "step": 2335, + "valid_targets_mean": 5199.6, + "valid_targets_min": 3988 + }, + { + "epoch": 3.668235294117647, + "grad_norm": 0.4007587051470908, + "learning_rate": 2.1834378429453133e-05, + "loss": 0.2393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13197997212409973, + "step": 2340, + "valid_targets_mean": 5778.9, + "valid_targets_min": 3808 + }, + { + "epoch": 3.6760784313725487, + "grad_norm": 0.4494627231362916, + "learning_rate": 2.175652558623577e-05, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12308965623378754, + "step": 2345, + "valid_targets_mean": 5130.2, + "valid_targets_min": 3482 + }, + { + "epoch": 3.683921568627451, + "grad_norm": 0.4152150942753047, + "learning_rate": 2.1678645910732734e-05, + "loss": 0.2492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1369512677192688, + "step": 2350, + "valid_targets_mean": 6060.2, + "valid_targets_min": 4055 + }, + { + "epoch": 3.691764705882353, + "grad_norm": 0.4712923072777983, + "learning_rate": 2.1600740592616245e-05, + "loss": 0.252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09407570213079453, + "step": 2355, + "valid_targets_mean": 4600.4, + "valid_targets_min": 3945 + }, + { + "epoch": 3.699607843137255, + "grad_norm": 0.4105138321258731, + "learning_rate": 2.152281082195024e-05, + "loss": 0.2372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12141579389572144, + "step": 2360, + "valid_targets_mean": 4882.1, + "valid_targets_min": 3774 + }, + { + "epoch": 3.707450980392157, + "grad_norm": 0.45925298953338334, + "learning_rate": 2.1444857789172185e-05, + "loss": 0.2421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11542713642120361, + "step": 2365, + "valid_targets_mean": 4519.5, + "valid_targets_min": 3414 + }, + { + "epoch": 3.715294117647059, + "grad_norm": 0.45517657387663035, + "learning_rate": 2.1366882685074892e-05, + "loss": 0.2538, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12940552830696106, + "step": 2370, + "valid_targets_mean": 4775.5, + "valid_targets_min": 785 + }, + { + "epoch": 3.723137254901961, + "grad_norm": 0.42564920456574895, + "learning_rate": 2.1288886700788335e-05, + "loss": 0.2389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13440310955047607, + "step": 2375, + "valid_targets_mean": 5391.8, + "valid_targets_min": 585 + }, + { + "epoch": 3.7309803921568627, + "grad_norm": 0.6178229501585953, + "learning_rate": 2.1210871027761438e-05, + "loss": 0.2618, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13043555617332458, + "step": 2380, + "valid_targets_mean": 5792.1, + "valid_targets_min": 3642 + }, + { + "epoch": 3.7388235294117647, + "grad_norm": 0.4102212916044459, + "learning_rate": 2.1132836857743903e-05, + "loss": 0.2359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13514447212219238, + "step": 2385, + "valid_targets_mean": 5541.0, + "valid_targets_min": 4262 + }, + { + "epoch": 3.7466666666666666, + "grad_norm": 0.4345973715149457, + "learning_rate": 2.105478538276797e-05, + "loss": 0.2378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11293156445026398, + "step": 2390, + "valid_targets_mean": 4884.6, + "valid_targets_min": 2117 + }, + { + "epoch": 3.7545098039215685, + "grad_norm": 0.4055907879478308, + "learning_rate": 2.0976717795130233e-05, + "loss": 0.2362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12585970759391785, + "step": 2395, + "valid_targets_mean": 5308.1, + "valid_targets_min": 3482 + }, + { + "epoch": 3.7623529411764705, + "grad_norm": 0.5125677754224955, + "learning_rate": 2.0898635287373423e-05, + "loss": 0.2544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17816469073295593, + "step": 2400, + "valid_targets_mean": 5720.0, + "valid_targets_min": 965 + }, + { + "epoch": 3.7701960784313724, + "grad_norm": 0.4433647739611089, + "learning_rate": 2.0820539052268186e-05, + "loss": 0.2373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09588039666414261, + "step": 2405, + "valid_targets_mean": 3557.0, + "valid_targets_min": 537 + }, + { + "epoch": 3.7780392156862748, + "grad_norm": 0.40809336018652104, + "learning_rate": 2.0742430282794857e-05, + "loss": 0.2308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09966695308685303, + "step": 2410, + "valid_targets_mean": 4593.8, + "valid_targets_min": 1211 + }, + { + "epoch": 3.7858823529411767, + "grad_norm": 0.41957665576470976, + "learning_rate": 2.0664310172125242e-05, + "loss": 0.2518, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10396531969308853, + "step": 2415, + "valid_targets_mean": 4152.6, + "valid_targets_min": 783 + }, + { + "epoch": 3.7937254901960786, + "grad_norm": 0.44894426328179443, + "learning_rate": 2.0586179913604413e-05, + "loss": 0.2391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11163697391748428, + "step": 2420, + "valid_targets_mean": 4620.6, + "valid_targets_min": 3845 + }, + { + "epoch": 3.8015686274509806, + "grad_norm": 0.3977540873194003, + "learning_rate": 2.0508040700732438e-05, + "loss": 0.247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19368122518062592, + "step": 2425, + "valid_targets_mean": 7945.9, + "valid_targets_min": 3828 + }, + { + "epoch": 3.8094117647058825, + "grad_norm": 0.45889914530307035, + "learning_rate": 2.0429893727146167e-05, + "loss": 0.2416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11084446310997009, + "step": 2430, + "valid_targets_mean": 4031.5, + "valid_targets_min": 785 + }, + { + "epoch": 3.8172549019607844, + "grad_norm": 0.48554569449891527, + "learning_rate": 2.0351740186601012e-05, + "loss": 0.2564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1371164172887802, + "step": 2435, + "valid_targets_mean": 5224.0, + "valid_targets_min": 727 + }, + { + "epoch": 3.8250980392156864, + "grad_norm": 0.44497973302423827, + "learning_rate": 2.0273581272952708e-05, + "loss": 0.2528, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09165876358747482, + "step": 2440, + "valid_targets_mean": 3842.6, + "valid_targets_min": 692 + }, + { + "epoch": 3.8329411764705883, + "grad_norm": 0.44165704466795486, + "learning_rate": 2.0195418180139055e-05, + "loss": 0.2385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11761967837810516, + "step": 2445, + "valid_targets_mean": 4286.0, + "valid_targets_min": 3469 + }, + { + "epoch": 3.8407843137254902, + "grad_norm": 0.47116094179324775, + "learning_rate": 2.0117252102161687e-05, + "loss": 0.2499, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12916581332683563, + "step": 2450, + "valid_targets_mean": 3781.9, + "valid_targets_min": 672 + }, + { + "epoch": 3.848627450980392, + "grad_norm": 0.4432899814548258, + "learning_rate": 2.0039084233067853e-05, + "loss": 0.2417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09984422475099564, + "step": 2455, + "valid_targets_mean": 4347.4, + "valid_targets_min": 3304 + }, + { + "epoch": 3.856470588235294, + "grad_norm": 0.43238947024639623, + "learning_rate": 1.9960915766932153e-05, + "loss": 0.2549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14688940346240997, + "step": 2460, + "valid_targets_mean": 6676.2, + "valid_targets_min": 4367 + }, + { + "epoch": 3.864313725490196, + "grad_norm": 0.4441903847270208, + "learning_rate": 1.988274789783832e-05, + "loss": 0.239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12853792309761047, + "step": 2465, + "valid_targets_mean": 4793.4, + "valid_targets_min": 4049 + }, + { + "epoch": 3.872156862745098, + "grad_norm": 0.4069753596366182, + "learning_rate": 1.9804581819860952e-05, + "loss": 0.2343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13356426358222961, + "step": 2470, + "valid_targets_mean": 5416.6, + "valid_targets_min": 4194 + }, + { + "epoch": 3.88, + "grad_norm": 0.4361007055406648, + "learning_rate": 1.9726418727047295e-05, + "loss": 0.26, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12676510214805603, + "step": 2475, + "valid_targets_mean": 5579.5, + "valid_targets_min": 1244 + }, + { + "epoch": 3.887843137254902, + "grad_norm": 0.4198017556701137, + "learning_rate": 1.9648259813398987e-05, + "loss": 0.2448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1500803530216217, + "step": 2480, + "valid_targets_mean": 6409.1, + "valid_targets_min": 3902 + }, + { + "epoch": 3.8956862745098038, + "grad_norm": 0.42378635541342735, + "learning_rate": 1.957010627285384e-05, + "loss": 0.2365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13810518383979797, + "step": 2485, + "valid_targets_mean": 6154.2, + "valid_targets_min": 912 + }, + { + "epoch": 3.9035294117647057, + "grad_norm": 0.4330011404936207, + "learning_rate": 1.9491959299267572e-05, + "loss": 0.2309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12688998878002167, + "step": 2490, + "valid_targets_mean": 4943.1, + "valid_targets_min": 3557 + }, + { + "epoch": 3.9113725490196076, + "grad_norm": 0.43668303326520075, + "learning_rate": 1.941382008639559e-05, + "loss": 0.2422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1096714660525322, + "step": 2495, + "valid_targets_mean": 4343.4, + "valid_targets_min": 1011 + }, + { + "epoch": 3.9192156862745096, + "grad_norm": 0.45479288831404163, + "learning_rate": 1.933568982787476e-05, + "loss": 0.248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.143254354596138, + "step": 2500, + "valid_targets_mean": 5751.5, + "valid_targets_min": 4181 + }, + { + "epoch": 3.9270588235294115, + "grad_norm": 0.42946212220942426, + "learning_rate": 1.9257569717205153e-05, + "loss": 0.2445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10440149158239365, + "step": 2505, + "valid_targets_mean": 4229.2, + "valid_targets_min": 710 + }, + { + "epoch": 3.934901960784314, + "grad_norm": 0.43173231505010357, + "learning_rate": 1.9179460947731824e-05, + "loss": 0.2365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11701091378927231, + "step": 2510, + "valid_targets_mean": 4764.4, + "valid_targets_min": 3967 + }, + { + "epoch": 3.942745098039216, + "grad_norm": 0.4179666973800945, + "learning_rate": 1.9101364712626577e-05, + "loss": 0.2354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1057259738445282, + "step": 2515, + "valid_targets_mean": 4593.4, + "valid_targets_min": 3174 + }, + { + "epoch": 3.9505882352941177, + "grad_norm": 0.41267797631647846, + "learning_rate": 1.9023282204869767e-05, + "loss": 0.2474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1084958016872406, + "step": 2520, + "valid_targets_mean": 5013.1, + "valid_targets_min": 3702 + }, + { + "epoch": 3.9584313725490197, + "grad_norm": 0.4182805319321907, + "learning_rate": 1.8945214617232036e-05, + "loss": 0.2516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1471642702817917, + "step": 2525, + "valid_targets_mean": 5577.8, + "valid_targets_min": 4326 + }, + { + "epoch": 3.9662745098039216, + "grad_norm": 0.7234435491670909, + "learning_rate": 1.88671631422561e-05, + "loss": 0.2496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09615735709667206, + "step": 2530, + "valid_targets_mean": 4327.0, + "valid_targets_min": 921 + }, + { + "epoch": 3.9741176470588235, + "grad_norm": 0.42254129246244126, + "learning_rate": 1.8789128972238565e-05, + "loss": 0.2444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0965128019452095, + "step": 2535, + "valid_targets_mean": 4908.0, + "valid_targets_min": 1678 + }, + { + "epoch": 3.9819607843137255, + "grad_norm": 0.4108845812599496, + "learning_rate": 1.8711113299211675e-05, + "loss": 0.2472, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1227368712425232, + "step": 2540, + "valid_targets_mean": 5048.0, + "valid_targets_min": 3740 + }, + { + "epoch": 3.9898039215686274, + "grad_norm": 0.34816284688558613, + "learning_rate": 1.8633117314925118e-05, + "loss": 0.2436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11549834907054901, + "step": 2545, + "valid_targets_mean": 7279.1, + "valid_targets_min": 4113 + }, + { + "epoch": 3.9976470588235293, + "grad_norm": 0.4017959546348958, + "learning_rate": 1.855514221082782e-05, + "loss": 0.2375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12120068818330765, + "step": 2550, + "valid_targets_mean": 5609.5, + "valid_targets_min": 3329 + }, + { + "epoch": 4.004705882352941, + "grad_norm": 0.39569157004085714, + "learning_rate": 1.8477189178049764e-05, + "loss": 0.2473, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1075434684753418, + "step": 2555, + "valid_targets_mean": 5506.8, + "valid_targets_min": 3669 + }, + { + "epoch": 4.012549019607843, + "grad_norm": 0.41935713908603817, + "learning_rate": 1.839925940738376e-05, + "loss": 0.237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1180042028427124, + "step": 2560, + "valid_targets_mean": 5294.9, + "valid_targets_min": 849 + }, + { + "epoch": 4.020392156862745, + "grad_norm": 0.4394484999752763, + "learning_rate": 1.8321354089267272e-05, + "loss": 0.236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10508240014314651, + "step": 2565, + "valid_targets_mean": 4761.2, + "valid_targets_min": 891 + }, + { + "epoch": 4.028235294117647, + "grad_norm": 0.44221495285080337, + "learning_rate": 1.8243474413764236e-05, + "loss": 0.2386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18124812841415405, + "step": 2570, + "valid_targets_mean": 7468.4, + "valid_targets_min": 3878 + }, + { + "epoch": 4.036078431372549, + "grad_norm": 0.4132976841846695, + "learning_rate": 1.8165621570546874e-05, + "loss": 0.2272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11682303994894028, + "step": 2575, + "valid_targets_mean": 5616.6, + "valid_targets_min": 3473 + }, + { + "epoch": 4.043921568627451, + "grad_norm": 0.4568921049954836, + "learning_rate": 1.808779674887753e-05, + "loss": 0.2429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11188096553087234, + "step": 2580, + "valid_targets_mean": 4916.9, + "valid_targets_min": 747 + }, + { + "epoch": 4.051764705882353, + "grad_norm": 0.4622869017756218, + "learning_rate": 1.801000113759049e-05, + "loss": 0.2481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10092595219612122, + "step": 2585, + "valid_targets_mean": 4231.2, + "valid_targets_min": 2038 + }, + { + "epoch": 4.059607843137255, + "grad_norm": 0.4176738466656865, + "learning_rate": 1.7932235925073836e-05, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08800789713859558, + "step": 2590, + "valid_targets_mean": 4712.8, + "valid_targets_min": 3705 + }, + { + "epoch": 4.067450980392157, + "grad_norm": 0.4241403087923899, + "learning_rate": 1.7854502299251284e-05, + "loss": 0.2241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1052800789475441, + "step": 2595, + "valid_targets_mean": 4965.0, + "valid_targets_min": 1951 + }, + { + "epoch": 4.075294117647059, + "grad_norm": 0.4705868076345857, + "learning_rate": 1.7776801447564032e-05, + "loss": 0.2394, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12272444367408752, + "step": 2600, + "valid_targets_mean": 4833.2, + "valid_targets_min": 3409 + }, + { + "epoch": 4.083137254901961, + "grad_norm": 0.4378490088120457, + "learning_rate": 1.7699134556952634e-05, + "loss": 0.2286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10248713195323944, + "step": 2605, + "valid_targets_mean": 4233.1, + "valid_targets_min": 678 + }, + { + "epoch": 4.090980392156863, + "grad_norm": 0.42865922256952516, + "learning_rate": 1.7621502813838864e-05, + "loss": 0.2334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10999415814876556, + "step": 2610, + "valid_targets_mean": 4333.8, + "valid_targets_min": 768 + }, + { + "epoch": 4.0988235294117645, + "grad_norm": 0.43159569485209737, + "learning_rate": 1.754390740410758e-05, + "loss": 0.2361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08083570003509521, + "step": 2615, + "valid_targets_mean": 3548.9, + "valid_targets_min": 496 + }, + { + "epoch": 4.1066666666666665, + "grad_norm": 0.5194467132035089, + "learning_rate": 1.7466349513088636e-05, + "loss": 0.2419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12257933616638184, + "step": 2620, + "valid_targets_mean": 4051.9, + "valid_targets_min": 713 + }, + { + "epoch": 4.114509803921568, + "grad_norm": 0.4139767381834643, + "learning_rate": 1.738883032553873e-05, + "loss": 0.2263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11203347146511078, + "step": 2625, + "valid_targets_mean": 5300.0, + "valid_targets_min": 3694 + }, + { + "epoch": 4.12235294117647, + "grad_norm": 0.45862693952462696, + "learning_rate": 1.7311351025623385e-05, + "loss": 0.2296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12201839685440063, + "step": 2630, + "valid_targets_mean": 5129.0, + "valid_targets_min": 4048 + }, + { + "epoch": 4.130196078431372, + "grad_norm": 0.4417442163099453, + "learning_rate": 1.723391279689876e-05, + "loss": 0.2435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17832894623279572, + "step": 2635, + "valid_targets_mean": 7041.9, + "valid_targets_min": 1176 + }, + { + "epoch": 4.138039215686274, + "grad_norm": 0.4350450889064667, + "learning_rate": 1.7156516822293644e-05, + "loss": 0.223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10031968355178833, + "step": 2640, + "valid_targets_mean": 4177.1, + "valid_targets_min": 532 + }, + { + "epoch": 4.145882352941176, + "grad_norm": 0.46888520664230127, + "learning_rate": 1.7079164284091353e-05, + "loss": 0.2274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10806365311145782, + "step": 2645, + "valid_targets_mean": 4084.9, + "valid_targets_min": 783 + }, + { + "epoch": 4.153725490196078, + "grad_norm": 0.41910197413913913, + "learning_rate": 1.7001856363911687e-05, + "loss": 0.2312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10648825764656067, + "step": 2650, + "valid_targets_mean": 5057.6, + "valid_targets_min": 671 + }, + { + "epoch": 4.16156862745098, + "grad_norm": 0.5218402944168531, + "learning_rate": 1.692459424269286e-05, + "loss": 0.2326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11246689409017563, + "step": 2655, + "valid_targets_mean": 3674.1, + "valid_targets_min": 775 + }, + { + "epoch": 4.169411764705882, + "grad_norm": 0.46180954109801275, + "learning_rate": 1.6847379100673474e-05, + "loss": 0.2337, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14503367245197296, + "step": 2660, + "valid_targets_mean": 5285.0, + "valid_targets_min": 488 + }, + { + "epoch": 4.177254901960785, + "grad_norm": 0.444249980676699, + "learning_rate": 1.6770212117374504e-05, + "loss": 0.229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10934904217720032, + "step": 2665, + "valid_targets_mean": 4780.2, + "valid_targets_min": 783 + }, + { + "epoch": 4.185098039215687, + "grad_norm": 0.465724690204505, + "learning_rate": 1.6693094471581244e-05, + "loss": 0.2205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10249033570289612, + "step": 2670, + "valid_targets_mean": 4325.9, + "valid_targets_min": 3458 + }, + { + "epoch": 4.192941176470589, + "grad_norm": 0.44416118201724536, + "learning_rate": 1.6616027341325328e-05, + "loss": 0.2293, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1000424325466156, + "step": 2675, + "valid_targets_mean": 4408.9, + "valid_targets_min": 2176 + }, + { + "epoch": 4.2007843137254905, + "grad_norm": 0.45587041013740054, + "learning_rate": 1.653901190386672e-05, + "loss": 0.2288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11124923825263977, + "step": 2680, + "valid_targets_mean": 4076.0, + "valid_targets_min": 569 + }, + { + "epoch": 4.2086274509803925, + "grad_norm": 0.4849010155411813, + "learning_rate": 1.646204933567574e-05, + "loss": 0.2377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11906752735376358, + "step": 2685, + "valid_targets_mean": 4709.2, + "valid_targets_min": 3212 + }, + { + "epoch": 4.216470588235294, + "grad_norm": 0.4550980097289989, + "learning_rate": 1.638514081241509e-05, + "loss": 0.2358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15008796751499176, + "step": 2690, + "valid_targets_mean": 5774.9, + "valid_targets_min": 738 + }, + { + "epoch": 4.224313725490196, + "grad_norm": 0.44042050024817103, + "learning_rate": 1.6308287508921893e-05, + "loss": 0.2452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09062080085277557, + "step": 2695, + "valid_targets_mean": 4297.5, + "valid_targets_min": 3574 + }, + { + "epoch": 4.232156862745098, + "grad_norm": 0.4247855213774718, + "learning_rate": 1.6231490599189753e-05, + "loss": 0.2295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12232277542352676, + "step": 2700, + "valid_targets_mean": 5617.2, + "valid_targets_min": 3678 + }, + { + "epoch": 4.24, + "grad_norm": 0.4404614212649334, + "learning_rate": 1.615475125635081e-05, + "loss": 0.2274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09367984533309937, + "step": 2705, + "valid_targets_mean": 4037.8, + "valid_targets_min": 3472 + }, + { + "epoch": 4.247843137254902, + "grad_norm": 0.4506826599579043, + "learning_rate": 1.607807065265782e-05, + "loss": 0.2334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10886059701442719, + "step": 2710, + "valid_targets_mean": 5706.8, + "valid_targets_min": 2538 + }, + { + "epoch": 4.255686274509804, + "grad_norm": 0.4782992698604372, + "learning_rate": 1.600144995946626e-05, + "loss": 0.2368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12588849663734436, + "step": 2715, + "valid_targets_mean": 4821.1, + "valid_targets_min": 272 + }, + { + "epoch": 4.263529411764706, + "grad_norm": 0.4510322699008573, + "learning_rate": 1.5924890347216433e-05, + "loss": 0.2317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11632902175188065, + "step": 2720, + "valid_targets_mean": 4474.1, + "valid_targets_min": 1068 + }, + { + "epoch": 4.271372549019608, + "grad_norm": 0.44522967831663324, + "learning_rate": 1.5848392985415573e-05, + "loss": 0.2358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11140655726194382, + "step": 2725, + "valid_targets_mean": 4962.0, + "valid_targets_min": 3536 + }, + { + "epoch": 4.27921568627451, + "grad_norm": 0.41416180143940035, + "learning_rate": 1.5771959042619983e-05, + "loss": 0.2304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09167453646659851, + "step": 2730, + "valid_targets_mean": 4499.6, + "valid_targets_min": 1455 + }, + { + "epoch": 4.287058823529412, + "grad_norm": 0.4121993785188106, + "learning_rate": 1.5695589686417224e-05, + "loss": 0.2313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09622062742710114, + "step": 2735, + "valid_targets_mean": 4420.5, + "valid_targets_min": 726 + }, + { + "epoch": 4.294901960784314, + "grad_norm": 0.4992264402830286, + "learning_rate": 1.561928608340822e-05, + "loss": 0.2407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09109040349721909, + "step": 2740, + "valid_targets_mean": 3033.8, + "valid_targets_min": 785 + }, + { + "epoch": 4.302745098039216, + "grad_norm": 0.6052650370274888, + "learning_rate": 1.554304939918946e-05, + "loss": 0.2363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09706152230501175, + "step": 2745, + "valid_targets_mean": 3555.8, + "valid_targets_min": 767 + }, + { + "epoch": 4.310588235294118, + "grad_norm": 0.43459356722197345, + "learning_rate": 1.5466880798335222e-05, + "loss": 0.2279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12693923711776733, + "step": 2750, + "valid_targets_mean": 5968.5, + "valid_targets_min": 4153 + }, + { + "epoch": 4.3184313725490195, + "grad_norm": 0.41454868256199134, + "learning_rate": 1.539078144437973e-05, + "loss": 0.2358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11799121648073196, + "step": 2755, + "valid_targets_mean": 6189.2, + "valid_targets_min": 3457 + }, + { + "epoch": 4.3262745098039215, + "grad_norm": 0.4376302429257829, + "learning_rate": 1.5314752499799427e-05, + "loss": 0.2328, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11019665002822876, + "step": 2760, + "valid_targets_mean": 5059.8, + "valid_targets_min": 1353 + }, + { + "epoch": 4.334117647058823, + "grad_norm": 0.49424493066282355, + "learning_rate": 1.5238795125995189e-05, + "loss": 0.2405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12486723065376282, + "step": 2765, + "valid_targets_mean": 4199.2, + "valid_targets_min": 751 + }, + { + "epoch": 4.341960784313725, + "grad_norm": 0.45864869228381433, + "learning_rate": 1.5162910483274593e-05, + "loss": 0.2287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11594164371490479, + "step": 2770, + "valid_targets_mean": 4496.1, + "valid_targets_min": 3342 + }, + { + "epoch": 4.349803921568627, + "grad_norm": 0.4290020306517361, + "learning_rate": 1.5087099730834207e-05, + "loss": 0.2493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14288020133972168, + "step": 2775, + "valid_targets_mean": 6175.4, + "valid_targets_min": 3887 + }, + { + "epoch": 4.357647058823529, + "grad_norm": 0.39691105380569963, + "learning_rate": 1.5011364026741855e-05, + "loss": 0.2426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13958340883255005, + "step": 2780, + "valid_targets_mean": 6673.4, + "valid_targets_min": 3618 + }, + { + "epoch": 4.365490196078431, + "grad_norm": 0.43661081180233746, + "learning_rate": 1.4935704527918937e-05, + "loss": 0.2469, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14695270359516144, + "step": 2785, + "valid_targets_mean": 6581.8, + "valid_targets_min": 4414 + }, + { + "epoch": 4.373333333333333, + "grad_norm": 0.40863500299394734, + "learning_rate": 1.4860122390122764e-05, + "loss": 0.228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14593222737312317, + "step": 2790, + "valid_targets_mean": 6116.5, + "valid_targets_min": 4051 + }, + { + "epoch": 4.381176470588235, + "grad_norm": 0.475295429629708, + "learning_rate": 1.4784618767928898e-05, + "loss": 0.2334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12581712007522583, + "step": 2795, + "valid_targets_mean": 4507.4, + "valid_targets_min": 3297 + }, + { + "epoch": 4.389019607843137, + "grad_norm": 0.45469343912432475, + "learning_rate": 1.4709194814713507e-05, + "loss": 0.2356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13349707424640656, + "step": 2800, + "valid_targets_mean": 4666.4, + "valid_targets_min": 1108 + }, + { + "epoch": 4.396862745098039, + "grad_norm": 0.41875147310143834, + "learning_rate": 1.4633851682635766e-05, + "loss": 0.2363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11100316047668457, + "step": 2805, + "valid_targets_mean": 4645.6, + "valid_targets_min": 980 + }, + { + "epoch": 4.404705882352941, + "grad_norm": 0.4408284838489042, + "learning_rate": 1.4558590522620239e-05, + "loss": 0.2378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14001163840293884, + "step": 2810, + "valid_targets_mean": 5793.5, + "valid_targets_min": 3699 + }, + { + "epoch": 4.412549019607843, + "grad_norm": 0.4646282293043246, + "learning_rate": 1.4483412484339301e-05, + "loss": 0.2344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11910644918680191, + "step": 2815, + "valid_targets_mean": 4785.8, + "valid_targets_min": 3638 + }, + { + "epoch": 4.420392156862745, + "grad_norm": 0.44310182616986576, + "learning_rate": 1.4408318716195581e-05, + "loss": 0.2325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1331317126750946, + "step": 2820, + "valid_targets_mean": 5117.9, + "valid_targets_min": 512 + }, + { + "epoch": 4.428235294117647, + "grad_norm": 0.48547553289245554, + "learning_rate": 1.4333310365304413e-05, + "loss": 0.2309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09377738833427429, + "step": 2825, + "valid_targets_mean": 4225.5, + "valid_targets_min": 474 + }, + { + "epoch": 4.436078431372549, + "grad_norm": 0.40807911759860815, + "learning_rate": 1.4258388577476322e-05, + "loss": 0.2373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10872749984264374, + "step": 2830, + "valid_targets_mean": 5272.0, + "valid_targets_min": 3551 + }, + { + "epoch": 4.443921568627451, + "grad_norm": 0.4279963815599532, + "learning_rate": 1.4183554497199514e-05, + "loss": 0.2393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.113418810069561, + "step": 2835, + "valid_targets_mean": 5528.8, + "valid_targets_min": 2550 + }, + { + "epoch": 4.451764705882353, + "grad_norm": 0.45965069219955873, + "learning_rate": 1.4108809267622381e-05, + "loss": 0.2336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10628610849380493, + "step": 2840, + "valid_targets_mean": 4212.6, + "valid_targets_min": 404 + }, + { + "epoch": 4.459607843137255, + "grad_norm": 0.42613985033761675, + "learning_rate": 1.4034154030536083e-05, + "loss": 0.2357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12714120745658875, + "step": 2845, + "valid_targets_mean": 5532.8, + "valid_targets_min": 4137 + }, + { + "epoch": 4.467450980392157, + "grad_norm": 0.4382198571804567, + "learning_rate": 1.3959589926357042e-05, + "loss": 0.2435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1308916211128235, + "step": 2850, + "valid_targets_mean": 5463.6, + "valid_targets_min": 664 + }, + { + "epoch": 4.475294117647059, + "grad_norm": 0.4192454419323077, + "learning_rate": 1.3885118094109575e-05, + "loss": 0.2209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08181822299957275, + "step": 2855, + "valid_targets_mean": 4375.1, + "valid_targets_min": 3878 + }, + { + "epoch": 4.483137254901961, + "grad_norm": 0.5532407130131899, + "learning_rate": 1.3810739671408467e-05, + "loss": 0.2409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09779887646436691, + "step": 2860, + "valid_targets_mean": 3727.5, + "valid_targets_min": 806 + }, + { + "epoch": 4.490980392156863, + "grad_norm": 0.444360439292349, + "learning_rate": 1.3736455794441596e-05, + "loss": 0.2323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11745741963386536, + "step": 2865, + "valid_targets_mean": 4643.2, + "valid_targets_min": 3131 + }, + { + "epoch": 4.498823529411765, + "grad_norm": 0.4200795782839923, + "learning_rate": 1.3662267597952588e-05, + "loss": 0.2285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12091678380966187, + "step": 2870, + "valid_targets_mean": 5856.4, + "valid_targets_min": 3370 + }, + { + "epoch": 4.506666666666667, + "grad_norm": 0.42488592060924674, + "learning_rate": 1.3588176215223463e-05, + "loss": 0.2376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10534407198429108, + "step": 2875, + "valid_targets_mean": 4626.0, + "valid_targets_min": 3890 + }, + { + "epoch": 4.514509803921569, + "grad_norm": 0.4200545765520546, + "learning_rate": 1.3514182778057365e-05, + "loss": 0.2331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10357141494750977, + "step": 2880, + "valid_targets_mean": 5135.2, + "valid_targets_min": 3790 + }, + { + "epoch": 4.522352941176471, + "grad_norm": 0.5215283256019683, + "learning_rate": 1.3440288416761216e-05, + "loss": 0.2279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12107962369918823, + "step": 2885, + "valid_targets_mean": 4660.5, + "valid_targets_min": 3653 + }, + { + "epoch": 4.530196078431373, + "grad_norm": 0.4424012943358386, + "learning_rate": 1.3366494260128484e-05, + "loss": 0.2332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10020311921834946, + "step": 2890, + "valid_targets_mean": 4800.6, + "valid_targets_min": 694 + }, + { + "epoch": 4.5380392156862746, + "grad_norm": 0.4286355399479813, + "learning_rate": 1.3292801435421935e-05, + "loss": 0.2312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1244986429810524, + "step": 2895, + "valid_targets_mean": 5535.9, + "valid_targets_min": 3469 + }, + { + "epoch": 4.5458823529411765, + "grad_norm": 0.430885468445451, + "learning_rate": 1.3219211068356418e-05, + "loss": 0.2367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14919069409370422, + "step": 2900, + "valid_targets_mean": 5873.8, + "valid_targets_min": 904 + }, + { + "epoch": 4.553725490196078, + "grad_norm": 0.45289858258160803, + "learning_rate": 1.3145724283081651e-05, + "loss": 0.2322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10817940533161163, + "step": 2905, + "valid_targets_mean": 4748.0, + "valid_targets_min": 4218 + }, + { + "epoch": 4.56156862745098, + "grad_norm": 0.41980663944214935, + "learning_rate": 1.3072342202165069e-05, + "loss": 0.2309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11044943332672119, + "step": 2910, + "valid_targets_mean": 5293.0, + "valid_targets_min": 3835 + }, + { + "epoch": 4.569411764705882, + "grad_norm": 0.4839386189792505, + "learning_rate": 1.2999065946574656e-05, + "loss": 0.2282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13633571565151215, + "step": 2915, + "valid_targets_mean": 5534.4, + "valid_targets_min": 3576 + }, + { + "epoch": 4.577254901960784, + "grad_norm": 0.42243480444753406, + "learning_rate": 1.2925896635661852e-05, + "loss": 0.2446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1725214570760727, + "step": 2920, + "valid_targets_mean": 7218.0, + "valid_targets_min": 4212 + }, + { + "epoch": 4.585098039215686, + "grad_norm": 0.4469954447796888, + "learning_rate": 1.2852835387144414e-05, + "loss": 0.2403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10223016887903214, + "step": 2925, + "valid_targets_mean": 4194.5, + "valid_targets_min": 3159 + }, + { + "epoch": 4.592941176470588, + "grad_norm": 0.45911654389244627, + "learning_rate": 1.2779883317089374e-05, + "loss": 0.2398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10432572662830353, + "step": 2930, + "valid_targets_mean": 4234.1, + "valid_targets_min": 675 + }, + { + "epoch": 4.60078431372549, + "grad_norm": 0.452905704169797, + "learning_rate": 1.2707041539895974e-05, + "loss": 0.2389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1017366498708725, + "step": 2935, + "valid_targets_mean": 4624.2, + "valid_targets_min": 3290 + }, + { + "epoch": 4.608627450980392, + "grad_norm": 0.4446195839335299, + "learning_rate": 1.2634311168278652e-05, + "loss": 0.2253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1165042296051979, + "step": 2940, + "valid_targets_mean": 5227.2, + "valid_targets_min": 677 + }, + { + "epoch": 4.616470588235294, + "grad_norm": 0.39868825687973575, + "learning_rate": 1.2561693313250034e-05, + "loss": 0.2257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09707609564065933, + "step": 2945, + "valid_targets_mean": 5251.4, + "valid_targets_min": 3902 + }, + { + "epoch": 4.624313725490196, + "grad_norm": 0.4216177868655537, + "learning_rate": 1.248918908410396e-05, + "loss": 0.2418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10996775329113007, + "step": 2950, + "valid_targets_mean": 4927.2, + "valid_targets_min": 2015 + }, + { + "epoch": 4.632156862745098, + "grad_norm": 0.7264160142237203, + "learning_rate": 1.2416799588398576e-05, + "loss": 0.2209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08461538702249527, + "step": 2955, + "valid_targets_mean": 4145.6, + "valid_targets_min": 942 + }, + { + "epoch": 4.64, + "grad_norm": 0.4291908154396816, + "learning_rate": 1.2344525931939359e-05, + "loss": 0.235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11082827299833298, + "step": 2960, + "valid_targets_mean": 5010.8, + "valid_targets_min": 2231 + }, + { + "epoch": 4.647843137254902, + "grad_norm": 0.4199152718325381, + "learning_rate": 1.2272369218762266e-05, + "loss": 0.2365, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12899282574653625, + "step": 2965, + "valid_targets_mean": 5659.4, + "valid_targets_min": 3966 + }, + { + "epoch": 4.6556862745098035, + "grad_norm": 0.4604380546521672, + "learning_rate": 1.2200330551116838e-05, + "loss": 0.2249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11434175074100494, + "step": 2970, + "valid_targets_mean": 4256.5, + "valid_targets_min": 702 + }, + { + "epoch": 4.663529411764706, + "grad_norm": 0.49072667250137836, + "learning_rate": 1.2128411029449403e-05, + "loss": 0.2407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11742053925991058, + "step": 2975, + "valid_targets_mean": 4721.1, + "valid_targets_min": 974 + }, + { + "epoch": 4.671372549019608, + "grad_norm": 0.458501520651535, + "learning_rate": 1.205661175238622e-05, + "loss": 0.2302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12470651417970657, + "step": 2980, + "valid_targets_mean": 5843.1, + "valid_targets_min": 3848 + }, + { + "epoch": 4.67921568627451, + "grad_norm": 0.4308150069093234, + "learning_rate": 1.1984933816716726e-05, + "loss": 0.2355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12182128429412842, + "step": 2985, + "valid_targets_mean": 5752.2, + "valid_targets_min": 3848 + }, + { + "epoch": 4.687058823529412, + "grad_norm": 0.44479697330206897, + "learning_rate": 1.1913378317376796e-05, + "loss": 0.2378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11784543842077255, + "step": 2990, + "valid_targets_mean": 5041.1, + "valid_targets_min": 3733 + }, + { + "epoch": 4.694901960784314, + "grad_norm": 0.44454023318061986, + "learning_rate": 1.1841946347431961e-05, + "loss": 0.2237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10518812388181686, + "step": 2995, + "valid_targets_mean": 4918.2, + "valid_targets_min": 3311 + }, + { + "epoch": 4.702745098039216, + "grad_norm": 0.4183316201089064, + "learning_rate": 1.1770638998060764e-05, + "loss": 0.2299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10675269365310669, + "step": 3000, + "valid_targets_mean": 4699.8, + "valid_targets_min": 4095 + }, + { + "epoch": 4.710588235294118, + "grad_norm": 0.41360698717185757, + "learning_rate": 1.1699457358538072e-05, + "loss": 0.2401, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09616823494434357, + "step": 3005, + "valid_targets_mean": 5704.4, + "valid_targets_min": 4123 + }, + { + "epoch": 4.71843137254902, + "grad_norm": 0.4113294167567783, + "learning_rate": 1.1628402516218432e-05, + "loss": 0.2314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10045308619737625, + "step": 3010, + "valid_targets_mean": 4660.0, + "valid_targets_min": 3935 + }, + { + "epoch": 4.726274509803922, + "grad_norm": 0.4997749546359887, + "learning_rate": 1.1557475556519461e-05, + "loss": 0.2285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11495951563119888, + "step": 3015, + "valid_targets_mean": 3924.1, + "valid_targets_min": 893 + }, + { + "epoch": 4.734117647058824, + "grad_norm": 0.4469295834755647, + "learning_rate": 1.1486677562905281e-05, + "loss": 0.2271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1331641972064972, + "step": 3020, + "valid_targets_mean": 5024.4, + "valid_targets_min": 3857 + }, + { + "epoch": 4.741960784313726, + "grad_norm": 0.3873914400544633, + "learning_rate": 1.1416009616869959e-05, + "loss": 0.235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1114264726638794, + "step": 3025, + "valid_targets_mean": 5801.9, + "valid_targets_min": 2997 + }, + { + "epoch": 4.749803921568628, + "grad_norm": 0.4225044408926774, + "learning_rate": 1.134547279792098e-05, + "loss": 0.2352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13369326293468475, + "step": 3030, + "valid_targets_mean": 6771.4, + "valid_targets_min": 3721 + }, + { + "epoch": 4.75764705882353, + "grad_norm": 0.49039891697784743, + "learning_rate": 1.1275068183562747e-05, + "loss": 0.2345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1427251100540161, + "step": 3035, + "valid_targets_mean": 5687.2, + "valid_targets_min": 704 + }, + { + "epoch": 4.7654901960784315, + "grad_norm": 0.45410172670277094, + "learning_rate": 1.1204796849280167e-05, + "loss": 0.2436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10159337520599365, + "step": 3040, + "valid_targets_mean": 4214.5, + "valid_targets_min": 614 + }, + { + "epoch": 4.773333333333333, + "grad_norm": 0.4622914859651975, + "learning_rate": 1.1134659868522158e-05, + "loss": 0.2396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1267380267381668, + "step": 3045, + "valid_targets_mean": 5010.5, + "valid_targets_min": 782 + }, + { + "epoch": 4.781176470588235, + "grad_norm": 0.47045215080087177, + "learning_rate": 1.106465831268531e-05, + "loss": 0.2344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11707454174757004, + "step": 3050, + "valid_targets_mean": 5423.0, + "valid_targets_min": 3482 + }, + { + "epoch": 4.789019607843137, + "grad_norm": 0.48230473285593406, + "learning_rate": 1.0994793251097468e-05, + "loss": 0.2329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10609722137451172, + "step": 3055, + "valid_targets_mean": 4305.5, + "valid_targets_min": 3645 + }, + { + "epoch": 4.796862745098039, + "grad_norm": 0.5021067379610036, + "learning_rate": 1.0925065751001445e-05, + "loss": 0.2316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10157807916402817, + "step": 3060, + "valid_targets_mean": 3710.1, + "valid_targets_min": 909 + }, + { + "epoch": 4.804705882352941, + "grad_norm": 0.4409944385549482, + "learning_rate": 1.0855476877538687e-05, + "loss": 0.2328, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10870078951120377, + "step": 3065, + "valid_targets_mean": 4619.1, + "valid_targets_min": 3695 + }, + { + "epoch": 4.812549019607843, + "grad_norm": 0.44312872363060424, + "learning_rate": 1.0786027693733015e-05, + "loss": 0.2281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09856695681810379, + "step": 3070, + "valid_targets_mean": 4376.0, + "valid_targets_min": 649 + }, + { + "epoch": 4.820392156862745, + "grad_norm": 0.4228137519417471, + "learning_rate": 1.0716719260474365e-05, + "loss": 0.2284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08073513954877853, + "step": 3075, + "valid_targets_mean": 3504.0, + "valid_targets_min": 246 + }, + { + "epoch": 4.828235294117647, + "grad_norm": 0.4492912860086454, + "learning_rate": 1.0647552636502629e-05, + "loss": 0.2468, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12045551091432571, + "step": 3080, + "valid_targets_mean": 4412.9, + "valid_targets_min": 715 + }, + { + "epoch": 4.836078431372549, + "grad_norm": 1.0408966059706204, + "learning_rate": 1.0578528878391419e-05, + "loss": 0.2258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12493710219860077, + "step": 3085, + "valid_targets_mean": 5019.9, + "valid_targets_min": 776 + }, + { + "epoch": 4.843921568627451, + "grad_norm": 0.4192359756622533, + "learning_rate": 1.0509649040531994e-05, + "loss": 0.2262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09598597884178162, + "step": 3090, + "valid_targets_mean": 4504.4, + "valid_targets_min": 3380 + }, + { + "epoch": 4.851764705882353, + "grad_norm": 0.426501242282498, + "learning_rate": 1.044091417511709e-05, + "loss": 0.2413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11279591917991638, + "step": 3095, + "valid_targets_mean": 5271.6, + "valid_targets_min": 4448 + }, + { + "epoch": 4.859607843137255, + "grad_norm": 0.5341696931177127, + "learning_rate": 1.0372325332124896e-05, + "loss": 0.2271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11988389492034912, + "step": 3100, + "valid_targets_mean": 5265.9, + "valid_targets_min": 3534 + }, + { + "epoch": 4.867450980392157, + "grad_norm": 0.4411575534344696, + "learning_rate": 1.0303883559302999e-05, + "loss": 0.2254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11052796244621277, + "step": 3105, + "valid_targets_mean": 5221.1, + "valid_targets_min": 3672 + }, + { + "epoch": 4.875294117647059, + "grad_norm": 0.43327957470978096, + "learning_rate": 1.0235589902152351e-05, + "loss": 0.2363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12073686718940735, + "step": 3110, + "valid_targets_mean": 4906.5, + "valid_targets_min": 3891 + }, + { + "epoch": 4.8831372549019605, + "grad_norm": 0.46410452856624584, + "learning_rate": 1.0167445403911356e-05, + "loss": 0.2406, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11970961838960648, + "step": 3115, + "valid_targets_mean": 4996.5, + "valid_targets_min": 3709 + }, + { + "epoch": 4.890980392156862, + "grad_norm": 0.4457445424078122, + "learning_rate": 1.0099451105539866e-05, + "loss": 0.2334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11119598895311356, + "step": 3120, + "valid_targets_mean": 4615.5, + "valid_targets_min": 2185 + }, + { + "epoch": 4.898823529411764, + "grad_norm": 0.4238986113816507, + "learning_rate": 1.0031608045703347e-05, + "loss": 0.2429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1175379753112793, + "step": 3125, + "valid_targets_mean": 4690.8, + "valid_targets_min": 712 + }, + { + "epoch": 4.906666666666666, + "grad_norm": 0.4969126965651698, + "learning_rate": 9.963917260756937e-06, + "loss": 0.2351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10803299397230148, + "step": 3130, + "valid_targets_mean": 3725.6, + "valid_targets_min": 644 + }, + { + "epoch": 4.914509803921568, + "grad_norm": 0.42476715117328734, + "learning_rate": 9.89637978472972e-06, + "loss": 0.2357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12074100971221924, + "step": 3135, + "valid_targets_mean": 5526.5, + "valid_targets_min": 731 + }, + { + "epoch": 4.92235294117647, + "grad_norm": 0.4732390657116341, + "learning_rate": 9.828996649308804e-06, + "loss": 0.2447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14218966662883759, + "step": 3140, + "valid_targets_mean": 5210.5, + "valid_targets_min": 789 + }, + { + "epoch": 4.930196078431372, + "grad_norm": 0.4511606219481335, + "learning_rate": 9.76176888382367e-06, + "loss": 0.2469, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10251887142658234, + "step": 3145, + "valid_targets_mean": 4451.0, + "valid_targets_min": 3309 + }, + { + "epoch": 4.938039215686274, + "grad_norm": 0.40999282678558024, + "learning_rate": 9.694697515230371e-06, + "loss": 0.232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1229824647307396, + "step": 3150, + "valid_targets_mean": 5916.8, + "valid_targets_min": 3639 + }, + { + "epoch": 4.945882352941177, + "grad_norm": 0.4529754066112067, + "learning_rate": 9.627783568095905e-06, + "loss": 0.236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1377158910036087, + "step": 3155, + "valid_targets_mean": 6208.2, + "valid_targets_min": 3652 + }, + { + "epoch": 4.953725490196079, + "grad_norm": 0.4242985299137044, + "learning_rate": 9.561028064582507e-06, + "loss": 0.2336, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10480914264917374, + "step": 3160, + "valid_targets_mean": 5257.2, + "valid_targets_min": 4459 + }, + { + "epoch": 4.961568627450981, + "grad_norm": 0.41878222358740275, + "learning_rate": 9.494432024432087e-06, + "loss": 0.2264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13485050201416016, + "step": 3165, + "valid_targets_mean": 5783.6, + "valid_targets_min": 3438 + }, + { + "epoch": 4.969411764705883, + "grad_norm": 0.4483772324698896, + "learning_rate": 9.42799646495062e-06, + "loss": 0.2391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10306377708911896, + "step": 3170, + "valid_targets_mean": 4810.8, + "valid_targets_min": 3566 + }, + { + "epoch": 4.977254901960785, + "grad_norm": 0.4575109733204383, + "learning_rate": 9.361722400992618e-06, + "loss": 0.2249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13620686531066895, + "step": 3175, + "valid_targets_mean": 5052.2, + "valid_targets_min": 595 + }, + { + "epoch": 4.9850980392156865, + "grad_norm": 0.4664072811099875, + "learning_rate": 9.295610844945613e-06, + "loss": 0.2286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1414259970188141, + "step": 3180, + "valid_targets_mean": 5369.8, + "valid_targets_min": 2914 + }, + { + "epoch": 4.992941176470588, + "grad_norm": 0.4084175714626147, + "learning_rate": 9.229662806714721e-06, + "loss": 0.2291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1109371930360794, + "step": 3185, + "valid_targets_mean": 5307.1, + "valid_targets_min": 4409 + }, + { + "epoch": 5.0, + "grad_norm": 0.6467547947661242, + "learning_rate": 9.163879293707172e-06, + "loss": 0.2424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.278501957654953, + "step": 3190, + "valid_targets_mean": 5547.1, + "valid_targets_min": 601 + }, + { + "epoch": 5.007843137254902, + "grad_norm": 0.40387115368040144, + "learning_rate": 9.09826131081698e-06, + "loss": 0.2235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10747785866260529, + "step": 3195, + "valid_targets_mean": 5887.5, + "valid_targets_min": 3970 + }, + { + "epoch": 5.015686274509804, + "grad_norm": 0.45143393354352845, + "learning_rate": 9.03280986040952e-06, + "loss": 0.2257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13973960280418396, + "step": 3200, + "valid_targets_mean": 5593.4, + "valid_targets_min": 3313 + }, + { + "epoch": 5.023529411764706, + "grad_norm": 0.5170646910567398, + "learning_rate": 8.967525942306285e-06, + "loss": 0.2333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12646545469760895, + "step": 3205, + "valid_targets_mean": 4262.0, + "valid_targets_min": 757 + }, + { + "epoch": 5.031372549019608, + "grad_norm": 0.4177365278956721, + "learning_rate": 8.902410553769575e-06, + "loss": 0.2202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11722061038017273, + "step": 3210, + "valid_targets_mean": 6452.1, + "valid_targets_min": 4591 + }, + { + "epoch": 5.03921568627451, + "grad_norm": 0.45982665324198024, + "learning_rate": 8.837464689487261e-06, + "loss": 0.2238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14046096801757812, + "step": 3215, + "valid_targets_mean": 5643.9, + "valid_targets_min": 4702 + }, + { + "epoch": 5.047058823529412, + "grad_norm": 0.46047545116826843, + "learning_rate": 8.772689341557611e-06, + "loss": 0.2199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08853432536125183, + "step": 3220, + "valid_targets_mean": 3722.0, + "valid_targets_min": 869 + }, + { + "epoch": 5.0549019607843135, + "grad_norm": 0.4214879259510868, + "learning_rate": 8.708085499474112e-06, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1543363481760025, + "step": 3225, + "valid_targets_mean": 6443.2, + "valid_targets_min": 796 + }, + { + "epoch": 5.0627450980392155, + "grad_norm": 0.49671062233371066, + "learning_rate": 8.643654150110387e-06, + "loss": 0.2297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09493766725063324, + "step": 3230, + "valid_targets_mean": 3947.6, + "valid_targets_min": 1011 + }, + { + "epoch": 5.070588235294117, + "grad_norm": 0.44383290688698823, + "learning_rate": 8.579396277705071e-06, + "loss": 0.2333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11513125896453857, + "step": 3235, + "valid_targets_mean": 5591.4, + "valid_targets_min": 1091 + }, + { + "epoch": 5.078431372549019, + "grad_norm": 0.41639923855857314, + "learning_rate": 8.51531286384683e-06, + "loss": 0.2218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12974339723587036, + "step": 3240, + "valid_targets_mean": 6583.4, + "valid_targets_min": 4301 + }, + { + "epoch": 5.086274509803921, + "grad_norm": 0.4817613204052127, + "learning_rate": 8.451404887459325e-06, + "loss": 0.2206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10065077245235443, + "step": 3245, + "valid_targets_mean": 4468.6, + "valid_targets_min": 2552 + }, + { + "epoch": 5.094117647058823, + "grad_norm": 0.41458592266722405, + "learning_rate": 8.387673324786292e-06, + "loss": 0.2203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09595533460378647, + "step": 3250, + "valid_targets_mean": 5498.2, + "valid_targets_min": 3578 + }, + { + "epoch": 5.101960784313725, + "grad_norm": 0.455325990243027, + "learning_rate": 8.324119149376584e-06, + "loss": 0.2236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08556359261274338, + "step": 3255, + "valid_targets_mean": 3785.8, + "valid_targets_min": 681 + }, + { + "epoch": 5.109803921568627, + "grad_norm": 0.4545717072003482, + "learning_rate": 8.260743332069355e-06, + "loss": 0.2258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08474293351173401, + "step": 3260, + "valid_targets_mean": 3495.5, + "valid_targets_min": 821 + }, + { + "epoch": 5.117647058823529, + "grad_norm": 0.451686422050851, + "learning_rate": 8.197546840979172e-06, + "loss": 0.225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12904678285121918, + "step": 3265, + "valid_targets_mean": 5611.8, + "valid_targets_min": 4490 + }, + { + "epoch": 5.125490196078431, + "grad_norm": 0.4533041440520356, + "learning_rate": 8.134530641481289e-06, + "loss": 0.2261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10058914870023727, + "step": 3270, + "valid_targets_mean": 5074.5, + "valid_targets_min": 4181 + }, + { + "epoch": 5.133333333333334, + "grad_norm": 0.4447041485071207, + "learning_rate": 8.071695696196824e-06, + "loss": 0.2333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12126485258340836, + "step": 3275, + "valid_targets_mean": 6402.9, + "valid_targets_min": 2974 + }, + { + "epoch": 5.141176470588236, + "grad_norm": 0.45393041745826174, + "learning_rate": 8.00904296497815e-06, + "loss": 0.2178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10773161798715591, + "step": 3280, + "valid_targets_mean": 4721.6, + "valid_targets_min": 952 + }, + { + "epoch": 5.149019607843138, + "grad_norm": 0.44358510403133994, + "learning_rate": 7.946573404894133e-06, + "loss": 0.2238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11503250896930695, + "step": 3285, + "valid_targets_mean": 4849.8, + "valid_targets_min": 3997 + }, + { + "epoch": 5.1568627450980395, + "grad_norm": 0.43628925896890625, + "learning_rate": 7.88428797021559e-06, + "loss": 0.2398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10749220848083496, + "step": 3290, + "valid_targets_mean": 6218.1, + "valid_targets_min": 3660 + }, + { + "epoch": 5.1647058823529415, + "grad_norm": 0.4997173668196613, + "learning_rate": 7.82218761240065e-06, + "loss": 0.2341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13712440431118011, + "step": 3295, + "valid_targets_mean": 4569.8, + "valid_targets_min": 894 + }, + { + "epoch": 5.172549019607843, + "grad_norm": 0.5678602543997687, + "learning_rate": 7.760273280080282e-06, + "loss": 0.2275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10061115026473999, + "step": 3300, + "valid_targets_mean": 2956.1, + "valid_targets_min": 488 + }, + { + "epoch": 5.180392156862745, + "grad_norm": 0.47622399456179687, + "learning_rate": 7.69854591904374e-06, + "loss": 0.2368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10639934241771698, + "step": 3305, + "valid_targets_mean": 4359.8, + "valid_targets_min": 2734 + }, + { + "epoch": 5.188235294117647, + "grad_norm": 0.5152270602959604, + "learning_rate": 7.637006472224173e-06, + "loss": 0.2228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13346779346466064, + "step": 3310, + "valid_targets_mean": 4612.8, + "valid_targets_min": 810 + }, + { + "epoch": 5.196078431372549, + "grad_norm": 0.4780328019266813, + "learning_rate": 7.575655879684192e-06, + "loss": 0.2219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11803792417049408, + "step": 3315, + "valid_targets_mean": 4777.1, + "valid_targets_min": 4313 + }, + { + "epoch": 5.203921568627451, + "grad_norm": 0.44076887070103893, + "learning_rate": 7.514495078601492e-06, + "loss": 0.2197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08803778141736984, + "step": 3320, + "valid_targets_mean": 4427.4, + "valid_targets_min": 3267 + }, + { + "epoch": 5.211764705882353, + "grad_norm": 0.44122086049924814, + "learning_rate": 7.453525003254585e-06, + "loss": 0.2265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11798333376646042, + "step": 3325, + "valid_targets_mean": 5929.4, + "valid_targets_min": 3780 + }, + { + "epoch": 5.219607843137255, + "grad_norm": 0.424878856482959, + "learning_rate": 7.39274658500847e-06, + "loss": 0.2251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12534697353839874, + "step": 3330, + "valid_targets_mean": 5617.8, + "valid_targets_min": 275 + }, + { + "epoch": 5.227450980392157, + "grad_norm": 0.568778481226979, + "learning_rate": 7.33216075230047e-06, + "loss": 0.2207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11138676106929779, + "step": 3335, + "valid_targets_mean": 4802.5, + "valid_targets_min": 3568 + }, + { + "epoch": 5.235294117647059, + "grad_norm": 0.4452420707521999, + "learning_rate": 7.271768430625983e-06, + "loss": 0.2272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11331316828727722, + "step": 3340, + "valid_targets_mean": 4633.6, + "valid_targets_min": 3254 + }, + { + "epoch": 5.243137254901961, + "grad_norm": 0.46420148150643264, + "learning_rate": 7.2115705425243996e-06, + "loss": 0.2238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09831637889146805, + "step": 3345, + "valid_targets_mean": 4430.6, + "valid_targets_min": 1147 + }, + { + "epoch": 5.250980392156863, + "grad_norm": 0.44459726741360717, + "learning_rate": 7.151568007564962e-06, + "loss": 0.218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11376352608203888, + "step": 3350, + "valid_targets_mean": 4682.2, + "valid_targets_min": 3530 + }, + { + "epoch": 5.258823529411765, + "grad_norm": 0.4311003479897479, + "learning_rate": 7.091761742332786e-06, + "loss": 0.2223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12164557725191116, + "step": 3355, + "valid_targets_mean": 5216.8, + "valid_targets_min": 4379 + }, + { + "epoch": 5.266666666666667, + "grad_norm": 0.4451618391957542, + "learning_rate": 7.032152660414764e-06, + "loss": 0.2285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.127460315823555, + "step": 3360, + "valid_targets_mean": 5033.1, + "valid_targets_min": 3806 + }, + { + "epoch": 5.2745098039215685, + "grad_norm": 0.46225025121912444, + "learning_rate": 6.972741672385699e-06, + "loss": 0.2339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10879524052143097, + "step": 3365, + "valid_targets_mean": 4410.0, + "valid_targets_min": 3384 + }, + { + "epoch": 5.2823529411764705, + "grad_norm": 0.45290397096114937, + "learning_rate": 6.913529685794333e-06, + "loss": 0.2234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09558887034654617, + "step": 3370, + "valid_targets_mean": 4651.5, + "valid_targets_min": 4220 + }, + { + "epoch": 5.290196078431372, + "grad_norm": 0.48261339698594724, + "learning_rate": 6.854517605149526e-06, + "loss": 0.2147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10471512377262115, + "step": 3375, + "valid_targets_mean": 4497.6, + "valid_targets_min": 776 + }, + { + "epoch": 5.298039215686274, + "grad_norm": 0.5223086996794308, + "learning_rate": 6.795706331906402e-06, + "loss": 0.2321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12723124027252197, + "step": 3380, + "valid_targets_mean": 5067.9, + "valid_targets_min": 831 + }, + { + "epoch": 5.305882352941176, + "grad_norm": 0.4484965233257951, + "learning_rate": 6.737096764452609e-06, + "loss": 0.2349, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1439855396747589, + "step": 3385, + "valid_targets_mean": 5265.8, + "valid_targets_min": 3597 + }, + { + "epoch": 5.313725490196078, + "grad_norm": 0.46966081881038835, + "learning_rate": 6.678689798094582e-06, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15899275243282318, + "step": 3390, + "valid_targets_mean": 5395.5, + "valid_targets_min": 872 + }, + { + "epoch": 5.32156862745098, + "grad_norm": 0.4610547507319241, + "learning_rate": 6.620486325043871e-06, + "loss": 0.2248, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1168796718120575, + "step": 3395, + "valid_targets_mean": 4572.5, + "valid_targets_min": 885 + }, + { + "epoch": 5.329411764705882, + "grad_norm": 0.4249547346844441, + "learning_rate": 6.562487234403492e-06, + "loss": 0.228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.07667449116706848, + "step": 3400, + "valid_targets_mean": 3854.9, + "valid_targets_min": 924 + }, + { + "epoch": 5.337254901960784, + "grad_norm": 0.5036540762705398, + "learning_rate": 6.504693412154384e-06, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1367102861404419, + "step": 3405, + "valid_targets_mean": 5214.8, + "valid_targets_min": 691 + }, + { + "epoch": 5.345098039215686, + "grad_norm": 0.49092534393309145, + "learning_rate": 6.447105741141828e-06, + "loss": 0.2364, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12212163954973221, + "step": 3410, + "valid_targets_mean": 4840.9, + "valid_targets_min": 1036 + }, + { + "epoch": 5.352941176470588, + "grad_norm": 0.4308675993577972, + "learning_rate": 6.389725101062017e-06, + "loss": 0.2361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10715265572071075, + "step": 3415, + "valid_targets_mean": 4416.5, + "valid_targets_min": 3391 + }, + { + "epoch": 5.36078431372549, + "grad_norm": 0.4481341239142485, + "learning_rate": 6.332552368448552e-06, + "loss": 0.2189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09622816741466522, + "step": 3420, + "valid_targets_mean": 4727.2, + "valid_targets_min": 3663 + }, + { + "epoch": 5.368627450980393, + "grad_norm": 0.42938641110064063, + "learning_rate": 6.275588416659111e-06, + "loss": 0.2348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11082536727190018, + "step": 3425, + "valid_targets_mean": 6231.6, + "valid_targets_min": 4385 + }, + { + "epoch": 5.376470588235295, + "grad_norm": 0.41006221308335794, + "learning_rate": 6.218834115862082e-06, + "loss": 0.2253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13855819404125214, + "step": 3430, + "valid_targets_mean": 7189.1, + "valid_targets_min": 4094 + }, + { + "epoch": 5.3843137254901965, + "grad_norm": 0.4851566191798374, + "learning_rate": 6.162290333023255e-06, + "loss": 0.2477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08945602178573608, + "step": 3435, + "valid_targets_mean": 4465.5, + "valid_targets_min": 3624 + }, + { + "epoch": 5.392156862745098, + "grad_norm": 0.48931355595220627, + "learning_rate": 6.105957931892619e-06, + "loss": 0.2278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09989559650421143, + "step": 3440, + "valid_targets_mean": 4265.6, + "valid_targets_min": 3459 + }, + { + "epoch": 5.4, + "grad_norm": 0.47032888212749213, + "learning_rate": 6.049837772991119e-06, + "loss": 0.2301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10447871685028076, + "step": 3445, + "valid_targets_mean": 4224.2, + "valid_targets_min": 810 + }, + { + "epoch": 5.407843137254902, + "grad_norm": 0.492717333292633, + "learning_rate": 5.99393071359756e-06, + "loss": 0.222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10688762366771698, + "step": 3450, + "valid_targets_mean": 4938.9, + "valid_targets_min": 727 + }, + { + "epoch": 5.415686274509804, + "grad_norm": 1.4420089359222485, + "learning_rate": 5.93823760773546e-06, + "loss": 0.2266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12139762938022614, + "step": 3455, + "valid_targets_mean": 4968.8, + "valid_targets_min": 3542 + }, + { + "epoch": 5.423529411764706, + "grad_norm": 0.4517197547603553, + "learning_rate": 5.882759306160071e-06, + "loss": 0.2222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12694215774536133, + "step": 3460, + "valid_targets_mean": 5412.6, + "valid_targets_min": 837 + }, + { + "epoch": 5.431372549019608, + "grad_norm": 0.45973692771505037, + "learning_rate": 5.827496656345299e-06, + "loss": 0.2322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1373184472322464, + "step": 3465, + "valid_targets_mean": 5169.2, + "valid_targets_min": 3526 + }, + { + "epoch": 5.43921568627451, + "grad_norm": 0.5065418637453369, + "learning_rate": 5.772450502470841e-06, + "loss": 0.2217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1180776059627533, + "step": 3470, + "valid_targets_mean": 4207.4, + "valid_targets_min": 780 + }, + { + "epoch": 5.447058823529412, + "grad_norm": 0.4707896045299758, + "learning_rate": 5.71762168540922e-06, + "loss": 0.2317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1182604730129242, + "step": 3475, + "valid_targets_mean": 4802.8, + "valid_targets_min": 747 + }, + { + "epoch": 5.454901960784314, + "grad_norm": 0.5024641672118548, + "learning_rate": 5.663011042712996e-06, + "loss": 0.2238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08559073507785797, + "step": 3480, + "valid_targets_mean": 3836.0, + "valid_targets_min": 622 + }, + { + "epoch": 5.462745098039216, + "grad_norm": 0.46735202669260495, + "learning_rate": 5.608619408601925e-06, + "loss": 0.2315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12076675891876221, + "step": 3485, + "valid_targets_mean": 5519.2, + "valid_targets_min": 2934 + }, + { + "epoch": 5.470588235294118, + "grad_norm": 0.4696336699134175, + "learning_rate": 5.554447613950262e-06, + "loss": 0.228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09073761105537415, + "step": 3490, + "valid_targets_mean": 4277.1, + "valid_targets_min": 457 + }, + { + "epoch": 5.47843137254902, + "grad_norm": 0.6036366533315168, + "learning_rate": 5.500496486274014e-06, + "loss": 0.2307, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11612799763679504, + "step": 3495, + "valid_targets_mean": 4985.4, + "valid_targets_min": 620 + }, + { + "epoch": 5.486274509803922, + "grad_norm": 0.47726925266975956, + "learning_rate": 5.446766849718368e-06, + "loss": 0.2346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12205741554498672, + "step": 3500, + "valid_targets_mean": 4844.0, + "valid_targets_min": 3442 + }, + { + "epoch": 5.4941176470588236, + "grad_norm": 0.4916736015437308, + "learning_rate": 5.393259525045025e-06, + "loss": 0.2253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1252761334180832, + "step": 3505, + "valid_targets_mean": 5064.5, + "valid_targets_min": 730 + }, + { + "epoch": 5.5019607843137255, + "grad_norm": 0.440080474865469, + "learning_rate": 5.3399753296197286e-06, + "loss": 0.2274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1194039136171341, + "step": 3510, + "valid_targets_mean": 6281.8, + "valid_targets_min": 3326 + }, + { + "epoch": 5.509803921568627, + "grad_norm": 0.4676090968245843, + "learning_rate": 5.286915077399728e-06, + "loss": 0.2354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12264136224985123, + "step": 3515, + "valid_targets_mean": 4933.1, + "valid_targets_min": 3593 + }, + { + "epoch": 5.517647058823529, + "grad_norm": 0.45612503188721304, + "learning_rate": 5.2340795789213896e-06, + "loss": 0.2262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11936895549297333, + "step": 3520, + "valid_targets_mean": 5021.1, + "valid_targets_min": 4010 + }, + { + "epoch": 5.525490196078431, + "grad_norm": 0.4830786890949812, + "learning_rate": 5.1814696412877665e-06, + "loss": 0.2154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0968177393078804, + "step": 3525, + "valid_targets_mean": 4000.5, + "valid_targets_min": 726 + }, + { + "epoch": 5.533333333333333, + "grad_norm": 0.42333378915841735, + "learning_rate": 5.1290860681563195e-06, + "loss": 0.2265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1203262209892273, + "step": 3530, + "valid_targets_mean": 5863.4, + "valid_targets_min": 3710 + }, + { + "epoch": 5.541176470588235, + "grad_norm": 0.4299669760963479, + "learning_rate": 5.0769296597266126e-06, + "loss": 0.2262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0961022824048996, + "step": 3535, + "valid_targets_mean": 4194.5, + "valid_targets_min": 950 + }, + { + "epoch": 5.549019607843137, + "grad_norm": 0.4913004808346495, + "learning_rate": 5.0250012127280755e-06, + "loss": 0.2242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14035651087760925, + "step": 3540, + "valid_targets_mean": 5527.6, + "valid_targets_min": 558 + }, + { + "epoch": 5.556862745098039, + "grad_norm": 0.42420621008985054, + "learning_rate": 4.973301520407874e-06, + "loss": 0.23, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11041077226400375, + "step": 3545, + "valid_targets_mean": 4931.5, + "valid_targets_min": 3822 + }, + { + "epoch": 5.564705882352941, + "grad_norm": 0.4397064800423962, + "learning_rate": 4.921831372518751e-06, + "loss": 0.2299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1008322536945343, + "step": 3550, + "valid_targets_mean": 4589.4, + "valid_targets_min": 3745 + }, + { + "epoch": 5.572549019607843, + "grad_norm": 0.42983114719825694, + "learning_rate": 4.870591555306996e-06, + "loss": 0.2182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12528643012046814, + "step": 3555, + "valid_targets_mean": 5302.1, + "valid_targets_min": 3917 + }, + { + "epoch": 5.580392156862745, + "grad_norm": 0.41251872258649447, + "learning_rate": 4.819582851500406e-06, + "loss": 0.226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11194668710231781, + "step": 3560, + "valid_targets_mean": 5665.6, + "valid_targets_min": 3842 + }, + { + "epoch": 5.588235294117647, + "grad_norm": 0.41089046624017184, + "learning_rate": 4.768806040296348e-06, + "loss": 0.2199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10383773595094681, + "step": 3565, + "valid_targets_mean": 5147.0, + "valid_targets_min": 4120 + }, + { + "epoch": 5.596078431372549, + "grad_norm": 0.44250020714243427, + "learning_rate": 4.718261897349856e-06, + "loss": 0.211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11924265325069427, + "step": 3570, + "valid_targets_mean": 5651.6, + "valid_targets_min": 3699 + }, + { + "epoch": 5.603921568627451, + "grad_norm": 0.4520177978675399, + "learning_rate": 4.667951194761773e-06, + "loss": 0.2346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11091027408838272, + "step": 3575, + "valid_targets_mean": 5147.1, + "valid_targets_min": 3362 + }, + { + "epoch": 5.6117647058823525, + "grad_norm": 0.46655243788650486, + "learning_rate": 4.6178747010669485e-06, + "loss": 0.2274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09887704253196716, + "step": 3580, + "valid_targets_mean": 5145.6, + "valid_targets_min": 782 + }, + { + "epoch": 5.6196078431372545, + "grad_norm": 0.43380729747663566, + "learning_rate": 4.5680331812225335e-06, + "loss": 0.2199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11621832847595215, + "step": 3585, + "valid_targets_mean": 6146.0, + "valid_targets_min": 4295 + }, + { + "epoch": 5.627450980392156, + "grad_norm": 0.42101797383398143, + "learning_rate": 4.518427396596246e-06, + "loss": 0.2202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09557899832725525, + "step": 3590, + "valid_targets_mean": 4636.6, + "valid_targets_min": 3449 + }, + { + "epoch": 5.635294117647058, + "grad_norm": 0.4332157513198714, + "learning_rate": 4.469058104954786e-06, + "loss": 0.2193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10167904198169708, + "step": 3595, + "valid_targets_mean": 4072.9, + "valid_targets_min": 1054 + }, + { + "epoch": 5.643137254901961, + "grad_norm": 0.4433003894407488, + "learning_rate": 4.4199260604522266e-06, + "loss": 0.23, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08998174965381622, + "step": 3600, + "valid_targets_mean": 4496.6, + "valid_targets_min": 823 + }, + { + "epoch": 5.650980392156863, + "grad_norm": 0.4488408459473684, + "learning_rate": 4.371032013618519e-06, + "loss": 0.2379, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12565404176712036, + "step": 3605, + "valid_targets_mean": 5324.5, + "valid_targets_min": 3326 + }, + { + "epoch": 5.658823529411765, + "grad_norm": 0.44653324730690613, + "learning_rate": 4.322376711348009e-06, + "loss": 0.2254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11299017071723938, + "step": 3610, + "valid_targets_mean": 5719.5, + "valid_targets_min": 4228 + }, + { + "epoch": 5.666666666666667, + "grad_norm": 0.4807605716107027, + "learning_rate": 4.273960896888045e-06, + "loss": 0.2285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10924605280160904, + "step": 3615, + "valid_targets_mean": 4711.0, + "valid_targets_min": 672 + }, + { + "epoch": 5.674509803921569, + "grad_norm": 0.4375515041383165, + "learning_rate": 4.225785309827595e-06, + "loss": 0.2353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16533643007278442, + "step": 3620, + "valid_targets_mean": 7468.0, + "valid_targets_min": 4598 + }, + { + "epoch": 5.682352941176471, + "grad_norm": 0.4420469898871082, + "learning_rate": 4.177850686085987e-06, + "loss": 0.2374, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09723871201276779, + "step": 3625, + "valid_targets_mean": 5326.0, + "valid_targets_min": 3710 + }, + { + "epoch": 5.690196078431373, + "grad_norm": 0.5190219956910557, + "learning_rate": 4.130157757901632e-06, + "loss": 0.2259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0885414406657219, + "step": 3630, + "valid_targets_mean": 4358.0, + "valid_targets_min": 621 + }, + { + "epoch": 5.698039215686275, + "grad_norm": 0.4183514479684243, + "learning_rate": 4.0827072538208705e-06, + "loss": 0.2193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09757456183433533, + "step": 3635, + "valid_targets_mean": 4744.9, + "valid_targets_min": 3655 + }, + { + "epoch": 5.705882352941177, + "grad_norm": 0.45008902375660204, + "learning_rate": 4.03549989868681e-06, + "loss": 0.2254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1252342164516449, + "step": 3640, + "valid_targets_mean": 5274.1, + "valid_targets_min": 4356 + }, + { + "epoch": 5.713725490196079, + "grad_norm": 0.43044920377943224, + "learning_rate": 3.988536413628286e-06, + "loss": 0.224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11895223706960678, + "step": 3645, + "valid_targets_mean": 4859.6, + "valid_targets_min": 4330 + }, + { + "epoch": 5.7215686274509805, + "grad_norm": 0.4547106288349754, + "learning_rate": 3.941817516048827e-06, + "loss": 0.2246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1304386854171753, + "step": 3650, + "valid_targets_mean": 5126.4, + "valid_targets_min": 986 + }, + { + "epoch": 5.729411764705882, + "grad_norm": 0.4358567072415122, + "learning_rate": 3.895343919615686e-06, + "loss": 0.2256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09702654927968979, + "step": 3655, + "valid_targets_mean": 4727.8, + "valid_targets_min": 3603 + }, + { + "epoch": 5.737254901960784, + "grad_norm": 0.43283259864119533, + "learning_rate": 3.849116334248972e-06, + "loss": 0.2269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12856844067573547, + "step": 3660, + "valid_targets_mean": 5489.1, + "valid_targets_min": 4068 + }, + { + "epoch": 5.745098039215686, + "grad_norm": 0.4420398806206634, + "learning_rate": 3.803135466110761e-06, + "loss": 0.2287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14836335182189941, + "step": 3665, + "valid_targets_mean": 6416.6, + "valid_targets_min": 3531 + }, + { + "epoch": 5.752941176470588, + "grad_norm": 0.48584018258685463, + "learning_rate": 3.7574020175943514e-06, + "loss": 0.2411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.134757399559021, + "step": 3670, + "valid_targets_mean": 4905.2, + "valid_targets_min": 545 + }, + { + "epoch": 5.76078431372549, + "grad_norm": 0.4466902118893254, + "learning_rate": 3.7119166873135102e-06, + "loss": 0.2223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11019237339496613, + "step": 3675, + "valid_targets_mean": 4478.0, + "valid_targets_min": 3613 + }, + { + "epoch": 5.768627450980392, + "grad_norm": 0.43514773978127463, + "learning_rate": 3.666680170091812e-06, + "loss": 0.2391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09685391187667847, + "step": 3680, + "valid_targets_mean": 4997.0, + "valid_targets_min": 726 + }, + { + "epoch": 5.776470588235294, + "grad_norm": 0.4563081739000789, + "learning_rate": 3.6216931569519995e-06, + "loss": 0.226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1273442655801773, + "step": 3685, + "valid_targets_mean": 5875.6, + "valid_targets_min": 2930 + }, + { + "epoch": 5.784313725490196, + "grad_norm": 0.44541713200948646, + "learning_rate": 3.576956335105477e-06, + "loss": 0.2321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12498340010643005, + "step": 3690, + "valid_targets_mean": 4812.2, + "valid_targets_min": 4032 + }, + { + "epoch": 5.792156862745098, + "grad_norm": 0.4890839073410703, + "learning_rate": 3.5324703879417553e-06, + "loss": 0.2273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12750136852264404, + "step": 3695, + "valid_targets_mean": 4419.8, + "valid_targets_min": 3059 + }, + { + "epoch": 5.8, + "grad_norm": 0.423189067918186, + "learning_rate": 3.488235995018063e-06, + "loss": 0.2216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10611607134342194, + "step": 3700, + "valid_targets_mean": 5321.4, + "valid_targets_min": 686 + }, + { + "epoch": 5.807843137254902, + "grad_norm": 0.4603090763488122, + "learning_rate": 3.444253832048925e-06, + "loss": 0.2279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12216217070817947, + "step": 3705, + "valid_targets_mean": 5663.4, + "valid_targets_min": 610 + }, + { + "epoch": 5.815686274509804, + "grad_norm": 0.43406157889209235, + "learning_rate": 3.4005245708958757e-06, + "loss": 0.2193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10026943683624268, + "step": 3710, + "valid_targets_mean": 5337.1, + "valid_targets_min": 3646 + }, + { + "epoch": 5.823529411764706, + "grad_norm": 0.45578923444429736, + "learning_rate": 3.3570488795571653e-06, + "loss": 0.2201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10260643810033798, + "step": 3715, + "valid_targets_mean": 4458.5, + "valid_targets_min": 626 + }, + { + "epoch": 5.8313725490196076, + "grad_norm": 0.4441416835886368, + "learning_rate": 3.313827422157583e-06, + "loss": 0.2166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11893025785684586, + "step": 3720, + "valid_targets_mean": 5243.4, + "valid_targets_min": 4273 + }, + { + "epoch": 5.8392156862745095, + "grad_norm": 0.4490186340963944, + "learning_rate": 3.2708608589382783e-06, + "loss": 0.2326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1208035871386528, + "step": 3725, + "valid_targets_mean": 5224.9, + "valid_targets_min": 3941 + }, + { + "epoch": 5.847058823529411, + "grad_norm": 0.4998487790679273, + "learning_rate": 3.2281498462467177e-06, + "loss": 0.2251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12360478937625885, + "step": 3730, + "valid_targets_mean": 4348.6, + "valid_targets_min": 850 + }, + { + "epoch": 5.854901960784313, + "grad_norm": 0.41982853355713934, + "learning_rate": 3.185695036526615e-06, + "loss": 0.2206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09100072085857391, + "step": 3735, + "valid_targets_mean": 4289.4, + "valid_targets_min": 3739 + }, + { + "epoch": 5.862745098039216, + "grad_norm": 0.4611918743721464, + "learning_rate": 3.1434970783080043e-06, + "loss": 0.2166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11276879161596298, + "step": 3740, + "valid_targets_mean": 5198.1, + "valid_targets_min": 3462 + }, + { + "epoch": 5.870588235294118, + "grad_norm": 0.45917677458750794, + "learning_rate": 3.1015566161972967e-06, + "loss": 0.2208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12548470497131348, + "step": 3745, + "valid_targets_mean": 5063.1, + "valid_targets_min": 3888 + }, + { + "epoch": 5.87843137254902, + "grad_norm": 0.42903473316059026, + "learning_rate": 3.059874290867464e-06, + "loss": 0.219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12700194120407104, + "step": 3750, + "valid_targets_mean": 5993.8, + "valid_targets_min": 3910 + }, + { + "epoch": 5.886274509803922, + "grad_norm": 0.48598276291447545, + "learning_rate": 3.01845073904824e-06, + "loss": 0.2269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10122105479240417, + "step": 3755, + "valid_targets_mean": 3913.8, + "valid_targets_min": 735 + }, + { + "epoch": 5.894117647058824, + "grad_norm": 0.46358860073680896, + "learning_rate": 2.977286593516382e-06, + "loss": 0.2295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11198492348194122, + "step": 3760, + "valid_targets_mean": 5098.1, + "valid_targets_min": 3774 + }, + { + "epoch": 5.901960784313726, + "grad_norm": 0.43396800884845904, + "learning_rate": 2.936382483086022e-06, + "loss": 0.2216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0948493629693985, + "step": 3765, + "valid_targets_mean": 5090.5, + "valid_targets_min": 3697 + }, + { + "epoch": 5.909803921568628, + "grad_norm": 0.42396863953417807, + "learning_rate": 2.895739032599065e-06, + "loss": 0.2129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10739844292402267, + "step": 3770, + "valid_targets_mean": 5082.1, + "valid_targets_min": 3741 + }, + { + "epoch": 5.91764705882353, + "grad_norm": 0.4367233791726713, + "learning_rate": 2.8553568629156124e-06, + "loss": 0.2261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11178376525640488, + "step": 3775, + "valid_targets_mean": 5284.2, + "valid_targets_min": 578 + }, + { + "epoch": 5.925490196078432, + "grad_norm": 0.43952645084490743, + "learning_rate": 2.815236590904522e-06, + "loss": 0.2175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13286638259887695, + "step": 3780, + "valid_targets_mean": 5756.5, + "valid_targets_min": 3362 + }, + { + "epoch": 5.933333333333334, + "grad_norm": 0.47695086720882024, + "learning_rate": 2.7753788294339412e-06, + "loss": 0.2344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10761082172393799, + "step": 3785, + "valid_targets_mean": 4253.6, + "valid_targets_min": 296 + }, + { + "epoch": 5.9411764705882355, + "grad_norm": 0.5099850777126819, + "learning_rate": 2.7357841873619804e-06, + "loss": 0.2271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1005336195230484, + "step": 3790, + "valid_targets_mean": 4683.2, + "valid_targets_min": 665 + }, + { + "epoch": 5.949019607843137, + "grad_norm": 0.42328334889515123, + "learning_rate": 2.6964532695273993e-06, + "loss": 0.2208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10245101898908615, + "step": 3795, + "valid_targets_mean": 4895.5, + "valid_targets_min": 3691 + }, + { + "epoch": 5.956862745098039, + "grad_norm": 0.47936537216048497, + "learning_rate": 2.65738667674035e-06, + "loss": 0.2167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11452037841081619, + "step": 3800, + "valid_targets_mean": 5202.2, + "valid_targets_min": 4291 + }, + { + "epoch": 5.964705882352941, + "grad_norm": 0.45793993615683437, + "learning_rate": 2.6185850057732377e-06, + "loss": 0.2279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12399207055568695, + "step": 3805, + "valid_targets_mean": 5232.4, + "valid_targets_min": 3835 + }, + { + "epoch": 5.972549019607843, + "grad_norm": 0.4303247993369076, + "learning_rate": 2.5800488493515576e-06, + "loss": 0.2268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12024565041065216, + "step": 3810, + "valid_targets_mean": 5481.5, + "valid_targets_min": 3927 + }, + { + "epoch": 5.980392156862745, + "grad_norm": 0.4339078888124253, + "learning_rate": 2.5417787961448893e-06, + "loss": 0.2281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11610336601734161, + "step": 3815, + "valid_targets_mean": 5475.6, + "valid_targets_min": 4163 + }, + { + "epoch": 5.988235294117647, + "grad_norm": 0.4643015265473758, + "learning_rate": 2.5037754307578553e-06, + "loss": 0.2214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12840969860553741, + "step": 3820, + "valid_targets_mean": 5129.9, + "valid_targets_min": 3500 + }, + { + "epoch": 5.996078431372549, + "grad_norm": 0.45333397118083585, + "learning_rate": 2.466039333721246e-06, + "loss": 0.2287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14173388481140137, + "step": 3825, + "valid_targets_mean": 5541.9, + "valid_targets_min": 2930 + }, + { + "epoch": 6.003137254901961, + "grad_norm": 0.64995545201576, + "learning_rate": 2.4285710814830908e-06, + "loss": 0.2229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11834508180618286, + "step": 3830, + "valid_targets_mean": 5217.9, + "valid_targets_min": 3748 + }, + { + "epoch": 6.0109803921568625, + "grad_norm": 0.40310804602190514, + "learning_rate": 2.3913712463999026e-06, + "loss": 0.2227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12881794571876526, + "step": 3835, + "valid_targets_mean": 7408.9, + "valid_targets_min": 4043 + }, + { + "epoch": 6.0188235294117645, + "grad_norm": 0.3976956884972396, + "learning_rate": 2.354440396727902e-06, + "loss": 0.2276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11172664165496826, + "step": 3840, + "valid_targets_mean": 5850.1, + "valid_targets_min": 3770 + }, + { + "epoch": 6.026666666666666, + "grad_norm": 0.46290334545230455, + "learning_rate": 2.3177790966143653e-06, + "loss": 0.2102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1118907779455185, + "step": 3845, + "valid_targets_mean": 4627.0, + "valid_targets_min": 3205 + }, + { + "epoch": 6.034509803921568, + "grad_norm": 0.4417770357609195, + "learning_rate": 2.28138790608897e-06, + "loss": 0.2172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0939764678478241, + "step": 3850, + "valid_targets_mean": 4603.8, + "valid_targets_min": 2856 + }, + { + "epoch": 6.04235294117647, + "grad_norm": 0.41116088453012645, + "learning_rate": 2.2452673810552783e-06, + "loss": 0.2233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11001232266426086, + "step": 3855, + "valid_targets_mean": 5604.6, + "valid_targets_min": 691 + }, + { + "epoch": 6.050196078431372, + "grad_norm": 0.4582789471885693, + "learning_rate": 2.2094180732822235e-06, + "loss": 0.2239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11757993698120117, + "step": 3860, + "valid_targets_mean": 5268.5, + "valid_targets_min": 3291 + }, + { + "epoch": 6.058039215686274, + "grad_norm": 0.43527377714699433, + "learning_rate": 2.1738405303956877e-06, + "loss": 0.2277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11812390387058258, + "step": 3865, + "valid_targets_mean": 4652.0, + "valid_targets_min": 1211 + }, + { + "epoch": 6.065882352941176, + "grad_norm": 0.436259827105265, + "learning_rate": 2.138535295870121e-06, + "loss": 0.2156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1061776727437973, + "step": 3870, + "valid_targets_mean": 4835.5, + "valid_targets_min": 3781 + }, + { + "epoch": 6.073725490196079, + "grad_norm": 0.46710848541258787, + "learning_rate": 2.1035029090202717e-06, + "loss": 0.2295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1308131217956543, + "step": 3875, + "valid_targets_mean": 4839.9, + "valid_targets_min": 757 + }, + { + "epoch": 6.081568627450981, + "grad_norm": 0.4346179493431141, + "learning_rate": 2.0687439049929113e-06, + "loss": 0.2234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11312983185052872, + "step": 3880, + "valid_targets_mean": 5265.2, + "valid_targets_min": 2579 + }, + { + "epoch": 6.089411764705883, + "grad_norm": 0.4310847748884074, + "learning_rate": 2.034258814758696e-06, + "loss": 0.233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15229426324367523, + "step": 3885, + "valid_targets_mean": 7243.0, + "valid_targets_min": 3673 + }, + { + "epoch": 6.097254901960785, + "grad_norm": 0.4377098786768193, + "learning_rate": 2.0000481651040182e-06, + "loss": 0.2196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11475956439971924, + "step": 3890, + "valid_targets_mean": 4506.0, + "valid_targets_min": 797 + }, + { + "epoch": 6.105098039215687, + "grad_norm": 0.4697067576333791, + "learning_rate": 1.96611247862299e-06, + "loss": 0.222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11185763776302338, + "step": 3895, + "valid_targets_mean": 4808.0, + "valid_targets_min": 3482 + }, + { + "epoch": 6.1129411764705885, + "grad_norm": 0.39659631265979406, + "learning_rate": 1.932452273709453e-06, + "loss": 0.217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10514408349990845, + "step": 3900, + "valid_targets_mean": 5980.1, + "valid_targets_min": 4308 + }, + { + "epoch": 6.1207843137254905, + "grad_norm": 0.4800811132838675, + "learning_rate": 1.8990680645490389e-06, + "loss": 0.2236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10940663516521454, + "step": 3905, + "valid_targets_mean": 4273.5, + "valid_targets_min": 950 + }, + { + "epoch": 6.128627450980392, + "grad_norm": 0.4353985528320435, + "learning_rate": 1.8659603611113475e-06, + "loss": 0.2124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09796038269996643, + "step": 3910, + "valid_targets_mean": 4635.4, + "valid_targets_min": 1342 + }, + { + "epoch": 6.136470588235294, + "grad_norm": 0.4208733037887433, + "learning_rate": 1.833129669142124e-06, + "loss": 0.2246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11479602009057999, + "step": 3915, + "valid_targets_mean": 6398.9, + "valid_targets_min": 4249 + }, + { + "epoch": 6.144313725490196, + "grad_norm": 0.46839862019377804, + "learning_rate": 1.8005764901555678e-06, + "loss": 0.2137, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10964938253164291, + "step": 3920, + "valid_targets_mean": 5338.1, + "valid_targets_min": 3817 + }, + { + "epoch": 6.152156862745098, + "grad_norm": 0.4645376835084068, + "learning_rate": 1.7683013214266354e-06, + "loss": 0.227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1521643102169037, + "step": 3925, + "valid_targets_mean": 5332.6, + "valid_targets_min": 678 + }, + { + "epoch": 6.16, + "grad_norm": 0.40683657902501225, + "learning_rate": 1.7363046559834718e-06, + "loss": 0.2276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11666695028543472, + "step": 3930, + "valid_targets_mean": 6784.1, + "valid_targets_min": 4317 + }, + { + "epoch": 6.167843137254902, + "grad_norm": 0.4639347819876015, + "learning_rate": 1.7045869825998674e-06, + "loss": 0.2156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09457366168498993, + "step": 3935, + "valid_targets_mean": 3903.6, + "valid_targets_min": 784 + }, + { + "epoch": 6.175686274509804, + "grad_norm": 0.4646117573962641, + "learning_rate": 1.6731487857877971e-06, + "loss": 0.2331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15744554996490479, + "step": 3940, + "valid_targets_mean": 5625.9, + "valid_targets_min": 3955 + }, + { + "epoch": 6.183529411764706, + "grad_norm": 0.4356971179363293, + "learning_rate": 1.641990545790002e-06, + "loss": 0.2176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10445305705070496, + "step": 3945, + "valid_targets_mean": 5696.6, + "valid_targets_min": 3260 + }, + { + "epoch": 6.191372549019608, + "grad_norm": 0.4351794252227166, + "learning_rate": 1.6111127385726844e-06, + "loss": 0.2285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11319652199745178, + "step": 3950, + "valid_targets_mean": 5047.4, + "valid_targets_min": 3681 + }, + { + "epoch": 6.19921568627451, + "grad_norm": 0.48584900526974223, + "learning_rate": 1.5805158358182039e-06, + "loss": 0.2238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09738421440124512, + "step": 3955, + "valid_targets_mean": 4529.9, + "valid_targets_min": 3430 + }, + { + "epoch": 6.207058823529412, + "grad_norm": 0.442358610321098, + "learning_rate": 1.550200304917897e-06, + "loss": 0.2247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10242228209972382, + "step": 3960, + "valid_targets_mean": 4843.8, + "valid_targets_min": 3220 + }, + { + "epoch": 6.214901960784314, + "grad_norm": 0.5001361874122662, + "learning_rate": 1.5201666089649193e-06, + "loss": 0.2196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0966445803642273, + "step": 3965, + "valid_targets_mean": 4384.6, + "valid_targets_min": 692 + }, + { + "epoch": 6.222745098039216, + "grad_norm": 0.4832526224656965, + "learning_rate": 1.4904152067471932e-06, + "loss": 0.2184, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10578788816928864, + "step": 3970, + "valid_targets_mean": 4047.4, + "valid_targets_min": 2904 + }, + { + "epoch": 6.2305882352941175, + "grad_norm": 0.4561742516644297, + "learning_rate": 1.4609465527403722e-06, + "loss": 0.227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0976758748292923, + "step": 3975, + "valid_targets_mean": 4819.9, + "valid_targets_min": 869 + }, + { + "epoch": 6.2384313725490195, + "grad_norm": 0.4957291772635957, + "learning_rate": 1.431761097100921e-06, + "loss": 0.2213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1101255863904953, + "step": 3980, + "valid_targets_mean": 3684.1, + "valid_targets_min": 775 + }, + { + "epoch": 6.246274509803921, + "grad_norm": 0.465197280451629, + "learning_rate": 1.4028592856592239e-06, + "loss": 0.2206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11609461158514023, + "step": 3985, + "valid_targets_mean": 4429.8, + "valid_targets_min": 916 + }, + { + "epoch": 6.254117647058823, + "grad_norm": 0.496223651742939, + "learning_rate": 1.374241559912788e-06, + "loss": 0.211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11883389949798584, + "step": 3990, + "valid_targets_mean": 5541.2, + "valid_targets_min": 4575 + }, + { + "epoch": 6.261960784313725, + "grad_norm": 0.45057004857361893, + "learning_rate": 1.345908357019483e-06, + "loss": 0.2076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09654825925827026, + "step": 3995, + "valid_targets_mean": 4013.4, + "valid_targets_min": 640 + }, + { + "epoch": 6.269803921568627, + "grad_norm": 0.48472218470428075, + "learning_rate": 1.3178601097908827e-06, + "loss": 0.2187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09483954310417175, + "step": 4000, + "valid_targets_mean": 4327.1, + "valid_targets_min": 760 + }, + { + "epoch": 6.277647058823529, + "grad_norm": 0.4761380329140597, + "learning_rate": 1.2900972466856377e-06, + "loss": 0.2141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10870771110057831, + "step": 4005, + "valid_targets_mean": 4861.2, + "valid_targets_min": 3449 + }, + { + "epoch": 6.285490196078431, + "grad_norm": 0.49338258536074125, + "learning_rate": 1.2626201918029301e-06, + "loss": 0.2193, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11417485028505325, + "step": 4010, + "valid_targets_mean": 4991.2, + "valid_targets_min": 3913 + }, + { + "epoch": 6.293333333333333, + "grad_norm": 0.48241818096169126, + "learning_rate": 1.235429364876015e-06, + "loss": 0.2166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11160287261009216, + "step": 4015, + "valid_targets_mean": 4995.0, + "valid_targets_min": 3574 + }, + { + "epoch": 6.301176470588235, + "grad_norm": 0.4378176483854021, + "learning_rate": 1.2085251812657762e-06, + "loss": 0.2246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10883471369743347, + "step": 4020, + "valid_targets_mean": 5228.6, + "valid_targets_min": 3682 + }, + { + "epoch": 6.309019607843137, + "grad_norm": 0.469030673041714, + "learning_rate": 1.1819080519544123e-06, + "loss": 0.2213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11258652806282043, + "step": 4025, + "valid_targets_mean": 4730.2, + "valid_targets_min": 3556 + }, + { + "epoch": 6.316862745098039, + "grad_norm": 0.44244478805711335, + "learning_rate": 1.155578383539142e-06, + "loss": 0.2207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10519449412822723, + "step": 4030, + "valid_targets_mean": 5691.1, + "valid_targets_min": 677 + }, + { + "epoch": 6.324705882352941, + "grad_norm": 0.5758805053505508, + "learning_rate": 1.1295365782259982e-06, + "loss": 0.2231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13826540112495422, + "step": 4035, + "valid_targets_mean": 6115.6, + "valid_targets_min": 3513 + }, + { + "epoch": 6.332549019607843, + "grad_norm": 0.47896063638163283, + "learning_rate": 1.103783033823671e-06, + "loss": 0.2315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1043325737118721, + "step": 4040, + "valid_targets_mean": 4979.2, + "valid_targets_min": 3179 + }, + { + "epoch": 6.3403921568627455, + "grad_norm": 0.4334623118587568, + "learning_rate": 1.0783181437374669e-06, + "loss": 0.221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10528846085071564, + "step": 4045, + "valid_targets_mean": 5229.1, + "valid_targets_min": 3059 + }, + { + "epoch": 6.348235294117647, + "grad_norm": 0.4096491972779553, + "learning_rate": 1.05314229696325e-06, + "loss": 0.2343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12475338578224182, + "step": 4050, + "valid_targets_mean": 7550.8, + "valid_targets_min": 4536 + }, + { + "epoch": 6.356078431372549, + "grad_norm": 0.4573346545451403, + "learning_rate": 1.0282558780815411e-06, + "loss": 0.2306, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10188288986682892, + "step": 4055, + "valid_targets_mean": 4367.8, + "valid_targets_min": 761 + }, + { + "epoch": 6.363921568627451, + "grad_norm": 0.46912558391597736, + "learning_rate": 1.0036592672516088e-06, + "loss": 0.2159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12381172925233841, + "step": 4060, + "valid_targets_mean": 5394.8, + "valid_targets_min": 3766 + }, + { + "epoch": 6.371764705882353, + "grad_norm": 0.4813159773927962, + "learning_rate": 9.79352840205703e-07, + "loss": 0.2175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10303199291229248, + "step": 4065, + "valid_targets_mean": 3941.1, + "valid_targets_min": 615 + }, + { + "epoch": 6.379607843137255, + "grad_norm": 0.41667861310639953, + "learning_rate": 9.55336968243268e-07, + "loss": 0.2286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11974573880434036, + "step": 4070, + "valid_targets_mean": 5733.5, + "valid_targets_min": 3492 + }, + { + "epoch": 6.387450980392157, + "grad_norm": 0.49151600430779024, + "learning_rate": 9.316120182253141e-07, + "loss": 0.2111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10450279712677002, + "step": 4075, + "valid_targets_mean": 4488.6, + "valid_targets_min": 661 + }, + { + "epoch": 6.395294117647059, + "grad_norm": 0.4415542796332715, + "learning_rate": 9.081783525687826e-07, + "loss": 0.2226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1253572702407837, + "step": 4080, + "valid_targets_mean": 6553.2, + "valid_targets_min": 4229 + }, + { + "epoch": 6.403137254901961, + "grad_norm": 0.44382860786184114, + "learning_rate": 8.850363292410269e-07, + "loss": 0.2243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11451376229524612, + "step": 4085, + "valid_targets_mean": 5709.0, + "valid_targets_min": 3848 + }, + { + "epoch": 6.410980392156863, + "grad_norm": 0.4428905242189662, + "learning_rate": 8.621863017543353e-07, + "loss": 0.2134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10134243965148926, + "step": 4090, + "valid_targets_mean": 5144.8, + "valid_targets_min": 4120 + }, + { + "epoch": 6.418823529411765, + "grad_norm": 0.5018401575755567, + "learning_rate": 8.396286191605352e-07, + "loss": 0.2393, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11206495761871338, + "step": 4095, + "valid_targets_mean": 4646.0, + "valid_targets_min": 1807 + }, + { + "epoch": 6.426666666666667, + "grad_norm": 0.4517958808892632, + "learning_rate": 8.173636260456575e-07, + "loss": 0.2185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09486055374145508, + "step": 4100, + "valid_targets_mean": 4185.4, + "valid_targets_min": 626 + }, + { + "epoch": 6.434509803921569, + "grad_norm": 0.4545491068989947, + "learning_rate": 7.953916625246804e-07, + "loss": 0.2154, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09442710876464844, + "step": 4105, + "valid_targets_mean": 4015.5, + "valid_targets_min": 701 + }, + { + "epoch": 6.442352941176471, + "grad_norm": 0.4598041822034105, + "learning_rate": 7.737130642363211e-07, + "loss": 0.2188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09323002398014069, + "step": 4110, + "valid_targets_mean": 3760.2, + "valid_targets_min": 765 + }, + { + "epoch": 6.4501960784313725, + "grad_norm": 0.4582099692292797, + "learning_rate": 7.52328162337923e-07, + "loss": 0.2199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09848172962665558, + "step": 4115, + "valid_targets_mean": 4312.4, + "valid_targets_min": 780 + }, + { + "epoch": 6.4580392156862745, + "grad_norm": 0.44772459638692896, + "learning_rate": 7.3123728350039e-07, + "loss": 0.213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1100703775882721, + "step": 4120, + "valid_targets_mean": 5088.5, + "valid_targets_min": 4233 + }, + { + "epoch": 6.465882352941176, + "grad_norm": 0.46327139443607485, + "learning_rate": 7.104407499031896e-07, + "loss": 0.2205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18428373336791992, + "step": 4125, + "valid_targets_mean": 6381.0, + "valid_targets_min": 811 + }, + { + "epoch": 6.473725490196078, + "grad_norm": 0.43202629332535153, + "learning_rate": 6.899388792294482e-07, + "loss": 0.2273, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10554929077625275, + "step": 4130, + "valid_targets_mean": 4890.8, + "valid_targets_min": 2166 + }, + { + "epoch": 6.48156862745098, + "grad_norm": 0.4787639033963915, + "learning_rate": 6.697319846610772e-07, + "loss": 0.2275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12935051321983337, + "step": 4135, + "valid_targets_mean": 5128.5, + "valid_targets_min": 3360 + }, + { + "epoch": 6.489411764705882, + "grad_norm": 0.4374673739573011, + "learning_rate": 6.498203748740106e-07, + "loss": 0.2172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11974336206912994, + "step": 4140, + "valid_targets_mean": 5625.0, + "valid_targets_min": 3430 + }, + { + "epoch": 6.497254901960784, + "grad_norm": 0.4718170829134424, + "learning_rate": 6.302043540334701e-07, + "loss": 0.2247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10960593819618225, + "step": 4145, + "valid_targets_mean": 4964.1, + "valid_targets_min": 3384 + }, + { + "epoch": 6.505098039215686, + "grad_norm": 0.4929681247793601, + "learning_rate": 6.108842217893384e-07, + "loss": 0.2287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14213602244853973, + "step": 4150, + "valid_targets_mean": 5879.5, + "valid_targets_min": 593 + }, + { + "epoch": 6.512941176470588, + "grad_norm": 0.48504256263392026, + "learning_rate": 5.918602732715583e-07, + "loss": 0.2206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09823766350746155, + "step": 4155, + "valid_targets_mean": 4444.2, + "valid_targets_min": 386 + }, + { + "epoch": 6.52078431372549, + "grad_norm": 0.4767032025354917, + "learning_rate": 5.731327990856517e-07, + "loss": 0.2282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11948859691619873, + "step": 4160, + "valid_targets_mean": 5461.9, + "valid_targets_min": 3945 + }, + { + "epoch": 6.528627450980392, + "grad_norm": 0.4247913504681906, + "learning_rate": 5.547020853082497e-07, + "loss": 0.2177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11250126361846924, + "step": 4165, + "valid_targets_mean": 5245.2, + "valid_targets_min": 501 + }, + { + "epoch": 6.536470588235294, + "grad_norm": 0.47341087020563916, + "learning_rate": 5.365684134827542e-07, + "loss": 0.2301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1286301612854004, + "step": 4170, + "valid_targets_mean": 5085.1, + "valid_targets_min": 768 + }, + { + "epoch": 6.544313725490196, + "grad_norm": 0.5452947122533847, + "learning_rate": 5.187320606150103e-07, + "loss": 0.2316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18514202535152435, + "step": 4175, + "valid_targets_mean": 6446.4, + "valid_targets_min": 751 + }, + { + "epoch": 6.552156862745098, + "grad_norm": 0.42641629979857115, + "learning_rate": 5.011932991690959e-07, + "loss": 0.2263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12646891176700592, + "step": 4180, + "valid_targets_mean": 5828.9, + "valid_targets_min": 4165 + }, + { + "epoch": 6.5600000000000005, + "grad_norm": 0.46574222475217153, + "learning_rate": 4.839523970631387e-07, + "loss": 0.2187, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12034496665000916, + "step": 4185, + "valid_targets_mean": 5428.6, + "valid_targets_min": 3459 + }, + { + "epoch": 6.567843137254902, + "grad_norm": 0.48648714804401355, + "learning_rate": 4.6700961766524833e-07, + "loss": 0.2168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10155089199542999, + "step": 4190, + "valid_targets_mean": 4122.8, + "valid_targets_min": 768 + }, + { + "epoch": 6.575686274509804, + "grad_norm": 0.4655250441869616, + "learning_rate": 4.503652197894681e-07, + "loss": 0.2184, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09567312896251678, + "step": 4195, + "valid_targets_mean": 4185.8, + "valid_targets_min": 3418 + }, + { + "epoch": 6.583529411764706, + "grad_norm": 0.464660545382178, + "learning_rate": 4.3401945769183884e-07, + "loss": 0.2247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.094794362783432, + "step": 4200, + "valid_targets_mean": 3753.0, + "valid_targets_min": 1343 + }, + { + "epoch": 6.591372549019608, + "grad_norm": 0.40188876002080204, + "learning_rate": 4.1797258106650804e-07, + "loss": 0.2146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10433869063854218, + "step": 4205, + "valid_targets_mean": 5433.4, + "valid_targets_min": 3375 + }, + { + "epoch": 6.59921568627451, + "grad_norm": 0.4714750606191182, + "learning_rate": 4.0222483504191556e-07, + "loss": 0.2145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08846727758646011, + "step": 4210, + "valid_targets_mean": 4271.1, + "valid_targets_min": 817 + }, + { + "epoch": 6.607058823529412, + "grad_norm": 0.5078200189738814, + "learning_rate": 3.8677646017704963e-07, + "loss": 0.2295, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10169130563735962, + "step": 4215, + "valid_targets_mean": 3950.5, + "valid_targets_min": 662 + }, + { + "epoch": 6.614901960784314, + "grad_norm": 0.4232569435845233, + "learning_rate": 3.716276924577744e-07, + "loss": 0.2322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08592445403337479, + "step": 4220, + "valid_targets_mean": 5230.9, + "valid_targets_min": 3524 + }, + { + "epoch": 6.622745098039216, + "grad_norm": 0.43181541312088884, + "learning_rate": 3.5677876329322624e-07, + "loss": 0.2174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1324676275253296, + "step": 4225, + "valid_targets_mean": 6772.1, + "valid_targets_min": 3196 + }, + { + "epoch": 6.630588235294118, + "grad_norm": 0.49254515548212713, + "learning_rate": 3.422298995122675e-07, + "loss": 0.24, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13985073566436768, + "step": 4230, + "valid_targets_mean": 4969.0, + "valid_targets_min": 727 + }, + { + "epoch": 6.63843137254902, + "grad_norm": 0.4264979019492451, + "learning_rate": 3.279813233600404e-07, + "loss": 0.2078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11380667984485626, + "step": 4235, + "valid_targets_mean": 5638.6, + "valid_targets_min": 3436 + }, + { + "epoch": 6.646274509803922, + "grad_norm": 0.4434834036479819, + "learning_rate": 3.140332524945522e-07, + "loss": 0.2205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10968320071697235, + "step": 4240, + "valid_targets_mean": 4396.2, + "valid_targets_min": 3472 + }, + { + "epoch": 6.654117647058824, + "grad_norm": 0.4755423972418163, + "learning_rate": 3.0038589998336423e-07, + "loss": 0.2232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1261489987373352, + "step": 4245, + "valid_targets_mean": 5429.0, + "valid_targets_min": 3906 + }, + { + "epoch": 6.661960784313726, + "grad_norm": 0.4329871366469772, + "learning_rate": 2.8703947430033465e-07, + "loss": 0.2076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09297747164964676, + "step": 4250, + "valid_targets_mean": 4497.1, + "valid_targets_min": 3315 + }, + { + "epoch": 6.669803921568628, + "grad_norm": 0.4993264893966694, + "learning_rate": 2.7399417932242325e-07, + "loss": 0.2296, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11046084016561508, + "step": 4255, + "valid_targets_mean": 4216.9, + "valid_targets_min": 919 + }, + { + "epoch": 6.6776470588235295, + "grad_norm": 0.4355414330786498, + "learning_rate": 2.6125021432659824e-07, + "loss": 0.2176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10060550272464752, + "step": 4260, + "valid_targets_mean": 5505.8, + "valid_targets_min": 2862 + }, + { + "epoch": 6.685490196078431, + "grad_norm": 0.4521689898500482, + "learning_rate": 2.4880777398677e-07, + "loss": 0.2426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1378835141658783, + "step": 4265, + "valid_targets_mean": 5625.0, + "valid_targets_min": 4029 + }, + { + "epoch": 6.693333333333333, + "grad_norm": 0.470768846829166, + "learning_rate": 2.3666704837082888e-07, + "loss": 0.211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12488949298858643, + "step": 4270, + "valid_targets_mean": 4775.0, + "valid_targets_min": 3986 + }, + { + "epoch": 6.701176470588235, + "grad_norm": 0.4710412868048963, + "learning_rate": 2.2482822293774297e-07, + "loss": 0.2268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1238384023308754, + "step": 4275, + "valid_targets_mean": 6255.5, + "valid_targets_min": 4588 + }, + { + "epoch": 6.709019607843137, + "grad_norm": 0.4438839076302866, + "learning_rate": 2.13291478534714e-07, + "loss": 0.2195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14333386719226837, + "step": 4280, + "valid_targets_mean": 6303.6, + "valid_targets_min": 3679 + }, + { + "epoch": 6.716862745098039, + "grad_norm": 0.5060736267850259, + "learning_rate": 2.020569913944348e-07, + "loss": 0.2247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11077409237623215, + "step": 4285, + "valid_targets_mean": 3751.0, + "valid_targets_min": 789 + }, + { + "epoch": 6.724705882352941, + "grad_norm": 0.45844627042874836, + "learning_rate": 1.9112493313236947e-07, + "loss": 0.2271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13419592380523682, + "step": 4290, + "valid_targets_mean": 6193.1, + "valid_targets_min": 3947 + }, + { + "epoch": 6.732549019607843, + "grad_norm": 0.4624929402927315, + "learning_rate": 1.8049547074416195e-07, + "loss": 0.2254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12782934308052063, + "step": 4295, + "valid_targets_mean": 4674.4, + "valid_targets_min": 724 + }, + { + "epoch": 6.740392156862745, + "grad_norm": 0.44973617852573694, + "learning_rate": 1.701687666030627e-07, + "loss": 0.2177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1164279356598854, + "step": 4300, + "valid_targets_mean": 4788.5, + "valid_targets_min": 3863 + }, + { + "epoch": 6.748235294117647, + "grad_norm": 0.4877134554107391, + "learning_rate": 1.6014497845745715e-07, + "loss": 0.2213, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12220542132854462, + "step": 4305, + "valid_targets_mean": 4376.2, + "valid_targets_min": 948 + }, + { + "epoch": 6.756078431372549, + "grad_norm": 0.4770935848522137, + "learning_rate": 1.504242594284544e-07, + "loss": 0.2229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1367311328649521, + "step": 4310, + "valid_targets_mean": 5298.9, + "valid_targets_min": 4224 + }, + { + "epoch": 6.763921568627451, + "grad_norm": 0.5373921676125825, + "learning_rate": 1.4100675800754914e-07, + "loss": 0.2197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12212381511926651, + "step": 4315, + "valid_targets_mean": 4523.1, + "valid_targets_min": 939 + }, + { + "epoch": 6.771764705882353, + "grad_norm": 0.4927951692587741, + "learning_rate": 1.318926180543545e-07, + "loss": 0.2228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10165538638830185, + "step": 4320, + "valid_targets_mean": 4021.1, + "valid_targets_min": 909 + }, + { + "epoch": 6.779607843137255, + "grad_norm": 0.4813767080894923, + "learning_rate": 1.2308197879439932e-07, + "loss": 0.2298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1391141563653946, + "step": 4325, + "valid_targets_mean": 5597.2, + "valid_targets_min": 4134 + }, + { + "epoch": 6.7874509803921566, + "grad_norm": 0.43435379671631896, + "learning_rate": 1.1457497481700775e-07, + "loss": 0.2277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1326904147863388, + "step": 4330, + "valid_targets_mean": 5858.1, + "valid_targets_min": 3410 + }, + { + "epoch": 6.7952941176470585, + "grad_norm": 0.509799192903302, + "learning_rate": 1.0637173607323859e-07, + "loss": 0.2232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08625923097133636, + "step": 4335, + "valid_targets_mean": 3410.9, + "valid_targets_min": 601 + }, + { + "epoch": 6.80313725490196, + "grad_norm": 0.4340451395208277, + "learning_rate": 9.847238787390246e-08, + "loss": 0.2281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10468437522649765, + "step": 4340, + "valid_targets_mean": 5285.2, + "valid_targets_min": 3760 + }, + { + "epoch": 6.810980392156862, + "grad_norm": 0.4662601092806204, + "learning_rate": 9.087705088764997e-08, + "loss": 0.2216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09582984447479248, + "step": 4345, + "valid_targets_mean": 4779.4, + "valid_targets_min": 3127 + }, + { + "epoch": 6.818823529411764, + "grad_norm": 0.46696313433638315, + "learning_rate": 8.358584113911994e-08, + "loss": 0.217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10853664577007294, + "step": 4350, + "valid_targets_mean": 4434.6, + "valid_targets_min": 3719 + }, + { + "epoch": 6.826666666666666, + "grad_norm": 0.43846142448189535, + "learning_rate": 7.659887000717403e-08, + "loss": 0.2129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10556395351886749, + "step": 4355, + "valid_targets_mean": 4671.9, + "valid_targets_min": 890 + }, + { + "epoch": 6.834509803921568, + "grad_norm": 0.4319322520744759, + "learning_rate": 6.991624422320042e-08, + "loss": 0.2209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10148314386606216, + "step": 4360, + "valid_targets_mean": 4710.1, + "valid_targets_min": 3220 + }, + { + "epoch": 6.842352941176471, + "grad_norm": 0.4528238104041261, + "learning_rate": 6.353806586946842e-08, + "loss": 0.2146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10324162989854813, + "step": 4365, + "valid_targets_mean": 4713.1, + "valid_targets_min": 3076 + }, + { + "epoch": 6.850196078431373, + "grad_norm": 0.44883130023888307, + "learning_rate": 5.7464432377580814e-08, + "loss": 0.2188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1069837287068367, + "step": 4370, + "valid_targets_mean": 4678.0, + "valid_targets_min": 2848 + }, + { + "epoch": 6.858039215686275, + "grad_norm": 0.502502931033106, + "learning_rate": 5.169543652698617e-08, + "loss": 0.2192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10652319341897964, + "step": 4375, + "valid_targets_mean": 4192.1, + "valid_targets_min": 1039 + }, + { + "epoch": 6.865882352941177, + "grad_norm": 0.4817734391686949, + "learning_rate": 4.623116644354886e-08, + "loss": 0.2146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12233863025903702, + "step": 4380, + "valid_targets_mean": 5835.8, + "valid_targets_min": 3830 + }, + { + "epoch": 6.873725490196079, + "grad_norm": 0.444884821554049, + "learning_rate": 4.107170559822127e-08, + "loss": 0.2152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09412867575883865, + "step": 4385, + "valid_targets_mean": 4147.2, + "valid_targets_min": 919 + }, + { + "epoch": 6.881568627450981, + "grad_norm": 0.45787283402160717, + "learning_rate": 3.621713280575367e-08, + "loss": 0.231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10872447490692139, + "step": 4390, + "valid_targets_mean": 5069.1, + "valid_targets_min": 3293 + }, + { + "epoch": 6.889411764705883, + "grad_norm": 0.4342624586083637, + "learning_rate": 3.166752222349523e-08, + "loss": 0.2224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09016773104667664, + "step": 4395, + "valid_targets_mean": 4896.4, + "valid_targets_min": 899 + }, + { + "epoch": 6.8972549019607845, + "grad_norm": 0.4981911991886726, + "learning_rate": 2.7422943350263743e-08, + "loss": 0.2254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11719105392694473, + "step": 4400, + "valid_targets_mean": 4600.9, + "valid_targets_min": 3802 + }, + { + "epoch": 6.905098039215686, + "grad_norm": 0.47616977358182333, + "learning_rate": 2.3483461025282094e-08, + "loss": 0.2247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.08278848975896835, + "step": 4405, + "valid_targets_mean": 3947.2, + "valid_targets_min": 659 + }, + { + "epoch": 6.912941176470588, + "grad_norm": 0.47507102563863857, + "learning_rate": 1.9849135427187916e-08, + "loss": 0.2261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16222912073135376, + "step": 4410, + "valid_targets_mean": 5750.8, + "valid_targets_min": 3535 + }, + { + "epoch": 6.92078431372549, + "grad_norm": 0.43316713506324794, + "learning_rate": 1.6520022073112098e-08, + "loss": 0.2269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.0887688621878624, + "step": 4415, + "valid_targets_mean": 4106.0, + "valid_targets_min": 1988 + }, + { + "epoch": 6.928627450980392, + "grad_norm": 0.46871403580777404, + "learning_rate": 1.3496171817832804e-08, + "loss": 0.2291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1262306571006775, + "step": 4420, + "valid_targets_mean": 6219.2, + "valid_targets_min": 4586 + }, + { + "epoch": 6.936470588235294, + "grad_norm": 0.44141115841411704, + "learning_rate": 1.0777630853000543e-08, + "loss": 0.2329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09531784057617188, + "step": 4425, + "valid_targets_mean": 5062.0, + "valid_targets_min": 3697 + }, + { + "epoch": 6.944313725490196, + "grad_norm": 0.48753846856369104, + "learning_rate": 8.364440706429833e-09, + "loss": 0.2242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11849364638328552, + "step": 4430, + "valid_targets_mean": 4558.0, + "valid_targets_min": 711 + }, + { + "epoch": 6.952156862745098, + "grad_norm": 0.49429667262142357, + "learning_rate": 6.2566382414641635e-09, + "loss": 0.2264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12699516117572784, + "step": 4435, + "valid_targets_mean": 5793.4, + "valid_targets_min": 2085 + }, + { + "epoch": 6.96, + "grad_norm": 0.4789452496037441, + "learning_rate": 4.454255656414219e-09, + "loss": 0.2178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11449083685874939, + "step": 4440, + "valid_targets_mean": 5632.1, + "valid_targets_min": 909 + }, + { + "epoch": 6.967843137254902, + "grad_norm": 0.4578636924842011, + "learning_rate": 2.957320484067161e-09, + "loss": 0.2123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10642892122268677, + "step": 4445, + "valid_targets_mean": 4728.5, + "valid_targets_min": 628 + }, + { + "epoch": 6.975686274509804, + "grad_norm": 0.4583003210525026, + "learning_rate": 1.7658555912647423e-09, + "loss": 0.2191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13077768683433533, + "step": 4450, + "valid_targets_mean": 6211.1, + "valid_targets_min": 4483 + }, + { + "epoch": 6.983529411764706, + "grad_norm": 0.45176736594513867, + "learning_rate": 8.79879178554699e-10, + "loss": 0.2156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11069822311401367, + "step": 4455, + "valid_targets_mean": 4677.2, + "valid_targets_min": 1989 + }, + { + "epoch": 6.991372549019608, + "grad_norm": 0.4435188034232649, + "learning_rate": 2.9940477991097227e-10, + "loss": 0.2156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09977850317955017, + "step": 4460, + "valid_targets_mean": 4503.6, + "valid_targets_min": 604 + }, + { + "epoch": 6.99921568627451, + "grad_norm": 0.45734595449193466, + "learning_rate": 2.4441262527208355e-11, + "loss": 0.2094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10217998921871185, + "step": 4465, + "valid_targets_mean": 4522.4, + "valid_targets_min": 449 + }, + { + "epoch": 7.0, + "step": 4466, + "total_flos": 2.8947179058078024e+18, + "train_loss": 0.0, + "train_runtime": 3.2247, + "train_samples_per_second": 22141.844, + "train_steps_per_second": 1384.951 + } + ], + "logging_steps": 5, + "max_steps": 4466, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 1500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 2.8947179058078024e+18, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..08e1073 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0675e31c6bd40bee14d02640e56278aeb8e7bd65b921430bb113cd409e0e0401 +size 8785 diff --git a/training_loss.png b/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..520c60640934999fe1acdb646a5201b672210ea7 GIT binary patch literal 41142 zcmdqJg5l|38S`Yzg5kWe|0z@h4 zQb3gM{N{q^eb0N&_nq?x9Iwag@ps3*_gZVNImaAhtR14Mevyitg&e~$DwRu0+89QF z$1vP5DG9tH-rheB|0nHoLC@vtT}zjHW=^*-H8U3n+q*8dcg#86ZaF#Mxoa;bBq|~# zDZqK##l^u{T3Fcbzds>#*U3t_&cL-5u0rN;>4r0g(U_sXxGee1I~bPAt)g^J$35}y zz&-Ei&Yc5uZPBv5ue@Rz$e+pzjBy{)a=;s~UZ-7Eb~HKuCtzBU^@RGIbiU#0HW_y? zWeneWw;M(ZtMFFoQ<-?{VR+uQ9*lY;8E8p)1PnLI<@ZBj!=$+(Du;ZN2N z&9|kDFrZ*G$DsMM$U?flfwB*Jp_iU=N(P(4u3e8{76LQv4I zb1_9_>_hnZ8sBa8b@%F5gX*i|89$<*KJ~vW^nN_o?$jdiu821 ztWiPb0(rUXG)abb$hn6kC9clFq_w>zHe4$7UHL|RU1~Uoc-*kT-74bfPyW5Vy%K${e`lwwJClg@3T*sJS<5Z0NJxIoXwWgp!1?zM(%Uu*!e(oBtJV4(Uc;Zce&;svb>*wt+5|DG0lPb^HC6>?Ngo5Lj-YpvRv2^n z3o7Xuja;;fS54kK9b@-d(t5-yMIXi}{GtE7v*TzZnapaxbI*I{i900$`j*RoI?L97 zC$tw^X)sZexJ-9Z!H@GhIXU%~-?1`ubrrXN|BGR1x|@bKnhb}-F-bab4!Vy~6~vis zZ!E`2yPl+{r%(McMa#w({wezSSfu=p_Qw zdNqPoiu<^qPNs9(tuN0;9#9D3_4DlW-g)$tyYinrd2+6vLfCY)F+@;KPE73J;lqdH zL@h|nEiAOIT?@Edy-sp9Q@sh6FR1TsjnUw}<_NaQ-V**->PexGAJe|f%p7}2BUcNz z5L~mfK~Ypxv`{@;waPwIxu|aF@hc`y)=R>7^WT|%zuoPu*RSg>B4xWywryV-vFY`8 zo@i~lcHJo8i%>WGACYob)y)T;zqR#tD-iLAW5rq|bUMD7k&T5>E-7t|=e&>T*WlzX6@j>ERrCsN|X ztf-@+qT=Xe!q~n3iXLKQ9Q%_~pd86A>##JbRk^*=w>IC*QRF)BZ)7njqjs;YB8ty0Xs z#);~^vt{PhNbXOw5jL)5D(!coXqDgf{+e`_Q8k19&Ye3STU+h_W&WH&m($GFDby3d zOJ1-nzA@<{UF1G*&gD-FVZ(qmcI6ppEI&1tTOW_smCtOkJVOfHu>E{ zSYxHf;<(+lYuC611g;o*&o{Ae4mvbY)!#lHIy!3Z(brRCabc+1N8^2-x0=DOxE)z~ z`w7dhagMtAoxSAbtsAZy%@Eey zSn$%)(p9bCyVT+yYdL|TfS;my0>m+&?*MIPIr-249v_!P))zhX_~rb-6p#q9>VJ8UJ!UIei#Dk>7Z)fd#()}DhvR3zn^J*q5!s^m+avi0@#4$Ga_H~;nyme?@DT2WLPN3N~8SFVkQ=~cRm@~ABI z?%rIb!R*VYc!`LJhS%oD%KpCjLQ6}F4-O`k*_vx8?E8n|A3dUkvV~#4zdk=&y8C`2 zIl67kL9)=iiF_}7CUzkpL~MIR;Ku#^{Y_CUzjw;$UfkGT9TJ7tAwp5ELiw+1g-=kh ziI7Hyv!->R;$HJ*;VPn_hLNI_hLPGMcPsDjY;T^={K3V|O%Q!tLvE_4o6*FZjyyn- z{p2uP9~3k;>$iJ0fNnGXatyLYvNQ<)q8a};Q(4Dd0!c*^N&+fggLBA^xJFv{CJKZZ?Ki{s(f{TnzdHE z+wfs(DyM%yfLT}WjjZf!sXGQNM=r)Zc`~wG8NWE&^y`aojgqzXNl43dhYtC}+>F7d zlf2_)*k%Pgv}|W%nvS0S0o*(e`|yaFFreP~WhW$IS{9bj?afuMr0L=|x#(Tq^XJby z{wwL;*y=Na`iF`q#DQ5u;7I9^Z$p{m*to6Vty{-nMlD<7f4TlGvS?1#Ir%I1jZN-4 z6tjrU*%}VODWufYAK32o<8nGfzkk=hk|M{(#l=NRMpg$Y^Uu8TPwi?sLT^zfN`NxA z=V?PPgfZ0FmySUiJuvJo=v}f3X)ZwVMJ=QQ*>^*b+P~dCy#`4)-bXE{;XWh|YN!Da zLTJ`j{`CdDe905pre|U})@zh<7Yi{w5LaJel$!tltz9_^Xqf5i8iJa())xb`vk$>QtJ+B47Zz%c|N0e@ zXHXi-cl8x1X8!AQ%)*#(^;#Onxv;Px6H%-u0L3KuXR+0nKG@&8+&A6 zoP!<{Z0m!Sn==&z_%c|>Un{%I-6jhj5_Y{jSg@?u%E!KBuNf(vLL#igXv}qEy1SM0 zfhg*m01fcYM#sgSfK;fYqw{pFS$>CW(09|$u~lk?Y|<7Wn3qA^aP$~na%(>j8A$fu!@jC3lOy9^fOZa>C(FMK*40Mi6H zEVlH0wbAPAkO?J|h{D$tc@vqPwK2uaA0f%IUZGGoJWRT4@?iUi!m=6dy;sm32Jx$< zt<62V3dxcD^yCQ~Cz?ugbMrv;{Rg z<=!+W`T3jR`u@u4bms#p_lB@kmueafayFWL^bJ|CK2>AM?N1Mv?_HUHs=MsM zW^vs7SL$W!H{ZkvQ*GY+_ReV1y+JzX-(TrQMn;VNqGu}?BQQ=s-ml5B2L6G8q2uE> zBOmQho$2RHOH1=_v0N-`g&ZjWi~9WebH(5dKMH6t=%I8lP%sJ|Iy2~=j&UMTEo$9y z!f|`KI}C2|qM_5LV+8m$KpN^BRV7 zLx&CpLoN+Fp6srO(e6Sl#rp_y`Cn2~J4{GINo(Rg9}pZCb`Vp#bSW4ufXtgB-JENb z>@s?=NkSJEoVfhO&XXuq0$3I-{|%|~B=*s-t#rUG0m=y@jFP?TQuU78fcy`3k8!$r z*pwkKU8EV>eAQbEm+9Ep1koNqAxg){cpO%_fAE?6`mfjvH*dZ?!OtH(D+Pl``vRa8 z+gUeKY&55!T6*eJxy#gOd)2tKnYH!nLj62;Mq*CiwUGl{{)>_Fl9GD;Zhdy_6JJ_d z4)aETvZyE!(hO?gf^LS3S1o>=4g+);f^z0!oBU8t-o1Xupv6xFDAVNRmw!$-Xiw73 ziCLwhpg0IP|5fuC^eB;ec6(lw686NVg0jAt4L1LDX#YfEWyY*MAus z>CX5agjWF~*7#Oc3d+lyz($z=cAn-_pRxN0F`&Apx`zj3TbI|yA}L_fAq@O!6}L8~ z3kdLSGc2pqV5x3g}AQ`lPip}{`E zDq@On_RVke51idSs{DvHiYMgkY~|HK%i^C(-rn9}fe~A9#V13%xL~gHfx$)M7^6kGrn$P}-Yf(9xaV|U z+RK+p0DnW^Vr!J@N1_uF_;pUkAXqB%uA*A=%yEo}bFY)?yH9vvysb+uLE=-N(dyfb z-3VtVCnZzURCnkj{b`q14Y~Yl0lDKafa7>)2ls2&VhRMfG1InW*^i$;FZ_`sNSwO5 zs={?|z?D(w}S2LuExL~3U@&W$t_0WMO8MLT-uNOrpgkMc2_UeAK5g?JK<-%VAJtPOSWhX+(5V z?)2$HXZjr;Hm|Gy+8OYeNMf&n=C%BS-_uMjVEpTP4r`d1Ku}+?%Pv zu`Wx9A=nxfHR`xsP`yE(elb!RvRkuryrd)dU$?Ve1tv7u8sH;N75ZeKl^X>T5|#P1 z1gnEy!ia6~UioRY;1C#yTBzDuh4od)8RVj(q6;;#(3~G!UtceSlKMf>eSw}1L6 z=M`F?{vNzsyKXFg=Q~gTy&)e|n4TmiJ_5F6LuOWXwSR1W(`R+y0Jh*`t#*8Km7bNA zviRqtYdN|lz2e?CYJ6n@)IYSze@}9d_sZi^Kd40xlB{LF<85S&$0jFlFHN?e_oZ2b z9EfJP&%T1{sf{uJig!#$wRlp&)_EcokEV z(q^Ruvx>c|qC$plbRxx%9e~p@x!o;i)MP@^Cjk~_+-GxnItb9$a088e<4cujO+CF} z4Y~Eku@c$mojKPVEQ>v;%$&Am&s>Bs%dc9|Uta~>OmyHt`n}mfCOPl2%7NuwL62?R z#7&-VN|$@Dp(g5!(z#*Y>{)NIm37`xxr%!3CH;=Q@^$BuX{9>BkOb1Kr05)g}GfpHZkDbFfY zHcW8k`6=RrGj~@u9y0^x$A*DUYRrf=4)xvM;Ns*|$Upb0d-@2Ki?y}2%mYFU%H?V~ z#38BMzusfJ$q5P5^JSlIE=bZqJ@HZ#6BDC5a%7s06H}NStink)uO?jqKJ0f(LQqo} z;}|ry>|>Yvn?GAxTADWo(-}9z*ayZ|pAE`)OG@2?LUl`1KiVd3zeD)P zM#^oFe){xD(q)oX!nS94dA2)a#79+KJy7w*|*I2Fd0jRx)oi{(U zyTb^a2iNH6s6!nw<8Zu9{u8T|-hXa@b=(t=o<7|%7G~3(Z(U@H_sr#swi^{J7zbKD#ycH0|v1B3B{u00PJ~go8e-MmpE7)tQP6!@dbp&uoA$ z;-71Hpx=-DZfP#AI-813o9mjI!=lNjI5{zBxEE%%w6ualLkWhrPD$LGF-(Nw1EYD| zJ(RZ@`wK;zA*>p+?|n;_;=948TVVWe`IoWl%=-yX zTW{#i(67Ln_||@o;YSJAVzAPq=k1+?qhn(@$(k2x$ujFt$zPUN&-+4yBscU{ox!6b z!VlOb7D21wo#u%zh?P7$Q$~1zhJ9(BYd8wB5x|Qvn2OkkF>!HBP!q-{CXSvur9Ief zU6PiS^)dY|+3?nf@i4D%v^`|$k(BIb>x zaaVXRMfuwlRK5H3NZmr;bC<r)(9HU4 zXDeO1b{J^&FvzamV?EF(Vpm^XsaqZLiv&`i8OqRUw8KpNwhsfXX&*DurFnVw7qIb3 z$9S>7gH?SKv79C>zR8A;O^2avPukji#4I*WMp1n_v18;rKo$T_KyDxR1-yaK1_E(~ zz-1zG0hQ4=#l=+wmEtyC?oais1-=pE|NgZ#gqRh1enqd^`+YYfpjMnp)Eta|-FEiV zpx+TOpADBv0Geyit~w65c8>sIS9>hha8&HE{a@FGl7a16@5yg3*i8~spmIf$Sy36e zc3yLbUT+@K=WxW?ncFV%;mQxQuV#*#>~1i=&dEve_8DmU@L}}Zi}Oz3rbahx?=Z=* z$$IMS&{qQ!XlayQQZin0AbwSDYyqa+9I6KJ+&NpnUKbY9VyRA%{ze~zq?>W!{y=FMGnB{Ouw{di7XGe#7i|*wsR}cYF z6>+!hpUZ5Du$qq)s=Cld&dvwMCniz?Ndp%zQB5j?CQL_HH+g9t*sL-5b!A7#c@@HP zfFNVQS$+UQNyKB}CScCq>4%51+OodH}!()poG2+$C zec*%unFOKyw>Z((47vv*ff2DA2L;x5d-;0GH3n?LW(80?%7pa*!9;F<<3xCB4Vr89 zY{BC{`n||7n711I54 zT{mN-ru6sC*@U$A+al2BqLM@%L{g9hl+*bz51 ztX0$i5wnVe@u;wKlqsjTTagiDXiqIu{mm;KT==X2v_9F9Gxke* zJ}=73dMvI)*wp-Z?^g{M#RfT|^6TrVOn!jSLkR^2Q5V-4ijNIR80EkJ&0^bMMh8<` z+-;GOk+HD(6&NBiE`P(f8#lYzL`*Tj^AXUwTYP@XXFPTuXLY@3Q!)j(6&8q-g(|jF zH%YmV9xb}v&K)VtEx)~VaAkJLPu1^kb(wC@9e0}0u&}BXSK@*E6#k2wszLNicTc;_}*Mkv0qiCi{&pyg!D=jp|q5vwZ( z9x(WM;P*VX%03)_ZMggbvm#!H9+nY^AaT!?zhnt5flxCJfu4ncEM~Q0+L5Id9?=8@ zg(Oft4lUx{oPvT>@K0*xaFzf_!UPVM&k?5RcOMJi!vRpGp*bPAapMNk%V14<28*2gL1n@QI?d^pSj%Jl~zzV8X z;uCcXa&whHU3sOJ5C}Q}h+*cdGXqE@0a+Batm_+|RqVo*a|8eu*pX@+clr)J5-3r- zgL-NYoK* zX@Io=hD(CvO^=9IC~lKKGHE32`-4q<*NI_)*}FXso} z5VhID_$TO?)?kk#-6}dl$6K&N|9 za;_eel47o_s{=xn4#X8;fkeI6=At7E2;=>P86oyT?=}OvXTjkG2<#LH-_L`r=1CO= z@?&#H_Ek|Ra47u%h+xhK{W{vR3*scddczv=$B%i)0FonZ*oTC!#dSKbG_9vS*hl(5msP2iF)e|9`!^e*wYom@`ew>*2SL}xua1~?i z7de`sqy>Q@I{hfGzw?__iccWuGb3-l2%RsrAAl-!AK|$i-Mspzd{<@O%OsW0^FGgKsWX( z!5&=_leFQcW;uO{{a`OEz>(G)_}Mf z1&V{QIwXOOJS-J5HAskb zKxP3t3Im`uU_o9*8(yFfO$ucsJ!?1^7&Z#BXJLFP8oPNE1>6c>+JBum1!H7kNfFiFl7Dn99``^zi zz-;olO&mldv}&V38z1*E@+oOr?mb<(3+d_sV%LGr6(TG4T()+ERDpy%Ac2%@ZF9>Y zpvO<~d#(JX!y2Cn8pyO>)6+YFGIV>+bz#`n0iSNtHw4izBH>PU#pdtbap>-7ksNU{ z=5pWw_A`z>72jWp(uX_wO<*UW+YfkO~2-W8PC}HVPyuEffuN z$hUHR?tlu&FekyQ_riU6Pp?$6c&Q!fEqBc++xU}nAy&x9UpMD4j3LpvRmyy4Yu)&k zE)vF&0z${mE(BaE2(+|lxF^nZ(t~Tq9K>gEN9aQ;K@v48GoK>+Y$ZfpCN=3eIE0}^ zk&W;HfM82h$4}3WRyD#Bl<45(c+{%;(9|x+EXEt@JHsOTw#m z-})OKC_Hw+Zm{wOMhkHyn-_M_)e`a4(n&KlLU%M4+#0zM(%_&Fv%=LlRKyj<>kcq@$OUal! z-<6WCHHcbYxNu<&k`D|y>ql}+pEgX$k5_7ofAo2Fqd={VR5@my_3G6J8`}Y(7w&?s z$Lp)A8zh>#H@Chxz(A8T7~JHlKX41{6=In8;6cCkE$bi*I=4V*)snK`(Yi_k6J86A z&bNwtccG+=fUctm;JcaWWATOb_BDaBD?7h{R*~ZG&d$%5o4WEfuw*9dpB?ZHu<1Eb zoq&vEwz=|e4O+%;1t#*58@`~Xfe0awkc?uU?wK1-8L}YoEHdAIZ}ZPHj>?8r;${17 zB<;hFL0UxFWLg+Bl<*y~){AbxY>>$rBK-z!JCtI8 zF*XxnYRu9~m-*14H9d90sMab>hB_-GCGbmL35gpnC3$Jd1?hcshYug?ur5K_4}5P+ z`j-b>{VHJfxpvgbo-Nz_$t)2U4?JjpdDgD)of;DUkeLWdGYS}B%a1|Fsb8fgl%GM9 zuyMzhPm@t4_-fX?f|AldeRXx}m6?IQaXEj{e6t`Kl>e0fIO<%g3gjhjwAyLDB)5CL$6Nrw{Dl zr##E`=UH4>czA$fyOgsTC8p5;nfvkM$KSeIIKg&#^>I>?V1eO}pCXtHRer!EBmi(% zbbQDI*GbxMz)KfFLEn-ZWEO?@XKdb|LS{~D6Y0gdyw;!dYRKRjBKrR@c(M|L@iQrz zmOvsQ?^B6M_BNW|Ip@*M@4Hj~@E~20lI3*Ph2}>` z&QR0H%qb+4KGbJyMxIqyq%4a7C*}+M0_5?>m`iLUXj@ zB}=4t6~#4O1A{X`!C6;}ezMsu{Lls>^+fgh?;}X}@2U1Viy$*V2WU$51}6Z@HP`Gc z3;!Le;Q-lpP8u1P`~icqB3uN;^gbxP-Y~r5RVzTw1%h~G3aTX%IvfGgatR8m`O1ih z&|ZEfPzUV=g16AL$<=}eHaI$Q$%?uHzx~Z3+H0hD^~{UP4}nQPGbGPQRpuqYdhzxA zrQTX?v#@jeXA{_XKEu}7_yY(}&}TIP%ySqCU?jlg)`kg@tia*3LQ`ot7mT=ZGwY84zWr(5tWpbFiAPR ztW?X>wSbD%Q{z`tY4`ClS9o%IZZ4&VhX<2{ZCs@qc;UpwmtS_@YvWao@&}Ct*w8P1 z&xDLZ!HR$^dVqbAivAb~lfM%et=Przz8_O{x#g512b#Y)aF(X!C7f64xRdpi+)#|C zx+Q<0_mQ$iPRc=icdn^Q)UbnOMbQ~(oRCHXE`mDXe@st3pMz#=6u7RlN9|r*ZJkSCW26Ax4F97H5$w zk_xG-D=D1<7zG%dB2s376qJK@P!=k|_k!%Lf~EZrppVG8G4UQj`MZNMF0+GdNHPGQ zQ2=;Je{6i6YEM4^^b8t}IdGV$|Am&O;;I}+5;G;Xt)pZ_QkeE3FzU6wKa03sKVY(j z*h9^N9R;sOmmV`f`jq#@ho8ZO^4n7ZOX-NAW>q%K@t^D)UW_R2xTh`&!nUUM-zFxLTAS^{-o6^6KUrhJZZ{EM3Epm6Sa_rBV0w&YmU7ERkq5 z^H3B~dKYsFV|*T3R_;H+hscSa?OXHAp)&SVd7S}Q0OJx+m3axuR!k6Gs@aceH5oB! zF=Wlp;|GPpf>+d)9Tt!;!+@kPD~cJiEw{BSOz=}huDUGO*7}pD#8A3d$_v7!rf93u zFIih*dRi7XV_mdReJ<8x-!%9R)4x3luin|W^zVQ21kdejt$kNNQ6krW2{+^;RX&w( z+0SuMU(&jo(bon};rB|(zfRPHBY$&eTgA;!^q|(2Zg`xfK;PlQ>AM;+il7@FpMb_3 zR9Lr}{-0fHFDy+VJ?p5Fm6xk>zIhHsQlElQLH?M^vQe!>5Wea6?J)*Ax+n7M z;6gxX54k1*i2!v6K1Qe5X&?om^al(No63NOQ25iG{Q%YLDF+A+DBVEmr-A$prhGGSSuTu$8cK|T5rzqTlKo|l>=Shf`RZnrwZ1Xw}Ig+!jP_4Z}vaVW2dKCrJ|w?ugwVy)@$bwjR{G3dgY00I<((gE%* z4)9Y5AhHE{RiSe#gI*SF3ipPg_rNd^h#~89@$e8q{b+(_CjgN!plug;w}79B5ZEFX zW1r<~AO%vuZm9<{z!8)|tQOi23`1l)*zxBeI6pV%gQ@~LVI3HL=RO@zF$K(~_vU8E z)*5)5!@`f88HEP65nMLNqiX@se&PL@yMvFQkwiZy3~L&K_?9L{6Pc2PD;TCycz6D3 zOl)k!%~LNRr-IWX&vQn$`Agxn9<%Y9Bgbo-e|n2^k}gzd-u)2=JW=s~+jFp$zD+z& z>3b=-nVdrOP`NYLr}XYn1kgO-f#ehwZ67O2urDV=lLlU}7n+ibGDxnyd6Q>P?gt+* z@KS5Q?I0)VD5_nk)Pf$v6yDkv4;2ORtdfqSM6g!0jEq6Z*o@p#<2Jw@QUY1j1imkj zd+x)4k)em_^zFyjz2JlaLB@Bfw^IO?kr05YO>V9Lati~)2hDLzWCDl)2zrC6KMFy6 z@x~2im}*{mU$_rs=Y@kL%j+!Sm8CPS;}iG1>L_7Po=ki%U-c^g5GC3qI#$EA_YuAL z4dNX!cZe_51Z$rBVCh{GsWn18obgx!ci)Z?lqUfJN^mG(c*GpT_nhVqU`H=T_&1Cw z=Rk5>ta=X;olPv%AwDs($JJnMbscAPs+H}yJy(d@d4o!h_P+9zZ5N~{k< z^Nx?8$rK7ahJ`B=*8Z&Orw8FLaKQee zudf^sivzbe4eRp00E?>c!nV*TWGesbGghukC~CkAu=2?dPzyyt<3)!nz=Bf`ELPZq z2LzChH=nlN113x%^9RCtJ;hcu(3L)f>P7>b?kL0*hM}s747UPC<%i%nggcz-K$<3U z{bIDt%w*sPKFqJn3H;)%Ten)u-N5FvN3LxwO|1brgqSlygLkGN=`O_8AWt*DZf-4@ zT zM&E!nGIaZS3mwS;%O3%@);F{h2$dT{_7FtPp#TEmQ95HnRh`X}VeWgzWl<1GkpKz9 zYkojXF$WSoAXF;YoyMEUi-}8TVspF+@EK-%$! z#gkhdDl{WRkqGFM9S%nz+Qb1g+oaPr?(fRV@kULl|EZ1Nxd;@%b`HHJs#FUS5Sx(C z&A}un7bykwXOUf>gw!yY=}sWgCrqe3t9=?!3-JA3TZw%6LZ*2+6miqIgHWFN?{HjA zQcnYI)~&*bJ?jrJAOUbdW=-ZdN-jWW0#8lMMFb)qvgbq+#8SboqX8^=r}Nzz<+{Dv zoy5h)P3V3S3F9a$fn~K09P9HCL*_r<+(K}MMfP{d@nnS?H=b`rCnfoO=$-hCSwD5f zaqhv44pnI-5)m00R@k-xjoJGa7Z%`5*1yF#pjB8tYHZ5t zKtAFyh_#D`hODr84`6YpZjt|nHHEOSSeqLG)20ZLM}U%Vvf+z=H~fb{Hz#p7FLy-S z0q(1%MCk@t2$np3j+6%KUxj~Sv$rNcW;YPwfsr|X?i>zz%hCA?pu@q=5g;SV!_WWa z=-4VWA?Koa(D5xv-z`aiU`U?b0uIqOCv&*2Qz!hj{V`fgI9I8k1U3a|6Bia2agr3= zmt9S2vwi3lQ(wO(heQsC7FNPuM#%pW2}td$e=fjtr}*sLkbLBe!tW2(bEvsBbLwZL z?1~kn0J!n`D*ze>x~s38uOk#Z{oua+Czfi(HA(#x_xCmn!vhHeJ6grL1U?9(XdW_X z;DaAMQnC{a>T@BoE{T6$6O8~EkIDl$rQ>Q;OO4a%?lt>1_l%A%i444!=LlU{*vuIm zE@nLD$%<)Jpfwe}jj$yfV9PijDY5$>%5yow&Y>u^feSSsavj^I)Ndu?Mewiz`xg0L zwT>xn4=w68!he2ZRtV=O{J3{`RGkA*9`C3B3NTM5Y(upBuZe{b$>Y64rX?hRogNw0 zLa?~-ieO6?`IM>2`|lti`c<6d+hI(1@7!vdZY}z)a{RJ2n&058<-N}f4R46z1&9#; zkr|0g<#4`*xmrKFk4Tffn^Rffp`EZZXB0u;7X4c82$RD81;o(>0D$ftgZ$->mP|np@B!yqyVno8#&Ucs-*s{04&M(ne_N z_z6#_upam?M9$$Hj&mWskL9soRs=AY?Nb(LE}bw^qTBD;_wJ4wjkuFoz#p&m<<~GG zl3f2YB?EPPv#C!5v-w+}LJuSTR&I^kV}R0r>@C45ykf@ze9Zp7%M5`#iuQhlyGeph z@TxPSMYvzQKP*ug^n!qChZV-ZcMiDy4%Fo4KNWZ>GJk~2_kQC&J?S2)wHE|>Mg+73 zrfho+hd7K(&xe_5m6G#IE%X)bQ^376_cvpw_Ir;2G#8haZ<#)Fy=A(8{V8*-hnkd& zHtQPUFb^%79v?J4Y5BCN&h)`zgnGA18b)aCdQPICo0ZnV${a=%d5#?e>yR02WiU=% zPT!0GE+~q}V;gmRRz*!}(N?$$LE;0LC4VtsDJ7Rb(pRuD@Cbn;{|Exo?*K%COUxWh z1)#yLzTZVPJu#7W9gIh^z=9!Gy3Og!k%@SsQChri2L83s(T@naE4fI+r6fTEMPBqc zDQ8|N)DO|AAt;u>gRZ>y1Jw}h_`g!Xu?a7(UBmQDNIu*+)ceu=8+^ZmTv`bOu?Z#r zD~Xa?gReACh&YZafi72cV*(MY4ge8B$xY6-d>1$VjzL7ThSl(x4G#FN_B)zM-i*7~ z_4G)gp9lOG`440%Nr&NDmB=A5kRdlG5JFj>wgng{K=9e}^6*&C7B73w(-C_gSGFHU z5!6p`GDe7UK?Wb7hQ;3x!P!b69L7_iw-D>i-%$M4O8U5DZx@NX1Y`eu&L0>rg5!VC zVjKgb=(A|!iT_zP^#92*uZrUFeb$^14zO1yJ6wY?&GdFoFpT6}FL+ie#YzoU6c%8k zZ!h#9uPz*CL~5mmCmXb4VC0NU5mON&{9*dvQ8YnZvzE=I2#ym&=ex@Q-1x}715Jz4Fgh*k~(nGtpq4* z{(z=BvXk+F+fH}Zh=A#TZwY>k2n#yzz=!IJ^`M-u; za*6*d?WH&qcNePnp^!MGQ{UdBEf)gm}c*Pgw1AJGcq zLZ(!EIe9PtOdJY7^dSE~$>jq2mJLIpQ8H1z(B9l4lEkn<6u-=WzmOV{97!x_bbR94 z2OjUyDAN1ip-inZV^dHkK(*s4RI)b5V<=r&+oA76&YPHBw!w)ZiaqTrB;7WU)(+~O zA!{^uuC=`P_F6H@*ldv1Cs>4tC;kwSNFIzs*_R5k?*ut^!3fLJJ(;Q{b=Tn7{-pB3 zicUOr;+ovByT4$~Sz_0Y9?xJsfhOlYMb9-d7KO*gRQUaw&4xTX(V=RE-FEKC#2)_P zeem@9KHnn<%i0EY(avp_(o|}%cugLHD0H^YSY+tz9T3B}VuiV(`&E^7|7PsuK48zB z_k)N4O~$n|B;Sq_W=$~d)h|~xhx%HvI2R7Wtg-*`+UIV8;c}tjQ+ow;|5x&{Z!;LH z>lilurPg7eL)!Zhm;iilxj<^jEmN3<$TKPg-a|#}~lOz`H68=Wan@ zdgf?AQYo6$g||Jy5(KH&M_{6H{}DjPDtApvs0`G@<6f`F_(*(mps$>4a>7=qTqL94D3VO!8R#U3c@;CwVe5vb+r$mUQhhOMkqR^= z<7Qal+a6xb9(aNXR_%R>`sJB;S5BU~d@qw)AUiI*gze4hGEE9pD%STA~h`RwQ!N z*-CsVegK~N2qZTS?&ep_C^|Zdf*KeA90BT#;?CX^0&zb1ohNy?cBdM_d?)c&Q3M4# zwAs=qm@s6%0y;ou@vGR!mX@Z}a}UuOa}V=Ny1ER9>~pMncz947{Q=mgU>qR{r;rde zXvuqzhS1e`p%qGU%M`!yy!My)Ujmf&<=KbXJ^0l@fIb~CE=!`Br&F7yMKG+impS3dGXL-e zir@Y#V$1*ueuTQjdmmdqcKe<9`JA8VWw!yc|i zKTx0LO5!#1Q|>(_<^BW^_sU>fVCXHh{dsDA6{Ms?V7!uqrv1tD=RX4l7lmIaQ(>t+ zwlSr|`zw+3K!OIFfDKz^OoR25IUZ#YG7JV{kQok3y3f@e=qq#GX*i5|-o$Pk*t_fd zf5s~kZ~XlEb8@iiEH(^$N;9}K_Vf%C&>++IzH{_#)GYmL5Ys7iH>ZH`D zNl6v7wCFHXI9iQt^EeE6pU%!syPv0P(%{UOjr9P50^9yje)Y-_BBpx`o!Nl>;W#&Z z&d{a(0)_|n3@D>)yCV}94Vi1LbJ!F~FGcB?kjC#}l`NP8LIk#9ml1#`51pN&Wndt| zdfwR`fo)PQVV|`7E&J(Xo(VvDC9T>b(5Z`;Q0v*QyrMo1r7Eh#gG2<5ccJ6j-79d` z=j}P0tyo2_a}Wg9&b8L}6ljhSl$^Xo&*@*xV5*e*CNDt+Lg=4Df)#c>SMNS(szy6L zP!xc5r3J;r^Xb#4Z_U1JMcSOB?Y8D55AetGY`97HfJ&AJESNX2{+hBh?WpT zCk*0bJe-b{w$_|DELV>IAD;)Yp$;n1WC{4?OzuAHT03(co3x=P-BZK0oJ%|~Qp~M_ z4LwZ)ye>4@WM8Q;oQ5LLh;seczfO)#LtD4k1IA~z5Y_^*HijIKz~4WKiXy<`&fH}O zr5jvX>LYH4-9mmEhAx$Jc;Uw;ifxgQI*GA@7yD{R@SNuE|T7 zxPD0P6uyqcilp%E=U!erh>Nt9Oc*Pulns#4K&3f(mx6+#0SVPWQNN)w`0Y2Y!Wpq) zM~9Qf6wHYCJI!Q?HViChIyyS;cHnx21Lk)gGOP=GP^KC%Iw++wV49kD?nFyKPSo1` z@f$acmJ(@$a8xUhmOzmdj-rx*;o~?AzqhMpk$>40o4$(A#|nFFFXRo3EFw_Neb0^^ z12sJXEO#G*>5hV{8UE)0$sgIt^a@SS8JuY=$QlQ%*!KVkD=)2M`zU$5*PGH5*c^0L znN`kP4|*3+2|)|33Ww2n=Mkl8UIOWsyR?!7N}5uFi(Myr#)kEAcw|7Lte0DKWWkMM z<(=L2#fdYUmEgZ_gh$al=T1Bb0;TXHxws;Fs(q2S=i zwEx?;r@_~@A;Wv(1SycynJ!iDOgp6SUe9PMo-CH3d->qtIRwte;Wk~`=1QKy{f)ir zvyU$J3}XdT9mEed7`{j3ue7N#*tnk%2jA>5+4UR8pIez~w$^V%N z4QIc8<3>nhqY|o;aA>Rvl!!KEXN?=X!*uP zPg?6h{Dmfo&JQ|3ARjXurIX$voTg-Af0wGd?IzavX5eZubAk2IJ@SP4T5Hd~IC4Q(Jax#Z4AckS@F>)O|Dx_TM z)koH~Ay31z&cGQ^+{IQYSj=?ieaz&+BmU>e>K0at3Ubd`Y8|ewb|wns2}q842Tf+l zMZ5X+e|M!DnQB`bJBe*=%2-*O5i6o4CW_fw8RAkqn>}m)10_D8mpW8uZ`5L!>ri{V zh+cT=8m(YUz2A33!_?E7b!fkD1eOZ^!_cTULYd${U?Cd7LTeT@lKZ_3f*n?d(Fy`3 zZjt{WYZQJb2zr>ohL}J{05{CH2AFE~D{2Q1-db1@N!J}T)-~$mwL6NE-F-k;W3Pd$ z_Pf=60M8Obz(pdCMGzub`)cpbnH5a930*OK;+y#5PF9o`f&hMrz2+sTU89x7hV@iB ze_B(cU40(?l!~+m7H4GW^DZ8d=>HHfyYh2*=9oVVCbGw}saXJyqEaKrVMMn(+55)M zC*n-q$o4~45+K*(Z2NZwM($mk(ajjcev=rEzQQ;C0T)VwOUz25RB04pMZvv?mxXR^D+7Cl=O2g#cwW3@Zp`lX`>= z;|(~1!$PLKYeiTD~IgwwX~-mDYG#m5vjuO zb)@Sb0LN*U=aGCbJoKoa`0IY*c>q)T(#3$LY($CnI*CYTE=i~E<_$YWG)FWrNAO&R zVO0W&L{fTl&4!ov7(!bGEEy2$s)Resd>S>YEfU4^X`ptWf31eK%`_~*e4Y|0b&FUD zD(sQh+$M0VS6QGJin-qHDcdD3gY5^`6Cf=5veC+LR`hr^Mds7B3Jo``$5@r@x$NZ7 z)wl`XVtCcCmg%DEqH_SWj(^sg&e2CLm8&&;n=eV949m)27Fzx;{xz60iJT#U@Xq_g zRuy+(_Qs*Ze|ObW%?O)J?@CeRGBZ^a!Avi@P2I3Pj0SiBUBCx8W-ctO28mW;h@TSH{*8iMfTsQcT-M@GIri<3MOqL)CZlbt{5(=y z6fL6%OiOczYf~za1lHfoaQZy{(wCe5N*TN9?uEckI9&CWw)EYU0$6HKWfB7H`wiN7 zn9zP0ZL^LlRQIltiY^oLxMEHh-dKMKeC{)FpQ0u89-Gv^u9;i8@%hhvCE^V@+fCGZ zV!>Dtk;&4+5I%9`LWFv@@63lnoW^4eWY}j}T91vun;(xr*a6@DS6gq28CwZ;6C#V% zx*7PhIm!{;vXtxpi7>EaTLtHZViXTj7p>mi&%2VhROxfUGN*Z#?!LYfi8U8dp?v0+ ztpq&sBX~nUoT@n}q$Mj}6K#P3h=*fKW z_#8I|gFfjFD&PVnW`EX>X>()PG|l0}7zAFP>`v1{CbMn=k^s@d9tq$tXbd@6r9 z35J?WY0j*}cZ0~=JU7t_?`HLu6}C)j+E5T zX~{fYiag!E&w27bssThXiVs@AZhAIV%j3iHLC=fk%lEyv-pJFeKAIg=&O?luUpv<+ zJWDtU7__!&xpf zQ0>7u22@T;^E~vA|EsaLfU0`^x<)r00@5X2(h|}k-6Gu}f`l7HK%_ysI|LP_73q|e z4n?J;1d$e$MoJO+*3bX@e)qfMj(2?b4A1bKA@2Q)=ULBMbImm;YN6rHn~_(Uz-sXj zsv`fPBs%n+95b?8N?UTKNcmin0$yFuPV@!$UkfMVZUV?=F9r}w_o+BB)L*{e9y_Hx zefqztO1&w-IpL;cWLx~6u2`s2L#J`&Di%s9fu2JhTLB*ijD^ZwxRFmh`e5+y?0uHQ zL9ctM*pctbmFRc3m4K20LuNDe0<$9VsgEo>zTN9+Vi}*o5h488RQ>SkBm;M++)Y>Y z`DqsZ){Zl(HxR$k0)G#F&6!B+;8xd(I?LW$eZG9id6VRu@lsCjzs2%_`ci_$SAPgZ zL#4|{vECwT*OxJ#8KjZgkFie{g)5^TGV;j<5F_ECqX$(TF65k*h-Y3?@m!u*DnqbrQ-m;azzW^7K>uuvP%FzB}N0LRuo|0^J&?9{eKF zbsxh0`Y-n@F@z7t=!>Rx56PNPqff*=a-PB>)lZmxL!0I_%bCi z3IYf8!%HIrTBS9|zEWx3iTI*uJsbO;;eh+IC6UOTo51t3CB7VvQcx_$A=FgLHCtPn zvK0My9FGHKe6uqUCq&G|>G+;Oc3pt)PyPQa2x6>G5}jAOB&fR&C=^?wF6A3&NLo1e zlRXND`}$#oe5m}=wa2;@y)i37s7@EYPeTUr$el4GAF2C#Xuv+*9|ILUlODghR4O{p zf;{63aLqzxA6d^IqU~a)mU)CjX(!|ulu+kqqNo1}yfcuqkd#l_Fr(1MUmIt(Nt@iv zXi%MNPwVtdtOF)z)ZmuxM#Dq>W`n0Ur-AZSyy?`nZdXU8{r9b8d#1+NXUlgrh zrWB&Py65YkPj`OyllFH%?k&%GXH;jvM$%HFGS1ymE4UA7ZMc25_Sz6swLl%^d0QKE z6qnTHxWMK}3MF_1(jvGa&tm!qBo(sYYlYg%>I4@`&-}Qn79#-LDoBdMu)SPh%6BQK z{KaGvZ8}M6sD;^GlJe~^iUYJ88JTCPeVW=?(F`lSrZk)c}c|mbN98~hYuOmYd(iUPA#bWciU)(_EW4^%A(FjDE>tG;InE$NfU#}2D}S;h8vwh=bvLy6@;c2W7Y3u z9&UbjO<^dfXQ?6@GXI z1D=}R@!JrtaLM?OP~0(UMMhjW9au=!4}{o*J}srWtBS(10KIt#ZH0;JZ{sNKKp!G z0iNK?NO%#(E>&0d#^gj$4>zdekjyP_1|8k^&HS5cv7YT<2rW0qf_o_4yz8|j)s3VD zTema*#YFXZJ%@(nM&-!sHnWaCECP*~RQ%!)oW{A}sthVULI~eICflSY3z@ccLS-A8 z2wbB!rJ=-B$P!|AOwdrWz9$6L>xKCfM#HbaiCsSJvx?n!U-(L~I{nBz%%RoOVh^d) z_3y)5D$?;6<2sJ-cL-lzxjWNRykzyctH__|3Y{0s0PvfB-TIP10HQ{ODH(n zY)*HiY@$3HJ%xa4Ofp0Qw<=xuKd=gbD%=PPoA^MgL56KXy#bkYcB*Ok`|4&nfoTp! zG;R9d6&VSo3L{&uWc)9}Ty&qJI8Z40KXQz@_lClXCzIevJNYr}dYj7h)>Ms%>w9j+ z%!w$VzwY)7QJDEuL-xg6S`WN)nO{lp068{<>O%f2BefqbP(=o;p_>xV`^Pb&HOQ zS^{2`3XI<6jXLiF=ir~pYeE8|qBOHWcY+tG6sDVh@XO3If=r!Iw$7LE)pt)ptflM7 z%Im?&JlWFAS5IAMgkg=B+W2Z5(QGfv)xK{3J-^OVR@pZk@Dqiay0|k|ZV&qvKSjk5 zXLcqPp*RD1-xnST1`4DmplO5*@9x6rm&67GDBX}CgOP|_;K!Mcwl)UPE(1Cv44O*+ z!r03BxQ!f3`k~U4PXwk@jpN39Nz2PGbU&%xw#5kkoQv0*>@2MDvU~HVp=>{+_~ksA zoSU%%-}^p(1r9#`dSLE+yH^a+e+E7yHiG5 zkzd3Z=t_Eu+D9+TarGA|>zWh8eo}xOYyZ6qX_09mFsTmlF1Qzz`Ff%X6-?<%UQey+)JaoxZfp_i)!9hOJgXXdj@K=aX>USo_36Chnt2Z?+feM_sIVD;94tCMez z*~IE`Ddg7k##S5dc?E+~mzru{?3s5>n5b*#A~SZ;pZ=#(K&1{5hn8*ey)=eyfOWfn zl8;OOVGmx@MY9UmKx48<4pxn-{%7{-WK4Og*DJ89Ds{s99Pv=D?+>ih1O*xm{yuza z-5DgGetJ8dIQqh3GJ1<-QkH|QKpZJQ{(lw=sGPZGC?^y>Jw>49i?Biw;R)DiZUE7F z-?$osBDNSNTF3~knf9&6mnu%o^4HfO=Q>X8cX}$imn-mj+N+*6_X7jhwQXd=Kqi5n zlVr^llU!($etVSj&(E(`M&?`9GYrH-b6%$x_ypiTV~E|%8C9leRic&i`W>ScKOJ1F zfTh%pL}XrZ%CHL=nTk*T8M|3;fp4eI^`175((?nk7Ur#6sbW<+KpTl}ttrCcP5 zVwpj~AUf-zM9BtLXX;!}o*|#GJSX{0*CF)2Y>-{J`-Ie$Wim?_#bI*gR@A?XP>y*~RE z;XhV&)S;t|hvlHBcdKh9cyvF4=4NgDGkeyH7ScM5ov%Bk zmA=AubCtJ`eY z52PndWP)XkLb|p1P}4cCHmnPP6H}01^!x)goHAgfR$%7R3nz;;4Su10trynRO&U8AKZb)73Kr< z7wJ;I$rr23S!ciW_&BX3$}eEn^KK5m3Q;RYQVTn43yjH00ajDJJ6*q(ahh%`ln1&+ zlfJ#u$ik};A0&0S8h|{LkKAg04adEy^CVQi`GxNK-~%uewOl;G^jIx=)`v&4bjPK# zb|%l5M^5Y0`1FsuB9!c;GE|GwpJ-8Ibf5xnJ7wSrnHOQjVDpXJfCb2t_rFwOV;v6> zDx_{q{vK7;$fz6`g8{gxRw>#;ao(9o1HXTNPD&Ea0eFSg-<`?qbo?2vR6H7{vLDMg z^)BU4^^L9^vtm(jBry)8tBC;Jfp{2(h))% z!?%!;mGnSV)WDyx4{+ouxIRR1sn4-&cx|a&x3*Rg^?~2pjnCsfmmG!(YO z8>S0TLi}22QcI>%%BwG>hD!BBv<@4?f{G2ZLDE7mcFVk&>6H3uMRvyzmi~hT1%qrd z5>^(B>0HCmgKjMbz6xAy(z|2%PDU*J;&@{h_=F2AC3(@hu=w)=D>F|$S8Jjgyz%}X zPZ3~GTDNMKU^IA#=7`jnq1^kPTcL&sge#)6REp6LCoRN{y`{D;MrdToh-5p0+sqe=mBQv&Q*P>q zA5StzqN*VWne2MZI9`?sfNV~0s<~C<$M1dnJC>qaq-1%0a?9!Z7Sn)DV z%i0!hIAI68evc$jlwxB7!KE;T%Jya?A>1!h{_+y(KbEXUFpsQ4I7EanVl>eXb<}-w zW!u-&q^`Sj)_)q^@~4B^h!mw82539JX(Zt*z;59?TJiU?=Zd29Fhq+)wY>+c(A{ z-DW>EcJWzA?ombMJXSw0_ypO8d7p6%@uc$0qs_Fl2M^^-%e|q>ULD`UcK&zAfdnW^tZ%FONZLQ+!0*vuP?=>=~4;$X8@xu-|z0aEy zT5Yqck2~P#^A@M&;;OMfP6$bKh!X1}00P`quUT7*2x-K)*RUj8{e$k%jyxCCjb&w% zuA@bz-Sm7g`a0v3XsJjD%b)-Y17^u$r2{JYEmLe(>zMM|Zst*&zUT*aTFeIS5_jrE z@60MqqO#m~40*i>@l+U2qFt!ovd1Opfx2nH+66rGZ4-cnp>Y+`JA! zAqAe6zi%v>%nyrwyHSxL^y+3kLqdXfZ12s_#c%mND|N@N4RPQZ@fNS>uU+B!5EAU6 zXm-Ez{-nEdrGmG+H8mMZ?KsBS>tVQwF^w|@q_^Es?5fi~1q=?xCOXWi*v8?VcU;tj zUA;q}>tisLm7)&KiVK?99wmAj&{@6Sz=#VUIT-(RH|`|?WoP1KZ9*`}X& zGlVSf;*U#duNbw+(Ui@FcGPO$dOa=2RnRmgaX=N4X*|XD#f%vxIQwjQuL&xm)X#BR z@x)J)sRLxa3$9KrABSmOfK$%Ma%=jzaTt6h)7&o6`TxEh_}9&PEzZLQ2IM zq(z2Mxw{vxx#L_HZ)`WoG+^~1Q^!W9>Ph_F`Lg2fDs2%#QG7^oV@dfy179r9rHRbg z*hf*-V_;kR2qya{ia14MebnIy8-RJ^`>t7GBOtmDEoQ338HC z(DQWEa#j3;PTndomR5MfWIrGfQ7dmz5ht`a?!1;P)Ql#rmdU}$m5Jo&`sN&nlYU)2 z{!ML4qWS$i6wOh5|KA+X+tkLaFjJm&F{uZ_CqNpgEbhzyHjqK|($_5)XT5A+-^Oa{ zXWAR$@g~J7Le2NCx{@pkx0<{(v9r?RNXj(2b=IYX4XEU&I{EibBPGz2coX)je`ZrR zjRT1+?CJiuAY}Y$lc3={@^>7A$}*bKoHK@K+|F!D$jsHdh( z;3F419y;0&$9g&&6UsjDU`}p`wT5$c`O|eeh_WGbtT3g_p!9a@;)uA-W^;2_?t6gv zguZXY`yzNP>|%NwxDa+12k8+~QMsiT3^xh2<^O zcbZpiik;#gBFAT(!^>HmD^Sj(tm+G8qq;|jkP;Oevk?h6Y0Qk0A z3fuENdbjTpKLq+}_Et(fPrf{3z7+yi$mSt8#avQ407zWV>{h5vp^}XsG4u<1f4y}R zH!{1^wG&OK@8XlEZWJQhN{8C#`_Vc!?1(AUQGgqel*Kxo7g{_Sim}I)oR5KEC#)+U zcHeEvEn4yUJDKoQGEVvu_k&j95!ysrt9oYCgxsD6HM*FF#9Z6lDD#;-CAHWvd@B@?!_z&axkegb0=rR~pr09dva@xuV zwT9bomcG${62*ihj1B7<1s{yRI>+FTh|@c3q;WVE6oh$YOVyVBG1CWNKeA3QevVbo z%0abZf}}z#G-F-iAdaMaR7n&Lp1s9;-)+hsmt>MdO{{{p!{=`x$tfv&Sz@5UT~TWX zOJ|>tU%s`D5mVA)>Tpwju}7|Kt-wG7z*Id0;|<}O{)Qds&B3BU8$-8;N=SELHGEmm#mAS@(oFzejH$19 zXx^h4ROrFoL4LNZGkw3H{GGk}gNp+@(Q+3oC9FiJ&U~gy89#Fx#|VGl+bw#oait{e zGrA{s4DCfAmIrXlr{U|}jkC%5FD4fsv_k?_y^>6Ho7xmfHB4XjFMs;@7+=g8>53h# zX4o&MvQ0B!(idZ*i?IQUj?lwuiM*r_Q4shI6#lA8uTpkryD(kfajThyP#dq%&O zG5J<|^vs{-=2x4qdD*_YkAJpRQkfv-l%+h>+HgcJel??Nk2 zwb;X3BNp6)gAx@pl|t897>6{8qDVWF$_9zJF8S!9|T=?7~N+GiKdQl*n|y#npS@PI4+|!BHXxODePH6}!1>LlMsDy3emJ zxX?8KUJ*kycFW#cqENdB^5*ZThs}VgCUt|sB3V-jCAr!m{=iH<=C8f} zt5(JiW>cgp*gvXWvz%_-X)sW7t!5g&{yiQ6&tMJO*rY~Tsy$G(%ho6Pi^`ka3cN0G zx@OlPRo$BRfgSbd&W*}174rF}9DoFpteOtu)INkZUvP~gzyt|X8$SkdpA!OBz*D9c zV#1lV`|He|wesQyn~$-n`CUnUi|`_$o;!GM%?@G++!9LA^(=UwK(uoFF_Z`U%G(&W z&}=sQ(qHh4u#%EcQ&9HI^!5EewmQ|v+7%Yhgc!+F)Pt?_>H3bAqy`Z1+5 zg_DP+J~B;0m;IDXx7n((*@d2oEas;)-m<`F&gs-xOW~`Wt44&8>WX)!h`#?kRe7f< zxIjedvV{q}D~aUIxW0!)%X-0_Uo9U}LXkj3&uOHE1M4?oojS^*6${FFPsdT{|9x0$Muh(+}f10NrK2Gi&h|HMK-2Z zB!`pda8$z`oVQig(1dX3h9l>UQ?eK`jy^ydm;YS>4IPSHrcU`%3oYi6?Jxhi2 zpGNtlNukbr*yM1%73d6UIeZ-|*l1F!lJJRb1YH1F(ALTN`xB?&>E#-$x&A^`n<@9o zB~ONMiZEdzR$6!!e&vmuOO{!Wv* zL_)LF4RuxUfOgp`E795V^^Z?BKhax>4qsd|6+sp0M#DbN{c&l7E<#M=C%dLWp%?*% zlRHI;5sThSw^7Nu%0)H6snp?g0cfAF(M@ma{Ne_E9Fslym6AR4`JBiMJhY+ybVP zTuXFNjTH7#&TjeBlkvVc`KElU+jH;E3Tn1(+j9=v95pcg)o_p&-fE|atU^4?n?V=5 z=vHV8O)tLw=BW(%2=%?UyT7I@?H!U&)%X9qcr#%ExdaksPkj=NXZhjNolNd=d0H%P^^<_PtQM zDYl)?VOPoN%=mxUC(N6ccS)R$wIEGrcqhTm^Tl1waj})cDyYSH<j<~j-#(Kn_Tr6tUPknQD(=ERYn^4_xg!efjjySF`D<)Y{O=1j(tB4KoBpq9JX;eBl6U5v%m%?+cv2hb*)i+l>(-Fa0pmQ zO^=pR!pR&q-mAAhPPi$h58`pL#;5x$+s>U*SbuT^yO6xq)`rt_5WU-VZ>V5S;@Q&( zXbGKkbo?05c9S%SaEZFg_?CI73iOW@j^Co1b&|@i6Ej}%NOJn)ed=K)bG2&?@7E}% z=>B^FWb*^`v65lT4zCh&8Q>}jIcLDS-*=CAa0iE}tYCcR+1xhtp44~O{E1NF%mV!Y z7~Q6RELR)Zo-H80J~3!WB0V%dC^{>m4ak#Fi@I-o{NqL%VD4rgpi43d{njJ&3ssW2 zcb1Mx%%Z#zZWLFft5*1ZhA^F!!^F`NIdN#=sNMM5?yEkLPl@& zdd*ss=zAKnlD@nMQonOJ5Z0ORg<-Ef87>Tn2*?>W*6J@ZwKqz3FPBQW;zX5bK?N9Z z{{d07#jDOAXTO-V2bvon>M7xCm6b!n`ldw(GQ+IdC3pNB?y|1MKZvjz(-OPz0XyxTq2E1MzizZ&p zoU%Rq8^{q!=k9jA%XKVg2utD(ml*+TibXNUEXx@Jo zEi{R3vXuj;*WRzGWX)BV2u{PYgBEvFv^(F2g= z0#J-&g_P*RWI&*lsO2W?rK?g`3k9SYFzFsVoOPIJ`1qVEsD9+}o4d3{r}wh8xBo3z zV76L$rB&95@`z|eZ>M75k3VZ}Om%}mEN$}5Sei?rtaPJAY;f-NwimisU5)EQNnfmi z6Yf0?18(R{tcJXhN~asw!uj3zWCbN8uW|*C4w#oZm(oI@^AIeTGVh!xQ5qmQSn8q= z)imV8luv`4Uf1*D00*qPqOzo3w?YLd7|>;|0YC-b_R4~tr3t}4ADWcePT|~_;%Ev- z8G1urXq+)mKH%gLv?}KTkPJAxI1^7d(7jku3?=XN#9lZVp;{vG^6t5k0(Yd`8xO%c z?mp%e`aVJXi5)Y%1zVX%vwEtcWeIG4KIdL+Rkod~F@Rl;{oM$9es6gzl?<9Ncq3t8 zQLwU`S)H(EBYW+KL>5tuVuEIJM9K>%o>rRc^8nf1QcE0&AcC44pkjQ?qmwF4CFJPGnL_hbXvZ2VwAq#L+ltmSWd4noR_y3?V;(iic&UXyDxYc}im| z-d&){t|VjwGNhnXf^oJKMv5MXCRKE|R{S4Ud7-WdEGa6Rxu@Z+*!JosuZGu(J>Rp5 z^FJ%p(})rO4y_AG2*M0+D|UI)Dqs{x7!4R#-iyglyE>;%3g&_Vs39S}$T#Nkn5)JH zPzOj+H9w_ZWoCc5LceyHqyj(*KxYh>2hl0k28ovPzbJSkBQ~NQC_1Ln0e6>8S_4lL z6OG;iUf?0!3T*=~RN>{~(O-%;wjsnrbH%RDW`}JG%CErIWy$tAk1zHCc_xvdwD^1A zF(QQ~vLRCc{u1RN$whZvO3z{b(haS1RA=&o2dstRUfjUTctg=*4{$c@Dv z?}=0qNQx0pHvL_WSwjo0%1_qf<|yi$KM;U~77!!gc?6|2alXM%Kb?5^dB(S%wAq1r z<#)F03VqLy_9B)AhL`Ity1;>}>GDs`$Aaemw0jXgx;UaNn&ZTkeSyfi(J7NfL~l(v zman4?7qalwC$yepvGQ=l*#lb}-m;yFC+(&i&pq`EY@KPm^BZQl=o3>L!+2%Cp;e)$ zrQQk^;lSemB@n5!FJ&Usb$4H*JlWuKB~fq4iLKx4iOu2r8dcmMf!+g$Nd!t$?uEnM z)7uz%`KcGprtt3VWV0M35p+Wzkm-=z`gbpGmt7ruU5VBZW#V_bMg3saf3RN)mI6(K z0g}*dKO4aU`j^?m5`=I8O`G@|5)Ol>tB)k)DWu_4lY7#5NCdkKS7^>=poNJ_X(A@!j7Qr?3 zd!${9qxn65Wg6Dcjh-I^=6?-*u5BvWx(>&vB@gqI^|!as?S790))~o9?yQwEuQXE3 zOG%XZZ7tLkrz$XQ$?|4ov*t%qz^#)<9H{d_!AQ+2q=We0dsPA7>F$u|*=ibuM}3)5 zQC<`rgu)QR*f8as=r_g*fAzc#YMX!M?7HRDP$17f`ejoE4kDQ{t$f3P?HyiUhPz`3 zEbG^QU)%H-Rq^@=?v8etr)M_770K#P+f)5>uAIh zjXw(m_ILm5ccnd)aq-JaZQx+fSoxe}YR$ zfs_NueayvCc4>|1Cl+{P`@DJ<2m+S`Jf?#L!d?ItBIqadcxAJ6yxyp(I`Y-?zN)-V z0^NB?uRPl7>C-q^#mz4J;IxJfLI$a)XO5NL-X8xM>db9YNgIpE7=>q6S6e5ycP+MF z<}Y(j>=TN#H);K9f|YQU^Y>c3 zUMlCOuxJi>++h94z%ehwMGAGYzGA!fa&I&(q=1rPH|jnTYIYZgFS)-9G2<@!&7Tb+ z7>+7lwCjGtcobBa98q+nbS28Lubu`{Havn3dI6?v3qPl(QiA4={`?i_^M|^bPXST4 zId~Ov&R^m4Z(bCancRlIk$$TB-i3EV432*M&L9eZ_37&!By%nTPomLrfyWe`QufTX5^hp4;bX?*Y(ah+-rV3h?@b z7SewS`trE1+!}}L_^Y6HvhT~zB9>-Asq7; zpn7Sb!StAZYFesTNy#dPi44O6Xke-xk`(@v6ZU1VXKuZofm*A%-WHlb!*Sn+Wse)=zrL6(jfPfX(RZ^3BuPS!PZ3dRD<+%$7?O$sw?xSpV;tcUD4;|h@ia+)mJK@ z_51XfbekR=Gg$=Thx|Mo<))h6p|&!$aP_@6H;OylB~^B&a);QPk*^2B9Pmd$t;^^}$4nMa0r|WIQu;Q1I1$Y4Q43vEaKg zb&m=^Ztvn}%r%=l!N^fGSG$#Ix_dc7A+j&3K&x!P_2>Q*3kW;O<(?JR3kte8Br8S> z2&=~%D#5ZQEt2got%;3AG|Ko+j5h!SX8)DBK4cN*LvOtXkHF|u7e?h5VTRaMYQwn?Ceu~q2o*|l&#mrHAU#4+lW3> zCPFteyv=;&0TIcUUzO%k`2bb;^6v6BLvwwye%XQ9(e*+Dz^*liXq)e6ay9SgNalRv zq@`0ee#L(0+Mna}oBwor}M467`c*{S}77Nud)_w6Pu!2T_b@zNro=wBz-7 zD6^+!2!SJriOCy@8MGYc&hk=;M9cHNi=NpX7^lp%y0I5Ci%kj4aUhUEqll0ft>^k$ ziB*&K5oH{-5`cDB7@2tzXh;pBtR)Q>+B&|9>bYt`CxL+^wC7i5N%;lT`Kgn*L2E=F zP&AN|$=tQl5^L7HM?|Aa4So)~5H%aVk8_IaW*AQVZVK|cxI*vIR>KY-GDYC_$G3Zg z3Qb93DY0VfW=z`d5Uhzr0sT@1=Z-KC27r09HG-$(v`!OY0@A*aSfszZIb{mQG>7;v&GENK6r(_JCXLxv=XMg&E z>vP3_%Y{d(Q|g;r&mx;&2dgG490JP&)>8Nv-7E9PXibk^4x+;g+@5VjC1ptu)HIvi zyOV_U$3A2!OKOi~n9f2kCH3a5E@0BwEMEcw`%0ROU`>}a(%pyMSw6G&_zsA^<$A9n zVhH$7J{y3iWIsG)3EUAkd;>W?G;D0rLmE_>aiy?jG9ZU-AxHDlCbdy6 zFVuGq$BB>XUQ0PloOs#482BN&4e8%OjMrZ3I| z6;==s%+Wqwio4%tdM;)C=Z_<(0F+p35Q(x0f8ai^EVJxVDKzjMx05v|NJ%GvyxmK{ zp+YNmB?jep%~ay2L->-eG{L|`;%B1@8Pjh<5Z<6||0_q65#}v#>#-M(NJ#HVj*SoHHI_A|F>U(!FlGhi~i z(qJ$4(dbi=K<^7iOZ&T*b#l@s#CZ7yHLY(cJBATZZ0eW%DP=spk)ynIC(HGkTO_8h z*BGsAsvI?5hpY0tR6}QvL)(dKW%==XI1S(Kl-OZvs9e<|4s^TH!-SJ*;PL+O6IYV3 z;wwGdO))~D%YEy@0`G`i##eEK8(Y1fs#RnN1ZO{X3>{b-FkQRCCdx{GdB}!IEKZMS zFOgtx+Iqf2Y+g_1E&gb(O|si>mdk zn0{F%d}|Kqy`x*dmPi`32;f(^8u4lG`?4p?g@7q}4?wbs{xfGaXDsKJEF|qfHj!c>z(fYxOd;6#GI=71=oBGa@ zQ;~5|;*fBDaY-bA<$M(HUq;W5*VZ3W?Bb(yZ7k@!SSa2xjwcr)qhGW}RiLt$oiI@7LBT+x9W*?)z zV&q`9<1i?3v9-uVSy0hW<4MYW<(^2~I66`+Gbwn#(K9qdT{LjXM^9hRzsF|=xU-=Z}c8|GV<#?xLapPxUb0MC1y4%~^CxI{V z&VBlpG8bRV@jxAP!qEpcJ~UJ?jxjdBYaX_7wGj8+vT zcQ`e`Q_C&zA{$Gh55*QD1w*^r#m<#n)r6CKPtP;)#X)+?i2-`dFiTj_?*QlqG{ zN|aBTDCrB+PR7RmVM+2ux9a?-mKmE^?V19fAfW*-Wwq+}+c;z2k8Z(!P$`@|EdLP9 zG8fnXI)1D!PGTu^&!pblH^ujkmX%DN>&L@Q_Mqa^exhqL8Mc$e{*(8S>vA8Ry{s*b z#l@AKaw|S&FuRD`GZhrV0* z!xNsHAJ5=k2~RvBK0adp;<%U(i=5lZZK>)B){u=#0=kr}J3a62TW3GI&E#!#Z?cIt zaAsQ2x^-iW>7!SGFrt~%qN`Rx|0(?=Fjqj4!n+VQTaPZ|OLKPpsZDy%41PIz^xHSJ zSp2xex&;q2>w{xb4KfWv&6n*KXq3F4muEbkkCy0hQz`H}xjl;>Cy@%18flVb@9(4Y zD9I{YwpPe+g!1KTv#%a`%MSd?D;2;47vKsF0Mz7G?Az5L`i z;R|zNc@MES9bcs1Q!6q_9B@itG|D*j=O8hAC-;SL%fq9;j4O3YWVa2SiD}Mr7GO0` z5=$*7LZMT8_jvt?;4xVz;w*xA#^s*>aavhf0q@B~&;V5r3X%g|9=yJ+tgOPkJVaPH z3WVrD;U}T3O%}97h(NbYIS>m*tmb?~hv_lTPG#2|X540t4)y-J4AOe}2cB6@&waZy zqf%${`YF+z4XYt87u*TVT3Zu&o18;zhq%yQMtk3GFh$&=0Nv8QyujmkkY6-mO8|Hx2{9Nm>uA<`G#uFz9MVmz$JDngkrKZou4t3cIyN z0t$VV{O~Z5APf!-YO)~_S3_N70H!12Z#|wEa;=OjvB$+Ey%kNOQwKAl;jbI z70?wzMykPURmIel2ITi}QD8?v0G@aHAcKnX1@G({w>fEesOJjcR(enlLs1c<&O|d0 zU>c5W?hb1@O8(bMx@5o+KREY9KYB#11LM>(KHC}8QCG#qm0q>UE;Kv5r}lkg69_ht zkDfW5{XRs*u(usQA@{vqn(_*ZmZ+Q^?&a$5-5sA8*?%G%DpSb>h_al1_P-dSLg|R? zSTeFmIxa*TPURNY?ZHlLWm}Af_p5}S+VDy1{y2Z#qVKa(a)mT@Zh2#&z#k>-3pw0! zi@saqCD6v}a#Pc*CRq^JJw1~Q`h6AjsOP*DkHx>tfYF8n^4#_VNpI}eBp&Ph=}HpXOizst64|f5p~iId z&UR6HpN91Loh!(t)7m59@86{-DS)x&##B|bNg1)X;X3*M`5h5aJ*q7K?kS4>Klc{( zKi)d~2)C?7RxR+R$}Jm7?E4cy zp+5T4_g>J*6O6y(;?e_V;^58#n*N9vV_{vLA+@2QVK^RhASsBPf!GfS`S(0)uh%aF zIdo)qA>Iwl%*h~tU(nueL;dN~r*K449}EE03dvwqN?KT2ItV8wCT3rIC{F~9#N}l~ zZ~P=s-dxAePs;H_HU=o{fLB%9UjHSZ-}`FCh~hpNLl`XDg1Z%XO6f@t{l#xDC}88J zB$PeftQ!m1q-nVork1g^WCx~xy&wfIn8YZ<)eeq*7eHS5s?AWhM3e@5x3L3yUY~+uM)qK<|+c^r?7Bm}I#@i{kRw zr%$SiilJU@g@wvsf?NY0I?76Zl;ama)p+ zyA`BiXJoDryvY&cKX`;okDZ>Ues$^?NwmY1?1r6eSZ-FM^xNm=&0Gx)4bsTSNJUrU z^=1)_gVQr`T#TRpd(=1SYQ)V@O%T4R!Xo{%#nVeh0ofX z`}g4Tts1k4f#p=>#=xXYWP6t?G741t@lkf5Ie2ZjQ8=PE$H zI?b1ix0%dxzje;; z&&ggveZ3LlNNIriHaP!j7taD&@5UkcPm}AuH1xmm%BcIh*HULFmZGcqx{I^3g0^=2 z=2vxfb@t1b)mx6i1ry}y)x5o5Q!aZ+gEA%veX{n+9*ii1{-uEqxKaGr*zf?wyH+o; zLQ{2hJQNET7cNQ%WdO{L5=S=7tiq(ks8o@!5q2Wzg@uoo z?vgfjn6@5+8lKZoPAcQ^uRv!Pm-IfO2T7sxis2Ptbqpq`^4>dN6JdHyYiD-L8%~7! z#>V$cRhwBZb3YgDz$#Z=EDDa76!7E#=?zM1YCBL2Iq6~k+X*)UXLXL$eOyt;4slmOT>*U}7L(NK)R}K#kon2is4&Q?{j>9{@J9l{C7C>;8yN^g#oh7QHY-9QO zbaBsjnprUobVWerrl7P`%iqDt$$oFCZ|q^+&Gjgp04lR=nS2TxW{MO{4}Tf(m}zumga!2TdS@D3B9-z&Xz`qW`f%5T32q!^!rw{ADOAr6Ax%Yw#6aFh=?b`!oka}_y&V2t+m zykb_+PQW|`h>;`Cw@powsZXEsaXwV4zNQw(N1=)6cMFmB?KLTdN%<4108?oQA~M4T48w!H1ZMjc5G=`USc^lYvMg?*HQjt-H3 zKtL+QNjS=bPLC8TOqNYMepA6&8xK}f@On{TctYnT&4}0}!8h|;z9y=vsW~~UddT?U zJttcW7bJ9)`|v6jfBr&@V2X;0P$;e&&xug*Ms|H=t7o?i{=m5al3A8vbo5eV`r)6 zUtizc_iyB6a~?XVSZ+`iA_N&LJj9C-^r})IPfbfBhew5+8Fo$|vO|#?YHx23%(Z%+ z*R{0J&&|!j!$5_AWHMM6fT-;EB%2FlqZLb(LS&I`adCuyzDaa+fr`NB^mGiEdeeZ< zLLWH7M}wd(cK$xxsPSCYl0R2hVP{f@OJ8}c!?iirN(1#m1VmCTEyCdA)_FvT>Fv;v z8hli3UES#C&#`l@KFg`)PqwK>N|q>oL++3gqE`(pD_e=knDr=+=V7q3xIYLXwKE%`XbvVK zdPgYA@L&HA4;TKtn+T3LD0GB+un|qV|L4d5FMoV~@zNdfOeTse;VAe=Q&m@`Qpq;# Fe*u(hz}El( literal 0 HcmV?d00001 diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..6c49fc6 --- /dev/null +++ b/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833