From e4c310e9e08b61f8cc3f07029a9899a3db28632d Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Mon, 1 Jun 2026 00:43:12 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: laion/exp_tas_optimal_combined_traces Source: Original Platform --- .gitattributes | 56 + README.md | 61 + added_tokens.json | 28 + all_results.json | 16 + chat_template.jinja | 89 + config.json | 68 + configuration.json | 1 + generation_config.json | 12 + merges.txt | 3 + model-00001-of-00004.safetensors | 3 + model-00002-of-00004.safetensors | 3 + model-00003-of-00004.safetensors | 3 + model-00004-of-00004.safetensors | 3 + model.safetensors.index.json | 407 ++ run_summary.json | 12 + special_tokens_map.json | 31 + tokenizer.json | 3 + tokenizer_config.json | 240 + train_results.json | 16 + trainer_log.jsonl | 793 +++ trainer_state.json | 8759 ++++++++++++++++++++++++++++++ training_args.bin | 3 + training_loss.png | Bin 0 -> 46910 bytes vocab.json | 3 + 24 files changed, 10613 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 all_results.json create mode 100644 chat_template.jinja create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 merges.txt create mode 100644 model-00001-of-00004.safetensors create mode 100644 model-00002-of-00004.safetensors create mode 100644 model-00003-of-00004.safetensors create mode 100644 model-00004-of-00004.safetensors create mode 100644 model.safetensors.index.json create mode 100644 run_summary.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_loss.png create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..ab54ba1 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,56 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text + + +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text + +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +merges.txt filter=lfs diff=lfs merge=lfs -text +model-00004-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +training_args.bin filter=lfs diff=lfs merge=lfs -text +model-00003-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text +vocab.json filter=lfs diff=lfs merge=lfs -text +model-00002-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text +model-00001-of-00004.safetensors filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..f77311f --- /dev/null +++ b/README.md @@ -0,0 +1,61 @@ +--- +library_name: transformers +license: apache-2.0 +base_model: Qwen/Qwen3-8B +tags: +- llama-factory +- full +- generated_from_trainer +model-index: +- name: exp_tas_optimal_combined_traces + results: [] +--- + + + +# exp_tas_optimal_combined_traces + +This model is a fine-tuned version of [Qwen/Qwen3-8B](https://huggingface.co/Qwen/Qwen3-8B) on the /data/cat/ws/befe330h-befe330h-otagent/huggingface/hub/datasets--DCAgent--exp_tas_optimal_combined_traces/snapshots/ebbeebd254227e227eae6f6f3f25dd76407c5d1c_thinking_preprocessed dataset. + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 4e-05 +- train_batch_size: 1 +- eval_batch_size: 8 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 8 +- gradient_accumulation_steps: 2 +- total_train_batch_size: 16 +- total_eval_batch_size: 64 +- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.98) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 7.0 + +### Training results + + + +### Framework versions + +- Transformers 4.57.6 +- Pytorch 2.9.0+cu128 +- Datasets 4.4.1 +- Tokenizers 0.22.2 diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..b54f913 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,28 @@ +{ + "": 151668, + "": 151658, + "": 151666, + "": 151667, + "": 151657, + "": 151665, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..a39ef13 --- /dev/null +++ b/all_results.json @@ -0,0 +1,16 @@ +{ + "achieved_tflops_per_gpu": 3.4026604141089156, + "achieved_tflops_per_gpu_theoretical": 406.5485475387801, + "epoch": 7.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.48488524556159973, + "mfu_percent": 0.34405059798876797, + "mfu_percent_theoretical": 41.10703210705562, + "total_flos": 9.02500960062931e+17, + "train_loss": 0.468742822619895, + "train_runtime": 33154.24, + "train_samples_per_second": 1.91, + "train_steps_per_second": 0.12, + "valid_targets_mean": 3460.0, + "valid_targets_min": 1632 +} \ No newline at end of file diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..01be9b3 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,89 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0].role == 'system' %} + {{- messages[0].content + '\n\n' }} + {%- endif %} + {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within XML tags:\n" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n\n\nFor each function call, return a json object with function name and arguments within XML tags:\n\n{\"name\": , \"arguments\": }\n<|im_end|>\n" }} +{%- else %} + {%- if messages[0].role == 'system' %} + {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %} +{%- for message in messages[::-1] %} + {%- set index = (messages|length - 1) - loop.index0 %} + {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('') and message.content.endswith('')) %} + {%- set ns.multi_step_tool = false %} + {%- set ns.last_query_index = index %} + {%- endif %} +{%- endfor %} +{%- for message in messages %} + {%- if message.content is string %} + {%- set content = message.content %} + {%- else %} + {%- set content = '' %} + {%- endif %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) %} + {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {%- set reasoning_content = '' %} + {%- if message.reasoning_content is string %} + {%- set reasoning_content = message.reasoning_content %} + {%- else %} + {%- if '' in content %} + {%- set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} + {%- endif %} + {%- if loop.index0 > ns.last_query_index %} + {%- if loop.last or (not loop.last and reasoning_content) %} + {{- '<|im_start|>' + message.role + '\n\n' + reasoning_content.strip('\n') + '\n\n\n' + content.lstrip('\n') }} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- if message.tool_calls %} + {%- for tool_call in message.tool_calls %} + {%- if (loop.first and content) or (not loop.first) %} + {{- '\n' }} + {%- endif %} + {%- if tool_call.function %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {%- if tool_call.arguments is string %} + {{- tool_call.arguments }} + {%- else %} + {{- tool_call.arguments | tojson }} + {%- endif %} + {{- '}\n' }} + {%- endfor %} + {%- endif %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n\n' }} + {{- content }} + {{- '\n' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} + {%- if enable_thinking is defined and enable_thinking is false %} + {{- '\n\n\n\n' }} + {%- endif %} +{%- endif %} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..59b4193 --- /dev/null +++ b/config.json @@ -0,0 +1,68 @@ +{ + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "eos_token_id": 151645, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 12288, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 36, + "model_type": "qwen3", + "num_attention_heads": 32, + "num_hidden_layers": 36, + "num_key_value_heads": 8, + "pad_token_id": 151643, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": false, + "transformers_version": "4.57.6", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..bbeeda1 --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "text-generation", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..9adbb28 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,12 @@ +{ + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "temperature": 0.6, + "top_k": 20, + "top_p": 0.95, + "transformers_version": "4.57.6" +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model-00001-of-00004.safetensors b/model-00001-of-00004.safetensors new file mode 100644 index 0000000..b5ff10d --- /dev/null +++ b/model-00001-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a27de8e000c12a8f44292bf11f669f867c413377283579acec2f106dce87dd29 +size 4902257696 diff --git a/model-00002-of-00004.safetensors b/model-00002-of-00004.safetensors new file mode 100644 index 0000000..d34786c --- /dev/null +++ b/model-00002-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2863eef4d0dfa2cb37f04940a8ead85dbec92ff990f0bc0e81959265e9d4c63 +size 4915960368 diff --git a/model-00003-of-00004.safetensors b/model-00003-of-00004.safetensors new file mode 100644 index 0000000..983f598 --- /dev/null +++ b/model-00003-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ea188debf8f0ff0bfdeda5bc78808c5c3fe8ccb76fe8a50fc77214d1dc563d +size 4983068496 diff --git a/model-00004-of-00004.safetensors b/model-00004-of-00004.safetensors new file mode 100644 index 0000000..06f6db0 --- /dev/null +++ b/model-00004-of-00004.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4e63b1c1a8319780f42ee90f967f49995e59b3c2765b23e2457cb625545338 +size 1580230264 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..ba886c0 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,407 @@ +{ + "metadata": { + "total_parameters": 308224, + "total_size": 16381470720 + }, + "weight_map": { + "lm_head.weight": "model-00004-of-00004.safetensors", + "model.embed_tokens.weight": "model-00001-of-00004.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.20.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.22.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.23.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.30.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.down_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.gate_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.mlp.up_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.input_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.down_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.gate_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.mlp.up_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.k_norm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.q_norm.weight": "model-00004-of-00004.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00003-of-00004.safetensors", + "model.layers.4.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.input_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00002-of-00004.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", + "model.layers.9.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00004.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00004.safetensors", + "model.norm.weight": "model-00004-of-00004.safetensors" + } +} diff --git a/run_summary.json b/run_summary.json new file mode 100644 index 0000000..96887e8 --- /dev/null +++ b/run_summary.json @@ -0,0 +1,12 @@ +{ + "agent_name": "ebbeebd254227e227eae6f6f3f25dd76407c5d1c_thinking_preprocessed", + "training_start": "2026-01-27T07:29:58Z", + "training_end": null, + "created_by": "DCAgent", + "base_model_name": "Qwen/Qwen3-8B", + "dataset_name": "/data/cat/ws/befe330h-befe330h-otagent/huggingface/hub/datasets--DCAgent--exp_tas_optimal_combined_traces/snapshots/ebbeebd254227e227eae6f6f3f25dd76407c5d1c_thinking_preprocessed", + "training_type": "SFT", + "training_parameters": "https://huggingface.co/laion/exp_tas_optimal_combined_traces/blob/main/config.json", + "wandb_link": "https://wandb.ai/dogml/OpenThoughts-Agent/runs/sft_exp_tas_optimal_combined_traces_Qwen3-8B", + "traces_location_s3": null +} \ No newline at end of file diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..ac23c0a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..cd71f61 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..e9dc937 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,240 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151665": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151666": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151667": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151668": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 32768, + "pad_token": "<|endoftext|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..a39ef13 --- /dev/null +++ b/train_results.json @@ -0,0 +1,16 @@ +{ + "achieved_tflops_per_gpu": 3.4026604141089156, + "achieved_tflops_per_gpu_theoretical": 406.5485475387801, + "epoch": 7.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.48488524556159973, + "mfu_percent": 0.34405059798876797, + "mfu_percent_theoretical": 41.10703210705562, + "total_flos": 9.02500960062931e+17, + "train_loss": 0.468742822619895, + "train_runtime": 33154.24, + "train_samples_per_second": 1.91, + "train_steps_per_second": 0.12, + "valid_targets_mean": 3460.0, + "valid_targets_min": 1632 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..ed3094c --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,793 @@ +{"current_steps": 5, "total_steps": 3962, "loss": 0.9913, "lr": 4.030226700251889e-07, "epoch": 0.008841732979664015, "percentage": 0.13, "elapsed_time": "0:00:55", "remaining_time": "12:05:41"} +{"current_steps": 10, "total_steps": 3962, "loss": 1.09, "lr": 9.068010075566751e-07, "epoch": 0.01768346595932803, "percentage": 0.25, "elapsed_time": "0:01:28", "remaining_time": "9:44:07"} +{"current_steps": 15, "total_steps": 3962, "loss": 1.0664, "lr": 1.4105793450881613e-06, "epoch": 0.026525198938992044, "percentage": 0.38, "elapsed_time": "0:02:21", "remaining_time": "10:21:14"} +{"current_steps": 20, "total_steps": 3962, "loss": 1.0244, "lr": 1.9143576826196476e-06, "epoch": 0.03536693191865606, "percentage": 0.5, "elapsed_time": "0:03:20", "remaining_time": "10:58:17"} +{"current_steps": 25, "total_steps": 3962, "loss": 0.9523, "lr": 2.4181360201511335e-06, "epoch": 0.04420866489832007, "percentage": 0.63, "elapsed_time": "0:04:10", "remaining_time": "10:58:31"} +{"current_steps": 30, "total_steps": 3962, "loss": 0.8882, "lr": 2.92191435768262e-06, "epoch": 0.05305039787798409, "percentage": 0.76, "elapsed_time": "0:04:55", "remaining_time": "10:44:40"} +{"current_steps": 35, "total_steps": 3962, "loss": 0.8596, "lr": 3.425692695214106e-06, "epoch": 0.0618921308576481, "percentage": 0.88, "elapsed_time": "0:05:46", "remaining_time": "10:48:29"} +{"current_steps": 40, "total_steps": 3962, "loss": 0.8071, "lr": 3.9294710327455925e-06, "epoch": 0.07073386383731212, "percentage": 1.01, "elapsed_time": "0:06:36", "remaining_time": "10:48:18"} +{"current_steps": 45, "total_steps": 3962, "loss": 0.7654, "lr": 4.433249370277078e-06, "epoch": 0.07957559681697612, "percentage": 1.14, "elapsed_time": "0:07:26", "remaining_time": "10:47:32"} +{"current_steps": 50, "total_steps": 3962, "loss": 0.7661, "lr": 4.937027707808565e-06, "epoch": 0.08841732979664015, "percentage": 1.26, "elapsed_time": "0:08:08", "remaining_time": "10:37:29"} +{"current_steps": 55, "total_steps": 3962, "loss": 0.7088, "lr": 5.440806045340051e-06, "epoch": 0.09725906277630415, "percentage": 1.39, "elapsed_time": "0:08:53", "remaining_time": "10:31:09"} +{"current_steps": 60, "total_steps": 3962, "loss": 0.7418, "lr": 5.944584382871537e-06, "epoch": 0.10610079575596817, "percentage": 1.51, "elapsed_time": "0:09:26", "remaining_time": "10:13:34"} +{"current_steps": 65, "total_steps": 3962, "loss": 0.7786, "lr": 6.448362720403023e-06, "epoch": 0.11494252873563218, "percentage": 1.64, "elapsed_time": "0:10:11", "remaining_time": "10:11:01"} +{"current_steps": 70, "total_steps": 3962, "loss": 0.7667, "lr": 6.9521410579345095e-06, "epoch": 0.1237842617152962, "percentage": 1.77, "elapsed_time": "0:10:52", "remaining_time": "10:04:56"} +{"current_steps": 75, "total_steps": 3962, "loss": 0.7316, "lr": 7.455919395465996e-06, "epoch": 0.13262599469496023, "percentage": 1.89, "elapsed_time": "0:11:37", "remaining_time": "10:02:14"} +{"current_steps": 80, "total_steps": 3962, "loss": 0.7216, "lr": 7.959697732997482e-06, "epoch": 0.14146772767462423, "percentage": 2.02, "elapsed_time": "0:12:23", "remaining_time": "10:01:08"} +{"current_steps": 85, "total_steps": 3962, "loss": 0.6962, "lr": 8.463476070528968e-06, "epoch": 0.15030946065428824, "percentage": 2.15, "elapsed_time": "0:13:07", "remaining_time": "9:58:46"} +{"current_steps": 90, "total_steps": 3962, "loss": 0.7161, "lr": 8.967254408060454e-06, "epoch": 0.15915119363395225, "percentage": 2.27, "elapsed_time": "0:13:50", "remaining_time": "9:55:21"} +{"current_steps": 95, "total_steps": 3962, "loss": 0.706, "lr": 9.47103274559194e-06, "epoch": 0.16799292661361626, "percentage": 2.4, "elapsed_time": "0:14:24", "remaining_time": "9:46:28"} +{"current_steps": 100, "total_steps": 3962, "loss": 0.6583, "lr": 9.974811083123427e-06, "epoch": 0.1768346595932803, "percentage": 2.52, "elapsed_time": "0:15:18", "remaining_time": "9:51:00"} +{"current_steps": 105, "total_steps": 3962, "loss": 0.6697, "lr": 1.0478589420654912e-05, "epoch": 0.1856763925729443, "percentage": 2.65, "elapsed_time": "0:15:49", "remaining_time": "9:41:12"} +{"current_steps": 110, "total_steps": 3962, "loss": 0.6139, "lr": 1.0982367758186399e-05, "epoch": 0.1945181255526083, "percentage": 2.78, "elapsed_time": "0:16:29", "remaining_time": "9:37:31"} +{"current_steps": 115, "total_steps": 3962, "loss": 0.6651, "lr": 1.1486146095717885e-05, "epoch": 0.20335985853227231, "percentage": 2.9, "elapsed_time": "0:17:03", "remaining_time": "9:30:40"} +{"current_steps": 120, "total_steps": 3962, "loss": 0.7056, "lr": 1.1989924433249371e-05, "epoch": 0.21220159151193635, "percentage": 3.03, "elapsed_time": "0:17:47", "remaining_time": "9:29:52"} +{"current_steps": 125, "total_steps": 3962, "loss": 0.6327, "lr": 1.2493702770780859e-05, "epoch": 0.22104332449160036, "percentage": 3.15, "elapsed_time": "0:18:43", "remaining_time": "9:34:56"} +{"current_steps": 130, "total_steps": 3962, "loss": 0.6477, "lr": 1.2997481108312344e-05, "epoch": 0.22988505747126436, "percentage": 3.28, "elapsed_time": "0:19:26", "remaining_time": "9:32:59"} +{"current_steps": 135, "total_steps": 3962, "loss": 0.6188, "lr": 1.350125944584383e-05, "epoch": 0.23872679045092837, "percentage": 3.41, "elapsed_time": "0:20:03", "remaining_time": "9:28:49"} +{"current_steps": 140, "total_steps": 3962, "loss": 0.6729, "lr": 1.4005037783375318e-05, "epoch": 0.2475685234305924, "percentage": 3.53, "elapsed_time": "0:20:49", "remaining_time": "9:28:29"} +{"current_steps": 145, "total_steps": 3962, "loss": 0.5868, "lr": 1.4508816120906802e-05, "epoch": 0.2564102564102564, "percentage": 3.66, "elapsed_time": "0:21:34", "remaining_time": "9:27:44"} +{"current_steps": 150, "total_steps": 3962, "loss": 0.6371, "lr": 1.5012594458438288e-05, "epoch": 0.26525198938992045, "percentage": 3.79, "elapsed_time": "0:22:14", "remaining_time": "9:25:13"} +{"current_steps": 155, "total_steps": 3962, "loss": 0.6119, "lr": 1.5516372795969776e-05, "epoch": 0.27409372236958446, "percentage": 3.91, "elapsed_time": "0:23:11", "remaining_time": "9:29:39"} +{"current_steps": 160, "total_steps": 3962, "loss": 0.6135, "lr": 1.602015113350126e-05, "epoch": 0.28293545534924847, "percentage": 4.04, "elapsed_time": "0:24:05", "remaining_time": "9:32:29"} +{"current_steps": 165, "total_steps": 3962, "loss": 0.6163, "lr": 1.6523929471032747e-05, "epoch": 0.2917771883289125, "percentage": 4.16, "elapsed_time": "0:24:58", "remaining_time": "9:34:54"} +{"current_steps": 170, "total_steps": 3962, "loss": 0.6208, "lr": 1.7027707808564233e-05, "epoch": 0.3006189213085765, "percentage": 4.29, "elapsed_time": "0:25:37", "remaining_time": "9:31:28"} +{"current_steps": 175, "total_steps": 3962, "loss": 0.6582, "lr": 1.753148614609572e-05, "epoch": 0.3094606542882405, "percentage": 4.42, "elapsed_time": "0:26:11", "remaining_time": "9:26:45"} +{"current_steps": 180, "total_steps": 3962, "loss": 0.661, "lr": 1.8035264483627205e-05, "epoch": 0.3183023872679045, "percentage": 4.54, "elapsed_time": "0:27:01", "remaining_time": "9:27:48"} +{"current_steps": 185, "total_steps": 3962, "loss": 0.613, "lr": 1.8539042821158694e-05, "epoch": 0.3271441202475685, "percentage": 4.67, "elapsed_time": "0:27:39", "remaining_time": "9:24:46"} +{"current_steps": 190, "total_steps": 3962, "loss": 0.6091, "lr": 1.9042821158690177e-05, "epoch": 0.3359858532272325, "percentage": 4.8, "elapsed_time": "0:28:14", "remaining_time": "9:20:40"} +{"current_steps": 195, "total_steps": 3962, "loss": 0.7227, "lr": 1.9546599496221663e-05, "epoch": 0.3448275862068966, "percentage": 4.92, "elapsed_time": "0:28:48", "remaining_time": "9:16:25"} +{"current_steps": 200, "total_steps": 3962, "loss": 0.6012, "lr": 2.0050377833753152e-05, "epoch": 0.3536693191865606, "percentage": 5.05, "elapsed_time": "0:29:33", "remaining_time": "9:15:54"} +{"current_steps": 205, "total_steps": 3962, "loss": 0.597, "lr": 2.0554156171284634e-05, "epoch": 0.3625110521662246, "percentage": 5.17, "elapsed_time": "0:30:05", "remaining_time": "9:11:31"} +{"current_steps": 210, "total_steps": 3962, "loss": 0.6181, "lr": 2.1057934508816124e-05, "epoch": 0.3713527851458886, "percentage": 5.3, "elapsed_time": "0:30:44", "remaining_time": "9:09:15"} +{"current_steps": 215, "total_steps": 3962, "loss": 0.6068, "lr": 2.156171284634761e-05, "epoch": 0.3801945181255526, "percentage": 5.43, "elapsed_time": "0:31:24", "remaining_time": "9:07:15"} +{"current_steps": 220, "total_steps": 3962, "loss": 0.5964, "lr": 2.2065491183879092e-05, "epoch": 0.3890362511052166, "percentage": 5.55, "elapsed_time": "0:32:05", "remaining_time": "9:05:51"} +{"current_steps": 225, "total_steps": 3962, "loss": 0.6837, "lr": 2.256926952141058e-05, "epoch": 0.3978779840848806, "percentage": 5.68, "elapsed_time": "0:32:55", "remaining_time": "9:06:46"} +{"current_steps": 230, "total_steps": 3962, "loss": 0.603, "lr": 2.3073047858942067e-05, "epoch": 0.40671971706454463, "percentage": 5.81, "elapsed_time": "0:33:42", "remaining_time": "9:06:53"} +{"current_steps": 235, "total_steps": 3962, "loss": 0.597, "lr": 2.3576826196473553e-05, "epoch": 0.4155614500442087, "percentage": 5.93, "elapsed_time": "0:34:22", "remaining_time": "9:05:07"} +{"current_steps": 240, "total_steps": 3962, "loss": 0.6116, "lr": 2.408060453400504e-05, "epoch": 0.4244031830238727, "percentage": 6.06, "elapsed_time": "0:35:09", "remaining_time": "9:05:09"} +{"current_steps": 245, "total_steps": 3962, "loss": 0.6241, "lr": 2.4584382871536528e-05, "epoch": 0.4332449160035367, "percentage": 6.18, "elapsed_time": "0:35:50", "remaining_time": "9:03:49"} +{"current_steps": 250, "total_steps": 3962, "loss": 0.6053, "lr": 2.508816120906801e-05, "epoch": 0.4420866489832007, "percentage": 6.31, "elapsed_time": "0:36:36", "remaining_time": "9:03:40"} +{"current_steps": 255, "total_steps": 3962, "loss": 0.5453, "lr": 2.55919395465995e-05, "epoch": 0.4509283819628647, "percentage": 6.44, "elapsed_time": "0:37:14", "remaining_time": "9:01:28"} +{"current_steps": 260, "total_steps": 3962, "loss": 0.6377, "lr": 2.6095717884130986e-05, "epoch": 0.45977011494252873, "percentage": 6.56, "elapsed_time": "0:37:50", "remaining_time": "8:58:51"} +{"current_steps": 265, "total_steps": 3962, "loss": 0.623, "lr": 2.659949622166247e-05, "epoch": 0.46861184792219274, "percentage": 6.69, "elapsed_time": "0:38:37", "remaining_time": "8:58:46"} +{"current_steps": 270, "total_steps": 3962, "loss": 0.5872, "lr": 2.7103274559193958e-05, "epoch": 0.47745358090185674, "percentage": 6.81, "elapsed_time": "0:39:15", "remaining_time": "8:56:52"} +{"current_steps": 275, "total_steps": 3962, "loss": 0.616, "lr": 2.760705289672544e-05, "epoch": 0.48629531388152075, "percentage": 6.94, "elapsed_time": "0:39:55", "remaining_time": "8:55:18"} +{"current_steps": 280, "total_steps": 3962, "loss": 0.6361, "lr": 2.811083123425693e-05, "epoch": 0.4951370468611848, "percentage": 7.07, "elapsed_time": "0:40:32", "remaining_time": "8:53:10"} +{"current_steps": 285, "total_steps": 3962, "loss": 0.605, "lr": 2.8614609571788415e-05, "epoch": 0.5039787798408488, "percentage": 7.19, "elapsed_time": "0:41:15", "remaining_time": "8:52:20"} +{"current_steps": 290, "total_steps": 3962, "loss": 0.6046, "lr": 2.91183879093199e-05, "epoch": 0.5128205128205128, "percentage": 7.32, "elapsed_time": "0:41:51", "remaining_time": "8:50:07"} +{"current_steps": 295, "total_steps": 3962, "loss": 0.6052, "lr": 2.9622166246851387e-05, "epoch": 0.5216622458001768, "percentage": 7.45, "elapsed_time": "0:42:25", "remaining_time": "8:47:19"} +{"current_steps": 300, "total_steps": 3962, "loss": 0.6084, "lr": 3.0125944584382876e-05, "epoch": 0.5305039787798409, "percentage": 7.57, "elapsed_time": "0:42:57", "remaining_time": "8:44:20"} +{"current_steps": 305, "total_steps": 3962, "loss": 0.5926, "lr": 3.062972292191436e-05, "epoch": 0.5393457117595049, "percentage": 7.7, "elapsed_time": "0:43:40", "remaining_time": "8:43:38"} +{"current_steps": 310, "total_steps": 3962, "loss": 0.5576, "lr": 3.113350125944585e-05, "epoch": 0.5481874447391689, "percentage": 7.82, "elapsed_time": "0:44:23", "remaining_time": "8:42:59"} +{"current_steps": 315, "total_steps": 3962, "loss": 0.5824, "lr": 3.1637279596977334e-05, "epoch": 0.5570291777188329, "percentage": 7.95, "elapsed_time": "0:45:15", "remaining_time": "8:43:59"} +{"current_steps": 320, "total_steps": 3962, "loss": 0.5984, "lr": 3.214105793450882e-05, "epoch": 0.5658709106984969, "percentage": 8.08, "elapsed_time": "0:45:56", "remaining_time": "8:42:52"} +{"current_steps": 325, "total_steps": 3962, "loss": 0.5448, "lr": 3.2644836272040306e-05, "epoch": 0.5747126436781609, "percentage": 8.2, "elapsed_time": "0:46:35", "remaining_time": "8:41:23"} +{"current_steps": 330, "total_steps": 3962, "loss": 0.5912, "lr": 3.314861460957179e-05, "epoch": 0.583554376657825, "percentage": 8.33, "elapsed_time": "0:47:13", "remaining_time": "8:39:46"} +{"current_steps": 335, "total_steps": 3962, "loss": 0.546, "lr": 3.365239294710328e-05, "epoch": 0.5923961096374889, "percentage": 8.46, "elapsed_time": "0:48:01", "remaining_time": "8:39:53"} +{"current_steps": 340, "total_steps": 3962, "loss": 0.5375, "lr": 3.415617128463476e-05, "epoch": 0.601237842617153, "percentage": 8.58, "elapsed_time": "0:48:43", "remaining_time": "8:39:03"} +{"current_steps": 345, "total_steps": 3962, "loss": 0.5658, "lr": 3.465994962216625e-05, "epoch": 0.610079575596817, "percentage": 8.71, "elapsed_time": "0:49:30", "remaining_time": "8:39:01"} +{"current_steps": 350, "total_steps": 3962, "loss": 0.5964, "lr": 3.516372795969774e-05, "epoch": 0.618921308576481, "percentage": 8.83, "elapsed_time": "0:50:14", "remaining_time": "8:38:27"} +{"current_steps": 355, "total_steps": 3962, "loss": 0.5694, "lr": 3.566750629722922e-05, "epoch": 0.627763041556145, "percentage": 8.96, "elapsed_time": "0:51:01", "remaining_time": "8:38:25"} +{"current_steps": 360, "total_steps": 3962, "loss": 0.542, "lr": 3.617128463476071e-05, "epoch": 0.636604774535809, "percentage": 9.09, "elapsed_time": "0:51:46", "remaining_time": "8:38:02"} +{"current_steps": 365, "total_steps": 3962, "loss": 0.5764, "lr": 3.667506297229219e-05, "epoch": 0.6454465075154731, "percentage": 9.21, "elapsed_time": "0:52:35", "remaining_time": "8:38:19"} +{"current_steps": 370, "total_steps": 3962, "loss": 0.5865, "lr": 3.717884130982368e-05, "epoch": 0.654288240495137, "percentage": 9.34, "elapsed_time": "0:53:17", "remaining_time": "8:37:23"} +{"current_steps": 375, "total_steps": 3962, "loss": 0.6103, "lr": 3.7682619647355165e-05, "epoch": 0.6631299734748011, "percentage": 9.46, "elapsed_time": "0:53:48", "remaining_time": "8:34:37"} +{"current_steps": 380, "total_steps": 3962, "loss": 0.5234, "lr": 3.8186397984886654e-05, "epoch": 0.671971706454465, "percentage": 9.59, "elapsed_time": "0:54:36", "remaining_time": "8:34:44"} +{"current_steps": 385, "total_steps": 3962, "loss": 0.5644, "lr": 3.8690176322418137e-05, "epoch": 0.6808134394341291, "percentage": 9.72, "elapsed_time": "0:55:10", "remaining_time": "8:32:40"} +{"current_steps": 390, "total_steps": 3962, "loss": 0.587, "lr": 3.9193954659949626e-05, "epoch": 0.6896551724137931, "percentage": 9.84, "elapsed_time": "0:55:55", "remaining_time": "8:32:10"} +{"current_steps": 395, "total_steps": 3962, "loss": 0.594, "lr": 3.969773299748111e-05, "epoch": 0.6984969053934571, "percentage": 9.97, "elapsed_time": "0:56:49", "remaining_time": "8:33:07"} +{"current_steps": 400, "total_steps": 3962, "loss": 0.5368, "lr": 3.999996893720319e-05, "epoch": 0.7073386383731212, "percentage": 10.1, "elapsed_time": "0:57:27", "remaining_time": "8:31:41"} +{"current_steps": 405, "total_steps": 3962, "loss": 0.5683, "lr": 3.999961948184714e-05, "epoch": 0.7161803713527851, "percentage": 10.22, "elapsed_time": "0:58:03", "remaining_time": "8:29:56"} +{"current_steps": 410, "total_steps": 3962, "loss": 0.543, "lr": 3.999888174944605e-05, "epoch": 0.7250221043324492, "percentage": 10.35, "elapsed_time": "0:58:53", "remaining_time": "8:30:08"} +{"current_steps": 415, "total_steps": 3962, "loss": 0.5316, "lr": 3.9997755754322415e-05, "epoch": 0.7338638373121131, "percentage": 10.47, "elapsed_time": "0:59:38", "remaining_time": "8:29:44"} +{"current_steps": 420, "total_steps": 3962, "loss": 0.5805, "lr": 3.9996241518336554e-05, "epoch": 0.7427055702917772, "percentage": 10.6, "elapsed_time": "1:00:19", "remaining_time": "8:28:42"} +{"current_steps": 425, "total_steps": 3962, "loss": 0.5688, "lr": 3.999433907088618e-05, "epoch": 0.7515473032714411, "percentage": 10.73, "elapsed_time": "1:01:02", "remaining_time": "8:27:58"} +{"current_steps": 430, "total_steps": 3962, "loss": 0.5326, "lr": 3.999204844890582e-05, "epoch": 0.7603890362511052, "percentage": 10.85, "elapsed_time": "1:01:42", "remaining_time": "8:26:53"} +{"current_steps": 435, "total_steps": 3962, "loss": 0.565, "lr": 3.998936969686614e-05, "epoch": 0.7692307692307693, "percentage": 10.98, "elapsed_time": "1:02:27", "remaining_time": "8:26:21"} +{"current_steps": 440, "total_steps": 3962, "loss": 0.561, "lr": 3.9986302866773e-05, "epoch": 0.7780725022104332, "percentage": 11.11, "elapsed_time": "1:03:08", "remaining_time": "8:25:26"} +{"current_steps": 445, "total_steps": 3962, "loss": 0.5455, "lr": 3.998284801816654e-05, "epoch": 0.7869142351900973, "percentage": 11.23, "elapsed_time": "1:03:49", "remaining_time": "8:24:23"} +{"current_steps": 450, "total_steps": 3962, "loss": 0.5635, "lr": 3.997900521811995e-05, "epoch": 0.7957559681697612, "percentage": 11.36, "elapsed_time": "1:04:28", "remaining_time": "8:23:15"} +{"current_steps": 455, "total_steps": 3962, "loss": 0.5781, "lr": 3.997477454123818e-05, "epoch": 0.8045977011494253, "percentage": 11.48, "elapsed_time": "1:05:12", "remaining_time": "8:22:35"} +{"current_steps": 460, "total_steps": 3962, "loss": 0.5392, "lr": 3.997015606965656e-05, "epoch": 0.8134394341290893, "percentage": 11.61, "elapsed_time": "1:06:03", "remaining_time": "8:22:52"} +{"current_steps": 465, "total_steps": 3962, "loss": 0.6028, "lr": 3.996514989303911e-05, "epoch": 0.8222811671087533, "percentage": 11.74, "elapsed_time": "1:06:40", "remaining_time": "8:21:23"} +{"current_steps": 470, "total_steps": 3962, "loss": 0.5558, "lr": 3.9959756108576853e-05, "epoch": 0.8311229000884174, "percentage": 11.86, "elapsed_time": "1:07:27", "remaining_time": "8:21:13"} +{"current_steps": 475, "total_steps": 3962, "loss": 0.5884, "lr": 3.995397482098591e-05, "epoch": 0.8399646330680813, "percentage": 11.99, "elapsed_time": "1:07:59", "remaining_time": "8:19:08"} +{"current_steps": 480, "total_steps": 3962, "loss": 0.5396, "lr": 3.994780614250548e-05, "epoch": 0.8488063660477454, "percentage": 12.12, "elapsed_time": "1:08:52", "remaining_time": "8:19:38"} +{"current_steps": 485, "total_steps": 3962, "loss": 0.5359, "lr": 3.994125019289566e-05, "epoch": 0.8576480990274093, "percentage": 12.24, "elapsed_time": "1:09:34", "remaining_time": "8:18:45"} +{"current_steps": 490, "total_steps": 3962, "loss": 0.5466, "lr": 3.99343070994351e-05, "epoch": 0.8664898320070734, "percentage": 12.37, "elapsed_time": "1:10:08", "remaining_time": "8:17:00"} +{"current_steps": 495, "total_steps": 3962, "loss": 0.5754, "lr": 3.992697699691857e-05, "epoch": 0.8753315649867374, "percentage": 12.49, "elapsed_time": "1:10:51", "remaining_time": "8:16:14"} +{"current_steps": 500, "total_steps": 3962, "loss": 0.612, "lr": 3.9919260027654304e-05, "epoch": 0.8841732979664014, "percentage": 12.62, "elapsed_time": "1:11:32", "remaining_time": "8:15:23"} +{"current_steps": 505, "total_steps": 3962, "loss": 0.5209, "lr": 3.991115634146123e-05, "epoch": 0.8930150309460654, "percentage": 12.75, "elapsed_time": "1:12:17", "remaining_time": "8:14:54"} +{"current_steps": 510, "total_steps": 3962, "loss": 0.5822, "lr": 3.990266609566614e-05, "epoch": 0.9018567639257294, "percentage": 12.87, "elapsed_time": "1:12:56", "remaining_time": "8:13:43"} +{"current_steps": 515, "total_steps": 3962, "loss": 0.5182, "lr": 3.9893789455100514e-05, "epoch": 0.9106984969053935, "percentage": 13.0, "elapsed_time": "1:13:55", "remaining_time": "8:14:44"} +{"current_steps": 520, "total_steps": 3962, "loss": 0.5723, "lr": 3.988452659209745e-05, "epoch": 0.9195402298850575, "percentage": 13.12, "elapsed_time": "1:14:28", "remaining_time": "8:12:58"} +{"current_steps": 525, "total_steps": 3962, "loss": 0.5628, "lr": 3.9874877686488197e-05, "epoch": 0.9283819628647215, "percentage": 13.25, "elapsed_time": "1:15:02", "remaining_time": "8:11:13"} +{"current_steps": 530, "total_steps": 3962, "loss": 0.5405, "lr": 3.986484292559877e-05, "epoch": 0.9372236958443855, "percentage": 13.38, "elapsed_time": "1:15:46", "remaining_time": "8:10:40"} +{"current_steps": 535, "total_steps": 3962, "loss": 0.5626, "lr": 3.9854422504246224e-05, "epoch": 0.9460654288240495, "percentage": 13.5, "elapsed_time": "1:16:28", "remaining_time": "8:09:55"} +{"current_steps": 540, "total_steps": 3962, "loss": 0.5616, "lr": 3.984361662473494e-05, "epoch": 0.9549071618037135, "percentage": 13.63, "elapsed_time": "1:17:16", "remaining_time": "8:09:43"} +{"current_steps": 545, "total_steps": 3962, "loss": 0.5737, "lr": 3.9832425496852644e-05, "epoch": 0.9637488947833776, "percentage": 13.76, "elapsed_time": "1:18:00", "remaining_time": "8:09:05"} +{"current_steps": 550, "total_steps": 3962, "loss": 0.5622, "lr": 3.982084933786639e-05, "epoch": 0.9725906277630415, "percentage": 13.88, "elapsed_time": "1:18:47", "remaining_time": "8:08:48"} +{"current_steps": 555, "total_steps": 3962, "loss": 0.523, "lr": 3.9808888372518285e-05, "epoch": 0.9814323607427056, "percentage": 14.01, "elapsed_time": "1:19:41", "remaining_time": "8:09:12"} +{"current_steps": 560, "total_steps": 3962, "loss": 0.561, "lr": 3.979654283302115e-05, "epoch": 0.9902740937223696, "percentage": 14.13, "elapsed_time": "1:20:33", "remaining_time": "8:09:20"} +{"current_steps": 565, "total_steps": 3962, "loss": 0.54, "lr": 3.9783812959054054e-05, "epoch": 0.9991158267020336, "percentage": 14.26, "elapsed_time": "1:21:15", "remaining_time": "8:08:35"} +{"current_steps": 570, "total_steps": 3962, "loss": 0.5341, "lr": 3.9770698997757564e-05, "epoch": 1.0070733863837311, "percentage": 14.39, "elapsed_time": "1:21:48", "remaining_time": "8:06:51"} +{"current_steps": 575, "total_steps": 3962, "loss": 0.5604, "lr": 3.975720120372905e-05, "epoch": 1.0159151193633953, "percentage": 14.51, "elapsed_time": "1:22:41", "remaining_time": "8:07:03"} +{"current_steps": 580, "total_steps": 3962, "loss": 0.5139, "lr": 3.974331983901766e-05, "epoch": 1.0247568523430592, "percentage": 14.64, "elapsed_time": "1:23:22", "remaining_time": "8:06:09"} +{"current_steps": 585, "total_steps": 3962, "loss": 0.5025, "lr": 3.972905517311929e-05, "epoch": 1.0335985853227232, "percentage": 14.77, "elapsed_time": "1:24:17", "remaining_time": "8:06:33"} +{"current_steps": 590, "total_steps": 3962, "loss": 0.503, "lr": 3.9714407482971335e-05, "epoch": 1.0424403183023874, "percentage": 14.89, "elapsed_time": "1:24:54", "remaining_time": "8:05:15"} +{"current_steps": 595, "total_steps": 3962, "loss": 0.5078, "lr": 3.969937705294728e-05, "epoch": 1.0512820512820513, "percentage": 15.02, "elapsed_time": "1:25:41", "remaining_time": "8:04:57"} +{"current_steps": 600, "total_steps": 3962, "loss": 0.5508, "lr": 3.968396417485125e-05, "epoch": 1.0601237842617153, "percentage": 15.14, "elapsed_time": "1:26:33", "remaining_time": "8:05:00"} +{"current_steps": 605, "total_steps": 3962, "loss": 0.5343, "lr": 3.966816914791226e-05, "epoch": 1.0689655172413792, "percentage": 15.27, "elapsed_time": "1:27:06", "remaining_time": "8:03:20"} +{"current_steps": 610, "total_steps": 3962, "loss": 0.5254, "lr": 3.965199227877846e-05, "epoch": 1.0778072502210434, "percentage": 15.4, "elapsed_time": "1:27:48", "remaining_time": "8:02:28"} +{"current_steps": 615, "total_steps": 3962, "loss": 0.5176, "lr": 3.963543388151117e-05, "epoch": 1.0866489832007074, "percentage": 15.52, "elapsed_time": "1:28:31", "remaining_time": "8:01:48"} +{"current_steps": 620, "total_steps": 3962, "loss": 0.5254, "lr": 3.9618494277578806e-05, "epoch": 1.0954907161803713, "percentage": 15.65, "elapsed_time": "1:29:22", "remaining_time": "8:01:45"} +{"current_steps": 625, "total_steps": 3962, "loss": 0.56, "lr": 3.960117379585057e-05, "epoch": 1.1043324491600353, "percentage": 15.77, "elapsed_time": "1:29:54", "remaining_time": "8:00:01"} +{"current_steps": 630, "total_steps": 3962, "loss": 0.4971, "lr": 3.958347277259015e-05, "epoch": 1.1131741821396994, "percentage": 15.9, "elapsed_time": "1:30:38", "remaining_time": "7:59:21"} +{"current_steps": 635, "total_steps": 3962, "loss": 0.5234, "lr": 3.956539155144912e-05, "epoch": 1.1220159151193634, "percentage": 16.03, "elapsed_time": "1:31:12", "remaining_time": "7:57:51"} +{"current_steps": 640, "total_steps": 3962, "loss": 0.516, "lr": 3.9546930483460326e-05, "epoch": 1.1308576480990273, "percentage": 16.15, "elapsed_time": "1:31:54", "remaining_time": "7:57:04"} +{"current_steps": 645, "total_steps": 3962, "loss": 0.5083, "lr": 3.952808992703102e-05, "epoch": 1.1396993810786915, "percentage": 16.28, "elapsed_time": "1:32:23", "remaining_time": "7:55:09"} +{"current_steps": 650, "total_steps": 3962, "loss": 0.5351, "lr": 3.9508870247935964e-05, "epoch": 1.1485411140583555, "percentage": 16.41, "elapsed_time": "1:33:06", "remaining_time": "7:54:27"} +{"current_steps": 655, "total_steps": 3962, "loss": 0.52, "lr": 3.948927181931024e-05, "epoch": 1.1573828470380194, "percentage": 16.53, "elapsed_time": "1:34:04", "remaining_time": "7:54:59"} +{"current_steps": 660, "total_steps": 3962, "loss": 0.5235, "lr": 3.94692950216421e-05, "epoch": 1.1662245800176834, "percentage": 16.66, "elapsed_time": "1:34:46", "remaining_time": "7:54:10"} +{"current_steps": 665, "total_steps": 3962, "loss": 0.5026, "lr": 3.944894024276552e-05, "epoch": 1.1750663129973475, "percentage": 16.78, "elapsed_time": "1:35:32", "remaining_time": "7:53:39"} +{"current_steps": 670, "total_steps": 3962, "loss": 0.5115, "lr": 3.9428207877852684e-05, "epoch": 1.1839080459770115, "percentage": 16.91, "elapsed_time": "1:36:15", "remaining_time": "7:52:56"} +{"current_steps": 675, "total_steps": 3962, "loss": 0.5465, "lr": 3.940709832940632e-05, "epoch": 1.1927497789566754, "percentage": 17.04, "elapsed_time": "1:36:44", "remaining_time": "7:51:08"} +{"current_steps": 680, "total_steps": 3962, "loss": 0.513, "lr": 3.938561200725189e-05, "epoch": 1.2015915119363396, "percentage": 17.16, "elapsed_time": "1:37:32", "remaining_time": "7:50:46"} +{"current_steps": 685, "total_steps": 3962, "loss": 0.5482, "lr": 3.9363749328529594e-05, "epoch": 1.2104332449160036, "percentage": 17.29, "elapsed_time": "1:38:11", "remaining_time": "7:49:42"} +{"current_steps": 690, "total_steps": 3962, "loss": 0.5537, "lr": 3.934151071768634e-05, "epoch": 1.2192749778956675, "percentage": 17.42, "elapsed_time": "1:38:48", "remaining_time": "7:48:34"} +{"current_steps": 695, "total_steps": 3962, "loss": 0.5482, "lr": 3.931889660646744e-05, "epoch": 1.2281167108753315, "percentage": 17.54, "elapsed_time": "1:39:32", "remaining_time": "7:47:54"} +{"current_steps": 700, "total_steps": 3962, "loss": 0.5415, "lr": 3.9295907433908264e-05, "epoch": 1.2369584438549956, "percentage": 17.67, "elapsed_time": "1:40:21", "remaining_time": "7:47:41"} +{"current_steps": 705, "total_steps": 3962, "loss": 0.5317, "lr": 3.9272543646325703e-05, "epoch": 1.2458001768346596, "percentage": 17.79, "elapsed_time": "1:41:07", "remaining_time": "7:47:10"} +{"current_steps": 710, "total_steps": 3962, "loss": 0.5281, "lr": 3.924880569730951e-05, "epoch": 1.2546419098143236, "percentage": 17.92, "elapsed_time": "1:41:58", "remaining_time": "7:47:05"} +{"current_steps": 715, "total_steps": 3962, "loss": 0.51, "lr": 3.9224694047713475e-05, "epoch": 1.2634836427939877, "percentage": 18.05, "elapsed_time": "1:42:33", "remaining_time": "7:45:46"} +{"current_steps": 720, "total_steps": 3962, "loss": 0.504, "lr": 3.920020916564652e-05, "epoch": 1.2723253757736517, "percentage": 18.17, "elapsed_time": "1:43:24", "remaining_time": "7:45:36"} +{"current_steps": 725, "total_steps": 3962, "loss": 0.57, "lr": 3.917535152646356e-05, "epoch": 1.2811671087533156, "percentage": 18.3, "elapsed_time": "1:44:14", "remaining_time": "7:45:26"} +{"current_steps": 730, "total_steps": 3962, "loss": 0.5579, "lr": 3.915012161275633e-05, "epoch": 1.2900088417329796, "percentage": 18.43, "elapsed_time": "1:44:59", "remaining_time": "7:44:51"} +{"current_steps": 735, "total_steps": 3962, "loss": 0.5253, "lr": 3.912451991434395e-05, "epoch": 1.2988505747126438, "percentage": 18.55, "elapsed_time": "1:45:30", "remaining_time": "7:43:14"} +{"current_steps": 740, "total_steps": 3962, "loss": 0.5043, "lr": 3.909854692826348e-05, "epoch": 1.3076923076923077, "percentage": 18.68, "elapsed_time": "1:46:09", "remaining_time": "7:42:13"} +{"current_steps": 745, "total_steps": 3962, "loss": 0.5015, "lr": 3.9072203158760215e-05, "epoch": 1.3165340406719717, "percentage": 18.8, "elapsed_time": "1:46:52", "remaining_time": "7:41:30"} +{"current_steps": 750, "total_steps": 3962, "loss": 0.5228, "lr": 3.904548911727793e-05, "epoch": 1.3253757736516358, "percentage": 18.93, "elapsed_time": "1:47:35", "remaining_time": "7:40:48"} +{"current_steps": 755, "total_steps": 3962, "loss": 0.4892, "lr": 3.901840532244897e-05, "epoch": 1.3342175066312998, "percentage": 19.06, "elapsed_time": "1:48:08", "remaining_time": "7:39:22"} +{"current_steps": 760, "total_steps": 3962, "loss": 0.4955, "lr": 3.899095230008411e-05, "epoch": 1.3430592396109637, "percentage": 19.18, "elapsed_time": "1:48:58", "remaining_time": "7:39:09"} +{"current_steps": 765, "total_steps": 3962, "loss": 0.5131, "lr": 3.896313058316242e-05, "epoch": 1.3519009725906277, "percentage": 19.31, "elapsed_time": "1:49:53", "remaining_time": "7:39:13"} +{"current_steps": 770, "total_steps": 3962, "loss": 0.5282, "lr": 3.8934940711820876e-05, "epoch": 1.3607427055702916, "percentage": 19.43, "elapsed_time": "1:50:46", "remaining_time": "7:39:12"} +{"current_steps": 775, "total_steps": 3962, "loss": 0.5301, "lr": 3.8906383233343886e-05, "epoch": 1.3695844385499558, "percentage": 19.56, "elapsed_time": "1:51:20", "remaining_time": "7:37:50"} +{"current_steps": 780, "total_steps": 3962, "loss": 0.5448, "lr": 3.887745870215268e-05, "epoch": 1.3784261715296198, "percentage": 19.69, "elapsed_time": "1:52:05", "remaining_time": "7:37:16"} +{"current_steps": 785, "total_steps": 3962, "loss": 0.5251, "lr": 3.884816767979449e-05, "epoch": 1.387267904509284, "percentage": 19.81, "elapsed_time": "1:52:46", "remaining_time": "7:36:26"} +{"current_steps": 790, "total_steps": 3962, "loss": 0.5549, "lr": 3.881851073493174e-05, "epoch": 1.396109637488948, "percentage": 19.94, "elapsed_time": "1:53:25", "remaining_time": "7:35:25"} +{"current_steps": 795, "total_steps": 3962, "loss": 0.4985, "lr": 3.878848844333091e-05, "epoch": 1.4049513704686118, "percentage": 20.07, "elapsed_time": "1:54:07", "remaining_time": "7:34:36"} +{"current_steps": 800, "total_steps": 3962, "loss": 0.517, "lr": 3.875810138785144e-05, "epoch": 1.4137931034482758, "percentage": 20.19, "elapsed_time": "1:55:00", "remaining_time": "7:34:35"} +{"current_steps": 805, "total_steps": 3962, "loss": 0.5369, "lr": 3.872735015843435e-05, "epoch": 1.4226348364279398, "percentage": 20.32, "elapsed_time": "1:55:44", "remaining_time": "7:33:56"} +{"current_steps": 810, "total_steps": 3962, "loss": 0.4849, "lr": 3.8696235352090827e-05, "epoch": 1.431476569407604, "percentage": 20.44, "elapsed_time": "1:56:29", "remaining_time": "7:33:18"} +{"current_steps": 815, "total_steps": 3962, "loss": 0.5431, "lr": 3.8664757572890624e-05, "epoch": 1.4403183023872679, "percentage": 20.57, "elapsed_time": "1:57:11", "remaining_time": "7:32:30"} +{"current_steps": 820, "total_steps": 3962, "loss": 0.5368, "lr": 3.863291743195031e-05, "epoch": 1.449160035366932, "percentage": 20.7, "elapsed_time": "1:57:54", "remaining_time": "7:31:46"} +{"current_steps": 825, "total_steps": 3962, "loss": 0.5517, "lr": 3.860071554742144e-05, "epoch": 1.458001768346596, "percentage": 20.82, "elapsed_time": "1:58:26", "remaining_time": "7:30:20"} +{"current_steps": 830, "total_steps": 3962, "loss": 0.538, "lr": 3.856815254447854e-05, "epoch": 1.46684350132626, "percentage": 20.95, "elapsed_time": "1:59:10", "remaining_time": "7:29:41"} +{"current_steps": 835, "total_steps": 3962, "loss": 0.4972, "lr": 3.853522905530698e-05, "epoch": 1.475685234305924, "percentage": 21.08, "elapsed_time": "1:59:51", "remaining_time": "7:28:53"} +{"current_steps": 840, "total_steps": 3962, "loss": 0.5515, "lr": 3.850194571909065e-05, "epoch": 1.4845269672855879, "percentage": 21.2, "elapsed_time": "2:00:42", "remaining_time": "7:28:39"} +{"current_steps": 845, "total_steps": 3962, "loss": 0.5241, "lr": 3.8468303181999625e-05, "epoch": 1.493368700265252, "percentage": 21.33, "elapsed_time": "2:01:16", "remaining_time": "7:27:20"} +{"current_steps": 850, "total_steps": 3962, "loss": 0.501, "lr": 3.843430209717758e-05, "epoch": 1.502210433244916, "percentage": 21.45, "elapsed_time": "2:01:53", "remaining_time": "7:26:16"} +{"current_steps": 855, "total_steps": 3962, "loss": 0.5055, "lr": 3.839994312472911e-05, "epoch": 1.5110521662245802, "percentage": 21.58, "elapsed_time": "2:02:24", "remaining_time": "7:24:50"} +{"current_steps": 860, "total_steps": 3962, "loss": 0.5333, "lr": 3.836522693170692e-05, "epoch": 1.5198938992042441, "percentage": 21.71, "elapsed_time": "2:03:08", "remaining_time": "7:24:11"} +{"current_steps": 865, "total_steps": 3962, "loss": 0.5195, "lr": 3.833015419209888e-05, "epoch": 1.528735632183908, "percentage": 21.83, "elapsed_time": "2:03:47", "remaining_time": "7:23:14"} +{"current_steps": 870, "total_steps": 3962, "loss": 0.5379, "lr": 3.8294725586814925e-05, "epoch": 1.537577365163572, "percentage": 21.96, "elapsed_time": "2:04:35", "remaining_time": "7:22:48"} +{"current_steps": 875, "total_steps": 3962, "loss": 0.4895, "lr": 3.8258941803673845e-05, "epoch": 1.546419098143236, "percentage": 22.08, "elapsed_time": "2:05:13", "remaining_time": "7:21:49"} +{"current_steps": 880, "total_steps": 3962, "loss": 0.5278, "lr": 3.822280353738995e-05, "epoch": 1.5552608311229, "percentage": 22.21, "elapsed_time": "2:05:45", "remaining_time": "7:20:27"} +{"current_steps": 885, "total_steps": 3962, "loss": 0.5183, "lr": 3.818631148955954e-05, "epoch": 1.564102564102564, "percentage": 22.34, "elapsed_time": "2:06:31", "remaining_time": "7:19:53"} +{"current_steps": 890, "total_steps": 3962, "loss": 0.5016, "lr": 3.814946636864732e-05, "epoch": 1.5729442970822283, "percentage": 22.46, "elapsed_time": "2:07:13", "remaining_time": "7:19:10"} +{"current_steps": 895, "total_steps": 3962, "loss": 0.5002, "lr": 3.8112268889972635e-05, "epoch": 1.5817860300618922, "percentage": 22.59, "elapsed_time": "2:07:52", "remaining_time": "7:18:13"} +{"current_steps": 900, "total_steps": 3962, "loss": 0.5247, "lr": 3.807471977569558e-05, "epoch": 1.5906277630415562, "percentage": 22.72, "elapsed_time": "2:08:26", "remaining_time": "7:16:58"} +{"current_steps": 905, "total_steps": 3962, "loss": 0.5339, "lr": 3.803681975480298e-05, "epoch": 1.5994694960212201, "percentage": 22.84, "elapsed_time": "2:09:07", "remaining_time": "7:16:08"} +{"current_steps": 910, "total_steps": 3962, "loss": 0.5043, "lr": 3.799856956309424e-05, "epoch": 1.608311229000884, "percentage": 22.97, "elapsed_time": "2:09:48", "remaining_time": "7:15:22"} +{"current_steps": 915, "total_steps": 3962, "loss": 0.4945, "lr": 3.7959969943167064e-05, "epoch": 1.617152961980548, "percentage": 23.09, "elapsed_time": "2:10:29", "remaining_time": "7:14:32"} +{"current_steps": 920, "total_steps": 3962, "loss": 0.513, "lr": 3.7921021644403024e-05, "epoch": 1.6259946949602122, "percentage": 23.22, "elapsed_time": "2:11:01", "remaining_time": "7:13:12"} +{"current_steps": 925, "total_steps": 3962, "loss": 0.4882, "lr": 3.788172542295303e-05, "epoch": 1.6348364279398764, "percentage": 23.35, "elapsed_time": "2:11:28", "remaining_time": "7:11:40"} +{"current_steps": 930, "total_steps": 3962, "loss": 0.4901, "lr": 3.784208204172262e-05, "epoch": 1.6436781609195403, "percentage": 23.47, "elapsed_time": "2:11:56", "remaining_time": "7:10:10"} +{"current_steps": 935, "total_steps": 3962, "loss": 0.5329, "lr": 3.7802092270357196e-05, "epoch": 1.6525198938992043, "percentage": 23.6, "elapsed_time": "2:12:39", "remaining_time": "7:09:29"} +{"current_steps": 940, "total_steps": 3962, "loss": 0.491, "lr": 3.7761756885227046e-05, "epoch": 1.6613616268788682, "percentage": 23.73, "elapsed_time": "2:13:42", "remaining_time": "7:09:50"} +{"current_steps": 945, "total_steps": 3962, "loss": 0.5167, "lr": 3.772107666941226e-05, "epoch": 1.6702033598585322, "percentage": 23.85, "elapsed_time": "2:14:31", "remaining_time": "7:09:29"} +{"current_steps": 950, "total_steps": 3962, "loss": 0.5639, "lr": 3.768005241268757e-05, "epoch": 1.6790450928381961, "percentage": 23.98, "elapsed_time": "2:15:08", "remaining_time": "7:08:28"} +{"current_steps": 955, "total_steps": 3962, "loss": 0.5478, "lr": 3.7638684911506993e-05, "epoch": 1.6878868258178603, "percentage": 24.1, "elapsed_time": "2:15:44", "remaining_time": "7:07:24"} +{"current_steps": 960, "total_steps": 3962, "loss": 0.4773, "lr": 3.7596974968988366e-05, "epoch": 1.6967285587975243, "percentage": 24.23, "elapsed_time": "2:16:37", "remaining_time": "7:07:14"} +{"current_steps": 965, "total_steps": 3962, "loss": 0.5122, "lr": 3.755492339489775e-05, "epoch": 1.7055702917771884, "percentage": 24.36, "elapsed_time": "2:17:38", "remaining_time": "7:07:28"} +{"current_steps": 970, "total_steps": 3962, "loss": 0.4883, "lr": 3.751253100563373e-05, "epoch": 1.7144120247568524, "percentage": 24.48, "elapsed_time": "2:18:15", "remaining_time": "7:06:26"} +{"current_steps": 975, "total_steps": 3962, "loss": 0.492, "lr": 3.746979862421154e-05, "epoch": 1.7232537577365163, "percentage": 24.61, "elapsed_time": "2:19:00", "remaining_time": "7:05:51"} +{"current_steps": 980, "total_steps": 3962, "loss": 0.5171, "lr": 3.742672708024711e-05, "epoch": 1.7320954907161803, "percentage": 24.73, "elapsed_time": "2:19:42", "remaining_time": "7:05:05"} +{"current_steps": 985, "total_steps": 3962, "loss": 0.5151, "lr": 3.7383317209940936e-05, "epoch": 1.7409372236958442, "percentage": 24.86, "elapsed_time": "2:20:20", "remaining_time": "7:04:10"} +{"current_steps": 990, "total_steps": 3962, "loss": 0.5084, "lr": 3.7339569856061864e-05, "epoch": 1.7497789566755084, "percentage": 24.99, "elapsed_time": "2:21:01", "remaining_time": "7:03:21"} +{"current_steps": 995, "total_steps": 3962, "loss": 0.509, "lr": 3.7295485867930715e-05, "epoch": 1.7586206896551724, "percentage": 25.11, "elapsed_time": "2:21:43", "remaining_time": "7:02:36"} +{"current_steps": 1000, "total_steps": 3962, "loss": 0.5291, "lr": 3.72510661014038e-05, "epoch": 1.7674624226348365, "percentage": 25.24, "elapsed_time": "2:22:18", "remaining_time": "7:01:31"} +{"current_steps": 1005, "total_steps": 3962, "loss": 0.5058, "lr": 3.720631141885633e-05, "epoch": 1.7763041556145005, "percentage": 25.37, "elapsed_time": "2:23:12", "remaining_time": "7:01:21"} +{"current_steps": 1010, "total_steps": 3962, "loss": 0.4809, "lr": 3.716122268916561e-05, "epoch": 1.7851458885941645, "percentage": 25.49, "elapsed_time": "2:23:42", "remaining_time": "7:00:02"} +{"current_steps": 1015, "total_steps": 3962, "loss": 0.5089, "lr": 3.711580078769424e-05, "epoch": 1.7939876215738284, "percentage": 25.62, "elapsed_time": "2:24:29", "remaining_time": "6:59:30"} +{"current_steps": 1020, "total_steps": 3962, "loss": 0.4978, "lr": 3.707004659627308e-05, "epoch": 1.8028293545534924, "percentage": 25.74, "elapsed_time": "2:25:11", "remaining_time": "6:58:46"} +{"current_steps": 1025, "total_steps": 3962, "loss": 0.5847, "lr": 3.702396100318414e-05, "epoch": 1.8116710875331565, "percentage": 25.87, "elapsed_time": "2:25:49", "remaining_time": "6:57:51"} +{"current_steps": 1030, "total_steps": 3962, "loss": 0.5644, "lr": 3.697754490314335e-05, "epoch": 1.8205128205128205, "percentage": 26.0, "elapsed_time": "2:26:26", "remaining_time": "6:56:52"} +{"current_steps": 1035, "total_steps": 3962, "loss": 0.4957, "lr": 3.693079919728314e-05, "epoch": 1.8293545534924847, "percentage": 26.12, "elapsed_time": "2:27:12", "remaining_time": "6:56:18"} +{"current_steps": 1040, "total_steps": 3962, "loss": 0.5339, "lr": 3.688372479313503e-05, "epoch": 1.8381962864721486, "percentage": 26.25, "elapsed_time": "2:27:53", "remaining_time": "6:55:30"} +{"current_steps": 1045, "total_steps": 3962, "loss": 0.5628, "lr": 3.683632260461191e-05, "epoch": 1.8470380194518126, "percentage": 26.38, "elapsed_time": "2:28:34", "remaining_time": "6:54:45"} +{"current_steps": 1050, "total_steps": 3962, "loss": 0.4787, "lr": 3.6788593551990395e-05, "epoch": 1.8558797524314765, "percentage": 26.5, "elapsed_time": "2:29:20", "remaining_time": "6:54:10"} +{"current_steps": 1055, "total_steps": 3962, "loss": 0.5058, "lr": 3.674053856189289e-05, "epoch": 1.8647214854111405, "percentage": 26.63, "elapsed_time": "2:30:11", "remaining_time": "6:53:49"} +{"current_steps": 1060, "total_steps": 3962, "loss": 0.5145, "lr": 3.66921585672696e-05, "epoch": 1.8735632183908046, "percentage": 26.75, "elapsed_time": "2:30:41", "remaining_time": "6:52:32"} +{"current_steps": 1065, "total_steps": 3962, "loss": 0.4853, "lr": 3.664345450738048e-05, "epoch": 1.8824049513704686, "percentage": 26.88, "elapsed_time": "2:31:15", "remaining_time": "6:51:27"} +{"current_steps": 1070, "total_steps": 3962, "loss": 0.5163, "lr": 3.659442732777694e-05, "epoch": 1.8912466843501328, "percentage": 27.01, "elapsed_time": "2:31:51", "remaining_time": "6:50:27"} +{"current_steps": 1075, "total_steps": 3962, "loss": 0.5004, "lr": 3.6545077980283516e-05, "epoch": 1.9000884173297967, "percentage": 27.13, "elapsed_time": "2:32:29", "remaining_time": "6:49:32"} +{"current_steps": 1080, "total_steps": 3962, "loss": 0.5095, "lr": 3.649540742297937e-05, "epoch": 1.9089301503094607, "percentage": 27.26, "elapsed_time": "2:33:08", "remaining_time": "6:48:40"} +{"current_steps": 1085, "total_steps": 3962, "loss": 0.4988, "lr": 3.6445416620179715e-05, "epoch": 1.9177718832891246, "percentage": 27.39, "elapsed_time": "2:33:46", "remaining_time": "6:47:44"} +{"current_steps": 1090, "total_steps": 3962, "loss": 0.5155, "lr": 3.6395106542417066e-05, "epoch": 1.9266136162687886, "percentage": 27.51, "elapsed_time": "2:34:23", "remaining_time": "6:46:48"} +{"current_steps": 1095, "total_steps": 3962, "loss": 0.4981, "lr": 3.6344478166422435e-05, "epoch": 1.9354553492484527, "percentage": 27.64, "elapsed_time": "2:35:19", "remaining_time": "6:46:41"} +{"current_steps": 1100, "total_steps": 3962, "loss": 0.482, "lr": 3.6293532475106325e-05, "epoch": 1.9442970822281167, "percentage": 27.76, "elapsed_time": "2:36:02", "remaining_time": "6:45:59"} +{"current_steps": 1105, "total_steps": 3962, "loss": 0.5106, "lr": 3.6242270457539695e-05, "epoch": 1.9531388152077809, "percentage": 27.89, "elapsed_time": "2:36:47", "remaining_time": "6:45:24"} +{"current_steps": 1110, "total_steps": 3962, "loss": 0.4966, "lr": 3.6190693108934685e-05, "epoch": 1.9619805481874448, "percentage": 28.02, "elapsed_time": "2:37:20", "remaining_time": "6:44:15"} +{"current_steps": 1115, "total_steps": 3962, "loss": 0.5274, "lr": 3.613880143062539e-05, "epoch": 1.9708222811671088, "percentage": 28.14, "elapsed_time": "2:37:58", "remaining_time": "6:43:21"} +{"current_steps": 1120, "total_steps": 3962, "loss": 0.544, "lr": 3.6086596430048355e-05, "epoch": 1.9796640141467727, "percentage": 28.27, "elapsed_time": "2:38:28", "remaining_time": "6:42:07"} +{"current_steps": 1125, "total_steps": 3962, "loss": 0.4664, "lr": 3.603407912072303e-05, "epoch": 1.9885057471264367, "percentage": 28.39, "elapsed_time": "2:39:03", "remaining_time": "6:41:07"} +{"current_steps": 1130, "total_steps": 3962, "loss": 0.4927, "lr": 3.598125052223209e-05, "epoch": 1.9973474801061006, "percentage": 28.52, "elapsed_time": "2:39:42", "remaining_time": "6:40:15"} +{"current_steps": 1135, "total_steps": 3962, "loss": 0.461, "lr": 3.592811166020166e-05, "epoch": 2.0053050397877983, "percentage": 28.65, "elapsed_time": "2:40:20", "remaining_time": "6:39:22"} +{"current_steps": 1140, "total_steps": 3962, "loss": 0.4984, "lr": 3.5874663566281386e-05, "epoch": 2.0141467727674622, "percentage": 28.77, "elapsed_time": "2:41:01", "remaining_time": "6:38:36"} +{"current_steps": 1145, "total_steps": 3962, "loss": 0.4376, "lr": 3.582090727812441e-05, "epoch": 2.0229885057471266, "percentage": 28.9, "elapsed_time": "2:41:47", "remaining_time": "6:38:03"} +{"current_steps": 1150, "total_steps": 3962, "loss": 0.4825, "lr": 3.576684383936721e-05, "epoch": 2.0318302387267906, "percentage": 29.03, "elapsed_time": "2:42:27", "remaining_time": "6:37:14"} +{"current_steps": 1155, "total_steps": 3962, "loss": 0.4354, "lr": 3.571247429960939e-05, "epoch": 2.0406719717064545, "percentage": 29.15, "elapsed_time": "2:43:06", "remaining_time": "6:36:23"} +{"current_steps": 1160, "total_steps": 3962, "loss": 0.4842, "lr": 3.5657799714393226e-05, "epoch": 2.0495137046861185, "percentage": 29.28, "elapsed_time": "2:43:40", "remaining_time": "6:35:22"} +{"current_steps": 1165, "total_steps": 3962, "loss": 0.4675, "lr": 3.560282114518324e-05, "epoch": 2.0583554376657824, "percentage": 29.4, "elapsed_time": "2:44:17", "remaining_time": "6:34:27"} +{"current_steps": 1170, "total_steps": 3962, "loss": 0.4865, "lr": 3.554753965934556e-05, "epoch": 2.0671971706454464, "percentage": 29.53, "elapsed_time": "2:44:49", "remaining_time": "6:33:20"} +{"current_steps": 1175, "total_steps": 3962, "loss": 0.5007, "lr": 3.5491956330127206e-05, "epoch": 2.0760389036251103, "percentage": 29.66, "elapsed_time": "2:45:27", "remaining_time": "6:32:27"} +{"current_steps": 1180, "total_steps": 3962, "loss": 0.4824, "lr": 3.543607223663524e-05, "epoch": 2.0848806366047747, "percentage": 29.78, "elapsed_time": "2:46:06", "remaining_time": "6:31:36"} +{"current_steps": 1185, "total_steps": 3962, "loss": 0.4959, "lr": 3.537988846381585e-05, "epoch": 2.0937223695844387, "percentage": 29.91, "elapsed_time": "2:46:54", "remaining_time": "6:31:08"} +{"current_steps": 1190, "total_steps": 3962, "loss": 0.5028, "lr": 3.532340610243325e-05, "epoch": 2.1025641025641026, "percentage": 30.04, "elapsed_time": "2:47:31", "remaining_time": "6:30:13"} +{"current_steps": 1195, "total_steps": 3962, "loss": 0.4576, "lr": 3.526662624904852e-05, "epoch": 2.1114058355437666, "percentage": 30.16, "elapsed_time": "2:48:13", "remaining_time": "6:29:30"} +{"current_steps": 1200, "total_steps": 3962, "loss": 0.4621, "lr": 3.5209550005998314e-05, "epoch": 2.1202475685234305, "percentage": 30.29, "elapsed_time": "2:48:54", "remaining_time": "6:28:47"} +{"current_steps": 1205, "total_steps": 3962, "loss": 0.5064, "lr": 3.515217848137347e-05, "epoch": 2.1290893015030945, "percentage": 30.41, "elapsed_time": "2:49:36", "remaining_time": "6:28:03"} +{"current_steps": 1210, "total_steps": 3962, "loss": 0.4645, "lr": 3.509451278899748e-05, "epoch": 2.1379310344827585, "percentage": 30.54, "elapsed_time": "2:50:25", "remaining_time": "6:27:37"} +{"current_steps": 1215, "total_steps": 3962, "loss": 0.4721, "lr": 3.503655404840488e-05, "epoch": 2.146772767462423, "percentage": 30.67, "elapsed_time": "2:51:03", "remaining_time": "6:26:44"} +{"current_steps": 1220, "total_steps": 3962, "loss": 0.4882, "lr": 3.497830338481949e-05, "epoch": 2.155614500442087, "percentage": 30.79, "elapsed_time": "2:51:34", "remaining_time": "6:25:36"} +{"current_steps": 1225, "total_steps": 3962, "loss": 0.4497, "lr": 3.491976192913262e-05, "epoch": 2.1644562334217508, "percentage": 30.92, "elapsed_time": "2:52:17", "remaining_time": "6:24:56"} +{"current_steps": 1230, "total_steps": 3962, "loss": 0.4413, "lr": 3.486093081788106e-05, "epoch": 2.1732979664014147, "percentage": 31.04, "elapsed_time": "2:52:58", "remaining_time": "6:24:12"} +{"current_steps": 1235, "total_steps": 3962, "loss": 0.5526, "lr": 3.480181119322504e-05, "epoch": 2.1821396993810787, "percentage": 31.17, "elapsed_time": "2:53:41", "remaining_time": "6:23:30"} +{"current_steps": 1240, "total_steps": 3962, "loss": 0.4818, "lr": 3.474240420292606e-05, "epoch": 2.1909814323607426, "percentage": 31.3, "elapsed_time": "2:54:28", "remaining_time": "6:22:59"} +{"current_steps": 1245, "total_steps": 3962, "loss": 0.4567, "lr": 3.4682711000324586e-05, "epoch": 2.1998231653404066, "percentage": 31.42, "elapsed_time": "2:55:15", "remaining_time": "6:22:28"} +{"current_steps": 1250, "total_steps": 3962, "loss": 0.4573, "lr": 3.462273274431769e-05, "epoch": 2.2086648983200705, "percentage": 31.55, "elapsed_time": "2:56:08", "remaining_time": "6:22:09"} +{"current_steps": 1255, "total_steps": 3962, "loss": 0.4824, "lr": 3.456247059933653e-05, "epoch": 2.217506631299735, "percentage": 31.68, "elapsed_time": "2:56:54", "remaining_time": "6:21:35"} +{"current_steps": 1260, "total_steps": 3962, "loss": 0.5275, "lr": 3.450192573532373e-05, "epoch": 2.226348364279399, "percentage": 31.8, "elapsed_time": "2:57:27", "remaining_time": "6:20:33"} +{"current_steps": 1265, "total_steps": 3962, "loss": 0.4654, "lr": 3.444109932771072e-05, "epoch": 2.235190097259063, "percentage": 31.93, "elapsed_time": "2:58:28", "remaining_time": "6:20:30"} +{"current_steps": 1270, "total_steps": 3962, "loss": 0.5126, "lr": 3.4379992557394846e-05, "epoch": 2.2440318302387268, "percentage": 32.05, "elapsed_time": "2:59:19", "remaining_time": "6:20:05"} +{"current_steps": 1275, "total_steps": 3962, "loss": 0.5167, "lr": 3.4318606610716484e-05, "epoch": 2.2528735632183907, "percentage": 32.18, "elapsed_time": "3:00:00", "remaining_time": "6:19:21"} +{"current_steps": 1280, "total_steps": 3962, "loss": 0.4922, "lr": 3.4256942679436015e-05, "epoch": 2.2617152961980547, "percentage": 32.31, "elapsed_time": "3:00:47", "remaining_time": "6:18:48"} +{"current_steps": 1285, "total_steps": 3962, "loss": 0.4754, "lr": 3.419500196071067e-05, "epoch": 2.270557029177719, "percentage": 32.43, "elapsed_time": "3:01:29", "remaining_time": "6:18:05"} +{"current_steps": 1290, "total_steps": 3962, "loss": 0.4993, "lr": 3.413278565707128e-05, "epoch": 2.279398762157383, "percentage": 32.56, "elapsed_time": "3:02:22", "remaining_time": "6:17:45"} +{"current_steps": 1295, "total_steps": 3962, "loss": 0.4577, "lr": 3.407029497639896e-05, "epoch": 2.288240495137047, "percentage": 32.69, "elapsed_time": "3:03:04", "remaining_time": "6:17:01"} +{"current_steps": 1300, "total_steps": 3962, "loss": 0.5239, "lr": 3.400753113190164e-05, "epoch": 2.297082228116711, "percentage": 32.81, "elapsed_time": "3:03:44", "remaining_time": "6:16:15"} +{"current_steps": 1305, "total_steps": 3962, "loss": 0.475, "lr": 3.394449534209049e-05, "epoch": 2.305923961096375, "percentage": 32.94, "elapsed_time": "3:04:30", "remaining_time": "6:15:39"} +{"current_steps": 1310, "total_steps": 3962, "loss": 0.4645, "lr": 3.388118883075632e-05, "epoch": 2.314765694076039, "percentage": 33.06, "elapsed_time": "3:05:19", "remaining_time": "6:15:10"} +{"current_steps": 1315, "total_steps": 3962, "loss": 0.4587, "lr": 3.381761282694576e-05, "epoch": 2.323607427055703, "percentage": 33.19, "elapsed_time": "3:05:59", "remaining_time": "6:14:22"} +{"current_steps": 1320, "total_steps": 3962, "loss": 0.474, "lr": 3.375376856493744e-05, "epoch": 2.3324491600353667, "percentage": 33.32, "elapsed_time": "3:06:44", "remaining_time": "6:13:46"} +{"current_steps": 1325, "total_steps": 3962, "loss": 0.4457, "lr": 3.368965728421802e-05, "epoch": 2.341290893015031, "percentage": 33.44, "elapsed_time": "3:07:14", "remaining_time": "6:12:38"} +{"current_steps": 1330, "total_steps": 3962, "loss": 0.4635, "lr": 3.362528022945811e-05, "epoch": 2.350132625994695, "percentage": 33.57, "elapsed_time": "3:07:47", "remaining_time": "6:11:37"} +{"current_steps": 1335, "total_steps": 3962, "loss": 0.481, "lr": 3.3560638650488116e-05, "epoch": 2.358974358974359, "percentage": 33.7, "elapsed_time": "3:08:27", "remaining_time": "6:10:49"} +{"current_steps": 1340, "total_steps": 3962, "loss": 0.4947, "lr": 3.3495733802273973e-05, "epoch": 2.367816091954023, "percentage": 33.82, "elapsed_time": "3:08:56", "remaining_time": "6:09:43"} +{"current_steps": 1345, "total_steps": 3962, "loss": 0.4769, "lr": 3.3430566944892797e-05, "epoch": 2.376657824933687, "percentage": 33.95, "elapsed_time": "3:09:30", "remaining_time": "6:08:43"} +{"current_steps": 1350, "total_steps": 3962, "loss": 0.5036, "lr": 3.3365139343508394e-05, "epoch": 2.385499557913351, "percentage": 34.07, "elapsed_time": "3:10:19", "remaining_time": "6:08:14"} +{"current_steps": 1355, "total_steps": 3962, "loss": 0.4645, "lr": 3.329945226834672e-05, "epoch": 2.394341290893015, "percentage": 34.2, "elapsed_time": "3:11:10", "remaining_time": "6:07:48"} +{"current_steps": 1360, "total_steps": 3962, "loss": 0.4951, "lr": 3.3233506994671226e-05, "epoch": 2.4031830238726792, "percentage": 34.33, "elapsed_time": "3:11:53", "remaining_time": "6:07:08"} +{"current_steps": 1365, "total_steps": 3962, "loss": 0.4464, "lr": 3.316730480275804e-05, "epoch": 2.412024756852343, "percentage": 34.45, "elapsed_time": "3:12:35", "remaining_time": "6:06:24"} +{"current_steps": 1370, "total_steps": 3962, "loss": 0.4913, "lr": 3.3100846977871205e-05, "epoch": 2.420866489832007, "percentage": 34.58, "elapsed_time": "3:13:24", "remaining_time": "6:05:54"} +{"current_steps": 1375, "total_steps": 3962, "loss": 0.4994, "lr": 3.303413481023767e-05, "epoch": 2.429708222811671, "percentage": 34.7, "elapsed_time": "3:14:06", "remaining_time": "6:05:13"} +{"current_steps": 1380, "total_steps": 3962, "loss": 0.4784, "lr": 3.296716959502222e-05, "epoch": 2.438549955791335, "percentage": 34.83, "elapsed_time": "3:14:47", "remaining_time": "6:04:26"} +{"current_steps": 1385, "total_steps": 3962, "loss": 0.4922, "lr": 3.2899952632302406e-05, "epoch": 2.447391688770999, "percentage": 34.96, "elapsed_time": "3:15:26", "remaining_time": "6:03:38"} +{"current_steps": 1390, "total_steps": 3962, "loss": 0.4593, "lr": 3.2832485227043224e-05, "epoch": 2.456233421750663, "percentage": 35.08, "elapsed_time": "3:16:10", "remaining_time": "6:02:59"} +{"current_steps": 1395, "total_steps": 3962, "loss": 0.4621, "lr": 3.276476868907185e-05, "epoch": 2.465075154730327, "percentage": 35.21, "elapsed_time": "3:17:01", "remaining_time": "6:02:33"} +{"current_steps": 1400, "total_steps": 3962, "loss": 0.497, "lr": 3.2696804333052134e-05, "epoch": 2.4739168877099913, "percentage": 35.34, "elapsed_time": "3:18:03", "remaining_time": "6:02:27"} +{"current_steps": 1405, "total_steps": 3962, "loss": 0.5055, "lr": 3.2628593478459166e-05, "epoch": 2.4827586206896552, "percentage": 35.46, "elapsed_time": "3:18:44", "remaining_time": "6:01:41"} +{"current_steps": 1410, "total_steps": 3962, "loss": 0.4718, "lr": 3.256013744955359e-05, "epoch": 2.491600353669319, "percentage": 35.59, "elapsed_time": "3:19:16", "remaining_time": "6:00:40"} +{"current_steps": 1415, "total_steps": 3962, "loss": 0.4583, "lr": 3.249143757535593e-05, "epoch": 2.500442086648983, "percentage": 35.71, "elapsed_time": "3:20:00", "remaining_time": "6:00:00"} +{"current_steps": 1420, "total_steps": 3962, "loss": 0.4994, "lr": 3.242249518962075e-05, "epoch": 2.509283819628647, "percentage": 35.84, "elapsed_time": "3:20:44", "remaining_time": "5:59:21"} +{"current_steps": 1425, "total_steps": 3962, "loss": 0.4564, "lr": 3.2353311630810824e-05, "epoch": 2.5181255526083115, "percentage": 35.97, "elapsed_time": "3:21:30", "remaining_time": "5:58:45"} +{"current_steps": 1430, "total_steps": 3962, "loss": 0.4889, "lr": 3.2283888242071084e-05, "epoch": 2.5269672855879755, "percentage": 36.09, "elapsed_time": "3:22:06", "remaining_time": "5:57:52"} +{"current_steps": 1435, "total_steps": 3962, "loss": 0.4679, "lr": 3.221422637120259e-05, "epoch": 2.5358090185676394, "percentage": 36.22, "elapsed_time": "3:22:45", "remaining_time": "5:57:02"} +{"current_steps": 1440, "total_steps": 3962, "loss": 0.454, "lr": 3.2144327370636346e-05, "epoch": 2.5446507515473034, "percentage": 36.35, "elapsed_time": "3:23:25", "remaining_time": "5:56:16"} +{"current_steps": 1445, "total_steps": 3962, "loss": 0.4613, "lr": 3.2074192597407035e-05, "epoch": 2.5534924845269673, "percentage": 36.47, "elapsed_time": "3:24:09", "remaining_time": "5:55:36"} +{"current_steps": 1450, "total_steps": 3962, "loss": 0.4492, "lr": 3.200382341312669e-05, "epoch": 2.5623342175066313, "percentage": 36.6, "elapsed_time": "3:24:44", "remaining_time": "5:54:41"} +{"current_steps": 1455, "total_steps": 3962, "loss": 0.4892, "lr": 3.193322118395825e-05, "epoch": 2.571175950486295, "percentage": 36.72, "elapsed_time": "3:25:17", "remaining_time": "5:53:44"} +{"current_steps": 1460, "total_steps": 3962, "loss": 0.4779, "lr": 3.1862387280589035e-05, "epoch": 2.580017683465959, "percentage": 36.85, "elapsed_time": "3:25:53", "remaining_time": "5:52:49"} +{"current_steps": 1465, "total_steps": 3962, "loss": 0.4415, "lr": 3.179132307820415e-05, "epoch": 2.588859416445623, "percentage": 36.98, "elapsed_time": "3:26:32", "remaining_time": "5:52:01"} +{"current_steps": 1470, "total_steps": 3962, "loss": 0.4591, "lr": 3.1720029956459765e-05, "epoch": 2.5977011494252875, "percentage": 37.1, "elapsed_time": "3:27:18", "remaining_time": "5:51:26"} +{"current_steps": 1475, "total_steps": 3962, "loss": 0.4262, "lr": 3.1648509299456354e-05, "epoch": 2.6065428824049515, "percentage": 37.23, "elapsed_time": "3:27:58", "remaining_time": "5:50:40"} +{"current_steps": 1480, "total_steps": 3962, "loss": 0.5071, "lr": 3.15767624957118e-05, "epoch": 2.6153846153846154, "percentage": 37.35, "elapsed_time": "3:28:40", "remaining_time": "5:49:57"} +{"current_steps": 1485, "total_steps": 3962, "loss": 0.4698, "lr": 3.150479093813444e-05, "epoch": 2.6242263483642794, "percentage": 37.48, "elapsed_time": "3:29:17", "remaining_time": "5:49:06"} +{"current_steps": 1490, "total_steps": 3962, "loss": 0.4813, "lr": 3.143259602399605e-05, "epoch": 2.6330680813439433, "percentage": 37.61, "elapsed_time": "3:30:01", "remaining_time": "5:48:26"} +{"current_steps": 1495, "total_steps": 3962, "loss": 0.4572, "lr": 3.13601791549047e-05, "epoch": 2.6419098143236073, "percentage": 37.73, "elapsed_time": "3:30:38", "remaining_time": "5:47:35"} +{"current_steps": 1500, "total_steps": 3962, "loss": 0.4732, "lr": 3.128754173677753e-05, "epoch": 2.6507515473032717, "percentage": 37.86, "elapsed_time": "3:31:11", "remaining_time": "5:46:37"} +{"current_steps": 1505, "total_steps": 3962, "loss": 0.4793, "lr": 3.121468517981348e-05, "epoch": 2.6595932802829356, "percentage": 37.99, "elapsed_time": "3:32:27", "remaining_time": "5:46:51"} +{"current_steps": 1510, "total_steps": 3962, "loss": 0.4586, "lr": 3.1141610898465886e-05, "epoch": 2.6684350132625996, "percentage": 38.11, "elapsed_time": "3:33:06", "remaining_time": "5:46:02"} +{"current_steps": 1515, "total_steps": 3962, "loss": 0.4882, "lr": 3.106832031141505e-05, "epoch": 2.6772767462422635, "percentage": 38.24, "elapsed_time": "3:33:29", "remaining_time": "5:44:49"} +{"current_steps": 1520, "total_steps": 3962, "loss": 0.4694, "lr": 3.099481484154066e-05, "epoch": 2.6861184792219275, "percentage": 38.36, "elapsed_time": "3:34:13", "remaining_time": "5:44:10"} +{"current_steps": 1525, "total_steps": 3962, "loss": 0.47, "lr": 3.092109591589421e-05, "epoch": 2.6949602122015914, "percentage": 38.49, "elapsed_time": "3:34:43", "remaining_time": "5:43:07"} +{"current_steps": 1530, "total_steps": 3962, "loss": 0.4691, "lr": 3.084716496567125e-05, "epoch": 2.7038019451812554, "percentage": 38.62, "elapsed_time": "3:35:27", "remaining_time": "5:42:29"} +{"current_steps": 1535, "total_steps": 3962, "loss": 0.5029, "lr": 3.0773023426183646e-05, "epoch": 2.7126436781609193, "percentage": 38.74, "elapsed_time": "3:36:16", "remaining_time": "5:41:56"} +{"current_steps": 1540, "total_steps": 3962, "loss": 0.4813, "lr": 3.069867273683166e-05, "epoch": 2.7214854111405833, "percentage": 38.87, "elapsed_time": "3:36:52", "remaining_time": "5:41:05"} +{"current_steps": 1545, "total_steps": 3962, "loss": 0.4961, "lr": 3.062411434107607e-05, "epoch": 2.7303271441202477, "percentage": 39.0, "elapsed_time": "3:37:30", "remaining_time": "5:40:16"} +{"current_steps": 1550, "total_steps": 3962, "loss": 0.4807, "lr": 3.0549349686410086e-05, "epoch": 2.7391688770999116, "percentage": 39.12, "elapsed_time": "3:38:10", "remaining_time": "5:39:29"} +{"current_steps": 1555, "total_steps": 3962, "loss": 0.4601, "lr": 3.0474380224331292e-05, "epoch": 2.7480106100795756, "percentage": 39.25, "elapsed_time": "3:38:50", "remaining_time": "5:38:44"} +{"current_steps": 1560, "total_steps": 3962, "loss": 0.452, "lr": 3.039920741031342e-05, "epoch": 2.7568523430592395, "percentage": 39.37, "elapsed_time": "3:39:30", "remaining_time": "5:37:58"} +{"current_steps": 1565, "total_steps": 3962, "loss": 0.477, "lr": 3.0323832703778168e-05, "epoch": 2.7656940760389035, "percentage": 39.5, "elapsed_time": "3:40:12", "remaining_time": "5:37:15"} +{"current_steps": 1570, "total_steps": 3962, "loss": 0.4784, "lr": 3.024825756806677e-05, "epoch": 2.774535809018568, "percentage": 39.63, "elapsed_time": "3:40:52", "remaining_time": "5:36:30"} +{"current_steps": 1575, "total_steps": 3962, "loss": 0.4674, "lr": 3.017248347041168e-05, "epoch": 2.783377541998232, "percentage": 39.75, "elapsed_time": "3:41:27", "remaining_time": "5:35:37"} +{"current_steps": 1580, "total_steps": 3962, "loss": 0.476, "lr": 3.0096511881908007e-05, "epoch": 2.792219274977896, "percentage": 39.88, "elapsed_time": "3:42:07", "remaining_time": "5:34:53"} +{"current_steps": 1585, "total_steps": 3962, "loss": 0.48, "lr": 3.0020344277485017e-05, "epoch": 2.8010610079575597, "percentage": 40.01, "elapsed_time": "3:43:05", "remaining_time": "5:34:34"} +{"current_steps": 1590, "total_steps": 3962, "loss": 0.4652, "lr": 2.994398213587746e-05, "epoch": 2.8099027409372237, "percentage": 40.13, "elapsed_time": "3:43:47", "remaining_time": "5:33:51"} +{"current_steps": 1595, "total_steps": 3962, "loss": 0.4838, "lr": 2.9867426939596876e-05, "epoch": 2.8187444739168876, "percentage": 40.26, "elapsed_time": "3:44:34", "remaining_time": "5:33:16"} +{"current_steps": 1600, "total_steps": 3962, "loss": 0.4958, "lr": 2.9790680174902818e-05, "epoch": 2.8275862068965516, "percentage": 40.38, "elapsed_time": "3:45:07", "remaining_time": "5:32:19"} +{"current_steps": 1605, "total_steps": 3962, "loss": 0.4531, "lr": 2.971374333177398e-05, "epoch": 2.8364279398762156, "percentage": 40.51, "elapsed_time": "3:45:51", "remaining_time": "5:31:41"} +{"current_steps": 1610, "total_steps": 3962, "loss": 0.4687, "lr": 2.963661790387928e-05, "epoch": 2.8452696728558795, "percentage": 40.64, "elapsed_time": "3:46:36", "remaining_time": "5:31:03"} +{"current_steps": 1615, "total_steps": 3962, "loss": 0.4605, "lr": 2.9559305388548884e-05, "epoch": 2.854111405835544, "percentage": 40.76, "elapsed_time": "3:47:11", "remaining_time": "5:30:09"} +{"current_steps": 1620, "total_steps": 3962, "loss": 0.4769, "lr": 2.948180728674508e-05, "epoch": 2.862953138815208, "percentage": 40.89, "elapsed_time": "3:47:43", "remaining_time": "5:29:13"} +{"current_steps": 1625, "total_steps": 3962, "loss": 0.4986, "lr": 2.9404125103033207e-05, "epoch": 2.871794871794872, "percentage": 41.01, "elapsed_time": "3:48:27", "remaining_time": "5:28:33"} +{"current_steps": 1630, "total_steps": 3962, "loss": 0.4532, "lr": 2.9326260345552384e-05, "epoch": 2.8806366047745358, "percentage": 41.14, "elapsed_time": "3:49:22", "remaining_time": "5:28:10"} +{"current_steps": 1635, "total_steps": 3962, "loss": 0.4596, "lr": 2.924821452598628e-05, "epoch": 2.8894783377541997, "percentage": 41.27, "elapsed_time": "3:50:02", "remaining_time": "5:27:24"} +{"current_steps": 1640, "total_steps": 3962, "loss": 0.4898, "lr": 2.916998915953373e-05, "epoch": 2.898320070733864, "percentage": 41.39, "elapsed_time": "3:50:46", "remaining_time": "5:26:44"} +{"current_steps": 1645, "total_steps": 3962, "loss": 0.4942, "lr": 2.9091585764879334e-05, "epoch": 2.907161803713528, "percentage": 41.52, "elapsed_time": "3:51:26", "remaining_time": "5:25:59"} +{"current_steps": 1650, "total_steps": 3962, "loss": 0.4683, "lr": 2.9013005864163967e-05, "epoch": 2.916003536693192, "percentage": 41.65, "elapsed_time": "3:52:01", "remaining_time": "5:25:07"} +{"current_steps": 1655, "total_steps": 3962, "loss": 0.5104, "lr": 2.8934250982955245e-05, "epoch": 2.924845269672856, "percentage": 41.77, "elapsed_time": "3:52:47", "remaining_time": "5:24:30"} +{"current_steps": 1660, "total_steps": 3962, "loss": 0.4734, "lr": 2.8855322650217878e-05, "epoch": 2.93368700265252, "percentage": 41.9, "elapsed_time": "3:53:37", "remaining_time": "5:23:58"} +{"current_steps": 1665, "total_steps": 3962, "loss": 0.4742, "lr": 2.877622239828402e-05, "epoch": 2.942528735632184, "percentage": 42.02, "elapsed_time": "3:54:23", "remaining_time": "5:23:21"} +{"current_steps": 1670, "total_steps": 3962, "loss": 0.4536, "lr": 2.8696951762823482e-05, "epoch": 2.951370468611848, "percentage": 42.15, "elapsed_time": "3:55:02", "remaining_time": "5:22:35"} +{"current_steps": 1675, "total_steps": 3962, "loss": 0.4773, "lr": 2.8617512282813962e-05, "epoch": 2.9602122015915118, "percentage": 42.28, "elapsed_time": "3:55:45", "remaining_time": "5:21:54"} +{"current_steps": 1680, "total_steps": 3962, "loss": 0.4409, "lr": 2.8537905500511115e-05, "epoch": 2.9690539345711757, "percentage": 42.4, "elapsed_time": "3:56:20", "remaining_time": "5:21:01"} +{"current_steps": 1685, "total_steps": 3962, "loss": 0.4841, "lr": 2.845813296141867e-05, "epoch": 2.97789566755084, "percentage": 42.53, "elapsed_time": "3:56:55", "remaining_time": "5:20:09"} +{"current_steps": 1690, "total_steps": 3962, "loss": 0.4642, "lr": 2.8378196214258368e-05, "epoch": 2.986737400530504, "percentage": 42.66, "elapsed_time": "3:57:38", "remaining_time": "5:19:29"} +{"current_steps": 1695, "total_steps": 3962, "loss": 0.4763, "lr": 2.8298096810939947e-05, "epoch": 2.995579133510168, "percentage": 42.78, "elapsed_time": "3:58:21", "remaining_time": "5:18:48"} +{"current_steps": 1700, "total_steps": 3962, "loss": 0.4496, "lr": 2.821783630653097e-05, "epoch": 3.0035366931918657, "percentage": 42.91, "elapsed_time": "3:59:06", "remaining_time": "5:18:09"} +{"current_steps": 1705, "total_steps": 3962, "loss": 0.4547, "lr": 2.8137416259226647e-05, "epoch": 3.0123784261715296, "percentage": 43.03, "elapsed_time": "3:59:51", "remaining_time": "5:17:31"} +{"current_steps": 1710, "total_steps": 3962, "loss": 0.4457, "lr": 2.805683823031962e-05, "epoch": 3.0212201591511936, "percentage": 43.16, "elapsed_time": "4:00:33", "remaining_time": "5:16:48"} +{"current_steps": 1715, "total_steps": 3962, "loss": 0.4231, "lr": 2.797610378416958e-05, "epoch": 3.0300618921308575, "percentage": 43.29, "elapsed_time": "4:01:08", "remaining_time": "5:15:56"} +{"current_steps": 1720, "total_steps": 3962, "loss": 0.4209, "lr": 2.789521448817297e-05, "epoch": 3.0389036251105215, "percentage": 43.41, "elapsed_time": "4:02:02", "remaining_time": "5:15:30"} +{"current_steps": 1725, "total_steps": 3962, "loss": 0.4595, "lr": 2.7814171912732505e-05, "epoch": 3.047745358090186, "percentage": 43.54, "elapsed_time": "4:02:46", "remaining_time": "5:14:49"} +{"current_steps": 1730, "total_steps": 3962, "loss": 0.4599, "lr": 2.7732977631226707e-05, "epoch": 3.05658709106985, "percentage": 43.66, "elapsed_time": "4:03:36", "remaining_time": "5:14:17"} +{"current_steps": 1735, "total_steps": 3962, "loss": 0.4421, "lr": 2.7651633219979354e-05, "epoch": 3.065428824049514, "percentage": 43.79, "elapsed_time": "4:04:08", "remaining_time": "5:13:22"} +{"current_steps": 1740, "total_steps": 3962, "loss": 0.4157, "lr": 2.757014025822887e-05, "epoch": 3.0742705570291777, "percentage": 43.92, "elapsed_time": "4:04:46", "remaining_time": "5:12:34"} +{"current_steps": 1745, "total_steps": 3962, "loss": 0.4646, "lr": 2.7488500328097676e-05, "epoch": 3.0831122900088417, "percentage": 44.04, "elapsed_time": "4:05:20", "remaining_time": "5:11:42"} +{"current_steps": 1750, "total_steps": 3962, "loss": 0.4398, "lr": 2.740671501456147e-05, "epoch": 3.0919540229885056, "percentage": 44.17, "elapsed_time": "4:06:01", "remaining_time": "5:10:58"} +{"current_steps": 1755, "total_steps": 3962, "loss": 0.4825, "lr": 2.732478590541846e-05, "epoch": 3.1007957559681696, "percentage": 44.3, "elapsed_time": "4:06:40", "remaining_time": "5:10:12"} +{"current_steps": 1760, "total_steps": 3962, "loss": 0.4489, "lr": 2.7242714591258515e-05, "epoch": 3.109637488947834, "percentage": 44.42, "elapsed_time": "4:07:26", "remaining_time": "5:09:35"} +{"current_steps": 1765, "total_steps": 3962, "loss": 0.447, "lr": 2.716050266543233e-05, "epoch": 3.118479221927498, "percentage": 44.55, "elapsed_time": "4:08:12", "remaining_time": "5:08:57"} +{"current_steps": 1770, "total_steps": 3962, "loss": 0.4511, "lr": 2.707815172402045e-05, "epoch": 3.127320954907162, "percentage": 44.67, "elapsed_time": "4:08:57", "remaining_time": "5:08:19"} +{"current_steps": 1775, "total_steps": 3962, "loss": 0.4653, "lr": 2.6995663365802297e-05, "epoch": 3.136162687886826, "percentage": 44.8, "elapsed_time": "4:09:26", "remaining_time": "5:07:20"} +{"current_steps": 1780, "total_steps": 3962, "loss": 0.4716, "lr": 2.6913039192225143e-05, "epoch": 3.14500442086649, "percentage": 44.93, "elapsed_time": "4:10:05", "remaining_time": "5:06:34"} +{"current_steps": 1785, "total_steps": 3962, "loss": 0.4321, "lr": 2.683028080737301e-05, "epoch": 3.1538461538461537, "percentage": 45.05, "elapsed_time": "4:10:44", "remaining_time": "5:05:48"} +{"current_steps": 1790, "total_steps": 3962, "loss": 0.4697, "lr": 2.6747389817935513e-05, "epoch": 3.1626878868258177, "percentage": 45.18, "elapsed_time": "4:11:20", "remaining_time": "5:04:58"} +{"current_steps": 1795, "total_steps": 3962, "loss": 0.4435, "lr": 2.6664367833176706e-05, "epoch": 3.171529619805482, "percentage": 45.31, "elapsed_time": "4:11:53", "remaining_time": "5:04:06"} +{"current_steps": 1800, "total_steps": 3962, "loss": 0.447, "lr": 2.6581216464903783e-05, "epoch": 3.180371352785146, "percentage": 45.43, "elapsed_time": "4:12:34", "remaining_time": "5:03:22"} +{"current_steps": 1805, "total_steps": 3962, "loss": 0.4587, "lr": 2.649793732743585e-05, "epoch": 3.18921308576481, "percentage": 45.56, "elapsed_time": "4:13:17", "remaining_time": "5:02:40"} +{"current_steps": 1810, "total_steps": 3962, "loss": 0.4575, "lr": 2.641453203757253e-05, "epoch": 3.198054818744474, "percentage": 45.68, "elapsed_time": "4:13:59", "remaining_time": "5:01:58"} +{"current_steps": 1815, "total_steps": 3962, "loss": 0.4535, "lr": 2.6331002214562612e-05, "epoch": 3.206896551724138, "percentage": 45.81, "elapsed_time": "4:14:29", "remaining_time": "5:01:03"} +{"current_steps": 1820, "total_steps": 3962, "loss": 0.4782, "lr": 2.624734948007259e-05, "epoch": 3.215738284703802, "percentage": 45.94, "elapsed_time": "4:15:19", "remaining_time": "5:00:29"} +{"current_steps": 1825, "total_steps": 3962, "loss": 0.4341, "lr": 2.616357545815518e-05, "epoch": 3.224580017683466, "percentage": 46.06, "elapsed_time": "4:16:04", "remaining_time": "4:59:51"} +{"current_steps": 1830, "total_steps": 3962, "loss": 0.4494, "lr": 2.6079681775217833e-05, "epoch": 3.2334217506631298, "percentage": 46.19, "elapsed_time": "4:16:49", "remaining_time": "4:59:11"} +{"current_steps": 1835, "total_steps": 3962, "loss": 0.4564, "lr": 2.5995670059991085e-05, "epoch": 3.242263483642794, "percentage": 46.31, "elapsed_time": "4:17:29", "remaining_time": "4:58:27"} +{"current_steps": 1840, "total_steps": 3962, "loss": 0.4148, "lr": 2.5911541943497e-05, "epoch": 3.251105216622458, "percentage": 46.44, "elapsed_time": "4:18:04", "remaining_time": "4:57:38"} +{"current_steps": 1845, "total_steps": 3962, "loss": 0.4271, "lr": 2.582729905901747e-05, "epoch": 3.259946949602122, "percentage": 46.57, "elapsed_time": "4:18:50", "remaining_time": "4:56:59"} +{"current_steps": 1850, "total_steps": 3962, "loss": 0.4524, "lr": 2.574294304206254e-05, "epoch": 3.268788682581786, "percentage": 46.69, "elapsed_time": "4:19:43", "remaining_time": "4:56:30"} +{"current_steps": 1855, "total_steps": 3962, "loss": 0.4439, "lr": 2.56584755303386e-05, "epoch": 3.27763041556145, "percentage": 46.82, "elapsed_time": "4:20:30", "remaining_time": "4:55:54"} +{"current_steps": 1860, "total_steps": 3962, "loss": 0.4215, "lr": 2.5573898163716663e-05, "epoch": 3.286472148541114, "percentage": 46.95, "elapsed_time": "4:21:20", "remaining_time": "4:55:21"} +{"current_steps": 1865, "total_steps": 3962, "loss": 0.448, "lr": 2.5489212584200446e-05, "epoch": 3.2953138815207783, "percentage": 47.07, "elapsed_time": "4:22:02", "remaining_time": "4:54:38"} +{"current_steps": 1870, "total_steps": 3962, "loss": 0.449, "lr": 2.5404420435894578e-05, "epoch": 3.3041556145004423, "percentage": 47.2, "elapsed_time": "4:22:48", "remaining_time": "4:54:00"} +{"current_steps": 1875, "total_steps": 3962, "loss": 0.447, "lr": 2.5319523364972606e-05, "epoch": 3.312997347480106, "percentage": 47.32, "elapsed_time": "4:23:34", "remaining_time": "4:53:22"} +{"current_steps": 1880, "total_steps": 3962, "loss": 0.4362, "lr": 2.5234523019645086e-05, "epoch": 3.32183908045977, "percentage": 47.45, "elapsed_time": "4:24:06", "remaining_time": "4:52:28"} +{"current_steps": 1885, "total_steps": 3962, "loss": 0.4341, "lr": 2.5149421050127556e-05, "epoch": 3.330680813439434, "percentage": 47.58, "elapsed_time": "4:24:53", "remaining_time": "4:51:52"} +{"current_steps": 1890, "total_steps": 3962, "loss": 0.4351, "lr": 2.5064219108608525e-05, "epoch": 3.339522546419098, "percentage": 47.7, "elapsed_time": "4:25:34", "remaining_time": "4:51:08"} +{"current_steps": 1895, "total_steps": 3962, "loss": 0.4492, "lr": 2.497891884921735e-05, "epoch": 3.348364279398762, "percentage": 47.83, "elapsed_time": "4:26:27", "remaining_time": "4:50:38"} +{"current_steps": 1900, "total_steps": 3962, "loss": 0.4703, "lr": 2.4893521927992182e-05, "epoch": 3.357206012378426, "percentage": 47.96, "elapsed_time": "4:27:09", "remaining_time": "4:49:56"} +{"current_steps": 1905, "total_steps": 3962, "loss": 0.4376, "lr": 2.4808030002847775e-05, "epoch": 3.3660477453580904, "percentage": 48.08, "elapsed_time": "4:27:53", "remaining_time": "4:49:16"} +{"current_steps": 1910, "total_steps": 3962, "loss": 0.4769, "lr": 2.472244473354332e-05, "epoch": 3.3748894783377543, "percentage": 48.21, "elapsed_time": "4:28:31", "remaining_time": "4:48:29"} +{"current_steps": 1915, "total_steps": 3962, "loss": 0.4615, "lr": 2.4636767781650183e-05, "epoch": 3.3837312113174183, "percentage": 48.33, "elapsed_time": "4:29:11", "remaining_time": "4:47:44"} +{"current_steps": 1920, "total_steps": 3962, "loss": 0.4899, "lr": 2.4551000810519714e-05, "epoch": 3.3925729442970822, "percentage": 48.46, "elapsed_time": "4:29:52", "remaining_time": "4:47:00"} +{"current_steps": 1925, "total_steps": 3962, "loss": 0.4519, "lr": 2.4465145485250888e-05, "epoch": 3.401414677276746, "percentage": 48.59, "elapsed_time": "4:30:37", "remaining_time": "4:46:22"} +{"current_steps": 1930, "total_steps": 3962, "loss": 0.4214, "lr": 2.437920347265802e-05, "epoch": 3.41025641025641, "percentage": 48.71, "elapsed_time": "4:31:04", "remaining_time": "4:45:23"} +{"current_steps": 1935, "total_steps": 3962, "loss": 0.4112, "lr": 2.4293176441238396e-05, "epoch": 3.419098143236074, "percentage": 48.84, "elapsed_time": "4:31:38", "remaining_time": "4:44:33"} +{"current_steps": 1940, "total_steps": 3962, "loss": 0.4189, "lr": 2.420706606113986e-05, "epoch": 3.4279398762157385, "percentage": 48.97, "elapsed_time": "4:32:19", "remaining_time": "4:43:49"} +{"current_steps": 1945, "total_steps": 3962, "loss": 0.4861, "lr": 2.4120874004128422e-05, "epoch": 3.4367816091954024, "percentage": 49.09, "elapsed_time": "4:32:57", "remaining_time": "4:43:03"} +{"current_steps": 1950, "total_steps": 3962, "loss": 0.4576, "lr": 2.4034601943555775e-05, "epoch": 3.4456233421750664, "percentage": 49.22, "elapsed_time": "4:33:43", "remaining_time": "4:42:26"} +{"current_steps": 1955, "total_steps": 3962, "loss": 0.4412, "lr": 2.3948251554326826e-05, "epoch": 3.4544650751547303, "percentage": 49.34, "elapsed_time": "4:34:38", "remaining_time": "4:41:57"} +{"current_steps": 1960, "total_steps": 3962, "loss": 0.421, "lr": 2.3861824512867172e-05, "epoch": 3.4633068081343943, "percentage": 49.47, "elapsed_time": "4:35:14", "remaining_time": "4:41:07"} +{"current_steps": 1965, "total_steps": 3962, "loss": 0.4557, "lr": 2.377532249709054e-05, "epoch": 3.4721485411140582, "percentage": 49.6, "elapsed_time": "4:36:00", "remaining_time": "4:40:30"} +{"current_steps": 1970, "total_steps": 3962, "loss": 0.4472, "lr": 2.368874718636625e-05, "epoch": 3.480990274093722, "percentage": 49.72, "elapsed_time": "4:36:38", "remaining_time": "4:39:44"} +{"current_steps": 1975, "total_steps": 3962, "loss": 0.4754, "lr": 2.3602100261486557e-05, "epoch": 3.489832007073386, "percentage": 49.85, "elapsed_time": "4:37:22", "remaining_time": "4:39:03"} +{"current_steps": 1980, "total_steps": 3962, "loss": 0.4378, "lr": 2.3515383404634075e-05, "epoch": 3.4986737400530505, "percentage": 49.97, "elapsed_time": "4:38:07", "remaining_time": "4:38:24"} +{"current_steps": 1985, "total_steps": 3962, "loss": 0.4694, "lr": 2.3428598299349076e-05, "epoch": 3.5075154730327145, "percentage": 50.1, "elapsed_time": "4:38:44", "remaining_time": "4:37:37"} +{"current_steps": 1990, "total_steps": 3962, "loss": 0.4454, "lr": 2.3341746630496828e-05, "epoch": 3.5163572060123784, "percentage": 50.23, "elapsed_time": "4:39:12", "remaining_time": "4:36:41"} +{"current_steps": 1995, "total_steps": 3962, "loss": 0.4168, "lr": 2.3254830084234877e-05, "epoch": 3.5251989389920424, "percentage": 50.35, "elapsed_time": "4:40:03", "remaining_time": "4:36:07"} +{"current_steps": 2000, "total_steps": 3962, "loss": 0.4506, "lr": 2.316785034798032e-05, "epoch": 3.5340406719717063, "percentage": 50.48, "elapsed_time": "4:40:40", "remaining_time": "4:35:20"} +{"current_steps": 2005, "total_steps": 3962, "loss": 0.4358, "lr": 2.308080911037703e-05, "epoch": 3.5428824049513707, "percentage": 50.61, "elapsed_time": "4:41:24", "remaining_time": "4:34:40"} +{"current_steps": 2010, "total_steps": 3962, "loss": 0.458, "lr": 2.2993708061262886e-05, "epoch": 3.5517241379310347, "percentage": 50.73, "elapsed_time": "4:41:58", "remaining_time": "4:33:50"} +{"current_steps": 2015, "total_steps": 3962, "loss": 0.4567, "lr": 2.2906548891636956e-05, "epoch": 3.5605658709106986, "percentage": 50.86, "elapsed_time": "4:42:42", "remaining_time": "4:33:10"} +{"current_steps": 2020, "total_steps": 3962, "loss": 0.4483, "lr": 2.2819333293626686e-05, "epoch": 3.5694076038903626, "percentage": 50.98, "elapsed_time": "4:43:28", "remaining_time": "4:32:32"} +{"current_steps": 2025, "total_steps": 3962, "loss": 0.4373, "lr": 2.2732062960455014e-05, "epoch": 3.5782493368700266, "percentage": 51.11, "elapsed_time": "4:44:24", "remaining_time": "4:32:02"} +{"current_steps": 2030, "total_steps": 3962, "loss": 0.412, "lr": 2.264473958640753e-05, "epoch": 3.5870910698496905, "percentage": 51.24, "elapsed_time": "4:45:20", "remaining_time": "4:31:34"} +{"current_steps": 2035, "total_steps": 3962, "loss": 0.4285, "lr": 2.2557364866799572e-05, "epoch": 3.5959328028293545, "percentage": 51.36, "elapsed_time": "4:45:49", "remaining_time": "4:30:39"} +{"current_steps": 2040, "total_steps": 3962, "loss": 0.4663, "lr": 2.246994049794332e-05, "epoch": 3.6047745358090184, "percentage": 51.49, "elapsed_time": "4:46:41", "remaining_time": "4:30:06"} +{"current_steps": 2045, "total_steps": 3962, "loss": 0.4001, "lr": 2.2382468177114834e-05, "epoch": 3.6136162687886824, "percentage": 51.62, "elapsed_time": "4:47:27", "remaining_time": "4:29:28"} +{"current_steps": 2050, "total_steps": 3962, "loss": 0.4664, "lr": 2.2294949602521142e-05, "epoch": 3.6224580017683468, "percentage": 51.74, "elapsed_time": "4:48:12", "remaining_time": "4:28:48"} +{"current_steps": 2055, "total_steps": 3962, "loss": 0.4407, "lr": 2.2207386473267247e-05, "epoch": 3.6312997347480107, "percentage": 51.87, "elapsed_time": "4:48:46", "remaining_time": "4:27:58"} +{"current_steps": 2060, "total_steps": 3962, "loss": 0.4363, "lr": 2.2119780489323154e-05, "epoch": 3.6401414677276747, "percentage": 51.99, "elapsed_time": "4:49:13", "remaining_time": "4:27:02"} +{"current_steps": 2065, "total_steps": 3962, "loss": 0.4571, "lr": 2.2032133351490835e-05, "epoch": 3.6489832007073386, "percentage": 52.12, "elapsed_time": "4:49:50", "remaining_time": "4:26:15"} +{"current_steps": 2070, "total_steps": 3962, "loss": 0.4217, "lr": 2.1944446761371264e-05, "epoch": 3.6578249336870026, "percentage": 52.25, "elapsed_time": "4:50:26", "remaining_time": "4:25:27"} +{"current_steps": 2075, "total_steps": 3962, "loss": 0.444, "lr": 2.1856722421331322e-05, "epoch": 3.6666666666666665, "percentage": 52.37, "elapsed_time": "4:51:09", "remaining_time": "4:24:46"} +{"current_steps": 2080, "total_steps": 3962, "loss": 0.4696, "lr": 2.1768962034470803e-05, "epoch": 3.675508399646331, "percentage": 52.5, "elapsed_time": "4:51:50", "remaining_time": "4:24:03"} +{"current_steps": 2085, "total_steps": 3962, "loss": 0.4074, "lr": 2.1681167304589295e-05, "epoch": 3.684350132625995, "percentage": 52.62, "elapsed_time": "4:52:18", "remaining_time": "4:23:08"} +{"current_steps": 2090, "total_steps": 3962, "loss": 0.424, "lr": 2.1593339936153148e-05, "epoch": 3.693191865605659, "percentage": 52.75, "elapsed_time": "4:53:08", "remaining_time": "4:22:33"} +{"current_steps": 2095, "total_steps": 3962, "loss": 0.4053, "lr": 2.1505481634262354e-05, "epoch": 3.7020335985853228, "percentage": 52.88, "elapsed_time": "4:53:58", "remaining_time": "4:21:59"} +{"current_steps": 2100, "total_steps": 3962, "loss": 0.4182, "lr": 2.141759410461746e-05, "epoch": 3.7108753315649867, "percentage": 53.0, "elapsed_time": "4:54:33", "remaining_time": "4:21:10"} +{"current_steps": 2105, "total_steps": 3962, "loss": 0.4478, "lr": 2.1329679053486444e-05, "epoch": 3.7197170645446507, "percentage": 53.13, "elapsed_time": "4:55:18", "remaining_time": "4:20:30"} +{"current_steps": 2110, "total_steps": 3962, "loss": 0.4299, "lr": 2.1241738187671595e-05, "epoch": 3.7285587975243146, "percentage": 53.26, "elapsed_time": "4:55:57", "remaining_time": "4:19:46"} +{"current_steps": 2115, "total_steps": 3962, "loss": 0.4992, "lr": 2.115377321447637e-05, "epoch": 3.7374005305039786, "percentage": 53.38, "elapsed_time": "4:56:30", "remaining_time": "4:18:55"} +{"current_steps": 2120, "total_steps": 3962, "loss": 0.4114, "lr": 2.106578584167225e-05, "epoch": 3.7462422634836425, "percentage": 53.51, "elapsed_time": "4:57:09", "remaining_time": "4:18:11"} +{"current_steps": 2125, "total_steps": 3962, "loss": 0.4229, "lr": 2.0977777777465594e-05, "epoch": 3.755083996463307, "percentage": 53.63, "elapsed_time": "4:57:43", "remaining_time": "4:17:22"} +{"current_steps": 2130, "total_steps": 3962, "loss": 0.4612, "lr": 2.0889750730464474e-05, "epoch": 3.763925729442971, "percentage": 53.76, "elapsed_time": "4:58:16", "remaining_time": "4:16:32"} +{"current_steps": 2135, "total_steps": 3962, "loss": 0.4607, "lr": 2.0801706409645473e-05, "epoch": 3.772767462422635, "percentage": 53.89, "elapsed_time": "4:59:00", "remaining_time": "4:15:52"} +{"current_steps": 2140, "total_steps": 3962, "loss": 0.4408, "lr": 2.0713646524320557e-05, "epoch": 3.781609195402299, "percentage": 54.01, "elapsed_time": "4:59:32", "remaining_time": "4:15:02"} +{"current_steps": 2145, "total_steps": 3962, "loss": 0.471, "lr": 2.0625572784103855e-05, "epoch": 3.7904509283819627, "percentage": 54.14, "elapsed_time": "5:00:12", "remaining_time": "4:14:18"} +{"current_steps": 2150, "total_steps": 3962, "loss": 0.4261, "lr": 2.053748689887848e-05, "epoch": 3.799292661361627, "percentage": 54.27, "elapsed_time": "5:00:54", "remaining_time": "4:13:35"} +{"current_steps": 2155, "total_steps": 3962, "loss": 0.4283, "lr": 2.0449390578763336e-05, "epoch": 3.808134394341291, "percentage": 54.39, "elapsed_time": "5:01:35", "remaining_time": "4:12:53"} +{"current_steps": 2160, "total_steps": 3962, "loss": 0.4411, "lr": 2.036128553407989e-05, "epoch": 3.816976127320955, "percentage": 54.52, "elapsed_time": "5:02:15", "remaining_time": "4:12:09"} +{"current_steps": 2165, "total_steps": 3962, "loss": 0.4583, "lr": 2.027317347531902e-05, "epoch": 3.825817860300619, "percentage": 54.64, "elapsed_time": "5:02:57", "remaining_time": "4:11:27"} +{"current_steps": 2170, "total_steps": 3962, "loss": 0.495, "lr": 2.0185056113107763e-05, "epoch": 3.834659593280283, "percentage": 54.77, "elapsed_time": "5:03:53", "remaining_time": "4:10:57"} +{"current_steps": 2175, "total_steps": 3962, "loss": 0.434, "lr": 2.0096935158176105e-05, "epoch": 3.843501326259947, "percentage": 54.9, "elapsed_time": "5:04:31", "remaining_time": "4:10:12"} +{"current_steps": 2180, "total_steps": 3962, "loss": 0.4657, "lr": 2.000881232132381e-05, "epoch": 3.852343059239611, "percentage": 55.02, "elapsed_time": "5:05:13", "remaining_time": "4:09:30"} +{"current_steps": 2185, "total_steps": 3962, "loss": 0.4246, "lr": 1.9920689313387148e-05, "epoch": 3.861184792219275, "percentage": 55.15, "elapsed_time": "5:05:55", "remaining_time": "4:08:48"} +{"current_steps": 2190, "total_steps": 3962, "loss": 0.4161, "lr": 1.9832567845205735e-05, "epoch": 3.8700265251989387, "percentage": 55.28, "elapsed_time": "5:06:45", "remaining_time": "4:08:12"} +{"current_steps": 2195, "total_steps": 3962, "loss": 0.4294, "lr": 1.974444962758929e-05, "epoch": 3.878868258178603, "percentage": 55.4, "elapsed_time": "5:07:27", "remaining_time": "4:07:30"} +{"current_steps": 2200, "total_steps": 3962, "loss": 0.4552, "lr": 1.9656336371284406e-05, "epoch": 3.887709991158267, "percentage": 55.53, "elapsed_time": "5:08:07", "remaining_time": "4:06:46"} +{"current_steps": 2205, "total_steps": 3962, "loss": 0.4438, "lr": 1.956822978694137e-05, "epoch": 3.896551724137931, "percentage": 55.65, "elapsed_time": "5:08:52", "remaining_time": "4:06:07"} +{"current_steps": 2210, "total_steps": 3962, "loss": 0.4231, "lr": 1.9480131585080946e-05, "epoch": 3.905393457117595, "percentage": 55.78, "elapsed_time": "5:09:40", "remaining_time": "4:05:30"} +{"current_steps": 2215, "total_steps": 3962, "loss": 0.4493, "lr": 1.939204347606115e-05, "epoch": 3.914235190097259, "percentage": 55.91, "elapsed_time": "5:10:18", "remaining_time": "4:04:44"} +{"current_steps": 2220, "total_steps": 3962, "loss": 0.4358, "lr": 1.9303967170044043e-05, "epoch": 3.9230769230769234, "percentage": 56.03, "elapsed_time": "5:11:07", "remaining_time": "4:04:08"} +{"current_steps": 2225, "total_steps": 3962, "loss": 0.4263, "lr": 1.9215904376962555e-05, "epoch": 3.9319186560565873, "percentage": 56.16, "elapsed_time": "5:11:46", "remaining_time": "4:03:24"} +{"current_steps": 2230, "total_steps": 3962, "loss": 0.4388, "lr": 1.9127856806487266e-05, "epoch": 3.9407603890362513, "percentage": 56.28, "elapsed_time": "5:12:24", "remaining_time": "4:02:38"} +{"current_steps": 2235, "total_steps": 3962, "loss": 0.4483, "lr": 1.9039826167993235e-05, "epoch": 3.949602122015915, "percentage": 56.41, "elapsed_time": "5:12:57", "remaining_time": "4:01:49"} +{"current_steps": 2240, "total_steps": 3962, "loss": 0.4231, "lr": 1.895181417052677e-05, "epoch": 3.958443854995579, "percentage": 56.54, "elapsed_time": "5:13:39", "remaining_time": "4:01:07"} +{"current_steps": 2245, "total_steps": 3962, "loss": 0.4245, "lr": 1.88638225227723e-05, "epoch": 3.967285587975243, "percentage": 56.66, "elapsed_time": "5:14:32", "remaining_time": "4:00:33"} +{"current_steps": 2250, "total_steps": 3962, "loss": 0.4163, "lr": 1.877585293301918e-05, "epoch": 3.976127320954907, "percentage": 56.79, "elapsed_time": "5:15:15", "remaining_time": "3:59:52"} +{"current_steps": 2255, "total_steps": 3962, "loss": 0.4301, "lr": 1.868790710912853e-05, "epoch": 3.984969053934571, "percentage": 56.92, "elapsed_time": "5:16:01", "remaining_time": "3:59:13"} +{"current_steps": 2260, "total_steps": 3962, "loss": 0.4667, "lr": 1.8599986758500047e-05, "epoch": 3.993810786914235, "percentage": 57.04, "elapsed_time": "5:16:40", "remaining_time": "3:58:29"} +{"current_steps": 2265, "total_steps": 3962, "loss": 0.4144, "lr": 1.8512093588038915e-05, "epoch": 4.001768346595933, "percentage": 57.17, "elapsed_time": "5:17:20", "remaining_time": "3:57:45"} +{"current_steps": 2270, "total_steps": 3962, "loss": 0.4182, "lr": 1.842422930412262e-05, "epoch": 4.010610079575597, "percentage": 57.29, "elapsed_time": "5:18:14", "remaining_time": "3:57:12"} +{"current_steps": 2275, "total_steps": 3962, "loss": 0.4081, "lr": 1.8336395612567857e-05, "epoch": 4.0194518125552605, "percentage": 57.42, "elapsed_time": "5:18:50", "remaining_time": "3:56:26"} +{"current_steps": 2280, "total_steps": 3962, "loss": 0.4291, "lr": 1.824859421859736e-05, "epoch": 4.0282935455349245, "percentage": 57.55, "elapsed_time": "5:19:26", "remaining_time": "3:55:39"} +{"current_steps": 2285, "total_steps": 3962, "loss": 0.4333, "lr": 1.8160826826806856e-05, "epoch": 4.037135278514588, "percentage": 57.67, "elapsed_time": "5:20:04", "remaining_time": "3:54:54"} +{"current_steps": 2290, "total_steps": 3962, "loss": 0.3803, "lr": 1.8073095141131946e-05, "epoch": 4.045977011494253, "percentage": 57.8, "elapsed_time": "5:20:49", "remaining_time": "3:54:14"} +{"current_steps": 2295, "total_steps": 3962, "loss": 0.4017, "lr": 1.7985400864815027e-05, "epoch": 4.054818744473917, "percentage": 57.93, "elapsed_time": "5:21:25", "remaining_time": "3:53:28"} +{"current_steps": 2300, "total_steps": 3962, "loss": 0.403, "lr": 1.7897745700372194e-05, "epoch": 4.063660477453581, "percentage": 58.05, "elapsed_time": "5:22:12", "remaining_time": "3:52:49"} +{"current_steps": 2305, "total_steps": 3962, "loss": 0.3903, "lr": 1.781013134956025e-05, "epoch": 4.072502210433245, "percentage": 58.18, "elapsed_time": "5:22:45", "remaining_time": "3:52:01"} +{"current_steps": 2310, "total_steps": 3962, "loss": 0.4298, "lr": 1.7722559513343616e-05, "epoch": 4.081343943412909, "percentage": 58.3, "elapsed_time": "5:23:37", "remaining_time": "3:51:26"} +{"current_steps": 2315, "total_steps": 3962, "loss": 0.4048, "lr": 1.7635031891861334e-05, "epoch": 4.090185676392573, "percentage": 58.43, "elapsed_time": "5:24:19", "remaining_time": "3:50:44"} +{"current_steps": 2320, "total_steps": 3962, "loss": 0.3999, "lr": 1.7547550184394036e-05, "epoch": 4.099027409372237, "percentage": 58.56, "elapsed_time": "5:24:57", "remaining_time": "3:49:59"} +{"current_steps": 2325, "total_steps": 3962, "loss": 0.4263, "lr": 1.746011608933098e-05, "epoch": 4.107869142351901, "percentage": 58.68, "elapsed_time": "5:25:33", "remaining_time": "3:49:13"} +{"current_steps": 2330, "total_steps": 3962, "loss": 0.4234, "lr": 1.7372731304137072e-05, "epoch": 4.116710875331565, "percentage": 58.81, "elapsed_time": "5:26:22", "remaining_time": "3:48:36"} +{"current_steps": 2335, "total_steps": 3962, "loss": 0.4209, "lr": 1.7285397525319897e-05, "epoch": 4.125552608311229, "percentage": 58.93, "elapsed_time": "5:27:15", "remaining_time": "3:48:01"} +{"current_steps": 2340, "total_steps": 3962, "loss": 0.4446, "lr": 1.719811644839679e-05, "epoch": 4.134394341290893, "percentage": 59.06, "elapsed_time": "5:28:02", "remaining_time": "3:47:23"} +{"current_steps": 2345, "total_steps": 3962, "loss": 0.4049, "lr": 1.711088976786192e-05, "epoch": 4.143236074270557, "percentage": 59.19, "elapsed_time": "5:28:49", "remaining_time": "3:46:44"} +{"current_steps": 2350, "total_steps": 3962, "loss": 0.4287, "lr": 1.7023719177153397e-05, "epoch": 4.152077807250221, "percentage": 59.31, "elapsed_time": "5:29:40", "remaining_time": "3:46:08"} +{"current_steps": 2355, "total_steps": 3962, "loss": 0.426, "lr": 1.6936606368620393e-05, "epoch": 4.160919540229885, "percentage": 59.44, "elapsed_time": "5:30:14", "remaining_time": "3:45:21"} +{"current_steps": 2360, "total_steps": 3962, "loss": 0.4116, "lr": 1.684955303349027e-05, "epoch": 4.1697612732095495, "percentage": 59.57, "elapsed_time": "5:30:56", "remaining_time": "3:44:39"} +{"current_steps": 2365, "total_steps": 3962, "loss": 0.3691, "lr": 1.6762560861835778e-05, "epoch": 4.178603006189213, "percentage": 59.69, "elapsed_time": "5:31:32", "remaining_time": "3:43:52"} +{"current_steps": 2370, "total_steps": 3962, "loss": 0.4199, "lr": 1.6675631542542206e-05, "epoch": 4.187444739168877, "percentage": 59.82, "elapsed_time": "5:32:06", "remaining_time": "3:43:05"} +{"current_steps": 2375, "total_steps": 3962, "loss": 0.4325, "lr": 1.658876676327464e-05, "epoch": 4.196286472148541, "percentage": 59.94, "elapsed_time": "5:32:47", "remaining_time": "3:42:22"} +{"current_steps": 2380, "total_steps": 3962, "loss": 0.433, "lr": 1.6501968210445144e-05, "epoch": 4.205128205128205, "percentage": 60.07, "elapsed_time": "5:33:21", "remaining_time": "3:41:35"} +{"current_steps": 2385, "total_steps": 3962, "loss": 0.4051, "lr": 1.641523756918006e-05, "epoch": 4.213969938107869, "percentage": 60.2, "elapsed_time": "5:34:13", "remaining_time": "3:40:59"} +{"current_steps": 2390, "total_steps": 3962, "loss": 0.4268, "lr": 1.6328576523287284e-05, "epoch": 4.222811671087533, "percentage": 60.32, "elapsed_time": "5:34:54", "remaining_time": "3:40:17"} +{"current_steps": 2395, "total_steps": 3962, "loss": 0.4281, "lr": 1.6241986755223574e-05, "epoch": 4.231653404067197, "percentage": 60.45, "elapsed_time": "5:35:48", "remaining_time": "3:39:43"} +{"current_steps": 2400, "total_steps": 3962, "loss": 0.3957, "lr": 1.6155469946061863e-05, "epoch": 4.240495137046861, "percentage": 60.58, "elapsed_time": "5:36:27", "remaining_time": "3:38:58"} +{"current_steps": 2405, "total_steps": 3962, "loss": 0.4381, "lr": 1.6069027775458665e-05, "epoch": 4.249336870026525, "percentage": 60.7, "elapsed_time": "5:37:07", "remaining_time": "3:38:15"} +{"current_steps": 2410, "total_steps": 3962, "loss": 0.4092, "lr": 1.5982661921621437e-05, "epoch": 4.258178603006189, "percentage": 60.83, "elapsed_time": "5:37:50", "remaining_time": "3:37:33"} +{"current_steps": 2415, "total_steps": 3962, "loss": 0.4286, "lr": 1.5896374061276015e-05, "epoch": 4.267020335985853, "percentage": 60.95, "elapsed_time": "5:38:29", "remaining_time": "3:36:50"} +{"current_steps": 2420, "total_steps": 3962, "loss": 0.4031, "lr": 1.5810165869634027e-05, "epoch": 4.275862068965517, "percentage": 61.08, "elapsed_time": "5:39:03", "remaining_time": "3:36:02"} +{"current_steps": 2425, "total_steps": 3962, "loss": 0.4139, "lr": 1.572403902036042e-05, "epoch": 4.284703801945181, "percentage": 61.21, "elapsed_time": "5:39:49", "remaining_time": "3:35:22"} +{"current_steps": 2430, "total_steps": 3962, "loss": 0.3881, "lr": 1.5637995185540932e-05, "epoch": 4.293545534924846, "percentage": 61.33, "elapsed_time": "5:40:25", "remaining_time": "3:34:37"} +{"current_steps": 2435, "total_steps": 3962, "loss": 0.4188, "lr": 1.5552036035649656e-05, "epoch": 4.30238726790451, "percentage": 61.46, "elapsed_time": "5:40:59", "remaining_time": "3:33:50"} +{"current_steps": 2440, "total_steps": 3962, "loss": 0.3927, "lr": 1.5466163239516553e-05, "epoch": 4.311229000884174, "percentage": 61.59, "elapsed_time": "5:41:50", "remaining_time": "3:33:13"} +{"current_steps": 2445, "total_steps": 3962, "loss": 0.3999, "lr": 1.5380378464295133e-05, "epoch": 4.3200707338638376, "percentage": 61.71, "elapsed_time": "5:42:27", "remaining_time": "3:32:28"} +{"current_steps": 2450, "total_steps": 3962, "loss": 0.45, "lr": 1.5294683375430035e-05, "epoch": 4.3289124668435015, "percentage": 61.84, "elapsed_time": "5:42:52", "remaining_time": "3:31:36"} +{"current_steps": 2455, "total_steps": 3962, "loss": 0.398, "lr": 1.520907963662471e-05, "epoch": 4.3377541998231655, "percentage": 61.96, "elapsed_time": "5:43:21", "remaining_time": "3:30:46"} +{"current_steps": 2460, "total_steps": 3962, "loss": 0.3993, "lr": 1.5123568909809103e-05, "epoch": 4.346595932802829, "percentage": 62.09, "elapsed_time": "5:43:53", "remaining_time": "3:29:58"} +{"current_steps": 2465, "total_steps": 3962, "loss": 0.4331, "lr": 1.5038152855107422e-05, "epoch": 4.355437665782493, "percentage": 62.22, "elapsed_time": "5:44:34", "remaining_time": "3:29:15"} +{"current_steps": 2470, "total_steps": 3962, "loss": 0.4228, "lr": 1.4952833130805884e-05, "epoch": 4.364279398762157, "percentage": 62.34, "elapsed_time": "5:45:18", "remaining_time": "3:28:34"} +{"current_steps": 2475, "total_steps": 3962, "loss": 0.4432, "lr": 1.4867611393320533e-05, "epoch": 4.373121131741821, "percentage": 62.47, "elapsed_time": "5:46:04", "remaining_time": "3:27:55"} +{"current_steps": 2480, "total_steps": 3962, "loss": 0.3911, "lr": 1.478248929716505e-05, "epoch": 4.381962864721485, "percentage": 62.59, "elapsed_time": "5:46:49", "remaining_time": "3:27:15"} +{"current_steps": 2485, "total_steps": 3962, "loss": 0.4436, "lr": 1.4697468494918687e-05, "epoch": 4.390804597701149, "percentage": 62.72, "elapsed_time": "5:47:19", "remaining_time": "3:26:26"} +{"current_steps": 2490, "total_steps": 3962, "loss": 0.4475, "lr": 1.4612550637194141e-05, "epoch": 4.399646330680813, "percentage": 62.85, "elapsed_time": "5:48:02", "remaining_time": "3:25:45"} +{"current_steps": 2495, "total_steps": 3962, "loss": 0.4507, "lr": 1.4527737372605529e-05, "epoch": 4.408488063660477, "percentage": 62.97, "elapsed_time": "5:48:38", "remaining_time": "3:24:59"} +{"current_steps": 2500, "total_steps": 3962, "loss": 0.4381, "lr": 1.4443030347736347e-05, "epoch": 4.417329796640141, "percentage": 63.1, "elapsed_time": "5:49:21", "remaining_time": "3:24:17"} +{"current_steps": 2505, "total_steps": 3962, "loss": 0.4017, "lr": 1.435843120710756e-05, "epoch": 4.426171529619806, "percentage": 63.23, "elapsed_time": "5:50:06", "remaining_time": "3:23:38"} +{"current_steps": 2510, "total_steps": 3962, "loss": 0.4483, "lr": 1.4273941593145636e-05, "epoch": 4.43501326259947, "percentage": 63.35, "elapsed_time": "5:50:48", "remaining_time": "3:22:56"} +{"current_steps": 2515, "total_steps": 3962, "loss": 0.4212, "lr": 1.4189563146150669e-05, "epoch": 4.443854995579134, "percentage": 63.48, "elapsed_time": "5:51:23", "remaining_time": "3:22:10"} +{"current_steps": 2520, "total_steps": 3962, "loss": 0.4347, "lr": 1.4105297504264516e-05, "epoch": 4.452696728558798, "percentage": 63.6, "elapsed_time": "5:51:49", "remaining_time": "3:21:19"} +{"current_steps": 2525, "total_steps": 3962, "loss": 0.4029, "lr": 1.4021146303439031e-05, "epoch": 4.461538461538462, "percentage": 63.73, "elapsed_time": "5:52:25", "remaining_time": "3:20:34"} +{"current_steps": 2530, "total_steps": 3962, "loss": 0.4369, "lr": 1.3937111177404279e-05, "epoch": 4.470380194518126, "percentage": 63.86, "elapsed_time": "5:53:07", "remaining_time": "3:19:52"} +{"current_steps": 2535, "total_steps": 3962, "loss": 0.3756, "lr": 1.385319375763682e-05, "epoch": 4.47922192749779, "percentage": 63.98, "elapsed_time": "5:53:48", "remaining_time": "3:19:09"} +{"current_steps": 2540, "total_steps": 3962, "loss": 0.4351, "lr": 1.376939567332804e-05, "epoch": 4.4880636604774535, "percentage": 64.11, "elapsed_time": "5:54:25", "remaining_time": "3:18:25"} +{"current_steps": 2545, "total_steps": 3962, "loss": 0.4428, "lr": 1.3685718551352518e-05, "epoch": 4.4969053934571175, "percentage": 64.24, "elapsed_time": "5:55:07", "remaining_time": "3:17:43"} +{"current_steps": 2550, "total_steps": 3962, "loss": 0.4019, "lr": 1.3602164016236444e-05, "epoch": 4.505747126436781, "percentage": 64.36, "elapsed_time": "5:55:56", "remaining_time": "3:17:05"} +{"current_steps": 2555, "total_steps": 3962, "loss": 0.4236, "lr": 1.3518733690126084e-05, "epoch": 4.514588859416445, "percentage": 64.49, "elapsed_time": "5:56:33", "remaining_time": "3:16:20"} +{"current_steps": 2560, "total_steps": 3962, "loss": 0.388, "lr": 1.3435429192756275e-05, "epoch": 4.523430592396109, "percentage": 64.61, "elapsed_time": "5:57:24", "remaining_time": "3:15:44"} +{"current_steps": 2565, "total_steps": 3962, "loss": 0.4202, "lr": 1.3352252141418998e-05, "epoch": 4.532272325375773, "percentage": 64.74, "elapsed_time": "5:57:54", "remaining_time": "3:14:55"} +{"current_steps": 2570, "total_steps": 3962, "loss": 0.4112, "lr": 1.3269204150931953e-05, "epoch": 4.541114058355438, "percentage": 64.87, "elapsed_time": "5:58:46", "remaining_time": "3:14:19"} +{"current_steps": 2575, "total_steps": 3962, "loss": 0.4039, "lr": 1.3186286833607244e-05, "epoch": 4.549955791335101, "percentage": 64.99, "elapsed_time": "5:59:25", "remaining_time": "3:13:36"} +{"current_steps": 2580, "total_steps": 3962, "loss": 0.4085, "lr": 1.3103501799220033e-05, "epoch": 4.558797524314766, "percentage": 65.12, "elapsed_time": "6:00:06", "remaining_time": "3:12:53"} +{"current_steps": 2585, "total_steps": 3962, "loss": 0.4209, "lr": 1.3020850654977333e-05, "epoch": 4.56763925729443, "percentage": 65.24, "elapsed_time": "6:00:41", "remaining_time": "3:12:07"} +{"current_steps": 2590, "total_steps": 3962, "loss": 0.4446, "lr": 1.293833500548678e-05, "epoch": 4.576480990274094, "percentage": 65.37, "elapsed_time": "6:01:24", "remaining_time": "3:11:26"} +{"current_steps": 2595, "total_steps": 3962, "loss": 0.3752, "lr": 1.2855956452725471e-05, "epoch": 4.585322723253758, "percentage": 65.5, "elapsed_time": "6:02:20", "remaining_time": "3:10:52"} +{"current_steps": 2600, "total_steps": 3962, "loss": 0.3987, "lr": 1.2773716596008889e-05, "epoch": 4.594164456233422, "percentage": 65.62, "elapsed_time": "6:02:56", "remaining_time": "3:10:07"} +{"current_steps": 2605, "total_steps": 3962, "loss": 0.4105, "lr": 1.2691617031959843e-05, "epoch": 4.603006189213086, "percentage": 65.75, "elapsed_time": "6:03:38", "remaining_time": "3:09:25"} +{"current_steps": 2610, "total_steps": 3962, "loss": 0.4349, "lr": 1.2609659354477458e-05, "epoch": 4.61184792219275, "percentage": 65.88, "elapsed_time": "6:04:11", "remaining_time": "3:08:39"} +{"current_steps": 2615, "total_steps": 3962, "loss": 0.3781, "lr": 1.2527845154706264e-05, "epoch": 4.620689655172414, "percentage": 66.0, "elapsed_time": "6:04:54", "remaining_time": "3:07:57"} +{"current_steps": 2620, "total_steps": 3962, "loss": 0.4202, "lr": 1.2446176021005245e-05, "epoch": 4.629531388152078, "percentage": 66.13, "elapsed_time": "6:05:30", "remaining_time": "3:07:12"} +{"current_steps": 2625, "total_steps": 3962, "loss": 0.4161, "lr": 1.2364653538917076e-05, "epoch": 4.638373121131742, "percentage": 66.25, "elapsed_time": "6:06:03", "remaining_time": "3:06:26"} +{"current_steps": 2630, "total_steps": 3962, "loss": 0.4246, "lr": 1.2283279291137291e-05, "epoch": 4.647214854111406, "percentage": 66.38, "elapsed_time": "6:06:50", "remaining_time": "3:05:47"} +{"current_steps": 2635, "total_steps": 3962, "loss": 0.4014, "lr": 1.2202054857483576e-05, "epoch": 4.6560565870910695, "percentage": 66.51, "elapsed_time": "6:07:45", "remaining_time": "3:05:12"} +{"current_steps": 2640, "total_steps": 3962, "loss": 0.4114, "lr": 1.2120981814865073e-05, "epoch": 4.6648983200707335, "percentage": 66.63, "elapsed_time": "6:08:31", "remaining_time": "3:04:32"} +{"current_steps": 2645, "total_steps": 3962, "loss": 0.4629, "lr": 1.2040061737251807e-05, "epoch": 4.673740053050398, "percentage": 66.76, "elapsed_time": "6:09:07", "remaining_time": "3:03:47"} +{"current_steps": 2650, "total_steps": 3962, "loss": 0.3891, "lr": 1.19592961956441e-05, "epoch": 4.682581786030062, "percentage": 66.89, "elapsed_time": "6:10:01", "remaining_time": "3:03:11"} +{"current_steps": 2655, "total_steps": 3962, "loss": 0.4552, "lr": 1.1878686758042086e-05, "epoch": 4.691423519009726, "percentage": 67.01, "elapsed_time": "6:10:49", "remaining_time": "3:02:32"} +{"current_steps": 2660, "total_steps": 3962, "loss": 0.4191, "lr": 1.179823498941523e-05, "epoch": 4.70026525198939, "percentage": 67.14, "elapsed_time": "6:11:36", "remaining_time": "3:01:53"} +{"current_steps": 2665, "total_steps": 3962, "loss": 0.4428, "lr": 1.1717942451672008e-05, "epoch": 4.709106984969054, "percentage": 67.26, "elapsed_time": "6:12:26", "remaining_time": "3:01:15"} +{"current_steps": 2670, "total_steps": 3962, "loss": 0.4001, "lr": 1.1637810703629549e-05, "epoch": 4.717948717948718, "percentage": 67.39, "elapsed_time": "6:12:59", "remaining_time": "3:00:29"} +{"current_steps": 2675, "total_steps": 3962, "loss": 0.4537, "lr": 1.1557841300983363e-05, "epoch": 4.726790450928382, "percentage": 67.52, "elapsed_time": "6:13:28", "remaining_time": "2:59:41"} +{"current_steps": 2680, "total_steps": 3962, "loss": 0.4426, "lr": 1.1478035796277158e-05, "epoch": 4.735632183908046, "percentage": 67.64, "elapsed_time": "6:14:17", "remaining_time": "2:59:02"} +{"current_steps": 2685, "total_steps": 3962, "loss": 0.422, "lr": 1.1398395738872683e-05, "epoch": 4.74447391688771, "percentage": 67.77, "elapsed_time": "6:14:55", "remaining_time": "2:58:19"} +{"current_steps": 2690, "total_steps": 3962, "loss": 0.4646, "lr": 1.1318922674919675e-05, "epoch": 4.753315649867374, "percentage": 67.9, "elapsed_time": "6:15:47", "remaining_time": "2:57:41"} +{"current_steps": 2695, "total_steps": 3962, "loss": 0.3928, "lr": 1.1239618147325802e-05, "epoch": 4.762157382847038, "percentage": 68.02, "elapsed_time": "6:16:35", "remaining_time": "2:57:02"} +{"current_steps": 2700, "total_steps": 3962, "loss": 0.4034, "lr": 1.116048369572674e-05, "epoch": 4.770999115826702, "percentage": 68.15, "elapsed_time": "6:17:14", "remaining_time": "2:56:19"} +{"current_steps": 2705, "total_steps": 3962, "loss": 0.409, "lr": 1.1081520856456267e-05, "epoch": 4.779840848806366, "percentage": 68.27, "elapsed_time": "6:17:50", "remaining_time": "2:55:34"} +{"current_steps": 2710, "total_steps": 3962, "loss": 0.4359, "lr": 1.1002731162516453e-05, "epoch": 4.78868258178603, "percentage": 68.4, "elapsed_time": "6:18:24", "remaining_time": "2:54:49"} +{"current_steps": 2715, "total_steps": 3962, "loss": 0.4171, "lr": 1.0924116143547878e-05, "epoch": 4.797524314765694, "percentage": 68.53, "elapsed_time": "6:19:03", "remaining_time": "2:54:06"} +{"current_steps": 2720, "total_steps": 3962, "loss": 0.4312, "lr": 1.0845677325799935e-05, "epoch": 4.8063660477453585, "percentage": 68.65, "elapsed_time": "6:19:42", "remaining_time": "2:53:23"} +{"current_steps": 2725, "total_steps": 3962, "loss": 0.4391, "lr": 1.0767416232101215e-05, "epoch": 4.815207780725022, "percentage": 68.78, "elapsed_time": "6:20:19", "remaining_time": "2:52:38"} +{"current_steps": 2730, "total_steps": 3962, "loss": 0.4088, "lr": 1.0689334381829948e-05, "epoch": 4.824049513704686, "percentage": 68.9, "elapsed_time": "6:21:06", "remaining_time": "2:51:59"} +{"current_steps": 2735, "total_steps": 3962, "loss": 0.4004, "lr": 1.0611433290884472e-05, "epoch": 4.83289124668435, "percentage": 69.03, "elapsed_time": "6:22:04", "remaining_time": "2:51:24"} +{"current_steps": 2740, "total_steps": 3962, "loss": 0.4312, "lr": 1.0533714471653832e-05, "epoch": 4.841732979664014, "percentage": 69.16, "elapsed_time": "6:22:50", "remaining_time": "2:50:44"} +{"current_steps": 2745, "total_steps": 3962, "loss": 0.4497, "lr": 1.04561794329884e-05, "epoch": 4.850574712643678, "percentage": 69.28, "elapsed_time": "6:23:26", "remaining_time": "2:49:59"} +{"current_steps": 2750, "total_steps": 3962, "loss": 0.4322, "lr": 1.0378829680170622e-05, "epoch": 4.859416445623342, "percentage": 69.41, "elapsed_time": "6:24:03", "remaining_time": "2:49:16"} +{"current_steps": 2755, "total_steps": 3962, "loss": 0.4325, "lr": 1.0301666714885725e-05, "epoch": 4.868258178603006, "percentage": 69.54, "elapsed_time": "6:24:41", "remaining_time": "2:48:32"} +{"current_steps": 2760, "total_steps": 3962, "loss": 0.4438, "lr": 1.0224692035192625e-05, "epoch": 4.87709991158267, "percentage": 69.66, "elapsed_time": "6:25:18", "remaining_time": "2:47:48"} +{"current_steps": 2765, "total_steps": 3962, "loss": 0.4236, "lr": 1.0147907135494803e-05, "epoch": 4.885941644562334, "percentage": 69.79, "elapsed_time": "6:25:54", "remaining_time": "2:47:03"} +{"current_steps": 2770, "total_steps": 3962, "loss": 0.3959, "lr": 1.0071313506511334e-05, "epoch": 4.894783377541998, "percentage": 69.91, "elapsed_time": "6:26:37", "remaining_time": "2:46:22"} +{"current_steps": 2775, "total_steps": 3962, "loss": 0.3991, "lr": 9.9949126352479e-06, "epoch": 4.903625110521662, "percentage": 70.04, "elapsed_time": "6:27:26", "remaining_time": "2:45:43"} +{"current_steps": 2780, "total_steps": 3962, "loss": 0.4288, "lr": 9.918706004967948e-06, "epoch": 4.912466843501326, "percentage": 70.17, "elapsed_time": "6:28:08", "remaining_time": "2:45:01"} +{"current_steps": 2785, "total_steps": 3962, "loss": 0.423, "lr": 9.842695095163878e-06, "epoch": 4.921308576480991, "percentage": 70.29, "elapsed_time": "6:28:54", "remaining_time": "2:44:21"} +{"current_steps": 2790, "total_steps": 3962, "loss": 0.4199, "lr": 9.766881381528357e-06, "epoch": 4.930150309460654, "percentage": 70.42, "elapsed_time": "6:29:28", "remaining_time": "2:43:36"} +{"current_steps": 2795, "total_steps": 3962, "loss": 0.4507, "lr": 9.691266335925615e-06, "epoch": 4.938992042440319, "percentage": 70.55, "elapsed_time": "6:30:11", "remaining_time": "2:42:54"} +{"current_steps": 2800, "total_steps": 3962, "loss": 0.4385, "lr": 9.615851426362904e-06, "epoch": 4.947833775419983, "percentage": 70.67, "elapsed_time": "6:30:43", "remaining_time": "2:42:08"} +{"current_steps": 2805, "total_steps": 3962, "loss": 0.4195, "lr": 9.540638116961986e-06, "epoch": 4.9566755083996465, "percentage": 70.8, "elapsed_time": "6:31:23", "remaining_time": "2:41:26"} +{"current_steps": 2810, "total_steps": 3962, "loss": 0.4017, "lr": 9.465627867930734e-06, "epoch": 4.9655172413793105, "percentage": 70.92, "elapsed_time": "6:31:53", "remaining_time": "2:40:39"} +{"current_steps": 2815, "total_steps": 3962, "loss": 0.4037, "lr": 9.390822135534738e-06, "epoch": 4.9743589743589745, "percentage": 71.05, "elapsed_time": "6:32:43", "remaining_time": "2:40:01"} +{"current_steps": 2820, "total_steps": 3962, "loss": 0.4356, "lr": 9.31622237206907e-06, "epoch": 4.983200707338638, "percentage": 71.18, "elapsed_time": "6:33:23", "remaining_time": "2:39:18"} +{"current_steps": 2825, "total_steps": 3962, "loss": 0.4128, "lr": 9.241830025830059e-06, "epoch": 4.992042440318302, "percentage": 71.3, "elapsed_time": "6:34:06", "remaining_time": "2:38:37"} +{"current_steps": 2830, "total_steps": 3962, "loss": 0.4185, "lr": 9.167646541087216e-06, "epoch": 5.0, "percentage": 71.43, "elapsed_time": "6:34:45", "remaining_time": "2:37:54"} +{"current_steps": 2835, "total_steps": 3962, "loss": 0.418, "lr": 9.09367335805515e-06, "epoch": 5.008841732979664, "percentage": 71.55, "elapsed_time": "6:35:28", "remaining_time": "2:37:12"} +{"current_steps": 2840, "total_steps": 3962, "loss": 0.3993, "lr": 9.019911912865634e-06, "epoch": 5.017683465959328, "percentage": 71.68, "elapsed_time": "6:36:22", "remaining_time": "2:36:35"} +{"current_steps": 2845, "total_steps": 3962, "loss": 0.3912, "lr": 8.946363637539699e-06, "epoch": 5.026525198938992, "percentage": 71.81, "elapsed_time": "6:37:13", "remaining_time": "2:35:57"} +{"current_steps": 2850, "total_steps": 3962, "loss": 0.387, "lr": 8.87302995995988e-06, "epoch": 5.035366931918656, "percentage": 71.93, "elapsed_time": "6:38:00", "remaining_time": "2:35:17"} +{"current_steps": 2855, "total_steps": 3962, "loss": 0.4087, "lr": 8.799912303842437e-06, "epoch": 5.04420866489832, "percentage": 72.06, "elapsed_time": "6:38:39", "remaining_time": "2:34:34"} +{"current_steps": 2860, "total_steps": 3962, "loss": 0.3722, "lr": 8.727012088709751e-06, "epoch": 5.053050397877984, "percentage": 72.19, "elapsed_time": "6:39:18", "remaining_time": "2:33:51"} +{"current_steps": 2865, "total_steps": 3962, "loss": 0.3869, "lr": 8.654330729862752e-06, "epoch": 5.061892130857648, "percentage": 72.31, "elapsed_time": "6:40:03", "remaining_time": "2:33:10"} +{"current_steps": 2870, "total_steps": 3962, "loss": 0.3783, "lr": 8.58186963835346e-06, "epoch": 5.0707338638373125, "percentage": 72.44, "elapsed_time": "6:40:56", "remaining_time": "2:32:33"} +{"current_steps": 2875, "total_steps": 3962, "loss": 0.4093, "lr": 8.509630220957554e-06, "epoch": 5.0795755968169765, "percentage": 72.56, "elapsed_time": "6:41:19", "remaining_time": "2:31:44"} +{"current_steps": 2880, "total_steps": 3962, "loss": 0.3913, "lr": 8.437613880147093e-06, "epoch": 5.08841732979664, "percentage": 72.69, "elapsed_time": "6:41:52", "remaining_time": "2:30:58"} +{"current_steps": 2885, "total_steps": 3962, "loss": 0.3658, "lr": 8.365822014063287e-06, "epoch": 5.097259062776304, "percentage": 72.82, "elapsed_time": "6:42:32", "remaining_time": "2:30:16"} +{"current_steps": 2890, "total_steps": 3962, "loss": 0.3952, "lr": 8.29425601648933e-06, "epoch": 5.106100795755968, "percentage": 72.94, "elapsed_time": "6:43:07", "remaining_time": "2:29:31"} +{"current_steps": 2895, "total_steps": 3962, "loss": 0.3976, "lr": 8.222917276823361e-06, "epoch": 5.114942528735632, "percentage": 73.07, "elapsed_time": "6:43:43", "remaining_time": "2:28:47"} +{"current_steps": 2900, "total_steps": 3962, "loss": 0.4313, "lr": 8.151807180051474e-06, "epoch": 5.123784261715296, "percentage": 73.2, "elapsed_time": "6:44:16", "remaining_time": "2:28:02"} +{"current_steps": 2905, "total_steps": 3962, "loss": 0.4158, "lr": 8.080927106720862e-06, "epoch": 5.13262599469496, "percentage": 73.32, "elapsed_time": "6:45:00", "remaining_time": "2:27:21"} +{"current_steps": 2910, "total_steps": 3962, "loss": 0.4258, "lr": 8.010278432912971e-06, "epoch": 5.141467727674624, "percentage": 73.45, "elapsed_time": "6:45:35", "remaining_time": "2:26:37"} +{"current_steps": 2915, "total_steps": 3962, "loss": 0.3872, "lr": 7.939862530216808e-06, "epoch": 5.150309460654288, "percentage": 73.57, "elapsed_time": "6:46:13", "remaining_time": "2:25:54"} +{"current_steps": 2920, "total_steps": 3962, "loss": 0.4319, "lr": 7.869680765702313e-06, "epoch": 5.159151193633952, "percentage": 73.7, "elapsed_time": "6:46:55", "remaining_time": "2:25:12"} +{"current_steps": 2925, "total_steps": 3962, "loss": 0.3872, "lr": 7.799734501893825e-06, "epoch": 5.167992926613616, "percentage": 73.83, "elapsed_time": "6:48:03", "remaining_time": "2:24:39"} +{"current_steps": 2930, "total_steps": 3962, "loss": 0.4124, "lr": 7.730025096743601e-06, "epoch": 5.17683465959328, "percentage": 73.95, "elapsed_time": "6:48:38", "remaining_time": "2:23:55"} +{"current_steps": 2935, "total_steps": 3962, "loss": 0.3949, "lr": 7.6605539036055e-06, "epoch": 5.185676392572944, "percentage": 74.08, "elapsed_time": "6:49:25", "remaining_time": "2:23:15"} +{"current_steps": 2940, "total_steps": 3962, "loss": 0.3833, "lr": 7.591322271208639e-06, "epoch": 5.194518125552609, "percentage": 74.2, "elapsed_time": "6:50:07", "remaining_time": "2:22:34"} +{"current_steps": 2945, "total_steps": 3962, "loss": 0.3966, "lr": 7.522331543631289e-06, "epoch": 5.203359858532273, "percentage": 74.33, "elapsed_time": "6:50:42", "remaining_time": "2:21:49"} +{"current_steps": 2950, "total_steps": 3962, "loss": 0.3912, "lr": 7.453583060274714e-06, "epoch": 5.212201591511937, "percentage": 74.46, "elapsed_time": "6:51:15", "remaining_time": "2:21:05"} +{"current_steps": 2955, "total_steps": 3962, "loss": 0.4172, "lr": 7.385078155837226e-06, "epoch": 5.221043324491601, "percentage": 74.58, "elapsed_time": "6:51:47", "remaining_time": "2:20:19"} +{"current_steps": 2960, "total_steps": 3962, "loss": 0.3916, "lr": 7.316818160288195e-06, "epoch": 5.2298850574712645, "percentage": 74.71, "elapsed_time": "6:52:34", "remaining_time": "2:19:39"} +{"current_steps": 2965, "total_steps": 3962, "loss": 0.4376, "lr": 7.248804398842322e-06, "epoch": 5.2387267904509285, "percentage": 74.84, "elapsed_time": "6:53:16", "remaining_time": "2:18:58"} +{"current_steps": 2970, "total_steps": 3962, "loss": 0.3725, "lr": 7.181038191933833e-06, "epoch": 5.247568523430592, "percentage": 74.96, "elapsed_time": "6:53:58", "remaining_time": "2:18:16"} +{"current_steps": 2975, "total_steps": 3962, "loss": 0.3862, "lr": 7.113520855190907e-06, "epoch": 5.256410256410256, "percentage": 75.09, "elapsed_time": "6:54:29", "remaining_time": "2:17:30"} +{"current_steps": 2980, "total_steps": 3962, "loss": 0.3901, "lr": 7.046253699410058e-06, "epoch": 5.26525198938992, "percentage": 75.21, "elapsed_time": "6:55:12", "remaining_time": "2:16:49"} +{"current_steps": 2985, "total_steps": 3962, "loss": 0.3823, "lr": 6.979238030530775e-06, "epoch": 5.274093722369584, "percentage": 75.34, "elapsed_time": "6:56:05", "remaining_time": "2:16:11"} +{"current_steps": 2990, "total_steps": 3962, "loss": 0.375, "lr": 6.912475149610094e-06, "epoch": 5.282935455349248, "percentage": 75.47, "elapsed_time": "6:56:51", "remaining_time": "2:15:30"} +{"current_steps": 2995, "total_steps": 3962, "loss": 0.4253, "lr": 6.8459663527973995e-06, "epoch": 5.291777188328912, "percentage": 75.59, "elapsed_time": "6:57:27", "remaining_time": "2:14:47"} +{"current_steps": 3000, "total_steps": 3962, "loss": 0.4069, "lr": 6.779712931309186e-06, "epoch": 5.300618921308576, "percentage": 75.72, "elapsed_time": "6:58:17", "remaining_time": "2:14:07"} +{"current_steps": 3005, "total_steps": 3962, "loss": 0.4349, "lr": 6.713716171404086e-06, "epoch": 5.30946065428824, "percentage": 75.85, "elapsed_time": "6:59:43", "remaining_time": "2:13:40"} +{"current_steps": 3010, "total_steps": 3962, "loss": 0.4308, "lr": 6.647977354357804e-06, "epoch": 5.318302387267904, "percentage": 75.97, "elapsed_time": "7:00:18", "remaining_time": "2:12:55"} +{"current_steps": 3015, "total_steps": 3962, "loss": 0.386, "lr": 6.582497756438326e-06, "epoch": 5.327144120247569, "percentage": 76.1, "elapsed_time": "7:00:56", "remaining_time": "2:12:12"} +{"current_steps": 3020, "total_steps": 3962, "loss": 0.3716, "lr": 6.517278648881054e-06, "epoch": 5.335985853227233, "percentage": 76.22, "elapsed_time": "7:01:43", "remaining_time": "2:11:32"} +{"current_steps": 3025, "total_steps": 3962, "loss": 0.4082, "lr": 6.452321297864212e-06, "epoch": 5.344827586206897, "percentage": 76.35, "elapsed_time": "7:02:24", "remaining_time": "2:10:50"} +{"current_steps": 3030, "total_steps": 3962, "loss": 0.3963, "lr": 6.387626964484197e-06, "epoch": 5.353669319186561, "percentage": 76.48, "elapsed_time": "7:03:04", "remaining_time": "2:10:08"} +{"current_steps": 3035, "total_steps": 3962, "loss": 0.3854, "lr": 6.323196904731155e-06, "epoch": 5.362511052166225, "percentage": 76.6, "elapsed_time": "7:03:46", "remaining_time": "2:09:26"} +{"current_steps": 3040, "total_steps": 3962, "loss": 0.3956, "lr": 6.259032369464522e-06, "epoch": 5.371352785145889, "percentage": 76.73, "elapsed_time": "7:04:28", "remaining_time": "2:08:44"} +{"current_steps": 3045, "total_steps": 3962, "loss": 0.4388, "lr": 6.195134604388819e-06, "epoch": 5.380194518125553, "percentage": 76.86, "elapsed_time": "7:05:10", "remaining_time": "2:08:02"} +{"current_steps": 3050, "total_steps": 3962, "loss": 0.4576, "lr": 6.1315048500294125e-06, "epoch": 5.389036251105217, "percentage": 76.98, "elapsed_time": "7:05:44", "remaining_time": "2:07:18"} +{"current_steps": 3055, "total_steps": 3962, "loss": 0.4117, "lr": 6.068144341708464e-06, "epoch": 5.3978779840848805, "percentage": 77.11, "elapsed_time": "7:06:30", "remaining_time": "2:06:37"} +{"current_steps": 3060, "total_steps": 3962, "loss": 0.402, "lr": 6.0050543095209215e-06, "epoch": 5.4067197170645445, "percentage": 77.23, "elapsed_time": "7:07:20", "remaining_time": "2:05:58"} +{"current_steps": 3065, "total_steps": 3962, "loss": 0.4086, "lr": 5.942235978310649e-06, "epoch": 5.415561450044208, "percentage": 77.36, "elapsed_time": "7:08:07", "remaining_time": "2:05:17"} +{"current_steps": 3070, "total_steps": 3962, "loss": 0.4072, "lr": 5.879690567646645e-06, "epoch": 5.424403183023872, "percentage": 77.49, "elapsed_time": "7:09:03", "remaining_time": "2:04:39"} +{"current_steps": 3075, "total_steps": 3962, "loss": 0.4171, "lr": 5.817419291799388e-06, "epoch": 5.433244916003536, "percentage": 77.61, "elapsed_time": "7:10:00", "remaining_time": "2:04:02"} +{"current_steps": 3080, "total_steps": 3962, "loss": 0.3953, "lr": 5.755423359717222e-06, "epoch": 5.442086648983201, "percentage": 77.74, "elapsed_time": "7:10:36", "remaining_time": "2:03:18"} +{"current_steps": 3085, "total_steps": 3962, "loss": 0.4028, "lr": 5.693703975002911e-06, "epoch": 5.450928381962865, "percentage": 77.86, "elapsed_time": "7:11:23", "remaining_time": "2:02:38"} +{"current_steps": 3090, "total_steps": 3962, "loss": 0.3457, "lr": 5.632262335890262e-06, "epoch": 5.459770114942529, "percentage": 77.99, "elapsed_time": "7:12:01", "remaining_time": "2:01:55"} +{"current_steps": 3095, "total_steps": 3962, "loss": 0.3906, "lr": 5.571099635220887e-06, "epoch": 5.468611847922193, "percentage": 78.12, "elapsed_time": "7:12:46", "remaining_time": "2:01:14"} +{"current_steps": 3100, "total_steps": 3962, "loss": 0.3922, "lr": 5.510217060421006e-06, "epoch": 5.477453580901857, "percentage": 78.24, "elapsed_time": "7:13:26", "remaining_time": "2:00:31"} +{"current_steps": 3105, "total_steps": 3962, "loss": 0.4078, "lr": 5.449615793478411e-06, "epoch": 5.486295313881521, "percentage": 78.37, "elapsed_time": "7:14:10", "remaining_time": "1:59:50"} +{"current_steps": 3110, "total_steps": 3962, "loss": 0.4097, "lr": 5.389297010919545e-06, "epoch": 5.495137046861185, "percentage": 78.5, "elapsed_time": "7:14:58", "remaining_time": "1:59:09"} +{"current_steps": 3115, "total_steps": 3962, "loss": 0.4226, "lr": 5.329261883786611e-06, "epoch": 5.503978779840849, "percentage": 78.62, "elapsed_time": "7:15:38", "remaining_time": "1:58:27"} +{"current_steps": 3120, "total_steps": 3962, "loss": 0.3965, "lr": 5.2695115776148765e-06, "epoch": 5.512820512820513, "percentage": 78.75, "elapsed_time": "7:16:10", "remaining_time": "1:57:42"} +{"current_steps": 3125, "total_steps": 3962, "loss": 0.3822, "lr": 5.21004725241002e-06, "epoch": 5.521662245800177, "percentage": 78.87, "elapsed_time": "7:16:57", "remaining_time": "1:57:01"} +{"current_steps": 3130, "total_steps": 3962, "loss": 0.3983, "lr": 5.150870062625639e-06, "epoch": 5.530503978779841, "percentage": 79.0, "elapsed_time": "7:17:52", "remaining_time": "1:56:23"} +{"current_steps": 3135, "total_steps": 3962, "loss": 0.4035, "lr": 5.091981157140808e-06, "epoch": 5.539345711759505, "percentage": 79.13, "elapsed_time": "7:18:27", "remaining_time": "1:55:39"} +{"current_steps": 3140, "total_steps": 3962, "loss": 0.3976, "lr": 5.03338167923779e-06, "epoch": 5.548187444739169, "percentage": 79.25, "elapsed_time": "7:19:24", "remaining_time": "1:55:01"} +{"current_steps": 3145, "total_steps": 3962, "loss": 0.4048, "lr": 4.975072766579829e-06, "epoch": 5.5570291777188325, "percentage": 79.38, "elapsed_time": "7:20:10", "remaining_time": "1:54:20"} +{"current_steps": 3150, "total_steps": 3962, "loss": 0.3766, "lr": 4.917055551189089e-06, "epoch": 5.5658709106984965, "percentage": 79.51, "elapsed_time": "7:20:56", "remaining_time": "1:53:39"} +{"current_steps": 3155, "total_steps": 3962, "loss": 0.3818, "lr": 4.859331159424645e-06, "epoch": 5.574712643678161, "percentage": 79.63, "elapsed_time": "7:21:33", "remaining_time": "1:52:56"} +{"current_steps": 3160, "total_steps": 3962, "loss": 0.3838, "lr": 4.801900711960628e-06, "epoch": 5.583554376657825, "percentage": 79.76, "elapsed_time": "7:22:10", "remaining_time": "1:52:13"} +{"current_steps": 3165, "total_steps": 3962, "loss": 0.4141, "lr": 4.744765323764469e-06, "epoch": 5.592396109637489, "percentage": 79.88, "elapsed_time": "7:22:43", "remaining_time": "1:51:29"} +{"current_steps": 3170, "total_steps": 3962, "loss": 0.3959, "lr": 4.6879261040752685e-06, "epoch": 5.601237842617153, "percentage": 80.01, "elapsed_time": "7:23:28", "remaining_time": "1:50:47"} +{"current_steps": 3175, "total_steps": 3962, "loss": 0.4117, "lr": 4.63138415638223e-06, "epoch": 5.610079575596817, "percentage": 80.14, "elapsed_time": "7:24:08", "remaining_time": "1:50:05"} +{"current_steps": 3180, "total_steps": 3962, "loss": 0.4084, "lr": 4.575140578403256e-06, "epoch": 5.618921308576481, "percentage": 80.26, "elapsed_time": "7:24:50", "remaining_time": "1:49:23"} +{"current_steps": 3185, "total_steps": 3962, "loss": 0.3603, "lr": 4.519196462063628e-06, "epoch": 5.627763041556145, "percentage": 80.39, "elapsed_time": "7:25:43", "remaining_time": "1:48:44"} +{"current_steps": 3190, "total_steps": 3962, "loss": 0.4099, "lr": 4.4635528934748315e-06, "epoch": 5.636604774535809, "percentage": 80.51, "elapsed_time": "7:26:26", "remaining_time": "1:48:02"} +{"current_steps": 3195, "total_steps": 3962, "loss": 0.4076, "lr": 4.408210952913434e-06, "epoch": 5.645446507515473, "percentage": 80.64, "elapsed_time": "7:26:54", "remaining_time": "1:47:17"} +{"current_steps": 3200, "total_steps": 3962, "loss": 0.3617, "lr": 4.353171714800135e-06, "epoch": 5.654288240495137, "percentage": 80.77, "elapsed_time": "7:27:37", "remaining_time": "1:46:35"} +{"current_steps": 3205, "total_steps": 3962, "loss": 0.4097, "lr": 4.298436247678892e-06, "epoch": 5.663129973474801, "percentage": 80.89, "elapsed_time": "7:28:15", "remaining_time": "1:45:52"} +{"current_steps": 3210, "total_steps": 3962, "loss": 0.4246, "lr": 4.2440056141962116e-06, "epoch": 5.671971706454465, "percentage": 81.02, "elapsed_time": "7:28:51", "remaining_time": "1:45:09"} +{"current_steps": 3215, "total_steps": 3962, "loss": 0.4049, "lr": 4.189880871080465e-06, "epoch": 5.680813439434129, "percentage": 81.15, "elapsed_time": "7:29:38", "remaining_time": "1:44:28"} +{"current_steps": 3220, "total_steps": 3962, "loss": 0.3795, "lr": 4.136063069121412e-06, "epoch": 5.689655172413794, "percentage": 81.27, "elapsed_time": "7:30:13", "remaining_time": "1:43:44"} +{"current_steps": 3225, "total_steps": 3962, "loss": 0.3919, "lr": 4.082553253149784e-06, "epoch": 5.698496905393457, "percentage": 81.4, "elapsed_time": "7:30:59", "remaining_time": "1:43:03"} +{"current_steps": 3230, "total_steps": 3962, "loss": 0.4019, "lr": 4.029352462017016e-06, "epoch": 5.7073386383731215, "percentage": 81.52, "elapsed_time": "7:31:41", "remaining_time": "1:42:21"} +{"current_steps": 3235, "total_steps": 3962, "loss": 0.3985, "lr": 3.9764617285750516e-06, "epoch": 5.7161803713527854, "percentage": 81.65, "elapsed_time": "7:32:30", "remaining_time": "1:41:41"} +{"current_steps": 3240, "total_steps": 3962, "loss": 0.3979, "lr": 3.923882079656311e-06, "epoch": 5.725022104332449, "percentage": 81.78, "elapsed_time": "7:33:08", "remaining_time": "1:40:58"} +{"current_steps": 3245, "total_steps": 3962, "loss": 0.3869, "lr": 3.8716145360537516e-06, "epoch": 5.733863837312113, "percentage": 81.9, "elapsed_time": "7:33:52", "remaining_time": "1:40:17"} +{"current_steps": 3250, "total_steps": 3962, "loss": 0.4063, "lr": 3.819660112501053e-06, "epoch": 5.742705570291777, "percentage": 82.03, "elapsed_time": "7:34:36", "remaining_time": "1:39:35"} +{"current_steps": 3255, "total_steps": 3962, "loss": 0.4158, "lr": 3.768019817652906e-06, "epoch": 5.751547303271441, "percentage": 82.16, "elapsed_time": "7:35:07", "remaining_time": "1:38:51"} +{"current_steps": 3260, "total_steps": 3962, "loss": 0.3863, "lr": 3.7166946540654403e-06, "epoch": 5.760389036251105, "percentage": 82.28, "elapsed_time": "7:35:47", "remaining_time": "1:38:08"} +{"current_steps": 3265, "total_steps": 3962, "loss": 0.427, "lr": 3.6656856181767487e-06, "epoch": 5.769230769230769, "percentage": 82.41, "elapsed_time": "7:36:22", "remaining_time": "1:37:25"} +{"current_steps": 3270, "total_steps": 3962, "loss": 0.4139, "lr": 3.6149937002875725e-06, "epoch": 5.778072502210433, "percentage": 82.53, "elapsed_time": "7:36:46", "remaining_time": "1:36:39"} +{"current_steps": 3275, "total_steps": 3962, "loss": 0.4073, "lr": 3.564619884542033e-06, "epoch": 5.786914235190097, "percentage": 82.66, "elapsed_time": "7:37:14", "remaining_time": "1:35:55"} +{"current_steps": 3280, "total_steps": 3962, "loss": 0.4115, "lr": 3.514565148908553e-06, "epoch": 5.795755968169761, "percentage": 82.79, "elapsed_time": "7:37:51", "remaining_time": "1:35:12"} +{"current_steps": 3285, "total_steps": 3962, "loss": 0.3956, "lr": 3.4648304651608623e-06, "epoch": 5.804597701149425, "percentage": 82.91, "elapsed_time": "7:38:40", "remaining_time": "1:34:31"} +{"current_steps": 3290, "total_steps": 3962, "loss": 0.3837, "lr": 3.4154167988591367e-06, "epoch": 5.813439434129089, "percentage": 83.04, "elapsed_time": "7:39:31", "remaining_time": "1:33:51"} +{"current_steps": 3295, "total_steps": 3962, "loss": 0.4257, "lr": 3.3663251093312477e-06, "epoch": 5.822281167108754, "percentage": 83.17, "elapsed_time": "7:40:07", "remaining_time": "1:33:08"} +{"current_steps": 3300, "total_steps": 3962, "loss": 0.3822, "lr": 3.317556349654125e-06, "epoch": 5.831122900088418, "percentage": 83.29, "elapsed_time": "7:40:46", "remaining_time": "1:32:26"} +{"current_steps": 3305, "total_steps": 3962, "loss": 0.41, "lr": 3.2691114666352887e-06, "epoch": 5.839964633068082, "percentage": 83.42, "elapsed_time": "7:41:20", "remaining_time": "1:31:42"} +{"current_steps": 3310, "total_steps": 3962, "loss": 0.3794, "lr": 3.220991400794431e-06, "epoch": 5.848806366047746, "percentage": 83.54, "elapsed_time": "7:42:03", "remaining_time": "1:31:00"} +{"current_steps": 3315, "total_steps": 3962, "loss": 0.3949, "lr": 3.1731970863451746e-06, "epoch": 5.85764809902741, "percentage": 83.67, "elapsed_time": "7:42:39", "remaining_time": "1:30:17"} +{"current_steps": 3320, "total_steps": 3962, "loss": 0.3945, "lr": 3.1257294511769263e-06, "epoch": 5.8664898320070735, "percentage": 83.8, "elapsed_time": "7:43:07", "remaining_time": "1:29:33"} +{"current_steps": 3325, "total_steps": 3962, "loss": 0.4101, "lr": 3.0785894168368857e-06, "epoch": 5.8753315649867375, "percentage": 83.92, "elapsed_time": "7:43:47", "remaining_time": "1:28:51"} +{"current_steps": 3330, "total_steps": 3962, "loss": 0.4128, "lr": 3.0317778985121182e-06, "epoch": 5.884173297966401, "percentage": 84.05, "elapsed_time": "7:44:42", "remaining_time": "1:28:11"} +{"current_steps": 3335, "total_steps": 3962, "loss": 0.4182, "lr": 2.9852958050118275e-06, "epoch": 5.893015030946065, "percentage": 84.17, "elapsed_time": "7:45:24", "remaining_time": "1:27:29"} +{"current_steps": 3340, "total_steps": 3962, "loss": 0.4242, "lr": 2.9391440387496617e-06, "epoch": 5.901856763925729, "percentage": 84.3, "elapsed_time": "7:46:02", "remaining_time": "1:26:47"} +{"current_steps": 3345, "total_steps": 3962, "loss": 0.3703, "lr": 2.89332349572625e-06, "epoch": 5.910698496905393, "percentage": 84.43, "elapsed_time": "7:46:46", "remaining_time": "1:26:05"} +{"current_steps": 3350, "total_steps": 3962, "loss": 0.3988, "lr": 2.847835065511766e-06, "epoch": 5.919540229885057, "percentage": 84.55, "elapsed_time": "7:47:17", "remaining_time": "1:25:22"} +{"current_steps": 3355, "total_steps": 3962, "loss": 0.4373, "lr": 2.8026796312286843e-06, "epoch": 5.928381962864721, "percentage": 84.68, "elapsed_time": "7:48:04", "remaining_time": "1:24:41"} +{"current_steps": 3360, "total_steps": 3962, "loss": 0.3984, "lr": 2.757858069534598e-06, "epoch": 5.937223695844385, "percentage": 84.81, "elapsed_time": "7:48:54", "remaining_time": "1:24:00"} +{"current_steps": 3365, "total_steps": 3962, "loss": 0.417, "lr": 2.71337125060525e-06, "epoch": 5.946065428824049, "percentage": 84.93, "elapsed_time": "7:49:24", "remaining_time": "1:23:16"} +{"current_steps": 3370, "total_steps": 3962, "loss": 0.4419, "lr": 2.669220038117597e-06, "epoch": 5.954907161803714, "percentage": 85.06, "elapsed_time": "7:49:59", "remaining_time": "1:22:33"} +{"current_steps": 3375, "total_steps": 3962, "loss": 0.4438, "lr": 2.6254052892330737e-06, "epoch": 5.963748894783378, "percentage": 85.18, "elapsed_time": "7:50:34", "remaining_time": "1:21:50"} +{"current_steps": 3380, "total_steps": 3962, "loss": 0.4149, "lr": 2.5819278545809103e-06, "epoch": 5.972590627763042, "percentage": 85.31, "elapsed_time": "7:51:30", "remaining_time": "1:21:11"} +{"current_steps": 3385, "total_steps": 3962, "loss": 0.3631, "lr": 2.5387885782416712e-06, "epoch": 5.981432360742706, "percentage": 85.44, "elapsed_time": "7:52:05", "remaining_time": "1:20:28"} +{"current_steps": 3390, "total_steps": 3962, "loss": 0.4035, "lr": 2.495988297730818e-06, "epoch": 5.99027409372237, "percentage": 85.56, "elapsed_time": "7:52:41", "remaining_time": "1:19:45"} +{"current_steps": 3395, "total_steps": 3962, "loss": 0.3689, "lr": 2.453527843982497e-06, "epoch": 5.999115826702034, "percentage": 85.69, "elapsed_time": "7:53:28", "remaining_time": "1:19:04"} +{"current_steps": 3400, "total_steps": 3962, "loss": 0.3823, "lr": 2.4114080413333474e-06, "epoch": 6.007073386383731, "percentage": 85.82, "elapsed_time": "7:54:06", "remaining_time": "1:18:22"} +{"current_steps": 3405, "total_steps": 3962, "loss": 0.3901, "lr": 2.369629707506569e-06, "epoch": 6.015915119363395, "percentage": 85.94, "elapsed_time": "7:54:44", "remaining_time": "1:17:39"} +{"current_steps": 3410, "total_steps": 3962, "loss": 0.3892, "lr": 2.328193653595985e-06, "epoch": 6.024756852343059, "percentage": 86.07, "elapsed_time": "7:55:36", "remaining_time": "1:16:59"} +{"current_steps": 3415, "total_steps": 3962, "loss": 0.385, "lr": 2.2871006840503384e-06, "epoch": 6.033598585322723, "percentage": 86.19, "elapsed_time": "7:56:22", "remaining_time": "1:16:18"} +{"current_steps": 3420, "total_steps": 3962, "loss": 0.3856, "lr": 2.2463515966576342e-06, "epoch": 6.042440318302387, "percentage": 86.32, "elapsed_time": "7:57:02", "remaining_time": "1:15:36"} +{"current_steps": 3425, "total_steps": 3962, "loss": 0.3931, "lr": 2.2059471825296973e-06, "epoch": 6.051282051282051, "percentage": 86.45, "elapsed_time": "7:57:43", "remaining_time": "1:14:54"} +{"current_steps": 3430, "total_steps": 3962, "loss": 0.3711, "lr": 2.1658882260867698e-06, "epoch": 6.060123784261715, "percentage": 86.57, "elapsed_time": "7:58:18", "remaining_time": "1:14:11"} +{"current_steps": 3435, "total_steps": 3962, "loss": 0.3914, "lr": 2.1261755050423204e-06, "epoch": 6.068965517241379, "percentage": 86.7, "elapsed_time": "7:58:59", "remaining_time": "1:13:29"} +{"current_steps": 3440, "total_steps": 3962, "loss": 0.3824, "lr": 2.086809790387905e-06, "epoch": 6.077807250221043, "percentage": 86.82, "elapsed_time": "7:59:30", "remaining_time": "1:12:45"} +{"current_steps": 3445, "total_steps": 3962, "loss": 0.3832, "lr": 2.047791846378242e-06, "epoch": 6.086648983200707, "percentage": 86.95, "elapsed_time": "8:00:13", "remaining_time": "1:12:04"} +{"current_steps": 3450, "total_steps": 3962, "loss": 0.3862, "lr": 2.009122430516337e-06, "epoch": 6.095490716180372, "percentage": 87.08, "elapsed_time": "8:01:00", "remaining_time": "1:11:23"} +{"current_steps": 3455, "total_steps": 3962, "loss": 0.3777, "lr": 1.970802293538807e-06, "epoch": 6.104332449160036, "percentage": 87.2, "elapsed_time": "8:01:51", "remaining_time": "1:10:42"} +{"current_steps": 3460, "total_steps": 3962, "loss": 0.3882, "lr": 1.9328321794012762e-06, "epoch": 6.1131741821397, "percentage": 87.33, "elapsed_time": "8:02:41", "remaining_time": "1:10:01"} +{"current_steps": 3465, "total_steps": 3962, "loss": 0.3912, "lr": 1.895212825263959e-06, "epoch": 6.122015915119364, "percentage": 87.46, "elapsed_time": "8:03:20", "remaining_time": "1:09:19"} +{"current_steps": 3470, "total_steps": 3962, "loss": 0.3729, "lr": 1.8579449614773314e-06, "epoch": 6.130857648099028, "percentage": 87.58, "elapsed_time": "8:04:13", "remaining_time": "1:08:39"} +{"current_steps": 3475, "total_steps": 3962, "loss": 0.4061, "lr": 1.8210293115679677e-06, "epoch": 6.1396993810786915, "percentage": 87.71, "elapsed_time": "8:04:45", "remaining_time": "1:07:56"} +{"current_steps": 3480, "total_steps": 3962, "loss": 0.3966, "lr": 1.784466592224472e-06, "epoch": 6.1485411140583555, "percentage": 87.83, "elapsed_time": "8:05:22", "remaining_time": "1:07:13"} +{"current_steps": 3485, "total_steps": 3962, "loss": 0.3926, "lr": 1.74825751328358e-06, "epoch": 6.157382847038019, "percentage": 87.96, "elapsed_time": "8:06:09", "remaining_time": "1:06:32"} +{"current_steps": 3490, "total_steps": 3962, "loss": 0.4201, "lr": 1.7124027777163732e-06, "epoch": 6.166224580017683, "percentage": 88.09, "elapsed_time": "8:06:45", "remaining_time": "1:05:49"} +{"current_steps": 3495, "total_steps": 3962, "loss": 0.3965, "lr": 1.6769030816146404e-06, "epoch": 6.175066312997347, "percentage": 88.21, "elapsed_time": "8:07:23", "remaining_time": "1:05:07"} +{"current_steps": 3500, "total_steps": 3962, "loss": 0.4146, "lr": 1.6417591141773458e-06, "epoch": 6.183908045977011, "percentage": 88.34, "elapsed_time": "8:08:07", "remaining_time": "1:04:25"} +{"current_steps": 3505, "total_steps": 3962, "loss": 0.3904, "lr": 1.6069715576972634e-06, "epoch": 6.192749778956675, "percentage": 88.47, "elapsed_time": "8:08:42", "remaining_time": "1:03:43"} +{"current_steps": 3510, "total_steps": 3962, "loss": 0.3608, "lr": 1.5725410875477187e-06, "epoch": 6.201591511936339, "percentage": 88.59, "elapsed_time": "8:09:16", "remaining_time": "1:03:00"} +{"current_steps": 3515, "total_steps": 3962, "loss": 0.3889, "lr": 1.5384683721694993e-06, "epoch": 6.210433244916003, "percentage": 88.72, "elapsed_time": "8:09:55", "remaining_time": "1:02:18"} +{"current_steps": 3520, "total_steps": 3962, "loss": 0.4015, "lr": 1.504754073057846e-06, "epoch": 6.219274977895668, "percentage": 88.84, "elapsed_time": "8:10:41", "remaining_time": "1:01:36"} +{"current_steps": 3525, "total_steps": 3962, "loss": 0.4037, "lr": 1.4713988447496342e-06, "epoch": 6.228116710875332, "percentage": 88.97, "elapsed_time": "8:11:14", "remaining_time": "1:00:54"} +{"current_steps": 3530, "total_steps": 3962, "loss": 0.3768, "lr": 1.438403334810663e-06, "epoch": 6.236958443854996, "percentage": 89.1, "elapsed_time": "8:12:00", "remaining_time": "1:00:12"} +{"current_steps": 3535, "total_steps": 3962, "loss": 0.3864, "lr": 1.405768183823073e-06, "epoch": 6.24580017683466, "percentage": 89.22, "elapsed_time": "8:12:32", "remaining_time": "0:59:29"} +{"current_steps": 3540, "total_steps": 3962, "loss": 0.3777, "lr": 1.3734940253729167e-06, "epoch": 6.254641909814324, "percentage": 89.35, "elapsed_time": "8:13:14", "remaining_time": "0:58:47"} +{"current_steps": 3545, "total_steps": 3962, "loss": 0.3766, "lr": 1.3415814860378573e-06, "epoch": 6.263483642793988, "percentage": 89.48, "elapsed_time": "8:13:48", "remaining_time": "0:58:05"} +{"current_steps": 3550, "total_steps": 3962, "loss": 0.4088, "lr": 1.3100311853750114e-06, "epoch": 6.272325375773652, "percentage": 89.6, "elapsed_time": "8:14:29", "remaining_time": "0:57:23"} +{"current_steps": 3555, "total_steps": 3962, "loss": 0.3869, "lr": 1.2788437359089056e-06, "epoch": 6.281167108753316, "percentage": 89.73, "elapsed_time": "8:15:19", "remaining_time": "0:56:42"} +{"current_steps": 3560, "total_steps": 3962, "loss": 0.3677, "lr": 1.248019743119595e-06, "epoch": 6.29000884173298, "percentage": 89.85, "elapsed_time": "8:16:08", "remaining_time": "0:56:01"} +{"current_steps": 3565, "total_steps": 3962, "loss": 0.3637, "lr": 1.2175598054309058e-06, "epoch": 6.2988505747126435, "percentage": 89.98, "elapsed_time": "8:16:45", "remaining_time": "0:55:19"} +{"current_steps": 3570, "total_steps": 3962, "loss": 0.389, "lr": 1.187464514198824e-06, "epoch": 6.3076923076923075, "percentage": 90.11, "elapsed_time": "8:17:21", "remaining_time": "0:54:36"} +{"current_steps": 3575, "total_steps": 3962, "loss": 0.3619, "lr": 1.1577344537000012e-06, "epoch": 6.316534040671971, "percentage": 90.23, "elapsed_time": "8:18:04", "remaining_time": "0:53:55"} +{"current_steps": 3580, "total_steps": 3962, "loss": 0.4175, "lr": 1.128370201120419e-06, "epoch": 6.325375773651635, "percentage": 90.36, "elapsed_time": "8:18:48", "remaining_time": "0:53:13"} +{"current_steps": 3585, "total_steps": 3962, "loss": 0.3823, "lr": 1.0993723265441835e-06, "epoch": 6.334217506631299, "percentage": 90.48, "elapsed_time": "8:19:32", "remaining_time": "0:52:31"} +{"current_steps": 3590, "total_steps": 3962, "loss": 0.415, "lr": 1.0707413929424626e-06, "epoch": 6.343059239610964, "percentage": 90.61, "elapsed_time": "8:20:12", "remaining_time": "0:51:49"} +{"current_steps": 3595, "total_steps": 3962, "loss": 0.3905, "lr": 1.0424779561625465e-06, "epoch": 6.351900972590628, "percentage": 90.74, "elapsed_time": "8:20:56", "remaining_time": "0:51:08"} +{"current_steps": 3600, "total_steps": 3962, "loss": 0.4086, "lr": 1.0145825649170593e-06, "epoch": 6.360742705570292, "percentage": 90.86, "elapsed_time": "8:21:35", "remaining_time": "0:50:26"} +{"current_steps": 3605, "total_steps": 3962, "loss": 0.3799, "lr": 9.870557607733056e-07, "epoch": 6.369584438549956, "percentage": 90.99, "elapsed_time": "8:22:08", "remaining_time": "0:49:43"} +{"current_steps": 3610, "total_steps": 3962, "loss": 0.4035, "lr": 9.59898078142767e-07, "epoch": 6.37842617152962, "percentage": 91.12, "elapsed_time": "8:22:45", "remaining_time": "0:49:01"} +{"current_steps": 3615, "total_steps": 3962, "loss": 0.4052, "lr": 9.331100442707108e-07, "epoch": 6.387267904509284, "percentage": 91.24, "elapsed_time": "8:23:37", "remaining_time": "0:48:20"} +{"current_steps": 3620, "total_steps": 3962, "loss": 0.389, "lr": 9.066921792259654e-07, "epoch": 6.396109637488948, "percentage": 91.37, "elapsed_time": "8:24:20", "remaining_time": "0:47:38"} +{"current_steps": 3625, "total_steps": 3962, "loss": 0.382, "lr": 8.806449958908115e-07, "epoch": 6.404951370468612, "percentage": 91.49, "elapsed_time": "8:25:06", "remaining_time": "0:46:57"} +{"current_steps": 3630, "total_steps": 3962, "loss": 0.3822, "lr": 8.549689999510446e-07, "epoch": 6.413793103448276, "percentage": 91.62, "elapsed_time": "8:25:53", "remaining_time": "0:46:16"} +{"current_steps": 3635, "total_steps": 3962, "loss": 0.3807, "lr": 8.296646898861405e-07, "epoch": 6.42263483642794, "percentage": 91.75, "elapsed_time": "8:26:40", "remaining_time": "0:45:34"} +{"current_steps": 3640, "total_steps": 3962, "loss": 0.3883, "lr": 8.047325569595821e-07, "epoch": 6.431476569407604, "percentage": 91.87, "elapsed_time": "8:27:33", "remaining_time": "0:44:54"} +{"current_steps": 3645, "total_steps": 3962, "loss": 0.4044, "lr": 7.801730852093193e-07, "epoch": 6.440318302387268, "percentage": 92.0, "elapsed_time": "8:28:33", "remaining_time": "0:44:13"} +{"current_steps": 3650, "total_steps": 3962, "loss": 0.3647, "lr": 7.559867514383867e-07, "epoch": 6.449160035366932, "percentage": 92.13, "elapsed_time": "8:29:23", "remaining_time": "0:43:32"} +{"current_steps": 3655, "total_steps": 3962, "loss": 0.4066, "lr": 7.321740252056253e-07, "epoch": 6.458001768346596, "percentage": 92.25, "elapsed_time": "8:30:18", "remaining_time": "0:42:51"} +{"current_steps": 3660, "total_steps": 3962, "loss": 0.4453, "lr": 7.087353688165776e-07, "epoch": 6.4668435013262595, "percentage": 92.38, "elapsed_time": "8:30:58", "remaining_time": "0:42:09"} +{"current_steps": 3665, "total_steps": 3962, "loss": 0.3908, "lr": 6.856712373145158e-07, "epoch": 6.475685234305924, "percentage": 92.5, "elapsed_time": "8:31:50", "remaining_time": "0:41:28"} +{"current_steps": 3670, "total_steps": 3962, "loss": 0.399, "lr": 6.62982078471599e-07, "epoch": 6.484526967285588, "percentage": 92.63, "elapsed_time": "8:32:42", "remaining_time": "0:40:47"} +{"current_steps": 3675, "total_steps": 3962, "loss": 0.3775, "lr": 6.406683327801877e-07, "epoch": 6.493368700265252, "percentage": 92.76, "elapsed_time": "8:33:16", "remaining_time": "0:40:05"} +{"current_steps": 3680, "total_steps": 3962, "loss": 0.3885, "lr": 6.187304334442856e-07, "epoch": 6.502210433244916, "percentage": 92.88, "elapsed_time": "8:33:59", "remaining_time": "0:39:23"} +{"current_steps": 3685, "total_steps": 3962, "loss": 0.3798, "lr": 5.97168806371129e-07, "epoch": 6.51105216622458, "percentage": 93.01, "elapsed_time": "8:34:41", "remaining_time": "0:38:41"} +{"current_steps": 3690, "total_steps": 3962, "loss": 0.3876, "lr": 5.759838701629284e-07, "epoch": 6.519893899204244, "percentage": 93.13, "elapsed_time": "8:35:19", "remaining_time": "0:37:59"} +{"current_steps": 3695, "total_steps": 3962, "loss": 0.3781, "lr": 5.551760361087288e-07, "epoch": 6.528735632183908, "percentage": 93.26, "elapsed_time": "8:36:00", "remaining_time": "0:37:17"} +{"current_steps": 3700, "total_steps": 3962, "loss": 0.387, "lr": 5.347457081764318e-07, "epoch": 6.537577365163572, "percentage": 93.39, "elapsed_time": "8:36:28", "remaining_time": "0:36:34"} +{"current_steps": 3705, "total_steps": 3962, "loss": 0.3908, "lr": 5.146932830049545e-07, "epoch": 6.546419098143236, "percentage": 93.51, "elapsed_time": "8:37:20", "remaining_time": "0:35:53"} +{"current_steps": 3710, "total_steps": 3962, "loss": 0.391, "lr": 4.950191498965207e-07, "epoch": 6.5552608311229, "percentage": 93.64, "elapsed_time": "8:38:04", "remaining_time": "0:35:11"} +{"current_steps": 3715, "total_steps": 3962, "loss": 0.402, "lr": 4.7572369080910897e-07, "epoch": 6.564102564102564, "percentage": 93.77, "elapsed_time": "8:38:51", "remaining_time": "0:34:29"} +{"current_steps": 3720, "total_steps": 3962, "loss": 0.4178, "lr": 4.568072803490409e-07, "epoch": 6.572944297082228, "percentage": 93.89, "elapsed_time": "8:39:31", "remaining_time": "0:33:47"} +{"current_steps": 3725, "total_steps": 3962, "loss": 0.3803, "lr": 4.382702857637022e-07, "epoch": 6.581786030061892, "percentage": 94.02, "elapsed_time": "8:40:15", "remaining_time": "0:33:06"} +{"current_steps": 3730, "total_steps": 3962, "loss": 0.4013, "lr": 4.2011306693441554e-07, "epoch": 6.590627763041557, "percentage": 94.14, "elapsed_time": "8:40:58", "remaining_time": "0:32:24"} +{"current_steps": 3735, "total_steps": 3962, "loss": 0.3904, "lr": 4.0233597636944565e-07, "epoch": 6.59946949602122, "percentage": 94.27, "elapsed_time": "8:41:39", "remaining_time": "0:31:42"} +{"current_steps": 3740, "total_steps": 3962, "loss": 0.4063, "lr": 3.84939359197174e-07, "epoch": 6.6083112290008845, "percentage": 94.4, "elapsed_time": "8:42:20", "remaining_time": "0:31:00"} +{"current_steps": 3745, "total_steps": 3962, "loss": 0.3735, "lr": 3.6792355315937947e-07, "epoch": 6.6171529619805485, "percentage": 94.52, "elapsed_time": "8:43:06", "remaining_time": "0:30:18"} +{"current_steps": 3750, "total_steps": 3962, "loss": 0.3885, "lr": 3.5128888860468836e-07, "epoch": 6.625994694960212, "percentage": 94.65, "elapsed_time": "8:43:48", "remaining_time": "0:29:36"} +{"current_steps": 3755, "total_steps": 3962, "loss": 0.4011, "lr": 3.350356884821748e-07, "epoch": 6.634836427939876, "percentage": 94.78, "elapsed_time": "8:44:18", "remaining_time": "0:28:54"} +{"current_steps": 3760, "total_steps": 3962, "loss": 0.3918, "lr": 3.191642683350571e-07, "epoch": 6.64367816091954, "percentage": 94.9, "elapsed_time": "8:45:00", "remaining_time": "0:28:12"} +{"current_steps": 3765, "total_steps": 3962, "loss": 0.388, "lr": 3.036749362946112e-07, "epoch": 6.652519893899204, "percentage": 95.03, "elapsed_time": "8:45:39", "remaining_time": "0:27:30"} +{"current_steps": 3770, "total_steps": 3962, "loss": 0.3903, "lr": 2.8856799307415807e-07, "epoch": 6.661361626878868, "percentage": 95.15, "elapsed_time": "8:46:23", "remaining_time": "0:26:48"} +{"current_steps": 3775, "total_steps": 3962, "loss": 0.3681, "lr": 2.7384373196324365e-07, "epoch": 6.670203359858532, "percentage": 95.28, "elapsed_time": "8:47:03", "remaining_time": "0:26:06"} +{"current_steps": 3780, "total_steps": 3962, "loss": 0.3841, "lr": 2.595024388219347e-07, "epoch": 6.679045092838196, "percentage": 95.41, "elapsed_time": "8:47:39", "remaining_time": "0:25:24"} +{"current_steps": 3785, "total_steps": 3962, "loss": 0.3825, "lr": 2.4554439207527424e-07, "epoch": 6.68788682581786, "percentage": 95.53, "elapsed_time": "8:48:28", "remaining_time": "0:24:42"} +{"current_steps": 3790, "total_steps": 3962, "loss": 0.4226, "lr": 2.3196986270787704e-07, "epoch": 6.696728558797524, "percentage": 95.66, "elapsed_time": "8:49:12", "remaining_time": "0:24:00"} +{"current_steps": 3795, "total_steps": 3962, "loss": 0.3864, "lr": 2.1877911425866705e-07, "epoch": 6.705570291777188, "percentage": 95.78, "elapsed_time": "8:49:52", "remaining_time": "0:23:19"} +{"current_steps": 3800, "total_steps": 3962, "loss": 0.3834, "lr": 2.059724028157506e-07, "epoch": 6.714412024756852, "percentage": 95.91, "elapsed_time": "8:50:29", "remaining_time": "0:22:36"} +{"current_steps": 3805, "total_steps": 3962, "loss": 0.3951, "lr": 1.9354997701146904e-07, "epoch": 6.723253757736517, "percentage": 96.04, "elapsed_time": "8:51:11", "remaining_time": "0:21:55"} +{"current_steps": 3810, "total_steps": 3962, "loss": 0.4429, "lr": 1.8151207801754722e-07, "epoch": 6.732095490716181, "percentage": 96.16, "elapsed_time": "8:51:48", "remaining_time": "0:21:12"} +{"current_steps": 3815, "total_steps": 3962, "loss": 0.4009, "lr": 1.6985893954042598e-07, "epoch": 6.740937223695845, "percentage": 96.29, "elapsed_time": "8:52:28", "remaining_time": "0:20:31"} +{"current_steps": 3820, "total_steps": 3962, "loss": 0.3758, "lr": 1.5859078781671477e-07, "epoch": 6.749778956675509, "percentage": 96.42, "elapsed_time": "8:53:06", "remaining_time": "0:19:49"} +{"current_steps": 3825, "total_steps": 3962, "loss": 0.383, "lr": 1.477078416088107e-07, "epoch": 6.758620689655173, "percentage": 96.54, "elapsed_time": "8:53:47", "remaining_time": "0:19:07"} +{"current_steps": 3830, "total_steps": 3962, "loss": 0.3985, "lr": 1.3721031220064185e-07, "epoch": 6.7674624226348365, "percentage": 96.67, "elapsed_time": "8:54:22", "remaining_time": "0:18:25"} +{"current_steps": 3835, "total_steps": 3962, "loss": 0.3803, "lr": 1.2709840339357515e-07, "epoch": 6.7763041556145005, "percentage": 96.79, "elapsed_time": "8:55:06", "remaining_time": "0:17:43"} +{"current_steps": 3840, "total_steps": 3962, "loss": 0.383, "lr": 1.1737231150244388e-07, "epoch": 6.7851458885941645, "percentage": 96.92, "elapsed_time": "8:55:50", "remaining_time": "0:17:01"} +{"current_steps": 3845, "total_steps": 3962, "loss": 0.3603, "lr": 1.0803222535175295e-07, "epoch": 6.793987621573828, "percentage": 97.05, "elapsed_time": "8:56:36", "remaining_time": "0:16:19"} +{"current_steps": 3850, "total_steps": 3962, "loss": 0.3988, "lr": 9.907832627200631e-08, "epoch": 6.802829354553492, "percentage": 97.17, "elapsed_time": "8:57:11", "remaining_time": "0:15:37"} +{"current_steps": 3855, "total_steps": 3962, "loss": 0.3876, "lr": 9.051078809618752e-08, "epoch": 6.811671087533156, "percentage": 97.3, "elapsed_time": "8:57:51", "remaining_time": "0:14:55"} +{"current_steps": 3860, "total_steps": 3962, "loss": 0.3803, "lr": 8.232977715637358e-08, "epoch": 6.82051282051282, "percentage": 97.43, "elapsed_time": "8:58:32", "remaining_time": "0:14:13"} +{"current_steps": 3865, "total_steps": 3962, "loss": 0.389, "lr": 7.453545228053305e-08, "epoch": 6.829354553492484, "percentage": 97.55, "elapsed_time": "8:59:11", "remaining_time": "0:13:31"} +{"current_steps": 3870, "total_steps": 3962, "loss": 0.4068, "lr": 6.712796478940853e-08, "epoch": 6.838196286472148, "percentage": 97.68, "elapsed_time": "8:59:56", "remaining_time": "0:12:50"} +{"current_steps": 3875, "total_steps": 3962, "loss": 0.3891, "lr": 6.010745849361011e-08, "epoch": 6.847038019451812, "percentage": 97.8, "elapsed_time": "9:00:50", "remaining_time": "0:12:08"} +{"current_steps": 3880, "total_steps": 3962, "loss": 0.417, "lr": 5.347406969079982e-08, "epoch": 6.855879752431477, "percentage": 97.93, "elapsed_time": "9:01:22", "remaining_time": "0:11:26"} +{"current_steps": 3885, "total_steps": 3962, "loss": 0.3896, "lr": 4.722792716306046e-08, "epoch": 6.864721485411141, "percentage": 98.06, "elapsed_time": "9:01:55", "remaining_time": "0:10:44"} +{"current_steps": 3890, "total_steps": 3962, "loss": 0.372, "lr": 4.1369152174381975e-08, "epoch": 6.873563218390805, "percentage": 98.18, "elapsed_time": "9:02:36", "remaining_time": "0:10:02"} +{"current_steps": 3895, "total_steps": 3962, "loss": 0.3872, "lr": 3.589785846832783e-08, "epoch": 6.882404951370469, "percentage": 98.31, "elapsed_time": "9:03:16", "remaining_time": "0:09:20"} +{"current_steps": 3900, "total_steps": 3962, "loss": 0.3451, "lr": 3.081415226579898e-08, "epoch": 6.891246684350133, "percentage": 98.44, "elapsed_time": "9:03:57", "remaining_time": "0:08:38"} +{"current_steps": 3905, "total_steps": 3962, "loss": 0.3851, "lr": 2.6118132263002193e-08, "epoch": 6.900088417329797, "percentage": 98.56, "elapsed_time": "9:04:46", "remaining_time": "0:07:57"} +{"current_steps": 3910, "total_steps": 3962, "loss": 0.3911, "lr": 2.18098896295027e-08, "epoch": 6.908930150309461, "percentage": 98.69, "elapsed_time": "9:05:24", "remaining_time": "0:07:15"} +{"current_steps": 3915, "total_steps": 3962, "loss": 0.3883, "lr": 1.788950800648337e-08, "epoch": 6.917771883289125, "percentage": 98.81, "elapsed_time": "9:06:13", "remaining_time": "0:06:33"} +{"current_steps": 3920, "total_steps": 3962, "loss": 0.4133, "lr": 1.4357063505101576e-08, "epoch": 6.926613616268789, "percentage": 98.94, "elapsed_time": "9:06:49", "remaining_time": "0:05:51"} +{"current_steps": 3925, "total_steps": 3962, "loss": 0.4242, "lr": 1.1212624705014829e-08, "epoch": 6.9354553492484525, "percentage": 99.07, "elapsed_time": "9:07:24", "remaining_time": "0:05:09"} +{"current_steps": 3930, "total_steps": 3962, "loss": 0.4284, "lr": 8.456252653055164e-09, "epoch": 6.9442970822281165, "percentage": 99.19, "elapsed_time": "9:08:11", "remaining_time": "0:04:27"} +{"current_steps": 3935, "total_steps": 3962, "loss": 0.3761, "lr": 6.08800086204342e-09, "epoch": 6.95313881520778, "percentage": 99.32, "elapsed_time": "9:08:51", "remaining_time": "0:03:45"} +{"current_steps": 3940, "total_steps": 3962, "loss": 0.4059, "lr": 4.107915309743416e-09, "epoch": 6.961980548187444, "percentage": 99.44, "elapsed_time": "9:09:29", "remaining_time": "0:03:04"} +{"current_steps": 3945, "total_steps": 3962, "loss": 0.4263, "lr": 2.516034437973769e-09, "epoch": 6.970822281167109, "percentage": 99.57, "elapsed_time": "9:10:04", "remaining_time": "0:02:22"} +{"current_steps": 3950, "total_steps": 3962, "loss": 0.4027, "lr": 1.312389151861826e-09, "epoch": 6.979664014146772, "percentage": 99.7, "elapsed_time": "9:10:38", "remaining_time": "0:01:40"} +{"current_steps": 3955, "total_steps": 3962, "loss": 0.4011, "lr": 4.970028192485821e-10, "epoch": 6.988505747126437, "percentage": 99.82, "elapsed_time": "9:11:11", "remaining_time": "0:00:58"} +{"current_steps": 3960, "total_steps": 3962, "loss": 0.392, "lr": 6.989127021794773e-11, "epoch": 6.997347480106101, "percentage": 99.95, "elapsed_time": "9:11:39", "remaining_time": "0:00:16"} +{"current_steps": 3962, "total_steps": 3962, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "9:12:30", "remaining_time": "0:00:00"} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..c4ad50e --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,8759 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 7.0, + "eval_steps": 500, + "global_step": 3962, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.008841732979664015, + "grad_norm": 16.43759145601646, + "learning_rate": 4.030226700251889e-07, + "loss": 0.9913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4914407730102539, + "step": 5, + "valid_targets_mean": 3975.9, + "valid_targets_min": 247 + }, + { + "epoch": 0.01768346595932803, + "grad_norm": 17.984303937601393, + "learning_rate": 9.068010075566751e-07, + "loss": 1.09, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5117278099060059, + "step": 10, + "valid_targets_mean": 2293.8, + "valid_targets_min": 269 + }, + { + "epoch": 0.026525198938992044, + "grad_norm": 17.430054844624365, + "learning_rate": 1.4105793450881613e-06, + "loss": 1.0664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.48715919256210327, + "step": 15, + "valid_targets_mean": 3742.1, + "valid_targets_min": 610 + }, + { + "epoch": 0.03536693191865606, + "grad_norm": 13.157985816910156, + "learning_rate": 1.9143576826196476e-06, + "loss": 1.0244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.48635387420654297, + "step": 20, + "valid_targets_mean": 3909.9, + "valid_targets_min": 431 + }, + { + "epoch": 0.04420866489832007, + "grad_norm": 7.039459793103061, + "learning_rate": 2.4181360201511335e-06, + "loss": 0.9523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5950973629951477, + "step": 25, + "valid_targets_mean": 4854.0, + "valid_targets_min": 1882 + }, + { + "epoch": 0.05305039787798409, + "grad_norm": 4.37502689672069, + "learning_rate": 2.92191435768262e-06, + "loss": 0.8882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4377889037132263, + "step": 30, + "valid_targets_mean": 3904.2, + "valid_targets_min": 558 + }, + { + "epoch": 0.0618921308576481, + "grad_norm": 2.2984916066569143, + "learning_rate": 3.425692695214106e-06, + "loss": 0.8596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3730544149875641, + "step": 35, + "valid_targets_mean": 4253.4, + "valid_targets_min": 403 + }, + { + "epoch": 0.07073386383731212, + "grad_norm": 1.749502864868188, + "learning_rate": 3.9294710327455925e-06, + "loss": 0.8071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37501755356788635, + "step": 40, + "valid_targets_mean": 3304.0, + "valid_targets_min": 463 + }, + { + "epoch": 0.07957559681697612, + "grad_norm": 1.4297619383408833, + "learning_rate": 4.433249370277078e-06, + "loss": 0.7654, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2531526982784271, + "step": 45, + "valid_targets_mean": 2443.0, + "valid_targets_min": 536 + }, + { + "epoch": 0.08841732979664015, + "grad_norm": 1.2107916623135075, + "learning_rate": 4.937027707808565e-06, + "loss": 0.7661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26174238324165344, + "step": 50, + "valid_targets_mean": 1962.4, + "valid_targets_min": 419 + }, + { + "epoch": 0.09725906277630415, + "grad_norm": 1.1177863382586022, + "learning_rate": 5.440806045340051e-06, + "loss": 0.7088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2441769391298294, + "step": 55, + "valid_targets_mean": 1324.0, + "valid_targets_min": 387 + }, + { + "epoch": 0.10610079575596817, + "grad_norm": 1.3240485836200855, + "learning_rate": 5.944584382871537e-06, + "loss": 0.7418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.45804762840270996, + "step": 60, + "valid_targets_mean": 2281.6, + "valid_targets_min": 299 + }, + { + "epoch": 0.11494252873563218, + "grad_norm": 0.9887476322800939, + "learning_rate": 6.448362720403023e-06, + "loss": 0.7786, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3559702932834625, + "step": 65, + "valid_targets_mean": 2576.8, + "valid_targets_min": 979 + }, + { + "epoch": 0.1237842617152962, + "grad_norm": 0.8313614619463878, + "learning_rate": 6.9521410579345095e-06, + "loss": 0.7667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32869428396224976, + "step": 70, + "valid_targets_mean": 2681.1, + "valid_targets_min": 559 + }, + { + "epoch": 0.13262599469496023, + "grad_norm": 1.2928448614693209, + "learning_rate": 7.455919395465996e-06, + "loss": 0.7316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4524758458137512, + "step": 75, + "valid_targets_mean": 2086.6, + "valid_targets_min": 305 + }, + { + "epoch": 0.14146772767462423, + "grad_norm": 0.9039110142607959, + "learning_rate": 7.959697732997482e-06, + "loss": 0.7216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.41223078966140747, + "step": 80, + "valid_targets_mean": 2522.0, + "valid_targets_min": 418 + }, + { + "epoch": 0.15030946065428824, + "grad_norm": 1.1531713116573887, + "learning_rate": 8.463476070528968e-06, + "loss": 0.6962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31595444679260254, + "step": 85, + "valid_targets_mean": 2714.1, + "valid_targets_min": 435 + }, + { + "epoch": 0.15915119363395225, + "grad_norm": 0.7279561415401078, + "learning_rate": 8.967254408060454e-06, + "loss": 0.7161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.45249640941619873, + "step": 90, + "valid_targets_mean": 4901.6, + "valid_targets_min": 628 + }, + { + "epoch": 0.16799292661361626, + "grad_norm": 0.7881029215112537, + "learning_rate": 9.47103274559194e-06, + "loss": 0.706, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31990885734558105, + "step": 95, + "valid_targets_mean": 2807.6, + "valid_targets_min": 268 + }, + { + "epoch": 0.1768346595932803, + "grad_norm": 0.7086656082236659, + "learning_rate": 9.974811083123427e-06, + "loss": 0.6583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.270596981048584, + "step": 100, + "valid_targets_mean": 2979.0, + "valid_targets_min": 722 + }, + { + "epoch": 0.1856763925729443, + "grad_norm": 0.8874052957709296, + "learning_rate": 1.0478589420654912e-05, + "loss": 0.6697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24225851893424988, + "step": 105, + "valid_targets_mean": 1624.0, + "valid_targets_min": 356 + }, + { + "epoch": 0.1945181255526083, + "grad_norm": 0.8682741626307907, + "learning_rate": 1.0982367758186399e-05, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38384777307510376, + "step": 110, + "valid_targets_mean": 2603.8, + "valid_targets_min": 504 + }, + { + "epoch": 0.20335985853227231, + "grad_norm": 0.7893830841438993, + "learning_rate": 1.1486146095717885e-05, + "loss": 0.6651, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3616026043891907, + "step": 115, + "valid_targets_mean": 5229.1, + "valid_targets_min": 648 + }, + { + "epoch": 0.21220159151193635, + "grad_norm": 0.8435136463460109, + "learning_rate": 1.1989924433249371e-05, + "loss": 0.7056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35327407717704773, + "step": 120, + "valid_targets_mean": 3276.9, + "valid_targets_min": 557 + }, + { + "epoch": 0.22104332449160036, + "grad_norm": 0.8326030890475514, + "learning_rate": 1.2493702770780859e-05, + "loss": 0.6327, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29393622279167175, + "step": 125, + "valid_targets_mean": 3015.4, + "valid_targets_min": 1786 + }, + { + "epoch": 0.22988505747126436, + "grad_norm": 0.5791447791458552, + "learning_rate": 1.2997481108312344e-05, + "loss": 0.6477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31838011741638184, + "step": 130, + "valid_targets_mean": 4220.1, + "valid_targets_min": 704 + }, + { + "epoch": 0.23872679045092837, + "grad_norm": 0.7833412749104234, + "learning_rate": 1.350125944584383e-05, + "loss": 0.6188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3599586486816406, + "step": 135, + "valid_targets_mean": 3493.0, + "valid_targets_min": 562 + }, + { + "epoch": 0.2475685234305924, + "grad_norm": 0.6930132817315054, + "learning_rate": 1.4005037783375318e-05, + "loss": 0.6729, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3735961318016052, + "step": 140, + "valid_targets_mean": 3788.9, + "valid_targets_min": 1905 + }, + { + "epoch": 0.2564102564102564, + "grad_norm": 0.6900812305728492, + "learning_rate": 1.4508816120906802e-05, + "loss": 0.5868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2900860905647278, + "step": 145, + "valid_targets_mean": 3795.8, + "valid_targets_min": 881 + }, + { + "epoch": 0.26525198938992045, + "grad_norm": 0.668587653722343, + "learning_rate": 1.5012594458438288e-05, + "loss": 0.6371, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23740538954734802, + "step": 150, + "valid_targets_mean": 3166.9, + "valid_targets_min": 1434 + }, + { + "epoch": 0.27409372236958446, + "grad_norm": 0.6857654288467885, + "learning_rate": 1.5516372795969776e-05, + "loss": 0.6119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.49299874901771545, + "step": 155, + "valid_targets_mean": 5421.9, + "valid_targets_min": 2002 + }, + { + "epoch": 0.28293545534924847, + "grad_norm": 0.7011124721817551, + "learning_rate": 1.602015113350126e-05, + "loss": 0.6135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2792966365814209, + "step": 160, + "valid_targets_mean": 3557.1, + "valid_targets_min": 307 + }, + { + "epoch": 0.2917771883289125, + "grad_norm": 0.7181568311757064, + "learning_rate": 1.6523929471032747e-05, + "loss": 0.6163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3261794447898865, + "step": 165, + "valid_targets_mean": 3577.6, + "valid_targets_min": 1825 + }, + { + "epoch": 0.3006189213085765, + "grad_norm": 0.6383260621735827, + "learning_rate": 1.7027707808564233e-05, + "loss": 0.6208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2658522427082062, + "step": 170, + "valid_targets_mean": 4118.4, + "valid_targets_min": 554 + }, + { + "epoch": 0.3094606542882405, + "grad_norm": 0.873748558543848, + "learning_rate": 1.753148614609572e-05, + "loss": 0.6582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27786922454833984, + "step": 175, + "valid_targets_mean": 2538.9, + "valid_targets_min": 411 + }, + { + "epoch": 0.3183023872679045, + "grad_norm": 0.7741218070486372, + "learning_rate": 1.8035264483627205e-05, + "loss": 0.661, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3300468325614929, + "step": 180, + "valid_targets_mean": 3783.0, + "valid_targets_min": 716 + }, + { + "epoch": 0.3271441202475685, + "grad_norm": 0.7153501560841902, + "learning_rate": 1.8539042821158694e-05, + "loss": 0.613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30669140815734863, + "step": 185, + "valid_targets_mean": 2831.9, + "valid_targets_min": 663 + }, + { + "epoch": 0.3359858532272325, + "grad_norm": 0.8733028655615769, + "learning_rate": 1.9042821158690177e-05, + "loss": 0.6091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4316086769104004, + "step": 190, + "valid_targets_mean": 3605.1, + "valid_targets_min": 411 + }, + { + "epoch": 0.3448275862068966, + "grad_norm": 0.8909617924940159, + "learning_rate": 1.9546599496221663e-05, + "loss": 0.7227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29832324385643005, + "step": 195, + "valid_targets_mean": 2360.1, + "valid_targets_min": 1393 + }, + { + "epoch": 0.3536693191865606, + "grad_norm": 0.7676692325940812, + "learning_rate": 2.0050377833753152e-05, + "loss": 0.6012, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.349293053150177, + "step": 200, + "valid_targets_mean": 3419.4, + "valid_targets_min": 532 + }, + { + "epoch": 0.3625110521662246, + "grad_norm": 0.6966533272502462, + "learning_rate": 2.0554156171284634e-05, + "loss": 0.597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34834665060043335, + "step": 205, + "valid_targets_mean": 4089.6, + "valid_targets_min": 2040 + }, + { + "epoch": 0.3713527851458886, + "grad_norm": 0.9033467905392003, + "learning_rate": 2.1057934508816124e-05, + "loss": 0.6181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3413087725639343, + "step": 210, + "valid_targets_mean": 2691.6, + "valid_targets_min": 1037 + }, + { + "epoch": 0.3801945181255526, + "grad_norm": 1.709473285401154, + "learning_rate": 2.156171284634761e-05, + "loss": 0.6068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2899201512336731, + "step": 215, + "valid_targets_mean": 3180.1, + "valid_targets_min": 317 + }, + { + "epoch": 0.3890362511052166, + "grad_norm": 0.7521210734695193, + "learning_rate": 2.2065491183879092e-05, + "loss": 0.5964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3372876048088074, + "step": 220, + "valid_targets_mean": 3230.0, + "valid_targets_min": 383 + }, + { + "epoch": 0.3978779840848806, + "grad_norm": 0.8333691908125227, + "learning_rate": 2.256926952141058e-05, + "loss": 0.6837, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3745100498199463, + "step": 225, + "valid_targets_mean": 2964.1, + "valid_targets_min": 761 + }, + { + "epoch": 0.40671971706454463, + "grad_norm": 0.6656840184265772, + "learning_rate": 2.3073047858942067e-05, + "loss": 0.603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19232776761054993, + "step": 230, + "valid_targets_mean": 2728.2, + "valid_targets_min": 321 + }, + { + "epoch": 0.4155614500442087, + "grad_norm": 0.7255450538392068, + "learning_rate": 2.3576826196473553e-05, + "loss": 0.597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33167585730552673, + "step": 235, + "valid_targets_mean": 3975.6, + "valid_targets_min": 1787 + }, + { + "epoch": 0.4244031830238727, + "grad_norm": 0.7811965432597004, + "learning_rate": 2.408060453400504e-05, + "loss": 0.6116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3258014917373657, + "step": 240, + "valid_targets_mean": 4064.9, + "valid_targets_min": 1431 + }, + { + "epoch": 0.4332449160035367, + "grad_norm": 0.7283721698739326, + "learning_rate": 2.4584382871536528e-05, + "loss": 0.6241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2866038680076599, + "step": 245, + "valid_targets_mean": 2983.4, + "valid_targets_min": 1332 + }, + { + "epoch": 0.4420866489832007, + "grad_norm": 0.8218129094311453, + "learning_rate": 2.508816120906801e-05, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33566445112228394, + "step": 250, + "valid_targets_mean": 3558.0, + "valid_targets_min": 493 + }, + { + "epoch": 0.4509283819628647, + "grad_norm": 0.7072939560249456, + "learning_rate": 2.55919395465995e-05, + "loss": 0.5453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31181544065475464, + "step": 255, + "valid_targets_mean": 3208.2, + "valid_targets_min": 460 + }, + { + "epoch": 0.45977011494252873, + "grad_norm": 1.0523349102236121, + "learning_rate": 2.6095717884130986e-05, + "loss": 0.6377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4069092869758606, + "step": 260, + "valid_targets_mean": 3098.2, + "valid_targets_min": 411 + }, + { + "epoch": 0.46861184792219274, + "grad_norm": 0.6450257152535478, + "learning_rate": 2.659949622166247e-05, + "loss": 0.623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27830231189727783, + "step": 265, + "valid_targets_mean": 4357.8, + "valid_targets_min": 425 + }, + { + "epoch": 0.47745358090185674, + "grad_norm": 0.7522066599890925, + "learning_rate": 2.7103274559193958e-05, + "loss": 0.5872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18803122639656067, + "step": 270, + "valid_targets_mean": 2124.2, + "valid_targets_min": 409 + }, + { + "epoch": 0.48629531388152075, + "grad_norm": 0.884412534841973, + "learning_rate": 2.760705289672544e-05, + "loss": 0.616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3839704692363739, + "step": 275, + "valid_targets_mean": 2501.4, + "valid_targets_min": 368 + }, + { + "epoch": 0.4951370468611848, + "grad_norm": 0.8891118328744042, + "learning_rate": 2.811083123425693e-05, + "loss": 0.6361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3874850273132324, + "step": 280, + "valid_targets_mean": 2678.1, + "valid_targets_min": 1297 + }, + { + "epoch": 0.5039787798408488, + "grad_norm": 0.8262092882520712, + "learning_rate": 2.8614609571788415e-05, + "loss": 0.605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38311082124710083, + "step": 285, + "valid_targets_mean": 3422.0, + "valid_targets_min": 870 + }, + { + "epoch": 0.5128205128205128, + "grad_norm": 0.709275574520186, + "learning_rate": 2.91183879093199e-05, + "loss": 0.6046, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18932947516441345, + "step": 290, + "valid_targets_mean": 2332.1, + "valid_targets_min": 718 + }, + { + "epoch": 0.5216622458001768, + "grad_norm": 0.7786332977338201, + "learning_rate": 2.9622166246851387e-05, + "loss": 0.6052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35691413283348083, + "step": 295, + "valid_targets_mean": 3540.5, + "valid_targets_min": 1245 + }, + { + "epoch": 0.5305039787798409, + "grad_norm": 0.7101179367848214, + "learning_rate": 3.0125944584382876e-05, + "loss": 0.6084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17877447605133057, + "step": 300, + "valid_targets_mean": 2138.0, + "valid_targets_min": 296 + }, + { + "epoch": 0.5393457117595049, + "grad_norm": 0.7234460485976838, + "learning_rate": 3.062972292191436e-05, + "loss": 0.5926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23484167456626892, + "step": 305, + "valid_targets_mean": 2718.2, + "valid_targets_min": 1374 + }, + { + "epoch": 0.5481874447391689, + "grad_norm": 0.8316290022850806, + "learning_rate": 3.113350125944585e-05, + "loss": 0.5576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2605739235877991, + "step": 310, + "valid_targets_mean": 2342.1, + "valid_targets_min": 390 + }, + { + "epoch": 0.5570291777188329, + "grad_norm": 0.7443583580419373, + "learning_rate": 3.1637279596977334e-05, + "loss": 0.5824, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3526822626590729, + "step": 315, + "valid_targets_mean": 2949.9, + "valid_targets_min": 378 + }, + { + "epoch": 0.5658709106984969, + "grad_norm": 0.9191837030143825, + "learning_rate": 3.214105793450882e-05, + "loss": 0.5984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35114723443984985, + "step": 320, + "valid_targets_mean": 2730.0, + "valid_targets_min": 479 + }, + { + "epoch": 0.5747126436781609, + "grad_norm": 0.7133394084017918, + "learning_rate": 3.2644836272040306e-05, + "loss": 0.5448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3304479122161865, + "step": 325, + "valid_targets_mean": 4008.5, + "valid_targets_min": 687 + }, + { + "epoch": 0.583554376657825, + "grad_norm": 0.7542186085539615, + "learning_rate": 3.314861460957179e-05, + "loss": 0.5912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35879507660865784, + "step": 330, + "valid_targets_mean": 3446.0, + "valid_targets_min": 1762 + }, + { + "epoch": 0.5923961096374889, + "grad_norm": 0.8806283364510236, + "learning_rate": 3.365239294710328e-05, + "loss": 0.546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2994898855686188, + "step": 335, + "valid_targets_mean": 2490.4, + "valid_targets_min": 1455 + }, + { + "epoch": 0.601237842617153, + "grad_norm": 0.7925231456510854, + "learning_rate": 3.415617128463476e-05, + "loss": 0.5375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27049198746681213, + "step": 340, + "valid_targets_mean": 3216.2, + "valid_targets_min": 1140 + }, + { + "epoch": 0.610079575596817, + "grad_norm": 0.8151714993878474, + "learning_rate": 3.465994962216625e-05, + "loss": 0.5658, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3359305262565613, + "step": 345, + "valid_targets_mean": 2819.4, + "valid_targets_min": 420 + }, + { + "epoch": 0.618921308576481, + "grad_norm": 0.6987780960519617, + "learning_rate": 3.516372795969774e-05, + "loss": 0.5964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22273704409599304, + "step": 350, + "valid_targets_mean": 3495.1, + "valid_targets_min": 2035 + }, + { + "epoch": 0.627763041556145, + "grad_norm": 0.82782268216302, + "learning_rate": 3.566750629722922e-05, + "loss": 0.5694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.282134473323822, + "step": 355, + "valid_targets_mean": 2781.4, + "valid_targets_min": 836 + }, + { + "epoch": 0.636604774535809, + "grad_norm": 0.7171815954941675, + "learning_rate": 3.617128463476071e-05, + "loss": 0.542, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24987182021141052, + "step": 360, + "valid_targets_mean": 2726.6, + "valid_targets_min": 650 + }, + { + "epoch": 0.6454465075154731, + "grad_norm": 0.6554762528349989, + "learning_rate": 3.667506297229219e-05, + "loss": 0.5764, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21046540141105652, + "step": 365, + "valid_targets_mean": 2741.9, + "valid_targets_min": 647 + }, + { + "epoch": 0.654288240495137, + "grad_norm": 0.7169452163324568, + "learning_rate": 3.717884130982368e-05, + "loss": 0.5865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35952502489089966, + "step": 370, + "valid_targets_mean": 4276.4, + "valid_targets_min": 1909 + }, + { + "epoch": 0.6631299734748011, + "grad_norm": 0.7498682876453387, + "learning_rate": 3.7682619647355165e-05, + "loss": 0.6103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.398249089717865, + "step": 375, + "valid_targets_mean": 3914.2, + "valid_targets_min": 395 + }, + { + "epoch": 0.671971706454465, + "grad_norm": 0.7431702929941265, + "learning_rate": 3.8186397984886654e-05, + "loss": 0.5234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36680591106414795, + "step": 380, + "valid_targets_mean": 3600.5, + "valid_targets_min": 653 + }, + { + "epoch": 0.6808134394341291, + "grad_norm": 0.7032240193017438, + "learning_rate": 3.8690176322418137e-05, + "loss": 0.5644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25154560804367065, + "step": 385, + "valid_targets_mean": 3544.6, + "valid_targets_min": 514 + }, + { + "epoch": 0.6896551724137931, + "grad_norm": 0.7824728334071819, + "learning_rate": 3.9193954659949626e-05, + "loss": 0.587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2563400864601135, + "step": 390, + "valid_targets_mean": 2525.2, + "valid_targets_min": 417 + }, + { + "epoch": 0.6984969053934571, + "grad_norm": 0.5938754028594158, + "learning_rate": 3.969773299748111e-05, + "loss": 0.594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36213839054107666, + "step": 395, + "valid_targets_mean": 4965.6, + "valid_targets_min": 1573 + }, + { + "epoch": 0.7073386383731212, + "grad_norm": 0.8560713693271218, + "learning_rate": 3.999996893720319e-05, + "loss": 0.5368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28493037819862366, + "step": 400, + "valid_targets_mean": 2209.5, + "valid_targets_min": 482 + }, + { + "epoch": 0.7161803713527851, + "grad_norm": 0.6574999517551925, + "learning_rate": 3.999961948184714e-05, + "loss": 0.5683, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27876657247543335, + "step": 405, + "valid_targets_mean": 4695.0, + "valid_targets_min": 739 + }, + { + "epoch": 0.7250221043324492, + "grad_norm": 0.7910350694289134, + "learning_rate": 3.999888174944605e-05, + "loss": 0.543, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29521095752716064, + "step": 410, + "valid_targets_mean": 2854.2, + "valid_targets_min": 572 + }, + { + "epoch": 0.7338638373121131, + "grad_norm": 0.7327617592282828, + "learning_rate": 3.9997755754322415e-05, + "loss": 0.5316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23895704746246338, + "step": 415, + "valid_targets_mean": 3236.0, + "valid_targets_min": 1129 + }, + { + "epoch": 0.7427055702917772, + "grad_norm": 0.683762113730083, + "learning_rate": 3.9996241518336554e-05, + "loss": 0.5805, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2622902989387512, + "step": 420, + "valid_targets_mean": 3360.2, + "valid_targets_min": 778 + }, + { + "epoch": 0.7515473032714411, + "grad_norm": 0.6712193589006633, + "learning_rate": 3.999433907088618e-05, + "loss": 0.5688, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33563822507858276, + "step": 425, + "valid_targets_mean": 4434.6, + "valid_targets_min": 830 + }, + { + "epoch": 0.7603890362511052, + "grad_norm": 0.8978969987784136, + "learning_rate": 3.999204844890582e-05, + "loss": 0.5326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21699407696723938, + "step": 430, + "valid_targets_mean": 1812.0, + "valid_targets_min": 380 + }, + { + "epoch": 0.7692307692307693, + "grad_norm": 0.7936562082241674, + "learning_rate": 3.998936969686614e-05, + "loss": 0.565, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2873769700527191, + "step": 435, + "valid_targets_mean": 2613.8, + "valid_targets_min": 351 + }, + { + "epoch": 0.7780725022104332, + "grad_norm": 0.6494725254339784, + "learning_rate": 3.9986302866773e-05, + "loss": 0.561, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27636170387268066, + "step": 440, + "valid_targets_mean": 3525.8, + "valid_targets_min": 515 + }, + { + "epoch": 0.7869142351900973, + "grad_norm": 0.7239196043024896, + "learning_rate": 3.998284801816654e-05, + "loss": 0.5455, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27213937044143677, + "step": 445, + "valid_targets_mean": 2831.9, + "valid_targets_min": 445 + }, + { + "epoch": 0.7957559681697612, + "grad_norm": 0.6995801380039492, + "learning_rate": 3.997900521811995e-05, + "loss": 0.5635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28841322660446167, + "step": 450, + "valid_targets_mean": 2727.2, + "valid_targets_min": 663 + }, + { + "epoch": 0.8045977011494253, + "grad_norm": 0.7321413221468167, + "learning_rate": 3.997477454123818e-05, + "loss": 0.5781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2708323299884796, + "step": 455, + "valid_targets_mean": 3125.6, + "valid_targets_min": 1084 + }, + { + "epoch": 0.8134394341290893, + "grad_norm": 0.834232877873331, + "learning_rate": 3.997015606965656e-05, + "loss": 0.5392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3525821566581726, + "step": 460, + "valid_targets_mean": 2664.1, + "valid_targets_min": 1235 + }, + { + "epoch": 0.8222811671087533, + "grad_norm": 0.8321360896222851, + "learning_rate": 3.996514989303911e-05, + "loss": 0.6028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32734864950180054, + "step": 465, + "valid_targets_mean": 2494.2, + "valid_targets_min": 1261 + }, + { + "epoch": 0.8311229000884174, + "grad_norm": 0.6935337345612683, + "learning_rate": 3.9959756108576853e-05, + "loss": 0.5558, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24893325567245483, + "step": 470, + "valid_targets_mean": 2565.8, + "valid_targets_min": 1449 + }, + { + "epoch": 0.8399646330680813, + "grad_norm": 0.8571991620574829, + "learning_rate": 3.995397482098591e-05, + "loss": 0.5884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36881160736083984, + "step": 475, + "valid_targets_mean": 2929.9, + "valid_targets_min": 412 + }, + { + "epoch": 0.8488063660477454, + "grad_norm": 0.7459479118876244, + "learning_rate": 3.994780614250548e-05, + "loss": 0.5396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3047880232334137, + "step": 480, + "valid_targets_mean": 3779.6, + "valid_targets_min": 2634 + }, + { + "epoch": 0.8576480990274093, + "grad_norm": 0.7142768197579014, + "learning_rate": 3.994125019289566e-05, + "loss": 0.5359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2945425808429718, + "step": 485, + "valid_targets_mean": 3228.9, + "valid_targets_min": 708 + }, + { + "epoch": 0.8664898320070734, + "grad_norm": 0.6309840561705765, + "learning_rate": 3.99343070994351e-05, + "loss": 0.5466, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2996477782726288, + "step": 490, + "valid_targets_mean": 4352.0, + "valid_targets_min": 784 + }, + { + "epoch": 0.8753315649867374, + "grad_norm": 0.72422812308097, + "learning_rate": 3.992697699691857e-05, + "loss": 0.5754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3740094304084778, + "step": 495, + "valid_targets_mean": 3836.0, + "valid_targets_min": 1609 + }, + { + "epoch": 0.8841732979664014, + "grad_norm": 0.8938896424491545, + "learning_rate": 3.9919260027654304e-05, + "loss": 0.612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3498684763908386, + "step": 500, + "valid_targets_mean": 2197.9, + "valid_targets_min": 1020 + }, + { + "epoch": 0.8930150309460654, + "grad_norm": 0.6203004592548081, + "learning_rate": 3.991115634146123e-05, + "loss": 0.5209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26198410987854004, + "step": 505, + "valid_targets_mean": 3834.1, + "valid_targets_min": 1492 + }, + { + "epoch": 0.9018567639257294, + "grad_norm": 0.8296110311313931, + "learning_rate": 3.990266609566614e-05, + "loss": 0.5822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23738741874694824, + "step": 510, + "valid_targets_mean": 1985.0, + "valid_targets_min": 412 + }, + { + "epoch": 0.9106984969053935, + "grad_norm": 0.6830643774979811, + "learning_rate": 3.9893789455100514e-05, + "loss": 0.5182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2690092921257019, + "step": 515, + "valid_targets_mean": 3141.5, + "valid_targets_min": 1099 + }, + { + "epoch": 0.9195402298850575, + "grad_norm": 0.6736971639546346, + "learning_rate": 3.988452659209745e-05, + "loss": 0.5723, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22991755604743958, + "step": 520, + "valid_targets_mean": 2799.1, + "valid_targets_min": 829 + }, + { + "epoch": 0.9283819628647215, + "grad_norm": 0.7173030371663041, + "learning_rate": 3.9874877686488197e-05, + "loss": 0.5628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34016090631484985, + "step": 525, + "valid_targets_mean": 3242.2, + "valid_targets_min": 1744 + }, + { + "epoch": 0.9372236958443855, + "grad_norm": 0.7040214824132874, + "learning_rate": 3.986484292559877e-05, + "loss": 0.5405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2545274496078491, + "step": 530, + "valid_targets_mean": 3138.1, + "valid_targets_min": 1853 + }, + { + "epoch": 0.9460654288240495, + "grad_norm": 0.8218611125304961, + "learning_rate": 3.9854422504246224e-05, + "loss": 0.5626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32547083497047424, + "step": 535, + "valid_targets_mean": 2763.6, + "valid_targets_min": 501 + }, + { + "epoch": 0.9549071618037135, + "grad_norm": 0.6214205266111335, + "learning_rate": 3.984361662473494e-05, + "loss": 0.5616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16753855347633362, + "step": 540, + "valid_targets_mean": 2641.5, + "valid_targets_min": 1835 + }, + { + "epoch": 0.9637488947833776, + "grad_norm": 0.5778657679333664, + "learning_rate": 3.9832425496852644e-05, + "loss": 0.5737, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28100019693374634, + "step": 545, + "valid_targets_mean": 4093.9, + "valid_targets_min": 566 + }, + { + "epoch": 0.9725906277630415, + "grad_norm": 0.7198881631279556, + "learning_rate": 3.982084933786639e-05, + "loss": 0.5622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2683573067188263, + "step": 550, + "valid_targets_mean": 3153.2, + "valid_targets_min": 460 + }, + { + "epoch": 0.9814323607427056, + "grad_norm": 0.7294048125531857, + "learning_rate": 3.9808888372518285e-05, + "loss": 0.523, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22038066387176514, + "step": 555, + "valid_targets_mean": 2419.9, + "valid_targets_min": 281 + }, + { + "epoch": 0.9902740937223696, + "grad_norm": 0.7554402239187559, + "learning_rate": 3.979654283302115e-05, + "loss": 0.561, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33254435658454895, + "step": 560, + "valid_targets_mean": 3315.4, + "valid_targets_min": 1551 + }, + { + "epoch": 0.9991158267020336, + "grad_norm": 0.9531782119454033, + "learning_rate": 3.9783812959054054e-05, + "loss": 0.54, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2633528709411621, + "step": 565, + "valid_targets_mean": 2802.5, + "valid_targets_min": 1365 + }, + { + "epoch": 1.0070733863837311, + "grad_norm": 0.7219142907133131, + "learning_rate": 3.9770698997757564e-05, + "loss": 0.5341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.360717236995697, + "step": 570, + "valid_targets_mean": 3532.2, + "valid_targets_min": 1467 + }, + { + "epoch": 1.0159151193633953, + "grad_norm": 0.6832964222244942, + "learning_rate": 3.975720120372905e-05, + "loss": 0.5604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3534933924674988, + "step": 575, + "valid_targets_mean": 4285.2, + "valid_targets_min": 473 + }, + { + "epoch": 1.0247568523430592, + "grad_norm": 0.7104879022906077, + "learning_rate": 3.974331983901766e-05, + "loss": 0.5139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23602774739265442, + "step": 580, + "valid_targets_mean": 3051.0, + "valid_targets_min": 769 + }, + { + "epoch": 1.0335985853227232, + "grad_norm": 1.0289475556516747, + "learning_rate": 3.972905517311929e-05, + "loss": 0.5025, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2523854076862335, + "step": 585, + "valid_targets_mean": 4518.4, + "valid_targets_min": 1272 + }, + { + "epoch": 1.0424403183023874, + "grad_norm": 0.6070195547061199, + "learning_rate": 3.9714407482971335e-05, + "loss": 0.503, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1908818781375885, + "step": 590, + "valid_targets_mean": 3155.4, + "valid_targets_min": 1502 + }, + { + "epoch": 1.0512820512820513, + "grad_norm": 0.8043171275547331, + "learning_rate": 3.969937705294728e-05, + "loss": 0.5078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33768388628959656, + "step": 595, + "valid_targets_mean": 3010.2, + "valid_targets_min": 1505 + }, + { + "epoch": 1.0601237842617153, + "grad_norm": 0.7749567786956729, + "learning_rate": 3.968396417485125e-05, + "loss": 0.5508, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2937096357345581, + "step": 600, + "valid_targets_mean": 2740.4, + "valid_targets_min": 401 + }, + { + "epoch": 1.0689655172413792, + "grad_norm": 0.6956637921840406, + "learning_rate": 3.966816914791226e-05, + "loss": 0.5343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3460909426212311, + "step": 605, + "valid_targets_mean": 4797.0, + "valid_targets_min": 1353 + }, + { + "epoch": 1.0778072502210434, + "grad_norm": 0.8116625470978949, + "learning_rate": 3.965199227877846e-05, + "loss": 0.5254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32285335659980774, + "step": 610, + "valid_targets_mean": 2429.6, + "valid_targets_min": 438 + }, + { + "epoch": 1.0866489832007074, + "grad_norm": 0.7159169923970375, + "learning_rate": 3.963543388151117e-05, + "loss": 0.5176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2541963458061218, + "step": 615, + "valid_targets_mean": 4086.0, + "valid_targets_min": 702 + }, + { + "epoch": 1.0954907161803713, + "grad_norm": 0.851138769147014, + "learning_rate": 3.9618494277578806e-05, + "loss": 0.5254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1655346155166626, + "step": 620, + "valid_targets_mean": 1852.5, + "valid_targets_min": 330 + }, + { + "epoch": 1.1043324491600353, + "grad_norm": 0.7278081843736119, + "learning_rate": 3.960117379585057e-05, + "loss": 0.56, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3517983555793762, + "step": 625, + "valid_targets_mean": 4008.0, + "valid_targets_min": 1452 + }, + { + "epoch": 1.1131741821396994, + "grad_norm": 0.719616659459927, + "learning_rate": 3.958347277259015e-05, + "loss": 0.4971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31380581855773926, + "step": 630, + "valid_targets_mean": 3580.6, + "valid_targets_min": 309 + }, + { + "epoch": 1.1220159151193634, + "grad_norm": 0.63160465301193, + "learning_rate": 3.956539155144912e-05, + "loss": 0.5234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2329138219356537, + "step": 635, + "valid_targets_mean": 4057.8, + "valid_targets_min": 1396 + }, + { + "epoch": 1.1308576480990273, + "grad_norm": 0.6825427065012454, + "learning_rate": 3.9546930483460326e-05, + "loss": 0.516, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27975958585739136, + "step": 640, + "valid_targets_mean": 3343.4, + "valid_targets_min": 1645 + }, + { + "epoch": 1.1396993810786915, + "grad_norm": 0.699265105549181, + "learning_rate": 3.952808992703102e-05, + "loss": 0.5083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23706836998462677, + "step": 645, + "valid_targets_mean": 2710.6, + "valid_targets_min": 507 + }, + { + "epoch": 1.1485411140583555, + "grad_norm": 0.8045984010228572, + "learning_rate": 3.9508870247935964e-05, + "loss": 0.5351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1919955015182495, + "step": 650, + "valid_targets_mean": 1751.8, + "valid_targets_min": 284 + }, + { + "epoch": 1.1573828470380194, + "grad_norm": 0.6012250412087359, + "learning_rate": 3.948927181931024e-05, + "loss": 0.52, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.263777494430542, + "step": 655, + "valid_targets_mean": 4245.5, + "valid_targets_min": 854 + }, + { + "epoch": 1.1662245800176834, + "grad_norm": 0.5992821189180728, + "learning_rate": 3.94692950216421e-05, + "loss": 0.5235, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23570390045642853, + "step": 660, + "valid_targets_mean": 3959.2, + "valid_targets_min": 276 + }, + { + "epoch": 1.1750663129973475, + "grad_norm": 0.610845100602426, + "learning_rate": 3.944894024276552e-05, + "loss": 0.5026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1973716914653778, + "step": 665, + "valid_targets_mean": 3387.4, + "valid_targets_min": 675 + }, + { + "epoch": 1.1839080459770115, + "grad_norm": 0.7207065986679495, + "learning_rate": 3.9428207877852684e-05, + "loss": 0.5115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17878985404968262, + "step": 670, + "valid_targets_mean": 2142.6, + "valid_targets_min": 384 + }, + { + "epoch": 1.1927497789566754, + "grad_norm": 0.7934727448753174, + "learning_rate": 3.940709832940632e-05, + "loss": 0.5465, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2502514123916626, + "step": 675, + "valid_targets_mean": 2718.2, + "valid_targets_min": 1759 + }, + { + "epoch": 1.2015915119363396, + "grad_norm": 0.7998141403870273, + "learning_rate": 3.938561200725189e-05, + "loss": 0.513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2249201387166977, + "step": 680, + "valid_targets_mean": 2136.0, + "valid_targets_min": 315 + }, + { + "epoch": 1.2104332449160036, + "grad_norm": 0.6227661283561698, + "learning_rate": 3.9363749328529594e-05, + "loss": 0.5482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.259385883808136, + "step": 685, + "valid_targets_mean": 3826.6, + "valid_targets_min": 1730 + }, + { + "epoch": 1.2192749778956675, + "grad_norm": 0.6206992015741707, + "learning_rate": 3.934151071768634e-05, + "loss": 0.5537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2900537848472595, + "step": 690, + "valid_targets_mean": 4350.5, + "valid_targets_min": 595 + }, + { + "epoch": 1.2281167108753315, + "grad_norm": 0.5635939679566414, + "learning_rate": 3.931889660646744e-05, + "loss": 0.5482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2819467782974243, + "step": 695, + "valid_targets_mean": 4096.9, + "valid_targets_min": 1070 + }, + { + "epoch": 1.2369584438549956, + "grad_norm": 0.6692534359398423, + "learning_rate": 3.9295907433908264e-05, + "loss": 0.5415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2925758361816406, + "step": 700, + "valid_targets_mean": 4126.9, + "valid_targets_min": 1240 + }, + { + "epoch": 1.2458001768346596, + "grad_norm": 0.7190209534372782, + "learning_rate": 3.9272543646325703e-05, + "loss": 0.5317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19594435393810272, + "step": 705, + "valid_targets_mean": 2114.2, + "valid_targets_min": 1022 + }, + { + "epoch": 1.2546419098143236, + "grad_norm": 0.7405430028094008, + "learning_rate": 3.924880569730951e-05, + "loss": 0.5281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31587642431259155, + "step": 710, + "valid_targets_mean": 3316.2, + "valid_targets_min": 1055 + }, + { + "epoch": 1.2634836427939877, + "grad_norm": 0.7318705208252564, + "learning_rate": 3.9224694047713475e-05, + "loss": 0.51, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1906820833683014, + "step": 715, + "valid_targets_mean": 2082.6, + "valid_targets_min": 350 + }, + { + "epoch": 1.2723253757736517, + "grad_norm": 0.6136614929326403, + "learning_rate": 3.920020916564652e-05, + "loss": 0.504, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2813029885292053, + "step": 720, + "valid_targets_mean": 3609.0, + "valid_targets_min": 1686 + }, + { + "epoch": 1.2811671087533156, + "grad_norm": 0.7619702273083326, + "learning_rate": 3.917535152646356e-05, + "loss": 0.57, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29840072989463806, + "step": 725, + "valid_targets_mean": 3075.8, + "valid_targets_min": 350 + }, + { + "epoch": 1.2900088417329796, + "grad_norm": 0.6340553976724329, + "learning_rate": 3.915012161275633e-05, + "loss": 0.5579, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35292381048202515, + "step": 730, + "valid_targets_mean": 4762.0, + "valid_targets_min": 576 + }, + { + "epoch": 1.2988505747126438, + "grad_norm": 0.6314054240931711, + "learning_rate": 3.912451991434395e-05, + "loss": 0.5253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2579632103443146, + "step": 735, + "valid_targets_mean": 3673.4, + "valid_targets_min": 591 + }, + { + "epoch": 1.3076923076923077, + "grad_norm": 0.5775959962805894, + "learning_rate": 3.909854692826348e-05, + "loss": 0.5043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20548564195632935, + "step": 740, + "valid_targets_mean": 3846.4, + "valid_targets_min": 1071 + }, + { + "epoch": 1.3165340406719717, + "grad_norm": 0.655758917865089, + "learning_rate": 3.9072203158760215e-05, + "loss": 0.5015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2677724361419678, + "step": 745, + "valid_targets_mean": 3850.2, + "valid_targets_min": 515 + }, + { + "epoch": 1.3253757736516358, + "grad_norm": 0.8148294806624113, + "learning_rate": 3.904548911727793e-05, + "loss": 0.5228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3152320384979248, + "step": 750, + "valid_targets_mean": 3107.8, + "valid_targets_min": 812 + }, + { + "epoch": 1.3342175066312998, + "grad_norm": 0.8146168712526004, + "learning_rate": 3.901840532244897e-05, + "loss": 0.4892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3347662687301636, + "step": 755, + "valid_targets_mean": 3066.6, + "valid_targets_min": 372 + }, + { + "epoch": 1.3430592396109637, + "grad_norm": 0.7139126711376225, + "learning_rate": 3.899095230008411e-05, + "loss": 0.4955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2709360718727112, + "step": 760, + "valid_targets_mean": 3221.8, + "valid_targets_min": 275 + }, + { + "epoch": 1.3519009725906277, + "grad_norm": 0.7341120923859575, + "learning_rate": 3.896313058316242e-05, + "loss": 0.5131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2554779648780823, + "step": 765, + "valid_targets_mean": 3690.6, + "valid_targets_min": 864 + }, + { + "epoch": 1.3607427055702916, + "grad_norm": 0.7351206776886251, + "learning_rate": 3.8934940711820876e-05, + "loss": 0.5282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2886347770690918, + "step": 770, + "valid_targets_mean": 3220.2, + "valid_targets_min": 1394 + }, + { + "epoch": 1.3695844385499558, + "grad_norm": 0.6815412632856188, + "learning_rate": 3.8906383233343886e-05, + "loss": 0.5301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2817658483982086, + "step": 775, + "valid_targets_mean": 3736.1, + "valid_targets_min": 1035 + }, + { + "epoch": 1.3784261715296198, + "grad_norm": 0.6083778824304598, + "learning_rate": 3.887745870215268e-05, + "loss": 0.5448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20323900878429413, + "step": 780, + "valid_targets_mean": 3170.0, + "valid_targets_min": 260 + }, + { + "epoch": 1.387267904509284, + "grad_norm": 0.701861952740278, + "learning_rate": 3.884816767979449e-05, + "loss": 0.5251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28836336731910706, + "step": 785, + "valid_targets_mean": 3401.8, + "valid_targets_min": 1408 + }, + { + "epoch": 1.396109637488948, + "grad_norm": 0.6895304322708055, + "learning_rate": 3.881851073493174e-05, + "loss": 0.5549, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2803962528705597, + "step": 790, + "valid_targets_mean": 3533.6, + "valid_targets_min": 518 + }, + { + "epoch": 1.4049513704686118, + "grad_norm": 0.8606543782305618, + "learning_rate": 3.878848844333091e-05, + "loss": 0.4985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2970787286758423, + "step": 795, + "valid_targets_mean": 3216.2, + "valid_targets_min": 1616 + }, + { + "epoch": 1.4137931034482758, + "grad_norm": 0.748948338513349, + "learning_rate": 3.875810138785144e-05, + "loss": 0.517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20471307635307312, + "step": 800, + "valid_targets_mean": 2873.0, + "valid_targets_min": 1791 + }, + { + "epoch": 1.4226348364279398, + "grad_norm": 0.6282655364858861, + "learning_rate": 3.872735015843435e-05, + "loss": 0.5369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2569165825843811, + "step": 805, + "valid_targets_mean": 4159.0, + "valid_targets_min": 2118 + }, + { + "epoch": 1.431476569407604, + "grad_norm": 0.6800159245193907, + "learning_rate": 3.8696235352090827e-05, + "loss": 0.4849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21237662434577942, + "step": 810, + "valid_targets_mean": 2913.5, + "valid_targets_min": 1511 + }, + { + "epoch": 1.4403183023872679, + "grad_norm": 0.7491849980098594, + "learning_rate": 3.8664757572890624e-05, + "loss": 0.5431, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31936168670654297, + "step": 815, + "valid_targets_mean": 3183.8, + "valid_targets_min": 443 + }, + { + "epoch": 1.449160035366932, + "grad_norm": 0.6726532976813931, + "learning_rate": 3.863291743195031e-05, + "loss": 0.5368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3247930407524109, + "step": 820, + "valid_targets_mean": 5290.1, + "valid_targets_min": 1596 + }, + { + "epoch": 1.458001768346596, + "grad_norm": 0.6414216904520894, + "learning_rate": 3.860071554742144e-05, + "loss": 0.5517, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23261283338069916, + "step": 825, + "valid_targets_mean": 2761.5, + "valid_targets_min": 544 + }, + { + "epoch": 1.46684350132626, + "grad_norm": 0.6133136558161559, + "learning_rate": 3.856815254447854e-05, + "loss": 0.538, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27468377351760864, + "step": 830, + "valid_targets_mean": 4492.1, + "valid_targets_min": 1240 + }, + { + "epoch": 1.475685234305924, + "grad_norm": 0.6535282175604957, + "learning_rate": 3.853522905530698e-05, + "loss": 0.4972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28734225034713745, + "step": 835, + "valid_targets_mean": 4208.9, + "valid_targets_min": 1370 + }, + { + "epoch": 1.4845269672855879, + "grad_norm": 0.7163769356371759, + "learning_rate": 3.850194571909065e-05, + "loss": 0.5515, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21620656549930573, + "step": 840, + "valid_targets_mean": 2672.6, + "valid_targets_min": 530 + }, + { + "epoch": 1.493368700265252, + "grad_norm": 0.6339266507899239, + "learning_rate": 3.8468303181999625e-05, + "loss": 0.5241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22579747438430786, + "step": 845, + "valid_targets_mean": 3050.4, + "valid_targets_min": 1845 + }, + { + "epoch": 1.502210433244916, + "grad_norm": 0.6670589515749927, + "learning_rate": 3.843430209717758e-05, + "loss": 0.501, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25417882204055786, + "step": 850, + "valid_targets_mean": 2978.0, + "valid_targets_min": 1018 + }, + { + "epoch": 1.5110521662245802, + "grad_norm": 0.6632769562515543, + "learning_rate": 3.839994312472911e-05, + "loss": 0.5055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.244868203997612, + "step": 855, + "valid_targets_mean": 3159.6, + "valid_targets_min": 395 + }, + { + "epoch": 1.5198938992042441, + "grad_norm": 0.7476673252142214, + "learning_rate": 3.836522693170692e-05, + "loss": 0.5333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.322563499212265, + "step": 860, + "valid_targets_mean": 3074.9, + "valid_targets_min": 1925 + }, + { + "epoch": 1.528735632183908, + "grad_norm": 1.182699133656073, + "learning_rate": 3.833015419209888e-05, + "loss": 0.5195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.233692467212677, + "step": 865, + "valid_targets_mean": 2652.8, + "valid_targets_min": 505 + }, + { + "epoch": 1.537577365163572, + "grad_norm": 0.5963050788873372, + "learning_rate": 3.8294725586814925e-05, + "loss": 0.5379, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31656789779663086, + "step": 870, + "valid_targets_mean": 4504.1, + "valid_targets_min": 279 + }, + { + "epoch": 1.546419098143236, + "grad_norm": 0.7076807714391373, + "learning_rate": 3.8258941803673845e-05, + "loss": 0.4895, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21023747324943542, + "step": 875, + "valid_targets_mean": 2384.8, + "valid_targets_min": 663 + }, + { + "epoch": 1.5552608311229, + "grad_norm": 0.7242194753984217, + "learning_rate": 3.822280353738995e-05, + "loss": 0.5278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15555477142333984, + "step": 880, + "valid_targets_mean": 1807.2, + "valid_targets_min": 367 + }, + { + "epoch": 1.564102564102564, + "grad_norm": 0.680725926895947, + "learning_rate": 3.818631148955954e-05, + "loss": 0.5183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23022373020648956, + "step": 885, + "valid_targets_mean": 3061.0, + "valid_targets_min": 472 + }, + { + "epoch": 1.5729442970822283, + "grad_norm": 0.6589551518144537, + "learning_rate": 3.814946636864732e-05, + "loss": 0.5016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3253025710582733, + "step": 890, + "valid_targets_mean": 4214.9, + "valid_targets_min": 464 + }, + { + "epoch": 1.5817860300618922, + "grad_norm": 0.695071470979805, + "learning_rate": 3.8112268889972635e-05, + "loss": 0.5002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27869266271591187, + "step": 895, + "valid_targets_mean": 3458.9, + "valid_targets_min": 541 + }, + { + "epoch": 1.5906277630415562, + "grad_norm": 0.6394253917274505, + "learning_rate": 3.807471977569558e-05, + "loss": 0.5247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28981101512908936, + "step": 900, + "valid_targets_mean": 3587.0, + "valid_targets_min": 714 + }, + { + "epoch": 1.5994694960212201, + "grad_norm": 0.6407279388785145, + "learning_rate": 3.803681975480298e-05, + "loss": 0.5339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30930954217910767, + "step": 905, + "valid_targets_mean": 4241.2, + "valid_targets_min": 1531 + }, + { + "epoch": 1.608311229000884, + "grad_norm": 0.6262370337590383, + "learning_rate": 3.799856956309424e-05, + "loss": 0.5043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15924446284770966, + "step": 910, + "valid_targets_mean": 2515.5, + "valid_targets_min": 251 + }, + { + "epoch": 1.617152961980548, + "grad_norm": 0.5799667981131503, + "learning_rate": 3.7959969943167064e-05, + "loss": 0.4945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2013358175754547, + "step": 915, + "valid_targets_mean": 3255.0, + "valid_targets_min": 888 + }, + { + "epoch": 1.6259946949602122, + "grad_norm": 0.7839747219704393, + "learning_rate": 3.7921021644403024e-05, + "loss": 0.513, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.39778536558151245, + "step": 920, + "valid_targets_mean": 3479.8, + "valid_targets_min": 1418 + }, + { + "epoch": 1.6348364279398764, + "grad_norm": 1.0927382964698964, + "learning_rate": 3.788172542295303e-05, + "loss": 0.4882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3143307566642761, + "step": 925, + "valid_targets_mean": 3410.4, + "valid_targets_min": 680 + }, + { + "epoch": 1.6436781609195403, + "grad_norm": 0.71590844445193, + "learning_rate": 3.784208204172262e-05, + "loss": 0.4901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3356863856315613, + "step": 930, + "valid_targets_mean": 3325.4, + "valid_targets_min": 1757 + }, + { + "epoch": 1.6525198938992043, + "grad_norm": 0.6973512644137526, + "learning_rate": 3.7802092270357196e-05, + "loss": 0.5329, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.272472620010376, + "step": 935, + "valid_targets_mean": 2601.2, + "valid_targets_min": 260 + }, + { + "epoch": 1.6613616268788682, + "grad_norm": 0.6008785059006879, + "learning_rate": 3.7761756885227046e-05, + "loss": 0.491, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2572758197784424, + "step": 940, + "valid_targets_mean": 4301.5, + "valid_targets_min": 2006 + }, + { + "epoch": 1.6702033598585322, + "grad_norm": 0.5744209498415186, + "learning_rate": 3.772107666941226e-05, + "loss": 0.5167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26439422369003296, + "step": 945, + "valid_targets_mean": 4495.4, + "valid_targets_min": 2496 + }, + { + "epoch": 1.6790450928381961, + "grad_norm": 0.6465740308526822, + "learning_rate": 3.768005241268757e-05, + "loss": 0.5639, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25202465057373047, + "step": 950, + "valid_targets_mean": 3123.2, + "valid_targets_min": 939 + }, + { + "epoch": 1.6878868258178603, + "grad_norm": 0.7051342522734189, + "learning_rate": 3.7638684911506993e-05, + "loss": 0.5478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1941746175289154, + "step": 955, + "valid_targets_mean": 2783.6, + "valid_targets_min": 466 + }, + { + "epoch": 1.6967285587975243, + "grad_norm": 0.6946362639039605, + "learning_rate": 3.7596974968988366e-05, + "loss": 0.4773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2674318552017212, + "step": 960, + "valid_targets_mean": 2750.2, + "valid_targets_min": 520 + }, + { + "epoch": 1.7055702917771884, + "grad_norm": 0.6323893584576677, + "learning_rate": 3.755492339489775e-05, + "loss": 0.5122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2906394600868225, + "step": 965, + "valid_targets_mean": 4283.9, + "valid_targets_min": 1633 + }, + { + "epoch": 1.7144120247568524, + "grad_norm": 0.7054390689371448, + "learning_rate": 3.751253100563373e-05, + "loss": 0.4883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21445819735527039, + "step": 970, + "valid_targets_mean": 2264.2, + "valid_targets_min": 451 + }, + { + "epoch": 1.7232537577365163, + "grad_norm": 0.7148446633987146, + "learning_rate": 3.746979862421154e-05, + "loss": 0.492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3135313391685486, + "step": 975, + "valid_targets_mean": 4694.2, + "valid_targets_min": 1787 + }, + { + "epoch": 1.7320954907161803, + "grad_norm": 0.7119677167199814, + "learning_rate": 3.742672708024711e-05, + "loss": 0.5171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30675750970840454, + "step": 980, + "valid_targets_mean": 2838.9, + "valid_targets_min": 482 + }, + { + "epoch": 1.7409372236958442, + "grad_norm": 0.6482828478440643, + "learning_rate": 3.7383317209940936e-05, + "loss": 0.5151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1551651656627655, + "step": 985, + "valid_targets_mean": 1954.4, + "valid_targets_min": 246 + }, + { + "epoch": 1.7497789566755084, + "grad_norm": 0.7314955066133645, + "learning_rate": 3.7339569856061864e-05, + "loss": 0.5084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22127586603164673, + "step": 990, + "valid_targets_mean": 2476.5, + "valid_targets_min": 826 + }, + { + "epoch": 1.7586206896551724, + "grad_norm": 1.098815890414233, + "learning_rate": 3.7295485867930715e-05, + "loss": 0.509, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23905551433563232, + "step": 995, + "valid_targets_mean": 2440.1, + "valid_targets_min": 321 + }, + { + "epoch": 1.7674624226348365, + "grad_norm": 0.6764041908437947, + "learning_rate": 3.72510661014038e-05, + "loss": 0.5291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24814735352993011, + "step": 1000, + "valid_targets_mean": 3079.6, + "valid_targets_min": 1683 + }, + { + "epoch": 1.7763041556145005, + "grad_norm": 0.5186517018593776, + "learning_rate": 3.720631141885633e-05, + "loss": 0.5058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20242926478385925, + "step": 1005, + "valid_targets_mean": 4913.6, + "valid_targets_min": 628 + }, + { + "epoch": 1.7851458885941645, + "grad_norm": 0.7772370190529831, + "learning_rate": 3.716122268916561e-05, + "loss": 0.4809, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2603060007095337, + "step": 1010, + "valid_targets_mean": 3256.9, + "valid_targets_min": 686 + }, + { + "epoch": 1.7939876215738284, + "grad_norm": 0.5469582973910361, + "learning_rate": 3.711580078769424e-05, + "loss": 0.5089, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27079907059669495, + "step": 1015, + "valid_targets_mean": 4628.6, + "valid_targets_min": 920 + }, + { + "epoch": 1.8028293545534924, + "grad_norm": 0.6974198275003209, + "learning_rate": 3.707004659627308e-05, + "loss": 0.4978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31995758414268494, + "step": 1020, + "valid_targets_mean": 3138.6, + "valid_targets_min": 636 + }, + { + "epoch": 1.8116710875331565, + "grad_norm": 0.6920590455597191, + "learning_rate": 3.702396100318414e-05, + "loss": 0.5847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28330913186073303, + "step": 1025, + "valid_targets_mean": 3097.5, + "valid_targets_min": 1473 + }, + { + "epoch": 1.8205128205128205, + "grad_norm": 0.7496027840560946, + "learning_rate": 3.697754490314335e-05, + "loss": 0.5644, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2400278002023697, + "step": 1030, + "valid_targets_mean": 2275.6, + "valid_targets_min": 719 + }, + { + "epoch": 1.8293545534924847, + "grad_norm": 0.6856958367471065, + "learning_rate": 3.693079919728314e-05, + "loss": 0.4957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2846917510032654, + "step": 1035, + "valid_targets_mean": 3595.0, + "valid_targets_min": 683 + }, + { + "epoch": 1.8381962864721486, + "grad_norm": 0.5935125821966083, + "learning_rate": 3.688372479313503e-05, + "loss": 0.5339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.36108407378196716, + "step": 1040, + "valid_targets_mean": 4035.4, + "valid_targets_min": 1791 + }, + { + "epoch": 1.8470380194518126, + "grad_norm": 0.7416423484223358, + "learning_rate": 3.683632260461191e-05, + "loss": 0.5628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22433266043663025, + "step": 1045, + "valid_targets_mean": 3904.5, + "valid_targets_min": 1328 + }, + { + "epoch": 1.8558797524314765, + "grad_norm": 0.6245382430385877, + "learning_rate": 3.6788593551990395e-05, + "loss": 0.4787, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25612908601760864, + "step": 1050, + "valid_targets_mean": 3262.2, + "valid_targets_min": 666 + }, + { + "epoch": 1.8647214854111405, + "grad_norm": 0.6171431811555288, + "learning_rate": 3.674053856189289e-05, + "loss": 0.5058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35327455401420593, + "step": 1055, + "valid_targets_mean": 4502.4, + "valid_targets_min": 2273 + }, + { + "epoch": 1.8735632183908046, + "grad_norm": 0.6939023212762249, + "learning_rate": 3.66921585672696e-05, + "loss": 0.5145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15852488577365875, + "step": 1060, + "valid_targets_mean": 1888.6, + "valid_targets_min": 239 + }, + { + "epoch": 1.8824049513704686, + "grad_norm": 0.7982037605123552, + "learning_rate": 3.664345450738048e-05, + "loss": 0.4853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16701588034629822, + "step": 1065, + "valid_targets_mean": 1619.1, + "valid_targets_min": 339 + }, + { + "epoch": 1.8912466843501328, + "grad_norm": 0.608658314659487, + "learning_rate": 3.659442732777694e-05, + "loss": 0.5163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3004249930381775, + "step": 1070, + "valid_targets_mean": 5308.4, + "valid_targets_min": 646 + }, + { + "epoch": 1.9000884173297967, + "grad_norm": 0.7906418390790385, + "learning_rate": 3.6545077980283516e-05, + "loss": 0.5004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33155688643455505, + "step": 1075, + "valid_targets_mean": 2850.4, + "valid_targets_min": 758 + }, + { + "epoch": 1.9089301503094607, + "grad_norm": 0.7032647160707013, + "learning_rate": 3.649540742297937e-05, + "loss": 0.5095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2129090428352356, + "step": 1080, + "valid_targets_mean": 2458.6, + "valid_targets_min": 621 + }, + { + "epoch": 1.9177718832891246, + "grad_norm": 0.6238133398192949, + "learning_rate": 3.6445416620179715e-05, + "loss": 0.4988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.209529310464859, + "step": 1085, + "valid_targets_mean": 3219.8, + "valid_targets_min": 1912 + }, + { + "epoch": 1.9266136162687886, + "grad_norm": 0.7568137310829532, + "learning_rate": 3.6395106542417066e-05, + "loss": 0.5155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3271511495113373, + "step": 1090, + "valid_targets_mean": 2758.9, + "valid_targets_min": 1274 + }, + { + "epoch": 1.9354553492484527, + "grad_norm": 0.6192848137574003, + "learning_rate": 3.6344478166422435e-05, + "loss": 0.4981, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2642071545124054, + "step": 1095, + "valid_targets_mean": 3695.9, + "valid_targets_min": 1417 + }, + { + "epoch": 1.9442970822281167, + "grad_norm": 0.7309050802016251, + "learning_rate": 3.6293532475106325e-05, + "loss": 0.482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29965919256210327, + "step": 1100, + "valid_targets_mean": 2750.0, + "valid_targets_min": 454 + }, + { + "epoch": 1.9531388152077809, + "grad_norm": 1.0623788457569725, + "learning_rate": 3.6242270457539695e-05, + "loss": 0.5106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2692793607711792, + "step": 1105, + "valid_targets_mean": 2734.0, + "valid_targets_min": 1420 + }, + { + "epoch": 1.9619805481874448, + "grad_norm": 0.7151768641889232, + "learning_rate": 3.6190693108934685e-05, + "loss": 0.4966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22051319479942322, + "step": 1110, + "valid_targets_mean": 2504.2, + "valid_targets_min": 515 + }, + { + "epoch": 1.9708222811671088, + "grad_norm": 0.6957676386448085, + "learning_rate": 3.613880143062539e-05, + "loss": 0.5274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3472147583961487, + "step": 1115, + "valid_targets_mean": 4914.9, + "valid_targets_min": 2074 + }, + { + "epoch": 1.9796640141467727, + "grad_norm": 0.5806190920195576, + "learning_rate": 3.6086596430048355e-05, + "loss": 0.544, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17797411978244781, + "step": 1120, + "valid_targets_mean": 2610.4, + "valid_targets_min": 1172 + }, + { + "epoch": 1.9885057471264367, + "grad_norm": 0.79939207014776, + "learning_rate": 3.603407912072303e-05, + "loss": 0.4664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3026364743709564, + "step": 1125, + "valid_targets_mean": 2167.8, + "valid_targets_min": 606 + }, + { + "epoch": 1.9973474801061006, + "grad_norm": 0.6158400263989293, + "learning_rate": 3.598125052223209e-05, + "loss": 0.4927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2575317621231079, + "step": 1130, + "valid_targets_mean": 3856.8, + "valid_targets_min": 266 + }, + { + "epoch": 2.0053050397877983, + "grad_norm": 0.6506509574828292, + "learning_rate": 3.592811166020166e-05, + "loss": 0.461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2540547847747803, + "step": 1135, + "valid_targets_mean": 3808.8, + "valid_targets_min": 433 + }, + { + "epoch": 2.0141467727674622, + "grad_norm": 0.7334124808950342, + "learning_rate": 3.5874663566281386e-05, + "loss": 0.4984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2256934642791748, + "step": 1140, + "valid_targets_mean": 2785.5, + "valid_targets_min": 435 + }, + { + "epoch": 2.0229885057471266, + "grad_norm": 0.5825400538253857, + "learning_rate": 3.582090727812441e-05, + "loss": 0.4376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22117963433265686, + "step": 1145, + "valid_targets_mean": 5034.1, + "valid_targets_min": 1744 + }, + { + "epoch": 2.0318302387267906, + "grad_norm": 0.7871465022788394, + "learning_rate": 3.576684383936721e-05, + "loss": 0.4825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28266459703445435, + "step": 1150, + "valid_targets_mean": 2724.8, + "valid_targets_min": 933 + }, + { + "epoch": 2.0406719717064545, + "grad_norm": 0.6415857615517944, + "learning_rate": 3.571247429960939e-05, + "loss": 0.4354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30939337611198425, + "step": 1155, + "valid_targets_mean": 4437.4, + "valid_targets_min": 535 + }, + { + "epoch": 2.0495137046861185, + "grad_norm": 0.6177273757478585, + "learning_rate": 3.5657799714393226e-05, + "loss": 0.4842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17025458812713623, + "step": 1160, + "valid_targets_mean": 3223.8, + "valid_targets_min": 1553 + }, + { + "epoch": 2.0583554376657824, + "grad_norm": 0.833706903246219, + "learning_rate": 3.560282114518324e-05, + "loss": 0.4675, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26239508390426636, + "step": 1165, + "valid_targets_mean": 2714.1, + "valid_targets_min": 1097 + }, + { + "epoch": 2.0671971706454464, + "grad_norm": 0.7225359837532538, + "learning_rate": 3.554753965934556e-05, + "loss": 0.4865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35689157247543335, + "step": 1170, + "valid_targets_mean": 4220.5, + "valid_targets_min": 1543 + }, + { + "epoch": 2.0760389036251103, + "grad_norm": 0.7784056460093122, + "learning_rate": 3.5491956330127206e-05, + "loss": 0.5007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3038363456726074, + "step": 1175, + "valid_targets_mean": 3015.6, + "valid_targets_min": 295 + }, + { + "epoch": 2.0848806366047747, + "grad_norm": 0.6565097352886429, + "learning_rate": 3.543607223663524e-05, + "loss": 0.4824, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24286240339279175, + "step": 1180, + "valid_targets_mean": 3437.2, + "valid_targets_min": 576 + }, + { + "epoch": 2.0937223695844387, + "grad_norm": 0.6492970939073816, + "learning_rate": 3.537988846381585e-05, + "loss": 0.4959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.303530752658844, + "step": 1185, + "valid_targets_mean": 4899.6, + "valid_targets_min": 1488 + }, + { + "epoch": 2.1025641025641026, + "grad_norm": 0.7925259880545755, + "learning_rate": 3.532340610243325e-05, + "loss": 0.5028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27291086316108704, + "step": 1190, + "valid_targets_mean": 3204.2, + "valid_targets_min": 880 + }, + { + "epoch": 2.1114058355437666, + "grad_norm": 0.6589724671449128, + "learning_rate": 3.526662624904852e-05, + "loss": 0.4576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2381266951560974, + "step": 1195, + "valid_targets_mean": 3589.5, + "valid_targets_min": 913 + }, + { + "epoch": 2.1202475685234305, + "grad_norm": 0.7528452910033151, + "learning_rate": 3.5209550005998314e-05, + "loss": 0.4621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2670268714427948, + "step": 1200, + "valid_targets_mean": 3119.5, + "valid_targets_min": 531 + }, + { + "epoch": 2.1290893015030945, + "grad_norm": 0.5446738881024474, + "learning_rate": 3.515217848137347e-05, + "loss": 0.5064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26400917768478394, + "step": 1205, + "valid_targets_mean": 5657.0, + "valid_targets_min": 2360 + }, + { + "epoch": 2.1379310344827585, + "grad_norm": 0.8894408640488581, + "learning_rate": 3.509451278899748e-05, + "loss": 0.4645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17728659510612488, + "step": 1210, + "valid_targets_mean": 2654.2, + "valid_targets_min": 278 + }, + { + "epoch": 2.146772767462423, + "grad_norm": 0.7198826676958434, + "learning_rate": 3.503655404840488e-05, + "loss": 0.4721, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26327475905418396, + "step": 1215, + "valid_targets_mean": 3134.6, + "valid_targets_min": 283 + }, + { + "epoch": 2.155614500442087, + "grad_norm": 0.8407871800228818, + "learning_rate": 3.497830338481949e-05, + "loss": 0.4882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.295600950717926, + "step": 1220, + "valid_targets_mean": 2603.4, + "valid_targets_min": 547 + }, + { + "epoch": 2.1644562334217508, + "grad_norm": 0.6328345124649135, + "learning_rate": 3.491976192913262e-05, + "loss": 0.4497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22263498604297638, + "step": 1225, + "valid_targets_mean": 3946.1, + "valid_targets_min": 447 + }, + { + "epoch": 2.1732979664014147, + "grad_norm": 0.7203331611468773, + "learning_rate": 3.486093081788106e-05, + "loss": 0.4413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2181500494480133, + "step": 1230, + "valid_targets_mean": 2403.6, + "valid_targets_min": 257 + }, + { + "epoch": 2.1821396993810787, + "grad_norm": 1.2624507413601598, + "learning_rate": 3.480181119322504e-05, + "loss": 0.5526, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21810586750507355, + "step": 1235, + "valid_targets_mean": 3192.0, + "valid_targets_min": 574 + }, + { + "epoch": 2.1909814323607426, + "grad_norm": 0.6145928910538749, + "learning_rate": 3.474240420292606e-05, + "loss": 0.4818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26425665616989136, + "step": 1240, + "valid_targets_mean": 4262.5, + "valid_targets_min": 2190 + }, + { + "epoch": 2.1998231653404066, + "grad_norm": 0.7136638714717287, + "learning_rate": 3.4682711000324586e-05, + "loss": 0.4567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22414344549179077, + "step": 1245, + "valid_targets_mean": 3129.0, + "valid_targets_min": 956 + }, + { + "epoch": 2.2086648983200705, + "grad_norm": 0.6530586834174523, + "learning_rate": 3.462273274431769e-05, + "loss": 0.4573, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2845330536365509, + "step": 1250, + "valid_targets_mean": 3753.6, + "valid_targets_min": 354 + }, + { + "epoch": 2.217506631299735, + "grad_norm": 0.6049021187332466, + "learning_rate": 3.456247059933653e-05, + "loss": 0.4824, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23369532823562622, + "step": 1255, + "valid_targets_mean": 3603.4, + "valid_targets_min": 247 + }, + { + "epoch": 2.226348364279399, + "grad_norm": 0.7452682692760721, + "learning_rate": 3.450192573532373e-05, + "loss": 0.5275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.37186628580093384, + "step": 1260, + "valid_targets_mean": 3171.0, + "valid_targets_min": 718 + }, + { + "epoch": 2.235190097259063, + "grad_norm": 0.6365702923616391, + "learning_rate": 3.444109932771072e-05, + "loss": 0.4654, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.261175274848938, + "step": 1265, + "valid_targets_mean": 4370.4, + "valid_targets_min": 1426 + }, + { + "epoch": 2.2440318302387268, + "grad_norm": 0.5681744054075202, + "learning_rate": 3.4379992557394846e-05, + "loss": 0.5126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20251402258872986, + "step": 1270, + "valid_targets_mean": 4562.1, + "valid_targets_min": 1713 + }, + { + "epoch": 2.2528735632183907, + "grad_norm": 0.7410762502762586, + "learning_rate": 3.4318606610716484e-05, + "loss": 0.5167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20561201870441437, + "step": 1275, + "valid_targets_mean": 2180.5, + "valid_targets_min": 1254 + }, + { + "epoch": 2.2617152961980547, + "grad_norm": 0.5452558320658369, + "learning_rate": 3.4256942679436015e-05, + "loss": 0.4922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19533419609069824, + "step": 1280, + "valid_targets_mean": 3569.5, + "valid_targets_min": 1534 + }, + { + "epoch": 2.270557029177719, + "grad_norm": 0.7468519348908569, + "learning_rate": 3.419500196071067e-05, + "loss": 0.4754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2667611241340637, + "step": 1285, + "valid_targets_mean": 2884.8, + "valid_targets_min": 641 + }, + { + "epoch": 2.279398762157383, + "grad_norm": 0.6333342302390959, + "learning_rate": 3.413278565707128e-05, + "loss": 0.4993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15673427283763885, + "step": 1290, + "valid_targets_mean": 2277.5, + "valid_targets_min": 340 + }, + { + "epoch": 2.288240495137047, + "grad_norm": 0.6520958194331384, + "learning_rate": 3.407029497639896e-05, + "loss": 0.4577, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2410448044538498, + "step": 1295, + "valid_targets_mean": 3485.1, + "valid_targets_min": 844 + }, + { + "epoch": 2.297082228116711, + "grad_norm": 0.7282805052878496, + "learning_rate": 3.400753113190164e-05, + "loss": 0.5239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.356065034866333, + "step": 1300, + "valid_targets_mean": 2978.1, + "valid_targets_min": 327 + }, + { + "epoch": 2.305923961096375, + "grad_norm": 0.7494491120423273, + "learning_rate": 3.394449534209049e-05, + "loss": 0.475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2870040535926819, + "step": 1305, + "valid_targets_mean": 3106.1, + "valid_targets_min": 646 + }, + { + "epoch": 2.314765694076039, + "grad_norm": 0.7866263743420345, + "learning_rate": 3.388118883075632e-05, + "loss": 0.4645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3140355348587036, + "step": 1310, + "valid_targets_mean": 2766.9, + "valid_targets_min": 1396 + }, + { + "epoch": 2.323607427055703, + "grad_norm": 0.6490756330304519, + "learning_rate": 3.381761282694576e-05, + "loss": 0.4587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1746228039264679, + "step": 1315, + "valid_targets_mean": 1878.6, + "valid_targets_min": 366 + }, + { + "epoch": 2.3324491600353667, + "grad_norm": 0.5903200212592301, + "learning_rate": 3.375376856493744e-05, + "loss": 0.474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2511587142944336, + "step": 1320, + "valid_targets_mean": 4894.8, + "valid_targets_min": 641 + }, + { + "epoch": 2.341290893015031, + "grad_norm": 2.254093889370584, + "learning_rate": 3.368965728421802e-05, + "loss": 0.4457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.161946639418602, + "step": 1325, + "valid_targets_mean": 2834.8, + "valid_targets_min": 392 + }, + { + "epoch": 2.350132625994695, + "grad_norm": 0.9142370689095928, + "learning_rate": 3.362528022945811e-05, + "loss": 0.4635, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2488413155078888, + "step": 1330, + "valid_targets_mean": 1759.2, + "valid_targets_min": 432 + }, + { + "epoch": 2.358974358974359, + "grad_norm": 0.6231014207273252, + "learning_rate": 3.3560638650488116e-05, + "loss": 0.481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24347589910030365, + "step": 1335, + "valid_targets_mean": 3643.8, + "valid_targets_min": 1798 + }, + { + "epoch": 2.367816091954023, + "grad_norm": 0.7798321013057438, + "learning_rate": 3.3495733802273973e-05, + "loss": 0.4947, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27684855461120605, + "step": 1340, + "valid_targets_mean": 2807.4, + "valid_targets_min": 671 + }, + { + "epoch": 2.376657824933687, + "grad_norm": 0.6835229910495109, + "learning_rate": 3.3430566944892797e-05, + "loss": 0.4769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20981459319591522, + "step": 1345, + "valid_targets_mean": 2786.4, + "valid_targets_min": 697 + }, + { + "epoch": 2.385499557913351, + "grad_norm": 0.7027687967506704, + "learning_rate": 3.3365139343508394e-05, + "loss": 0.5036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24709592759609222, + "step": 1350, + "valid_targets_mean": 2751.4, + "valid_targets_min": 429 + }, + { + "epoch": 2.394341290893015, + "grad_norm": 0.6262006292592385, + "learning_rate": 3.329945226834672e-05, + "loss": 0.4645, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18077601492404938, + "step": 1355, + "valid_targets_mean": 2843.1, + "valid_targets_min": 994 + }, + { + "epoch": 2.4031830238726792, + "grad_norm": 0.6277485840526359, + "learning_rate": 3.3233506994671226e-05, + "loss": 0.4951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2642451524734497, + "step": 1360, + "valid_targets_mean": 3429.4, + "valid_targets_min": 446 + }, + { + "epoch": 2.412024756852343, + "grad_norm": 0.6280596559682324, + "learning_rate": 3.316730480275804e-05, + "loss": 0.4464, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22805391252040863, + "step": 1365, + "valid_targets_mean": 3516.9, + "valid_targets_min": 1427 + }, + { + "epoch": 2.420866489832007, + "grad_norm": 0.6174264929077061, + "learning_rate": 3.3100846977871205e-05, + "loss": 0.4913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2780839502811432, + "step": 1370, + "valid_targets_mean": 4372.0, + "valid_targets_min": 595 + }, + { + "epoch": 2.429708222811671, + "grad_norm": 0.656729892977582, + "learning_rate": 3.303413481023767e-05, + "loss": 0.4994, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19668014347553253, + "step": 1375, + "valid_targets_mean": 2811.8, + "valid_targets_min": 482 + }, + { + "epoch": 2.438549955791335, + "grad_norm": 0.7226257651578697, + "learning_rate": 3.296716959502222e-05, + "loss": 0.4784, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22153441607952118, + "step": 1380, + "valid_targets_mean": 2547.9, + "valid_targets_min": 650 + }, + { + "epoch": 2.447391688770999, + "grad_norm": 0.7651983874835208, + "learning_rate": 3.2899952632302406e-05, + "loss": 0.4922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2565222978591919, + "step": 1385, + "valid_targets_mean": 2316.4, + "valid_targets_min": 389 + }, + { + "epoch": 2.456233421750663, + "grad_norm": 0.629453575504003, + "learning_rate": 3.2832485227043224e-05, + "loss": 0.4593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19831818342208862, + "step": 1390, + "valid_targets_mean": 3157.9, + "valid_targets_min": 1057 + }, + { + "epoch": 2.465075154730327, + "grad_norm": 0.6047254462995167, + "learning_rate": 3.276476868907185e-05, + "loss": 0.4621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29224517941474915, + "step": 1395, + "valid_targets_mean": 4613.8, + "valid_targets_min": 1331 + }, + { + "epoch": 2.4739168877099913, + "grad_norm": 0.7333279372759346, + "learning_rate": 3.2696804333052134e-05, + "loss": 0.497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1974330097436905, + "step": 1400, + "valid_targets_mean": 2125.1, + "valid_targets_min": 329 + }, + { + "epoch": 2.4827586206896552, + "grad_norm": 0.7776273687671615, + "learning_rate": 3.2628593478459166e-05, + "loss": 0.5055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2529323399066925, + "step": 1405, + "valid_targets_mean": 2489.1, + "valid_targets_min": 724 + }, + { + "epoch": 2.491600353669319, + "grad_norm": 0.7273539498207023, + "learning_rate": 3.256013744955359e-05, + "loss": 0.4718, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30455833673477173, + "step": 1410, + "valid_targets_mean": 3809.0, + "valid_targets_min": 1703 + }, + { + "epoch": 2.500442086648983, + "grad_norm": 0.564269031629325, + "learning_rate": 3.249143757535593e-05, + "loss": 0.4583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21314361691474915, + "step": 1415, + "valid_targets_mean": 3426.6, + "valid_targets_min": 1214 + }, + { + "epoch": 2.509283819628647, + "grad_norm": 0.5557251931105729, + "learning_rate": 3.242249518962075e-05, + "loss": 0.4994, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18279360234737396, + "step": 1420, + "valid_targets_mean": 3213.4, + "valid_targets_min": 1033 + }, + { + "epoch": 2.5181255526083115, + "grad_norm": 0.550481771742281, + "learning_rate": 3.2353311630810824e-05, + "loss": 0.4564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30488190054893494, + "step": 1425, + "valid_targets_mean": 5551.5, + "valid_targets_min": 1786 + }, + { + "epoch": 2.5269672855879755, + "grad_norm": 0.7806815136684526, + "learning_rate": 3.2283888242071084e-05, + "loss": 0.4889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23620276153087616, + "step": 1430, + "valid_targets_mean": 2326.1, + "valid_targets_min": 260 + }, + { + "epoch": 2.5358090185676394, + "grad_norm": 0.6636248793061827, + "learning_rate": 3.221422637120259e-05, + "loss": 0.4679, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1364372968673706, + "step": 1435, + "valid_targets_mean": 1784.4, + "valid_targets_min": 384 + }, + { + "epoch": 2.5446507515473034, + "grad_norm": 0.689385789889328, + "learning_rate": 3.2144327370636346e-05, + "loss": 0.454, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20073749125003815, + "step": 1440, + "valid_targets_mean": 3205.1, + "valid_targets_min": 381 + }, + { + "epoch": 2.5534924845269673, + "grad_norm": 0.6328008971941544, + "learning_rate": 3.2074192597407035e-05, + "loss": 0.4613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3022666573524475, + "step": 1445, + "valid_targets_mean": 4333.4, + "valid_targets_min": 1507 + }, + { + "epoch": 2.5623342175066313, + "grad_norm": 0.59131850878343, + "learning_rate": 3.200382341312669e-05, + "loss": 0.4492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17799311876296997, + "step": 1450, + "valid_targets_mean": 3369.5, + "valid_targets_min": 1668 + }, + { + "epoch": 2.571175950486295, + "grad_norm": 0.7805466539055157, + "learning_rate": 3.193322118395825e-05, + "loss": 0.4892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27352964878082275, + "step": 1455, + "valid_targets_mean": 2186.5, + "valid_targets_min": 560 + }, + { + "epoch": 2.580017683465959, + "grad_norm": 0.6876454265526983, + "learning_rate": 3.1862387280589035e-05, + "loss": 0.4779, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3268851041793823, + "step": 1460, + "valid_targets_mean": 3722.8, + "valid_targets_min": 1455 + }, + { + "epoch": 2.588859416445623, + "grad_norm": 0.6736850428355156, + "learning_rate": 3.179132307820415e-05, + "loss": 0.4415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23798906803131104, + "step": 1465, + "valid_targets_mean": 2838.0, + "valid_targets_min": 682 + }, + { + "epoch": 2.5977011494252875, + "grad_norm": 0.596929830688196, + "learning_rate": 3.1720029956459765e-05, + "loss": 0.4591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2674519419670105, + "step": 1470, + "valid_targets_mean": 4175.8, + "valid_targets_min": 1486 + }, + { + "epoch": 2.6065428824049515, + "grad_norm": 0.5748031569774971, + "learning_rate": 3.1648509299456354e-05, + "loss": 0.4262, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2019733488559723, + "step": 1475, + "valid_targets_mean": 3431.9, + "valid_targets_min": 417 + }, + { + "epoch": 2.6153846153846154, + "grad_norm": 0.6572317898083503, + "learning_rate": 3.15767624957118e-05, + "loss": 0.5071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3238973915576935, + "step": 1480, + "valid_targets_mean": 4004.2, + "valid_targets_min": 1921 + }, + { + "epoch": 2.6242263483642794, + "grad_norm": 0.6374727405441111, + "learning_rate": 3.150479093813444e-05, + "loss": 0.4698, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.257358580827713, + "step": 1485, + "valid_targets_mean": 3410.9, + "valid_targets_min": 1841 + }, + { + "epoch": 2.6330680813439433, + "grad_norm": 0.7370301376235759, + "learning_rate": 3.143259602399605e-05, + "loss": 0.4813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24704976379871368, + "step": 1490, + "valid_targets_mean": 2845.5, + "valid_targets_min": 494 + }, + { + "epoch": 2.6419098143236073, + "grad_norm": 0.6458521957650634, + "learning_rate": 3.13601791549047e-05, + "loss": 0.4572, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21648521721363068, + "step": 1495, + "valid_targets_mean": 2931.2, + "valid_targets_min": 1190 + }, + { + "epoch": 2.6507515473032717, + "grad_norm": 0.6857098017912163, + "learning_rate": 3.128754173677753e-05, + "loss": 0.4732, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17468172311782837, + "step": 1500, + "valid_targets_mean": 2179.5, + "valid_targets_min": 428 + }, + { + "epoch": 2.6595932802829356, + "grad_norm": 0.7760295420887048, + "learning_rate": 3.121468517981348e-05, + "loss": 0.4793, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2126651257276535, + "step": 1505, + "valid_targets_mean": 2069.2, + "valid_targets_min": 643 + }, + { + "epoch": 2.6684350132625996, + "grad_norm": 0.7256165385608961, + "learning_rate": 3.1141610898465886e-05, + "loss": 0.4586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24016624689102173, + "step": 1510, + "valid_targets_mean": 2405.6, + "valid_targets_min": 769 + }, + { + "epoch": 2.6772767462422635, + "grad_norm": 0.8041492470671632, + "learning_rate": 3.106832031141505e-05, + "loss": 0.4882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2537711560726166, + "step": 1515, + "valid_targets_mean": 2232.1, + "valid_targets_min": 538 + }, + { + "epoch": 2.6861184792219275, + "grad_norm": 0.6768740030703516, + "learning_rate": 3.099481484154066e-05, + "loss": 0.4694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2770196199417114, + "step": 1520, + "valid_targets_mean": 3394.1, + "valid_targets_min": 951 + }, + { + "epoch": 2.6949602122015914, + "grad_norm": 0.7614885023952586, + "learning_rate": 3.092109591589421e-05, + "loss": 0.47, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24348753690719604, + "step": 1525, + "valid_targets_mean": 1985.0, + "valid_targets_min": 661 + }, + { + "epoch": 2.7038019451812554, + "grad_norm": 0.6973530090116009, + "learning_rate": 3.084716496567125e-05, + "loss": 0.4691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2216261327266693, + "step": 1530, + "valid_targets_mean": 2607.2, + "valid_targets_min": 927 + }, + { + "epoch": 2.7126436781609193, + "grad_norm": 0.6643269820883152, + "learning_rate": 3.0773023426183646e-05, + "loss": 0.5029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21378345787525177, + "step": 1535, + "valid_targets_mean": 2372.9, + "valid_targets_min": 298 + }, + { + "epoch": 2.7214854111405833, + "grad_norm": 0.6302383408350807, + "learning_rate": 3.069867273683166e-05, + "loss": 0.4813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18604375422000885, + "step": 1540, + "valid_targets_mean": 2405.8, + "valid_targets_min": 708 + }, + { + "epoch": 2.7303271441202477, + "grad_norm": 0.7402043292567106, + "learning_rate": 3.062411434107607e-05, + "loss": 0.4961, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27701494097709656, + "step": 1545, + "valid_targets_mean": 3043.9, + "valid_targets_min": 1120 + }, + { + "epoch": 2.7391688770999116, + "grad_norm": 0.7333854416465081, + "learning_rate": 3.0549349686410086e-05, + "loss": 0.4807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1735975593328476, + "step": 1550, + "valid_targets_mean": 1787.8, + "valid_targets_min": 1101 + }, + { + "epoch": 2.7480106100795756, + "grad_norm": 0.5787318917413554, + "learning_rate": 3.0474380224331292e-05, + "loss": 0.4601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26284363865852356, + "step": 1555, + "valid_targets_mean": 3658.6, + "valid_targets_min": 1467 + }, + { + "epoch": 2.7568523430592395, + "grad_norm": 0.5153363716994127, + "learning_rate": 3.039920741031342e-05, + "loss": 0.452, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1932397484779358, + "step": 1560, + "valid_targets_mean": 3985.8, + "valid_targets_min": 2070 + }, + { + "epoch": 2.7656940760389035, + "grad_norm": 0.7429137625185662, + "learning_rate": 3.0323832703778168e-05, + "loss": 0.477, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2431662678718567, + "step": 1565, + "valid_targets_mean": 2817.0, + "valid_targets_min": 1312 + }, + { + "epoch": 2.774535809018568, + "grad_norm": 0.6481250155554005, + "learning_rate": 3.024825756806677e-05, + "loss": 0.4784, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3212037980556488, + "step": 1570, + "valid_targets_mean": 3536.4, + "valid_targets_min": 307 + }, + { + "epoch": 2.783377541998232, + "grad_norm": 0.5946835818022652, + "learning_rate": 3.017248347041168e-05, + "loss": 0.4674, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17257541418075562, + "step": 1575, + "valid_targets_mean": 3216.1, + "valid_targets_min": 338 + }, + { + "epoch": 2.792219274977896, + "grad_norm": 0.7079495479617642, + "learning_rate": 3.0096511881908007e-05, + "loss": 0.476, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25472956895828247, + "step": 1580, + "valid_targets_mean": 2929.1, + "valid_targets_min": 920 + }, + { + "epoch": 2.8010610079575597, + "grad_norm": 0.6686876235075944, + "learning_rate": 3.0020344277485017e-05, + "loss": 0.48, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24332070350646973, + "step": 1585, + "valid_targets_mean": 3509.1, + "valid_targets_min": 1355 + }, + { + "epoch": 2.8099027409372237, + "grad_norm": 0.5961265521760359, + "learning_rate": 2.994398213587746e-05, + "loss": 0.4652, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16399900615215302, + "step": 1590, + "valid_targets_mean": 2690.2, + "valid_targets_min": 998 + }, + { + "epoch": 2.8187444739168876, + "grad_norm": 0.6932732714841346, + "learning_rate": 2.9867426939596876e-05, + "loss": 0.4838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23998896777629852, + "step": 1595, + "valid_targets_mean": 2742.6, + "valid_targets_min": 462 + }, + { + "epoch": 2.8275862068965516, + "grad_norm": 0.6373428022728593, + "learning_rate": 2.9790680174902818e-05, + "loss": 0.4958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28616029024124146, + "step": 1600, + "valid_targets_mean": 3503.4, + "valid_targets_min": 1984 + }, + { + "epoch": 2.8364279398762156, + "grad_norm": 0.5701727639748247, + "learning_rate": 2.971374333177398e-05, + "loss": 0.4531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2033827304840088, + "step": 1605, + "valid_targets_mean": 3583.5, + "valid_targets_min": 371 + }, + { + "epoch": 2.8452696728558795, + "grad_norm": 0.6938709515640729, + "learning_rate": 2.963661790387928e-05, + "loss": 0.4687, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16415715217590332, + "step": 1610, + "valid_targets_mean": 1516.6, + "valid_targets_min": 348 + }, + { + "epoch": 2.854111405835544, + "grad_norm": 0.6819822107535831, + "learning_rate": 2.9559305388548884e-05, + "loss": 0.4605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30489426851272583, + "step": 1615, + "valid_targets_mean": 3739.5, + "valid_targets_min": 1669 + }, + { + "epoch": 2.862953138815208, + "grad_norm": 0.6256616922874445, + "learning_rate": 2.948180728674508e-05, + "loss": 0.4769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2562219798564911, + "step": 1620, + "valid_targets_mean": 3812.9, + "valid_targets_min": 446 + }, + { + "epoch": 2.871794871794872, + "grad_norm": 0.6400236041741094, + "learning_rate": 2.9404125103033207e-05, + "loss": 0.4986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29524898529052734, + "step": 1625, + "valid_targets_mean": 4371.4, + "valid_targets_min": 1584 + }, + { + "epoch": 2.8806366047745358, + "grad_norm": 0.6341608498880749, + "learning_rate": 2.9326260345552384e-05, + "loss": 0.4532, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2372559905052185, + "step": 1630, + "valid_targets_mean": 3315.1, + "valid_targets_min": 807 + }, + { + "epoch": 2.8894783377541997, + "grad_norm": 0.6276072795012839, + "learning_rate": 2.924821452598628e-05, + "loss": 0.4596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32003140449523926, + "step": 1635, + "valid_targets_mean": 4198.9, + "valid_targets_min": 294 + }, + { + "epoch": 2.898320070733864, + "grad_norm": 0.7616482436393485, + "learning_rate": 2.916998915953373e-05, + "loss": 0.4898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20601674914360046, + "step": 1640, + "valid_targets_mean": 2052.5, + "valid_targets_min": 778 + }, + { + "epoch": 2.907161803713528, + "grad_norm": 0.5882065240627146, + "learning_rate": 2.9091585764879334e-05, + "loss": 0.4942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24223053455352783, + "step": 1645, + "valid_targets_mean": 4031.1, + "valid_targets_min": 378 + }, + { + "epoch": 2.916003536693192, + "grad_norm": 0.6054495841065836, + "learning_rate": 2.9013005864163967e-05, + "loss": 0.4683, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18661022186279297, + "step": 1650, + "valid_targets_mean": 3359.5, + "valid_targets_min": 1665 + }, + { + "epoch": 2.924845269672856, + "grad_norm": 0.6838185112738919, + "learning_rate": 2.8934250982955245e-05, + "loss": 0.5104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21030931174755096, + "step": 1655, + "valid_targets_mean": 2463.9, + "valid_targets_min": 367 + }, + { + "epoch": 2.93368700265252, + "grad_norm": 0.5869513062851025, + "learning_rate": 2.8855322650217878e-05, + "loss": 0.4734, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2261839509010315, + "step": 1660, + "valid_targets_mean": 4131.2, + "valid_targets_min": 1915 + }, + { + "epoch": 2.942528735632184, + "grad_norm": 0.6635908796868752, + "learning_rate": 2.877622239828402e-05, + "loss": 0.4742, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3128895163536072, + "step": 1665, + "valid_targets_mean": 3485.6, + "valid_targets_min": 1311 + }, + { + "epoch": 2.951370468611848, + "grad_norm": 0.5866931808918497, + "learning_rate": 2.8696951762823482e-05, + "loss": 0.4536, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27576667070388794, + "step": 1670, + "valid_targets_mean": 5840.1, + "valid_targets_min": 867 + }, + { + "epoch": 2.9602122015915118, + "grad_norm": 0.7047207677935268, + "learning_rate": 2.8617512282813962e-05, + "loss": 0.4773, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2672806978225708, + "step": 1675, + "valid_targets_mean": 3142.0, + "valid_targets_min": 411 + }, + { + "epoch": 2.9690539345711757, + "grad_norm": 0.6805728312782533, + "learning_rate": 2.8537905500511115e-05, + "loss": 0.4409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22739487886428833, + "step": 1680, + "valid_targets_mean": 2617.9, + "valid_targets_min": 488 + }, + { + "epoch": 2.97789566755084, + "grad_norm": 0.6399928488222026, + "learning_rate": 2.845813296141867e-05, + "loss": 0.4841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.33402326703071594, + "step": 1685, + "valid_targets_mean": 3724.4, + "valid_targets_min": 283 + }, + { + "epoch": 2.986737400530504, + "grad_norm": 0.657324357265603, + "learning_rate": 2.8378196214258368e-05, + "loss": 0.4642, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23617523908615112, + "step": 1690, + "valid_targets_mean": 3832.5, + "valid_targets_min": 442 + }, + { + "epoch": 2.995579133510168, + "grad_norm": 0.7665365085077115, + "learning_rate": 2.8298096810939947e-05, + "loss": 0.4763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22332416474819183, + "step": 1695, + "valid_targets_mean": 2495.6, + "valid_targets_min": 1444 + }, + { + "epoch": 3.0035366931918657, + "grad_norm": 0.6631145203555193, + "learning_rate": 2.821783630653097e-05, + "loss": 0.4496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.41785138845443726, + "step": 1700, + "valid_targets_mean": 4816.5, + "valid_targets_min": 2915 + }, + { + "epoch": 3.0123784261715296, + "grad_norm": 0.6337435624348, + "learning_rate": 2.8137416259226647e-05, + "loss": 0.4547, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2246091365814209, + "step": 1705, + "valid_targets_mean": 3841.2, + "valid_targets_min": 1235 + }, + { + "epoch": 3.0212201591511936, + "grad_norm": 0.6936797200273987, + "learning_rate": 2.805683823031962e-05, + "loss": 0.4457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1735125035047531, + "step": 1710, + "valid_targets_mean": 2731.0, + "valid_targets_min": 714 + }, + { + "epoch": 3.0300618921308575, + "grad_norm": 0.7891995315990228, + "learning_rate": 2.797610378416958e-05, + "loss": 0.4231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16492772102355957, + "step": 1715, + "valid_targets_mean": 2113.0, + "valid_targets_min": 578 + }, + { + "epoch": 3.0389036251105215, + "grad_norm": 0.7386808391583857, + "learning_rate": 2.789521448817297e-05, + "loss": 0.4209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26257234811782837, + "step": 1720, + "valid_targets_mean": 3744.8, + "valid_targets_min": 1677 + }, + { + "epoch": 3.047745358090186, + "grad_norm": 0.8448422789924801, + "learning_rate": 2.7814171912732505e-05, + "loss": 0.4595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2198343276977539, + "step": 1725, + "valid_targets_mean": 2466.9, + "valid_targets_min": 579 + }, + { + "epoch": 3.05658709106985, + "grad_norm": 0.5394050393186041, + "learning_rate": 2.7732977631226707e-05, + "loss": 0.4599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1662464141845703, + "step": 1730, + "valid_targets_mean": 3657.5, + "valid_targets_min": 418 + }, + { + "epoch": 3.065428824049514, + "grad_norm": 0.7249259150149697, + "learning_rate": 2.7651633219979354e-05, + "loss": 0.4421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2690415382385254, + "step": 1735, + "valid_targets_mean": 3475.8, + "valid_targets_min": 1327 + }, + { + "epoch": 3.0742705570291777, + "grad_norm": 0.5613143824306901, + "learning_rate": 2.757014025822887e-05, + "loss": 0.4157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1862303614616394, + "step": 1740, + "valid_targets_mean": 5056.2, + "valid_targets_min": 562 + }, + { + "epoch": 3.0831122900088417, + "grad_norm": 0.6722692705575857, + "learning_rate": 2.7488500328097676e-05, + "loss": 0.4646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23648124933242798, + "step": 1745, + "valid_targets_mean": 2867.6, + "valid_targets_min": 595 + }, + { + "epoch": 3.0919540229885056, + "grad_norm": 0.6814783628326924, + "learning_rate": 2.740671501456147e-05, + "loss": 0.4398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12536823749542236, + "step": 1750, + "valid_targets_mean": 1615.6, + "valid_targets_min": 327 + }, + { + "epoch": 3.1007957559681696, + "grad_norm": 0.6898698530287688, + "learning_rate": 2.732478590541846e-05, + "loss": 0.4825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14612561464309692, + "step": 1755, + "valid_targets_mean": 2145.4, + "valid_targets_min": 409 + }, + { + "epoch": 3.109637488947834, + "grad_norm": 0.7057545284878672, + "learning_rate": 2.7242714591258515e-05, + "loss": 0.4489, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2028021216392517, + "step": 1760, + "valid_targets_mean": 2730.9, + "valid_targets_min": 821 + }, + { + "epoch": 3.118479221927498, + "grad_norm": 0.7145345954957985, + "learning_rate": 2.716050266543233e-05, + "loss": 0.447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2143976241350174, + "step": 1765, + "valid_targets_mean": 2795.2, + "valid_targets_min": 354 + }, + { + "epoch": 3.127320954907162, + "grad_norm": 0.6387454256981671, + "learning_rate": 2.707815172402045e-05, + "loss": 0.4511, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2258991003036499, + "step": 1770, + "valid_targets_mean": 4250.8, + "valid_targets_min": 292 + }, + { + "epoch": 3.136162687886826, + "grad_norm": 0.6217741057104463, + "learning_rate": 2.6995663365802297e-05, + "loss": 0.4653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2483760118484497, + "step": 1775, + "valid_targets_mean": 4210.9, + "valid_targets_min": 283 + }, + { + "epoch": 3.14500442086649, + "grad_norm": 0.6457517067956914, + "learning_rate": 2.6913039192225143e-05, + "loss": 0.4716, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32969963550567627, + "step": 1780, + "valid_targets_mean": 4354.4, + "valid_targets_min": 756 + }, + { + "epoch": 3.1538461538461537, + "grad_norm": 0.6429893214891368, + "learning_rate": 2.683028080737301e-05, + "loss": 0.4321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21806424856185913, + "step": 1785, + "valid_targets_mean": 3157.8, + "valid_targets_min": 532 + }, + { + "epoch": 3.1626878868258177, + "grad_norm": 0.692439432500108, + "learning_rate": 2.6747389817935513e-05, + "loss": 0.4697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31872475147247314, + "step": 1790, + "valid_targets_mean": 3962.4, + "valid_targets_min": 956 + }, + { + "epoch": 3.171529619805482, + "grad_norm": 0.655636164934992, + "learning_rate": 2.6664367833176706e-05, + "loss": 0.4435, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24065600335597992, + "step": 1795, + "valid_targets_mean": 4039.6, + "valid_targets_min": 767 + }, + { + "epoch": 3.180371352785146, + "grad_norm": 0.6356274580947101, + "learning_rate": 2.6581216464903783e-05, + "loss": 0.447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21401917934417725, + "step": 1800, + "valid_targets_mean": 3759.8, + "valid_targets_min": 778 + }, + { + "epoch": 3.18921308576481, + "grad_norm": 0.6755187398673654, + "learning_rate": 2.649793732743585e-05, + "loss": 0.4587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2595488727092743, + "step": 1805, + "valid_targets_mean": 4247.6, + "valid_targets_min": 583 + }, + { + "epoch": 3.198054818744474, + "grad_norm": 0.6601036816629008, + "learning_rate": 2.641453203757253e-05, + "loss": 0.4575, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24937765300273895, + "step": 1810, + "valid_targets_mean": 5081.9, + "valid_targets_min": 1584 + }, + { + "epoch": 3.206896551724138, + "grad_norm": 0.7345675030768746, + "learning_rate": 2.6331002214562612e-05, + "loss": 0.4535, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2856788635253906, + "step": 1815, + "valid_targets_mean": 3258.6, + "valid_targets_min": 418 + }, + { + "epoch": 3.215738284703802, + "grad_norm": 0.6443854997962501, + "learning_rate": 2.624734948007259e-05, + "loss": 0.4782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19514860212802887, + "step": 1820, + "valid_targets_mean": 2690.8, + "valid_targets_min": 1080 + }, + { + "epoch": 3.224580017683466, + "grad_norm": 0.6505251815752711, + "learning_rate": 2.616357545815518e-05, + "loss": 0.4341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18154998123645782, + "step": 1825, + "valid_targets_mean": 2853.5, + "valid_targets_min": 1039 + }, + { + "epoch": 3.2334217506631298, + "grad_norm": 0.639089706648105, + "learning_rate": 2.6079681775217833e-05, + "loss": 0.4494, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1521425098180771, + "step": 1830, + "valid_targets_mean": 2546.0, + "valid_targets_min": 1092 + }, + { + "epoch": 3.242263483642794, + "grad_norm": 0.8346126474494834, + "learning_rate": 2.5995670059991085e-05, + "loss": 0.4564, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20812271535396576, + "step": 1835, + "valid_targets_mean": 2109.9, + "valid_targets_min": 475 + }, + { + "epoch": 3.251105216622458, + "grad_norm": 0.6974668474879332, + "learning_rate": 2.5911541943497e-05, + "loss": 0.4148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21064886450767517, + "step": 1840, + "valid_targets_mean": 3080.6, + "valid_targets_min": 308 + }, + { + "epoch": 3.259946949602122, + "grad_norm": 0.7071438987421578, + "learning_rate": 2.582729905901747e-05, + "loss": 0.4271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3176460564136505, + "step": 1845, + "valid_targets_mean": 3679.4, + "valid_targets_min": 835 + }, + { + "epoch": 3.268788682581786, + "grad_norm": 0.8145462041803657, + "learning_rate": 2.574294304206254e-05, + "loss": 0.4524, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27845755219459534, + "step": 1850, + "valid_targets_mean": 2862.0, + "valid_targets_min": 557 + }, + { + "epoch": 3.27763041556145, + "grad_norm": 0.7045266012648904, + "learning_rate": 2.56584755303386e-05, + "loss": 0.4439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2471604347229004, + "step": 1855, + "valid_targets_mean": 3010.8, + "valid_targets_min": 659 + }, + { + "epoch": 3.286472148541114, + "grad_norm": 0.7384311436163473, + "learning_rate": 2.5573898163716663e-05, + "loss": 0.4215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20069456100463867, + "step": 1860, + "valid_targets_mean": 2391.2, + "valid_targets_min": 546 + }, + { + "epoch": 3.2953138815207783, + "grad_norm": 0.766502608504117, + "learning_rate": 2.5489212584200446e-05, + "loss": 0.448, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2833523452281952, + "step": 1865, + "valid_targets_mean": 2948.2, + "valid_targets_min": 340 + }, + { + "epoch": 3.3041556145004423, + "grad_norm": 0.9146044226587593, + "learning_rate": 2.5404420435894578e-05, + "loss": 0.449, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.265963613986969, + "step": 1870, + "valid_targets_mean": 2752.6, + "valid_targets_min": 587 + }, + { + "epoch": 3.312997347480106, + "grad_norm": 0.557404768668353, + "learning_rate": 2.5319523364972606e-05, + "loss": 0.447, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22600683569908142, + "step": 1875, + "valid_targets_mean": 5350.0, + "valid_targets_min": 433 + }, + { + "epoch": 3.32183908045977, + "grad_norm": 0.7993682463700219, + "learning_rate": 2.5234523019645086e-05, + "loss": 0.4362, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2509821057319641, + "step": 1880, + "valid_targets_mean": 2375.5, + "valid_targets_min": 605 + }, + { + "epoch": 3.330680813439434, + "grad_norm": 0.58659727071677, + "learning_rate": 2.5149421050127556e-05, + "loss": 0.4341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19044440984725952, + "step": 1885, + "valid_targets_mean": 4073.1, + "valid_targets_min": 1747 + }, + { + "epoch": 3.339522546419098, + "grad_norm": 0.7845792945000336, + "learning_rate": 2.5064219108608525e-05, + "loss": 0.4351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1808401346206665, + "step": 1890, + "valid_targets_mean": 1915.0, + "valid_targets_min": 461 + }, + { + "epoch": 3.348364279398762, + "grad_norm": 0.7289729636417263, + "learning_rate": 2.497891884921735e-05, + "loss": 0.4492, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19839441776275635, + "step": 1895, + "valid_targets_mean": 2404.8, + "valid_targets_min": 386 + }, + { + "epoch": 3.357206012378426, + "grad_norm": 0.6820854233253595, + "learning_rate": 2.4893521927992182e-05, + "loss": 0.4703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27235740423202515, + "step": 1900, + "valid_targets_mean": 2999.2, + "valid_targets_min": 442 + }, + { + "epoch": 3.3660477453580904, + "grad_norm": 0.5855412571643762, + "learning_rate": 2.4808030002847775e-05, + "loss": 0.4376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19236628711223602, + "step": 1905, + "valid_targets_mean": 3963.6, + "valid_targets_min": 1110 + }, + { + "epoch": 3.3748894783377543, + "grad_norm": 0.7338094054626427, + "learning_rate": 2.472244473354332e-05, + "loss": 0.4769, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22928746044635773, + "step": 1910, + "valid_targets_mean": 2708.8, + "valid_targets_min": 1158 + }, + { + "epoch": 3.3837312113174183, + "grad_norm": 0.7995982234481557, + "learning_rate": 2.4636767781650183e-05, + "loss": 0.4615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2549368739128113, + "step": 1915, + "valid_targets_mean": 2276.2, + "valid_targets_min": 1059 + }, + { + "epoch": 3.3925729442970822, + "grad_norm": 0.6376992232354394, + "learning_rate": 2.4551000810519714e-05, + "loss": 0.4899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2908145785331726, + "step": 1920, + "valid_targets_mean": 4513.8, + "valid_targets_min": 294 + }, + { + "epoch": 3.401414677276746, + "grad_norm": 0.7776074545649672, + "learning_rate": 2.4465145485250888e-05, + "loss": 0.4519, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23057112097740173, + "step": 1925, + "valid_targets_mean": 3097.4, + "valid_targets_min": 670 + }, + { + "epoch": 3.41025641025641, + "grad_norm": 0.7652952479222617, + "learning_rate": 2.437920347265802e-05, + "loss": 0.4214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17387378215789795, + "step": 1930, + "valid_targets_mean": 1660.1, + "valid_targets_min": 289 + }, + { + "epoch": 3.419098143236074, + "grad_norm": 0.6605377290323325, + "learning_rate": 2.4293176441238396e-05, + "loss": 0.4112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23506543040275574, + "step": 1935, + "valid_targets_mean": 3702.8, + "valid_targets_min": 443 + }, + { + "epoch": 3.4279398762157385, + "grad_norm": 0.5979410720887383, + "learning_rate": 2.420706606113986e-05, + "loss": 0.4189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2637672424316406, + "step": 1940, + "valid_targets_mean": 4603.4, + "valid_targets_min": 673 + }, + { + "epoch": 3.4367816091954024, + "grad_norm": 0.5739576956888619, + "learning_rate": 2.4120874004128422e-05, + "loss": 0.4861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22790098190307617, + "step": 1945, + "valid_targets_mean": 3478.2, + "valid_targets_min": 426 + }, + { + "epoch": 3.4456233421750664, + "grad_norm": 0.6888223638237597, + "learning_rate": 2.4034601943555775e-05, + "loss": 0.4576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2896411418914795, + "step": 1950, + "valid_targets_mean": 3563.5, + "valid_targets_min": 296 + }, + { + "epoch": 3.4544650751547303, + "grad_norm": 0.6188357957447922, + "learning_rate": 2.3948251554326826e-05, + "loss": 0.4412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27495166659355164, + "step": 1955, + "valid_targets_mean": 4352.5, + "valid_targets_min": 572 + }, + { + "epoch": 3.4633068081343943, + "grad_norm": 0.6700510097036785, + "learning_rate": 2.3861824512867172e-05, + "loss": 0.421, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3003349304199219, + "step": 1960, + "valid_targets_mean": 5187.4, + "valid_targets_min": 1645 + }, + { + "epoch": 3.4721485411140582, + "grad_norm": 0.6558839463348246, + "learning_rate": 2.377532249709054e-05, + "loss": 0.4557, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.35241687297821045, + "step": 1965, + "valid_targets_mean": 4643.0, + "valid_targets_min": 571 + }, + { + "epoch": 3.480990274093722, + "grad_norm": 0.6349474618857128, + "learning_rate": 2.368874718636625e-05, + "loss": 0.4472, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1423875242471695, + "step": 1970, + "valid_targets_mean": 2537.1, + "valid_targets_min": 694 + }, + { + "epoch": 3.489832007073386, + "grad_norm": 0.6813167822681871, + "learning_rate": 2.3602100261486557e-05, + "loss": 0.4754, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27694791555404663, + "step": 1975, + "valid_targets_mean": 4163.6, + "valid_targets_min": 1557 + }, + { + "epoch": 3.4986737400530505, + "grad_norm": 0.6514986467289062, + "learning_rate": 2.3515383404634075e-05, + "loss": 0.4378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1669061779975891, + "step": 1980, + "valid_targets_mean": 2230.2, + "valid_targets_min": 296 + }, + { + "epoch": 3.5075154730327145, + "grad_norm": 0.7914161143585046, + "learning_rate": 2.3428598299349076e-05, + "loss": 0.4694, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27049192786216736, + "step": 1985, + "valid_targets_mean": 1989.0, + "valid_targets_min": 267 + }, + { + "epoch": 3.5163572060123784, + "grad_norm": 0.8656201914218805, + "learning_rate": 2.3341746630496828e-05, + "loss": 0.4454, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25898832082748413, + "step": 1990, + "valid_targets_mean": 1998.6, + "valid_targets_min": 734 + }, + { + "epoch": 3.5251989389920424, + "grad_norm": 0.7646102018521315, + "learning_rate": 2.3254830084234877e-05, + "loss": 0.4168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21087685227394104, + "step": 1995, + "valid_targets_mean": 3901.9, + "valid_targets_min": 1727 + }, + { + "epoch": 3.5340406719717063, + "grad_norm": 0.7970932854441665, + "learning_rate": 2.316785034798032e-05, + "loss": 0.4506, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.256100058555603, + "step": 2000, + "valid_targets_mean": 2907.2, + "valid_targets_min": 1306 + }, + { + "epoch": 3.5428824049513707, + "grad_norm": 0.7147517419674159, + "learning_rate": 2.308080911037703e-05, + "loss": 0.4358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2644729018211365, + "step": 2005, + "valid_targets_mean": 3793.5, + "valid_targets_min": 1606 + }, + { + "epoch": 3.5517241379310347, + "grad_norm": 0.6331675123587539, + "learning_rate": 2.2993708061262886e-05, + "loss": 0.458, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1513529121875763, + "step": 2010, + "valid_targets_mean": 2805.9, + "valid_targets_min": 1291 + }, + { + "epoch": 3.5605658709106986, + "grad_norm": 0.7549622939379798, + "learning_rate": 2.2906548891636956e-05, + "loss": 0.4567, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24897724390029907, + "step": 2015, + "valid_targets_mean": 2534.6, + "valid_targets_min": 1037 + }, + { + "epoch": 3.5694076038903626, + "grad_norm": 0.9923863265222221, + "learning_rate": 2.2819333293626686e-05, + "loss": 0.4483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16775819659233093, + "step": 2020, + "valid_targets_mean": 1303.4, + "valid_targets_min": 324 + }, + { + "epoch": 3.5782493368700266, + "grad_norm": 0.6137184109496221, + "learning_rate": 2.2732062960455014e-05, + "loss": 0.4373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15827752649784088, + "step": 2025, + "valid_targets_mean": 3152.2, + "valid_targets_min": 308 + }, + { + "epoch": 3.5870910698496905, + "grad_norm": 0.7316389088145041, + "learning_rate": 2.264473958640753e-05, + "loss": 0.412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19498181343078613, + "step": 2030, + "valid_targets_mean": 2589.9, + "valid_targets_min": 411 + }, + { + "epoch": 3.5959328028293545, + "grad_norm": 0.7269422076299851, + "learning_rate": 2.2557364866799572e-05, + "loss": 0.4285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3297356367111206, + "step": 2035, + "valid_targets_mean": 3257.0, + "valid_targets_min": 461 + }, + { + "epoch": 3.6047745358090184, + "grad_norm": 0.6557829256691635, + "learning_rate": 2.246994049794332e-05, + "loss": 0.4663, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11620749533176422, + "step": 2040, + "valid_targets_mean": 2108.5, + "valid_targets_min": 1626 + }, + { + "epoch": 3.6136162687886824, + "grad_norm": 0.6578106972416874, + "learning_rate": 2.2382468177114834e-05, + "loss": 0.4001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1800394058227539, + "step": 2045, + "valid_targets_mean": 2848.1, + "valid_targets_min": 491 + }, + { + "epoch": 3.6224580017683468, + "grad_norm": 0.6460106377859882, + "learning_rate": 2.2294949602521142e-05, + "loss": 0.4664, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20682604610919952, + "step": 2050, + "valid_targets_mean": 3096.0, + "valid_targets_min": 401 + }, + { + "epoch": 3.6312997347480107, + "grad_norm": 0.7686693214243684, + "learning_rate": 2.2207386473267247e-05, + "loss": 0.4407, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2174399495124817, + "step": 2055, + "valid_targets_mean": 2397.0, + "valid_targets_min": 638 + }, + { + "epoch": 3.6401414677276747, + "grad_norm": 0.7189899231337926, + "learning_rate": 2.2119780489323154e-05, + "loss": 0.4363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19445934891700745, + "step": 2060, + "valid_targets_mean": 2458.8, + "valid_targets_min": 990 + }, + { + "epoch": 3.6489832007073386, + "grad_norm": 0.7020436393545836, + "learning_rate": 2.2032133351490835e-05, + "loss": 0.4571, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30607905983924866, + "step": 2065, + "valid_targets_mean": 3775.8, + "valid_targets_min": 1317 + }, + { + "epoch": 3.6578249336870026, + "grad_norm": 0.7444068107077655, + "learning_rate": 2.1944446761371264e-05, + "loss": 0.4217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22787776589393616, + "step": 2070, + "valid_targets_mean": 2930.4, + "valid_targets_min": 1730 + }, + { + "epoch": 3.6666666666666665, + "grad_norm": 0.6968317634420128, + "learning_rate": 2.1856722421331322e-05, + "loss": 0.444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15648722648620605, + "step": 2075, + "valid_targets_mean": 2251.6, + "valid_targets_min": 350 + }, + { + "epoch": 3.675508399646331, + "grad_norm": 0.6959983172874498, + "learning_rate": 2.1768962034470803e-05, + "loss": 0.4696, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24266773462295532, + "step": 2080, + "valid_targets_mean": 3423.4, + "valid_targets_min": 384 + }, + { + "epoch": 3.684350132625995, + "grad_norm": 0.7788541548960379, + "learning_rate": 2.1681167304589295e-05, + "loss": 0.4074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1628911793231964, + "step": 2085, + "valid_targets_mean": 2365.0, + "valid_targets_min": 461 + }, + { + "epoch": 3.693191865605659, + "grad_norm": 0.7039562542774168, + "learning_rate": 2.1593339936153148e-05, + "loss": 0.424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17437390983104706, + "step": 2090, + "valid_targets_mean": 2311.9, + "valid_targets_min": 1444 + }, + { + "epoch": 3.7020335985853228, + "grad_norm": 0.5741843896967402, + "learning_rate": 2.1505481634262354e-05, + "loss": 0.4053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22777321934700012, + "step": 2095, + "valid_targets_mean": 4313.0, + "valid_targets_min": 1591 + }, + { + "epoch": 3.7108753315649867, + "grad_norm": 0.7672460830420991, + "learning_rate": 2.141759410461746e-05, + "loss": 0.4182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1350998878479004, + "step": 2100, + "valid_targets_mean": 1726.9, + "valid_targets_min": 382 + }, + { + "epoch": 3.7197170645446507, + "grad_norm": 0.6710207783728802, + "learning_rate": 2.1329679053486444e-05, + "loss": 0.4478, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29351454973220825, + "step": 2105, + "valid_targets_mean": 3874.4, + "valid_targets_min": 1654 + }, + { + "epoch": 3.7285587975243146, + "grad_norm": 0.6423318027598373, + "learning_rate": 2.1241738187671595e-05, + "loss": 0.4299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19800537824630737, + "step": 2110, + "valid_targets_mean": 2980.0, + "valid_targets_min": 1460 + }, + { + "epoch": 3.7374005305039786, + "grad_norm": 0.6914935831642892, + "learning_rate": 2.115377321447637e-05, + "loss": 0.4992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1961551457643509, + "step": 2115, + "valid_targets_mean": 3261.6, + "valid_targets_min": 1418 + }, + { + "epoch": 3.7462422634836425, + "grad_norm": 0.6625084903349797, + "learning_rate": 2.106578584167225e-05, + "loss": 0.4114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2027662992477417, + "step": 2120, + "valid_targets_mean": 2802.2, + "valid_targets_min": 610 + }, + { + "epoch": 3.755083996463307, + "grad_norm": 0.644453283873008, + "learning_rate": 2.0977777777465594e-05, + "loss": 0.4229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17548662424087524, + "step": 2125, + "valid_targets_mean": 3109.0, + "valid_targets_min": 714 + }, + { + "epoch": 3.763925729442971, + "grad_norm": 0.7667734390353328, + "learning_rate": 2.0889750730464474e-05, + "loss": 0.4612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23370791971683502, + "step": 2130, + "valid_targets_mean": 2261.5, + "valid_targets_min": 598 + }, + { + "epoch": 3.772767462422635, + "grad_norm": 0.738277857442572, + "learning_rate": 2.0801706409645473e-05, + "loss": 0.4607, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21809722483158112, + "step": 2135, + "valid_targets_mean": 3180.4, + "valid_targets_min": 682 + }, + { + "epoch": 3.781609195402299, + "grad_norm": 0.8463179804355774, + "learning_rate": 2.0713646524320557e-05, + "loss": 0.4408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22101402282714844, + "step": 2140, + "valid_targets_mean": 2733.5, + "valid_targets_min": 477 + }, + { + "epoch": 3.7904509283819627, + "grad_norm": 0.7086110797536909, + "learning_rate": 2.0625572784103855e-05, + "loss": 0.471, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23744723200798035, + "step": 2145, + "valid_targets_mean": 2938.8, + "valid_targets_min": 350 + }, + { + "epoch": 3.799292661361627, + "grad_norm": 0.6251176123735659, + "learning_rate": 2.053748689887848e-05, + "loss": 0.4261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20360612869262695, + "step": 2150, + "valid_targets_mean": 3229.5, + "valid_targets_min": 844 + }, + { + "epoch": 3.808134394341291, + "grad_norm": 0.6958759696778948, + "learning_rate": 2.0449390578763336e-05, + "loss": 0.4283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2020493447780609, + "step": 2155, + "valid_targets_mean": 2590.4, + "valid_targets_min": 420 + }, + { + "epoch": 3.816976127320955, + "grad_norm": 0.7006461931706444, + "learning_rate": 2.036128553407989e-05, + "loss": 0.4411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2114584743976593, + "step": 2160, + "valid_targets_mean": 2864.6, + "valid_targets_min": 616 + }, + { + "epoch": 3.825817860300619, + "grad_norm": 0.6980121359538078, + "learning_rate": 2.027317347531902e-05, + "loss": 0.4583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2123686671257019, + "step": 2165, + "valid_targets_mean": 3107.0, + "valid_targets_min": 1375 + }, + { + "epoch": 3.834659593280283, + "grad_norm": 0.7098528867513164, + "learning_rate": 2.0185056113107763e-05, + "loss": 0.495, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23799559473991394, + "step": 2170, + "valid_targets_mean": 3973.5, + "valid_targets_min": 1517 + }, + { + "epoch": 3.843501326259947, + "grad_norm": 0.9443823890149703, + "learning_rate": 2.0096935158176105e-05, + "loss": 0.434, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21758808195590973, + "step": 2175, + "valid_targets_mean": 1717.0, + "valid_targets_min": 343 + }, + { + "epoch": 3.852343059239611, + "grad_norm": 0.8056251979105057, + "learning_rate": 2.000881232132381e-05, + "loss": 0.4657, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17145347595214844, + "step": 2180, + "valid_targets_mean": 1844.9, + "valid_targets_min": 606 + }, + { + "epoch": 3.861184792219275, + "grad_norm": 0.631753151558534, + "learning_rate": 1.9920689313387148e-05, + "loss": 0.4246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23968084156513214, + "step": 2185, + "valid_targets_mean": 4621.9, + "valid_targets_min": 1216 + }, + { + "epoch": 3.8700265251989387, + "grad_norm": 0.5921935896404549, + "learning_rate": 1.9832567845205735e-05, + "loss": 0.4161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23088482022285461, + "step": 2190, + "valid_targets_mean": 4285.4, + "valid_targets_min": 363 + }, + { + "epoch": 3.878868258178603, + "grad_norm": 0.6575693180610859, + "learning_rate": 1.974444962758929e-05, + "loss": 0.4294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.220181405544281, + "step": 2195, + "valid_targets_mean": 3333.4, + "valid_targets_min": 1980 + }, + { + "epoch": 3.887709991158267, + "grad_norm": 0.6941860616336191, + "learning_rate": 1.9656336371284406e-05, + "loss": 0.4552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22298529744148254, + "step": 2200, + "valid_targets_mean": 2727.5, + "valid_targets_min": 601 + }, + { + "epoch": 3.896551724137931, + "grad_norm": 0.7225249260002937, + "learning_rate": 1.956822978694137e-05, + "loss": 0.4438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18556898832321167, + "step": 2205, + "valid_targets_mean": 2341.8, + "valid_targets_min": 442 + }, + { + "epoch": 3.905393457117595, + "grad_norm": 0.7406697584636266, + "learning_rate": 1.9480131585080946e-05, + "loss": 0.4231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2133459746837616, + "step": 2210, + "valid_targets_mean": 2642.8, + "valid_targets_min": 431 + }, + { + "epoch": 3.914235190097259, + "grad_norm": 0.7039889962915561, + "learning_rate": 1.939204347606115e-05, + "loss": 0.4493, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2137300670146942, + "step": 2215, + "valid_targets_mean": 2678.2, + "valid_targets_min": 1169 + }, + { + "epoch": 3.9230769230769234, + "grad_norm": 0.634420740737628, + "learning_rate": 1.9303967170044043e-05, + "loss": 0.4358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17572371661663055, + "step": 2220, + "valid_targets_mean": 3010.6, + "valid_targets_min": 1313 + }, + { + "epoch": 3.9319186560565873, + "grad_norm": 0.7155018581712755, + "learning_rate": 1.9215904376962555e-05, + "loss": 0.4263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21080003678798676, + "step": 2225, + "valid_targets_mean": 2322.0, + "valid_targets_min": 742 + }, + { + "epoch": 3.9407603890362513, + "grad_norm": 0.758819158514058, + "learning_rate": 1.9127856806487266e-05, + "loss": 0.4388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16472750902175903, + "step": 2230, + "valid_targets_mean": 2019.2, + "valid_targets_min": 431 + }, + { + "epoch": 3.949602122015915, + "grad_norm": 0.8777006692099467, + "learning_rate": 1.9039826167993235e-05, + "loss": 0.4483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17932608723640442, + "step": 2235, + "valid_targets_mean": 1764.1, + "valid_targets_min": 682 + }, + { + "epoch": 3.958443854995579, + "grad_norm": 0.6089818772904589, + "learning_rate": 1.895181417052677e-05, + "loss": 0.4231, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24629013240337372, + "step": 2240, + "valid_targets_mean": 4223.6, + "valid_targets_min": 459 + }, + { + "epoch": 3.967285587975243, + "grad_norm": 0.639631153985411, + "learning_rate": 1.88638225227723e-05, + "loss": 0.4245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21447336673736572, + "step": 2245, + "valid_targets_mean": 3402.6, + "valid_targets_min": 424 + }, + { + "epoch": 3.976127320954907, + "grad_norm": 0.8458138613793146, + "learning_rate": 1.877585293301918e-05, + "loss": 0.4163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22714388370513916, + "step": 2250, + "valid_targets_mean": 2087.0, + "valid_targets_min": 488 + }, + { + "epoch": 3.984969053934571, + "grad_norm": 0.8014506952688943, + "learning_rate": 1.868790710912853e-05, + "loss": 0.4301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27369236946105957, + "step": 2255, + "valid_targets_mean": 2659.0, + "valid_targets_min": 1183 + }, + { + "epoch": 3.993810786914235, + "grad_norm": 0.5931369878866818, + "learning_rate": 1.8599986758500047e-05, + "loss": 0.4667, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2135334014892578, + "step": 2260, + "valid_targets_mean": 3793.0, + "valid_targets_min": 765 + }, + { + "epoch": 4.001768346595933, + "grad_norm": 0.6460139121405902, + "learning_rate": 1.8512093588038915e-05, + "loss": 0.4144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2704264223575592, + "step": 2265, + "valid_targets_mean": 4983.9, + "valid_targets_min": 244 + }, + { + "epoch": 4.010610079575597, + "grad_norm": 0.7103598023526009, + "learning_rate": 1.842422930412262e-05, + "loss": 0.4182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22416162490844727, + "step": 2270, + "valid_targets_mean": 3300.9, + "valid_targets_min": 1126 + }, + { + "epoch": 4.0194518125552605, + "grad_norm": 0.6926185487221391, + "learning_rate": 1.8336395612567857e-05, + "loss": 0.4081, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19507721066474915, + "step": 2275, + "valid_targets_mean": 3702.0, + "valid_targets_min": 308 + }, + { + "epoch": 4.0282935455349245, + "grad_norm": 0.6966627277554577, + "learning_rate": 1.824859421859736e-05, + "loss": 0.4291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2344420850276947, + "step": 2280, + "valid_targets_mean": 3541.6, + "valid_targets_min": 532 + }, + { + "epoch": 4.037135278514588, + "grad_norm": 0.8185873096759235, + "learning_rate": 1.8160826826806856e-05, + "loss": 0.4333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16348719596862793, + "step": 2285, + "valid_targets_mean": 1622.6, + "valid_targets_min": 345 + }, + { + "epoch": 4.045977011494253, + "grad_norm": 0.6298356213417173, + "learning_rate": 1.8073095141131946e-05, + "loss": 0.3803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15070627629756927, + "step": 2290, + "valid_targets_mean": 4094.2, + "valid_targets_min": 411 + }, + { + "epoch": 4.054818744473917, + "grad_norm": 0.7055842030089096, + "learning_rate": 1.7985400864815027e-05, + "loss": 0.4017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1813596785068512, + "step": 2295, + "valid_targets_mean": 2406.0, + "valid_targets_min": 429 + }, + { + "epoch": 4.063660477453581, + "grad_norm": 0.6605651518692166, + "learning_rate": 1.7897745700372194e-05, + "loss": 0.403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19027772545814514, + "step": 2300, + "valid_targets_mean": 3733.2, + "valid_targets_min": 558 + }, + { + "epoch": 4.072502210433245, + "grad_norm": 0.638116942250368, + "learning_rate": 1.781013134956025e-05, + "loss": 0.3903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1789359450340271, + "step": 2305, + "valid_targets_mean": 4052.6, + "valid_targets_min": 1744 + }, + { + "epoch": 4.081343943412909, + "grad_norm": 0.6312271133669283, + "learning_rate": 1.7722559513343616e-05, + "loss": 0.4298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18907594680786133, + "step": 2310, + "valid_targets_mean": 4083.4, + "valid_targets_min": 312 + }, + { + "epoch": 4.090185676392573, + "grad_norm": 0.6831522353731495, + "learning_rate": 1.7635031891861334e-05, + "loss": 0.4048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2140839397907257, + "step": 2315, + "valid_targets_mean": 3038.2, + "valid_targets_min": 653 + }, + { + "epoch": 4.099027409372237, + "grad_norm": 0.7541794171611146, + "learning_rate": 1.7547550184394036e-05, + "loss": 0.3999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14385363459587097, + "step": 2320, + "valid_targets_mean": 1814.5, + "valid_targets_min": 392 + }, + { + "epoch": 4.107869142351901, + "grad_norm": 0.850080748839246, + "learning_rate": 1.746011608933098e-05, + "loss": 0.4263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1753498613834381, + "step": 2325, + "valid_targets_mean": 2009.9, + "valid_targets_min": 260 + }, + { + "epoch": 4.116710875331565, + "grad_norm": 0.6727035464038962, + "learning_rate": 1.7372731304137072e-05, + "loss": 0.4234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.156248539686203, + "step": 2330, + "valid_targets_mean": 2836.2, + "valid_targets_min": 1037 + }, + { + "epoch": 4.125552608311229, + "grad_norm": 0.7915258988052476, + "learning_rate": 1.7285397525319897e-05, + "loss": 0.4209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18911907076835632, + "step": 2335, + "valid_targets_mean": 2722.6, + "valid_targets_min": 558 + }, + { + "epoch": 4.134394341290893, + "grad_norm": 0.7225681941913896, + "learning_rate": 1.719811644839679e-05, + "loss": 0.4446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2196042686700821, + "step": 2340, + "valid_targets_mean": 2874.2, + "valid_targets_min": 1010 + }, + { + "epoch": 4.143236074270557, + "grad_norm": 0.6793110061906088, + "learning_rate": 1.711088976786192e-05, + "loss": 0.4049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22990606725215912, + "step": 2345, + "valid_targets_mean": 3720.2, + "valid_targets_min": 1376 + }, + { + "epoch": 4.152077807250221, + "grad_norm": 0.6309626795534368, + "learning_rate": 1.7023719177153397e-05, + "loss": 0.4287, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25914740562438965, + "step": 2350, + "valid_targets_mean": 5181.9, + "valid_targets_min": 365 + }, + { + "epoch": 4.160919540229885, + "grad_norm": 0.7534348626475472, + "learning_rate": 1.6936606368620393e-05, + "loss": 0.426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30650636553764343, + "step": 2355, + "valid_targets_mean": 3284.2, + "valid_targets_min": 1120 + }, + { + "epoch": 4.1697612732095495, + "grad_norm": 0.7973625055634738, + "learning_rate": 1.684955303349027e-05, + "loss": 0.4116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11398676037788391, + "step": 2360, + "valid_targets_mean": 1583.0, + "valid_targets_min": 341 + }, + { + "epoch": 4.178603006189213, + "grad_norm": 0.6773926752150286, + "learning_rate": 1.6762560861835778e-05, + "loss": 0.3691, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13966532051563263, + "step": 2365, + "valid_targets_mean": 2208.0, + "valid_targets_min": 1095 + }, + { + "epoch": 4.187444739168877, + "grad_norm": 0.7600418307606107, + "learning_rate": 1.6675631542542206e-05, + "loss": 0.4199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1887199878692627, + "step": 2370, + "valid_targets_mean": 2575.6, + "valid_targets_min": 1492 + }, + { + "epoch": 4.196286472148541, + "grad_norm": 0.825716048698755, + "learning_rate": 1.658876676327464e-05, + "loss": 0.4325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17904534935951233, + "step": 2375, + "valid_targets_mean": 1817.2, + "valid_targets_min": 509 + }, + { + "epoch": 4.205128205128205, + "grad_norm": 0.7357744240798385, + "learning_rate": 1.6501968210445144e-05, + "loss": 0.433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28740018606185913, + "step": 2380, + "valid_targets_mean": 3760.6, + "valid_targets_min": 2060 + }, + { + "epoch": 4.213969938107869, + "grad_norm": 0.6102035784766663, + "learning_rate": 1.641523756918006e-05, + "loss": 0.4051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19327875971794128, + "step": 2385, + "valid_targets_mean": 4250.9, + "valid_targets_min": 1501 + }, + { + "epoch": 4.222811671087533, + "grad_norm": 0.6953359184280162, + "learning_rate": 1.6328576523287284e-05, + "loss": 0.4268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.310172438621521, + "step": 2390, + "valid_targets_mean": 4208.6, + "valid_targets_min": 1314 + }, + { + "epoch": 4.231653404067197, + "grad_norm": 0.7297311607993835, + "learning_rate": 1.6241986755223574e-05, + "loss": 0.4281, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32732078433036804, + "step": 2395, + "valid_targets_mean": 3946.0, + "valid_targets_min": 421 + }, + { + "epoch": 4.240495137046861, + "grad_norm": 0.7130243864792679, + "learning_rate": 1.6155469946061863e-05, + "loss": 0.3957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1902158409357071, + "step": 2400, + "valid_targets_mean": 3486.8, + "valid_targets_min": 1190 + }, + { + "epoch": 4.249336870026525, + "grad_norm": 0.7379540908447911, + "learning_rate": 1.6069027775458665e-05, + "loss": 0.4381, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1608520746231079, + "step": 2405, + "valid_targets_mean": 2679.8, + "valid_targets_min": 1319 + }, + { + "epoch": 4.258178603006189, + "grad_norm": 0.8452056516818466, + "learning_rate": 1.5982661921621437e-05, + "loss": 0.4092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23513582348823547, + "step": 2410, + "valid_targets_mean": 2361.6, + "valid_targets_min": 426 + }, + { + "epoch": 4.267020335985853, + "grad_norm": 0.730287777008674, + "learning_rate": 1.5896374061276015e-05, + "loss": 0.4286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2784014344215393, + "step": 2415, + "valid_targets_mean": 5109.2, + "valid_targets_min": 1990 + }, + { + "epoch": 4.275862068965517, + "grad_norm": 0.7103251487687208, + "learning_rate": 1.5810165869634027e-05, + "loss": 0.4031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2809576392173767, + "step": 2420, + "valid_targets_mean": 5307.9, + "valid_targets_min": 900 + }, + { + "epoch": 4.284703801945181, + "grad_norm": 0.6866454436464177, + "learning_rate": 1.572403902036042e-05, + "loss": 0.4139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1964649111032486, + "step": 2425, + "valid_targets_mean": 2979.6, + "valid_targets_min": 1814 + }, + { + "epoch": 4.293545534924846, + "grad_norm": 0.7150372488857892, + "learning_rate": 1.5637995185540932e-05, + "loss": 0.3881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1866159737110138, + "step": 2430, + "valid_targets_mean": 3078.5, + "valid_targets_min": 1192 + }, + { + "epoch": 4.30238726790451, + "grad_norm": 0.8579495181131218, + "learning_rate": 1.5552036035649656e-05, + "loss": 0.4188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.200179323554039, + "step": 2435, + "valid_targets_mean": 2049.5, + "valid_targets_min": 523 + }, + { + "epoch": 4.311229000884174, + "grad_norm": 0.7013758701584984, + "learning_rate": 1.5466163239516553e-05, + "loss": 0.3927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.30045637488365173, + "step": 2440, + "valid_targets_mean": 3139.2, + "valid_targets_min": 453 + }, + { + "epoch": 4.3200707338638376, + "grad_norm": 0.7497089575459133, + "learning_rate": 1.5380378464295133e-05, + "loss": 0.3999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16102385520935059, + "step": 2445, + "valid_targets_mean": 2777.8, + "valid_targets_min": 673 + }, + { + "epoch": 4.3289124668435015, + "grad_norm": 0.7738772317856076, + "learning_rate": 1.5294683375430035e-05, + "loss": 0.45, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24177439510822296, + "step": 2450, + "valid_targets_mean": 3024.8, + "valid_targets_min": 403 + }, + { + "epoch": 4.3377541998231655, + "grad_norm": 0.8087896123657419, + "learning_rate": 1.520907963662471e-05, + "loss": 0.398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17100030183792114, + "step": 2455, + "valid_targets_mean": 1706.0, + "valid_targets_min": 503 + }, + { + "epoch": 4.346595932802829, + "grad_norm": 0.6521224471842675, + "learning_rate": 1.5123568909809103e-05, + "loss": 0.3993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21314716339111328, + "step": 2460, + "valid_targets_mean": 4596.2, + "valid_targets_min": 1946 + }, + { + "epoch": 4.355437665782493, + "grad_norm": 0.6730460262609402, + "learning_rate": 1.5038152855107422e-05, + "loss": 0.4331, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29492098093032837, + "step": 2465, + "valid_targets_mean": 4156.1, + "valid_targets_min": 286 + }, + { + "epoch": 4.364279398762157, + "grad_norm": 0.8227541669467124, + "learning_rate": 1.4952833130805884e-05, + "loss": 0.4228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20231404900550842, + "step": 2470, + "valid_targets_mean": 2325.4, + "valid_targets_min": 1373 + }, + { + "epoch": 4.373121131741821, + "grad_norm": 0.6978839330328747, + "learning_rate": 1.4867611393320533e-05, + "loss": 0.4432, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23436486721038818, + "step": 2475, + "valid_targets_mean": 3332.9, + "valid_targets_min": 317 + }, + { + "epoch": 4.381962864721485, + "grad_norm": 0.7946215788236765, + "learning_rate": 1.478248929716505e-05, + "loss": 0.3911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1627664864063263, + "step": 2480, + "valid_targets_mean": 1966.0, + "valid_targets_min": 856 + }, + { + "epoch": 4.390804597701149, + "grad_norm": 0.7156697773599238, + "learning_rate": 1.4697468494918687e-05, + "loss": 0.4436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.186476469039917, + "step": 2485, + "valid_targets_mean": 2992.4, + "valid_targets_min": 607 + }, + { + "epoch": 4.399646330680813, + "grad_norm": 0.8727002600998265, + "learning_rate": 1.4612550637194141e-05, + "loss": 0.4475, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19441717863082886, + "step": 2490, + "valid_targets_mean": 2303.6, + "valid_targets_min": 708 + }, + { + "epoch": 4.408488063660477, + "grad_norm": 0.7507265043943055, + "learning_rate": 1.4527737372605529e-05, + "loss": 0.4507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23913750052452087, + "step": 2495, + "valid_targets_mean": 3582.6, + "valid_targets_min": 1482 + }, + { + "epoch": 4.417329796640141, + "grad_norm": 0.7610940521640887, + "learning_rate": 1.4443030347736347e-05, + "loss": 0.4381, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1793220490217209, + "step": 2500, + "valid_targets_mean": 2593.2, + "valid_targets_min": 267 + }, + { + "epoch": 4.426171529619806, + "grad_norm": 0.6342963620181833, + "learning_rate": 1.435843120710756e-05, + "loss": 0.4017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20556139945983887, + "step": 2505, + "valid_targets_mean": 4132.1, + "valid_targets_min": 1120 + }, + { + "epoch": 4.43501326259947, + "grad_norm": 0.7530536406998339, + "learning_rate": 1.4273941593145636e-05, + "loss": 0.4483, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.38451525568962097, + "step": 2510, + "valid_targets_mean": 4499.5, + "valid_targets_min": 1789 + }, + { + "epoch": 4.443854995579134, + "grad_norm": 0.8273793851318227, + "learning_rate": 1.4189563146150669e-05, + "loss": 0.4212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20944646000862122, + "step": 2515, + "valid_targets_mean": 2535.8, + "valid_targets_min": 623 + }, + { + "epoch": 4.452696728558798, + "grad_norm": 0.7909970336145224, + "learning_rate": 1.4105297504264516e-05, + "loss": 0.4347, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3092140555381775, + "step": 2520, + "valid_targets_mean": 3188.4, + "valid_targets_min": 1031 + }, + { + "epoch": 4.461538461538462, + "grad_norm": 0.9428226334726033, + "learning_rate": 1.4021146303439031e-05, + "loss": 0.4029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2530262768268585, + "step": 2525, + "valid_targets_mean": 2076.4, + "valid_targets_min": 349 + }, + { + "epoch": 4.470380194518126, + "grad_norm": 0.7317845516311463, + "learning_rate": 1.3937111177404279e-05, + "loss": 0.4369, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24385397136211395, + "step": 2530, + "valid_targets_mean": 3438.1, + "valid_targets_min": 1464 + }, + { + "epoch": 4.47922192749779, + "grad_norm": 0.7770528449780305, + "learning_rate": 1.385319375763682e-05, + "loss": 0.3756, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17684635519981384, + "step": 2535, + "valid_targets_mean": 2598.0, + "valid_targets_min": 227 + }, + { + "epoch": 4.4880636604774535, + "grad_norm": 0.7420657248975656, + "learning_rate": 1.376939567332804e-05, + "loss": 0.4351, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18782931566238403, + "step": 2540, + "valid_targets_mean": 2944.4, + "valid_targets_min": 1125 + }, + { + "epoch": 4.4969053934571175, + "grad_norm": 1.0340838110233663, + "learning_rate": 1.3685718551352518e-05, + "loss": 0.4428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.160398930311203, + "step": 2545, + "valid_targets_mean": 3630.4, + "valid_targets_min": 1189 + }, + { + "epoch": 4.505747126436781, + "grad_norm": 0.6091047868776585, + "learning_rate": 1.3602164016236444e-05, + "loss": 0.4019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1208481639623642, + "step": 2550, + "valid_targets_mean": 2871.2, + "valid_targets_min": 301 + }, + { + "epoch": 4.514588859416445, + "grad_norm": 0.7276768828189113, + "learning_rate": 1.3518733690126084e-05, + "loss": 0.4236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21554812788963318, + "step": 2555, + "valid_targets_mean": 3198.2, + "valid_targets_min": 308 + }, + { + "epoch": 4.523430592396109, + "grad_norm": 0.8138197550507267, + "learning_rate": 1.3435429192756275e-05, + "loss": 0.388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15686780214309692, + "step": 2560, + "valid_targets_mean": 1802.8, + "valid_targets_min": 391 + }, + { + "epoch": 4.532272325375773, + "grad_norm": 0.7698296993001761, + "learning_rate": 1.3352252141418998e-05, + "loss": 0.4202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21974670886993408, + "step": 2565, + "valid_targets_mean": 2627.8, + "valid_targets_min": 1299 + }, + { + "epoch": 4.541114058355438, + "grad_norm": 0.6991515960307244, + "learning_rate": 1.3269204150931953e-05, + "loss": 0.4112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1762574017047882, + "step": 2570, + "valid_targets_mean": 2943.6, + "valid_targets_min": 409 + }, + { + "epoch": 4.549955791335101, + "grad_norm": 0.5961797549163438, + "learning_rate": 1.3186286833607244e-05, + "loss": 0.4039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24313318729400635, + "step": 2575, + "valid_targets_mean": 4766.8, + "valid_targets_min": 662 + }, + { + "epoch": 4.558797524314766, + "grad_norm": 0.7490840636312823, + "learning_rate": 1.3103501799220033e-05, + "loss": 0.4085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23084694147109985, + "step": 2580, + "valid_targets_mean": 4158.1, + "valid_targets_min": 1584 + }, + { + "epoch": 4.56763925729443, + "grad_norm": 0.7065075883727937, + "learning_rate": 1.3020850654977333e-05, + "loss": 0.4209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1791738122701645, + "step": 2585, + "valid_targets_mean": 2766.2, + "valid_targets_min": 294 + }, + { + "epoch": 4.576480990274094, + "grad_norm": 0.6016645740317225, + "learning_rate": 1.293833500548678e-05, + "loss": 0.4446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17156481742858887, + "step": 2590, + "valid_targets_mean": 3903.5, + "valid_targets_min": 1670 + }, + { + "epoch": 4.585322723253758, + "grad_norm": 0.6114926043432934, + "learning_rate": 1.2855956452725471e-05, + "loss": 0.3752, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23596268892288208, + "step": 2595, + "valid_targets_mean": 3700.5, + "valid_targets_min": 682 + }, + { + "epoch": 4.594164456233422, + "grad_norm": 0.7917827130664251, + "learning_rate": 1.2773716596008889e-05, + "loss": 0.3987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21856589615345, + "step": 2600, + "valid_targets_mean": 3063.4, + "valid_targets_min": 844 + }, + { + "epoch": 4.603006189213086, + "grad_norm": 0.648273474654547, + "learning_rate": 1.2691617031959843e-05, + "loss": 0.4105, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17004728317260742, + "step": 2605, + "valid_targets_mean": 3463.0, + "valid_targets_min": 1261 + }, + { + "epoch": 4.61184792219275, + "grad_norm": 0.8189757224237537, + "learning_rate": 1.2609659354477458e-05, + "loss": 0.4349, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3089355528354645, + "step": 2610, + "valid_targets_mean": 3244.4, + "valid_targets_min": 776 + }, + { + "epoch": 4.620689655172414, + "grad_norm": 0.7858403164318954, + "learning_rate": 1.2527845154706264e-05, + "loss": 0.3781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20955795049667358, + "step": 2615, + "valid_targets_mean": 3477.9, + "valid_targets_min": 906 + }, + { + "epoch": 4.629531388152078, + "grad_norm": 0.6689115673937959, + "learning_rate": 1.2446176021005245e-05, + "loss": 0.4202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19080306589603424, + "step": 2620, + "valid_targets_mean": 3002.6, + "valid_targets_min": 285 + }, + { + "epoch": 4.638373121131742, + "grad_norm": 0.6541092626716796, + "learning_rate": 1.2364653538917076e-05, + "loss": 0.4161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25211408734321594, + "step": 2625, + "valid_targets_mean": 5283.1, + "valid_targets_min": 593 + }, + { + "epoch": 4.647214854111406, + "grad_norm": 0.6591383126713584, + "learning_rate": 1.2283279291137291e-05, + "loss": 0.4246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23830297589302063, + "step": 2630, + "valid_targets_mean": 4273.6, + "valid_targets_min": 2174 + }, + { + "epoch": 4.6560565870910695, + "grad_norm": 0.6424277501690692, + "learning_rate": 1.2202054857483576e-05, + "loss": 0.4014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27352088689804077, + "step": 2635, + "valid_targets_mean": 4946.4, + "valid_targets_min": 1302 + }, + { + "epoch": 4.6648983200707335, + "grad_norm": 0.7211760280647633, + "learning_rate": 1.2120981814865073e-05, + "loss": 0.4114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23283889889717102, + "step": 2640, + "valid_targets_mean": 3097.9, + "valid_targets_min": 392 + }, + { + "epoch": 4.673740053050398, + "grad_norm": 0.7571275814501419, + "learning_rate": 1.2040061737251807e-05, + "loss": 0.4629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3724607229232788, + "step": 2645, + "valid_targets_mean": 3724.1, + "valid_targets_min": 1291 + }, + { + "epoch": 4.682581786030062, + "grad_norm": 0.6466326044624365, + "learning_rate": 1.19592961956441e-05, + "loss": 0.3891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22775639593601227, + "step": 2650, + "valid_targets_mean": 4530.5, + "valid_targets_min": 1760 + }, + { + "epoch": 4.691423519009726, + "grad_norm": 0.731960782868472, + "learning_rate": 1.1878686758042086e-05, + "loss": 0.4552, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20677362382411957, + "step": 2655, + "valid_targets_mean": 2433.1, + "valid_targets_min": 1698 + }, + { + "epoch": 4.70026525198939, + "grad_norm": 0.6658248910649158, + "learning_rate": 1.179823498941523e-05, + "loss": 0.4191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20261318981647491, + "step": 2660, + "valid_targets_mean": 3311.1, + "valid_targets_min": 1568 + }, + { + "epoch": 4.709106984969054, + "grad_norm": 0.7076657293158575, + "learning_rate": 1.1717942451672008e-05, + "loss": 0.4428, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2810763120651245, + "step": 2665, + "valid_targets_mean": 4327.8, + "valid_targets_min": 1118 + }, + { + "epoch": 4.717948717948718, + "grad_norm": 0.7884816045404514, + "learning_rate": 1.1637810703629549e-05, + "loss": 0.4001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21002733707427979, + "step": 2670, + "valid_targets_mean": 2842.2, + "valid_targets_min": 715 + }, + { + "epoch": 4.726790450928382, + "grad_norm": 0.7169004560389791, + "learning_rate": 1.1557841300983363e-05, + "loss": 0.4537, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17877726256847382, + "step": 2675, + "valid_targets_mean": 2562.5, + "valid_targets_min": 643 + }, + { + "epoch": 4.735632183908046, + "grad_norm": 0.5669741728591965, + "learning_rate": 1.1478035796277158e-05, + "loss": 0.4426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.10677316039800644, + "step": 2680, + "valid_targets_mean": 2404.2, + "valid_targets_min": 1020 + }, + { + "epoch": 4.74447391688771, + "grad_norm": 0.7657675790094381, + "learning_rate": 1.1398395738872683e-05, + "loss": 0.422, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1494864672422409, + "step": 2685, + "valid_targets_mean": 2797.8, + "valid_targets_min": 818 + }, + { + "epoch": 4.753315649867374, + "grad_norm": 0.6799388910970321, + "learning_rate": 1.1318922674919675e-05, + "loss": 0.4646, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2254074662923813, + "step": 2690, + "valid_targets_mean": 3502.0, + "valid_targets_min": 880 + }, + { + "epoch": 4.762157382847038, + "grad_norm": 0.7628855637000989, + "learning_rate": 1.1239618147325802e-05, + "loss": 0.3928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2163882851600647, + "step": 2695, + "valid_targets_mean": 2970.4, + "valid_targets_min": 1874 + }, + { + "epoch": 4.770999115826702, + "grad_norm": 0.7194697076051723, + "learning_rate": 1.116048369572674e-05, + "loss": 0.4034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21982774138450623, + "step": 2700, + "valid_targets_mean": 3383.4, + "valid_targets_min": 1312 + }, + { + "epoch": 4.779840848806366, + "grad_norm": 0.6669494326491152, + "learning_rate": 1.1081520856456267e-05, + "loss": 0.409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23762443661689758, + "step": 2705, + "valid_targets_mean": 3892.1, + "valid_targets_min": 412 + }, + { + "epoch": 4.78868258178603, + "grad_norm": 0.7108382848669145, + "learning_rate": 1.1002731162516453e-05, + "loss": 0.4359, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1936943084001541, + "step": 2710, + "valid_targets_mean": 2535.1, + "valid_targets_min": 1712 + }, + { + "epoch": 4.797524314765694, + "grad_norm": 0.6713475501297167, + "learning_rate": 1.0924116143547878e-05, + "loss": 0.4171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21732935309410095, + "step": 2715, + "valid_targets_mean": 3802.6, + "valid_targets_min": 1567 + }, + { + "epoch": 4.8063660477453585, + "grad_norm": 0.7413050176699072, + "learning_rate": 1.0845677325799935e-05, + "loss": 0.4312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25657641887664795, + "step": 2720, + "valid_targets_mean": 3387.0, + "valid_targets_min": 385 + }, + { + "epoch": 4.815207780725022, + "grad_norm": 0.7577009577762279, + "learning_rate": 1.0767416232101215e-05, + "loss": 0.4391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28581398725509644, + "step": 2725, + "valid_targets_mean": 3098.0, + "valid_targets_min": 1745 + }, + { + "epoch": 4.824049513704686, + "grad_norm": 0.7724716975951001, + "learning_rate": 1.0689334381829948e-05, + "loss": 0.4088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20168830454349518, + "step": 2730, + "valid_targets_mean": 2979.0, + "valid_targets_min": 666 + }, + { + "epoch": 4.83289124668435, + "grad_norm": 0.7089679302709749, + "learning_rate": 1.0611433290884472e-05, + "loss": 0.4004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11011864989995956, + "step": 2735, + "valid_targets_mean": 2865.8, + "valid_targets_min": 492 + }, + { + "epoch": 4.841732979664014, + "grad_norm": 0.8144495361272787, + "learning_rate": 1.0533714471653832e-05, + "loss": 0.4312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19665873050689697, + "step": 2740, + "valid_targets_mean": 2790.5, + "valid_targets_min": 368 + }, + { + "epoch": 4.850574712643678, + "grad_norm": 0.77684643133323, + "learning_rate": 1.04561794329884e-05, + "loss": 0.4497, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21007674932479858, + "step": 2745, + "valid_targets_mean": 2555.6, + "valid_targets_min": 1571 + }, + { + "epoch": 4.859416445623342, + "grad_norm": 0.742546614835338, + "learning_rate": 1.0378829680170622e-05, + "loss": 0.4322, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3378821611404419, + "step": 2750, + "valid_targets_mean": 4008.6, + "valid_targets_min": 1946 + }, + { + "epoch": 4.868258178603006, + "grad_norm": 0.7479115324842988, + "learning_rate": 1.0301666714885725e-05, + "loss": 0.4325, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2188922017812729, + "step": 2755, + "valid_targets_mean": 3129.8, + "valid_targets_min": 1540 + }, + { + "epoch": 4.87709991158267, + "grad_norm": 0.7454709519506926, + "learning_rate": 1.0224692035192625e-05, + "loss": 0.4438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28481394052505493, + "step": 2760, + "valid_targets_mean": 3897.9, + "valid_targets_min": 1390 + }, + { + "epoch": 4.885941644562334, + "grad_norm": 0.769621578421721, + "learning_rate": 1.0147907135494803e-05, + "loss": 0.4236, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15574485063552856, + "step": 2765, + "valid_targets_mean": 2061.8, + "valid_targets_min": 933 + }, + { + "epoch": 4.894783377541998, + "grad_norm": 0.7396299843802391, + "learning_rate": 1.0071313506511334e-05, + "loss": 0.3959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16915792226791382, + "step": 2770, + "valid_targets_mean": 2474.2, + "valid_targets_min": 598 + }, + { + "epoch": 4.903625110521662, + "grad_norm": 0.6989394194624301, + "learning_rate": 9.9949126352479e-06, + "loss": 0.3991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22265878319740295, + "step": 2775, + "valid_targets_mean": 3984.8, + "valid_targets_min": 1638 + }, + { + "epoch": 4.912466843501326, + "grad_norm": 0.6502932314793353, + "learning_rate": 9.918706004967948e-06, + "loss": 0.4288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32565969228744507, + "step": 2780, + "valid_targets_mean": 4374.5, + "valid_targets_min": 1492 + }, + { + "epoch": 4.921308576480991, + "grad_norm": 0.7229307437239456, + "learning_rate": 9.842695095163878e-06, + "loss": 0.423, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24379673600196838, + "step": 2785, + "valid_targets_mean": 3383.4, + "valid_targets_min": 974 + }, + { + "epoch": 4.930150309460654, + "grad_norm": 0.7940649246854591, + "learning_rate": 9.766881381528357e-06, + "loss": 0.4199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25852537155151367, + "step": 2790, + "valid_targets_mean": 3000.1, + "valid_targets_min": 760 + }, + { + "epoch": 4.938992042440319, + "grad_norm": 0.6722076902519407, + "learning_rate": 9.691266335925615e-06, + "loss": 0.4507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1473044753074646, + "step": 2795, + "valid_targets_mean": 2647.0, + "valid_targets_min": 648 + }, + { + "epoch": 4.947833775419983, + "grad_norm": 0.819920472445427, + "learning_rate": 9.615851426362904e-06, + "loss": 0.4385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1795499622821808, + "step": 2800, + "valid_targets_mean": 2951.1, + "valid_targets_min": 1215 + }, + { + "epoch": 4.9566755083996465, + "grad_norm": 0.7025906740887181, + "learning_rate": 9.540638116961986e-06, + "loss": 0.4195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25529012084007263, + "step": 2805, + "valid_targets_mean": 3555.2, + "valid_targets_min": 1071 + }, + { + "epoch": 4.9655172413793105, + "grad_norm": 0.7370327390638789, + "learning_rate": 9.465627867930734e-06, + "loss": 0.4017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20865119993686676, + "step": 2810, + "valid_targets_mean": 2461.0, + "valid_targets_min": 257 + }, + { + "epoch": 4.9743589743589745, + "grad_norm": 0.6324581481449822, + "learning_rate": 9.390822135534738e-06, + "loss": 0.4037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20276159048080444, + "step": 2815, + "valid_targets_mean": 3668.0, + "valid_targets_min": 1824 + }, + { + "epoch": 4.983200707338638, + "grad_norm": 0.7834993482168726, + "learning_rate": 9.31622237206907e-06, + "loss": 0.4356, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17606160044670105, + "step": 2820, + "valid_targets_mean": 2788.4, + "valid_targets_min": 456 + }, + { + "epoch": 4.992042440318302, + "grad_norm": 0.6837420383955042, + "learning_rate": 9.241830025830059e-06, + "loss": 0.4128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18292655050754547, + "step": 2825, + "valid_targets_mean": 3192.5, + "valid_targets_min": 743 + }, + { + "epoch": 5.0, + "grad_norm": 1.1516433834283342, + "learning_rate": 9.167646541087216e-06, + "loss": 0.4185, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.4343792200088501, + "step": 2830, + "valid_targets_mean": 2228.5, + "valid_targets_min": 488 + }, + { + "epoch": 5.008841732979664, + "grad_norm": 0.7806271076048815, + "learning_rate": 9.09367335805515e-06, + "loss": 0.418, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21847274899482727, + "step": 2835, + "valid_targets_mean": 3220.6, + "valid_targets_min": 649 + }, + { + "epoch": 5.017683465959328, + "grad_norm": 0.6706581564830443, + "learning_rate": 9.019911912865634e-06, + "loss": 0.3993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25733518600463867, + "step": 2840, + "valid_targets_mean": 3993.9, + "valid_targets_min": 1384 + }, + { + "epoch": 5.026525198938992, + "grad_norm": 0.728929240628752, + "learning_rate": 8.946363637539699e-06, + "loss": 0.3912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16333594918251038, + "step": 2845, + "valid_targets_mean": 2894.0, + "valid_targets_min": 487 + }, + { + "epoch": 5.035366931918656, + "grad_norm": 0.728458524357944, + "learning_rate": 8.87302995995988e-06, + "loss": 0.387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20494450628757477, + "step": 2850, + "valid_targets_mean": 3790.2, + "valid_targets_min": 1159 + }, + { + "epoch": 5.04420866489832, + "grad_norm": 0.7084662868772482, + "learning_rate": 8.799912303842437e-06, + "loss": 0.4087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20348328351974487, + "step": 2855, + "valid_targets_mean": 3220.6, + "valid_targets_min": 406 + }, + { + "epoch": 5.053050397877984, + "grad_norm": 0.7088150993211034, + "learning_rate": 8.727012088709751e-06, + "loss": 0.3722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22844524681568146, + "step": 2860, + "valid_targets_mean": 4072.2, + "valid_targets_min": 1095 + }, + { + "epoch": 5.061892130857648, + "grad_norm": 0.8455946822457715, + "learning_rate": 8.654330729862752e-06, + "loss": 0.3869, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19593322277069092, + "step": 2865, + "valid_targets_mean": 2430.2, + "valid_targets_min": 432 + }, + { + "epoch": 5.0707338638373125, + "grad_norm": 0.5858642767010211, + "learning_rate": 8.58186963835346e-06, + "loss": 0.3783, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21078699827194214, + "step": 2870, + "valid_targets_mean": 4977.0, + "valid_targets_min": 1444 + }, + { + "epoch": 5.0795755968169765, + "grad_norm": 0.7994534314183666, + "learning_rate": 8.509630220957554e-06, + "loss": 0.4093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19775576889514923, + "step": 2875, + "valid_targets_mean": 2545.8, + "valid_targets_min": 573 + }, + { + "epoch": 5.08841732979664, + "grad_norm": 0.8314569923246584, + "learning_rate": 8.437613880147093e-06, + "loss": 0.3913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1837921142578125, + "step": 2880, + "valid_targets_mean": 2678.4, + "valid_targets_min": 459 + }, + { + "epoch": 5.097259062776304, + "grad_norm": 0.7860099404554846, + "learning_rate": 8.365822014063287e-06, + "loss": 0.3658, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17934468388557434, + "step": 2885, + "valid_targets_mean": 3174.5, + "valid_targets_min": 512 + }, + { + "epoch": 5.106100795755968, + "grad_norm": 0.7604145315647566, + "learning_rate": 8.29425601648933e-06, + "loss": 0.3952, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21388058364391327, + "step": 2890, + "valid_targets_mean": 2896.4, + "valid_targets_min": 353 + }, + { + "epoch": 5.114942528735632, + "grad_norm": 0.8107815627893672, + "learning_rate": 8.222917276823361e-06, + "loss": 0.3976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22443638741970062, + "step": 2895, + "valid_targets_mean": 3731.9, + "valid_targets_min": 1274 + }, + { + "epoch": 5.123784261715296, + "grad_norm": 0.7079702745049611, + "learning_rate": 8.151807180051474e-06, + "loss": 0.4313, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25032246112823486, + "step": 2900, + "valid_targets_mean": 3908.5, + "valid_targets_min": 386 + }, + { + "epoch": 5.13262599469496, + "grad_norm": 0.7899459874887411, + "learning_rate": 8.080927106720862e-06, + "loss": 0.4158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1818743646144867, + "step": 2905, + "valid_targets_mean": 2431.4, + "valid_targets_min": 258 + }, + { + "epoch": 5.141467727674624, + "grad_norm": 0.8962540094006461, + "learning_rate": 8.010278432912971e-06, + "loss": 0.4258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.31215745210647583, + "step": 2910, + "valid_targets_mean": 3037.2, + "valid_targets_min": 1060 + }, + { + "epoch": 5.150309460654288, + "grad_norm": 0.7521497447867146, + "learning_rate": 7.939862530216808e-06, + "loss": 0.3872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18189725279808044, + "step": 2915, + "valid_targets_mean": 2674.8, + "valid_targets_min": 979 + }, + { + "epoch": 5.159151193633952, + "grad_norm": 0.7250094122688368, + "learning_rate": 7.869680765702313e-06, + "loss": 0.4319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1579514592885971, + "step": 2920, + "valid_targets_mean": 2929.2, + "valid_targets_min": 1224 + }, + { + "epoch": 5.167992926613616, + "grad_norm": 0.7675162922726106, + "learning_rate": 7.799734501893825e-06, + "loss": 0.3872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1362682580947876, + "step": 2925, + "valid_targets_mean": 2386.4, + "valid_targets_min": 618 + }, + { + "epoch": 5.17683465959328, + "grad_norm": 0.6709418238351449, + "learning_rate": 7.730025096743601e-06, + "loss": 0.4124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16993936896324158, + "step": 2930, + "valid_targets_mean": 3081.4, + "valid_targets_min": 358 + }, + { + "epoch": 5.185676392572944, + "grad_norm": 0.6432114501479861, + "learning_rate": 7.6605539036055e-06, + "loss": 0.3949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1883753538131714, + "step": 2935, + "valid_targets_mean": 4789.6, + "valid_targets_min": 321 + }, + { + "epoch": 5.194518125552609, + "grad_norm": 0.7001052560650384, + "learning_rate": 7.591322271208639e-06, + "loss": 0.3833, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1550978720188141, + "step": 2940, + "valid_targets_mean": 2667.6, + "valid_targets_min": 1459 + }, + { + "epoch": 5.203359858532273, + "grad_norm": 1.0203017538563217, + "learning_rate": 7.522331543631289e-06, + "loss": 0.3966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27559781074523926, + "step": 2945, + "valid_targets_mean": 2583.2, + "valid_targets_min": 558 + }, + { + "epoch": 5.212201591511937, + "grad_norm": 0.63220733334086, + "learning_rate": 7.453583060274714e-06, + "loss": 0.3912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1653447449207306, + "step": 2950, + "valid_targets_mean": 4349.5, + "valid_targets_min": 2007 + }, + { + "epoch": 5.221043324491601, + "grad_norm": 0.7658723022429813, + "learning_rate": 7.385078155837226e-06, + "loss": 0.4172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2508220672607422, + "step": 2955, + "valid_targets_mean": 3356.6, + "valid_targets_min": 1549 + }, + { + "epoch": 5.2298850574712645, + "grad_norm": 0.6379179057891206, + "learning_rate": 7.316818160288195e-06, + "loss": 0.3916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2654326558113098, + "step": 2960, + "valid_targets_mean": 4930.0, + "valid_targets_min": 447 + }, + { + "epoch": 5.2387267904509285, + "grad_norm": 0.8198169061308748, + "learning_rate": 7.248804398842322e-06, + "loss": 0.4376, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17658288776874542, + "step": 2965, + "valid_targets_mean": 2807.2, + "valid_targets_min": 1191 + }, + { + "epoch": 5.247568523430592, + "grad_norm": 0.7161368425685732, + "learning_rate": 7.181038191933833e-06, + "loss": 0.3725, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23815590143203735, + "step": 2970, + "valid_targets_mean": 3746.0, + "valid_targets_min": 347 + }, + { + "epoch": 5.256410256410256, + "grad_norm": 0.7383520605352984, + "learning_rate": 7.113520855190907e-06, + "loss": 0.3862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17981159687042236, + "step": 2975, + "valid_targets_mean": 2893.6, + "valid_targets_min": 1261 + }, + { + "epoch": 5.26525198938992, + "grad_norm": 0.7617118383380348, + "learning_rate": 7.046253699410058e-06, + "loss": 0.3901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24191364645957947, + "step": 2980, + "valid_targets_mean": 3604.0, + "valid_targets_min": 298 + }, + { + "epoch": 5.274093722369584, + "grad_norm": 0.761360266153581, + "learning_rate": 6.979238030530775e-06, + "loss": 0.3823, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29760921001434326, + "step": 2985, + "valid_targets_mean": 5094.0, + "valid_targets_min": 830 + }, + { + "epoch": 5.282935455349248, + "grad_norm": 0.6957464522130561, + "learning_rate": 6.912475149610094e-06, + "loss": 0.375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14544111490249634, + "step": 2990, + "valid_targets_mean": 2849.9, + "valid_targets_min": 1018 + }, + { + "epoch": 5.291777188328912, + "grad_norm": 0.8834015419681706, + "learning_rate": 6.8459663527973995e-06, + "loss": 0.4253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2348986715078354, + "step": 2995, + "valid_targets_mean": 2487.2, + "valid_targets_min": 360 + }, + { + "epoch": 5.300618921308576, + "grad_norm": 0.7175307826338068, + "learning_rate": 6.779712931309186e-06, + "loss": 0.4069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13426730036735535, + "step": 3000, + "valid_targets_mean": 2886.1, + "valid_targets_min": 1293 + }, + { + "epoch": 5.30946065428824, + "grad_norm": 0.6263326470511927, + "learning_rate": 6.713716171404086e-06, + "loss": 0.4349, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2130982130765915, + "step": 3005, + "valid_targets_mean": 4677.0, + "valid_targets_min": 1091 + }, + { + "epoch": 5.318302387267904, + "grad_norm": 0.7281926036143173, + "learning_rate": 6.647977354357804e-06, + "loss": 0.4308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22627121210098267, + "step": 3010, + "valid_targets_mean": 2928.8, + "valid_targets_min": 460 + }, + { + "epoch": 5.327144120247569, + "grad_norm": 0.6832070210761304, + "learning_rate": 6.582497756438326e-06, + "loss": 0.386, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27786123752593994, + "step": 3015, + "valid_targets_mean": 4205.2, + "valid_targets_min": 1913 + }, + { + "epoch": 5.335985853227233, + "grad_norm": 0.7067931683994918, + "learning_rate": 6.517278648881054e-06, + "loss": 0.3716, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2012796401977539, + "step": 3020, + "valid_targets_mean": 3926.8, + "valid_targets_min": 1419 + }, + { + "epoch": 5.344827586206897, + "grad_norm": 1.0101144556395403, + "learning_rate": 6.452321297864212e-06, + "loss": 0.4082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1759074628353119, + "step": 3025, + "valid_targets_mean": 1739.6, + "valid_targets_min": 565 + }, + { + "epoch": 5.353669319186561, + "grad_norm": 0.6504695714072357, + "learning_rate": 6.387626964484197e-06, + "loss": 0.3963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1815790832042694, + "step": 3030, + "valid_targets_mean": 3034.5, + "valid_targets_min": 260 + }, + { + "epoch": 5.362511052166225, + "grad_norm": 0.829852685254614, + "learning_rate": 6.323196904731155e-06, + "loss": 0.3854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1513374149799347, + "step": 3035, + "valid_targets_mean": 2116.5, + "valid_targets_min": 769 + }, + { + "epoch": 5.371352785145889, + "grad_norm": 0.7446352358190379, + "learning_rate": 6.259032369464522e-06, + "loss": 0.3956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27236083149909973, + "step": 3040, + "valid_targets_mean": 3079.9, + "valid_targets_min": 366 + }, + { + "epoch": 5.380194518125553, + "grad_norm": 0.8228515281616915, + "learning_rate": 6.195134604388819e-06, + "loss": 0.4388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3066047430038452, + "step": 3045, + "valid_targets_mean": 3165.6, + "valid_targets_min": 1862 + }, + { + "epoch": 5.389036251105217, + "grad_norm": 0.7798826897148097, + "learning_rate": 6.1315048500294125e-06, + "loss": 0.4576, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19620686769485474, + "step": 3050, + "valid_targets_mean": 3101.9, + "valid_targets_min": 515 + }, + { + "epoch": 5.3978779840848805, + "grad_norm": 0.930463249760995, + "learning_rate": 6.068144341708464e-06, + "loss": 0.4117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18991626799106598, + "step": 3055, + "valid_targets_mean": 2486.2, + "valid_targets_min": 287 + }, + { + "epoch": 5.4067197170645445, + "grad_norm": 0.7704365886141176, + "learning_rate": 6.0050543095209215e-06, + "loss": 0.402, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1924263834953308, + "step": 3060, + "valid_targets_mean": 3358.0, + "valid_targets_min": 1254 + }, + { + "epoch": 5.415561450044208, + "grad_norm": 0.8532428692792394, + "learning_rate": 5.942235978310649e-06, + "loss": 0.4086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22423534095287323, + "step": 3065, + "valid_targets_mean": 3000.2, + "valid_targets_min": 1198 + }, + { + "epoch": 5.424403183023872, + "grad_norm": 0.669085550320398, + "learning_rate": 5.879690567646645e-06, + "loss": 0.4072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1893330216407776, + "step": 3070, + "valid_targets_mean": 3361.8, + "valid_targets_min": 1890 + }, + { + "epoch": 5.433244916003536, + "grad_norm": 0.7376176849413955, + "learning_rate": 5.817419291799388e-06, + "loss": 0.4171, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16862516105175018, + "step": 3075, + "valid_targets_mean": 3250.4, + "valid_targets_min": 1327 + }, + { + "epoch": 5.442086648983201, + "grad_norm": 0.6542529886450859, + "learning_rate": 5.755423359717222e-06, + "loss": 0.3953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13393324613571167, + "step": 3080, + "valid_targets_mean": 2877.9, + "valid_targets_min": 559 + }, + { + "epoch": 5.450928381962865, + "grad_norm": 0.6392677271638753, + "learning_rate": 5.693703975002911e-06, + "loss": 0.4028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13595180213451385, + "step": 3085, + "valid_targets_mean": 2198.1, + "valid_targets_min": 1258 + }, + { + "epoch": 5.459770114942529, + "grad_norm": 0.8729225649131562, + "learning_rate": 5.632262335890262e-06, + "loss": 0.3457, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21021749079227448, + "step": 3090, + "valid_targets_mean": 2377.5, + "valid_targets_min": 526 + }, + { + "epoch": 5.468611847922193, + "grad_norm": 0.6919169604156997, + "learning_rate": 5.571099635220887e-06, + "loss": 0.3906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.09621213376522064, + "step": 3095, + "valid_targets_mean": 1912.2, + "valid_targets_min": 309 + }, + { + "epoch": 5.477453580901857, + "grad_norm": 0.9121306344310365, + "learning_rate": 5.510217060421006e-06, + "loss": 0.3922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.281181275844574, + "step": 3100, + "valid_targets_mean": 2873.5, + "valid_targets_min": 1299 + }, + { + "epoch": 5.486295313881521, + "grad_norm": 0.7192489768020969, + "learning_rate": 5.449615793478411e-06, + "loss": 0.4078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16287308931350708, + "step": 3105, + "valid_targets_mean": 3211.4, + "valid_targets_min": 961 + }, + { + "epoch": 5.495137046861185, + "grad_norm": 0.831717545619796, + "learning_rate": 5.389297010919545e-06, + "loss": 0.4097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19926907122135162, + "step": 3110, + "valid_targets_mean": 2817.5, + "valid_targets_min": 1149 + }, + { + "epoch": 5.503978779840849, + "grad_norm": 0.8140212742785664, + "learning_rate": 5.329261883786611e-06, + "loss": 0.4226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15885740518569946, + "step": 3115, + "valid_targets_mean": 2335.2, + "valid_targets_min": 514 + }, + { + "epoch": 5.512820512820513, + "grad_norm": 0.9603182918185311, + "learning_rate": 5.2695115776148765e-06, + "loss": 0.3965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2298716902732849, + "step": 3120, + "valid_targets_mean": 1846.4, + "valid_targets_min": 431 + }, + { + "epoch": 5.521662245800177, + "grad_norm": 0.8019735181021684, + "learning_rate": 5.21004725241002e-06, + "loss": 0.3822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22657175362110138, + "step": 3125, + "valid_targets_mean": 2703.9, + "valid_targets_min": 1080 + }, + { + "epoch": 5.530503978779841, + "grad_norm": 0.6986863564233587, + "learning_rate": 5.150870062625639e-06, + "loss": 0.3983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12742537260055542, + "step": 3130, + "valid_targets_mean": 2276.5, + "valid_targets_min": 391 + }, + { + "epoch": 5.539345711759505, + "grad_norm": 0.6392753287000917, + "learning_rate": 5.091981157140808e-06, + "loss": 0.4035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16173365712165833, + "step": 3135, + "valid_targets_mean": 3372.1, + "valid_targets_min": 567 + }, + { + "epoch": 5.548187444739169, + "grad_norm": 0.6393994411262591, + "learning_rate": 5.03338167923779e-06, + "loss": 0.3976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24456486105918884, + "step": 3140, + "valid_targets_mean": 4942.8, + "valid_targets_min": 1585 + }, + { + "epoch": 5.5570291777188325, + "grad_norm": 0.6957281925877212, + "learning_rate": 4.975072766579829e-06, + "loss": 0.4048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13130195438861847, + "step": 3145, + "valid_targets_mean": 2417.5, + "valid_targets_min": 344 + }, + { + "epoch": 5.5658709106984965, + "grad_norm": 0.9301033896027021, + "learning_rate": 4.917055551189089e-06, + "loss": 0.3766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24469897150993347, + "step": 3150, + "valid_targets_mean": 2273.6, + "valid_targets_min": 1133 + }, + { + "epoch": 5.574712643678161, + "grad_norm": 0.6781134728348155, + "learning_rate": 4.859331159424645e-06, + "loss": 0.3818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16952422261238098, + "step": 3155, + "valid_targets_mean": 3207.5, + "valid_targets_min": 298 + }, + { + "epoch": 5.583554376657825, + "grad_norm": 0.6976758942726916, + "learning_rate": 4.801900711960628e-06, + "loss": 0.3838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16358278691768646, + "step": 3160, + "valid_targets_mean": 3211.9, + "valid_targets_min": 1839 + }, + { + "epoch": 5.592396109637489, + "grad_norm": 0.7660887912670873, + "learning_rate": 4.744765323764469e-06, + "loss": 0.4141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2197507917881012, + "step": 3165, + "valid_targets_mean": 2894.8, + "valid_targets_min": 1342 + }, + { + "epoch": 5.601237842617153, + "grad_norm": 0.7314275252775809, + "learning_rate": 4.6879261040752685e-06, + "loss": 0.3959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14985954761505127, + "step": 3170, + "valid_targets_mean": 2667.5, + "valid_targets_min": 465 + }, + { + "epoch": 5.610079575596817, + "grad_norm": 0.6999874428567335, + "learning_rate": 4.63138415638223e-06, + "loss": 0.4117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18852269649505615, + "step": 3175, + "valid_targets_mean": 3877.0, + "valid_targets_min": 667 + }, + { + "epoch": 5.618921308576481, + "grad_norm": 0.7215106059187592, + "learning_rate": 4.575140578403256e-06, + "loss": 0.4084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15598289668560028, + "step": 3180, + "valid_targets_mean": 2837.5, + "valid_targets_min": 247 + }, + { + "epoch": 5.627763041556145, + "grad_norm": 0.6810403634872003, + "learning_rate": 4.519196462063628e-06, + "loss": 0.3603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24649617075920105, + "step": 3185, + "valid_targets_mean": 4866.0, + "valid_targets_min": 503 + }, + { + "epoch": 5.636604774535809, + "grad_norm": 0.8661083461110505, + "learning_rate": 4.4635528934748315e-06, + "loss": 0.4099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25795987248420715, + "step": 3190, + "valid_targets_mean": 2327.2, + "valid_targets_min": 327 + }, + { + "epoch": 5.645446507515473, + "grad_norm": 0.9984452335642174, + "learning_rate": 4.408210952913434e-06, + "loss": 0.4076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21475867927074432, + "step": 3195, + "valid_targets_mean": 2365.8, + "valid_targets_min": 523 + }, + { + "epoch": 5.654288240495137, + "grad_norm": 0.63284420296626, + "learning_rate": 4.353171714800135e-06, + "loss": 0.3617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21914245188236237, + "step": 3200, + "valid_targets_mean": 4543.1, + "valid_targets_min": 1153 + }, + { + "epoch": 5.663129973474801, + "grad_norm": 0.7215660888800569, + "learning_rate": 4.298436247678892e-06, + "loss": 0.4097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18757544457912445, + "step": 3205, + "valid_targets_mean": 3180.9, + "valid_targets_min": 260 + }, + { + "epoch": 5.671971706454465, + "grad_norm": 0.8776106727330101, + "learning_rate": 4.2440056141962116e-06, + "loss": 0.4246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23493947088718414, + "step": 3210, + "valid_targets_mean": 2881.6, + "valid_targets_min": 329 + }, + { + "epoch": 5.680813439434129, + "grad_norm": 0.8049825392272455, + "learning_rate": 4.189880871080465e-06, + "loss": 0.4049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13369911909103394, + "step": 3215, + "valid_targets_mean": 3066.9, + "valid_targets_min": 371 + }, + { + "epoch": 5.689655172413794, + "grad_norm": 0.8302974347090468, + "learning_rate": 4.136063069121412e-06, + "loss": 0.3795, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1873476505279541, + "step": 3220, + "valid_targets_mean": 2237.5, + "valid_targets_min": 687 + }, + { + "epoch": 5.698496905393457, + "grad_norm": 0.6993234633000938, + "learning_rate": 4.082553253149784e-06, + "loss": 0.3919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21738377213478088, + "step": 3225, + "valid_targets_mean": 3679.9, + "valid_targets_min": 1340 + }, + { + "epoch": 5.7073386383731215, + "grad_norm": 0.9105087640110349, + "learning_rate": 4.029352462017016e-06, + "loss": 0.4019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23904664814472198, + "step": 3230, + "valid_targets_mean": 2628.5, + "valid_targets_min": 778 + }, + { + "epoch": 5.7161803713527854, + "grad_norm": 0.7887831667909359, + "learning_rate": 3.9764617285750516e-06, + "loss": 0.3985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15723231434822083, + "step": 3235, + "valid_targets_mean": 2306.4, + "valid_targets_min": 505 + }, + { + "epoch": 5.725022104332449, + "grad_norm": 0.8628976638475314, + "learning_rate": 3.923882079656311e-06, + "loss": 0.3979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1998981535434723, + "step": 3240, + "valid_targets_mean": 2389.6, + "valid_targets_min": 368 + }, + { + "epoch": 5.733863837312113, + "grad_norm": 0.8851868206445387, + "learning_rate": 3.8716145360537516e-06, + "loss": 0.3869, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23257210850715637, + "step": 3245, + "valid_targets_mean": 2343.6, + "valid_targets_min": 480 + }, + { + "epoch": 5.742705570291777, + "grad_norm": 0.7909943609866004, + "learning_rate": 3.819660112501053e-06, + "loss": 0.4063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.237594872713089, + "step": 3250, + "valid_targets_mean": 3360.4, + "valid_targets_min": 1582 + }, + { + "epoch": 5.751547303271441, + "grad_norm": 0.9465551894292238, + "learning_rate": 3.768019817652906e-06, + "loss": 0.4158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17449277639389038, + "step": 3255, + "valid_targets_mean": 1845.4, + "valid_targets_min": 668 + }, + { + "epoch": 5.760389036251105, + "grad_norm": 0.8378732351349432, + "learning_rate": 3.7166946540654403e-06, + "loss": 0.3863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22095929086208344, + "step": 3260, + "valid_targets_mean": 2153.5, + "valid_targets_min": 459 + }, + { + "epoch": 5.769230769230769, + "grad_norm": 0.7193963936499834, + "learning_rate": 3.6656856181767487e-06, + "loss": 0.427, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17883676290512085, + "step": 3265, + "valid_targets_mean": 3431.5, + "valid_targets_min": 778 + }, + { + "epoch": 5.778072502210433, + "grad_norm": 0.8619394466221819, + "learning_rate": 3.6149937002875725e-06, + "loss": 0.4139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1710013896226883, + "step": 3270, + "valid_targets_mean": 1953.4, + "valid_targets_min": 296 + }, + { + "epoch": 5.786914235190097, + "grad_norm": 0.7617624941176476, + "learning_rate": 3.564619884542033e-06, + "loss": 0.4073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18097054958343506, + "step": 3275, + "valid_targets_mean": 2563.1, + "valid_targets_min": 1498 + }, + { + "epoch": 5.795755968169761, + "grad_norm": 0.7210899911422212, + "learning_rate": 3.514565148908553e-06, + "loss": 0.4115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21109169721603394, + "step": 3280, + "valid_targets_mean": 3776.4, + "valid_targets_min": 1323 + }, + { + "epoch": 5.804597701149425, + "grad_norm": 0.8741955579576905, + "learning_rate": 3.4648304651608623e-06, + "loss": 0.3956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17497266829013824, + "step": 3285, + "valid_targets_mean": 2469.2, + "valid_targets_min": 1320 + }, + { + "epoch": 5.813439434129089, + "grad_norm": 0.7414269383554729, + "learning_rate": 3.4154167988591367e-06, + "loss": 0.3837, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15306875109672546, + "step": 3290, + "valid_targets_mean": 2028.0, + "valid_targets_min": 559 + }, + { + "epoch": 5.822281167108754, + "grad_norm": 0.680343087267019, + "learning_rate": 3.3663251093312477e-06, + "loss": 0.4257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15991319715976715, + "step": 3295, + "valid_targets_mean": 3004.1, + "valid_targets_min": 1060 + }, + { + "epoch": 5.831122900088418, + "grad_norm": 0.7192829761203814, + "learning_rate": 3.317556349654125e-06, + "loss": 0.3822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24054303765296936, + "step": 3300, + "valid_targets_mean": 4578.8, + "valid_targets_min": 867 + }, + { + "epoch": 5.839964633068082, + "grad_norm": 0.8129183520607333, + "learning_rate": 3.2691114666352887e-06, + "loss": 0.41, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17372924089431763, + "step": 3305, + "valid_targets_mean": 1957.9, + "valid_targets_min": 308 + }, + { + "epoch": 5.848806366047746, + "grad_norm": 0.6912822577892667, + "learning_rate": 3.220991400794431e-06, + "loss": 0.3794, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20085839927196503, + "step": 3310, + "valid_targets_mean": 4113.1, + "valid_targets_min": 478 + }, + { + "epoch": 5.85764809902741, + "grad_norm": 0.7568673476778853, + "learning_rate": 3.1731970863451746e-06, + "loss": 0.3949, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16372664272785187, + "step": 3315, + "valid_targets_mean": 2882.0, + "valid_targets_min": 350 + }, + { + "epoch": 5.8664898320070735, + "grad_norm": 0.8292901753145713, + "learning_rate": 3.1257294511769263e-06, + "loss": 0.3945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1919775903224945, + "step": 3320, + "valid_targets_mean": 2993.4, + "valid_targets_min": 409 + }, + { + "epoch": 5.8753315649867375, + "grad_norm": 0.66874118757708, + "learning_rate": 3.0785894168368857e-06, + "loss": 0.4101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3156202435493469, + "step": 3325, + "valid_targets_mean": 4430.4, + "valid_targets_min": 1275 + }, + { + "epoch": 5.884173297966401, + "grad_norm": 0.7803502732071088, + "learning_rate": 3.0317778985121182e-06, + "loss": 0.4128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17863729596138, + "step": 3330, + "valid_targets_mean": 2628.6, + "valid_targets_min": 262 + }, + { + "epoch": 5.893015030946065, + "grad_norm": 0.8120192943631549, + "learning_rate": 2.9852958050118275e-06, + "loss": 0.4182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1689552515745163, + "step": 3335, + "valid_targets_mean": 3196.8, + "valid_targets_min": 318 + }, + { + "epoch": 5.901856763925729, + "grad_norm": 0.7503397178701974, + "learning_rate": 2.9391440387496617e-06, + "loss": 0.4242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1889551877975464, + "step": 3340, + "valid_targets_mean": 3213.4, + "valid_targets_min": 363 + }, + { + "epoch": 5.910698496905393, + "grad_norm": 0.8591198480547091, + "learning_rate": 2.89332349572625e-06, + "loss": 0.3703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1662624180316925, + "step": 3345, + "valid_targets_mean": 1885.9, + "valid_targets_min": 543 + }, + { + "epoch": 5.919540229885057, + "grad_norm": 0.9519020720938417, + "learning_rate": 2.847835065511766e-06, + "loss": 0.3988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17353492975234985, + "step": 3350, + "valid_targets_mean": 1727.4, + "valid_targets_min": 349 + }, + { + "epoch": 5.928381962864721, + "grad_norm": 0.8747102894127499, + "learning_rate": 2.8026796312286843e-06, + "loss": 0.4373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23620933294296265, + "step": 3355, + "valid_targets_mean": 3666.1, + "valid_targets_min": 1644 + }, + { + "epoch": 5.937223695844385, + "grad_norm": 0.6376827702661823, + "learning_rate": 2.757858069534598e-06, + "loss": 0.3984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1924460232257843, + "step": 3360, + "valid_targets_mean": 4527.5, + "valid_targets_min": 553 + }, + { + "epoch": 5.946065428824049, + "grad_norm": 0.6516051452822853, + "learning_rate": 2.71337125060525e-06, + "loss": 0.417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3005494475364685, + "step": 3365, + "valid_targets_mean": 5757.8, + "valid_targets_min": 2223 + }, + { + "epoch": 5.954907161803714, + "grad_norm": 0.732478020417441, + "learning_rate": 2.669220038117597e-06, + "loss": 0.4419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27111363410949707, + "step": 3370, + "valid_targets_mean": 3390.0, + "valid_targets_min": 458 + }, + { + "epoch": 5.963748894783378, + "grad_norm": 0.8080636185217684, + "learning_rate": 2.6254052892330737e-06, + "loss": 0.4438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3034144341945648, + "step": 3375, + "valid_targets_mean": 3722.1, + "valid_targets_min": 517 + }, + { + "epoch": 5.972590627763042, + "grad_norm": 0.7169451114480241, + "learning_rate": 2.5819278545809103e-06, + "loss": 0.4149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27992749214172363, + "step": 3380, + "valid_targets_mean": 3570.2, + "valid_targets_min": 396 + }, + { + "epoch": 5.981432360742706, + "grad_norm": 0.844425388762182, + "learning_rate": 2.5387885782416712e-06, + "loss": 0.3631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17740076780319214, + "step": 3385, + "valid_targets_mean": 2162.0, + "valid_targets_min": 550 + }, + { + "epoch": 5.99027409372237, + "grad_norm": 0.6494113116563578, + "learning_rate": 2.495988297730818e-06, + "loss": 0.4035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20014826953411102, + "step": 3390, + "valid_targets_mean": 4345.4, + "valid_targets_min": 438 + }, + { + "epoch": 5.999115826702034, + "grad_norm": 0.6847608100268655, + "learning_rate": 2.453527843982497e-06, + "loss": 0.3689, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.28000521659851074, + "step": 3395, + "valid_targets_mean": 5669.8, + "valid_targets_min": 1543 + }, + { + "epoch": 6.007073386383731, + "grad_norm": 0.7892539431347021, + "learning_rate": 2.4114080413333474e-06, + "loss": 0.3823, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21648083627223969, + "step": 3400, + "valid_targets_mean": 3293.4, + "valid_targets_min": 1170 + }, + { + "epoch": 6.015915119363395, + "grad_norm": 0.7327489748764502, + "learning_rate": 2.369629707506569e-06, + "loss": 0.3901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21525824069976807, + "step": 3405, + "valid_targets_mean": 2875.0, + "valid_targets_min": 1100 + }, + { + "epoch": 6.024756852343059, + "grad_norm": 0.7427914142271864, + "learning_rate": 2.328193653595985e-06, + "loss": 0.3892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29550355672836304, + "step": 3410, + "valid_targets_mean": 3901.6, + "valid_targets_min": 1147 + }, + { + "epoch": 6.033598585322723, + "grad_norm": 0.7551934122627986, + "learning_rate": 2.2871006840503384e-06, + "loss": 0.385, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1656990498304367, + "step": 3415, + "valid_targets_mean": 2678.4, + "valid_targets_min": 911 + }, + { + "epoch": 6.042440318302387, + "grad_norm": 0.8014400239410849, + "learning_rate": 2.2463515966576342e-06, + "loss": 0.3856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19182810187339783, + "step": 3420, + "valid_targets_mean": 2418.2, + "valid_targets_min": 415 + }, + { + "epoch": 6.051282051282051, + "grad_norm": 0.897788988403115, + "learning_rate": 2.2059471825296973e-06, + "loss": 0.3931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.26385846734046936, + "step": 3425, + "valid_targets_mean": 2770.5, + "valid_targets_min": 562 + }, + { + "epoch": 6.060123784261715, + "grad_norm": 0.8149264081278768, + "learning_rate": 2.1658882260867698e-06, + "loss": 0.3711, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12121979147195816, + "step": 3430, + "valid_targets_mean": 1847.2, + "valid_targets_min": 1211 + }, + { + "epoch": 6.068965517241379, + "grad_norm": 0.9058022749241772, + "learning_rate": 2.1261755050423204e-06, + "loss": 0.3914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18681831657886505, + "step": 3435, + "valid_targets_mean": 2502.9, + "valid_targets_min": 294 + }, + { + "epoch": 6.077807250221043, + "grad_norm": 0.5875487670316494, + "learning_rate": 2.086809790387905e-06, + "loss": 0.3824, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14535044133663177, + "step": 3440, + "valid_targets_mean": 3132.5, + "valid_targets_min": 673 + }, + { + "epoch": 6.086648983200707, + "grad_norm": 0.7952935546054049, + "learning_rate": 2.047791846378242e-06, + "loss": 0.3832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18173527717590332, + "step": 3445, + "valid_targets_mean": 3148.6, + "valid_targets_min": 482 + }, + { + "epoch": 6.095490716180372, + "grad_norm": 0.7607277089232913, + "learning_rate": 2.009122430516337e-06, + "loss": 0.3862, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17606256902217865, + "step": 3450, + "valid_targets_mean": 2331.9, + "valid_targets_min": 1478 + }, + { + "epoch": 6.104332449160036, + "grad_norm": 0.7496258419853713, + "learning_rate": 1.970802293538807e-06, + "loss": 0.3777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27735546231269836, + "step": 3455, + "valid_targets_mean": 4273.4, + "valid_targets_min": 1153 + }, + { + "epoch": 6.1131741821397, + "grad_norm": 0.6985174849382113, + "learning_rate": 1.9328321794012762e-06, + "loss": 0.3882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2295549213886261, + "step": 3460, + "valid_targets_mean": 3212.6, + "valid_targets_min": 358 + }, + { + "epoch": 6.122015915119364, + "grad_norm": 0.6160591675123345, + "learning_rate": 1.895212825263959e-06, + "loss": 0.3912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.262872576713562, + "step": 3465, + "valid_targets_mean": 6619.6, + "valid_targets_min": 1010 + }, + { + "epoch": 6.130857648099028, + "grad_norm": 0.8207914026042112, + "learning_rate": 1.8579449614773314e-06, + "loss": 0.3729, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13713327050209045, + "step": 3470, + "valid_targets_mean": 1882.8, + "valid_targets_min": 591 + }, + { + "epoch": 6.1396993810786915, + "grad_norm": 0.8071469248304369, + "learning_rate": 1.8210293115679677e-06, + "loss": 0.4061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2146981954574585, + "step": 3475, + "valid_targets_mean": 3234.0, + "valid_targets_min": 559 + }, + { + "epoch": 6.1485411140583555, + "grad_norm": 0.6897319556110078, + "learning_rate": 1.784466592224472e-06, + "loss": 0.3966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13424663245677948, + "step": 3480, + "valid_targets_mean": 2311.5, + "valid_targets_min": 676 + }, + { + "epoch": 6.157382847038019, + "grad_norm": 0.729819719486692, + "learning_rate": 1.74825751328358e-06, + "loss": 0.3926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19196979701519012, + "step": 3485, + "valid_targets_mean": 3340.2, + "valid_targets_min": 554 + }, + { + "epoch": 6.166224580017683, + "grad_norm": 0.8426168349719839, + "learning_rate": 1.7124027777163732e-06, + "loss": 0.4201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14435023069381714, + "step": 3490, + "valid_targets_mean": 1912.6, + "valid_targets_min": 319 + }, + { + "epoch": 6.175066312997347, + "grad_norm": 0.759757715201301, + "learning_rate": 1.6769030816146404e-06, + "loss": 0.3965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22856047749519348, + "step": 3495, + "valid_targets_mean": 3739.8, + "valid_targets_min": 924 + }, + { + "epoch": 6.183908045977011, + "grad_norm": 0.8366056994371286, + "learning_rate": 1.6417591141773458e-06, + "loss": 0.4146, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17554280161857605, + "step": 3500, + "valid_targets_mean": 2551.6, + "valid_targets_min": 529 + }, + { + "epoch": 6.192749778956675, + "grad_norm": 0.7980312027283708, + "learning_rate": 1.6069715576972634e-06, + "loss": 0.3904, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.27862659096717834, + "step": 3505, + "valid_targets_mean": 3707.2, + "valid_targets_min": 1715 + }, + { + "epoch": 6.201591511936339, + "grad_norm": 0.7364325995709389, + "learning_rate": 1.5725410875477187e-06, + "loss": 0.3608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1674642115831375, + "step": 3510, + "valid_targets_mean": 2912.5, + "valid_targets_min": 263 + }, + { + "epoch": 6.210433244916003, + "grad_norm": 0.8858927969586514, + "learning_rate": 1.5384683721694993e-06, + "loss": 0.3889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18463276326656342, + "step": 3515, + "valid_targets_mean": 2316.4, + "valid_targets_min": 715 + }, + { + "epoch": 6.219274977895668, + "grad_norm": 0.8919860695858821, + "learning_rate": 1.504754073057846e-06, + "loss": 0.4015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19577711820602417, + "step": 3520, + "valid_targets_mean": 1823.4, + "valid_targets_min": 384 + }, + { + "epoch": 6.228116710875332, + "grad_norm": 0.8455766242568858, + "learning_rate": 1.4713988447496342e-06, + "loss": 0.4037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19854457676410675, + "step": 3525, + "valid_targets_mean": 2662.8, + "valid_targets_min": 608 + }, + { + "epoch": 6.236958443854996, + "grad_norm": 0.744453900421472, + "learning_rate": 1.438403334810663e-06, + "loss": 0.3768, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15537121891975403, + "step": 3530, + "valid_targets_mean": 2982.4, + "valid_targets_min": 2031 + }, + { + "epoch": 6.24580017683466, + "grad_norm": 0.8827206937052091, + "learning_rate": 1.405768183823073e-06, + "loss": 0.3864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19907264411449432, + "step": 3535, + "valid_targets_mean": 2362.4, + "valid_targets_min": 452 + }, + { + "epoch": 6.254641909814324, + "grad_norm": 0.8416510383985708, + "learning_rate": 1.3734940253729167e-06, + "loss": 0.3777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22170794010162354, + "step": 3540, + "valid_targets_mean": 3408.8, + "valid_targets_min": 293 + }, + { + "epoch": 6.263483642793988, + "grad_norm": 0.7873873101117113, + "learning_rate": 1.3415814860378573e-06, + "loss": 0.3766, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14214427769184113, + "step": 3545, + "valid_targets_mean": 2900.8, + "valid_targets_min": 394 + }, + { + "epoch": 6.272325375773652, + "grad_norm": 0.7347622266646417, + "learning_rate": 1.3100311853750114e-06, + "loss": 0.4088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.152814120054245, + "step": 3550, + "valid_targets_mean": 2783.9, + "valid_targets_min": 780 + }, + { + "epoch": 6.281167108753316, + "grad_norm": 0.8638119930741502, + "learning_rate": 1.2788437359089056e-06, + "loss": 0.3869, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2797715365886688, + "step": 3555, + "valid_targets_mean": 3625.0, + "valid_targets_min": 1228 + }, + { + "epoch": 6.29000884173298, + "grad_norm": 0.7458458853206296, + "learning_rate": 1.248019743119595e-06, + "loss": 0.3677, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2126968950033188, + "step": 3560, + "valid_targets_mean": 3209.9, + "valid_targets_min": 275 + }, + { + "epoch": 6.2988505747126435, + "grad_norm": 0.7013433868816651, + "learning_rate": 1.2175598054309058e-06, + "loss": 0.3637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24043208360671997, + "step": 3565, + "valid_targets_mean": 4891.2, + "valid_targets_min": 711 + }, + { + "epoch": 6.3076923076923075, + "grad_norm": 0.7155286710184046, + "learning_rate": 1.187464514198824e-06, + "loss": 0.389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22147774696350098, + "step": 3570, + "valid_targets_mean": 3511.0, + "valid_targets_min": 661 + }, + { + "epoch": 6.316534040671971, + "grad_norm": 0.8942958090189175, + "learning_rate": 1.1577344537000012e-06, + "loss": 0.3619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24931302666664124, + "step": 3575, + "valid_targets_mean": 3223.0, + "valid_targets_min": 1451 + }, + { + "epoch": 6.325375773651635, + "grad_norm": 0.8019003945889316, + "learning_rate": 1.128370201120419e-06, + "loss": 0.4175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2635502517223358, + "step": 3580, + "valid_targets_mean": 3202.5, + "valid_targets_min": 1373 + }, + { + "epoch": 6.334217506631299, + "grad_norm": 0.6817340392127685, + "learning_rate": 1.0993723265441835e-06, + "loss": 0.3823, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13677793741226196, + "step": 3585, + "valid_targets_mean": 2905.6, + "valid_targets_min": 1394 + }, + { + "epoch": 6.343059239610964, + "grad_norm": 0.6095420535867488, + "learning_rate": 1.0707413929424626e-06, + "loss": 0.415, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17292746901512146, + "step": 3590, + "valid_targets_mean": 3958.5, + "valid_targets_min": 2560 + }, + { + "epoch": 6.351900972590628, + "grad_norm": 0.6319517497546866, + "learning_rate": 1.0424779561625465e-06, + "loss": 0.3905, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15072670578956604, + "step": 3595, + "valid_targets_mean": 3169.4, + "valid_targets_min": 981 + }, + { + "epoch": 6.360742705570292, + "grad_norm": 0.806370402271801, + "learning_rate": 1.0145825649170593e-06, + "loss": 0.4086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2352861762046814, + "step": 3600, + "valid_targets_mean": 2252.2, + "valid_targets_min": 323 + }, + { + "epoch": 6.369584438549956, + "grad_norm": 0.6699724587109076, + "learning_rate": 9.870557607733056e-07, + "loss": 0.3799, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16308927536010742, + "step": 3605, + "valid_targets_mean": 3615.8, + "valid_targets_min": 415 + }, + { + "epoch": 6.37842617152962, + "grad_norm": 0.827228282016501, + "learning_rate": 9.59898078142767e-07, + "loss": 0.4035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2147194743156433, + "step": 3610, + "valid_targets_mean": 2595.4, + "valid_targets_min": 491 + }, + { + "epoch": 6.387267904509284, + "grad_norm": 0.6652223634579235, + "learning_rate": 9.331100442707108e-07, + "loss": 0.4052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17819935083389282, + "step": 3615, + "valid_targets_mean": 3927.1, + "valid_targets_min": 979 + }, + { + "epoch": 6.396109637488948, + "grad_norm": 0.7289789412288719, + "learning_rate": 9.066921792259654e-07, + "loss": 0.389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18159447610378265, + "step": 3620, + "valid_targets_mean": 3477.9, + "valid_targets_min": 363 + }, + { + "epoch": 6.404951370468612, + "grad_norm": 0.6396828577240828, + "learning_rate": 8.806449958908115e-07, + "loss": 0.382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22703109681606293, + "step": 3625, + "valid_targets_mean": 5019.6, + "valid_targets_min": 1272 + }, + { + "epoch": 6.413793103448276, + "grad_norm": 0.8721346570560746, + "learning_rate": 8.549689999510446e-07, + "loss": 0.3822, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23551982641220093, + "step": 3630, + "valid_targets_mean": 2339.8, + "valid_targets_min": 431 + }, + { + "epoch": 6.42263483642794, + "grad_norm": 0.6947586156644703, + "learning_rate": 8.296646898861405e-07, + "loss": 0.3807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16428089141845703, + "step": 3635, + "valid_targets_mean": 3315.1, + "valid_targets_min": 706 + }, + { + "epoch": 6.431476569407604, + "grad_norm": 0.7795433915349836, + "learning_rate": 8.047325569595821e-07, + "loss": 0.3883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1826629936695099, + "step": 3640, + "valid_targets_mean": 2893.4, + "valid_targets_min": 458 + }, + { + "epoch": 6.440318302387268, + "grad_norm": 0.6984355115855847, + "learning_rate": 7.801730852093193e-07, + "loss": 0.4044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21642327308654785, + "step": 3645, + "valid_targets_mean": 3958.0, + "valid_targets_min": 435 + }, + { + "epoch": 6.449160035366932, + "grad_norm": 1.0772469112743712, + "learning_rate": 7.559867514383867e-07, + "loss": 0.3647, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2273642122745514, + "step": 3650, + "valid_targets_mean": 3464.5, + "valid_targets_min": 565 + }, + { + "epoch": 6.458001768346596, + "grad_norm": 0.8907493802415359, + "learning_rate": 7.321740252056253e-07, + "loss": 0.4066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19292961061000824, + "step": 3655, + "valid_targets_mean": 2551.0, + "valid_targets_min": 358 + }, + { + "epoch": 6.4668435013262595, + "grad_norm": 0.8209923973422765, + "learning_rate": 7.087353688165776e-07, + "loss": 0.4453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1861528754234314, + "step": 3660, + "valid_targets_mean": 2526.1, + "valid_targets_min": 577 + }, + { + "epoch": 6.475685234305924, + "grad_norm": 0.7474743887332304, + "learning_rate": 6.856712373145158e-07, + "loss": 0.3908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22273015975952148, + "step": 3665, + "valid_targets_mean": 2730.5, + "valid_targets_min": 328 + }, + { + "epoch": 6.484526967285588, + "grad_norm": 0.7947503636901528, + "learning_rate": 6.62982078471599e-07, + "loss": 0.399, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3024711310863495, + "step": 3670, + "valid_targets_mean": 4017.4, + "valid_targets_min": 826 + }, + { + "epoch": 6.493368700265252, + "grad_norm": 0.8974195325023576, + "learning_rate": 6.406683327801877e-07, + "loss": 0.3775, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1381479799747467, + "step": 3675, + "valid_targets_mean": 1530.0, + "valid_targets_min": 406 + }, + { + "epoch": 6.502210433244916, + "grad_norm": 0.7191615989293343, + "learning_rate": 6.187304334442856e-07, + "loss": 0.3885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1408117115497589, + "step": 3680, + "valid_targets_mean": 3383.2, + "valid_targets_min": 736 + }, + { + "epoch": 6.51105216622458, + "grad_norm": 0.9329960975796369, + "learning_rate": 5.97168806371129e-07, + "loss": 0.3798, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.2396770715713501, + "step": 3685, + "valid_targets_mean": 2167.9, + "valid_targets_min": 769 + }, + { + "epoch": 6.519893899204244, + "grad_norm": 0.6478034299508139, + "learning_rate": 5.759838701629284e-07, + "loss": 0.3876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18991714715957642, + "step": 3690, + "valid_targets_mean": 3872.1, + "valid_targets_min": 1687 + }, + { + "epoch": 6.528735632183908, + "grad_norm": 0.665389821538992, + "learning_rate": 5.551760361087288e-07, + "loss": 0.3781, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20422768592834473, + "step": 3695, + "valid_targets_mean": 3974.6, + "valid_targets_min": 1072 + }, + { + "epoch": 6.537577365163572, + "grad_norm": 0.8481964209332128, + "learning_rate": 5.347457081764318e-07, + "loss": 0.387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12965896725654602, + "step": 3700, + "valid_targets_mean": 2102.9, + "valid_targets_min": 547 + }, + { + "epoch": 6.546419098143236, + "grad_norm": 0.7959235784114853, + "learning_rate": 5.146932830049545e-07, + "loss": 0.3908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.13871905207633972, + "step": 3705, + "valid_targets_mean": 2381.4, + "valid_targets_min": 416 + }, + { + "epoch": 6.5552608311229, + "grad_norm": 0.9738963676820827, + "learning_rate": 4.950191498965207e-07, + "loss": 0.391, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24106061458587646, + "step": 3710, + "valid_targets_mean": 2475.1, + "valid_targets_min": 958 + }, + { + "epoch": 6.564102564102564, + "grad_norm": 0.6979946706582677, + "learning_rate": 4.7572369080910897e-07, + "loss": 0.402, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.283669114112854, + "step": 3715, + "valid_targets_mean": 3481.0, + "valid_targets_min": 515 + }, + { + "epoch": 6.572944297082228, + "grad_norm": 0.8704935577886896, + "learning_rate": 4.568072803490409e-07, + "loss": 0.4178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18020617961883545, + "step": 3720, + "valid_targets_mean": 2580.9, + "valid_targets_min": 609 + }, + { + "epoch": 6.581786030061892, + "grad_norm": 0.7804746793990116, + "learning_rate": 4.382702857637022e-07, + "loss": 0.3803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17412936687469482, + "step": 3725, + "valid_targets_mean": 3689.2, + "valid_targets_min": 378 + }, + { + "epoch": 6.590627763041557, + "grad_norm": 0.8487934940824559, + "learning_rate": 4.2011306693441554e-07, + "loss": 0.4013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24455024302005768, + "step": 3730, + "valid_targets_mean": 2609.2, + "valid_targets_min": 657 + }, + { + "epoch": 6.59946949602122, + "grad_norm": 0.6852406296840956, + "learning_rate": 4.0233597636944565e-07, + "loss": 0.3904, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19759978353977203, + "step": 3735, + "valid_targets_mean": 3594.5, + "valid_targets_min": 438 + }, + { + "epoch": 6.6083112290008845, + "grad_norm": 0.7416508492161489, + "learning_rate": 3.84939359197174e-07, + "loss": 0.4063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.138950914144516, + "step": 3740, + "valid_targets_mean": 2434.2, + "valid_targets_min": 283 + }, + { + "epoch": 6.6171529619805485, + "grad_norm": 0.8357824054733599, + "learning_rate": 3.6792355315937947e-07, + "loss": 0.3735, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19350282847881317, + "step": 3745, + "valid_targets_mean": 2571.5, + "valid_targets_min": 1450 + }, + { + "epoch": 6.625994694960212, + "grad_norm": 0.8587156622200902, + "learning_rate": 3.5128888860468836e-07, + "loss": 0.3885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22190819680690765, + "step": 3750, + "valid_targets_mean": 3109.5, + "valid_targets_min": 339 + }, + { + "epoch": 6.634836427939876, + "grad_norm": 0.6581213951003092, + "learning_rate": 3.350356884821748e-07, + "loss": 0.4011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21432948112487793, + "step": 3755, + "valid_targets_mean": 3528.0, + "valid_targets_min": 635 + }, + { + "epoch": 6.64367816091954, + "grad_norm": 0.8286218218972864, + "learning_rate": 3.191642683350571e-07, + "loss": 0.3918, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.32919830083847046, + "step": 3760, + "valid_targets_mean": 4206.6, + "valid_targets_min": 560 + }, + { + "epoch": 6.652519893899204, + "grad_norm": 0.7950121098953326, + "learning_rate": 3.036749362946112e-07, + "loss": 0.388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.18096879124641418, + "step": 3765, + "valid_targets_mean": 2454.1, + "valid_targets_min": 480 + }, + { + "epoch": 6.661361626878868, + "grad_norm": 0.7940166037642752, + "learning_rate": 2.8856799307415807e-07, + "loss": 0.3903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14865876734256744, + "step": 3770, + "valid_targets_mean": 2513.9, + "valid_targets_min": 888 + }, + { + "epoch": 6.670203359858532, + "grad_norm": 0.7495945684460611, + "learning_rate": 2.7384373196324365e-07, + "loss": 0.3681, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.11169509589672089, + "step": 3775, + "valid_targets_mean": 2019.8, + "valid_targets_min": 563 + }, + { + "epoch": 6.679045092838196, + "grad_norm": 0.711551778287024, + "learning_rate": 2.595024388219347e-07, + "loss": 0.3841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22360673546791077, + "step": 3780, + "valid_targets_mean": 3386.1, + "valid_targets_min": 459 + }, + { + "epoch": 6.68788682581786, + "grad_norm": 0.7177246883491567, + "learning_rate": 2.4554439207527424e-07, + "loss": 0.3825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19970688223838806, + "step": 3785, + "valid_targets_mean": 4797.1, + "valid_targets_min": 1729 + }, + { + "epoch": 6.696728558797524, + "grad_norm": 0.7780793009957203, + "learning_rate": 2.3196986270787704e-07, + "loss": 0.4226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.3514820635318756, + "step": 3790, + "valid_targets_mean": 4338.2, + "valid_targets_min": 1681 + }, + { + "epoch": 6.705570291777188, + "grad_norm": 0.7174415720541817, + "learning_rate": 2.1877911425866705e-07, + "loss": 0.3864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15473148226737976, + "step": 3795, + "valid_targets_mean": 2806.8, + "valid_targets_min": 362 + }, + { + "epoch": 6.714412024756852, + "grad_norm": 0.6743683915959348, + "learning_rate": 2.059724028157506e-07, + "loss": 0.3834, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16321048140525818, + "step": 3800, + "valid_targets_mean": 3285.9, + "valid_targets_min": 341 + }, + { + "epoch": 6.723253757736517, + "grad_norm": 0.7217029334413514, + "learning_rate": 1.9354997701146904e-07, + "loss": 0.3951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.24354010820388794, + "step": 3805, + "valid_targets_mean": 3629.1, + "valid_targets_min": 1637 + }, + { + "epoch": 6.732095490716181, + "grad_norm": 0.7644466171909563, + "learning_rate": 1.8151207801754722e-07, + "loss": 0.4429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22783520817756653, + "step": 3810, + "valid_targets_mean": 3151.8, + "valid_targets_min": 679 + }, + { + "epoch": 6.740937223695845, + "grad_norm": 0.697996637149306, + "learning_rate": 1.6985893954042598e-07, + "loss": 0.4009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.34702497720718384, + "step": 3815, + "valid_targets_mean": 5219.4, + "valid_targets_min": 661 + }, + { + "epoch": 6.749778956675509, + "grad_norm": 0.6524281262476507, + "learning_rate": 1.5859078781671477e-07, + "loss": 0.3758, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16086144745349884, + "step": 3820, + "valid_targets_mean": 3767.5, + "valid_targets_min": 1390 + }, + { + "epoch": 6.758620689655173, + "grad_norm": 0.8703374924931297, + "learning_rate": 1.477078416088107e-07, + "loss": 0.383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.157963365316391, + "step": 3825, + "valid_targets_mean": 2099.6, + "valid_targets_min": 703 + }, + { + "epoch": 6.7674624226348365, + "grad_norm": 0.9150276768989083, + "learning_rate": 1.3721031220064185e-07, + "loss": 0.3985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20869338512420654, + "step": 3830, + "valid_targets_mean": 2169.6, + "valid_targets_min": 769 + }, + { + "epoch": 6.7763041556145005, + "grad_norm": 0.8582742028385791, + "learning_rate": 1.2709840339357515e-07, + "loss": 0.3803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1651896834373474, + "step": 3835, + "valid_targets_mean": 1981.6, + "valid_targets_min": 281 + }, + { + "epoch": 6.7851458885941645, + "grad_norm": 0.8933135468827135, + "learning_rate": 1.1737231150244388e-07, + "loss": 0.383, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16246512532234192, + "step": 3840, + "valid_targets_mean": 2891.0, + "valid_targets_min": 542 + }, + { + "epoch": 6.793987621573828, + "grad_norm": 0.8039369028796995, + "learning_rate": 1.0803222535175295e-07, + "loss": 0.3603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.12738923728466034, + "step": 3845, + "valid_targets_mean": 2474.1, + "valid_targets_min": 458 + }, + { + "epoch": 6.802829354553492, + "grad_norm": 0.800841966247947, + "learning_rate": 9.907832627200631e-08, + "loss": 0.3988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.19415853917598724, + "step": 3850, + "valid_targets_mean": 2828.2, + "valid_targets_min": 1638 + }, + { + "epoch": 6.811671087533156, + "grad_norm": 0.7602967171940971, + "learning_rate": 9.051078809618752e-08, + "loss": 0.3876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.29658013582229614, + "step": 3855, + "valid_targets_mean": 4289.4, + "valid_targets_min": 1496 + }, + { + "epoch": 6.82051282051282, + "grad_norm": 0.6866320695142892, + "learning_rate": 8.232977715637358e-08, + "loss": 0.3803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.22931569814682007, + "step": 3860, + "valid_targets_mean": 5008.4, + "valid_targets_min": 406 + }, + { + "epoch": 6.829354553492484, + "grad_norm": 0.8047620480314491, + "learning_rate": 7.453545228053305e-08, + "loss": 0.389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.17397227883338928, + "step": 3865, + "valid_targets_mean": 2955.0, + "valid_targets_min": 544 + }, + { + "epoch": 6.838196286472148, + "grad_norm": 0.7586490896107623, + "learning_rate": 6.712796478940853e-08, + "loss": 0.4068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.16233235597610474, + "step": 3870, + "valid_targets_mean": 2807.6, + "valid_targets_min": 372 + }, + { + "epoch": 6.847038019451812, + "grad_norm": 0.6581619537458464, + "learning_rate": 6.010745849361011e-08, + "loss": 0.3891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.133625328540802, + "step": 3875, + "valid_targets_mean": 4207.5, + "valid_targets_min": 275 + }, + { + "epoch": 6.855879752431477, + "grad_norm": 0.7436096405016829, + "learning_rate": 5.347406969079982e-08, + "loss": 0.417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1265230029821396, + "step": 3880, + "valid_targets_mean": 2987.5, + "valid_targets_min": 346 + }, + { + "epoch": 6.864721485411141, + "grad_norm": 0.7763730599939348, + "learning_rate": 4.722792716306046e-08, + "loss": 0.3896, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20675580203533173, + "step": 3885, + "valid_targets_mean": 3732.2, + "valid_targets_min": 1566 + }, + { + "epoch": 6.873563218390805, + "grad_norm": 0.7715820038607789, + "learning_rate": 4.1369152174381975e-08, + "loss": 0.372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21535265445709229, + "step": 3890, + "valid_targets_mean": 3796.9, + "valid_targets_min": 674 + }, + { + "epoch": 6.882404951370469, + "grad_norm": 0.9019028296801088, + "learning_rate": 3.589785846832783e-08, + "loss": 0.3872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20554758608341217, + "step": 3895, + "valid_targets_mean": 2699.5, + "valid_targets_min": 889 + }, + { + "epoch": 6.891246684350133, + "grad_norm": 0.7944162594852624, + "learning_rate": 3.081415226579898e-08, + "loss": 0.3451, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.15075156092643738, + "step": 3900, + "valid_targets_mean": 2368.2, + "valid_targets_min": 783 + }, + { + "epoch": 6.900088417329797, + "grad_norm": 0.7617097376400151, + "learning_rate": 2.6118132263002193e-08, + "loss": 0.3851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1630379855632782, + "step": 3905, + "valid_targets_mean": 3169.9, + "valid_targets_min": 378 + }, + { + "epoch": 6.908930150309461, + "grad_norm": 0.7539821586393874, + "learning_rate": 2.18098896295027e-08, + "loss": 0.3911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14324209094047546, + "step": 3910, + "valid_targets_mean": 2474.1, + "valid_targets_min": 680 + }, + { + "epoch": 6.917771883289125, + "grad_norm": 0.797486908920383, + "learning_rate": 1.788950800648337e-08, + "loss": 0.3883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1615052968263626, + "step": 3915, + "valid_targets_mean": 2934.4, + "valid_targets_min": 354 + }, + { + "epoch": 6.926613616268789, + "grad_norm": 0.7651379607020341, + "learning_rate": 1.4357063505101576e-08, + "loss": 0.4133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.14266857504844666, + "step": 3920, + "valid_targets_mean": 2230.8, + "valid_targets_min": 395 + }, + { + "epoch": 6.9354553492484525, + "grad_norm": 0.7502594071352197, + "learning_rate": 1.1212624705014829e-08, + "loss": 0.4242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.321631520986557, + "step": 3925, + "valid_targets_mean": 3950.1, + "valid_targets_min": 335 + }, + { + "epoch": 6.9442970822281165, + "grad_norm": 0.6647778859131394, + "learning_rate": 8.456252653055164e-09, + "loss": 0.4284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.23882895708084106, + "step": 3930, + "valid_targets_mean": 3747.4, + "valid_targets_min": 556 + }, + { + "epoch": 6.95313881520778, + "grad_norm": 0.6155232006040645, + "learning_rate": 6.08800086204342e-09, + "loss": 0.3761, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1027369350194931, + "step": 3935, + "valid_targets_mean": 3219.8, + "valid_targets_min": 1858 + }, + { + "epoch": 6.961980548187444, + "grad_norm": 0.9711608387054405, + "learning_rate": 4.107915309743416e-09, + "loss": 0.4059, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.190896674990654, + "step": 3940, + "valid_targets_mean": 2195.4, + "valid_targets_min": 362 + }, + { + "epoch": 6.970822281167109, + "grad_norm": 0.7122188828888222, + "learning_rate": 2.516034437973769e-09, + "loss": 0.4263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.21069204807281494, + "step": 3945, + "valid_targets_mean": 3195.0, + "valid_targets_min": 411 + }, + { + "epoch": 6.979664014146772, + "grad_norm": 0.7376023644733862, + "learning_rate": 1.312389151861826e-09, + "loss": 0.4027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.25383979082107544, + "step": 3950, + "valid_targets_mean": 3817.6, + "valid_targets_min": 1252 + }, + { + "epoch": 6.988505747126437, + "grad_norm": 0.627582373951346, + "learning_rate": 4.970028192485821e-10, + "loss": 0.4011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.1778397411108017, + "step": 3955, + "valid_targets_mean": 3882.2, + "valid_targets_min": 411 + }, + { + "epoch": 6.997347480106101, + "grad_norm": 0.7920130024563453, + "learning_rate": 6.989127021794773e-11, + "loss": 0.392, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.20227769017219543, + "step": 3960, + "valid_targets_mean": 2815.9, + "valid_targets_min": 305 + }, + { + "epoch": 7.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.48488524556159973, + "step": 3962, + "total_flos": 9.02500960062931e+17, + "train_loss": 0.468742822619895, + "train_runtime": 33154.24, + "train_samples_per_second": 1.91, + "train_steps_per_second": 0.12, + "valid_targets_mean": 3460.0, + "valid_targets_min": 1632 + } + ], + "logging_steps": 5, + "max_steps": 3962, + "num_input_tokens_seen": 0, + "num_train_epochs": 7, + "save_steps": 1500, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 9.02500960062931e+17, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..e94b292 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a92ec062620d6e155a6b92bf41d4642681cdf122cae251832d20bc409036174 +size 8593 diff --git a/training_loss.png b/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..3bffd5291647e782947adf4bc1fafd06229fb434 GIT binary patch literal 46910 zcmdqJcQ}^+|2KZxL{@gPQ`ySiNu;DS?5&W!_qaq7p)@E$lw>B^v&@o}WN#vSWUt@z zrO)^NevkXOkKg_O{XX8GKD}M8^E%Jhcs?KNbv?MMsdo4f%OMQI4y#{KxrSl*I1IxZ zCMAZSh`0BT!~e;+o!51{?r7=eY36bpyKLs>WasE+cgLK=VLZTudDaK*?JRu6<7j;jg%F1RRUixbOA*5JM#Cpii$$kecENZ+`rv~(g}w|8(d!JmgS1fzj}+*w}! zaya-~fdDa11^#(OL7>FN#g(ENipK%Jpmm}KdlVKHmj1*Hy8ti${3?R+!0Xeum@ry& zfzuS&19)AA`TwoACo?AbEtB!6e_5OBi(f6z)XrAc*JpXC%FUy$tgfz}pSbT=y7+~> zJ=dfvUm>ye{X18G%|HD-Cr*qB2X0=9Fwu$O`JN!1UzfZ6gC`*Z`vC096ImhBw}M@^Ky49+qvS)7v+AZn!}5$t94)QkuPmdCe;iL zRkb%P^c7KcnFPw0ddwYCR8)l7Go9_u+gJ$PpUGRe&mIuwJXX&sBf~-*jCbnPsW=6H znJ9L}9H05)m!2nkE)0sWL{1G>$PW6i59IsD35K`c8EbxVhNLN0*s)V0A^Y36i{&r^ z-5<d}z^7z|mHPZ2@dJoIj_UgxxQ>+p{aj=z_ZX=dozTsPhpFBfktB>!=iW zaIeqZ=i=wTl((?GP!(M^UrO%3y;fJYP#HnPt!nx!OV4YyQ>S(JY?76q=F!{=5}a`5 zhIs|vFgzZqdW_Sbx3PtWHN7va61|CU-n?n$ZfBv8fAre*>%ro-zr_B?PP|JBxT~7_ zIp+8!5%=jEFg#>>dU{?s+`T`sC>IwMo$RwK3FT91|2=z|j&1~=-p_2-?a_wp_2NWb*~ z&l-oKv58oddU#iGTU%ScjpLZE@ZZcDDs{yk~I`IR`q#CBSI4s6YsuX*#@F_ ze(;2ZhJG0uVkaP`sP1#D5**r}ObQ%b>vL3t$uSdSp*eCSSa!ac;NHD^%L>Bfi}-B5 zv!a;N#fyh{)bH}BhkIlh6j55{Gsl_)NMF2oF}c%bsYQ07ah;KlPARpWLr#uWnbdoG zcYP>2E{8S(_BFp7cVcdYAOvG8Cmh4wD_y~`WaqXIbE(d_4FS2E>tj%jEs;T zI`rk|`|DbUhO7bMmy{= zpRugIb=s^hoStp6rz%iUsC0^JV{?;JL4hq7woh=EN8RKn@1*NbzJ{o=c@sW(@IZu# zVyY+q#Gu#M;ku!FJnAAZG&cTrT$!knoOE>`ttH!;a|}G!nkYXqGZV46=;XC+xUtfz zDC*EJ1#`p2$%&U+zI^DpkkRzgI=R@+7G9L|DLgzpDc9c=Ii=HlgoK0~r%%&HD{P&# zlQ@bEZ!C?4J$y)rp=If^ZB+Jc);5xI@w;Pjjv2e){Ks$CBO!{Vy}{VnY8BnQ0+xYeRmyu76R z{QVy%Cg#YjW#;9cKR4*RApdu+j}fZ0v$J!Ys6}XlRf;RcO4Kn~5ts1`XjYFOCyHPc ze!kxG!R%Z`ZtQmVr?H0Ub1^*SOZ7)}i=AG}$xZ&aBwY9Y`a6!0>L%f;han+^@V?P+ z{JAPxT8~qVhWyu$L79D6Tr9;zLHs5yZ4|cubH(c|H_tg!4>uahD()*QD?3d*(;2M} zA_(_SSa?-)pK1(hCTc`n+}umE`K`*NLD%1Dj-ZQPy-ICvZZ6_DDA&2xZC6OF$o(_X z3O0NAn>RdWr(cBdN7QlMy?eLzE)n^-eWp$>gHMGq&++3AVEY?GHM{WrrTC?X?25*N zlaZ2x)E4y*X@o2O#=yW))do{3oP+_YgC!O+;J~O%y41iP7#8nXsfSTJR&J(k?5wob z!F7cA`1r)T$NO#>3uxV&Pqn=sg^dv2FcVM#?duSh0xQ=1dz|R#E6+iiGnU_} zVX;0uCaWDF0Jqa)l|-fkT#nsXjy#qj7*Uq)eY zXvrA_9`*fgJ4f|(+kbC!@{6fRn5ad4W1wTpEgtS}JL6fET?03Ge z`^oxo@mjAf5w-;D{%dY?%J~RF%o%!a)7(C^>hYBws2FTXM9>ZHVjQYbtf!0vcimAL zi7;>|Ilr^J5E#3ze(@r$yzd%adwcun`*(@x_NjwOs2E~+PPN=V{h}6!M*#b**lYUz zyV}vZh&rhC=t)15u-_=>1*}kpaR^oIxGcf?egOOOoT2x`vr#}@&(`rcEWgKb4h2BF zMDKvb_^2q`q{?{Dms!LV7pE9liCQXpB6**`)X$zhTdr)W$_7jkE;;0PU2duN$d|4z z9e{}uqod~DRcO6qS3fc0&;W)-M$!vc?R@ltQlATTrKL948q0&Z2o_>L_KD8M{;y>jYr$n*q=E@vr1os?h^s z758`YslO~$9y??C5IV@Rc;NP&Q7?FH4E0jmYP6hf^GwfX0^&*gZD%TO%7PJaLXoeopc*MB+H@h(o z3Ng-QWHfXNI+)zX$J}+Y3+3FF%`cDhsMB`5yQ1@HKO-}TRN`~13Jxpo*LxfbL(MUxD}BMIh3ex@0&~UU7t4} zt$o1OYH{&mc$|pYT{QzJ6vlW;7^-!Ko&)YF>FF0%otY_!y@#NwA>4IxJ_(vrn@vGR zgQ}`(c)UZYdZj$zj_CF99y{-X--n)ef+IU8cs07Sygx81vpPQcWtMYBCC z+T7lbxYLp5op5f>QG3pHB#4BKI)>+gQJKfrzC+~X=XG`CMjcB|-Xlg|dL z`1q9i$wFnsuI@yZ`T*LXXLnGGVx>X1>A%|f#WMfYn!EoMSTNpx5)%^>WWk>~*u2MS zy!)UL3IM398>zWZKk0+Et#&5;i7Sb8P{cc~D3W330QcGK-70cyv5iLVXi{hz3efxO z_FAacH#WSqw6%F1_q(e0j$@5Ut_%_9RnDJ(5U{)TAR~j%y9$QV7^7~LUr#7+Ho(%m zX6P55Dei5Y!>$r$4=Usj`K?^WQyQO~^p&&JVPBJ8HoMPp? zU9|VGBBr`>lTclsu#fZ?oPH7;d*ZK8Me*Msm*@j!QIW)I zp_vLex&{OQ-MlhrDG`4jwpUnqc#PuYjBiCb5$^Hh$0={#s0{9nKe_U4KkMhupN)Oc zb}gYeop*OHD8D>+W)3z6eLz4!`0h&&?4LV7KlVSm2_z{ttNLn!Mxf8!0gPLARG3!MwS z1>`SYyzrWOeP6D=yEyH=QCUQ0W~SEFt2lC@VhoeZ8EGD@@O54uS3mFB0*L8Rd^|su zdH<(7N9v=FML_2=?MSQ+|rhj<%F8-!kW~cea;s{Kbe?_$W`uu>D%Q&e+$pix(1H-q5cnw}d zm#@dWi=9)|7(32U$%g>-8-@i{2bhX7zL_|pF2!e$JzxV5@u_m}mA1E+7)$!TywAw^ zHq*_L+CC*}D#yWr6%G1i`WfVQSpdUsY-~(lcP<@u?e%N@^X(b`>rNX{+g}28Ylsvm zlkNaTIhR6bTMhs->>b9Y7fepRtL#Ed!YoG^*R_(3khOfM8o`Ls9-aFl-#C1jf}z zvs1-4hejTi#K$W4wrnrNgg_q~OpToHqE|MBy6v?+R|M?9q_Kv%|MDvt`kmM?Q_fg3$VpwBtM~Ta>te}vP>YY2M;OD6uN9|{AwUP>KyS|v`A$oFc zXRaT_4q$)FUW$L*Wcq;)F56caMnjhXWd=?vzBQa2J6#TuOdP27(@IPDw*Ftzz`9$FNB@z zHAbET$M*1p6B&)%g0El&J|bstX8PkroIBjhn&^6%yc%J>~ffDuYaXtSldj5pF? zi!xfgCr_piHcZP6_T5(;_8K%iarp0aCwYa>D*mw72*C7f8ZS;085B9JZp4&Kr9@yD zV&{lN{hjHe0;=h9_%uiWxj~vxE=H-yFj`t#xf~jxkbqIHSH61kB(+#kN=nz64O+!| zLZXy2KG2?U#Qar36xe1C~QH>pgrQ(Kb0Kz#u`e;M0=f^o`0 za&^@;>WM2o3rp`*GRKJ%Bv3yNAh)Be$1IZ=%VD5+9m7jTrEW{zzXNuGcn!BI?*FxZ z_hco19!57TBI3H=qVEcT`PV5a_z?_(Utssox+|_%F{;P3WgAFtF4S$Ztk3pzjCC7V z_>90q-uWOH=}lQ)0;FpR(AWq7=PyUD$OT;zDk1DLbUln%#(8Wc>*MgwvIG+a5|Wmn zt#E(>2Y>}{Z#lNgbo%G}aOeK!Y^d=afO*hDhI=zz`Q6MGSfx3id)>x{4{B(a=-TB~ z&^5-M=@@^8X)=?DpP0)@I)mx=yi09X_oX0rONfr&rc_WiN> z>Q!7^dg;JwMXBSEg51jYGaG;2C0*6lPV279a}Ik67-)4@erC^Rf?4c;fC(${^n zKr(@U*!qknuS<#lWgdxiXnrY<6coCB!CRJ=qrh^l#JSf(k2+KX99-(Qh~^X&JPZ^5 zp>M8u_G1&vF8fy~UCuqXV^0ls!<-`Ztv>STxoTD}3$#eKAUVS8%(cSyfYOEYgvKD#lgxPOX-AIi~(9=pb-rgJxLJT1?yGe2u) z#yL7VN;io>%%sO*7IO;=`gK90(i@`EshobA$6l^TXSWhi$>D$ojzY!w5=O&~numIf zoB|_D=KI{FqJ|;e78|0L>hkw2D?5F29vX2XcpwfIPgk}Gm!~m_+t7I|3`P=>GYrE> zS>I^$sucSzy;$GX#R$N!c58Je&%EwXmVUvZrssk+P(&YgX6l^F>`eLikro8v#SKkw zXnP{JztIVR!hz-|(SJ?v`zu*S#ofP0h!3;;6o_s%x^B{R_^3o9URR>L?~Q%3YaIzh zMSvzk036_3G(^?GklgR?*4^0HFa=PtF|@yH;$2l=&Mh zLqY~iWOs?{iM_q`sw8*Izkb(zH71uOdvr_NQ`LOG&pKb}BzROt0!tn8+Yas;{%TSJ+nY**Kn%l;;5Hl2r{ahVnM$=g%8E8)MNY z`S@%^l3`Ge8vD+P8+wi0L!07*!+=b*hS2cl=Bbcs7)w#pY7BGFT>{1^_c7-_<*{q! zBrWItbAv!LJ|1g$7u6D^=O#$IE`sW30TLGz^i1HRCp!7aabwcHRba&A@xlPKWCJB%a5ZlsJYBYlR8LfX{vpoVvGNj=1_vEaH?-T8p zi)+QGyE8?qqT5HLaSc|z&um|tZ98?>`gLHa6LSm^M1aKDCPB_$ZnQq8;K!t7^ep7L zp}%EK=;4zB0<}PUgQ0DH>pOGiOzUQUx*^)BtZ(LZlT?a z{^MEg)<_QnF2*h{E*_pIcl-A35Bk~Ru1JdmHn8_4XTb+s1d@MJn^^CYHBFXw=FV9O zfDMF1L}t)PGWf#)k7p)!odVGu);#KzSAmKyEX^Ao!C8F&1q_ZDT31O~6O;#!0lU7! z!@$P0+}uq-3?(HeU)gB&Yfm}9xUwRf$u$fToX$?MRqjTD#E`2Dh~3?G5(2s(l=AjL ztOA9I&ZKy6Z!hDmJz)2Sp{(A?FSQSj=7=NiBLCMDX#}7a(&nD3f*us&wYa!g|Uw zETJW#WUYRB>iUfcu|S|mCxwM$9Rs2NG`6%nH|Ybgz`@6N2qZ-99q#2CD#c+C`I@yG zhx)7veaR@3=aV?Bd;tePK))y>qd)lWc%#`B=e4>kL_yy~a1t<<=b*RR zl2ojK-rXNRu0^ju>9nZ>)+0Prs4L*Lzq?Mu%>3Z*-@iWWU7N`a_d#Lpl*zf=87Fm8 zLW1GWojXVZr{A6(C}V^k;qZe`DzdZ9Dnzmru1W%e{&FaAvMkVPv>Hg92=!4rhtYWS z{CVh~j(6N}30RP|Pzx48V&Xb^k`&cQ7{$<+FIj3E8Z1EA&Ujq361fDQGL{zaa5p-d zDox|XU3z|PQ;-S5MSV0|hUdYm2@fhpZ$&l@(9Eu*_^j?;mMsYnW^$|8pb6vPp#UmV zW@|^FIl`tZ*oM8v5L-a{u+vlKciMl4Wj^X z*&Ki%bdskHvH9C8TL^0a08|5=TND&&xZyDn!hxO01Iin}{dFFQ`_pI7%s?~6ALI9-9V)(H%7^KTK9Kaz5hJ_M@(Qyo!ZYcjsTdbhc(tE(5 z$ktkdv9SQLw)po;TT>CHMOanbLPC_TlP&f?R@uQ&+5t51*<^2-u^*YS;3#~(^#%Io zBG?oo$o~inL%vl=pF`QTzp0H&~ zf=FQE^XIr-e=!YWNY}2>E-x=H0=MSmPnu6(48X@nkEjKV%b9?Kp#fYRsi9|ohWY0z^j=+3ac129x}K*l@ z8-d?BYi!KMAY>SZV0ir@$=?Om7jE6+N%UJ*M@$9vJSVtvV^YVt`;<2|bO~5%@{Rph zZ?Y-|fVTa&`s3}U55DUTeo&{Ew>J!pbJJL)U3iqwof8Ey1Z)BF7@iUEvmBr2bO21n zS!}e!(u@Lcb{G^Wm76!8mH(XG)Sb?K-AbAZ%dxuYr&R!C zc!7m@BUdnl8d?LsgZQt2%?U<4CDp)ec6~&l8-W%l@K81N!sW~KNQ&;R z^e=0WHoEj&3a)a=(6w2dOHR%ZT$;yEpYk{qj}Yepgz!$<->%v}0xgFTG;ig19S_>t zu8Icic$N5tKLPO#DgEe4f!fl7YtD7*lzPASFRg%l zByM@A$k8O);;8Ji#MV12itm)AzU9b)(7+`mqzSk&3|L15gbN17^r3drLDi$LtgOVx z?MRv!8VbO|6arID1s*R>$~nbp-_Xfl^ObuKaJ}0864wJw77GL6v92=Gd-vx>KhoF6 zIky1ngI{elwd%9EG7eRZ9xB4pR=?lQQUgNm$aO%E1(ISOfVa&(Fq4q}8VyG4(G&2$ z$t5}P=ANX$#z&767Dg%xfB@*2Iu(8K^VO7Cu*G#rJwvgWJs~R6L9iA|5~Rs9NZzLI{|gXXYxf zmDE1x{D@i^>c93w7V(SVKZYkKbD-w{$Q)3o(9+dfVHaJrUcSA4{<;G9jU=meawMoD z`zEw63b1&Z=rf=hG34Q}5)eG)sr8T(wqswF}7nS*t17q?AoMn(qR6G151 zC_G~UEnQHdrVT_PSUR0=b1?iJ@Zr&7^vQ-oi_-^}n zZRP!^PdD7}MrW?*ZMU6LRID0Ybz1fD&wS2pbNT%F^Tsnp_)%Yv589{|>Z~%};O25c zp$R|e9mophP^TrPVtWXP>*O~<>VnYQP0zhG#GH$ujv#s=*ulXF`<_E#_iu;KI!&|g zP;)%cieCn-0sY0!AS%{)JE|GDHH&u*114GX3A}dgT0Z@%13ynY?Sc#>z*bJm${q!K zG}AK)SqO)e1aI%}?E=!z@J#xh@j@>Nn0CRS#w}QAaz{$?d-5#QD)@(BUd?}|YYBFz ztVI7OLDo@Rhles^={3Vl)vl&ReUG0#yH{PU)Z)a=#bpD21mICMLqk@vmn|>IEif-i z&|x3N#dY^KbHHunJ5B#Q<^49cB@}O1+DWKC0R9sYdx48Bx}@m0Z{Of|PX)nYEKxEmT*@iZXpY#RYWQ^XijdeYu zJc2nu(}l$>1JxmDcGk`h1kGZA-sSU2py46SwXevr0ns%OVaq`P6#QijPjXa%f&62B zzLuU|Pw(Z|mViVM$(~x>`sHvj{-+tf5~MhS2uMbwWaq2Jy9_&q_aM81Bss9H7NPJK zDv>`3OV7^hn``|39n1)*9IStRD$9!V4-OILq4SO>VixVT*um8la2~ zPVGK<@&q9W0!#sL(@LiR+)oYM59Bpyj~p49ob2jter-8AGegeK&Yl3G8eC5`HLoE4 z=Wh`nUWofeGp9t|&%LuNqe1-PcwDn3{JZG^*(CnLP#EW_SrIvhyCtrZTp-QujmT6( z5-<_Pzkp-f{t!i37=U=MwH-;sg^6*O7r`A!fu+4C4Iw96Ntpcfc4SvVUMEMr0ji*+ z*XBfQ>-C8Af)C`yWE8{%6vXFjC4=Gj)I+F2lp!T0Rf2z>L>(q4m%Wmm^6RJBX&mtB z?h0Q?*zAWf7>HVEK}h4rqGkuc!KH7ITF*^SR|*JFKnlz5_Ii<9$IVxK8MS)?QKFDp zbcfN-w`^9vaf1$We5%oGkpK&hVXzU1LBd9Y{GUI6pd@aX4#r@YxfSd!SBM?}HJD`dysZ zoof+AM$Kv5MBV-wgx(XK*#mSiQ*}1^Mc=Mmmq+**I@%JzZS%>NS5qJ@04xgw?&zI# zBGC(ff1^RsX}B7Xf=Q%$j1^i1AHw~p*l&R23GP+sL{qG!*PQptZ!?HUps3y6T2a*q zgRA5D+YVJ&|MzyZ%7ZhdkQH-wsDR%t~=!zk}CUKDZCBd)Z|=?iZ%~up_`X zD5Hl2X>g}yLsemt!!z3<5gt4l`?2NIyidpw=|W($s~RP$PzM*#`$z~VkO(UWIRcrC zT`Ncj@LK+Q0y+K!7=wT=4onIOuU+*gyd&Ug9mUiN7eI(bI$1k}cd+U+t#aH8@h~4i z4d_e)HjlFf?kuUwE6D82Xkgu1dUKceb0NPfQwRvp=l) z5yS<+Q#Q+EZ&vQ(nI5$&DB2Y`PNSvvy2Hk)=23`tnTPAj`nuzqD}Iz|$1@&vm$qVH z_dC$qQ63@;a0F~7CUnoBmwFoaDqFp)d5AZgo+W{zw1VpIIzPcQLl_6Z%osqeXGNVq ze-48!r3Qe2#XSm80Cc#fBWhT+Wxg4#fXg-!WuUHcpE^Z$MR8Xwl!Ey#Y>_dL6(-#@ zZ34byh0YR|kk)OCgdo*?)qa57TDJx07UyDxj23%sb6n3P7L+ctju!toOT8{o@tBzvfCu!}%9s zomhaMBof~oC+B?{37x3qSoy=l#8^{ZH|tCP_z|V;Qa^qAq(@TJJBM$wH?Mn}NBjqS zO z*PU-g^()6H0vyO9^vf2+9}c_BJ+&f+W!Mr6M7vJId|ECJ&n`IR(g~4+u(gc?1=h#W zMUni<)eSYZ7owP5@Ik)1eX|z(aQK=BUXl4Z^vXGNtef~0Z;%K93S&1vL}T4MXFJJ5 z4RG7W5?zMjE|l{ql%j07sbkbRJGl$R7;>RMW+&$an6SdLv-t1}YrlcoKH?!O^IUM4 zOS{S~0-s1&hJ#8yC3o-{P1Pp}l;NTn3M98x1qPy^86+x!V*o*pDKnh>{vsG4BIF2$ z-^Lo>1!)5SSm=ijB0M}iNL3DBnd`|XVKni}^Q-ioFCl>)v%Cvq4;B&709v5pNPoEr zTJZY2H*YWuv};00(2m?=rVJnOeriQIIY9N*0_Humu4YGO%#D19n$+5LN1i_%Sk% zA&g}Xf9(z_X(KCP*SoqUMAF`@5dw6B7r{4@fYmcw*RKz_vX^x~L!!pa9Pp z0%ib{j-fLV*r4}eds+YwKsidZWI%y}z1}ou1lkQ)4|#y(fE3d~1d02{j~@rx0fyux z=xt+=UVt1IYvt~mfuTpwZM5o2Jr|Z(|H(O|7gj3!{Ke&V*rd_SmhZiuvlW*)wcl8gX@@gT_1X3cucAKXCHWCD z0JTRJMenTJjk0)(LqUt%yfF z@7o7HWM7Wqf!jU=&+-Kr&wU`=2nt)d=Rk2AdvZk~2r5B7u4-?KA1qa$wb=*2=xXcg zMxa~Ofq^tWhPDsIQ3(ocTr^O^prigOC5srTMEqeGEyz?q>{^o!Hh4D_u$`^m#d-W- z{P8#<&K{w8oQXCXi1HwR$fEg#j0rK|U+{p}^s^?Z_p1ooOFvm6j{&6eU;i%}{R(dwGPQ zS|ZFHy=%(v;FSj7@4&NOnFxfnFD;5^v%~9+%!{4fvyH-%E0;A?+!Cc?PiAIi*-bpZ z>grmVHs93t_}sScLK+RS24N8$13at*W%{7Xxp&@NWy=S&{ykA1@zQhV=3I&1znPJ2 zEBIq@i*$r^Z*YH;>Ep%B$1H!M9khb72L!lMC?T%H1qmXwL0O3&A6K`T&~7iGR!#=A z13x1rBU{oniDL!0Xnpzx3PtogHylG^F-yPVnKMU_ya}O@`!FX-An6>NFP#ypt*-~$ z?3W&Cc~te_nYWF6*~FNgym3es#Y5W(3E-O=kaoj3NP>QfLVIk?74)7K!9yDQ;G5%4 z5Z!zTt|w{tK7f!-Q6SSBmL!5q|I0E9@nYY`N zUa7u2jJdkFKrSS^n*qWh0Gc2|@wuz3Ym6zsha$g6U`U8xR`G>&*$3{TEd5HOTOX?( z7~8C+gzmw#wj8s8_$U{|w@I)o3Y$F8Z6=aHxq1~_D19Q3kjafyOe*G64)a+67%8spcgk>T z;QymMQeieE^tn|ZF8VzDYzhf{siDi~H0?2_=}Cez>|3+;`16~oCVq?FRWQsn?taI3 z33S1}fLM(M&|-}BwlU&@p!xGYj# zp-1h`R5f}zUx$WarW2hS`(2+gyGY9{9SB|{6?N(@~rQg$Te`Gq(K_&(1hZF1*@#Z_kkP2+1fJH82`-;TmTbxV89gW;-POJG^!KEU`@+~xs4nzdkU zJ%_*l`zR9lC|&y<62%H`0$u&D2S){4j-lI2b#D5v+r@+b&XU**t~x`YTc`Km7ougQ zNzNUVCXZuQf{&E(1oSFmMcmd}EeiZc<)I6(3hi%zrg1_Q4Y+ zxc_u%z^yf6F2s-cgQ#K5R?M*O&=L~d?E}3hof*CQrdOw7>N}?WONq2S{J)>=cOu@W zULp+!16v6wSYa|48Z=khFm3L$xnn8^aGLGlhB&RuFl9e~OsX^p{bCCddYVEKCX9M? zk`%inO@juqg$6zI7%d+0_GxrJGUfMYD3l$=x3J(IA`Jx9Lts3Azr>?(A;#TIAXJ7Q zO@^W&c2>tDX0|QEy}(0na|O5`=~|CFTPcGfoDM%}KtJ&ykUfL@&kyRb580W`7%|H+ z=IW1pw)_%Eppn6c`%gGSFy-h(h?}tVzysZ@y#$7%Ub+F>nz1FQwmGQhQ~fX|V{)f) z2O~7a3iCgf@D|(stB)z^-8>vZo!t#{!DX`mgYOJ`BIz>?ray<@DZcj04xRTbaD_pU zvcjfjQlI4qO>`!ZqDQgHJx7ECl&0e1avJ(FNZ3)(KD`HufN>+dkD?K9009|-`UM$8 z27OXFGk7FFqX-1Xqz>ku1WKAA&}+-q#7Iyh*-%^yZ7c9Y08qc5-~WE56?MS|bP^B2 z-^%Uz8tCwmfCmelnr0@yZ}prv61D#KjD{eMIqmIi7K56ATsDyBNxO-f=1b}(*Kj&A96UkxC%l)xKw3h-cw+U54YyL6QDa@Q^bxdoTh8An#RM71ks1h) zvZ)Wi4!G9QP=V9gEF|LL(dhdCQY--`_o|5Mu~XI4doeoc=Ng4ahfliXDn!z7uv=bL zP|{!wbaX)10jB8Z$pcoAmX^+F&`6M?L8%T1VSqY{q!A>MfjPhC^Xk7eH+48a_N(Ew zDz_&ddC2Ar9#+SjLxNToj6EUFY78<`s!#&a2@5b#AXI+@((d&b1I>f^5*64e24C0t(aP2OL($_ZS!Ub7mC`)P_>`nQ?oddME+}38`uM zU)Ew=aHI|L)u0)RBN($X(9iq+D8b3NgJo~|+IEguEEY*(y`SzdoxVj1+%6R2ALJk$ z!E=ycNF!KUT8fkP6v9m5y6C_f;zYl{Gb2p^GG<<26B(?Sc{ve7BmIY6^pHdfR8j>r zK{(|g4d(|qAd?0VE9OLKf}Hm?(aPM?QkGV^6$)@rsHv%ONM{0jQ4OMH{POtjE$SQ+ zWlGlen6B>Uf3+=<2e!yS*jh$b76sVjCj|xN9mnvBEa^sdE6E6G?{cbFk9!83Ev{md zO?>5KoTCPXti7Oi-P53pvmW!fC6hgN{9`ZC=s7<;>>e+9hOJ$84`{VqHVtUQDd?-Q zf9SMS`;beugLb6H9d}y^FtWmWMbY*y^q@}e6aw9U)FvONcl_r6d~0d%1Agszi}bWJ zm|V@jd!>b%q&Yc@U)YC-EpbMzM*OQW`A|S2SD-xC6U&~)^&DqC&=RbWhV{<93HxS& zUHZ>20@#b}DAB;j!xi@mnMNH<)xo=6iE)L!n8@I51`%5?RB3ulQKcb2+x0UF?;)kj zEiBV^_GD&Zp?(?MeEKe+!TPU8)e;R%N~zHdXH^?$TfA@oD;<{)>Knt|Lh?qVO05FD z>T(y?%z}ewMr|$O3`RIzkEcq+f??hh2u{*yb)cg4>6#IydvyQn7`F25-y%x0fKRz2 zmV=kZDLDSAA_qVD#Ih=6`lOEd$&1W`e$#<2#iQOs#A@31`ARNPwevye za)TO)m(7YD@{Z4E;IP7n5z@L2H%-#tRE@d6HT}>1!l+PM_t#_i|0$x;c&4($Sp-ut zn97ahRPwmDrfBfq!@?lw?bT6#j7MS4i2D7jW5l>Q+?&&6Zye-J4=TOZ!Hs-!xNV9n z6&mh8{cri-LGNUN9ZLQ0L3^MbP)apb7sDLoG-JEteHV}%w%)PK^@=ty>-x&ShIzts$-{{cQA{_i1gPx)L@fI0m7DC@8`efWQ7!=7aXZYaa>lc`W3_<=H_ z3yBTh%P+@QWx$Ala9ViM^W>YS2newDf+tGL{JO-bkF#9q>OE{t33L*4ldz~LZM*2G zsQS;rBsZf=;C3Jrj|1Q794TIAXE=1X+(DsX=n&|PlHIRD$cIS>ODM$&~q%^GO}hWfnDB`|PUxW2gS7Am=uibN#AW{j`6{qNKI+ZT<4m zO2)l>sw6vwsBK}5x*_2i_rYEz=qXyCenLR zW>@$4Hdprn{Jadf@|cq#LH_m)vdSKB;&?d4BG_mbDGq@O4C1*DKF z8HrBa1*8h_;-?ha)RW`4yEt*bS=0hQB;bkZ^&0Lfqox&)Dh!}Reyj6wjY?{mbzZNQ zLt){qd^BdSP<@kXz%oR)tZ7W0p1R(WJYXxtP?VLfeZ@*$p5GnOFh$p)fPxn1`rSn8 zU#&a>H*{j>aN^97J{uDJk4$2)^27mmdzfD}Pj8UOWW{7o<2L`nVO6M4n$|arPgxO* z$TX5-jY98jzVf1~gG$<~wsZ|bXG^RsWD^h5q}M65jz_oV54Wb7PJ~;7uF%emF^C?t zz{Ai$G}GPj%B-;bi}*fX(_px{h6n@rf){vA6J1h_k0!a( zSaMMK_!oBUQQb8W^a}8hITe2k439&omJxeoq(5M84?~o)_5ixW>s}&(Y5eLqQ#H}4 z9~mq+^s@w!)5~RZUtb>Efpj7Yk8iF)?jj0&%ZIGewD2Vu)^*Pd1T*d>8`WdP%>LA- zZFtzni*ZEgTU-|4Z3&=``uQIlhy{D=Gy47zaDq4i5273ze^JidRYAhJ7(Bx1k2qEm zWIC+27kCh8zLL2I2`@bCxv)tT$}%GJ27SE;e5c0;_oH2*FpLIs-!PF=->KAA_?%MO z2su99W>JOr&uL~_VUW(hs;f(i!BJ&#NMm6b#HG?R%z2yC1qrNkv~spa63G0@AK9YT z`Pef%5idc+3?E4^6rdkMn7{sw`V$O8A`tAv8Ht?3TKojp&9pVwE_e{*h|(DD!24(l zuD}}&i=8;p;ewqVKR-w>l2TETV333)Km{Eh&wja6)>vY_r_!BS>0rH&8^P_t*_#ih zpYfyT(6@W=e@gQw71>DsX0H0Sju?1B&*zY<4Yyuq#n_N?a+J6qU63{ke{%j=T-ym2 zAEV5MJv5CM_2mztGgv4cwz&qw`WVa(IH62bS7-Q3BQiIdLH{rZ;Z;40Cq=SWcsiZk zR}J;Xocj~cygiwn@p+_wnZcGHJ%W5T8>Rp@9VAHzFwh}LqUDxJp^Jok|E>YGuI!mX zm&6^OM&@!B+W{5oV9kg|B?8>mrO(ATqhS(LG}Af>s^M1=1Hu-;_C;S$Lk^x=Ftp=Q z_zoEBiC+bv@}A9fE_YL$Z9ZFYiJ`58r=R&3K3X5bus)y~r)Rl671V=dybv7k!Ia?e zQUWv2adrH^y`@Y3+aISB-wBxofco7tm?Zlw{4{$02cLW}DWAXAs2)S)?lkoKQ26Q$ z0*sPf0lt19MBBlr@6BVLDKU59SGL4X8bzd7^%atpa<*1vz@@Zg!+pac2^49}%&q(a zIaq3Tb}DQGRCp&y8Wy8ktH!cb?@}wBy?1_9?x6Ne_v=?sa$qRe4QDYRVvS+wiyDx* z^GV-6wKWeyV(9sSde+0IpyTAoDUx!VqE1Okkz3mbrP(y^C(#8svIhsiIpAE`mTREW z{O2@tH5`&o zfp6?Vs&M7z@1ux4qH}5O5a9!}I;(y1#s44N0nZM4c%vd{SwTrjCh?S@u;@!CyB@2z z$|q-Sbk^9Cx^8$coufga&JI(ITpCc!#iv>S z&!`BTYZMYkF>1(PcKL&^2N@nZ#q9dy_@Bt}Mo#B*mliUZI+T>WH8_vzg%U`kK-kZq za}y!=?tSfpZxmRH4%{I?EIzdbj(uX_oq!ctw+4Rz#}o6~f#voAj?DK%7;bf563z>O zOWdRgU!M|bGqh>yNw#6?_dBitBpB|PoSRiXSsHSki&gLYIcdXX1YhI|e6Wq!svRO! z4htOy4r%p0+XN+k1j!X}u&zDb6`n{51ZnufhCF#mNk$NgSJ`Y&zd-&KpCyOye^Ki@ zg281W->UlNlpoWu#xYS~8)I(oQ*4nOL26BaHw>rRgCVa8kvx1r)bKC*?hptVFTx^& zq4%j^gD?wbNiZoG(d(NKQGqa&NY)I6U^-)6trOeAcoqh6r$sk=;$IU;UJp@#SOD~fUSLQKi^E2Su zk=U#_X;)q_Q{Vdxfz}{bxC#$sM4~FR#12biY>MVs82kFfH=@)5_B3kzlG~P`xxDTw z*t&qB)qggd7Av*fn3`3OA&eZCCZ@(p)kyHMsPUWF)#s6TPzfhcWXEjJ$M9F~-h+dR zm?yH@(Q-#@TJHy2J06CEhtAMz`Hp`COKyBqX^fDOyCFa=>Bv}z<)@^9*5b6^GP4`` zC4Fy^LP1Mk0m#yFr=t8W@hgU}BT#L3dv0HS9*!tl3&a3q-#rIPa_wIEvJHg>1s*ml zqctl^hNMXupwV*)+P5i&TkkLDc?7ckc*2@_4@ye^k7jt56bX1Y$!`kGGf7}6{YZE1 zAz4(v!SAt~{FaeryfDMSj8h7xj6W_M&PE z&c8;t=?WMssOMgF#}l8LsnnoO-Vb|M*)$n-KJriiBs&3QpWuj77U}8r={*d0z>1(=+rK5+1!}0KATx^P|v|U^2jmqd(^c(3)W3N@hfeD z;41@{j2b6~&_jyDL-ylBsB_oh?KVwSZjq#qirAYnrH20dA$d7WGX*zYI+MNrKBOeX z#-GJ&85?!HybLMC6m0;=1V`{c^v+>8ESR!Gm6w~Z4NeU=N)}jlpeLpm#b&GFqb2s9 zxJUja!R!=2PmG{X<|oD-i!)LJy2KJgM-2P)2HAIQ16wg9VdygxR7ZWkO&fOI?gI@} zZrwS2;lL_(W}*aYkWGK~h`==oL*$6t)MI!k=0|neT7+=X61NLg|NA4uH5j_@O_n;| zF}h1%lz%b9w6OOBfcT62(y~wt(o;JCjZN)r3Z|0!kIIpsUymZYd-h#W&vYYYj{Ktt zW6`rxFLi=;^=^k97Uk;hQfr|@9HHS0g(-OONQ_OAzFP}!AdC+G8ff@P?!fTS zYJj;rLmS1>c8aT-W50443!&mUi_b;V5(Xq;ZwdZ=9pbpP~}$N=sQ2))D=g^ftxkSar2Z154HXW@(~mP^3bvX69Mk+576d7S1alRIut8lhYORCfY_F<9T=C zTz|1J3HU-1f22^+0Xsq#2NPQCb5(AuUK(Gii}Zt<8wMyP-cM6KMx@eH3^NVXX4WV; zbI)kv`OUFy#gBP~4}uKu^@M*pMDEh`T|nY8jK?9F8(6W^h%$T&O^vk}`X+{pgMZ6}6|W_Av%dpsm#eMH?q?)v-r3!2dx zu;e@vPOcU2UvMD8l0STLtr*#IauJ2;oI!>sxbGtHokMc_J1gk$C^04LLFi3b_=fk>`?%1sfSAej+~ggkqb91F6Rb8us%?afZTeUu_i2 zW?#*`p(PGRYcm&&I;5LJe~N_8lX@jdLATsX6rwep&{76{Cm>=hl8C{N7>y5k7%4W_sCTTX@!l=xY5eAhr4|)S=0t+4#`Iy$r#~- z%Jk|AsN0`(1>k5n2}u9Kjvdxw=-_3cT~CV7cjVWjP7L3*q2%T!2EFS($Sff9d;c#t z;GO*AH=*m!ES-X^d&GiY2q-pY7KMNjIt)}t8l8GmS|19nAZj8WSSP)nqIMjBcN=f` zOo5Xpam|+J;G18}ec{r;c5Xy}{r~9t>ZqurZ{MLoK)SmWDFJDur3C42X@`!XJ48tl z2?=Q#>F!Pm2?d63r5mL2o%!9j?z-=-_x@1V!qGL~IOpvBsr~(XC(yTJfT{;jrfa~X z-iNe#g3KzPw$cAV)C%pci!7tYN#Y;saDrwMCpSL!bt1>lS3;PYseP$ z1`c)~rTl-IAMXEf2_XKD1^59O0*+9C4$=+49&1QT7l6qAFO&$k{&E3>(lc&JzbMgS zT=Y>2rKeHErD)iID2Utm{l(Go2mAAqy0CpOn?K{D*Z_!v_rd-L*)ZhJ`rl*&;JJ|o zIXz=x|9Vi#ejgkR?aPxanX=$z1U&NbuO*X7PU7R-c5H#2l@bJ_Q13hGd^-zv<&Ui# zfUd_-}Cagb*ah1)6I@pfY>%kX9rFNk08gngbB#1+Bn%v7C^X$NV2de843yGV>C= zQ^*Bcc1~!Nsj!|#mUqlA{$jJbAXBX*aR8nEDX$E6PX8aO)^D)w=D(zy$-12UQCw)C zNtisLmSQiBYXMf6#O&+@WYh=Xosjn6V%?IB_e>!4CPG1*;_%Uh8vt3+LqG&2GRdj zVbnHZB4A^cVi+A5%zHUv9EeSjaEJmZ1F+RfMwNvEfRD7Xl=dgpqfl(7%2R7TW>h?- z2Ny2;f4~_6D}{WZeOnm8#5Y1v)zz=Cf0({SGs%W70oDIE-i-0~TjIS^+}S`?0Lh4+ zc>A0i_2Xz&$^|x3{jZ{W8k&cw+;?k}1~bg^to$Vbc4Y=@ufMf@TfMH3dD z4cG}cW|xPOt!)R`YNVfC^D2p3)KVa>p25!IW(6|{3Hst%AM?OM7T3UXYUAes)Iv&b zl%jLSV9#?JX1f#^xW6X6?243N{_O-9te_?;e|3b-J=D=Flc!wPFj?2F^~ZrB$5$4Q ztXED|u<`-57cZPh(4@7{{n9b{L)4xS-8a^{;C+o#(xN^6+swj?5aIVrCa2*T(Mzy$ zC>`QTtKk|+TyS^v9wzq^5d6QK>f4}J$|w)c5Bhq6^#px###`>NEVO(*@kFp(3i%+c z@|YDweA!Wq<_xTFuU>2YGk|nn1lwAHV{WL#fjaAWE+~)Z)K1Uv)rKRfPTKKQ{I8j8 z-RYyz&BWaTin?SiWD!OUuFLj%lo{el{ecj*Q*-_*rtI<2@59Hx9nF*b-hw)RWqDq` z3t9vI+b0kIOk&tZ^342uj>rk1ZE}(u-xxhU~tQUm?RiJT{w@h}Ug?xjn$BzepC%(uD z%%hW+&=u+mzQYrMFCBuEBz>Xn%rm_=*7q&%<Ow*?aqA;6bHejk9BRwpk2y#-bH-?`>Ta5rtz! zhfEZUFIgkpjPb-5<*6r5&`id9Rj}Th#gXOnsFQIPF^KZ&{dblGNis=xqCFB_=<(OjA6_paWH!2b(f+vm!>GKdGzCzF$Xvi#+4P za>x-xA}m(&@-Q3JxP~9}&EmGCS=1)I@`Eb*(1JTkDZ&B*b;eBf_6^O)vm8FylvklR zZx)wVb@8Czp8YtrTX71DGGe2?fTe(D#E2NYP-?fXF)EMF6S{IU-D!t~1&8ZEGIVw$ z>XVOsZ~lu(JdX$_hit!?l#xrjuj&)jurjtTqQNJ!2k7zX*{bf)tkx-251Q z1_{}XVii!isJx&K{xVOaZB_L|)s{0>(x|UG2$VTXuEf|f+G8z@z3K_~I9=S+DeZ1u zX)rhMtH0nNhnH8a>Sz|`!E5Fme`h_8NlbM4*z(@gO7bFXQYhJQphb<`>a+^=HbwK@ zuf81;u^p@P>fXhxgMDrx!=uFmuG>oCn_DwvBLhJANsH}Nk0P@W{AhK%6uRe5`xO2{p&f^YfI^^Y zafv?!YTEfj6mxvm>7e}&cshx~co1c(m2bUl+;kAsc(y;xXn2*l7RLM6odYMFt@YbL zlgMGxk3p_$w7?%Sw3q3CsR4mIzr7C7t3b)w^cqEBV$PfHg?u1=792U}Q>RC*H_bA~ zH+cJj#Mwp25B8jKkyinUA4eUm749*r5y6JCC@j z1~h}gOR0kg!THGAwVV^F#=k>E4Pse%6F~##i z+b9lg)&>YV98^ER^|0quZpLiOR{oSOf=w<94NV#AmyS^S% z0#FEFxm^L`?$O^kg~K$)g#8}Vuo1B8(`rs2_fX&dh!y0(~PmD_9ct~aq71l?KBiYa9D@lW`*Rp1<7z_wDSQN71n2~ zDEqErAdnj8Xv*O=KWB@6-N%SVLi64!`gND11uO`tqv_`%Id-ay&Q#MFwk7!H2y*B8 zSq#1XA2M&8W=Sqo3ud8m0JWEDBj0`aXAQh82h>T-hx(?!8oA~N^O}u9MxECI6vNIg zJj|J~(a80B6J{ATB;;ZRX)8l^dy|=z5Uu<-0>qf!IJ#|5nL9&{1M`kMjMbaz@)ukz zmnlE#A}o5k0;Z-!C-HWO!>BVtOd-n$?&zVM7k?PVzP~F^L}4$5m;AdhR$#inu_KRw zScb)Zf8v2|k8CTsdy-c2r*h`z8mT(UpG9VIMmkCz%%qU6CUie|_V!oVmU{?0S>lCqrM<;;OC*n9YpzKpL%Bw*jC`e-#&_3 zE#$n(^VfkmdW9wg4fgi;T)~UESG63gE&9GVioSEl42EbJ>4t*?5CR!0hU!#ob9Lp_ z=S8uKPCra>K@-t2{?ec9pz1GBfeIF>&f_EjJ0^Ri-~gx@(3F03Qx&}0B8dYp^6UF+ zzYBfNxV52`d<+dVrcX6)Flv0~Hb$J7V9B?8KcS^_so`LAa$6sNQ7ZlcE5p>nHI)$k z>e@oi$*EIAih)#rdS%pMbg!z^z|Q$J2~(3a>9_$6E&P zJ1!PIzUZGhNCaJn#rPZ7`FGZofdWW^rd2Qs1#(j}RB5R$G)?!trvz;B1A(GQ;Xl9% z1M1cVkmy3np(I+#V*E0H^u~=7e(Ck9SjyPiiGN`qpIe_l_V$Vyagih-6&q+drQK}s zgG7xQK4tYm6~CpHJ_hBi+6Y9e#{R%^V)WD(m-G%_(#J=Zz?wYmX!R?e?@dlGA>K>8 zzTC_QBdu^6@PrAaB+Av*dpA3>I-e@yjz1G4GV$jxe0^8!LM0uj2g{*DpV3oQq zemPwxBshFs{i{M@#!OvXd5v#YO?)KbrK>h(G^YbETm`#X9;2Dg*gN*?6O^3cawv%j z@^XN#6&!dn@63C;M3Lg#5pb+4tKfxJn1$E&et1N;$^DOvWbgY9EWx?47jK1K(Zj}w z7VPtlwdw-p^t1$V3SkM;RmJb0t!z_~yaP{N$I#KB@*W=0+F>TDaGZ!Ean$>}jaR@> zwC2)6O>}AAmGm>lqdigW2PN~4i`w$Zpu00cl}^RWnTmhLri+9QH&Q;ou9~abRzg{5 zQi~Ry_c1Dy%zFm;!SU^HV*)tS9@|2;Gtb`R%4Um{SXm^v%pNZi^9brjA0v{tL7Fmv$rK%w!{TPzZnh3y0kvE{;hJ0;w;)%Ox zddbfd-I&YI#m=2&$X9OY3C4^xH;bH{esQAwc-A(oP_s)GC52-|Dj8Tco^7X z8o00MF5*<=1KvHop0?GBBs}8p)kt>#vEID=Lr*;Zk8esbXr(|8RK~&a-TxI(y`vdB zu@+1yfz^){^MfZ0>tBOUe$^X-yyzNt;5&-7E|rCGkd7G2nKo84@BN^$})+A zVFbc9D|u#`jY1N+OMgYCQn@`VdS>)=4IO!}?Vm^6lMqc@btyAW+FmuOj=Mg@DRps= zU`3&rE*Ew@`u4BP2|U?Hssdh*Y9tS(617$re5ZB2|@pOHre?f2|IZ7%W zM4x!QBCBn}Vdy7p#kkJQYG^?16B6@%kvQs%PM{ho#weJYY{+m(bv52c9p(7e-Ow^> z5i^vg0lG}7{}=9;fe1wA*(-f4xa6azG0P1zimykXgr53g{>XU}W#vfQq^;Lbj zq4uOUa5_M-Sf8Jk;DAv4jg0^#HXx~1=DKjUs7Sz)Vg5k+CkoeJ!H+9rQ>>o=!i=_s<*r=yNyZsNQQ?~_-okX;?F#OTT3Qg@;gb}PC(&xBJcg4PMTAHWi2dy7> z4`Kdg1q$k)z-OEagj`5f=jQY;IC(SX0~(+;1Ej0~VtKLlhfsyoHh z{Go?jZqs$Nyyaa*@dH(g8!IBw3D@(pD)E6ig(Fpf0KA$VYl_O#D1mJ`o&QwtBdf{W zW6adQ?=>C0F+J44#aQfzngHnece#bWQ5^D;G~U!(h8uHtr?xLAkk$0V&4TyupMTO5 z-NBg_K5gh%>4HKk=k~^-tO*x)hXXMmjP>H)2U=|ielXo1=IEJdeL(x8q?5bOP#xfT z=0HRw5_}(k3>p0|MH09y12B02DN06ql!^y{5gk}4rf%TpSIr}s@!#k;x8|Ju-(=f2 z`A-D~Bc_yUsqsUaE!0^=AH9c9jd&C#jyliQ*Y-Ad?tS?VnTdo8cV+?^!khO@-?;>s zfUd-)LLw~C(B}L13XMPShZjPCKEeGGrl30cZwtYbuq7iC%p%|BX1=O4h$ljf& z%?S6~Ffd_FiWW{O;hmbOmH*reBp!_?ksntg#%!{Y+U*Gjnoc9Ls4Y|w&GrAlL)Xq5 zK`bAL$YbK;BLbnLY{2Mi<7_Y>?$m0@8~40Bb9boO1!x#gstFrpBPcOX*@ZZp_rddBFbcP}}S!;_t6$JT4+lE+{y<(9{uHn^(jQsn z$4Tj|UwBHua80l51;?ALA#J*8IJ`T&zS5;Tfj~0tyfRjwDGiHz1!Ks$N6OqzYFnEX z_<9-(s(Bdsgqf{=?^n&3R0oL`+HRygvBRlYNQwii4RC zp#A<=Le0krCRAw+K6qx?n`7=0=&s+zM^32^CE{&aUZfjLsi2Bl?*~50fc$*SX z!5!=p2boqvtkm}C?U{H`k?E&_N2 zKH6cZgIDdpuxlWgjR5X>7GS$Vib8RvwzSLCg;@zg**eJPSJuJ)5f6U~g{1%%0-WX?YV# zD57cK4R*15TXIYA^E8K=cdxRh0>1Y0ZCf9H)&eM}&JTzlV&-|jjvuGGm4@Nh3PEsa zOC1b%#gi=Ua({VB=Q_heRQHVTE8YkgGV%`S!;tuT0K~a$v@OFZs1L_VE=wb;#ZcxWKl2PC)WxbI>YA7cyN@QtaS(#@{ z;!0ZO#ofBM7gk*o?(e~-#- zxI3*G=w|X;6oqCmy`>n21{%L4x)bi0)KI#jYsx>u1xR1yC^x?V=gaX)(_eu&lKOfX zbj===;v_Qzdny z^WM7c_BIdf&AQ>*1dY~=X8}a7N^>`T8 z0pQV1q@i^Xg)yh}Zqu*z2ahZ7z(nER1cqZ>)2$f=-ZaI{Ohm}6W8~B$!o5v4?Riy` z`3wNr)!m#D66FjO29A{p*;{=vC(nAEH$9z;DxG&7fd#j_M~xNJ(J|JIp-0mgk@bqk z|EtU0$)zl`^j;+4P!5> zWh@$r?NVlPC)}MY=19ePBGht$ikRZDf|%~&P76=;I!BrK{n?Q@j{XhFQX|*vcC5?w zuiYHtc(t0I{5)loy$XnakL&&O1;55*tuheRfdr7r?N@s=am-2bW=jeqHjZG26l z2ESp50Qx%Guqnh!=tw)s56#v3@+AlNe>yjZi{WBA0(-QL6#|HYC;kAa$@xIB2ypUB z*E>x|F|80nDTcEIf-YkRg8ZMB;Xo#!@KHn8DqN3c(D3{3mN7=r1p>rFHE{EUKJNxC z`>-dq>^Srf7qnz=lTP$*@I5eK+7hyV(Hm;FU(rLE`D_lR660_=-#T4-@2zwcPyBnHU5aq4E3z#HhS>GUWcp2* z8tMCo?wOla@7pv?t$KE)=(VgjOe!+IY#79Icjm|edfWl)@yfEe+ImN@HS*W+O|$LB zLQ75pg`VY7de8W-fP1Bl`}RW~ox!x(J=EDkUC^&ruD{@m-$>!Cww!XV2_G(Ys0=_* zMOuBaUIVC3FX(oz*+kv_nr6vuAQJTdqyV*wXoEJzuT)i64qSe8$Qw zX6IxjMz4uQv_2Nm=>#9HOqhR5O*LH3p`W#`h0Y}P8^Z-gXd`Qk1BFISh_qW z{A-sy*tHBQt+a+~LjDs@4Xrmo2rzq^&?JxS7BdB?aWG$*j+2qu_X>uu)8L)89>c_WBzq~0l*3+OF9`FH0s6?XQj^DP zzqoZS`VC9cF@PU>(W%@5{g?yJjcz^J3BpO_h!}QaHn4-i4tuv2&J+PelKCy79SgCW z|7r-7Uk5cpHCmxEj!ft&PEwIpbt=#y+_0PL4m2*r^w>A!BW)tIVw&?Q&w+%j^|cqIqBY_It7L2ZX2oKR|vFX!CNDH(yo z6#MTTJQ)y1P)yBGg%{_J3zXe8`1h0X$*edvPxnKC0HV3^m8Ek0QO_}|jkmijoWZO$ zk3m3d(K_-88tpDS*456qcztBh_w>(bZ?Z3rw~K!V(}f)eL5M|0a(r0eWLfEY=A%lu5O+Hy%-u^G-Mox zSGf4_*0&iw$d3+yE9|3)N%Rb6dyhBfiGx2kAmb8f_I0y~x>|8*E6o>J>r%{6r1)iy zsO~&c?(Pg*7e@=w7ra{n#Wl|7VsQfo&o9J+)ByQBAtg!a4-Ic=Gqmy9nU^q|_ff83 zHvt+OnunWRmUVI^i5hRJn0gUdfoow$fNKD(itMX>$`0i_OWx)dtFk|XcUD!F2`o2{ zAmBY@=Q(6x!D=t3>MZ@qK|A7QeF9ML#vF&nfb4qEn77nEP;^h0`R0&U-p@9)5R^x0 z+I>r1`pSp52#+mUkn#&L=ITl90~AMbvxs$!Re{&0_K;6m!C4`oIH ztpiFduArHuIH^`Hid4`xT1YXdGGxUjMd~&d=-2K9UBvG{=u8ad68QYPS`_#b1!>zX zQ9-iO(P%S^$VdIqJ}HJCxpjYthAn}I%5MLb%|^z!c)y_k_Ia+wspc5<`|{Aj-60OW zjL!Q#emo`Y#0DIu|4{TK*yk63qU#$aVS~`_s_dGE$)hmYy{=KAk@`ArOYxnHmx-qr zTS`Le>wEasaZ)5a%k`q2si|z51U+OV4cFg#clMe#L?I(uoC{6oEzgf%E_?KY@jJ8|=zy7Ayct-Xf!U2P8^I z6Hrpqsr=?hmfA1664(70t9f5E>E~|-uvkXMuzuTe*4vWiwl-s8Rkx`xx#HLF_;W!| z`JtpJITwbbkV@ea9yB9OC*4x^yeXwkgjbS&}3q!D0I>iBSScMO>rl6j1zlB;>Z7YFbPeW(J%p=qa4oZ`6dI=9WH z?e%xk=U#7~qTg_Yiy;gK1R=3_0v58__OYt?QPeJ7=?Wit8@=?-0c*S(@iOp*el+UH zd2cn8s*^f3J^UcDc+rlgh2g-cLL;mI`#NZty}04WQf41CungLh`yAAf-8*-pC-s?g z{9^n2RfI5dxVMDCg}(856iOwL)VEXZa{B3$^Jw=ZcUO~G><=eYRexX%nX;Hpg|h&}YZ4Rx zfOu|25|H-AB*LCN4up#EQY$=ZKFzN4^xPmxz~t9LZL63@r_>-eP1Kv|-^)=P1ME## zjFxBm&8lR0uSMo|w$w&soec#6Xb6lBJp&!KmPI1w z&!=fTb**5A6e7z`Z+SzO`5zqL99!;*XySR7TugCy*ioEM-fJVtA5-dzHgt99PQP~j z9TtF}yRXBqF5S%4dc;X!yubrLISSrOK*~YS-s5+-m-6=oDlp)GGvO} zkmBGL0-ZYngcn}AOhe+>`}>ZLgc?~vWIz1lTdJ~Gtdho{O3wK+Np`ge!BHIs%%9J2 zx6_kjaD~=XtE@7O4J2THf%45Kz*3!SIV)01J=Jn^kQitY)~c2PR34IT##y0t(lM`Q zIe*N|)j0dkjHeFY6bM+0+eG2TRj*|a?a{BqQky+?QORYOQVcCl=JYm2Gl>6|E+nDl zCtxD*^wiGmZ*r5orRYZFUPeeot1c~zJ4M#$72Y_gO@aghR;V2S3O3xr%GWm)ykn#- z(<<`j5jnqxW?$e4M(>{kca)oN2PLT14Qiwi`NpI`(HFZ#O_k$bdp+|4LGOrwOi+n5 zW4aF2Z@I1muyn9Y!}MZi@NOpGm+aEQ3bUM=Gyyb%5`U$D(i6A@ChK2yPld0MUCc*@ z^g;DK38vwt>U%+|+BM$LF{i*J#q>Bj0pB#M75?{Wob+(zAl4`oOf6#EJt}pz01ojEmQobmQ=W5CB3eGxm2KMj~+k+%znAFc+YQ zk+l(ofRFA$h^wQymL>-H{xk6Xs2XTR9%U%&*Wit8f!F}DXo{N-bEK3s^Wg>NaBjLFXddB>8tnB4ZUG#PI0IupxKq(K+a+a zQi2&aghs1!!v^HEyLkoJ@IV^>0JS-d4*hqY0o^ypJ|6q8k&G9E6m9Qz-pk&o>(w>0 zL_*n>B01lg-JgNZ^>fEdZ>=C9hhCiFqw|ylw&%ydbKFmSL`K_Od+;q*HL zeBYg#T$*9QUA@=k{_T^G9%Z?d*L2JitFYK@WIv_4A~OhPub7&b*`xpt;C+LfVZ6Dw z)l>lC1#T$-5~5FGz661RuP+9P&)yw#iRZV*6M!P^JEui0pqs~th0DRh{V;GODvvP* zd!i0F&#FZhq`;TG1b+l5i^)`~O#$%N_m%qADB~^~Pk<4WzDUgJfB_efBf_OR>;a&DIr`Q090=^XHiXpN4hXP_ z$m}~SKk*hkjvQL7hk_cw|{*S#1_+*E~4!``q?4A%3a}nRq@IpvPGO zT92=0AJ9>LpZX!v%1;jcvh+0h3r5)1?I=3u(0nP=Y2W^C8D*?!rT&(Pa`{bYcazJS z4%~>owmcx)Dncd!*arM7V&VJ@a-QySn3U9^jdA;_ zQdV#q=Mc^uwXaS@jDC z&kH>99R1h}4|p~O{pXk7(DTPMNOB+GVHNARrY*@OT$}We6ul`3>iMX%vqO@!Nff## zDYSd z{ZTJO3K4t83(lF|7FZF2;*xfdQ=ha|FXKaAGOI!9Uj^@ZdO)kxt14=kXcyjp@!F5) zuBgxZZVkkl=HZ_$1ie~1qvr;Ngz=O=4CEO({q>+u^^?4FEAGuNx7&4y?>Md}v)0b4 zze<&U(KxR1A^$5|m{iUxq(oE%jTLgFiNgytFTeR>4{GBA=x_0j&SG(-wHp1V1t!M^ ztVAUdjk(^AgbLmXpK9Jo8sRGxiZwTxv_!(Fah^Rrz>H&M0zQl5naqG%YJfMm0eCbpQevD^v75C}` zz(Yf=331v8bQ@&}4=aDC6{Yb5$ew>?~%Wp@EdEEP* z>}~aZ1~lnBA&&8_aDY}Iv(Rt?^Nd?WA)iq6v{Rmo8%uJa*ae!uJdab^1Grw?20Tin zT#@x>Qg^FuCF`JvXuFD^e>-OR@XUEUzHGIMwC`ypkI%`;5>Nu}xn&Bs`*GikJ;&jb zQShB#V0gIJ_wV2W`|U#Zzmpwmu4Ncz$=^SW12%avbHkG}uM{0ZY~(~7)R5yqbenfgD#RI?D1nTs4_GUF=Rws|wQF59aM=QvM$=-k z0%geer01S=dF&SQkvxU147i-!>jl}&3EJ>t?6-;;IyuW(@O*QfHz+SEV!;H2T=y^@~)~= zeZ;TNWnP!pjUD}QJ{opR;1~>h@E^sfXbvt|AD#zi9 zfaF3S`v8L5^{8;}Y$7ZVVba##4QE&QS1$abJO`uvgO z(w_B2ljky8XZl^dV}(qSOj-v$&BNayzmB(Aerih7lc8Z-$Ev2m=h4Wyul@EDMsTbF zhnQYV=a7Ub_UT2J%^kI{Ts8=rWF!(C1V;|3j=^)=lrIFJdF>}X)WzMKtpA1)2}K-{ z(@auCG@3Q2n-GFBp7IkVYUgp^PSDVdMLtxI^ZQmfASW`}OMAbvToum>Ji zbk5!R0%bAegmc6PHYKwqKn$3OFf5+!gF0LTr|lLOuP2E3An-Rz#2VX$ts}*Oq6WXU z%-seCEs^5g^e!B;)O&6J{XH*~I0Y?qzU~8`*rB`U&t{;9B|x9U`?+k3$TT?j>}3oY zpfRvk+St8w2g8827+yP5$z7xL5K^O3Qh9IDzQb3h37wo|`j$8JD2@;IyZynd z#Bb}#eQ#6%5}=tRV58O3bfRy_(8%|my3UNH&fwLiO+d0DWQ#3fl{*{|NAA*Jf4x*H z!M`<0sA<8_p*WB3{<|(OviI?udvl{5X^OLCJYXIs#CfnySx^D3zh*A3mJ65?-e3s@ zSd0cbhZoa^DjZ!|FpbyPX(oL;aNn}TbmcCN>H}m!q;z#k0RZVo{X23eBgRD>$=9(I z7t!6xXzNF3CvDMet4LAbH#(9_0FF9}eM}fTpnVIMwy}Lxaxym?5rX-VS*27+Z|dtu z6rJ5`PfQpQ3TDKW|6#K?zGGYRK$XEh7}osMWB2~~^d`^_-JXj@O#d3~*VvVGd9cYF zS+jaAne(4<3U!8yd8n07OGvex7DaR1lGIJS-{S~LW5ZJ{Cf=~x3&KnrfJzRiqWET< z*dDs9(*cVDYt)Ues>tz#a-|V%+>thpCBP~sXJ}=5z;^jtR}U#{#D}!VV=#i)?17V4 zfE0Pu@0rl~zWb$biX(Vn>yeL;?H+#AiKd<|OH?Un(hum9!eo=G=S9E*pStk?oe+z!H52-)) z+__z(ks_^v^YIi+BjyQRrn1Msx=aA6k_J=u-bl@G>+2M8l++6W+9qZ+d{Di0`P0M? zF6Lo*3?26;L>$jL!^_k6o7pQ-3o`ly9E|d^7DR_=#FG6>r~A?wqq-lafVc z{5Yv;bt)Eq1-ke=A(e_>E77$g*eC%tzb49N(hgrBAS-KTODbDRAJNU*)V>UggH}&0 zu7JAs8$AII3lN^qRFDQ|78@J=fZ^q34^he^M)G$l6{WjK65m1$&K)TwgO@u{IyqE|9 z9^zjo|4qv6iR&Fumx3Mzz!|v8AAzhN``?|M?>=1M1>b>Oijtngo?i`cBporuEFgoUqIU_o~`=U`!tKOoStODc*wx#CbY@r zr$Q}9-}{k;NqVL`-m8Z|c`7YGU7cI5;St9V@f_kV+5LGT^!{u6N_CY=mFVz^z}wTq zt?D4YV#8O6O?mDdyyw$bUYB?n*Igrqf1|>O&%`h4@(lY|7v&xxfaxa|H zWr}q1A}T64N4FhSCegQG(JL-W?(D2Ml(S{`TF=kpsB}1Oen|{X=$8C7@au;s2=9{6 zL|{GLj{j1(*a{G7S75D6^MC~d<%ss)E@->O?4IC4{x$5gez|dGFf)b`0>~{J_$j^! z5@0=!v{Z7Z1Q3KPVvF?5%i$LgOCC#c60Cp*6m*U1M7PM+?y32#`mu;f%Mc4H9#C}U z{!)sT77?0xhk^s^!3Dy9V58b%Yp{5j(~nkTXe{mnW%T_hGHN zI!DrCzY+Xs$sDD|`3-Xz*%tcb;+WqDJ)i*GrEd5d3fwLOP~GR)wo{huEntb8))gKI z!m=P9prfR^dIZRJMo57ICOayH-QU^3h5WhdcxX+N$8d2KpgX}iswtzuD!eAK*UV*Q z)Ok$@^Jw)})Z}@&{27T1c(EcP01d>82 z!tMgbpGr1rI`mxc)HU*R)1wi~QZFDxQwF#4gUk?5n-9Px-XX1|ongOOs0?br5+heA7pS6>vMyD6m0cv)_wLs`M@N{>3!c-Xe zcK?_xGRS@Gq261YR3ZjA!8#C#s?sDz0D|k-3Sdx|*(KM52nyL*vhpc*{RFQu2vqRn z8lUKSG=A?24-+KhX^?nmo83!bKhn!OH!-!kNK>+)=(eg>k1OLrGtkow2UN8|sTVL# zCxz1{sYqMam3SXJ|6uPvF|~7@u~B}$c}Ip{x*o{bf~V*%k@|B!s8uP*F(V#6_Rwqd z%dyv3FEAA68`&_cRSjLr_2EGqP8+>o{==PLxLruhphkHs_K&A>`H>l*yWs||4WJUwRc}AXsawn+Gn^qu( zi5Rd7a|LD$U@gKc#vk>hR-Uj$u|X6pm9>eLDQGGTD3*k>K6(5bgifsb$guTa#P^RT zu^~AJ2Z9Y|j`4RIsf=gf@C^v8#U|kOL4WJTL|apBiW&>dUl530bV=pbW`4A)zGn`K zTvCr~w~b|jgX@}^)z3E0Nzv(wT&gmt%1;0sXWQ-ce+&X=T7v4K5Jr7+Hg-88EsSf`0egU zWRTgz-M~;DS1@$|nG^mc_}&+pwgRL#yjQ_V$do(Z+FZRB zX&`|uYF`Y$5Tfk?+W4xCRJ@H8(Pl8f`$-=|(M!e`i%kgn?|pX0@x!x~XreasC@-Cx zsF2&Rr6rJgAc=oK02O~0&==Gjz*$6-c6nya4P2W4p5e~(#~}3!Aaa`Q^H1T$e#z#W zE2VZt-ZxdV|2o>l6P&A6Z?NtIs~^AmCGaY}wve;T=1mNjR!P`MMY6ntOn@EbTm6aS zC`GK%t%=tQwl6X<;!ooh2M}(5idaT6kH5##qb$4m%H(iq5pooMk_B3_LeJ%o2XEZ} z-7B4*`Br;|mJgnb7HxjoP;)o;)$%(xE6)gSD<;=xo}XAh65S8{ninbcYj)Kd4y8Bn zS`q!o9(y=R` znVK7)-R(5Sdb++jtW{MZZQ|Nonu}I(*bz&mnR^?*l}tsh#70Z)C~^CF=%0Tsd5LqJ zjLkpxmi*KhI`d4OtW16_^_Fp{X5_wAbnMT#lg+a{k`f|6M zQf{?QXzyvcyh9NkE!IdJ{y?<=ZtY8|cJ|_~Zzr}B9$f8x5ihK;y|Un)_iIMA7iU*o zR_GAHvZcPBGE=XOWWlZi-DqNHa7O-1s8gErgRbA#UY~H)ypA28-j+5g{^6N6AYxdh zmbj?n@n~f6@si43&wY9Hfrf&RC8Vvb4dlfj2b~6IykM3Ae}c)Gw~_}SFIXPTqNMlV zt2*9##KaoH_PN&JGg0K>jp(;^g)6b?hpw-d%aj@z9sDBTN3hY-??fH_uJJTU$|4iB z#~RPQgI}`IPP)4hvpiRsZDV?2Ag6xWCSSDXEk5seePn*4;@T8s@z~k=-`n($Vi|DS z(dEg?Hk<+RSo9UsG5_wQvhn!ww`Lw>KL^-SxrPi=BId z?+(2$w^YfzvddpM{d>b5%UA35_k_hHme2F-EEhben+N6Vehw6wv8&^Sez&KpWJY49 zbyQg+u%Cnf#Est8By*b$nzzb?3!Ykjp#3KQ;vFiT#KYFs2KyI9VFB7pVe#}>9O+{6 z7~@#t2jxX$PsDf#j(Fm^7tq(H7hWqmE4MjV#Z{!oNRCdCyL*o@4OvkHi7w}8>f88jmP}owLU2+Dc%jt&(ClC*Rx88Vd%MeR~8}hrOt!n zyOZ&V-wc|AATP%=wiz8EPr~}Z|6*x~d8dMcnakSy=Pyqjgg5kIMy1Cqt+q)Ro#Z%fm3z^N8CV`_c4iqS+R@Fw?<=^v1gWleHx@Tf`~p5%e5?7JQ&&Ub7uTYeeYkzN zTecV^{AY#^&)4Qv8a-9mA#}bi1%+3pC3HaK*zh$z&y*1neO{*nfi2^+H%D5k)*GnI zD6~&NAVd_sA2#yTja675C)jELE~-(OA)IFQ5DvnZ`nu(A8~_M5_Lt4bMC+* zjf!mOvHwA0he0@|;V+g;NgQ)d9k$)zAB62^?<+KOXD7r0O#g@p8*-;cPb=H1{$d#{ zkk6{4`E>@(tZ?pG3WI(+JFJhx)3sde79llr==ogoqY`%U`k4FCLgL=Fgll~@nZuv{ zkaZL74DUxYRg6m^w&Rt!MPaWzc@_yD$AJsW^G@2&e%sAUDwdJmVfIo<55rj zJC5%1kYTK^))kSiJx0{*p<8BuxV?_B^`mwa(-mn({G5%czV>4OtwmY)fGf)hh1Vzd zk8_LmSyPGqUS}!=l!&Uh7tO=!Hh!Z?5q(j+uZS}pY|3<{cR1~JEd>6!#ZORZ(NGd0 zUsjSaX1ni1wd~k4hK+K%afUd-1l|weA}U|C3FRUVG(Y9I`k% zGsPK{H6q2=VSk#2^=A}Bh6)hugzK7^iUvt)jq^r6EqwzMmbsEb6X2R|J(c-)N*CYZ z>-TuP|E%{Ue7XQ*r8t2-$^8;Rg;1J5<+RP2Kj@XH(YZ7$#(728W+q=N_>yYcu0MZl z^~F1_w_hY5rxY~>B^11P$l83bB*OUO$+{wYQHJc%U93HPgI|&!97a;YQF&#<@$;pyQl80Fo$>Mt1ih&bljha`O%8#PeuQH z>vblYX}`PE)3!|x-_V-z+smtIxu8JgR?osrUdwAgrq874sUSl)*~M^L^xB#%ADGEf ztMxpy9GeY=Wi6`+<_;h9_88)Xw{LFrqrX6fYq0YI>jv#}A3_i_hPm=`3pq>z1O@xo zWrGP-quEkVoA*KT8=IpL%@UB)b|`0QeT&fAHf>BMlaU8OIhvQMJY@VhlMis3{rXt+ zwQ!>B+o)@-x;1>9j($+>lJ~E6!#GFo%3^ z#rtJA%n}SVedLQuT74;prB`6++LTL|y6Xt;5~fPpgMZ$d%%Aw5P+HmVR?9s~KB_8_ zm^OSV@^FO6D4A|Eq0vaYWqz?VGZ|;-?C%t$u@>ggV*cd3<;|Z1O=y$i%c4w z$+E=UoAV-r+a;q&z_%B8@ELAVS2iC{V)IJGw-84nP>r@_A;jO-NMm+k@NqEY=#~7l z`}MKMl~%7XL6HPjBFBVh#|^x*gZ}A2zW1Y?(snw;e6uD~n!AhRVb_g$>iPig`UmI) zitDR{P5t^6@*47CJ7bN-pOGF2Bdl`yvK1oM+@1e zjpM~g7(K5@jrVkR_Dc)IeJ_y@-Q1{R{$^Oc(sQa--Zg=;|5)qfWy{M@s#(t!mCcyf zkKZvm_MO+Y@P#T0Pw35|1`RlN=5@)(*-YF;Cmt$MXn!fW*d9=GtQY;}-Q@nk4eC7H zRLo5tVyIYLx!d4MvtGRXULUUo;^zn2`bVn+CmbK^Io*@N6kc^*w&SSFw z(r#^szvq@Wkxx3NP(XWo(LL>TZdCGFL5lA~6?WZSUH(8lVydX9Kr|>^NgWLDHrf__IK5NFZAdvDh-A4Y zF#Wi>#X>Fnl=Y<8IK_7*MMd9Ub$Yxy<&^g4OG@}}s~q9BRXVO8LLP;bF7H~SZYW;% z<@6Vh+^;qs6DjQ5#|gCNHpQssOyy5Xu=3f{bNcZ-H~i?iq;~&J$%G14(u^RAdC(n@ zwf8#IbvR}7O9@}4RSwe<+m)H~ueDnr9lW&majy-&!%A|Ym-QKhs>a#gP4odXZ?fcs zs~`@hs`Wvr;JnW4FSm3k6~OYLo|VovneKXZck;Im-Or|~j<~UvCQjEuw%yrR^Ly@` zc@`(xHZya{*593Lxy1USLs(WI?m}yB5U1Lr2OD42HIf)GU4VG`s&5^Uc5wKe9ywZJ z*FWp=lt#uOT9C&e)=chggZJKqNzh9O4Qd%Gn3rm?xRzJ6ZIR-h6=&6(xa4r@nI$nd z1v>lZE4hQ0)I~G$-=CUbr(9AHXYWhDrEFi_xnoXC?aVWC_ma1%8OBgz(a7SqPXr_7 zINgMILA0v88@W`BXiy|}eq_W>FvusReLivaWH@Tu*R~~__N`Lnr-cMT*1bZKCQ)5} zb)ku+$jfpzH7EP;RXf?ewZpcR4qD=DrYpa8;i>uyDu=%DsO+b9DF0JZr)v@*MB3E< zpgK)9R(N;$oz3hb_GuUI%I4%Ho%gP{1bzrg8iwTTb4-7uPkD-%8jnaecC8o4E7 zy6H72F0kWBnN5WSqo>AkzY{IaeRv+(uicvMY2t9Au2oi8$#Sx41zQd|G>RchR>8#H=HLUmMg z`viz)1I(zdc8-G03x@;Kx?HzWGpXx=&>ZtL?x2j=# ziV4J6A3J$L6?OD@KmG2Wi^6+6*GeRAKiIPv=`6_djN7 z@Bhm^Ml&f%604N1*%HM%m&9--uOhRGfQMvqxxc0}`HXrmm!j=+q04IY=ea%oq{Opv zcGI~IOam!)Cp3=~Z!Hwv=bca;B!9gSl&t38pnz(6uV{US{O)I;-$S}5gjINAr8sCM z;#kvC^P7ELGKKiOOl-&c(Qj0KrWD)KYo%GS?nta^@REF^Otc=lzm~9{l$giBmTG+C z=y(4LDl@0dx5}<3&NE4tqwzE{TtcQ7X)_sj>IQ?VLady{qkGT_G2c1`G&)b0ds`Y5 zTN<5^i4{&0UBVI9g3#GU-09?WS2nD_N9)jOwHbCBHtPo_72TT+tBbk&;+2A#=4WY& z^Vw}1^Qux1e~;yCIF2#3nas$#u!aPMl70NZdonTfbmkLsJDv|)Nu@tA)HxbUDvYTt z&vZK@ngjpjoE*}d7*b6!q)t(x4#oZPzR$+wd-aGCIeW~=Xdc(V&dW@;{HX?)OP~8S z&GuD3hI4h|TH0M2Re2{a#8uLsHHPm=5nrS&)TmuwxRkYSE9b4|sE9-Rs`qd)%XZm& zEEB(O(b{#Hm}VY&(^~GW*(Y^UguAWTnR5rwko#O?(L4wda$9&3p&yu^P$@Sl(JTmF zERQ{2r%dR_+hpnfg9#*a&Ld@~WHMeh#MBhTDsMjTqduP%B+L^ML_wC8W|4r1R;_qoe1DcWX4DbrYWr8o2iLgSCY6WY)z)=9dUNuGsj`5B24 zdCy;JFK-d&a3-uBck@ByN|#4d%p2;FQ@LgZK#CNE0FStsA=$gfuhB0Fkh$j zoe(|kPbhc!@|jH5lS zr`{=uQju#d+%XTYj*dXer@1}(x*!gJVG81g_`?LZH3cm_AvqpG0PYdmf>yJX--kLv zhKt#P^n&5k%$O9v&s&{OTWsu?vce9Z_@tU4r-YY;Q{Y{*99*vpw!U7&kqu2LHBhKm zrXF;@EpnYXuG&$Z{$|RY%_ZegYc78mGs2^cp=ZbTl7+4-w(2-jyrQLsF5T1vvnA^8 z6>;QCPv)lk|JNvHu~P=;FH{4hpRDhgWaYHHr*>louv2Jg>!;d_Sk;W zGx|}K%qVkWO^rUD3+f;GDE7{iwlF1D2{ZdmxcjOY)6G~EEi^;i*LTFb3|x70r)g)2 zo1VoPVtwI%P2vQ%=<%qWCft^_)S3(VXp8#dbFK&xeu-B}vLR}p^FDu>zJ+9lC>|(z zP1Xy9rnLOM1Z6oT#5wMZY)j@l-Vy#j9ru%ccr?XUM)6Kse@^5CV~6*o!AvCWr%>5{ z{nsCs9>df`rBz9aVpB7)WJx@5O3w`GVo3VKC^nGWL`1))rr48N}_9KH7)&DvrjaInisSb*GY&hhr>|1iJwAmu_!`oQc2z}=fQ#Q zrWa&~dniR68o>X41sYoOf8Cv&LKt~;aCuTD6%+;X;eZo|7b9oC6^vLc-1x%b9RIhM z8Im@St@2K3=2R6RsQbXGp-V&xl&8!GD2iz&x8au!vFcl zjP*t{BlLKHs)c%X#umd2H=qqA1?C7#*-ZbOE6I-Rg2I1(KGlS6%Y~|=JpS;BJUxsL zxWnmqiHlX?L{!4FwXStPU=pFnnxr!xJ=(;`h*l7$EvGmf$)%Pqaxm5Zb1u|{9qabQ z0IZy@m51O<9bvO2v-;}8qK~VT7(AVCdxB74U0roGOR|_fNa2tIMg_s4e(UWGP0a!n zCZAp*P9f_StdD}GX+Ujl?Fw~}$J(ssh{w1uaA?SgP6O2*MYB(u8I7K7S;)!D-zw1M z;O0Iaf5n)g!p6a&8B|X*dgjvm=U0Hfno(2p;9E{{F%3}P15~nQKui4qbYLa>ADgVNo%Vn@(RUE-0E?i^O`Rms&t`ByEQb6X4 zfo!d=wl={}^y<~+jhi6Nz%M5Dg6+CzRLV7%;L#^Liwk(k-`|&(=I62Sc0E5gcSwqq z_X}SjEw@=;Ej?@GX?pRKX}Hi|0Qr{18+nEL0)q|2z00g3XZHbW3Xp0+kU2F1j`B5k zkoqiZY?SNk?QME*Q0sFo8Gsy;@a8cPg&0-U)h&T`HnrqvXNR>cODr(1O9ha23FwDL z<@MVBg%t-2t;R}#qQ3Lla_)AscW_{+NNf`lxc4r6ail5+`D{SI5%;B@nE>r*0SL~Mj;CPC z&uARMg!137jItjp4?TEKm@ol!@iIeIlgHc=<6dx2?B9I zVW})JKAzi)+9Nr1duu(sXEE^94gYRyIe0%FS(FhCwcVBZEr2`~t&qUODOR45qfI#bKI=m@b zLJ}$J2$~83g8-VPxo+RuM{KX6#IRuY*RKG>f^%U}KC5TAQM;SOn+iTY*Wm$a>gzv6 zq;tXiH(|cWA{ubkM0Xw5Q!_3ZD2ho3OFv_$ZT2$ps>#GZ1eJMu}RUmA!M!@nVb zGEhkd7-VXFYQzZ4s)mjZ4hUm+T=kk`>oA~G;V;?AV{!Yb2iVc7JakZgn_By@jIFS=FRdq?K=pP9M;08vwA<`Oa&xg(-Qrz;o-2pK3z=~Qy+$~Cac}wJ6tRt zX=K%wfcyXl%G}x6-tHP1xo$C~uA&kECSzm6 zC_?=;OaD#(-KIHJfX<_y7XC1g)Xvbj0JJzn-5c~{gseJP5rF~{H@3Z|*)KZP!N3B~ zEh-{HcDNAJ3O@*#dl#r6I5n=o!H3id^O!-+BN$~gJ!MKEJ85Djr0PD@?g7qiz!?3?FjJaRF%XHq~7ncelcpkzi6iJ)VF!eoZ6ZIy|4+;Kh^Sd zO2L;(CMV7Q!Xp={F}gA|cQsLJXQ7N=Ts%H5KE4b#o|Aq|PYY&sxBQx)XTla1>^V6( zExt6u92bp0xbpC!(I&{z4Ut4OIzzH%%d(O(tIksRD~wtInvj)M zXR3u>ks)#rM^j=pmozoDzI-vaU(Kgv!Z8Z(0+%Q67aR09>2XSs4Jc6NLs$?Xdn zA?M8G<>enDUpcEg{2o(6gBe841=t6_2B8iML2UuBKV~4af#u=hd0SoWtht&VhUabg5 zj$c3k4^_iEP|kN>oo)^N{k6E@LG=q5hER}9gPEDx04#nQfT8>O>FJ%_fjsm169M)< zvrJE2UqDOvrz9gtMQh4gq5jQ4)& zwLKIQ$<}HuEh{rnRt}xLmXwq<0ASSwV0ufW;H9=_v)U}nLWf>Tdf-O^bAvp3kdAtX zCE`~oow^t$B_#*HW~(N)nwvqMZXy!Ppv>{w(-cm`uAN~)y>ppSuWh&X6+3nQMw>&; zx^9jJT3<^mdRDY~NW)22SGN@AN+htM9#Se&ga91ubZ->)p)+wSCT$l7*AszJ1LN;Y zN5{{Yn};<31NOpwS>x+;_0pAiZ4x3Qc1nBUe_4t1&{z)qo&pjrEU6|Ba z2Po$&Gyk*Mp`b*Bn?SZcLpL9^kN<&#NRYIT`Rxpk7lUy=Vm*$Zib_s~RPyG{r&E5L zvS780C&&OxObNBj?w=|}>i71;WHGIzDe58Ish&sRFaaGM6yV|h4>KjD$=R_5z%+)E zi~!WL;N#~!QP5q$2@L|Gng02+ihhAEaykcPBFKoKe1QN3NpS*XvZ7keH`^Vb1pfFE zp9OU>WzZ26!qm;x;RRqi;Gm8~-q=P1=3#kweBb>dffEPYVJ z#!W&T#5hfo{#_c6L{Pp62pYI?KgxW)y(NEkrbU9beEs~5nAWR(qcB_{Md+(9p&zk^ z0NaSpW9%_E(r7diiC7?nYM|-i>_O%`2nd9m2U~YQ$4cgP&z5h8%S=Z`em<3L1vBc= z>a?