From 70680c9f935edc63d24ce4c94f2bdadac5279c55 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Wed, 3 Jun 2026 19:44:14 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: laion/openthoughts-4-code-qwen3-32b-annotated-32k_qwen3-1.7B_32k Source: Original Platform --- .gitattributes | 53 + README.md | 36 + added_tokens.json | 28 + all_results.json | 16 + chat_template.jinja | 89 + config.json | 60 + configuration.json | 1 + generation_config.json | 13 + merges.txt | 3 + model.safetensors | 3 + run_summary.json | 12 + special_tokens_map.json | 31 + tokenizer.json | 3 + tokenizer_config.json | 240 + train_results.json | 16 + trainer_log.jsonl | 1557 ++++ trainer_state.json | 16525 ++++++++++++++++++++++++++++++++++++++ training_args.bin | 3 + training_loss.png | Bin 0 -> 47290 bytes vocab.json | 3 + 20 files changed, 18692 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 added_tokens.json create mode 100644 all_results.json create mode 100644 chat_template.jinja create mode 100644 config.json create mode 100644 configuration.json create mode 100644 generation_config.json create mode 100644 merges.txt create mode 100644 model.safetensors create mode 100644 run_summary.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train_results.json create mode 100644 trainer_log.jsonl create mode 100644 trainer_state.json create mode 100644 training_args.bin create mode 100644 training_loss.png create mode 100644 vocab.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..75a69d2 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,53 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text + + +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zstandard filter=lfs diff=lfs merge=lfs -text +*.tfevents* filter=lfs diff=lfs merge=lfs -text +*.db* filter=lfs diff=lfs merge=lfs -text +*.ark* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*data* filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.meta filter=lfs diff=lfs merge=lfs -text +**/*ckpt*.index filter=lfs diff=lfs merge=lfs -text + +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.gguf* filter=lfs diff=lfs merge=lfs -text +*.ggml filter=lfs diff=lfs merge=lfs -text +*.llamafile* filter=lfs diff=lfs merge=lfs -text +*.pt2 filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text + +tokenizer.json filter=lfs diff=lfs merge=lfs -text +vocab.json filter=lfs diff=lfs merge=lfs -text +model.safetensors filter=lfs diff=lfs merge=lfs -text +training_args.bin filter=lfs diff=lfs merge=lfs -text +merges.txt filter=lfs diff=lfs merge=lfs -text \ No newline at end of file diff --git a/README.md b/README.md new file mode 100644 index 0000000..da9ff57 --- /dev/null +++ b/README.md @@ -0,0 +1,36 @@ +--- +license: apache-2.0 +datasets: +- laion/openthoughts-4-code-qwen3-32b-32k-annotated +base_model: +- Qwen/Qwen3-1.7B +--- + +Test Qwen3 1.7B post-trained on laion/openthoughts-4-code-qwen3-32b-32k-annotated (Qwen3 32B 32k output length annotated, using https://huggingface.co/datasets/mlfoundations-dev/hero_run_4_code as seed for generation) + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 0.00015 +- per_device_train_batch_size: 1 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 256 +- total_train_batch_size: 256 +- optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.99) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 2.0 + +### Training results + + + +### Framework versions + +- Transformers 4.55.0 +- Pytorch 2.7.1+cu128 +- Datasets 3.6.0 +- Tokenizers 0.21.1 \ No newline at end of file diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000..b54f913 --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,28 @@ +{ + "": 151668, + "": 151658, + "": 151666, + "": 151667, + "": 151657, + "": 151665, + "<|box_end|>": 151649, + "<|box_start|>": 151648, + "<|endoftext|>": 151643, + "<|file_sep|>": 151664, + "<|fim_middle|>": 151660, + "<|fim_pad|>": 151662, + "<|fim_prefix|>": 151659, + "<|fim_suffix|>": 151661, + "<|im_end|>": 151645, + "<|im_start|>": 151644, + "<|image_pad|>": 151655, + "<|object_ref_end|>": 151647, + "<|object_ref_start|>": 151646, + "<|quad_end|>": 151651, + "<|quad_start|>": 151650, + "<|repo_name|>": 151663, + "<|video_pad|>": 151656, + "<|vision_end|>": 151653, + "<|vision_pad|>": 151654, + "<|vision_start|>": 151652 +} diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..ae81f6e --- /dev/null +++ b/all_results.json @@ -0,0 +1,16 @@ +{ + "achieved_tflops_per_gpu": 0.006294075316425587, + "achieved_tflops_per_gpu_theoretical": 530.5945130815979, + "epoch": 2.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.598960816860199, + "mfu_percent": 0.002017331832187688, + "mfu_percent_theoretical": 170.06234393640958, + "total_flos": 2.3824840797454336e+16, + "train_loss": 0.11019459065355108, + "train_runtime": 14786.2521, + "train_samples_per_second": 129.744, + "train_steps_per_second": 0.507, + "valid_targets_mean": 15636.4, + "valid_targets_min": 509 +} \ No newline at end of file diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000..01be9b3 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,89 @@ +{%- if tools %} + {{- '<|im_start|>system\n' }} + {%- if messages[0].role == 'system' %} + {{- messages[0].content + '\n\n' }} + {%- endif %} + {{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within XML tags:\n" }} + {%- for tool in tools %} + {{- "\n" }} + {{- tool | tojson }} + {%- endfor %} + {{- "\n\n\nFor each function call, return a json object with function name and arguments within XML tags:\n\n{\"name\": , \"arguments\": }\n<|im_end|>\n" }} +{%- else %} + {%- if messages[0].role == 'system' %} + {{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }} + {%- endif %} +{%- endif %} +{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %} +{%- for message in messages[::-1] %} + {%- set index = (messages|length - 1) - loop.index0 %} + {%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('') and message.content.endswith('')) %} + {%- set ns.multi_step_tool = false %} + {%- set ns.last_query_index = index %} + {%- endif %} +{%- endfor %} +{%- for message in messages %} + {%- if message.content is string %} + {%- set content = message.content %} + {%- else %} + {%- set content = '' %} + {%- endif %} + {%- if (message.role == "user") or (message.role == "system" and not loop.first) %} + {{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }} + {%- elif message.role == "assistant" %} + {%- set reasoning_content = '' %} + {%- if message.reasoning_content is string %} + {%- set reasoning_content = message.reasoning_content %} + {%- else %} + {%- if '' in content %} + {%- set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} + {%- endif %} + {%- if loop.index0 > ns.last_query_index %} + {%- if loop.last or (not loop.last and reasoning_content) %} + {{- '<|im_start|>' + message.role + '\n\n' + reasoning_content.strip('\n') + '\n\n\n' + content.lstrip('\n') }} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- else %} + {{- '<|im_start|>' + message.role + '\n' + content }} + {%- endif %} + {%- if message.tool_calls %} + {%- for tool_call in message.tool_calls %} + {%- if (loop.first and content) or (not loop.first) %} + {{- '\n' }} + {%- endif %} + {%- if tool_call.function %} + {%- set tool_call = tool_call.function %} + {%- endif %} + {{- '\n{"name": "' }} + {{- tool_call.name }} + {{- '", "arguments": ' }} + {%- if tool_call.arguments is string %} + {{- tool_call.arguments }} + {%- else %} + {{- tool_call.arguments | tojson }} + {%- endif %} + {{- '}\n' }} + {%- endfor %} + {%- endif %} + {{- '<|im_end|>\n' }} + {%- elif message.role == "tool" %} + {%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|im_start|>user' }} + {%- endif %} + {{- '\n\n' }} + {{- content }} + {{- '\n' }} + {%- if loop.last or (messages[loop.index0 + 1].role != "tool") %} + {{- '<|im_end|>\n' }} + {%- endif %} + {%- endif %} +{%- endfor %} +{%- if add_generation_prompt %} + {{- '<|im_start|>assistant\n' }} + {%- if enable_thinking is defined and enable_thinking is false %} + {{- '\n\n\n\n' }} + {%- endif %} +{%- endif %} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..26358f4 --- /dev/null +++ b/config.json @@ -0,0 +1,60 @@ +{ + "architectures": [ + "Qwen3ForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 151643, + "eos_token_id": 151645, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 2048, + "initializer_range": 0.02, + "intermediate_size": 6144, + "layer_types": [ + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention", + "full_attention" + ], + "max_position_embeddings": 40960, + "max_window_layers": 28, + "model_type": "qwen3", + "num_attention_heads": 16, + "num_hidden_layers": 28, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-06, + "rope_scaling": null, + "rope_theta": 1000000, + "sliding_window": null, + "tie_word_embeddings": true, + "torch_dtype": "bfloat16", + "transformers_version": "4.55.0", + "use_cache": false, + "use_sliding_window": false, + "vocab_size": 151936 +} diff --git a/configuration.json b/configuration.json new file mode 100644 index 0000000..159097f --- /dev/null +++ b/configuration.json @@ -0,0 +1 @@ +{"framework": "pytorch", "task": "others", "allow_remote": true} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..4b23077 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,13 @@ +{ + "bos_token_id": 151643, + "do_sample": true, + "eos_token_id": [ + 151645, + 151643 + ], + "pad_token_id": 151643, + "temperature": 0.6, + "top_k": 20, + "top_p": 0.95, + "transformers_version": "4.55.0" +} diff --git a/merges.txt b/merges.txt new file mode 100644 index 0000000..80c1a19 --- /dev/null +++ b/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/model.safetensors b/model.safetensors new file mode 100644 index 0000000..1cb6e90 --- /dev/null +++ b/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1bd22739b33efa165dfb6de72edd03a6e7c06fac8ef40ee11d8f7d906da5e7 +size 3441185608 diff --git a/run_summary.json b/run_summary.json new file mode 100644 index 0000000..34eb0f7 --- /dev/null +++ b/run_summary.json @@ -0,0 +1,12 @@ +{ + "agent_name": null, + "training_start": null, + "training_end": null, + "created_by": "DCAgent", + "base_model_name": "/p/scratch/synthlaion/dc-agent-shared/hf_hub/models--Qwen--Qwen3-1.7B/snapshots/70d244cc86ccca08cf5af4e1e306ecf908b1ad5e", + "dataset_name": "laion/Qwen3-32B_hero_run_4_code_32k-sharegpt", + "training_type": "SFT", + "training_parameters": "https://huggingface.co/mlfoundations-dev/Qwen3-32B_hero_run_4_code_32k-sharegpt_save-strategy_steps_Qwen3-1-7B/blob/main/config.json", + "wandb_link": null, + "traces_location_s3": null +} \ No newline at end of file diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..ac23c0a --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,31 @@ +{ + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "eos_token": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..cd71f61 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4 +size 11422654 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..e9dc937 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,240 @@ +{ + "add_bos_token": false, + "add_prefix_space": false, + "added_tokens_decoder": { + "151643": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151644": { + "content": "<|im_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151645": { + "content": "<|im_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151646": { + "content": "<|object_ref_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151647": { + "content": "<|object_ref_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151648": { + "content": "<|box_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151649": { + "content": "<|box_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151650": { + "content": "<|quad_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151651": { + "content": "<|quad_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151652": { + "content": "<|vision_start|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151653": { + "content": "<|vision_end|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151654": { + "content": "<|vision_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151655": { + "content": "<|image_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151656": { + "content": "<|video_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151657": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151658": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151659": { + "content": "<|fim_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151660": { + "content": "<|fim_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151661": { + "content": "<|fim_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151662": { + "content": "<|fim_pad|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151663": { + "content": "<|repo_name|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151664": { + "content": "<|file_sep|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151665": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151666": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151667": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151668": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|im_start|>", + "<|im_end|>", + "<|object_ref_start|>", + "<|object_ref_end|>", + "<|box_start|>", + "<|box_end|>", + "<|quad_start|>", + "<|quad_end|>", + "<|vision_start|>", + "<|vision_end|>", + "<|vision_pad|>", + "<|image_pad|>", + "<|video_pad|>" + ], + "bos_token": null, + "clean_up_tokenization_spaces": false, + "eos_token": "<|im_end|>", + "errors": "replace", + "extra_special_tokens": {}, + "model_max_length": 32768, + "pad_token": "<|endoftext|>", + "padding_side": "right", + "split_special_tokens": false, + "tokenizer_class": "Qwen2Tokenizer", + "unk_token": null +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..ae81f6e --- /dev/null +++ b/train_results.json @@ -0,0 +1,16 @@ +{ + "achieved_tflops_per_gpu": 0.006294075316425587, + "achieved_tflops_per_gpu_theoretical": 530.5945130815979, + "epoch": 2.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.598960816860199, + "mfu_percent": 0.002017331832187688, + "mfu_percent_theoretical": 170.06234393640958, + "total_flos": 2.3824840797454336e+16, + "train_loss": 0.11019459065355108, + "train_runtime": 14786.2521, + "train_samples_per_second": 129.744, + "train_steps_per_second": 0.507, + "valid_targets_mean": 15636.4, + "valid_targets_min": 509 +} \ No newline at end of file diff --git a/trainer_log.jsonl b/trainer_log.jsonl new file mode 100644 index 0000000..5f04ca7 --- /dev/null +++ b/trainer_log.jsonl @@ -0,0 +1,1557 @@ +{"current_steps": 5, "total_steps": 7494, "loss": 0.8094, "lr": 7.999999999999999e-07, "epoch": 0.0013344008540165466, "percentage": 0.07, "elapsed_time": "0:14:50", "remaining_time": "15 days, 10:29:05"} +{"current_steps": 10, "total_steps": 7494, "loss": 0.7891, "lr": 1.8e-06, "epoch": 0.0026688017080330933, "percentage": 0.13, "elapsed_time": "0:16:43", "remaining_time": "8 days, 16:40:40"} +{"current_steps": 15, "total_steps": 7494, "loss": 0.7545, "lr": 2.8e-06, "epoch": 0.0040032025620496394, "percentage": 0.2, "elapsed_time": "0:18:06", "remaining_time": "6 days, 6:27:47"} +{"current_steps": 20, "total_steps": 7494, "loss": 0.751, "lr": 3.7999999999999996e-06, "epoch": 0.0053376034160661865, "percentage": 0.27, "elapsed_time": "0:19:38", "remaining_time": "5 days, 2:19:34"} +{"current_steps": 25, "total_steps": 7494, "loss": 0.6974, "lr": 4.8e-06, "epoch": 0.006672004270082733, "percentage": 0.33, "elapsed_time": "0:20:27", "remaining_time": "4 days, 5:50:57"} +{"current_steps": 30, "total_steps": 7494, "loss": 0.7026, "lr": 5.7999999999999995e-06, "epoch": 0.008006405124099279, "percentage": 0.4, "elapsed_time": "0:21:16", "remaining_time": "3 days, 16:14:13"} +{"current_steps": 35, "total_steps": 7494, "loss": 0.671, "lr": 6.8e-06, "epoch": 0.009340805978115827, "percentage": 0.47, "elapsed_time": "0:22:19", "remaining_time": "3 days, 7:17:20"} +{"current_steps": 40, "total_steps": 7494, "loss": 0.686, "lr": 7.799999999999998e-06, "epoch": 0.010675206832132373, "percentage": 0.53, "elapsed_time": "0:22:55", "remaining_time": "2 days, 23:10:48"} +{"current_steps": 45, "total_steps": 7494, "loss": 0.6603, "lr": 8.799999999999999e-06, "epoch": 0.01200960768614892, "percentage": 0.6, "elapsed_time": "0:23:32", "remaining_time": "2 days, 16:56:49"} +{"current_steps": 50, "total_steps": 7494, "loss": 0.6859, "lr": 9.799999999999998e-06, "epoch": 0.013344008540165465, "percentage": 0.67, "elapsed_time": "0:24:35", "remaining_time": "2 days, 13:01:48"} +{"current_steps": 55, "total_steps": 7494, "loss": 0.6601, "lr": 1.0799999999999998e-05, "epoch": 0.014678409394182012, "percentage": 0.73, "elapsed_time": "0:25:11", "remaining_time": "2 days, 8:47:02"} +{"current_steps": 60, "total_steps": 7494, "loss": 0.6605, "lr": 1.1799999999999999e-05, "epoch": 0.016012810248198558, "percentage": 0.8, "elapsed_time": "0:25:46", "remaining_time": "2 days, 5:13:57"} +{"current_steps": 65, "total_steps": 7494, "loss": 0.6674, "lr": 1.2799999999999998e-05, "epoch": 0.017347211102215106, "percentage": 0.87, "elapsed_time": "0:26:40", "remaining_time": "2 days, 2:49:14"} +{"current_steps": 70, "total_steps": 7494, "loss": 0.6615, "lr": 1.3799999999999998e-05, "epoch": 0.018681611956231654, "percentage": 0.93, "elapsed_time": "0:27:23", "remaining_time": "2 days, 0:24:36"} +{"current_steps": 75, "total_steps": 7494, "loss": 0.6482, "lr": 1.4799999999999999e-05, "epoch": 0.020016012810248198, "percentage": 1.0, "elapsed_time": "0:27:57", "remaining_time": "1 day, 22:04:53"} +{"current_steps": 80, "total_steps": 7494, "loss": 0.6546, "lr": 1.5799999999999998e-05, "epoch": 0.021350413664264746, "percentage": 1.07, "elapsed_time": "0:28:33", "remaining_time": "1 day, 20:07:10"} +{"current_steps": 85, "total_steps": 7494, "loss": 0.6514, "lr": 1.68e-05, "epoch": 0.02268481451828129, "percentage": 1.13, "elapsed_time": "0:29:34", "remaining_time": "1 day, 18:58:32"} +{"current_steps": 90, "total_steps": 7494, "loss": 0.6534, "lr": 1.78e-05, "epoch": 0.02401921537229784, "percentage": 1.2, "elapsed_time": "0:30:08", "remaining_time": "1 day, 17:19:46"} +{"current_steps": 95, "total_steps": 7494, "loss": 0.6642, "lr": 1.8799999999999996e-05, "epoch": 0.025353616226314386, "percentage": 1.27, "elapsed_time": "0:30:42", "remaining_time": "1 day, 15:52:14"} +{"current_steps": 100, "total_steps": 7494, "loss": 0.6403, "lr": 1.98e-05, "epoch": 0.02668801708033093, "percentage": 1.33, "elapsed_time": "0:31:45", "remaining_time": "1 day, 15:07:47"} +{"current_steps": 105, "total_steps": 7494, "loss": 0.6474, "lr": 2.0799999999999997e-05, "epoch": 0.02802241793434748, "percentage": 1.4, "elapsed_time": "0:32:25", "remaining_time": "1 day, 14:01:20"} +{"current_steps": 110, "total_steps": 7494, "loss": 0.6414, "lr": 2.1799999999999998e-05, "epoch": 0.029356818788364023, "percentage": 1.47, "elapsed_time": "0:32:58", "remaining_time": "1 day, 12:53:44"} +{"current_steps": 115, "total_steps": 7494, "loss": 0.653, "lr": 2.28e-05, "epoch": 0.03069121964238057, "percentage": 1.53, "elapsed_time": "0:33:48", "remaining_time": "1 day, 12:09:39"} +{"current_steps": 120, "total_steps": 7494, "loss": 0.6551, "lr": 2.38e-05, "epoch": 0.032025620496397116, "percentage": 1.6, "elapsed_time": "0:34:32", "remaining_time": "1 day, 11:22:57"} +{"current_steps": 125, "total_steps": 7494, "loss": 0.6566, "lr": 2.4799999999999996e-05, "epoch": 0.03336002135041367, "percentage": 1.67, "elapsed_time": "0:35:06", "remaining_time": "1 day, 10:29:58"} +{"current_steps": 130, "total_steps": 7494, "loss": 0.641, "lr": 2.5799999999999997e-05, "epoch": 0.03469442220443021, "percentage": 1.73, "elapsed_time": "0:35:42", "remaining_time": "1 day, 9:42:56"} +{"current_steps": 135, "total_steps": 7494, "loss": 0.6375, "lr": 2.6799999999999998e-05, "epoch": 0.036028823058446756, "percentage": 1.8, "elapsed_time": "0:36:45", "remaining_time": "1 day, 9:23:36"} +{"current_steps": 140, "total_steps": 7494, "loss": 0.6648, "lr": 2.7799999999999995e-05, "epoch": 0.03736322391246331, "percentage": 1.87, "elapsed_time": "0:37:17", "remaining_time": "1 day, 8:38:49"} +{"current_steps": 145, "total_steps": 7494, "loss": 0.6534, "lr": 2.88e-05, "epoch": 0.03869762476647985, "percentage": 1.93, "elapsed_time": "0:37:48", "remaining_time": "1 day, 7:56:30"} +{"current_steps": 150, "total_steps": 7494, "loss": 0.6485, "lr": 2.9799999999999996e-05, "epoch": 0.040032025620496396, "percentage": 2.0, "elapsed_time": "0:38:48", "remaining_time": "1 day, 7:40:20"} +{"current_steps": 155, "total_steps": 7494, "loss": 0.654, "lr": 3.0799999999999996e-05, "epoch": 0.04136642647451294, "percentage": 2.07, "elapsed_time": "0:39:23", "remaining_time": "1 day, 7:04:50"} +{"current_steps": 160, "total_steps": 7494, "loss": 0.6442, "lr": 3.1799999999999994e-05, "epoch": 0.04270082732852949, "percentage": 2.14, "elapsed_time": "0:39:54", "remaining_time": "1 day, 6:29:14"} +{"current_steps": 165, "total_steps": 7494, "loss": 0.6282, "lr": 3.28e-05, "epoch": 0.044035228182546036, "percentage": 2.2, "elapsed_time": "0:40:36", "remaining_time": "1 day, 6:03:50"} +{"current_steps": 170, "total_steps": 7494, "loss": 0.6459, "lr": 3.3799999999999995e-05, "epoch": 0.04536962903656258, "percentage": 2.27, "elapsed_time": "0:41:29", "remaining_time": "1 day, 5:47:50"} +{"current_steps": 175, "total_steps": 7494, "loss": 0.6257, "lr": 3.48e-05, "epoch": 0.04670402989057913, "percentage": 2.34, "elapsed_time": "0:42:02", "remaining_time": "1 day, 5:18:02"} +{"current_steps": 180, "total_steps": 7494, "loss": 0.6617, "lr": 3.5799999999999996e-05, "epoch": 0.04803843074459568, "percentage": 2.4, "elapsed_time": "0:42:35", "remaining_time": "1 day, 4:50:43"} +{"current_steps": 185, "total_steps": 7494, "loss": 0.6367, "lr": 3.679999999999999e-05, "epoch": 0.04937283159861222, "percentage": 2.47, "elapsed_time": "0:43:40", "remaining_time": "1 day, 4:45:13"} +{"current_steps": 190, "total_steps": 7494, "loss": 0.6586, "lr": 3.78e-05, "epoch": 0.05070723245262877, "percentage": 2.54, "elapsed_time": "0:44:13", "remaining_time": "1 day, 4:19:53"} +{"current_steps": 195, "total_steps": 7494, "loss": 0.6426, "lr": 3.8799999999999994e-05, "epoch": 0.05204163330664532, "percentage": 2.6, "elapsed_time": "0:44:44", "remaining_time": "1 day, 3:54:56"} +{"current_steps": 200, "total_steps": 7494, "loss": 0.6433, "lr": 3.979999999999999e-05, "epoch": 0.05337603416066186, "percentage": 2.67, "elapsed_time": "0:45:37", "remaining_time": "1 day, 3:43:59"} +{"current_steps": 205, "total_steps": 7494, "loss": 0.6543, "lr": 4.08e-05, "epoch": 0.054710435014678406, "percentage": 2.74, "elapsed_time": "0:46:28", "remaining_time": "1 day, 3:32:25"} +{"current_steps": 210, "total_steps": 7494, "loss": 0.6531, "lr": 4.18e-05, "epoch": 0.05604483586869496, "percentage": 2.8, "elapsed_time": "0:47:00", "remaining_time": "1 day, 3:10:19"} +{"current_steps": 215, "total_steps": 7494, "loss": 0.6408, "lr": 4.28e-05, "epoch": 0.0573792367227115, "percentage": 2.87, "elapsed_time": "0:47:34", "remaining_time": "1 day, 2:50:38"} +{"current_steps": 220, "total_steps": 7494, "loss": 0.6479, "lr": 4.3799999999999994e-05, "epoch": 0.058713637576728046, "percentage": 2.94, "elapsed_time": "0:48:38", "remaining_time": "1 day, 2:48:10"} +{"current_steps": 225, "total_steps": 7494, "loss": 0.6398, "lr": 4.48e-05, "epoch": 0.0600480384307446, "percentage": 3.0, "elapsed_time": "0:49:10", "remaining_time": "1 day, 2:28:33"} +{"current_steps": 230, "total_steps": 7494, "loss": 0.6594, "lr": 4.5799999999999995e-05, "epoch": 0.06138243928476114, "percentage": 3.07, "elapsed_time": "0:49:42", "remaining_time": "1 day, 2:09:50"} +{"current_steps": 235, "total_steps": 7494, "loss": 0.6482, "lr": 4.68e-05, "epoch": 0.0627168401387777, "percentage": 3.14, "elapsed_time": "0:50:43", "remaining_time": "1 day, 2:06:53"} +{"current_steps": 240, "total_steps": 7494, "loss": 0.6426, "lr": 4.7799999999999996e-05, "epoch": 0.06405124099279423, "percentage": 3.2, "elapsed_time": "0:51:23", "remaining_time": "1 day, 1:53:33"} +{"current_steps": 245, "total_steps": 7494, "loss": 0.637, "lr": 4.8799999999999994e-05, "epoch": 0.06538564184681078, "percentage": 3.27, "elapsed_time": "0:51:55", "remaining_time": "1 day, 1:36:27"} +{"current_steps": 250, "total_steps": 7494, "loss": 0.6589, "lr": 4.98e-05, "epoch": 0.06672004270082733, "percentage": 3.34, "elapsed_time": "0:52:33", "remaining_time": "1 day, 1:22:54"} +{"current_steps": 255, "total_steps": 7494, "loss": 0.6496, "lr": 5.0799999999999995e-05, "epoch": 0.06805444355484387, "percentage": 3.4, "elapsed_time": "0:53:36", "remaining_time": "1 day, 1:21:53"} +{"current_steps": 260, "total_steps": 7494, "loss": 0.6354, "lr": 5.179999999999999e-05, "epoch": 0.06938884440886042, "percentage": 3.47, "elapsed_time": "0:54:08", "remaining_time": "1 day, 1:06:09"} +{"current_steps": 265, "total_steps": 7494, "loss": 0.6368, "lr": 5.279999999999999e-05, "epoch": 0.07072324526287697, "percentage": 3.54, "elapsed_time": "0:54:38", "remaining_time": "1 day, 0:50:45"} +{"current_steps": 270, "total_steps": 7494, "loss": 0.6445, "lr": 5.38e-05, "epoch": 0.07205764611689351, "percentage": 3.6, "elapsed_time": "0:55:36", "remaining_time": "1 day, 0:47:44"} +{"current_steps": 275, "total_steps": 7494, "loss": 0.6404, "lr": 5.48e-05, "epoch": 0.07339204697091006, "percentage": 3.67, "elapsed_time": "0:56:17", "remaining_time": "1 day, 0:37:33"} +{"current_steps": 280, "total_steps": 7494, "loss": 0.63, "lr": 5.5799999999999994e-05, "epoch": 0.07472644782492661, "percentage": 3.74, "elapsed_time": "0:56:49", "remaining_time": "1 day, 0:24:02"} +{"current_steps": 285, "total_steps": 7494, "loss": 0.6413, "lr": 5.679999999999999e-05, "epoch": 0.07606084867894315, "percentage": 3.8, "elapsed_time": "0:57:29", "remaining_time": "1 day, 0:14:16"} +{"current_steps": 290, "total_steps": 7494, "loss": 0.633, "lr": 5.78e-05, "epoch": 0.0773952495329597, "percentage": 3.87, "elapsed_time": "0:58:30", "remaining_time": "1 day, 0:13:27"} +{"current_steps": 295, "total_steps": 7494, "loss": 0.6317, "lr": 5.88e-05, "epoch": 0.07872965038697624, "percentage": 3.94, "elapsed_time": "0:59:02", "remaining_time": "1 day, 0:00:42"} +{"current_steps": 300, "total_steps": 7494, "loss": 0.6602, "lr": 5.98e-05, "epoch": 0.08006405124099279, "percentage": 4.0, "elapsed_time": "0:59:33", "remaining_time": "23:48:09"} +{"current_steps": 305, "total_steps": 7494, "loss": 0.6367, "lr": 6.0799999999999994e-05, "epoch": 0.08139845209500934, "percentage": 4.07, "elapsed_time": "1:00:43", "remaining_time": "23:51:26"} +{"current_steps": 310, "total_steps": 7494, "loss": 0.6459, "lr": 6.18e-05, "epoch": 0.08273285294902588, "percentage": 4.14, "elapsed_time": "1:01:23", "remaining_time": "23:42:36"} +{"current_steps": 315, "total_steps": 7494, "loss": 0.6357, "lr": 6.28e-05, "epoch": 0.08406725380304243, "percentage": 4.2, "elapsed_time": "1:01:54", "remaining_time": "23:30:47"} +{"current_steps": 320, "total_steps": 7494, "loss": 0.6412, "lr": 6.379999999999999e-05, "epoch": 0.08540165465705898, "percentage": 4.27, "elapsed_time": "1:02:36", "remaining_time": "23:23:41"} +{"current_steps": 325, "total_steps": 7494, "loss": 0.624, "lr": 6.479999999999999e-05, "epoch": 0.08673605551107552, "percentage": 4.34, "elapsed_time": "1:03:36", "remaining_time": "23:23:13"} +{"current_steps": 330, "total_steps": 7494, "loss": 0.6242, "lr": 6.579999999999999e-05, "epoch": 0.08807045636509207, "percentage": 4.4, "elapsed_time": "1:04:08", "remaining_time": "23:12:26"} +{"current_steps": 335, "total_steps": 7494, "loss": 0.6308, "lr": 6.68e-05, "epoch": 0.08940485721910862, "percentage": 4.47, "elapsed_time": "1:04:39", "remaining_time": "23:01:49"} +{"current_steps": 340, "total_steps": 7494, "loss": 0.6419, "lr": 6.78e-05, "epoch": 0.09073925807312516, "percentage": 4.54, "elapsed_time": "1:05:42", "remaining_time": "23:02:32"} +{"current_steps": 345, "total_steps": 7494, "loss": 0.6334, "lr": 6.879999999999999e-05, "epoch": 0.09207365892714171, "percentage": 4.6, "elapsed_time": "1:06:23", "remaining_time": "22:55:45"} +{"current_steps": 350, "total_steps": 7494, "loss": 0.6437, "lr": 6.979999999999999e-05, "epoch": 0.09340805978115826, "percentage": 4.67, "elapsed_time": "1:06:55", "remaining_time": "22:45:56"} +{"current_steps": 355, "total_steps": 7494, "loss": 0.6437, "lr": 7.079999999999999e-05, "epoch": 0.0947424606351748, "percentage": 4.74, "elapsed_time": "1:07:36", "remaining_time": "22:39:29"} +{"current_steps": 360, "total_steps": 7494, "loss": 0.6294, "lr": 7.18e-05, "epoch": 0.09607686148919135, "percentage": 4.8, "elapsed_time": "1:08:37", "remaining_time": "22:39:59"} +{"current_steps": 365, "total_steps": 7494, "loss": 0.6413, "lr": 7.28e-05, "epoch": 0.0974112623432079, "percentage": 4.87, "elapsed_time": "1:09:10", "remaining_time": "22:31:00"} +{"current_steps": 370, "total_steps": 7494, "loss": 0.6352, "lr": 7.379999999999999e-05, "epoch": 0.09874566319722444, "percentage": 4.94, "elapsed_time": "1:09:42", "remaining_time": "22:22:02"} +{"current_steps": 375, "total_steps": 7494, "loss": 0.6426, "lr": 7.479999999999999e-05, "epoch": 0.100080064051241, "percentage": 5.0, "elapsed_time": "1:10:37", "remaining_time": "22:20:52"} +{"current_steps": 380, "total_steps": 7494, "loss": 0.6297, "lr": 7.579999999999999e-05, "epoch": 0.10141446490525755, "percentage": 5.07, "elapsed_time": "1:11:22", "remaining_time": "22:16:04"} +{"current_steps": 385, "total_steps": 7494, "loss": 0.6355, "lr": 7.68e-05, "epoch": 0.10274886575927408, "percentage": 5.14, "elapsed_time": "1:11:53", "remaining_time": "22:07:26"} +{"current_steps": 390, "total_steps": 7494, "loss": 0.6413, "lr": 7.780000000000001e-05, "epoch": 0.10408326661329063, "percentage": 5.2, "elapsed_time": "1:12:33", "remaining_time": "22:01:36"} +{"current_steps": 395, "total_steps": 7494, "loss": 0.63, "lr": 7.879999999999999e-05, "epoch": 0.10541766746730719, "percentage": 5.27, "elapsed_time": "1:13:37", "remaining_time": "22:03:14"} +{"current_steps": 400, "total_steps": 7494, "loss": 0.6405, "lr": 7.98e-05, "epoch": 0.10675206832132372, "percentage": 5.34, "elapsed_time": "1:14:10", "remaining_time": "21:55:35"} +{"current_steps": 405, "total_steps": 7494, "loss": 0.6473, "lr": 8.079999999999999e-05, "epoch": 0.10808646917534027, "percentage": 5.4, "elapsed_time": "1:14:52", "remaining_time": "21:50:32"} +{"current_steps": 410, "total_steps": 7494, "loss": 0.6357, "lr": 8.18e-05, "epoch": 0.10942087002935681, "percentage": 5.47, "elapsed_time": "1:15:46", "remaining_time": "21:49:20"} +{"current_steps": 415, "total_steps": 7494, "loss": 0.6131, "lr": 8.28e-05, "epoch": 0.11075527088337336, "percentage": 5.54, "elapsed_time": "1:16:35", "remaining_time": "21:46:36"} +{"current_steps": 420, "total_steps": 7494, "loss": 0.6145, "lr": 8.379999999999999e-05, "epoch": 0.11208967173738991, "percentage": 5.6, "elapsed_time": "1:17:08", "remaining_time": "21:39:09"} +{"current_steps": 425, "total_steps": 7494, "loss": 0.6274, "lr": 8.48e-05, "epoch": 0.11342407259140645, "percentage": 5.67, "elapsed_time": "1:17:44", "remaining_time": "21:33:03"} +{"current_steps": 430, "total_steps": 7494, "loss": 0.6338, "lr": 8.579999999999998e-05, "epoch": 0.114758473445423, "percentage": 5.74, "elapsed_time": "1:18:48", "remaining_time": "21:34:32"} +{"current_steps": 435, "total_steps": 7494, "loss": 0.6439, "lr": 8.68e-05, "epoch": 0.11609287429943956, "percentage": 5.8, "elapsed_time": "1:19:25", "remaining_time": "21:28:53"} +{"current_steps": 440, "total_steps": 7494, "loss": 0.6323, "lr": 8.779999999999999e-05, "epoch": 0.11742727515345609, "percentage": 5.87, "elapsed_time": "1:19:56", "remaining_time": "21:21:42"} +{"current_steps": 445, "total_steps": 7494, "loss": 0.6283, "lr": 8.879999999999999e-05, "epoch": 0.11876167600747264, "percentage": 5.94, "elapsed_time": "1:20:47", "remaining_time": "21:19:48"} +{"current_steps": 450, "total_steps": 7494, "loss": 0.637, "lr": 8.98e-05, "epoch": 0.1200960768614892, "percentage": 6.0, "elapsed_time": "1:21:41", "remaining_time": "21:18:51"} +{"current_steps": 455, "total_steps": 7494, "loss": 0.6232, "lr": 9.079999999999998e-05, "epoch": 0.12143047771550573, "percentage": 6.07, "elapsed_time": "1:22:14", "remaining_time": "21:12:11"} +{"current_steps": 460, "total_steps": 7494, "loss": 0.6288, "lr": 9.18e-05, "epoch": 0.12276487856952228, "percentage": 6.14, "elapsed_time": "1:22:49", "remaining_time": "21:06:25"} +{"current_steps": 465, "total_steps": 7494, "loss": 0.6389, "lr": 9.279999999999999e-05, "epoch": 0.12409927942353884, "percentage": 6.2, "elapsed_time": "1:23:50", "remaining_time": "21:07:16"} +{"current_steps": 470, "total_steps": 7494, "loss": 0.6294, "lr": 9.379999999999999e-05, "epoch": 0.1254336802775554, "percentage": 6.27, "elapsed_time": "1:24:33", "remaining_time": "21:03:41"} +{"current_steps": 475, "total_steps": 7494, "loss": 0.6481, "lr": 9.479999999999999e-05, "epoch": 0.12676808113157192, "percentage": 6.34, "elapsed_time": "1:25:05", "remaining_time": "20:57:21"} +{"current_steps": 480, "total_steps": 7494, "loss": 0.6352, "lr": 9.58e-05, "epoch": 0.12810248198558846, "percentage": 6.41, "elapsed_time": "1:25:48", "remaining_time": "20:53:47"} +{"current_steps": 485, "total_steps": 7494, "loss": 0.6405, "lr": 9.68e-05, "epoch": 0.12943688283960503, "percentage": 6.47, "elapsed_time": "1:26:48", "remaining_time": "20:54:25"} +{"current_steps": 490, "total_steps": 7494, "loss": 0.6278, "lr": 9.779999999999999e-05, "epoch": 0.13077128369362157, "percentage": 6.54, "elapsed_time": "1:27:22", "remaining_time": "20:48:59"} +{"current_steps": 495, "total_steps": 7494, "loss": 0.6328, "lr": 9.879999999999999e-05, "epoch": 0.1321056845476381, "percentage": 6.61, "elapsed_time": "1:27:56", "remaining_time": "20:43:22"} +{"current_steps": 500, "total_steps": 7494, "loss": 0.6409, "lr": 9.979999999999999e-05, "epoch": 0.13344008540165467, "percentage": 6.67, "elapsed_time": "1:28:54", "remaining_time": "20:43:45"} +{"current_steps": 505, "total_steps": 7494, "loss": 0.637, "lr": 0.0001008, "epoch": 0.1347744862556712, "percentage": 6.74, "elapsed_time": "1:29:52", "remaining_time": "20:43:55"} +{"current_steps": 510, "total_steps": 7494, "loss": 0.6318, "lr": 0.00010179999999999998, "epoch": 0.13610888710968774, "percentage": 6.81, "elapsed_time": "1:30:24", "remaining_time": "20:38:07"} +{"current_steps": 515, "total_steps": 7494, "loss": 0.6263, "lr": 0.00010279999999999999, "epoch": 0.1374432879637043, "percentage": 6.87, "elapsed_time": "1:31:02", "remaining_time": "20:33:50"} +{"current_steps": 520, "total_steps": 7494, "loss": 0.624, "lr": 0.00010379999999999999, "epoch": 0.13877768881772085, "percentage": 6.94, "elapsed_time": "1:32:07", "remaining_time": "20:35:32"} +{"current_steps": 525, "total_steps": 7494, "loss": 0.6396, "lr": 0.00010479999999999999, "epoch": 0.14011208967173738, "percentage": 7.01, "elapsed_time": "1:32:44", "remaining_time": "20:31:04"} +{"current_steps": 530, "total_steps": 7494, "loss": 0.6326, "lr": 0.0001058, "epoch": 0.14144649052575395, "percentage": 7.07, "elapsed_time": "1:33:16", "remaining_time": "20:25:34"} +{"current_steps": 535, "total_steps": 7494, "loss": 0.6309, "lr": 0.00010679999999999998, "epoch": 0.14278089137977049, "percentage": 7.14, "elapsed_time": "1:34:04", "remaining_time": "20:23:35"} +{"current_steps": 540, "total_steps": 7494, "loss": 0.643, "lr": 0.00010779999999999999, "epoch": 0.14411529223378702, "percentage": 7.21, "elapsed_time": "1:34:59", "remaining_time": "20:23:11"} +{"current_steps": 545, "total_steps": 7494, "loss": 0.6337, "lr": 0.0001088, "epoch": 0.1454496930878036, "percentage": 7.27, "elapsed_time": "1:35:32", "remaining_time": "20:18:05"} +{"current_steps": 550, "total_steps": 7494, "loss": 0.6524, "lr": 0.00010979999999999999, "epoch": 0.14678409394182013, "percentage": 7.34, "elapsed_time": "1:36:07", "remaining_time": "20:13:31"} +{"current_steps": 555, "total_steps": 7494, "loss": 0.6142, "lr": 0.0001108, "epoch": 0.14811849479583666, "percentage": 7.41, "elapsed_time": "1:37:04", "remaining_time": "20:13:37"} +{"current_steps": 560, "total_steps": 7494, "loss": 0.6373, "lr": 0.00011179999999999998, "epoch": 0.14945289564985323, "percentage": 7.47, "elapsed_time": "1:37:49", "remaining_time": "20:11:15"} +{"current_steps": 565, "total_steps": 7494, "loss": 0.6092, "lr": 0.00011279999999999999, "epoch": 0.15078729650386977, "percentage": 7.54, "elapsed_time": "1:38:21", "remaining_time": "20:06:13"} +{"current_steps": 570, "total_steps": 7494, "loss": 0.627, "lr": 0.0001138, "epoch": 0.1521216973578863, "percentage": 7.61, "elapsed_time": "1:39:06", "remaining_time": "20:03:48"} +{"current_steps": 575, "total_steps": 7494, "loss": 0.6334, "lr": 0.00011479999999999999, "epoch": 0.15345609821190287, "percentage": 7.67, "elapsed_time": "1:40:06", "remaining_time": "20:04:40"} +{"current_steps": 580, "total_steps": 7494, "loss": 0.6426, "lr": 0.0001158, "epoch": 0.1547904990659194, "percentage": 7.74, "elapsed_time": "1:40:42", "remaining_time": "20:00:35"} +{"current_steps": 585, "total_steps": 7494, "loss": 0.6461, "lr": 0.00011679999999999998, "epoch": 0.15612489991993594, "percentage": 7.81, "elapsed_time": "1:41:15", "remaining_time": "19:55:57"} +{"current_steps": 590, "total_steps": 7494, "loss": 0.6436, "lr": 0.00011779999999999999, "epoch": 0.15745930077395248, "percentage": 7.87, "elapsed_time": "1:42:07", "remaining_time": "19:55:00"} +{"current_steps": 595, "total_steps": 7494, "loss": 0.6271, "lr": 0.0001188, "epoch": 0.15879370162796905, "percentage": 7.94, "elapsed_time": "1:43:01", "remaining_time": "19:54:39"} +{"current_steps": 600, "total_steps": 7494, "loss": 0.6226, "lr": 0.00011979999999999998, "epoch": 0.16012810248198558, "percentage": 8.01, "elapsed_time": "1:43:35", "remaining_time": "19:50:19"} +{"current_steps": 605, "total_steps": 7494, "loss": 0.6379, "lr": 0.0001208, "epoch": 0.16146250333600212, "percentage": 8.07, "elapsed_time": "1:44:25", "remaining_time": "19:49:07"} +{"current_steps": 610, "total_steps": 7494, "loss": 0.6316, "lr": 0.00012179999999999999, "epoch": 0.1627969041900187, "percentage": 8.14, "elapsed_time": "1:45:24", "remaining_time": "19:49:30"} +{"current_steps": 615, "total_steps": 7494, "loss": 0.6256, "lr": 0.00012279999999999998, "epoch": 0.16413130504403523, "percentage": 8.21, "elapsed_time": "1:46:07", "remaining_time": "19:47:05"} +{"current_steps": 620, "total_steps": 7494, "loss": 0.6395, "lr": 0.0001238, "epoch": 0.16546570589805176, "percentage": 8.27, "elapsed_time": "1:46:41", "remaining_time": "19:42:48"} +{"current_steps": 625, "total_steps": 7494, "loss": 0.6414, "lr": 0.00012479999999999997, "epoch": 0.16680010675206833, "percentage": 8.34, "elapsed_time": "1:47:26", "remaining_time": "19:40:54"} +{"current_steps": 630, "total_steps": 7494, "loss": 0.6317, "lr": 0.0001258, "epoch": 0.16813450760608487, "percentage": 8.41, "elapsed_time": "1:48:23", "remaining_time": "19:40:52"} +{"current_steps": 635, "total_steps": 7494, "loss": 0.6339, "lr": 0.0001268, "epoch": 0.1694689084601014, "percentage": 8.47, "elapsed_time": "1:49:02", "remaining_time": "19:37:49"} +{"current_steps": 640, "total_steps": 7494, "loss": 0.6319, "lr": 0.0001278, "epoch": 0.17080330931411797, "percentage": 8.54, "elapsed_time": "1:49:37", "remaining_time": "19:34:02"} +{"current_steps": 645, "total_steps": 7494, "loss": 0.6239, "lr": 0.0001288, "epoch": 0.1721377101681345, "percentage": 8.61, "elapsed_time": "1:50:31", "remaining_time": "19:33:34"} +{"current_steps": 650, "total_steps": 7494, "loss": 0.6429, "lr": 0.00012979999999999998, "epoch": 0.17347211102215104, "percentage": 8.67, "elapsed_time": "1:51:22", "remaining_time": "19:32:46"} +{"current_steps": 655, "total_steps": 7494, "loss": 0.6401, "lr": 0.00013079999999999998, "epoch": 0.1748065118761676, "percentage": 8.74, "elapsed_time": "1:51:57", "remaining_time": "19:28:54"} +{"current_steps": 660, "total_steps": 7494, "loss": 0.6239, "lr": 0.0001318, "epoch": 0.17614091273018415, "percentage": 8.81, "elapsed_time": "1:52:36", "remaining_time": "19:25:58"} +{"current_steps": 665, "total_steps": 7494, "loss": 0.6387, "lr": 0.00013279999999999998, "epoch": 0.17747531358420068, "percentage": 8.87, "elapsed_time": "1:53:34", "remaining_time": "19:26:14"} +{"current_steps": 670, "total_steps": 7494, "loss": 0.6424, "lr": 0.0001338, "epoch": 0.17880971443821725, "percentage": 8.94, "elapsed_time": "1:54:19", "remaining_time": "19:24:24"} +{"current_steps": 675, "total_steps": 7494, "loss": 0.6444, "lr": 0.00013479999999999997, "epoch": 0.1801441152922338, "percentage": 9.01, "elapsed_time": "1:54:53", "remaining_time": "19:20:35"} +{"current_steps": 680, "total_steps": 7494, "loss": 0.6242, "lr": 0.0001358, "epoch": 0.18147851614625032, "percentage": 9.07, "elapsed_time": "1:55:42", "remaining_time": "19:19:25"} +{"current_steps": 685, "total_steps": 7494, "loss": 0.6377, "lr": 0.0001368, "epoch": 0.1828129170002669, "percentage": 9.14, "elapsed_time": "1:56:37", "remaining_time": "19:19:19"} +{"current_steps": 690, "total_steps": 7494, "loss": 0.6253, "lr": 0.0001378, "epoch": 0.18414731785428343, "percentage": 9.21, "elapsed_time": "1:57:18", "remaining_time": "19:16:42"} +{"current_steps": 695, "total_steps": 7494, "loss": 0.625, "lr": 0.00013879999999999999, "epoch": 0.18548171870829996, "percentage": 9.27, "elapsed_time": "1:57:53", "remaining_time": "19:13:14"} +{"current_steps": 700, "total_steps": 7494, "loss": 0.6324, "lr": 0.00013979999999999998, "epoch": 0.18681611956231653, "percentage": 9.34, "elapsed_time": "1:58:44", "remaining_time": "19:12:31"} +{"current_steps": 705, "total_steps": 7494, "loss": 0.6318, "lr": 0.00014079999999999998, "epoch": 0.18815052041633307, "percentage": 9.41, "elapsed_time": "1:59:49", "remaining_time": "19:13:49"} +{"current_steps": 710, "total_steps": 7494, "loss": 0.6333, "lr": 0.0001418, "epoch": 0.1894849212703496, "percentage": 9.47, "elapsed_time": "2:00:25", "remaining_time": "19:10:40"} +{"current_steps": 715, "total_steps": 7494, "loss": 0.624, "lr": 0.00014279999999999997, "epoch": 0.19081932212436617, "percentage": 9.54, "elapsed_time": "2:01:04", "remaining_time": "19:07:59"} +{"current_steps": 720, "total_steps": 7494, "loss": 0.6072, "lr": 0.0001438, "epoch": 0.1921537229783827, "percentage": 9.61, "elapsed_time": "2:02:01", "remaining_time": "19:07:59"} +{"current_steps": 725, "total_steps": 7494, "loss": 0.6215, "lr": 0.0001448, "epoch": 0.19348812383239924, "percentage": 9.67, "elapsed_time": "2:02:47", "remaining_time": "19:06:25"} +{"current_steps": 730, "total_steps": 7494, "loss": 0.6339, "lr": 0.0001458, "epoch": 0.1948225246864158, "percentage": 9.74, "elapsed_time": "2:03:21", "remaining_time": "19:03:01"} +{"current_steps": 735, "total_steps": 7494, "loss": 0.6278, "lr": 0.0001468, "epoch": 0.19615692554043235, "percentage": 9.81, "elapsed_time": "2:04:07", "remaining_time": "19:01:30"} +{"current_steps": 740, "total_steps": 7494, "loss": 0.6382, "lr": 0.0001478, "epoch": 0.19749132639444889, "percentage": 9.87, "elapsed_time": "2:05:06", "remaining_time": "19:01:54"} +{"current_steps": 745, "total_steps": 7494, "loss": 0.6266, "lr": 0.00014879999999999998, "epoch": 0.19882572724846545, "percentage": 9.94, "elapsed_time": "2:05:48", "remaining_time": "18:59:41"} +{"current_steps": 750, "total_steps": 7494, "loss": 0.6311, "lr": 0.00014979999999999998, "epoch": 0.200160128102482, "percentage": 10.01, "elapsed_time": "2:06:24", "remaining_time": "18:56:36"} +{"current_steps": 755, "total_steps": 7494, "loss": 0.6291, "lr": 0.00014999986979857214, "epoch": 0.20149452895649853, "percentage": 10.07, "elapsed_time": "2:07:13", "remaining_time": "18:55:39"} +{"current_steps": 760, "total_steps": 7494, "loss": 0.6301, "lr": 0.00014999934085604638, "epoch": 0.2028289298105151, "percentage": 10.14, "elapsed_time": "2:08:06", "remaining_time": "18:55:05"} +{"current_steps": 765, "total_steps": 7494, "loss": 0.6316, "lr": 0.00014999840503770068, "epoch": 0.20416333066453163, "percentage": 10.21, "elapsed_time": "2:08:45", "remaining_time": "18:52:31"} +{"current_steps": 770, "total_steps": 7494, "loss": 0.643, "lr": 0.00014999706234861205, "epoch": 0.20549773151854817, "percentage": 10.27, "elapsed_time": "2:09:23", "remaining_time": "18:49:55"} +{"current_steps": 775, "total_steps": 7494, "loss": 0.6354, "lr": 0.00014999531279606457, "epoch": 0.20683213237256473, "percentage": 10.34, "elapsed_time": "2:10:17", "remaining_time": "18:49:34"} +{"current_steps": 780, "total_steps": 7494, "loss": 0.6348, "lr": 0.00014999315638954965, "epoch": 0.20816653322658127, "percentage": 10.41, "elapsed_time": "2:11:07", "remaining_time": "18:48:42"} +{"current_steps": 785, "total_steps": 7494, "loss": 0.6352, "lr": 0.000149990593140766, "epoch": 0.2095009340805978, "percentage": 10.48, "elapsed_time": "2:11:44", "remaining_time": "18:45:52"} +{"current_steps": 790, "total_steps": 7494, "loss": 0.6319, "lr": 0.00014998762306361933, "epoch": 0.21083533493461437, "percentage": 10.54, "elapsed_time": "2:12:26", "remaining_time": "18:43:52"} +{"current_steps": 795, "total_steps": 7494, "loss": 0.6247, "lr": 0.00014998424617422253, "epoch": 0.2121697357886309, "percentage": 10.61, "elapsed_time": "2:13:20", "remaining_time": "18:43:36"} +{"current_steps": 800, "total_steps": 7494, "loss": 0.6309, "lr": 0.00014998046249089538, "epoch": 0.21350413664264745, "percentage": 10.68, "elapsed_time": "2:14:05", "remaining_time": "18:42:03"} +{"current_steps": 805, "total_steps": 7494, "loss": 0.6271, "lr": 0.00014997627203416458, "epoch": 0.214838537496664, "percentage": 10.74, "elapsed_time": "2:14:51", "remaining_time": "18:40:33"} +{"current_steps": 810, "total_steps": 7494, "loss": 0.6284, "lr": 0.00014997167482676366, "epoch": 0.21617293835068055, "percentage": 10.81, "elapsed_time": "2:15:38", "remaining_time": "18:39:17"} +{"current_steps": 815, "total_steps": 7494, "loss": 0.6265, "lr": 0.00014996667089363272, "epoch": 0.2175073392046971, "percentage": 10.88, "elapsed_time": "2:16:34", "remaining_time": "18:39:14"} +{"current_steps": 820, "total_steps": 7494, "loss": 0.6424, "lr": 0.00014996126026191832, "epoch": 0.21884174005871362, "percentage": 10.94, "elapsed_time": "2:17:15", "remaining_time": "18:37:05"} +{"current_steps": 825, "total_steps": 7494, "loss": 0.6283, "lr": 0.00014995544296097355, "epoch": 0.2201761409127302, "percentage": 11.01, "elapsed_time": "2:17:53", "remaining_time": "18:34:41"} +{"current_steps": 830, "total_steps": 7494, "loss": 0.6302, "lr": 0.00014994921902235757, "epoch": 0.22151054176674673, "percentage": 11.08, "elapsed_time": "2:18:44", "remaining_time": "18:33:54"} +{"current_steps": 835, "total_steps": 7494, "loss": 0.6197, "lr": 0.0001499425884798356, "epoch": 0.22284494262076326, "percentage": 11.14, "elapsed_time": "2:19:36", "remaining_time": "18:33:22"} +{"current_steps": 840, "total_steps": 7494, "loss": 0.63, "lr": 0.00014993555136937872, "epoch": 0.22417934347477983, "percentage": 11.21, "elapsed_time": "2:20:15", "remaining_time": "18:31:00"} +{"current_steps": 845, "total_steps": 7494, "loss": 0.636, "lr": 0.0001499281077291637, "epoch": 0.22551374432879637, "percentage": 11.28, "elapsed_time": "2:20:56", "remaining_time": "18:29:04"} +{"current_steps": 850, "total_steps": 7494, "loss": 0.6516, "lr": 0.00014992025759957267, "epoch": 0.2268481451828129, "percentage": 11.34, "elapsed_time": "2:21:48", "remaining_time": "18:28:27"} +{"current_steps": 855, "total_steps": 7494, "loss": 0.6251, "lr": 0.0001499120010231931, "epoch": 0.22818254603682947, "percentage": 11.41, "elapsed_time": "2:22:36", "remaining_time": "18:27:20"} +{"current_steps": 860, "total_steps": 7494, "loss": 0.6276, "lr": 0.00014990333804481738, "epoch": 0.229516946890846, "percentage": 11.48, "elapsed_time": "2:23:14", "remaining_time": "18:24:55"} +{"current_steps": 865, "total_steps": 7494, "loss": 0.6279, "lr": 0.00014989426871144266, "epoch": 0.23085134774486255, "percentage": 11.54, "elapsed_time": "2:23:59", "remaining_time": "18:23:29"} +{"current_steps": 870, "total_steps": 7494, "loss": 0.6138, "lr": 0.00014988479307227062, "epoch": 0.2321857485988791, "percentage": 11.61, "elapsed_time": "2:24:52", "remaining_time": "18:23:05"} +{"current_steps": 875, "total_steps": 7494, "loss": 0.6296, "lr": 0.00014987491117870717, "epoch": 0.23352014945289565, "percentage": 11.68, "elapsed_time": "2:25:37", "remaining_time": "18:21:31"} +{"current_steps": 880, "total_steps": 7494, "loss": 0.6174, "lr": 0.00014986462308436214, "epoch": 0.23485455030691219, "percentage": 11.74, "elapsed_time": "2:26:15", "remaining_time": "18:19:17"} +{"current_steps": 885, "total_steps": 7494, "loss": 0.6305, "lr": 0.00014985392884504903, "epoch": 0.23618895116092875, "percentage": 11.81, "elapsed_time": "2:27:03", "remaining_time": "18:18:13"} +{"current_steps": 890, "total_steps": 7494, "loss": 0.6277, "lr": 0.00014984282851878477, "epoch": 0.2375233520149453, "percentage": 11.88, "elapsed_time": "2:28:00", "remaining_time": "18:18:14"} +{"current_steps": 895, "total_steps": 7494, "loss": 0.6276, "lr": 0.00014983132216578923, "epoch": 0.23885775286896183, "percentage": 11.94, "elapsed_time": "2:28:42", "remaining_time": "18:16:28"} +{"current_steps": 900, "total_steps": 7494, "loss": 0.6095, "lr": 0.00014981940984848508, "epoch": 0.2401921537229784, "percentage": 12.01, "elapsed_time": "2:29:24", "remaining_time": "18:14:37"} +{"current_steps": 805, "total_steps": 7494, "loss": 0.627, "lr": 0.00014997627203416458, "epoch": 0.214838537496664, "percentage": 10.74, "elapsed_time": "0:07:18", "remaining_time": "1:00:45"} +{"current_steps": 810, "total_steps": 7494, "loss": 0.6285, "lr": 0.00014997167482676366, "epoch": 0.21617293835068055, "percentage": 10.81, "elapsed_time": "0:08:24", "remaining_time": "1:09:25"} +{"current_steps": 815, "total_steps": 7494, "loss": 0.6266, "lr": 0.00014996667089363272, "epoch": 0.2175073392046971, "percentage": 10.88, "elapsed_time": "0:09:32", "remaining_time": "1:18:08"} +{"current_steps": 820, "total_steps": 7494, "loss": 0.6425, "lr": 0.00014996126026191832, "epoch": 0.21884174005871362, "percentage": 10.94, "elapsed_time": "0:10:38", "remaining_time": "1:26:39"} +{"current_steps": 825, "total_steps": 7494, "loss": 0.6282, "lr": 0.00014995544296097355, "epoch": 0.2201761409127302, "percentage": 11.01, "elapsed_time": "0:11:20", "remaining_time": "1:31:44"} +{"current_steps": 830, "total_steps": 7494, "loss": 0.6304, "lr": 0.00014994921902235757, "epoch": 0.22151054176674673, "percentage": 11.08, "elapsed_time": "0:11:59", "remaining_time": "1:36:16"} +{"current_steps": 835, "total_steps": 7494, "loss": 0.62, "lr": 0.0001499425884798356, "epoch": 0.22284494262076326, "percentage": 11.14, "elapsed_time": "0:12:59", "remaining_time": "1:43:37"} +{"current_steps": 840, "total_steps": 7494, "loss": 0.6298, "lr": 0.00014993555136937872, "epoch": 0.22417934347477983, "percentage": 11.21, "elapsed_time": "0:13:36", "remaining_time": "1:47:47"} +{"current_steps": 845, "total_steps": 7494, "loss": 0.6358, "lr": 0.0001499281077291637, "epoch": 0.22551374432879637, "percentage": 11.28, "elapsed_time": "0:14:11", "remaining_time": "1:51:42"} +{"current_steps": 850, "total_steps": 7494, "loss": 0.6569, "lr": 0.00014992025759957267, "epoch": 0.2268481451828129, "percentage": 11.34, "elapsed_time": "0:15:12", "remaining_time": "1:58:49"} +{"current_steps": 855, "total_steps": 7494, "loss": 0.6297, "lr": 0.0001499120010231931, "epoch": 0.22818254603682947, "percentage": 11.41, "elapsed_time": "0:15:45", "remaining_time": "2:02:18"} +{"current_steps": 860, "total_steps": 7494, "loss": 0.6312, "lr": 0.00014990333804481738, "epoch": 0.229516946890846, "percentage": 11.48, "elapsed_time": "0:16:18", "remaining_time": "2:05:45"} +{"current_steps": 865, "total_steps": 7494, "loss": 0.6304, "lr": 0.00014989426871144266, "epoch": 0.23085134774486255, "percentage": 11.54, "elapsed_time": "0:17:10", "remaining_time": "2:11:35"} +{"current_steps": 870, "total_steps": 7494, "loss": 0.6153, "lr": 0.00014988479307227062, "epoch": 0.2321857485988791, "percentage": 11.61, "elapsed_time": "0:17:46", "remaining_time": "2:15:21"} +{"current_steps": 875, "total_steps": 7494, "loss": 0.632, "lr": 0.00014987491117870717, "epoch": 0.23352014945289565, "percentage": 11.68, "elapsed_time": "0:18:18", "remaining_time": "2:18:33"} +{"current_steps": 880, "total_steps": 7494, "loss": 0.619, "lr": 0.00014986462308436214, "epoch": 0.23485455030691219, "percentage": 11.74, "elapsed_time": "0:18:52", "remaining_time": "2:21:54"} +{"current_steps": 885, "total_steps": 7494, "loss": 0.6327, "lr": 0.00014985392884504903, "epoch": 0.23618895116092875, "percentage": 11.81, "elapsed_time": "0:19:49", "remaining_time": "2:28:04"} +{"current_steps": 890, "total_steps": 7494, "loss": 0.6277, "lr": 0.00014984282851878477, "epoch": 0.2375233520149453, "percentage": 11.88, "elapsed_time": "0:20:20", "remaining_time": "2:31:00"} +{"current_steps": 895, "total_steps": 7494, "loss": 0.6277, "lr": 0.00014983132216578923, "epoch": 0.23885775286896183, "percentage": 11.94, "elapsed_time": "0:20:52", "remaining_time": "2:33:57"} +{"current_steps": 900, "total_steps": 7494, "loss": 0.6095, "lr": 0.00014981940984848508, "epoch": 0.2401921537229784, "percentage": 12.01, "elapsed_time": "0:21:52", "remaining_time": "2:40:12"} +{"current_steps": 905, "total_steps": 7494, "loss": 0.6352, "lr": 0.00014980709163149732, "epoch": 0.24152655457699493, "percentage": 12.08, "elapsed_time": "0:22:30", "remaining_time": "2:43:52"} +{"current_steps": 910, "total_steps": 7494, "loss": 0.6286, "lr": 0.000149794367581653, "epoch": 0.24286095543101147, "percentage": 12.14, "elapsed_time": "0:23:02", "remaining_time": "2:46:41"} +{"current_steps": 915, "total_steps": 7494, "loss": 0.6189, "lr": 0.00014978123776798082, "epoch": 0.24419535628502803, "percentage": 12.21, "elapsed_time": "0:23:55", "remaining_time": "2:52:03"} +{"current_steps": 920, "total_steps": 7494, "loss": 0.6211, "lr": 0.00014976770226171084, "epoch": 0.24552975713904457, "percentage": 12.28, "elapsed_time": "0:24:36", "remaining_time": "2:55:47"} +{"current_steps": 925, "total_steps": 7494, "loss": 0.6243, "lr": 0.00014975376113627394, "epoch": 0.2468641579930611, "percentage": 12.34, "elapsed_time": "0:25:07", "remaining_time": "2:58:28"} +{"current_steps": 930, "total_steps": 7494, "loss": 0.6417, "lr": 0.00014973941446730154, "epoch": 0.24819855884707767, "percentage": 12.41, "elapsed_time": "0:25:44", "remaining_time": "3:01:38"} +{"current_steps": 935, "total_steps": 7494, "loss": 0.6268, "lr": 0.00014972466233262517, "epoch": 0.2495329597010942, "percentage": 12.48, "elapsed_time": "0:26:42", "remaining_time": "3:07:22"} +{"current_steps": 940, "total_steps": 7494, "loss": 0.6271, "lr": 0.00014970950481227603, "epoch": 0.2508673605551108, "percentage": 12.54, "elapsed_time": "0:27:13", "remaining_time": "3:09:52"} +{"current_steps": 945, "total_steps": 7494, "loss": 0.6291, "lr": 0.00014969394198848456, "epoch": 0.2522017614091273, "percentage": 12.61, "elapsed_time": "0:27:45", "remaining_time": "3:12:21"} +{"current_steps": 950, "total_steps": 7494, "loss": 0.6102, "lr": 0.00014967797394567993, "epoch": 0.25353616226314385, "percentage": 12.68, "elapsed_time": "0:28:49", "remaining_time": "3:18:36"} +{"current_steps": 955, "total_steps": 7494, "loss": 0.6088, "lr": 0.00014966160077048982, "epoch": 0.2548705631171604, "percentage": 12.74, "elapsed_time": "0:29:23", "remaining_time": "3:21:16"} +{"current_steps": 960, "total_steps": 7494, "loss": 0.6355, "lr": 0.00014964482255173958, "epoch": 0.2562049639711769, "percentage": 12.81, "elapsed_time": "0:29:56", "remaining_time": "3:23:46"} +{"current_steps": 965, "total_steps": 7494, "loss": 0.6343, "lr": 0.00014962763938045206, "epoch": 0.25753936482519346, "percentage": 12.88, "elapsed_time": "0:30:43", "remaining_time": "3:27:49"} +{"current_steps": 970, "total_steps": 7494, "loss": 0.6238, "lr": 0.00014961005134984693, "epoch": 0.25887376567921005, "percentage": 12.94, "elapsed_time": "0:31:35", "remaining_time": "3:32:25"} +{"current_steps": 975, "total_steps": 7494, "loss": 0.6215, "lr": 0.00014959205855534036, "epoch": 0.2602081665332266, "percentage": 13.01, "elapsed_time": "0:32:07", "remaining_time": "3:34:47"} +{"current_steps": 980, "total_steps": 7494, "loss": 0.6165, "lr": 0.00014957366109454427, "epoch": 0.26154256738724313, "percentage": 13.08, "elapsed_time": "0:32:41", "remaining_time": "3:37:18"} +{"current_steps": 985, "total_steps": 7494, "loss": 0.631, "lr": 0.00014955485906726596, "epoch": 0.26287696824125967, "percentage": 13.14, "elapsed_time": "0:33:46", "remaining_time": "3:43:11"} +{"current_steps": 990, "total_steps": 7494, "loss": 0.6403, "lr": 0.00014953565257550756, "epoch": 0.2642113690952762, "percentage": 13.21, "elapsed_time": "0:34:18", "remaining_time": "3:45:26"} +{"current_steps": 995, "total_steps": 7494, "loss": 0.6321, "lr": 0.00014951604172346535, "epoch": 0.26554576994929274, "percentage": 13.28, "elapsed_time": "0:34:51", "remaining_time": "3:47:39"} +{"current_steps": 1000, "total_steps": 7494, "loss": 0.6361, "lr": 0.00014949602661752944, "epoch": 0.26688017080330934, "percentage": 13.34, "elapsed_time": "0:35:45", "remaining_time": "3:52:11"} +{"current_steps": 1005, "total_steps": 7494, "loss": 0.6048, "lr": 0.0001494756073662829, "epoch": 0.2682145716573259, "percentage": 13.41, "elapsed_time": "0:36:35", "remaining_time": "3:56:13"} +{"current_steps": 1010, "total_steps": 7494, "loss": 0.6241, "lr": 0.00014945478408050135, "epoch": 0.2695489725113424, "percentage": 13.48, "elapsed_time": "0:37:06", "remaining_time": "3:58:15"} +{"current_steps": 1015, "total_steps": 7494, "loss": 0.6346, "lr": 0.00014943355687315239, "epoch": 0.27088337336535895, "percentage": 13.54, "elapsed_time": "0:37:43", "remaining_time": "4:00:47"} +{"current_steps": 1020, "total_steps": 7494, "loss": 0.6198, "lr": 0.0001494119258593948, "epoch": 0.2722177742193755, "percentage": 13.61, "elapsed_time": "0:38:46", "remaining_time": "4:06:06"} +{"current_steps": 1025, "total_steps": 7494, "loss": 0.6438, "lr": 0.00014938989115657815, "epoch": 0.273552175073392, "percentage": 13.68, "elapsed_time": "0:39:18", "remaining_time": "4:08:05"} +{"current_steps": 1030, "total_steps": 7494, "loss": 0.6411, "lr": 0.00014936745288424198, "epoch": 0.2748865759274086, "percentage": 13.74, "elapsed_time": "0:39:50", "remaining_time": "4:09:59"} +{"current_steps": 1035, "total_steps": 7494, "loss": 0.6388, "lr": 0.0001493446111641152, "epoch": 0.27622097678142515, "percentage": 13.81, "elapsed_time": "0:40:49", "remaining_time": "4:14:46"} +{"current_steps": 1040, "total_steps": 7494, "loss": 0.619, "lr": 0.00014932136612011554, "epoch": 0.2775553776354417, "percentage": 13.88, "elapsed_time": "0:41:28", "remaining_time": "4:17:22"} +{"current_steps": 1045, "total_steps": 7494, "loss": 0.6239, "lr": 0.00014929771787834868, "epoch": 0.27888977848945823, "percentage": 13.94, "elapsed_time": "0:41:59", "remaining_time": "4:19:09"} +{"current_steps": 1050, "total_steps": 7494, "loss": 0.6361, "lr": 0.00014927366656710772, "epoch": 0.28022417934347477, "percentage": 14.01, "elapsed_time": "0:42:40", "remaining_time": "4:21:54"} +{"current_steps": 1055, "total_steps": 7494, "loss": 0.6446, "lr": 0.00014924921231687245, "epoch": 0.2815585801974913, "percentage": 14.08, "elapsed_time": "0:43:41", "remaining_time": "4:26:39"} +{"current_steps": 1060, "total_steps": 7494, "loss": 0.6279, "lr": 0.0001492243552603086, "epoch": 0.2828929810515079, "percentage": 14.14, "elapsed_time": "0:44:13", "remaining_time": "4:28:25"} +{"current_steps": 1065, "total_steps": 7494, "loss": 0.629, "lr": 0.00014919909553226716, "epoch": 0.28422738190552443, "percentage": 14.21, "elapsed_time": "0:44:45", "remaining_time": "4:30:09"} +{"current_steps": 1070, "total_steps": 7494, "loss": 0.626, "lr": 0.00014917343326978366, "epoch": 0.28556178275954097, "percentage": 14.28, "elapsed_time": "0:45:50", "remaining_time": "4:35:10"} +{"current_steps": 1075, "total_steps": 7494, "loss": 0.614, "lr": 0.00014914736861207733, "epoch": 0.2868961836135575, "percentage": 14.34, "elapsed_time": "0:46:26", "remaining_time": "4:37:20"} +{"current_steps": 1080, "total_steps": 7494, "loss": 0.634, "lr": 0.0001491209017005505, "epoch": 0.28823058446757405, "percentage": 14.41, "elapsed_time": "0:46:58", "remaining_time": "4:38:56"} +{"current_steps": 1085, "total_steps": 7494, "loss": 0.6226, "lr": 0.00014909403267878771, "epoch": 0.2895649853215906, "percentage": 14.48, "elapsed_time": "0:47:39", "remaining_time": "4:41:33"} +{"current_steps": 1090, "total_steps": 7494, "loss": 0.6507, "lr": 0.000149066761692555, "epoch": 0.2908993861756072, "percentage": 14.54, "elapsed_time": "0:48:40", "remaining_time": "4:45:58"} +{"current_steps": 1095, "total_steps": 7494, "loss": 0.6703, "lr": 0.00014903908888979904, "epoch": 0.2922337870296237, "percentage": 14.61, "elapsed_time": "0:49:12", "remaining_time": "4:47:31"} +{"current_steps": 1100, "total_steps": 7494, "loss": 0.6394, "lr": 0.00014901101442064637, "epoch": 0.29356818788364025, "percentage": 14.68, "elapsed_time": "0:49:43", "remaining_time": "4:49:03"} +{"current_steps": 1105, "total_steps": 7494, "loss": 0.6191, "lr": 0.00014898253843740271, "epoch": 0.2949025887376568, "percentage": 14.75, "elapsed_time": "0:50:59", "remaining_time": "4:54:48"} +{"current_steps": 1110, "total_steps": 7494, "loss": 0.6227, "lr": 0.00014895366109455189, "epoch": 0.2962369895916733, "percentage": 14.81, "elapsed_time": "0:51:39", "remaining_time": "4:57:05"} +{"current_steps": 1115, "total_steps": 7494, "loss": 0.6332, "lr": 0.00014892438254875522, "epoch": 0.29757139044568987, "percentage": 14.88, "elapsed_time": "0:52:10", "remaining_time": "4:58:32"} +{"current_steps": 1120, "total_steps": 7494, "loss": 0.6263, "lr": 0.00014889470295885047, "epoch": 0.29890579129970646, "percentage": 14.95, "elapsed_time": "0:52:54", "remaining_time": "5:01:06"} +{"current_steps": 1125, "total_steps": 7494, "loss": 0.622, "lr": 0.0001488646224858512, "epoch": 0.300240192153723, "percentage": 15.01, "elapsed_time": "0:53:56", "remaining_time": "5:05:21"} +{"current_steps": 1130, "total_steps": 7494, "loss": 0.6249, "lr": 0.00014883414129294575, "epoch": 0.30157459300773953, "percentage": 15.08, "elapsed_time": "0:54:28", "remaining_time": "5:06:47"} +{"current_steps": 1135, "total_steps": 7494, "loss": 0.6111, "lr": 0.00014880325954549635, "epoch": 0.30290899386175607, "percentage": 15.15, "elapsed_time": "0:55:00", "remaining_time": "5:08:13"} +{"current_steps": 1140, "total_steps": 7494, "loss": 0.6169, "lr": 0.00014877197741103827, "epoch": 0.3042433947157726, "percentage": 15.21, "elapsed_time": "0:56:03", "remaining_time": "5:12:26"} +{"current_steps": 1145, "total_steps": 7494, "loss": 0.628, "lr": 0.00014874029505927897, "epoch": 0.30557779556978915, "percentage": 15.28, "elapsed_time": "0:56:43", "remaining_time": "5:14:34"} +{"current_steps": 1150, "total_steps": 7494, "loss": 0.6389, "lr": 0.00014870821266209705, "epoch": 0.30691219642380574, "percentage": 15.35, "elapsed_time": "0:57:15", "remaining_time": "5:15:52"} +{"current_steps": 1155, "total_steps": 7494, "loss": 0.636, "lr": 0.00014867573039354138, "epoch": 0.3082465972778223, "percentage": 15.41, "elapsed_time": "0:57:58", "remaining_time": "5:18:12"} +{"current_steps": 1160, "total_steps": 7494, "loss": 0.6384, "lr": 0.00014864284842983018, "epoch": 0.3095809981318388, "percentage": 15.48, "elapsed_time": "0:59:00", "remaining_time": "5:22:09"} +{"current_steps": 1165, "total_steps": 7494, "loss": 0.6175, "lr": 0.00014860956694935003, "epoch": 0.31091539898585535, "percentage": 15.55, "elapsed_time": "0:59:32", "remaining_time": "5:23:27"} +{"current_steps": 1170, "total_steps": 7494, "loss": 0.611, "lr": 0.0001485758861326549, "epoch": 0.3122497998398719, "percentage": 15.61, "elapsed_time": "1:00:05", "remaining_time": "5:24:47"} +{"current_steps": 1175, "total_steps": 7494, "loss": 0.6145, "lr": 0.00014854180616246523, "epoch": 0.3135842006938884, "percentage": 15.68, "elapsed_time": "1:01:06", "remaining_time": "5:28:37"} +{"current_steps": 1180, "total_steps": 7494, "loss": 0.6354, "lr": 0.00014850732722366682, "epoch": 0.31491860154790496, "percentage": 15.75, "elapsed_time": "1:01:52", "remaining_time": "5:31:02"} +{"current_steps": 1185, "total_steps": 7494, "loss": 0.627, "lr": 0.00014847244950330998, "epoch": 0.31625300240192156, "percentage": 15.81, "elapsed_time": "1:02:24", "remaining_time": "5:32:14"} +{"current_steps": 1190, "total_steps": 7494, "loss": 0.6318, "lr": 0.00014843717319060833, "epoch": 0.3175874032559381, "percentage": 15.88, "elapsed_time": "1:03:04", "remaining_time": "5:34:09"} +{"current_steps": 1195, "total_steps": 7494, "loss": 0.6272, "lr": 0.00014840149847693794, "epoch": 0.31892180410995463, "percentage": 15.95, "elapsed_time": "1:04:07", "remaining_time": "5:37:59"} +{"current_steps": 1200, "total_steps": 7494, "loss": 0.6184, "lr": 0.00014836542555583628, "epoch": 0.32025620496397117, "percentage": 16.01, "elapsed_time": "1:04:41", "remaining_time": "5:39:18"} +{"current_steps": 1205, "total_steps": 7494, "loss": 0.6301, "lr": 0.000148328954623001, "epoch": 0.3215906058179877, "percentage": 16.08, "elapsed_time": "1:05:24", "remaining_time": "5:41:19"} +{"current_steps": 1210, "total_steps": 7494, "loss": 0.6165, "lr": 0.00014829208587628908, "epoch": 0.32292500667200424, "percentage": 16.15, "elapsed_time": "1:06:23", "remaining_time": "5:44:46"} +{"current_steps": 1215, "total_steps": 7494, "loss": 0.6172, "lr": 0.0001482548195157156, "epoch": 0.32425940752602084, "percentage": 16.21, "elapsed_time": "1:07:47", "remaining_time": "5:50:21"} +{"current_steps": 1220, "total_steps": 7494, "loss": 0.6091, "lr": 0.00014821715574345277, "epoch": 0.3255938083800374, "percentage": 16.28, "elapsed_time": "1:08:20", "remaining_time": "5:51:27"} +{"current_steps": 1225, "total_steps": 7494, "loss": 0.6176, "lr": 0.0001481790947638288, "epoch": 0.3269282092340539, "percentage": 16.35, "elapsed_time": "1:08:59", "remaining_time": "5:53:04"} +{"current_steps": 1230, "total_steps": 7494, "loss": 0.6144, "lr": 0.00014814063678332667, "epoch": 0.32826261008807045, "percentage": 16.41, "elapsed_time": "1:10:03", "remaining_time": "5:56:46"} +{"current_steps": 1235, "total_steps": 7494, "loss": 0.6105, "lr": 0.00014810178201058323, "epoch": 0.329597010942087, "percentage": 16.48, "elapsed_time": "1:10:40", "remaining_time": "5:58:12"} +{"current_steps": 1240, "total_steps": 7494, "loss": 0.6111, "lr": 0.00014806253065638786, "epoch": 0.3309314117961035, "percentage": 16.55, "elapsed_time": "1:11:13", "remaining_time": "5:59:14"} +{"current_steps": 1245, "total_steps": 7494, "loss": 0.6128, "lr": 0.00014802288293368148, "epoch": 0.3322658126501201, "percentage": 16.61, "elapsed_time": "1:12:06", "remaining_time": "6:01:58"} +{"current_steps": 1250, "total_steps": 7494, "loss": 0.6247, "lr": 0.0001479828390575553, "epoch": 0.33360021350413666, "percentage": 16.68, "elapsed_time": "1:13:00", "remaining_time": "6:04:41"} +{"current_steps": 1255, "total_steps": 7494, "loss": 0.6225, "lr": 0.00014794239924524968, "epoch": 0.3349346143581532, "percentage": 16.75, "elapsed_time": "1:13:33", "remaining_time": "6:05:42"} +{"current_steps": 1260, "total_steps": 7494, "loss": 0.6246, "lr": 0.00014790156371615303, "epoch": 0.33626901521216973, "percentage": 16.81, "elapsed_time": "1:14:09", "remaining_time": "6:06:53"} +{"current_steps": 1265, "total_steps": 7494, "loss": 0.6068, "lr": 0.00014786033269180044, "epoch": 0.33760341606618627, "percentage": 16.88, "elapsed_time": "1:15:11", "remaining_time": "6:10:14"} +{"current_steps": 1270, "total_steps": 7494, "loss": 0.6282, "lr": 0.00014781870639587262, "epoch": 0.3389378169202028, "percentage": 16.95, "elapsed_time": "1:15:56", "remaining_time": "6:12:08"} +{"current_steps": 1275, "total_steps": 7494, "loss": 0.6341, "lr": 0.0001477766850541947, "epoch": 0.3402722177742194, "percentage": 17.01, "elapsed_time": "1:16:28", "remaining_time": "6:13:01"} +{"current_steps": 1280, "total_steps": 7494, "loss": 0.629, "lr": 0.00014773426889473493, "epoch": 0.34160661862823594, "percentage": 17.08, "elapsed_time": "1:17:16", "remaining_time": "6:15:10"} +{"current_steps": 1285, "total_steps": 7494, "loss": 0.6411, "lr": 0.0001476914581476034, "epoch": 0.3429410194822525, "percentage": 17.15, "elapsed_time": "1:18:18", "remaining_time": "6:18:20"} +{"current_steps": 1290, "total_steps": 7494, "loss": 0.616, "lr": 0.000147648253045051, "epoch": 0.344275420336269, "percentage": 17.21, "elapsed_time": "1:18:52", "remaining_time": "6:19:22"} +{"current_steps": 1295, "total_steps": 7494, "loss": 0.6124, "lr": 0.0001476046538214679, "epoch": 0.34560982119028555, "percentage": 17.28, "elapsed_time": "1:19:26", "remaining_time": "6:20:16"} +{"current_steps": 1300, "total_steps": 7494, "loss": 0.6378, "lr": 0.00014756066071338247, "epoch": 0.3469442220443021, "percentage": 17.35, "elapsed_time": "1:20:22", "remaining_time": "6:22:59"} +{"current_steps": 1305, "total_steps": 7494, "loss": 0.6217, "lr": 0.00014751627395945984, "epoch": 0.3482786228983187, "percentage": 17.41, "elapsed_time": "1:21:21", "remaining_time": "6:25:49"} +{"current_steps": 1310, "total_steps": 7494, "loss": 0.6174, "lr": 0.0001474714938005008, "epoch": 0.3496130237523352, "percentage": 17.48, "elapsed_time": "1:21:54", "remaining_time": "6:26:37"} +{"current_steps": 1315, "total_steps": 7494, "loss": 0.637, "lr": 0.00014742632047944033, "epoch": 0.35094742460635175, "percentage": 17.55, "elapsed_time": "1:22:34", "remaining_time": "6:28:01"} +{"current_steps": 1320, "total_steps": 7494, "loss": 0.6263, "lr": 0.00014738075424134634, "epoch": 0.3522818254603683, "percentage": 17.61, "elapsed_time": "1:23:35", "remaining_time": "6:30:56"} +{"current_steps": 1325, "total_steps": 7494, "loss": 0.6195, "lr": 0.00014733479533341837, "epoch": 0.35361622631438483, "percentage": 17.68, "elapsed_time": "1:24:14", "remaining_time": "6:32:10"} +{"current_steps": 1330, "total_steps": 7494, "loss": 0.6254, "lr": 0.00014728844400498616, "epoch": 0.35495062716840137, "percentage": 17.75, "elapsed_time": "1:24:46", "remaining_time": "6:32:55"} +{"current_steps": 1335, "total_steps": 7494, "loss": 0.6215, "lr": 0.00014724170050750836, "epoch": 0.35628502802241796, "percentage": 17.81, "elapsed_time": "1:25:38", "remaining_time": "6:35:06"} +{"current_steps": 1340, "total_steps": 7494, "loss": 0.6297, "lr": 0.00014719456509457122, "epoch": 0.3576194288764345, "percentage": 17.88, "elapsed_time": "1:26:32", "remaining_time": "6:37:27"} +{"current_steps": 1345, "total_steps": 7494, "loss": 0.6265, "lr": 0.00014714703802188713, "epoch": 0.35895382973045104, "percentage": 17.95, "elapsed_time": "1:27:06", "remaining_time": "6:38:16"} +{"current_steps": 1350, "total_steps": 7494, "loss": 0.6318, "lr": 0.0001470991195472932, "epoch": 0.3602882305844676, "percentage": 18.01, "elapsed_time": "1:27:43", "remaining_time": "6:39:14"} +{"current_steps": 1355, "total_steps": 7494, "loss": 0.6186, "lr": 0.00014705080993075, "epoch": 0.3616226314384841, "percentage": 18.08, "elapsed_time": "1:28:41", "remaining_time": "6:41:48"} +{"current_steps": 1360, "total_steps": 7494, "loss": 0.6284, "lr": 0.00014700210943433998, "epoch": 0.36295703229250065, "percentage": 18.15, "elapsed_time": "1:29:26", "remaining_time": "6:43:24"} +{"current_steps": 1365, "total_steps": 7494, "loss": 0.6353, "lr": 0.00014695301832226627, "epoch": 0.36429143314651724, "percentage": 18.21, "elapsed_time": "1:29:58", "remaining_time": "6:43:58"} +{"current_steps": 1370, "total_steps": 7494, "loss": 0.6165, "lr": 0.00014690353686085098, "epoch": 0.3656258340005338, "percentage": 18.28, "elapsed_time": "1:30:43", "remaining_time": "6:45:33"} +{"current_steps": 1375, "total_steps": 7494, "loss": 0.6232, "lr": 0.00014685366531853395, "epoch": 0.3669602348545503, "percentage": 18.35, "elapsed_time": "1:31:41", "remaining_time": "6:48:02"} +{"current_steps": 1380, "total_steps": 7494, "loss": 0.6233, "lr": 0.00014680340396587118, "epoch": 0.36829463570856685, "percentage": 18.41, "elapsed_time": "1:32:20", "remaining_time": "6:49:05"} +{"current_steps": 1385, "total_steps": 7494, "loss": 0.6084, "lr": 0.0001467527530755335, "epoch": 0.3696290365625834, "percentage": 18.48, "elapsed_time": "1:32:53", "remaining_time": "6:49:42"} +{"current_steps": 1390, "total_steps": 7494, "loss": 0.6202, "lr": 0.000146701712922305, "epoch": 0.37096343741659993, "percentage": 18.55, "elapsed_time": "1:33:46", "remaining_time": "6:51:49"} +{"current_steps": 1395, "total_steps": 7494, "loss": 0.6251, "lr": 0.00014665028378308138, "epoch": 0.37229783827061647, "percentage": 18.61, "elapsed_time": "1:34:39", "remaining_time": "6:53:50"} +{"current_steps": 1400, "total_steps": 7494, "loss": 0.624, "lr": 0.00014659846593686885, "epoch": 0.37363223912463306, "percentage": 18.68, "elapsed_time": "1:35:14", "remaining_time": "6:54:32"} +{"current_steps": 1405, "total_steps": 7494, "loss": 0.6298, "lr": 0.0001465462596647822, "epoch": 0.3749666399786496, "percentage": 18.75, "elapsed_time": "1:36:04", "remaining_time": "6:56:21"} +{"current_steps": 1410, "total_steps": 7494, "loss": 0.6008, "lr": 0.0001464936652500435, "epoch": 0.37630104083266613, "percentage": 18.82, "elapsed_time": "1:37:03", "remaining_time": "6:58:49"} +{"current_steps": 1415, "total_steps": 7494, "loss": 0.6157, "lr": 0.0001464406829779806, "epoch": 0.37763544168668267, "percentage": 18.88, "elapsed_time": "1:37:47", "remaining_time": "7:00:06"} +{"current_steps": 1420, "total_steps": 7494, "loss": 0.6106, "lr": 0.0001463873131360254, "epoch": 0.3789698425406992, "percentage": 18.95, "elapsed_time": "1:38:20", "remaining_time": "7:00:38"} +{"current_steps": 1425, "total_steps": 7494, "loss": 0.6156, "lr": 0.0001463335560137124, "epoch": 0.38030424339471575, "percentage": 19.02, "elapsed_time": "1:39:05", "remaining_time": "7:02:01"} +{"current_steps": 1430, "total_steps": 7494, "loss": 0.6152, "lr": 0.00014627941190267717, "epoch": 0.38163864424873234, "percentage": 19.08, "elapsed_time": "1:39:58", "remaining_time": "7:03:58"} +{"current_steps": 1435, "total_steps": 7494, "loss": 0.6285, "lr": 0.00014622488109665468, "epoch": 0.3829730451027489, "percentage": 19.15, "elapsed_time": "1:40:37", "remaining_time": "7:04:53"} +{"current_steps": 1440, "total_steps": 7494, "loss": 0.6203, "lr": 0.0001461699638914777, "epoch": 0.3843074459567654, "percentage": 19.22, "elapsed_time": "1:41:11", "remaining_time": "7:05:26"} +{"current_steps": 1445, "total_steps": 7494, "loss": 0.616, "lr": 0.00014611466058507536, "epoch": 0.38564184681078195, "percentage": 19.28, "elapsed_time": "1:42:03", "remaining_time": "7:07:15"} +{"current_steps": 1450, "total_steps": 7494, "loss": 0.6251, "lr": 0.00014605897147747132, "epoch": 0.3869762476647985, "percentage": 19.35, "elapsed_time": "1:42:56", "remaining_time": "7:09:07"} +{"current_steps": 1455, "total_steps": 7494, "loss": 0.6302, "lr": 0.0001460028968707822, "epoch": 0.388310648518815, "percentage": 19.42, "elapsed_time": "1:43:32", "remaining_time": "7:09:43"} +{"current_steps": 1460, "total_steps": 7494, "loss": 0.6189, "lr": 0.0001459464370692161, "epoch": 0.3896450493728316, "percentage": 19.48, "elapsed_time": "1:44:12", "remaining_time": "7:10:38"} +{"current_steps": 1465, "total_steps": 7494, "loss": 0.6212, "lr": 0.0001458895923790707, "epoch": 0.39097945022684816, "percentage": 19.55, "elapsed_time": "1:45:09", "remaining_time": "7:12:45"} +{"current_steps": 1470, "total_steps": 7494, "loss": 0.6206, "lr": 0.0001458323631087318, "epoch": 0.3923138510808647, "percentage": 19.62, "elapsed_time": "1:45:55", "remaining_time": "7:14:03"} +{"current_steps": 1475, "total_steps": 7494, "loss": 0.6028, "lr": 0.00014577474956867155, "epoch": 0.39364825193488123, "percentage": 19.68, "elapsed_time": "1:46:29", "remaining_time": "7:14:31"} +{"current_steps": 1480, "total_steps": 7494, "loss": 0.6285, "lr": 0.00014571675207144676, "epoch": 0.39498265278889777, "percentage": 19.75, "elapsed_time": "1:47:14", "remaining_time": "7:15:45"} +{"current_steps": 1485, "total_steps": 7494, "loss": 0.6326, "lr": 0.00014565837093169728, "epoch": 0.3963170536429143, "percentage": 19.82, "elapsed_time": "1:48:09", "remaining_time": "7:17:41"} +{"current_steps": 1490, "total_steps": 7494, "loss": 0.6314, "lr": 0.00014559960646614418, "epoch": 0.3976514544969309, "percentage": 19.88, "elapsed_time": "1:48:51", "remaining_time": "7:18:38"} +{"current_steps": 1495, "total_steps": 7494, "loss": 0.6203, "lr": 0.00014554045899358814, "epoch": 0.39898585535094744, "percentage": 19.95, "elapsed_time": "1:49:26", "remaining_time": "7:19:10"} +{"current_steps": 1500, "total_steps": 7494, "loss": 0.6219, "lr": 0.00014548092883490772, "epoch": 0.400320256204964, "percentage": 20.02, "elapsed_time": "1:50:19", "remaining_time": "7:20:52"} +{"current_steps": 1505, "total_steps": 7494, "loss": 0.6341, "lr": 0.00014542101631305745, "epoch": 0.4016546570589805, "percentage": 20.08, "elapsed_time": "1:51:23", "remaining_time": "7:23:14"} +{"current_steps": 1510, "total_steps": 7494, "loss": 0.616, "lr": 0.00014536072175306628, "epoch": 0.40298905791299705, "percentage": 20.15, "elapsed_time": "1:51:59", "remaining_time": "7:23:49"} +{"current_steps": 1515, "total_steps": 7494, "loss": 0.6096, "lr": 0.00014530004548203573, "epoch": 0.4043234587670136, "percentage": 20.22, "elapsed_time": "1:52:40", "remaining_time": "7:24:40"} +{"current_steps": 1520, "total_steps": 7494, "loss": 0.6363, "lr": 0.00014523898782913818, "epoch": 0.4056578596210302, "percentage": 20.28, "elapsed_time": "1:53:38", "remaining_time": "7:26:37"} +{"current_steps": 1525, "total_steps": 7494, "loss": 0.6225, "lr": 0.00014517754912561496, "epoch": 0.4069922604750467, "percentage": 20.35, "elapsed_time": "1:54:25", "remaining_time": "7:27:50"} +{"current_steps": 1530, "total_steps": 7494, "loss": 0.6092, "lr": 0.00014511572970477457, "epoch": 0.40832666132906326, "percentage": 20.42, "elapsed_time": "1:54:59", "remaining_time": "7:28:14"} +{"current_steps": 1535, "total_steps": 7494, "loss": 0.6212, "lr": 0.00014505352990199107, "epoch": 0.4096610621830798, "percentage": 20.48, "elapsed_time": "1:55:44", "remaining_time": "7:29:18"} +{"current_steps": 1540, "total_steps": 7494, "loss": 0.6203, "lr": 0.000144990950054702, "epoch": 0.41099546303709633, "percentage": 20.55, "elapsed_time": "1:56:38", "remaining_time": "7:30:58"} +{"current_steps": 1545, "total_steps": 7494, "loss": 0.6229, "lr": 0.0001449279905024067, "epoch": 0.41232986389111287, "percentage": 20.62, "elapsed_time": "1:57:21", "remaining_time": "7:31:53"} +{"current_steps": 1550, "total_steps": 7494, "loss": 0.622, "lr": 0.00014486465158666443, "epoch": 0.41366426474512946, "percentage": 20.68, "elapsed_time": "1:57:56", "remaining_time": "7:32:16"} +{"current_steps": 1555, "total_steps": 7494, "loss": 0.6375, "lr": 0.00014480093365109252, "epoch": 0.414998665599146, "percentage": 20.75, "elapsed_time": "1:58:44", "remaining_time": "7:33:28"} +{"current_steps": 1560, "total_steps": 7494, "loss": 0.6183, "lr": 0.00014473683704136454, "epoch": 0.41633306645316254, "percentage": 20.82, "elapsed_time": "1:59:39", "remaining_time": "7:35:11"} +{"current_steps": 1565, "total_steps": 7494, "loss": 0.6182, "lr": 0.0001446723621052083, "epoch": 0.4176674673071791, "percentage": 20.88, "elapsed_time": "2:00:19", "remaining_time": "7:35:50"} +{"current_steps": 1570, "total_steps": 7494, "loss": 0.6069, "lr": 0.00014460750919240416, "epoch": 0.4190018681611956, "percentage": 20.95, "elapsed_time": "2:00:56", "remaining_time": "7:36:19"} +{"current_steps": 1575, "total_steps": 7494, "loss": 0.6221, "lr": 0.00014454227865478292, "epoch": 0.42033626901521215, "percentage": 21.02, "elapsed_time": "2:01:49", "remaining_time": "7:37:49"} +{"current_steps": 1580, "total_steps": 7494, "loss": 0.636, "lr": 0.0001444766708462241, "epoch": 0.42167066986922874, "percentage": 21.08, "elapsed_time": "2:02:38", "remaining_time": "7:39:01"} +{"current_steps": 1585, "total_steps": 7494, "loss": 0.624, "lr": 0.0001444106861226539, "epoch": 0.4230050707232453, "percentage": 21.15, "elapsed_time": "2:03:14", "remaining_time": "7:39:28"} +{"current_steps": 1590, "total_steps": 7494, "loss": 0.6263, "lr": 0.00014434432484204335, "epoch": 0.4243394715772618, "percentage": 21.22, "elapsed_time": "2:03:55", "remaining_time": "7:40:08"} +{"current_steps": 1595, "total_steps": 7494, "loss": 0.624, "lr": 0.0001442775873644062, "epoch": 0.42567387243127836, "percentage": 21.28, "elapsed_time": "2:04:50", "remaining_time": "7:41:41"} +{"current_steps": 1600, "total_steps": 7494, "loss": 0.6314, "lr": 0.00014421047405179725, "epoch": 0.4270082732852949, "percentage": 21.35, "elapsed_time": "2:05:34", "remaining_time": "7:42:34"} +{"current_steps": 1605, "total_steps": 7494, "loss": 0.6274, "lr": 0.00014414298526831012, "epoch": 0.42834267413931143, "percentage": 21.42, "elapsed_time": "2:06:22", "remaining_time": "7:43:39"} +{"current_steps": 1610, "total_steps": 7494, "loss": 0.6304, "lr": 0.00014407512138007547, "epoch": 0.429677074993328, "percentage": 21.48, "elapsed_time": "2:07:08", "remaining_time": "7:44:37"} +{"current_steps": 1615, "total_steps": 7494, "loss": 0.6082, "lr": 0.0001440068827552588, "epoch": 0.43101147584734456, "percentage": 21.55, "elapsed_time": "2:08:02", "remaining_time": "7:46:06"} +{"current_steps": 1620, "total_steps": 7494, "loss": 0.6416, "lr": 0.0001439382697640587, "epoch": 0.4323458767013611, "percentage": 21.62, "elapsed_time": "2:08:43", "remaining_time": "7:46:45"} +{"current_steps": 1625, "total_steps": 7494, "loss": 0.6022, "lr": 0.00014386928277870461, "epoch": 0.43368027755537764, "percentage": 21.68, "elapsed_time": "2:09:20", "remaining_time": "7:47:10"} +{"current_steps": 1630, "total_steps": 7494, "loss": 0.6372, "lr": 0.00014379992217345504, "epoch": 0.4350146784093942, "percentage": 21.75, "elapsed_time": "2:10:10", "remaining_time": "7:48:18"} +{"current_steps": 1635, "total_steps": 7494, "loss": 0.6217, "lr": 0.0001437301883245953, "epoch": 0.4363490792634107, "percentage": 21.82, "elapsed_time": "2:11:05", "remaining_time": "7:49:44"} +{"current_steps": 1640, "total_steps": 7494, "loss": 0.6169, "lr": 0.0001436600816104356, "epoch": 0.43768348011742725, "percentage": 21.88, "elapsed_time": "2:11:44", "remaining_time": "7:50:14"} +{"current_steps": 1645, "total_steps": 7494, "loss": 0.6192, "lr": 0.000143589602411309, "epoch": 0.43901788097144384, "percentage": 21.95, "elapsed_time": "2:12:24", "remaining_time": "7:50:46"} +{"current_steps": 1650, "total_steps": 7494, "loss": 0.6159, "lr": 0.00014351875110956927, "epoch": 0.4403522818254604, "percentage": 22.02, "elapsed_time": "2:13:17", "remaining_time": "7:52:06"} +{"current_steps": 1655, "total_steps": 7494, "loss": 0.6345, "lr": 0.00014344752808958887, "epoch": 0.4416866826794769, "percentage": 22.08, "elapsed_time": "2:14:04", "remaining_time": "7:53:02"} +{"current_steps": 1660, "total_steps": 7494, "loss": 0.6159, "lr": 0.0001433759337377569, "epoch": 0.44302108353349345, "percentage": 22.15, "elapsed_time": "2:14:42", "remaining_time": "7:53:24"} +{"current_steps": 1665, "total_steps": 7494, "loss": 0.6133, "lr": 0.00014330396844247685, "epoch": 0.44435548438751, "percentage": 22.22, "elapsed_time": "2:15:26", "remaining_time": "7:54:09"} +{"current_steps": 1670, "total_steps": 7494, "loss": 0.6224, "lr": 0.0001432316325941647, "epoch": 0.44568988524152653, "percentage": 22.28, "elapsed_time": "2:16:19", "remaining_time": "7:55:26"} +{"current_steps": 1675, "total_steps": 7494, "loss": 0.6286, "lr": 0.00014315892658524665, "epoch": 0.4470242860955431, "percentage": 22.35, "elapsed_time": "2:17:05", "remaining_time": "7:56:15"} +{"current_steps": 1680, "total_steps": 7494, "loss": 0.6024, "lr": 0.0001430858508101571, "epoch": 0.44835868694955966, "percentage": 22.42, "elapsed_time": "2:17:44", "remaining_time": "7:56:39"} +{"current_steps": 1685, "total_steps": 7494, "loss": 0.6395, "lr": 0.00014301240566533637, "epoch": 0.4496930878035762, "percentage": 22.48, "elapsed_time": "2:18:31", "remaining_time": "7:57:33"} +{"current_steps": 1690, "total_steps": 7494, "loss": 0.6121, "lr": 0.00014293859154922866, "epoch": 0.45102748865759273, "percentage": 22.55, "elapsed_time": "2:19:26", "remaining_time": "7:58:53"} +{"current_steps": 1695, "total_steps": 7494, "loss": 0.6259, "lr": 0.00014286440886227995, "epoch": 0.45236188951160927, "percentage": 22.62, "elapsed_time": "2:20:11", "remaining_time": "7:59:36"} +{"current_steps": 1700, "total_steps": 7494, "loss": 0.6394, "lr": 0.00014278985800693562, "epoch": 0.4536962903656258, "percentage": 22.68, "elapsed_time": "2:20:51", "remaining_time": "8:00:04"} +{"current_steps": 1705, "total_steps": 7494, "loss": 0.6132, "lr": 0.0001427149393876384, "epoch": 0.4550306912196424, "percentage": 22.75, "elapsed_time": "2:21:51", "remaining_time": "8:01:38"} +{"current_steps": 1710, "total_steps": 7494, "loss": 0.6216, "lr": 0.00014263965341082622, "epoch": 0.45636509207365894, "percentage": 22.82, "elapsed_time": "2:22:43", "remaining_time": "8:02:46"} +{"current_steps": 1715, "total_steps": 7494, "loss": 0.6389, "lr": 0.00014256400048492994, "epoch": 0.4576994929276755, "percentage": 22.88, "elapsed_time": "2:23:23", "remaining_time": "8:03:12"} +{"current_steps": 1720, "total_steps": 7494, "loss": 0.6025, "lr": 0.00014248798102037106, "epoch": 0.459033893781692, "percentage": 22.95, "elapsed_time": "2:24:05", "remaining_time": "8:03:43"} +{"current_steps": 1725, "total_steps": 7494, "loss": 0.6276, "lr": 0.0001424115954295597, "epoch": 0.46036829463570855, "percentage": 23.02, "elapsed_time": "2:24:57", "remaining_time": "8:04:49"} +{"current_steps": 1730, "total_steps": 7494, "loss": 0.6234, "lr": 0.00014233484412689212, "epoch": 0.4617026954897251, "percentage": 23.09, "elapsed_time": "2:25:47", "remaining_time": "8:05:45"} +{"current_steps": 1735, "total_steps": 7494, "loss": 0.6114, "lr": 0.00014225772752874866, "epoch": 0.4630370963437417, "percentage": 23.15, "elapsed_time": "2:26:26", "remaining_time": "8:06:06"} +{"current_steps": 1740, "total_steps": 7494, "loss": 0.6043, "lr": 0.00014218024605349133, "epoch": 0.4643714971977582, "percentage": 23.22, "elapsed_time": "2:27:10", "remaining_time": "8:06:41"} +{"current_steps": 1745, "total_steps": 7494, "loss": 0.6141, "lr": 0.00014210240012146178, "epoch": 0.46570589805177476, "percentage": 23.29, "elapsed_time": "2:28:03", "remaining_time": "8:07:46"} +{"current_steps": 1750, "total_steps": 7494, "loss": 0.6251, "lr": 0.00014202419015497863, "epoch": 0.4670402989057913, "percentage": 23.35, "elapsed_time": "2:28:48", "remaining_time": "8:08:26"} +{"current_steps": 1755, "total_steps": 7494, "loss": 0.6238, "lr": 0.00014194561657833563, "epoch": 0.46837469975980783, "percentage": 23.42, "elapsed_time": "2:29:28", "remaining_time": "8:08:46"} +{"current_steps": 1760, "total_steps": 7494, "loss": 0.6126, "lr": 0.000141866679817799, "epoch": 0.46970910061382437, "percentage": 23.49, "elapsed_time": "2:30:12", "remaining_time": "8:09:23"} +{"current_steps": 1765, "total_steps": 7494, "loss": 0.623, "lr": 0.00014178738030160527, "epoch": 0.47104350146784096, "percentage": 23.55, "elapsed_time": "2:31:05", "remaining_time": "8:10:25"} +{"current_steps": 1770, "total_steps": 7494, "loss": 0.6191, "lr": 0.000141707718459959, "epoch": 0.4723779023218575, "percentage": 23.62, "elapsed_time": "2:31:47", "remaining_time": "8:10:51"} +{"current_steps": 1775, "total_steps": 7494, "loss": 0.6017, "lr": 0.00014162769472503032, "epoch": 0.47371230317587404, "percentage": 23.69, "elapsed_time": "2:32:27", "remaining_time": "8:11:13"} +{"current_steps": 1780, "total_steps": 7494, "loss": 0.6015, "lr": 0.00014154730953095274, "epoch": 0.4750467040298906, "percentage": 23.75, "elapsed_time": "2:33:14", "remaining_time": "8:11:56"} +{"current_steps": 1785, "total_steps": 7494, "loss": 0.6276, "lr": 0.0001414665633138206, "epoch": 0.4763811048839071, "percentage": 23.82, "elapsed_time": "2:34:05", "remaining_time": "8:12:49"} +{"current_steps": 1790, "total_steps": 7494, "loss": 0.6299, "lr": 0.00014138545651168683, "epoch": 0.47771550573792365, "percentage": 23.89, "elapsed_time": "2:34:46", "remaining_time": "8:13:12"} +{"current_steps": 1795, "total_steps": 7494, "loss": 0.6121, "lr": 0.00014130398956456062, "epoch": 0.47904990659194024, "percentage": 23.95, "elapsed_time": "2:35:27", "remaining_time": "8:13:35"} +{"current_steps": 1800, "total_steps": 7494, "loss": 0.6189, "lr": 0.00014122216291440496, "epoch": 0.4803843074459568, "percentage": 24.02, "elapsed_time": "2:36:17", "remaining_time": "8:14:24"} +{"current_steps": 1805, "total_steps": 7494, "loss": 0.6247, "lr": 0.00014113997700513422, "epoch": 0.4817187082999733, "percentage": 24.09, "elapsed_time": "2:37:51", "remaining_time": "8:17:30"} +{"current_steps": 1810, "total_steps": 7494, "loss": 0.5971, "lr": 0.00014105743228261174, "epoch": 0.48305310915398986, "percentage": 24.15, "elapsed_time": "2:38:31", "remaining_time": "8:17:50"} +{"current_steps": 1815, "total_steps": 7494, "loss": 0.6275, "lr": 0.00014097452919464748, "epoch": 0.4843875100080064, "percentage": 24.22, "elapsed_time": "2:39:15", "remaining_time": "8:18:17"} +{"current_steps": 1820, "total_steps": 7494, "loss": 0.6076, "lr": 0.00014089126819099557, "epoch": 0.48572191086202293, "percentage": 24.29, "elapsed_time": "2:40:05", "remaining_time": "8:19:04"} +{"current_steps": 1825, "total_steps": 7494, "loss": 0.6276, "lr": 0.00014080764972335184, "epoch": 0.4870563117160395, "percentage": 24.35, "elapsed_time": "2:40:52", "remaining_time": "8:19:43"} +{"current_steps": 1830, "total_steps": 7494, "loss": 0.6162, "lr": 0.00014072367424535135, "epoch": 0.48839071257005606, "percentage": 24.42, "elapsed_time": "2:41:32", "remaining_time": "8:19:58"} +{"current_steps": 1835, "total_steps": 7494, "loss": 0.6172, "lr": 0.000140639342212566, "epoch": 0.4897251134240726, "percentage": 24.49, "elapsed_time": "2:42:20", "remaining_time": "8:20:37"} +{"current_steps": 1840, "total_steps": 7494, "loss": 0.6136, "lr": 0.000140554654082502, "epoch": 0.49105951427808914, "percentage": 24.55, "elapsed_time": "2:43:09", "remaining_time": "8:21:22"} +{"current_steps": 1845, "total_steps": 7494, "loss": 0.6327, "lr": 0.0001404696103145975, "epoch": 0.4923939151321057, "percentage": 24.62, "elapsed_time": "2:43:54", "remaining_time": "8:21:52"} +{"current_steps": 1850, "total_steps": 7494, "loss": 0.6096, "lr": 0.0001403842113702198, "epoch": 0.4937283159861222, "percentage": 24.69, "elapsed_time": "2:44:36", "remaining_time": "8:22:09"} +{"current_steps": 1855, "total_steps": 7494, "loss": 0.6279, "lr": 0.00014029845771266325, "epoch": 0.49506271684013875, "percentage": 24.75, "elapsed_time": "2:45:23", "remaining_time": "8:22:45"} +{"current_steps": 1860, "total_steps": 7494, "loss": 0.6311, "lr": 0.00014021234980714648, "epoch": 0.49639711769415534, "percentage": 24.82, "elapsed_time": "2:46:12", "remaining_time": "8:23:27"} +{"current_steps": 1865, "total_steps": 7494, "loss": 0.6301, "lr": 0.00014012588812080992, "epoch": 0.4977315185481719, "percentage": 24.89, "elapsed_time": "2:46:56", "remaining_time": "8:23:51"} +{"current_steps": 1870, "total_steps": 7494, "loss": 0.6167, "lr": 0.00014003907312271319, "epoch": 0.4990659194021884, "percentage": 24.95, "elapsed_time": "2:47:36", "remaining_time": "8:24:05"} +{"current_steps": 1875, "total_steps": 7494, "loss": 0.6169, "lr": 0.0001399519052838329, "epoch": 0.500400320256205, "percentage": 25.02, "elapsed_time": "2:48:23", "remaining_time": "8:24:38"} +{"current_steps": 1880, "total_steps": 7494, "loss": 0.6232, "lr": 0.00013986438507705958, "epoch": 0.5017347211102215, "percentage": 25.09, "elapsed_time": "2:49:13", "remaining_time": "8:25:21"} +{"current_steps": 1885, "total_steps": 7494, "loss": 0.6223, "lr": 0.00013977651297719548, "epoch": 0.503069121964238, "percentage": 25.15, "elapsed_time": "2:49:55", "remaining_time": "8:25:36"} +{"current_steps": 1890, "total_steps": 7494, "loss": 0.6094, "lr": 0.00013968828946095193, "epoch": 0.5044035228182546, "percentage": 25.22, "elapsed_time": "2:50:36", "remaining_time": "8:25:53"} +{"current_steps": 1895, "total_steps": 7494, "loss": 0.6166, "lr": 0.00013959971500694668, "epoch": 0.5057379236722711, "percentage": 25.29, "elapsed_time": "2:51:24", "remaining_time": "8:26:26"} +{"current_steps": 1900, "total_steps": 7494, "loss": 0.6212, "lr": 0.00013951079009570132, "epoch": 0.5070723245262877, "percentage": 25.35, "elapsed_time": "2:52:12", "remaining_time": "8:27:01"} +{"current_steps": 1905, "total_steps": 7494, "loss": 0.6174, "lr": 0.00013942151520963868, "epoch": 0.5084067253803043, "percentage": 25.42, "elapsed_time": "2:53:04", "remaining_time": "8:27:45"} +{"current_steps": 1910, "total_steps": 7494, "loss": 0.6246, "lr": 0.00013933189083308031, "epoch": 0.5097411262343208, "percentage": 25.49, "elapsed_time": "2:53:47", "remaining_time": "8:28:06"} +{"current_steps": 1915, "total_steps": 7494, "loss": 0.612, "lr": 0.00013924191745224364, "epoch": 0.5110755270883374, "percentage": 25.55, "elapsed_time": "2:54:40", "remaining_time": "8:28:53"} +{"current_steps": 1920, "total_steps": 7494, "loss": 0.6345, "lr": 0.00013915159555523957, "epoch": 0.5124099279423538, "percentage": 25.62, "elapsed_time": "2:55:27", "remaining_time": "8:29:22"} +{"current_steps": 1925, "total_steps": 7494, "loss": 0.6057, "lr": 0.00013906092563206968, "epoch": 0.5137443287963704, "percentage": 25.69, "elapsed_time": "2:56:07", "remaining_time": "8:29:32"} +{"current_steps": 1930, "total_steps": 7494, "loss": 0.6312, "lr": 0.00013896990817462363, "epoch": 0.5150787296503869, "percentage": 25.75, "elapsed_time": "2:56:52", "remaining_time": "8:29:54"} +{"current_steps": 1935, "total_steps": 7494, "loss": 0.6222, "lr": 0.00013887854367667645, "epoch": 0.5164131305044035, "percentage": 25.82, "elapsed_time": "2:57:44", "remaining_time": "8:30:38"} +{"current_steps": 1940, "total_steps": 7494, "loss": 0.6267, "lr": 0.00013878683263388587, "epoch": 0.5177475313584201, "percentage": 25.89, "elapsed_time": "2:58:28", "remaining_time": "8:30:56"} +{"current_steps": 1945, "total_steps": 7494, "loss": 0.6228, "lr": 0.00013869477554378972, "epoch": 0.5190819322124366, "percentage": 25.95, "elapsed_time": "2:59:09", "remaining_time": "8:31:09"} +{"current_steps": 1950, "total_steps": 7494, "loss": 0.6051, "lr": 0.00013860237290580306, "epoch": 0.5204163330664532, "percentage": 26.02, "elapsed_time": "2:59:53", "remaining_time": "8:31:27"} +{"current_steps": 1955, "total_steps": 7494, "loss": 0.6279, "lr": 0.00013850962522121569, "epoch": 0.5217507339204697, "percentage": 26.09, "elapsed_time": "3:00:43", "remaining_time": "8:32:02"} +{"current_steps": 1960, "total_steps": 7494, "loss": 0.616, "lr": 0.00013841653299318915, "epoch": 0.5230851347744863, "percentage": 26.15, "elapsed_time": "3:01:28", "remaining_time": "8:32:24"} +{"current_steps": 1965, "total_steps": 7494, "loss": 0.6014, "lr": 0.00013832309672675428, "epoch": 0.5244195356285029, "percentage": 26.22, "elapsed_time": "3:02:10", "remaining_time": "8:32:35"} +{"current_steps": 1970, "total_steps": 7494, "loss": 0.6229, "lr": 0.00013822931692880828, "epoch": 0.5257539364825193, "percentage": 26.29, "elapsed_time": "3:02:54", "remaining_time": "8:32:52"} +{"current_steps": 1975, "total_steps": 7494, "loss": 0.617, "lr": 0.00013813519410811208, "epoch": 0.5270883373365359, "percentage": 26.35, "elapsed_time": "3:03:44", "remaining_time": "8:33:26"} +{"current_steps": 1980, "total_steps": 7494, "loss": 0.6305, "lr": 0.00013804072877528746, "epoch": 0.5284227381905524, "percentage": 26.42, "elapsed_time": "3:04:29", "remaining_time": "8:33:47"} +{"current_steps": 1985, "total_steps": 7494, "loss": 0.6107, "lr": 0.0001379459214428144, "epoch": 0.529757139044569, "percentage": 26.49, "elapsed_time": "3:05:12", "remaining_time": "8:34:00"} +{"current_steps": 1990, "total_steps": 7494, "loss": 0.6194, "lr": 0.0001378507726250283, "epoch": 0.5310915398985855, "percentage": 26.55, "elapsed_time": "3:05:58", "remaining_time": "8:34:23"} +{"current_steps": 1995, "total_steps": 7494, "loss": 0.6142, "lr": 0.00013775528283811695, "epoch": 0.5324259407526021, "percentage": 26.62, "elapsed_time": "3:06:45", "remaining_time": "8:34:47"} +{"current_steps": 2000, "total_steps": 7494, "loss": 0.6181, "lr": 0.00013765945260011815, "epoch": 0.5337603416066187, "percentage": 26.69, "elapsed_time": "3:07:32", "remaining_time": "8:35:09"} +{"current_steps": 2005, "total_steps": 7494, "loss": 0.6153, "lr": 0.0001375632824309165, "epoch": 0.5350947424606352, "percentage": 26.75, "elapsed_time": "3:08:24", "remaining_time": "8:35:48"} +{"current_steps": 2010, "total_steps": 7494, "loss": 0.6166, "lr": 0.00013746677285224082, "epoch": 0.5364291433146517, "percentage": 26.82, "elapsed_time": "3:09:09", "remaining_time": "8:36:04"} +{"current_steps": 2015, "total_steps": 7494, "loss": 0.61, "lr": 0.00013736992438766123, "epoch": 0.5377635441686682, "percentage": 26.89, "elapsed_time": "3:09:58", "remaining_time": "8:36:33"} +{"current_steps": 2020, "total_steps": 7494, "loss": 0.6096, "lr": 0.00013727273756258633, "epoch": 0.5390979450226848, "percentage": 26.95, "elapsed_time": "3:10:43", "remaining_time": "8:36:49"} +{"current_steps": 2025, "total_steps": 7494, "loss": 0.6103, "lr": 0.00013717521290426034, "epoch": 0.5404323458767014, "percentage": 27.02, "elapsed_time": "3:11:26", "remaining_time": "8:37:01"} +{"current_steps": 2030, "total_steps": 7494, "loss": 0.6141, "lr": 0.00013707735094176026, "epoch": 0.5417667467307179, "percentage": 27.09, "elapsed_time": "3:12:13", "remaining_time": "8:37:23"} +{"current_steps": 2035, "total_steps": 7494, "loss": 0.62, "lr": 0.00013697915220599294, "epoch": 0.5431011475847345, "percentage": 27.16, "elapsed_time": "3:13:01", "remaining_time": "8:37:46"} +{"current_steps": 2040, "total_steps": 7494, "loss": 0.6114, "lr": 0.0001368806172296923, "epoch": 0.544435548438751, "percentage": 27.22, "elapsed_time": "3:13:45", "remaining_time": "8:38:02"} +{"current_steps": 2045, "total_steps": 7494, "loss": 0.599, "lr": 0.00013678174654741638, "epoch": 0.5457699492927676, "percentage": 27.29, "elapsed_time": "3:14:26", "remaining_time": "8:38:07"} +{"current_steps": 2050, "total_steps": 7494, "loss": 0.6259, "lr": 0.00013668254069554439, "epoch": 0.547104350146784, "percentage": 27.36, "elapsed_time": "3:15:14", "remaining_time": "8:38:29"} +{"current_steps": 2055, "total_steps": 7494, "loss": 0.6241, "lr": 0.00013658300021227387, "epoch": 0.5484387510008006, "percentage": 27.42, "elapsed_time": "3:16:01", "remaining_time": "8:38:48"} +{"current_steps": 2060, "total_steps": 7494, "loss": 0.5985, "lr": 0.00013648312563761784, "epoch": 0.5497731518548172, "percentage": 27.49, "elapsed_time": "3:16:45", "remaining_time": "8:39:01"} +{"current_steps": 2065, "total_steps": 7494, "loss": 0.6066, "lr": 0.0001363829175134017, "epoch": 0.5511075527088337, "percentage": 27.56, "elapsed_time": "3:17:28", "remaining_time": "8:39:11"} +{"current_steps": 2070, "total_steps": 7494, "loss": 0.6182, "lr": 0.00013628237638326038, "epoch": 0.5524419535628503, "percentage": 27.62, "elapsed_time": "3:18:15", "remaining_time": "8:39:29"} +{"current_steps": 2075, "total_steps": 7494, "loss": 0.611, "lr": 0.0001361815027926354, "epoch": 0.5537763544168668, "percentage": 27.69, "elapsed_time": "3:19:03", "remaining_time": "8:39:50"} +{"current_steps": 2080, "total_steps": 7494, "loss": 0.6056, "lr": 0.00013608029728877195, "epoch": 0.5551107552708834, "percentage": 27.76, "elapsed_time": "3:19:49", "remaining_time": "8:40:06"} +{"current_steps": 2085, "total_steps": 7494, "loss": 0.6189, "lr": 0.00013597876042071574, "epoch": 0.5564451561248999, "percentage": 27.82, "elapsed_time": "3:20:31", "remaining_time": "8:40:12"} +{"current_steps": 2090, "total_steps": 7494, "loss": 0.612, "lr": 0.00013587689273931032, "epoch": 0.5577795569789165, "percentage": 27.89, "elapsed_time": "3:21:19", "remaining_time": "8:40:34"} +{"current_steps": 2095, "total_steps": 7494, "loss": 0.6292, "lr": 0.00013577469479719376, "epoch": 0.559113957832933, "percentage": 27.96, "elapsed_time": "3:22:08", "remaining_time": "8:40:55"} +{"current_steps": 2100, "total_steps": 7494, "loss": 0.6036, "lr": 0.00013567216714879593, "epoch": 0.5604483586869495, "percentage": 28.02, "elapsed_time": "3:22:51", "remaining_time": "8:41:02"} +{"current_steps": 2105, "total_steps": 7494, "loss": 0.6206, "lr": 0.00013556931035033526, "epoch": 0.5617827595409661, "percentage": 28.09, "elapsed_time": "3:23:46", "remaining_time": "8:41:40"} +{"current_steps": 2110, "total_steps": 7494, "loss": 0.6209, "lr": 0.00013546612495981603, "epoch": 0.5631171603949826, "percentage": 28.16, "elapsed_time": "3:24:33", "remaining_time": "8:41:58"} +{"current_steps": 2115, "total_steps": 7494, "loss": 0.6081, "lr": 0.00013536261153702494, "epoch": 0.5644515612489992, "percentage": 28.22, "elapsed_time": "3:25:20", "remaining_time": "8:42:14"} +{"current_steps": 2120, "total_steps": 7494, "loss": 0.5997, "lr": 0.0001352587706435284, "epoch": 0.5657859621030158, "percentage": 28.29, "elapsed_time": "3:26:05", "remaining_time": "8:42:26"} +{"current_steps": 2125, "total_steps": 7494, "loss": 0.6137, "lr": 0.00013515460284266933, "epoch": 0.5671203629570323, "percentage": 28.36, "elapsed_time": "3:26:48", "remaining_time": "8:42:31"} +{"current_steps": 2130, "total_steps": 7494, "loss": 0.6081, "lr": 0.0001350501086995642, "epoch": 0.5684547638110489, "percentage": 28.42, "elapsed_time": "3:27:35", "remaining_time": "8:42:47"} +{"current_steps": 2135, "total_steps": 7494, "loss": 0.6266, "lr": 0.00013494528878109978, "epoch": 0.5697891646650654, "percentage": 28.49, "elapsed_time": "3:28:22", "remaining_time": "8:43:02"} +{"current_steps": 2140, "total_steps": 7494, "loss": 0.618, "lr": 0.00013484014365593036, "epoch": 0.5711235655190819, "percentage": 28.56, "elapsed_time": "3:29:05", "remaining_time": "8:43:06"} +{"current_steps": 2145, "total_steps": 7494, "loss": 0.6084, "lr": 0.00013473467389447436, "epoch": 0.5724579663730984, "percentage": 28.62, "elapsed_time": "3:29:50", "remaining_time": "8:43:17"} +{"current_steps": 2150, "total_steps": 7494, "loss": 0.6039, "lr": 0.0001346288800689114, "epoch": 0.573792367227115, "percentage": 28.69, "elapsed_time": "3:30:41", "remaining_time": "8:43:41"} +{"current_steps": 2155, "total_steps": 7494, "loss": 0.6276, "lr": 0.00013452276275317926, "epoch": 0.5751267680811316, "percentage": 28.76, "elapsed_time": "3:31:26", "remaining_time": "8:43:49"} +{"current_steps": 2160, "total_steps": 7494, "loss": 0.6048, "lr": 0.00013441632252297054, "epoch": 0.5764611689351481, "percentage": 28.82, "elapsed_time": "3:32:10", "remaining_time": "8:43:56"} +{"current_steps": 2165, "total_steps": 7494, "loss": 0.6178, "lr": 0.0001343095599557297, "epoch": 0.5777955697891647, "percentage": 28.89, "elapsed_time": "3:32:51", "remaining_time": "8:43:57"} +{"current_steps": 2170, "total_steps": 7494, "loss": 0.6254, "lr": 0.00013420247563064998, "epoch": 0.5791299706431812, "percentage": 28.96, "elapsed_time": "3:33:40", "remaining_time": "8:44:13"} +{"current_steps": 2175, "total_steps": 7494, "loss": 0.6199, "lr": 0.0001340950701286701, "epoch": 0.5804643714971978, "percentage": 29.02, "elapsed_time": "3:34:27", "remaining_time": "8:44:26"} +{"current_steps": 2180, "total_steps": 7494, "loss": 0.6229, "lr": 0.0001339873440324712, "epoch": 0.5817987723512144, "percentage": 29.09, "elapsed_time": "3:35:10", "remaining_time": "8:44:31"} +{"current_steps": 2185, "total_steps": 7494, "loss": 0.6077, "lr": 0.00013387929792647366, "epoch": 0.5831331732052308, "percentage": 29.16, "elapsed_time": "3:35:55", "remaining_time": "8:44:39"} +{"current_steps": 2190, "total_steps": 7494, "loss": 0.6245, "lr": 0.00013377093239683396, "epoch": 0.5844675740592474, "percentage": 29.22, "elapsed_time": "3:36:42", "remaining_time": "8:44:50"} +{"current_steps": 2195, "total_steps": 7494, "loss": 0.6367, "lr": 0.0001336622480314414, "epoch": 0.5858019749132639, "percentage": 29.29, "elapsed_time": "3:37:27", "remaining_time": "8:44:58"} +{"current_steps": 2200, "total_steps": 7494, "loss": 0.6069, "lr": 0.00013355324541991512, "epoch": 0.5871363757672805, "percentage": 29.36, "elapsed_time": "3:38:12", "remaining_time": "8:45:05"} +{"current_steps": 2205, "total_steps": 7494, "loss": 0.5964, "lr": 0.00013344392515360055, "epoch": 0.588470776621297, "percentage": 29.42, "elapsed_time": "3:39:08", "remaining_time": "8:45:38"} +{"current_steps": 2210, "total_steps": 7494, "loss": 0.6124, "lr": 0.0001333342878255667, "epoch": 0.5898051774753136, "percentage": 29.49, "elapsed_time": "3:39:56", "remaining_time": "8:45:52"} +{"current_steps": 2215, "total_steps": 7494, "loss": 0.6144, "lr": 0.00013322433403060237, "epoch": 0.5911395783293302, "percentage": 29.56, "elapsed_time": "3:40:41", "remaining_time": "8:45:58"} +{"current_steps": 2220, "total_steps": 7494, "loss": 0.6057, "lr": 0.0001331140643652134, "epoch": 0.5924739791833467, "percentage": 29.62, "elapsed_time": "3:41:26", "remaining_time": "8:46:05"} +{"current_steps": 2225, "total_steps": 7494, "loss": 0.6097, "lr": 0.00013300347942761916, "epoch": 0.5938083800373632, "percentage": 29.69, "elapsed_time": "3:42:12", "remaining_time": "8:46:12"} +{"current_steps": 2230, "total_steps": 7494, "loss": 0.6196, "lr": 0.00013289257981774944, "epoch": 0.5951427808913797, "percentage": 29.76, "elapsed_time": "3:42:57", "remaining_time": "8:46:17"} +{"current_steps": 2235, "total_steps": 7494, "loss": 0.6239, "lr": 0.0001327813661372411, "epoch": 0.5964771817453963, "percentage": 29.82, "elapsed_time": "3:43:41", "remaining_time": "8:46:20"} +{"current_steps": 2240, "total_steps": 7494, "loss": 0.6006, "lr": 0.00013266983898943495, "epoch": 0.5978115825994129, "percentage": 29.89, "elapsed_time": "3:44:27", "remaining_time": "8:46:29"} +{"current_steps": 2245, "total_steps": 7494, "loss": 0.6258, "lr": 0.00013255799897937218, "epoch": 0.5991459834534294, "percentage": 29.96, "elapsed_time": "3:45:12", "remaining_time": "8:46:32"} +{"current_steps": 2250, "total_steps": 7494, "loss": 0.6229, "lr": 0.0001324458467137915, "epoch": 0.600480384307446, "percentage": 30.02, "elapsed_time": "3:45:55", "remaining_time": "8:46:34"} +{"current_steps": 2255, "total_steps": 7494, "loss": 0.6093, "lr": 0.00013233338280112548, "epoch": 0.6018147851614625, "percentage": 30.09, "elapsed_time": "3:46:41", "remaining_time": "8:46:39"} +{"current_steps": 2260, "total_steps": 7494, "loss": 0.6198, "lr": 0.00013222060785149744, "epoch": 0.6031491860154791, "percentage": 30.16, "elapsed_time": "3:47:30", "remaining_time": "8:46:53"} +{"current_steps": 2265, "total_steps": 7494, "loss": 0.63, "lr": 0.00013210752247671813, "epoch": 0.6044835868694955, "percentage": 30.22, "elapsed_time": "3:48:14", "remaining_time": "8:46:54"} +{"current_steps": 2270, "total_steps": 7494, "loss": 0.6124, "lr": 0.00013199412729028226, "epoch": 0.6058179877235121, "percentage": 30.29, "elapsed_time": "3:48:57", "remaining_time": "8:46:55"} +{"current_steps": 2275, "total_steps": 7494, "loss": 0.6219, "lr": 0.00013188042290736542, "epoch": 0.6071523885775287, "percentage": 30.36, "elapsed_time": "3:49:43", "remaining_time": "8:47:00"} +{"current_steps": 2280, "total_steps": 7494, "loss": 0.5975, "lr": 0.00013176640994482056, "epoch": 0.6084867894315452, "percentage": 30.42, "elapsed_time": "3:50:30", "remaining_time": "8:47:08"} +{"current_steps": 2285, "total_steps": 7494, "loss": 0.6194, "lr": 0.00013165208902117466, "epoch": 0.6098211902855618, "percentage": 30.49, "elapsed_time": "3:51:15", "remaining_time": "8:47:11"} +{"current_steps": 2290, "total_steps": 7494, "loss": 0.6161, "lr": 0.0001315374607566254, "epoch": 0.6111555911395783, "percentage": 30.56, "elapsed_time": "3:51:59", "remaining_time": "8:47:12"} +{"current_steps": 2295, "total_steps": 7494, "loss": 0.6226, "lr": 0.0001314225257730379, "epoch": 0.6124899919935949, "percentage": 30.62, "elapsed_time": "3:52:44", "remaining_time": "8:47:13"} +{"current_steps": 2300, "total_steps": 7494, "loss": 0.6149, "lr": 0.00013130728469394113, "epoch": 0.6138243928476115, "percentage": 30.69, "elapsed_time": "3:53:28", "remaining_time": "8:47:15"} +{"current_steps": 2305, "total_steps": 7494, "loss": 0.6145, "lr": 0.00013119173814452474, "epoch": 0.615158793701628, "percentage": 30.76, "elapsed_time": "3:54:28", "remaining_time": "8:47:51"} +{"current_steps": 2310, "total_steps": 7494, "loss": 0.6148, "lr": 0.0001310758867516355, "epoch": 0.6164931945556446, "percentage": 30.82, "elapsed_time": "3:55:15", "remaining_time": "8:47:56"} +{"current_steps": 2315, "total_steps": 7494, "loss": 0.6037, "lr": 0.00013095973114377401, "epoch": 0.617827595409661, "percentage": 30.89, "elapsed_time": "3:55:58", "remaining_time": "8:47:53"} +{"current_steps": 2320, "total_steps": 7494, "loss": 0.6237, "lr": 0.00013084327195109127, "epoch": 0.6191619962636776, "percentage": 30.96, "elapsed_time": "3:56:44", "remaining_time": "8:47:57"} +{"current_steps": 2325, "total_steps": 7494, "loss": 0.6294, "lr": 0.0001307265098053852, "epoch": 0.6204963971176941, "percentage": 31.02, "elapsed_time": "3:57:31", "remaining_time": "8:48:04"} +{"current_steps": 2330, "total_steps": 7494, "loss": 0.6133, "lr": 0.00013060944534009727, "epoch": 0.6218307979717107, "percentage": 31.09, "elapsed_time": "3:58:15", "remaining_time": "8:48:02"} +{"current_steps": 2335, "total_steps": 7494, "loss": 0.624, "lr": 0.00013049207919030913, "epoch": 0.6231651988257273, "percentage": 31.16, "elapsed_time": "3:59:00", "remaining_time": "8:48:05"} +{"current_steps": 2340, "total_steps": 7494, "loss": 0.6252, "lr": 0.000130374411992739, "epoch": 0.6244995996797438, "percentage": 31.22, "elapsed_time": "3:59:48", "remaining_time": "8:48:12"} +{"current_steps": 2345, "total_steps": 7494, "loss": 0.6261, "lr": 0.00013025644438573828, "epoch": 0.6258340005337604, "percentage": 31.29, "elapsed_time": "4:00:34", "remaining_time": "8:48:13"} +{"current_steps": 2350, "total_steps": 7494, "loss": 0.613, "lr": 0.0001301381770092882, "epoch": 0.6271684013877769, "percentage": 31.36, "elapsed_time": "4:01:18", "remaining_time": "8:48:13"} +{"current_steps": 2355, "total_steps": 7494, "loss": 0.6101, "lr": 0.00013001961050499618, "epoch": 0.6285028022417934, "percentage": 31.43, "elapsed_time": "4:02:05", "remaining_time": "8:48:16"} +{"current_steps": 2360, "total_steps": 7494, "loss": 0.5978, "lr": 0.00012990074551609248, "epoch": 0.6298372030958099, "percentage": 31.49, "elapsed_time": "4:02:53", "remaining_time": "8:48:23"} +{"current_steps": 2365, "total_steps": 7494, "loss": 0.5993, "lr": 0.00012978158268742656, "epoch": 0.6311716039498265, "percentage": 31.56, "elapsed_time": "4:03:37", "remaining_time": "8:48:20"} +{"current_steps": 2370, "total_steps": 7494, "loss": 0.6259, "lr": 0.00012966212266546384, "epoch": 0.6325060048038431, "percentage": 31.63, "elapsed_time": "4:04:20", "remaining_time": "8:48:17"} +{"current_steps": 2375, "total_steps": 7494, "loss": 0.6286, "lr": 0.0001295423660982819, "epoch": 0.6338404056578596, "percentage": 31.69, "elapsed_time": "4:05:08", "remaining_time": "8:48:21"} +{"current_steps": 2380, "total_steps": 7494, "loss": 0.6269, "lr": 0.00012942231363556717, "epoch": 0.6351748065118762, "percentage": 31.76, "elapsed_time": "4:05:56", "remaining_time": "8:48:27"} +{"current_steps": 2385, "total_steps": 7494, "loss": 0.5945, "lr": 0.00012930196592861123, "epoch": 0.6365092073658927, "percentage": 31.83, "elapsed_time": "4:06:39", "remaining_time": "8:48:23"} +{"current_steps": 2390, "total_steps": 7494, "loss": 0.6173, "lr": 0.0001291813236303075, "epoch": 0.6378436082199093, "percentage": 31.89, "elapsed_time": "4:07:22", "remaining_time": "8:48:17"} +{"current_steps": 2395, "total_steps": 7494, "loss": 0.6167, "lr": 0.0001290603873951475, "epoch": 0.6391780090739259, "percentage": 31.96, "elapsed_time": "4:08:10", "remaining_time": "8:48:23"} +{"current_steps": 2400, "total_steps": 7494, "loss": 0.6095, "lr": 0.0001289391578792174, "epoch": 0.6405124099279423, "percentage": 32.03, "elapsed_time": "4:08:58", "remaining_time": "8:48:27"} +{"current_steps": 2405, "total_steps": 7494, "loss": 0.614, "lr": 0.0001288176357401944, "epoch": 0.6418468107819589, "percentage": 32.09, "elapsed_time": "4:09:52", "remaining_time": "8:48:43"} +{"current_steps": 2410, "total_steps": 7494, "loss": 0.6158, "lr": 0.00012869582163734327, "epoch": 0.6431812116359754, "percentage": 32.16, "elapsed_time": "4:10:35", "remaining_time": "8:48:38"} +{"current_steps": 2415, "total_steps": 7494, "loss": 0.6008, "lr": 0.00012857371623151265, "epoch": 0.644515612489992, "percentage": 32.23, "elapsed_time": "4:11:22", "remaining_time": "8:48:39"} +{"current_steps": 2420, "total_steps": 7494, "loss": 0.6121, "lr": 0.00012845132018513147, "epoch": 0.6458500133440085, "percentage": 32.29, "elapsed_time": "4:12:07", "remaining_time": "8:48:38"} +{"current_steps": 2425, "total_steps": 7494, "loss": 0.6229, "lr": 0.00012832863416220556, "epoch": 0.6471844141980251, "percentage": 32.36, "elapsed_time": "4:12:50", "remaining_time": "8:48:31"} +{"current_steps": 2430, "total_steps": 7494, "loss": 0.6053, "lr": 0.00012820565882831365, "epoch": 0.6485188150520417, "percentage": 32.43, "elapsed_time": "4:13:33", "remaining_time": "8:48:24"} +{"current_steps": 2435, "total_steps": 7494, "loss": 0.6015, "lr": 0.00012808239485060426, "epoch": 0.6498532159060582, "percentage": 32.49, "elapsed_time": "4:14:22", "remaining_time": "8:48:29"} +{"current_steps": 2440, "total_steps": 7494, "loss": 0.6091, "lr": 0.00012795884289779161, "epoch": 0.6511876167600748, "percentage": 32.56, "elapsed_time": "4:15:05", "remaining_time": "8:48:23"} +{"current_steps": 2445, "total_steps": 7494, "loss": 0.6038, "lr": 0.00012783500364015233, "epoch": 0.6525220176140912, "percentage": 32.63, "elapsed_time": "4:15:47", "remaining_time": "8:48:12"} +{"current_steps": 2450, "total_steps": 7494, "loss": 0.6173, "lr": 0.00012771087774952165, "epoch": 0.6538564184681078, "percentage": 32.69, "elapsed_time": "4:16:33", "remaining_time": "8:48:12"} +{"current_steps": 2455, "total_steps": 7494, "loss": 0.6113, "lr": 0.00012758646589928975, "epoch": 0.6551908193221244, "percentage": 32.76, "elapsed_time": "4:17:22", "remaining_time": "8:48:15"} +{"current_steps": 2460, "total_steps": 7494, "loss": 0.6304, "lr": 0.00012746176876439824, "epoch": 0.6565252201761409, "percentage": 32.83, "elapsed_time": "4:18:05", "remaining_time": "8:48:08"} +{"current_steps": 2465, "total_steps": 7494, "loss": 0.604, "lr": 0.00012733678702133642, "epoch": 0.6578596210301575, "percentage": 32.89, "elapsed_time": "4:18:48", "remaining_time": "8:48:00"} +{"current_steps": 2470, "total_steps": 7494, "loss": 0.616, "lr": 0.00012721152134813755, "epoch": 0.659194021884174, "percentage": 32.96, "elapsed_time": "4:19:31", "remaining_time": "8:47:51"} +{"current_steps": 2475, "total_steps": 7494, "loss": 0.6111, "lr": 0.00012708597242437524, "epoch": 0.6605284227381906, "percentage": 33.03, "elapsed_time": "4:20:20", "remaining_time": "8:47:57"} +{"current_steps": 2480, "total_steps": 7494, "loss": 0.6239, "lr": 0.00012696014093115974, "epoch": 0.661862823592207, "percentage": 33.09, "elapsed_time": "4:21:06", "remaining_time": "8:47:53"} +{"current_steps": 2485, "total_steps": 7494, "loss": 0.6011, "lr": 0.00012683402755113432, "epoch": 0.6631972244462236, "percentage": 33.16, "elapsed_time": "4:21:48", "remaining_time": "8:47:43"} +{"current_steps": 2490, "total_steps": 7494, "loss": 0.6053, "lr": 0.0001267076329684714, "epoch": 0.6645316253002402, "percentage": 33.23, "elapsed_time": "4:22:33", "remaining_time": "8:47:37"} +{"current_steps": 2495, "total_steps": 7494, "loss": 0.6128, "lr": 0.0001265809578688691, "epoch": 0.6658660261542567, "percentage": 33.29, "elapsed_time": "4:23:21", "remaining_time": "8:47:39"} +{"current_steps": 2500, "total_steps": 7494, "loss": 0.6182, "lr": 0.00012645400293954714, "epoch": 0.6672004270082733, "percentage": 33.36, "elapsed_time": "4:24:06", "remaining_time": "8:47:34"} +{"current_steps": 2505, "total_steps": 7494, "loss": 0.6264, "lr": 0.0001263267688692435, "epoch": 0.6685348278622898, "percentage": 33.43, "elapsed_time": "4:24:58", "remaining_time": "8:47:43"} +{"current_steps": 2510, "total_steps": 7494, "loss": 0.6123, "lr": 0.00012619925634821052, "epoch": 0.6698692287163064, "percentage": 33.49, "elapsed_time": "4:25:43", "remaining_time": "8:47:38"} +{"current_steps": 2515, "total_steps": 7494, "loss": 0.6048, "lr": 0.00012607146606821105, "epoch": 0.671203629570323, "percentage": 33.56, "elapsed_time": "4:26:32", "remaining_time": "8:47:40"} +{"current_steps": 2520, "total_steps": 7494, "loss": 0.6174, "lr": 0.00012594339872251483, "epoch": 0.6725380304243395, "percentage": 33.63, "elapsed_time": "4:27:18", "remaining_time": "8:47:36"} +{"current_steps": 2525, "total_steps": 7494, "loss": 0.6156, "lr": 0.00012581505500589474, "epoch": 0.673872431278356, "percentage": 33.69, "elapsed_time": "4:28:01", "remaining_time": "8:47:27"} +{"current_steps": 2530, "total_steps": 7494, "loss": 0.6093, "lr": 0.00012568643561462298, "epoch": 0.6752068321323725, "percentage": 33.76, "elapsed_time": "4:28:46", "remaining_time": "8:47:20"} +{"current_steps": 2535, "total_steps": 7494, "loss": 0.6061, "lr": 0.00012555754124646729, "epoch": 0.6765412329863891, "percentage": 33.83, "elapsed_time": "4:29:34", "remaining_time": "8:47:20"} +{"current_steps": 2540, "total_steps": 7494, "loss": 0.6034, "lr": 0.0001254283726006871, "epoch": 0.6778756338404056, "percentage": 33.89, "elapsed_time": "4:30:20", "remaining_time": "8:47:15"} +{"current_steps": 2545, "total_steps": 7494, "loss": 0.6168, "lr": 0.00012529893037803, "epoch": 0.6792100346944222, "percentage": 33.96, "elapsed_time": "4:31:03", "remaining_time": "8:47:05"} +{"current_steps": 2550, "total_steps": 7494, "loss": 0.6037, "lr": 0.00012516921528072752, "epoch": 0.6805444355484388, "percentage": 34.03, "elapsed_time": "4:31:48", "remaining_time": "8:46:59"} +{"current_steps": 2555, "total_steps": 7494, "loss": 0.6323, "lr": 0.00012503922801249172, "epoch": 0.6818788364024553, "percentage": 34.09, "elapsed_time": "4:32:33", "remaining_time": "8:46:52"} +{"current_steps": 2560, "total_steps": 7494, "loss": 0.6149, "lr": 0.00012490896927851118, "epoch": 0.6832132372564719, "percentage": 34.16, "elapsed_time": "4:33:21", "remaining_time": "8:46:51"} +{"current_steps": 2565, "total_steps": 7494, "loss": 0.6063, "lr": 0.0001247784397854471, "epoch": 0.6845476381104884, "percentage": 34.23, "elapsed_time": "4:34:04", "remaining_time": "8:46:40"} +{"current_steps": 2570, "total_steps": 7494, "loss": 0.6173, "lr": 0.0001246476402414297, "epoch": 0.685882038964505, "percentage": 34.29, "elapsed_time": "4:34:48", "remaining_time": "8:46:31"} +{"current_steps": 2575, "total_steps": 7494, "loss": 0.6197, "lr": 0.0001245165713560541, "epoch": 0.6872164398185214, "percentage": 34.36, "elapsed_time": "4:35:36", "remaining_time": "8:46:28"} +{"current_steps": 2580, "total_steps": 7494, "loss": 0.621, "lr": 0.00012438523384037675, "epoch": 0.688550840672538, "percentage": 34.43, "elapsed_time": "4:36:22", "remaining_time": "8:46:24"} +{"current_steps": 2585, "total_steps": 7494, "loss": 0.5967, "lr": 0.0001242536284069113, "epoch": 0.6898852415265546, "percentage": 34.49, "elapsed_time": "4:37:06", "remaining_time": "8:46:14"} +{"current_steps": 2590, "total_steps": 7494, "loss": 0.608, "lr": 0.00012412175576962504, "epoch": 0.6912196423805711, "percentage": 34.56, "elapsed_time": "4:37:49", "remaining_time": "8:46:02"} +{"current_steps": 2595, "total_steps": 7494, "loss": 0.6197, "lr": 0.00012398961664393467, "epoch": 0.6925540432345877, "percentage": 34.63, "elapsed_time": "4:38:39", "remaining_time": "8:46:03"} +{"current_steps": 2600, "total_steps": 7494, "loss": 0.6225, "lr": 0.0001238572117467027, "epoch": 0.6938884440886042, "percentage": 34.69, "elapsed_time": "4:39:26", "remaining_time": "8:45:59"} +{"current_steps": 2605, "total_steps": 7494, "loss": 0.6049, "lr": 0.0001237245417962335, "epoch": 0.6952228449426208, "percentage": 34.76, "elapsed_time": "4:40:20", "remaining_time": "8:46:08"} +{"current_steps": 2610, "total_steps": 7494, "loss": 0.6206, "lr": 0.0001235916075122693, "epoch": 0.6965572457966374, "percentage": 34.83, "elapsed_time": "4:41:02", "remaining_time": "8:45:54"} +{"current_steps": 2615, "total_steps": 7494, "loss": 0.6321, "lr": 0.00012345840961598638, "epoch": 0.6978916466506538, "percentage": 34.89, "elapsed_time": "4:41:50", "remaining_time": "8:45:51"} +{"current_steps": 2620, "total_steps": 7494, "loss": 0.6159, "lr": 0.00012332494882999113, "epoch": 0.6992260475046704, "percentage": 34.96, "elapsed_time": "4:42:39", "remaining_time": "8:45:49"} +{"current_steps": 2625, "total_steps": 7494, "loss": 0.6, "lr": 0.00012319122587831614, "epoch": 0.7005604483586869, "percentage": 35.03, "elapsed_time": "4:43:21", "remaining_time": "8:45:36"} +{"current_steps": 2630, "total_steps": 7494, "loss": 0.6098, "lr": 0.00012305724148641627, "epoch": 0.7018948492127035, "percentage": 35.09, "elapsed_time": "4:44:04", "remaining_time": "8:45:23"} +{"current_steps": 2635, "total_steps": 7494, "loss": 0.6145, "lr": 0.00012292299638116472, "epoch": 0.70322925006672, "percentage": 35.16, "elapsed_time": "4:44:52", "remaining_time": "8:45:18"} +{"current_steps": 2640, "total_steps": 7494, "loss": 0.6009, "lr": 0.00012278849129084902, "epoch": 0.7045636509207366, "percentage": 35.23, "elapsed_time": "4:45:40", "remaining_time": "8:45:14"} +{"current_steps": 2645, "total_steps": 7494, "loss": 0.6179, "lr": 0.00012265372694516714, "epoch": 0.7058980517747532, "percentage": 35.29, "elapsed_time": "4:46:21", "remaining_time": "8:44:58"} +{"current_steps": 2650, "total_steps": 7494, "loss": 0.6177, "lr": 0.00012251870407522364, "epoch": 0.7072324526287697, "percentage": 35.36, "elapsed_time": "4:47:05", "remaining_time": "8:44:46"} +{"current_steps": 2655, "total_steps": 7494, "loss": 0.6005, "lr": 0.00012238342341352546, "epoch": 0.7085668534827863, "percentage": 35.43, "elapsed_time": "4:47:52", "remaining_time": "8:44:40"} +{"current_steps": 2660, "total_steps": 7494, "loss": 0.6208, "lr": 0.00012224788569397806, "epoch": 0.7099012543368027, "percentage": 35.5, "elapsed_time": "4:48:37", "remaining_time": "8:44:31"} +{"current_steps": 2665, "total_steps": 7494, "loss": 0.6232, "lr": 0.0001221120916518816, "epoch": 0.7112356551908193, "percentage": 35.56, "elapsed_time": "4:49:21", "remaining_time": "8:44:19"} +{"current_steps": 2670, "total_steps": 7494, "loss": 0.5925, "lr": 0.0001219760420239267, "epoch": 0.7125700560448359, "percentage": 35.63, "elapsed_time": "4:50:04", "remaining_time": "8:44:05"} +{"current_steps": 2675, "total_steps": 7494, "loss": 0.593, "lr": 0.00012183973754819051, "epoch": 0.7139044568988524, "percentage": 35.7, "elapsed_time": "4:50:51", "remaining_time": "8:43:58"} +{"current_steps": 2680, "total_steps": 7494, "loss": 0.6018, "lr": 0.00012170317896413284, "epoch": 0.715238857752869, "percentage": 35.76, "elapsed_time": "4:51:37", "remaining_time": "8:43:50"} +{"current_steps": 2685, "total_steps": 7494, "loss": 0.6038, "lr": 0.00012156636701259202, "epoch": 0.7165732586068855, "percentage": 35.83, "elapsed_time": "4:52:20", "remaining_time": "8:43:36"} +{"current_steps": 2690, "total_steps": 7494, "loss": 0.6007, "lr": 0.00012142930243578092, "epoch": 0.7179076594609021, "percentage": 35.9, "elapsed_time": "4:53:06", "remaining_time": "8:43:26"} +{"current_steps": 2695, "total_steps": 7494, "loss": 0.6157, "lr": 0.00012129198597728285, "epoch": 0.7192420603149186, "percentage": 35.96, "elapsed_time": "4:53:53", "remaining_time": "8:43:20"} +{"current_steps": 2700, "total_steps": 7494, "loss": 0.6158, "lr": 0.00012115441838204767, "epoch": 0.7205764611689351, "percentage": 36.03, "elapsed_time": "4:54:39", "remaining_time": "8:43:10"} +{"current_steps": 2705, "total_steps": 7494, "loss": 0.5824, "lr": 0.00012101660039638766, "epoch": 0.7219108620229517, "percentage": 36.1, "elapsed_time": "4:55:31", "remaining_time": "8:43:12"} +{"current_steps": 2710, "total_steps": 7494, "loss": 0.6129, "lr": 0.00012087853276797346, "epoch": 0.7232452628769682, "percentage": 36.16, "elapsed_time": "4:56:14", "remaining_time": "8:42:57"} +{"current_steps": 2715, "total_steps": 7494, "loss": 0.6202, "lr": 0.00012074021624583005, "epoch": 0.7245796637309848, "percentage": 36.23, "elapsed_time": "4:57:01", "remaining_time": "8:42:49"} +{"current_steps": 2720, "total_steps": 7494, "loss": 0.5989, "lr": 0.00012060165158033268, "epoch": 0.7259140645850013, "percentage": 36.3, "elapsed_time": "4:57:46", "remaining_time": "8:42:38"} +{"current_steps": 2725, "total_steps": 7494, "loss": 0.613, "lr": 0.00012046283952320275, "epoch": 0.7272484654390179, "percentage": 36.36, "elapsed_time": "4:58:31", "remaining_time": "8:42:26"} +{"current_steps": 2730, "total_steps": 7494, "loss": 0.5955, "lr": 0.00012032378082750382, "epoch": 0.7285828662930345, "percentage": 36.43, "elapsed_time": "4:59:13", "remaining_time": "8:42:10"} +{"current_steps": 2735, "total_steps": 7494, "loss": 0.6203, "lr": 0.00012018447624763748, "epoch": 0.729917267147051, "percentage": 36.5, "elapsed_time": "4:59:59", "remaining_time": "8:41:59"} +{"current_steps": 2740, "total_steps": 7494, "loss": 0.6089, "lr": 0.00012004492653933923, "epoch": 0.7312516680010676, "percentage": 36.56, "elapsed_time": "5:00:44", "remaining_time": "8:41:48"} +{"current_steps": 2745, "total_steps": 7494, "loss": 0.6106, "lr": 0.0001199051324596744, "epoch": 0.732586068855084, "percentage": 36.63, "elapsed_time": "5:01:28", "remaining_time": "8:41:33"} +{"current_steps": 2750, "total_steps": 7494, "loss": 0.612, "lr": 0.00011976509476703408, "epoch": 0.7339204697091006, "percentage": 36.7, "elapsed_time": "5:02:11", "remaining_time": "8:41:17"} +{"current_steps": 2755, "total_steps": 7494, "loss": 0.6197, "lr": 0.00011962481422113098, "epoch": 0.7352548705631171, "percentage": 36.76, "elapsed_time": "5:02:57", "remaining_time": "8:41:07"} +{"current_steps": 2760, "total_steps": 7494, "loss": 0.5971, "lr": 0.00011948429158299523, "epoch": 0.7365892714171337, "percentage": 36.83, "elapsed_time": "5:03:41", "remaining_time": "8:40:54"} +{"current_steps": 2765, "total_steps": 7494, "loss": 0.6128, "lr": 0.00011934352761497043, "epoch": 0.7379236722711503, "percentage": 36.9, "elapsed_time": "5:04:26", "remaining_time": "8:40:41"} +{"current_steps": 2770, "total_steps": 7494, "loss": 0.611, "lr": 0.00011920252308070936, "epoch": 0.7392580731251668, "percentage": 36.96, "elapsed_time": "5:05:10", "remaining_time": "8:40:27"} +{"current_steps": 2775, "total_steps": 7494, "loss": 0.6344, "lr": 0.00011906127874516985, "epoch": 0.7405924739791834, "percentage": 37.03, "elapsed_time": "5:05:57", "remaining_time": "8:40:18"} +{"current_steps": 2780, "total_steps": 7494, "loss": 0.6043, "lr": 0.00011891979537461069, "epoch": 0.7419268748331999, "percentage": 37.1, "elapsed_time": "5:06:41", "remaining_time": "8:40:03"} +{"current_steps": 2785, "total_steps": 7494, "loss": 0.6157, "lr": 0.00011877807373658751, "epoch": 0.7432612756872164, "percentage": 37.16, "elapsed_time": "5:07:27", "remaining_time": "8:39:51"} +{"current_steps": 2790, "total_steps": 7494, "loss": 0.5936, "lr": 0.00011863611459994845, "epoch": 0.7445956765412329, "percentage": 37.23, "elapsed_time": "5:08:11", "remaining_time": "8:39:37"} +{"current_steps": 2795, "total_steps": 7494, "loss": 0.6124, "lr": 0.00011849391873483016, "epoch": 0.7459300773952495, "percentage": 37.3, "elapsed_time": "5:08:57", "remaining_time": "8:39:26"} +{"current_steps": 2800, "total_steps": 7494, "loss": 0.5987, "lr": 0.00011835148691265355, "epoch": 0.7472644782492661, "percentage": 37.36, "elapsed_time": "5:09:42", "remaining_time": "8:39:11"} +{"current_steps": 2805, "total_steps": 7494, "loss": 0.6139, "lr": 0.00011820881990611963, "epoch": 0.7485988791032826, "percentage": 37.43, "elapsed_time": "5:10:35", "remaining_time": "8:39:12"} +{"current_steps": 2810, "total_steps": 7494, "loss": 0.6111, "lr": 0.00011806591848920521, "epoch": 0.7499332799572992, "percentage": 37.5, "elapsed_time": "5:11:19", "remaining_time": "8:38:56"} +{"current_steps": 2815, "total_steps": 7494, "loss": 0.6255, "lr": 0.00011792278343715892, "epoch": 0.7512676808113157, "percentage": 37.56, "elapsed_time": "5:12:04", "remaining_time": "8:38:42"} +{"current_steps": 2820, "total_steps": 7494, "loss": 0.6097, "lr": 0.00011777941552649674, "epoch": 0.7526020816653323, "percentage": 37.63, "elapsed_time": "5:12:49", "remaining_time": "8:38:28"} +{"current_steps": 2825, "total_steps": 7494, "loss": 0.6251, "lr": 0.00011763581553499803, "epoch": 0.7539364825193489, "percentage": 37.7, "elapsed_time": "5:13:31", "remaining_time": "8:38:10"} +{"current_steps": 2830, "total_steps": 7494, "loss": 0.5954, "lr": 0.00011749198424170117, "epoch": 0.7552708833733653, "percentage": 37.76, "elapsed_time": "5:14:16", "remaining_time": "8:37:57"} +{"current_steps": 2835, "total_steps": 7494, "loss": 0.6087, "lr": 0.00011734792242689934, "epoch": 0.7566052842273819, "percentage": 37.83, "elapsed_time": "5:15:02", "remaining_time": "8:37:44"} +{"current_steps": 2840, "total_steps": 7494, "loss": 0.6068, "lr": 0.00011720363087213629, "epoch": 0.7579396850813984, "percentage": 37.9, "elapsed_time": "5:15:47", "remaining_time": "8:37:30"} +{"current_steps": 2845, "total_steps": 7494, "loss": 0.6124, "lr": 0.00011705911036020222, "epoch": 0.759274085935415, "percentage": 37.96, "elapsed_time": "5:16:32", "remaining_time": "8:37:15"} +{"current_steps": 2850, "total_steps": 7494, "loss": 0.614, "lr": 0.00011691436167512938, "epoch": 0.7606084867894315, "percentage": 38.03, "elapsed_time": "5:17:15", "remaining_time": "8:36:57"} +{"current_steps": 2855, "total_steps": 7494, "loss": 0.6254, "lr": 0.00011676938560218781, "epoch": 0.7619428876434481, "percentage": 38.1, "elapsed_time": "5:18:05", "remaining_time": "8:36:50"} +{"current_steps": 2860, "total_steps": 7494, "loss": 0.5968, "lr": 0.00011662418292788127, "epoch": 0.7632772884974647, "percentage": 38.16, "elapsed_time": "5:18:49", "remaining_time": "8:36:34"} +{"current_steps": 2865, "total_steps": 7494, "loss": 0.6114, "lr": 0.00011647875443994271, "epoch": 0.7646116893514812, "percentage": 38.23, "elapsed_time": "5:19:32", "remaining_time": "8:36:17"} +{"current_steps": 2870, "total_steps": 7494, "loss": 0.612, "lr": 0.00011633310092733027, "epoch": 0.7659460902054978, "percentage": 38.3, "elapsed_time": "5:20:16", "remaining_time": "8:36:01"} +{"current_steps": 2875, "total_steps": 7494, "loss": 0.6033, "lr": 0.00011618722318022273, "epoch": 0.7672804910595142, "percentage": 38.36, "elapsed_time": "5:21:01", "remaining_time": "8:35:45"} +{"current_steps": 2880, "total_steps": 7494, "loss": 0.6155, "lr": 0.00011604112199001546, "epoch": 0.7686148919135308, "percentage": 38.43, "elapsed_time": "5:21:46", "remaining_time": "8:35:30"} +{"current_steps": 2885, "total_steps": 7494, "loss": 0.6315, "lr": 0.00011589479814931598, "epoch": 0.7699492927675474, "percentage": 38.5, "elapsed_time": "5:22:29", "remaining_time": "8:35:13"} +{"current_steps": 2890, "total_steps": 7494, "loss": 0.6069, "lr": 0.0001157482524519397, "epoch": 0.7712836936215639, "percentage": 38.56, "elapsed_time": "5:23:12", "remaining_time": "8:34:54"} +{"current_steps": 2895, "total_steps": 7494, "loss": 0.6207, "lr": 0.00011560148569290558, "epoch": 0.7726180944755805, "percentage": 38.63, "elapsed_time": "5:23:59", "remaining_time": "8:34:41"} +{"current_steps": 2900, "total_steps": 7494, "loss": 0.61, "lr": 0.00011545449866843194, "epoch": 0.773952495329597, "percentage": 38.7, "elapsed_time": "5:24:45", "remaining_time": "8:34:26"} +{"current_steps": 2905, "total_steps": 7494, "loss": 0.6188, "lr": 0.00011530729217593198, "epoch": 0.7752868961836136, "percentage": 38.76, "elapsed_time": "5:25:38", "remaining_time": "8:34:24"} +{"current_steps": 2910, "total_steps": 7494, "loss": 0.6055, "lr": 0.00011515986701400955, "epoch": 0.77662129703763, "percentage": 38.83, "elapsed_time": "5:26:21", "remaining_time": "8:34:06"} +{"current_steps": 2915, "total_steps": 7494, "loss": 0.6069, "lr": 0.00011501222398245478, "epoch": 0.7779556978916466, "percentage": 38.9, "elapsed_time": "5:27:08", "remaining_time": "8:33:53"} +{"current_steps": 2920, "total_steps": 7494, "loss": 0.6077, "lr": 0.00011486436388223977, "epoch": 0.7792900987456632, "percentage": 38.96, "elapsed_time": "5:27:55", "remaining_time": "8:33:39"} +{"current_steps": 2925, "total_steps": 7494, "loss": 0.6068, "lr": 0.00011471628751551426, "epoch": 0.7806244995996797, "percentage": 39.03, "elapsed_time": "5:29:28", "remaining_time": "8:34:39"} +{"current_steps": 2930, "total_steps": 7494, "loss": 0.6103, "lr": 0.0001145679956856012, "epoch": 0.7819589004536963, "percentage": 39.1, "elapsed_time": "5:30:10", "remaining_time": "8:34:17"} +{"current_steps": 2935, "total_steps": 7494, "loss": 0.5993, "lr": 0.00011441948919699249, "epoch": 0.7832933013077128, "percentage": 39.16, "elapsed_time": "5:31:33", "remaining_time": "8:35:00"} +{"current_steps": 2940, "total_steps": 7494, "loss": 0.6165, "lr": 0.00011427076885534445, "epoch": 0.7846277021617294, "percentage": 39.23, "elapsed_time": "5:32:18", "remaining_time": "8:34:44"} +{"current_steps": 2945, "total_steps": 7494, "loss": 0.6275, "lr": 0.00011412183546747374, "epoch": 0.785962103015746, "percentage": 39.3, "elapsed_time": "5:33:01", "remaining_time": "8:34:24"} +{"current_steps": 2950, "total_steps": 7494, "loss": 0.6104, "lr": 0.00011397268984135266, "epoch": 0.7872965038697625, "percentage": 39.36, "elapsed_time": "5:33:44", "remaining_time": "8:34:03"} +{"current_steps": 2955, "total_steps": 7494, "loss": 0.6128, "lr": 0.00011382333278610503, "epoch": 0.7886309047237791, "percentage": 39.43, "elapsed_time": "5:34:31", "remaining_time": "8:33:49"} +{"current_steps": 2960, "total_steps": 7494, "loss": 0.5935, "lr": 0.00011367376511200157, "epoch": 0.7899653055777955, "percentage": 39.5, "elapsed_time": "5:35:18", "remaining_time": "8:33:37"} +{"current_steps": 2965, "total_steps": 7494, "loss": 0.6111, "lr": 0.00011352398763045569, "epoch": 0.7912997064318121, "percentage": 39.56, "elapsed_time": "5:35:58", "remaining_time": "8:33:11"} +{"current_steps": 2970, "total_steps": 7494, "loss": 0.5908, "lr": 0.00011337400115401905, "epoch": 0.7926341072858286, "percentage": 39.63, "elapsed_time": "5:36:41", "remaining_time": "8:32:51"} +{"current_steps": 2975, "total_steps": 7494, "loss": 0.6056, "lr": 0.00011322380649637704, "epoch": 0.7939685081398452, "percentage": 39.7, "elapsed_time": "5:37:27", "remaining_time": "8:32:36"} +{"current_steps": 2980, "total_steps": 7494, "loss": 0.6138, "lr": 0.00011307340447234449, "epoch": 0.7953029089938618, "percentage": 39.77, "elapsed_time": "5:38:14", "remaining_time": "8:32:21"} +{"current_steps": 2985, "total_steps": 7494, "loss": 0.5993, "lr": 0.00011292279589786115, "epoch": 0.7966373098478783, "percentage": 39.83, "elapsed_time": "5:38:56", "remaining_time": "8:31:59"} +{"current_steps": 2990, "total_steps": 7494, "loss": 0.6094, "lr": 0.00011277198158998744, "epoch": 0.7979717107018949, "percentage": 39.9, "elapsed_time": "5:39:38", "remaining_time": "8:31:36"} +{"current_steps": 2995, "total_steps": 7494, "loss": 0.6156, "lr": 0.00011262096236689978, "epoch": 0.7993061115559114, "percentage": 39.97, "elapsed_time": "5:40:26", "remaining_time": "8:31:24"} +{"current_steps": 3000, "total_steps": 7494, "loss": 0.5946, "lr": 0.0001124697390478863, "epoch": 0.800640512409928, "percentage": 40.03, "elapsed_time": "5:41:11", "remaining_time": "8:31:05"} +{"current_steps": 3005, "total_steps": 7494, "loss": 0.6174, "lr": 0.00011231831245334238, "epoch": 0.8019749132639445, "percentage": 40.1, "elapsed_time": "5:42:01", "remaining_time": "8:30:56"} +{"current_steps": 3010, "total_steps": 7494, "loss": 0.5986, "lr": 0.00011216668340476618, "epoch": 0.803309314117961, "percentage": 40.17, "elapsed_time": "5:42:44", "remaining_time": "8:30:35"} +{"current_steps": 3015, "total_steps": 7494, "loss": 0.6186, "lr": 0.00011201485272475416, "epoch": 0.8046437149719776, "percentage": 40.23, "elapsed_time": "5:43:28", "remaining_time": "8:30:15"} +{"current_steps": 3020, "total_steps": 7494, "loss": 0.6125, "lr": 0.00011186282123699664, "epoch": 0.8059781158259941, "percentage": 40.3, "elapsed_time": "5:44:15", "remaining_time": "8:30:00"} +{"current_steps": 3025, "total_steps": 7494, "loss": 0.6114, "lr": 0.00011171058976627341, "epoch": 0.8073125166800107, "percentage": 40.37, "elapsed_time": "5:44:58", "remaining_time": "8:29:38"} +{"current_steps": 3030, "total_steps": 7494, "loss": 0.6052, "lr": 0.00011155815913844906, "epoch": 0.8086469175340272, "percentage": 40.43, "elapsed_time": "5:45:39", "remaining_time": "8:29:14"} +{"current_steps": 3035, "total_steps": 7494, "loss": 0.6166, "lr": 0.00011140553018046872, "epoch": 0.8099813183880438, "percentage": 40.5, "elapsed_time": "5:46:23", "remaining_time": "8:28:54"} +{"current_steps": 3040, "total_steps": 7494, "loss": 0.6056, "lr": 0.00011125270372035342, "epoch": 0.8113157192420604, "percentage": 40.57, "elapsed_time": "5:47:07", "remaining_time": "8:28:35"} +{"current_steps": 3045, "total_steps": 7494, "loss": 0.6035, "lr": 0.00011109968058719565, "epoch": 0.8126501200960768, "percentage": 40.63, "elapsed_time": "5:47:49", "remaining_time": "8:28:12"} +{"current_steps": 3050, "total_steps": 7494, "loss": 0.5999, "lr": 0.00011094646161115489, "epoch": 0.8139845209500934, "percentage": 40.7, "elapsed_time": "5:48:30", "remaining_time": "8:27:47"} +{"current_steps": 3055, "total_steps": 7494, "loss": 0.6041, "lr": 0.00011079304762345307, "epoch": 0.8153189218041099, "percentage": 40.77, "elapsed_time": "5:49:44", "remaining_time": "8:28:11"} +{"current_steps": 3060, "total_steps": 7494, "loss": 0.5932, "lr": 0.00011063943945637005, "epoch": 0.8166533226581265, "percentage": 40.83, "elapsed_time": "5:50:31", "remaining_time": "8:27:54"} +{"current_steps": 3065, "total_steps": 7494, "loss": 0.6041, "lr": 0.00011048563794323915, "epoch": 0.817987723512143, "percentage": 40.9, "elapsed_time": "5:51:16", "remaining_time": "8:27:36"} +{"current_steps": 3070, "total_steps": 7494, "loss": 0.6086, "lr": 0.00011033164391844259, "epoch": 0.8193221243661596, "percentage": 40.97, "elapsed_time": "5:51:57", "remaining_time": "8:27:11"} +{"current_steps": 3075, "total_steps": 7494, "loss": 0.6091, "lr": 0.00011017745821740696, "epoch": 0.8206565252201762, "percentage": 41.03, "elapsed_time": "5:52:42", "remaining_time": "8:26:52"} +{"current_steps": 3080, "total_steps": 7494, "loss": 0.6186, "lr": 0.00011002308167659877, "epoch": 0.8219909260741927, "percentage": 41.1, "elapsed_time": "5:53:29", "remaining_time": "8:26:35"} +{"current_steps": 3085, "total_steps": 7494, "loss": 0.6211, "lr": 0.00010986851513351976, "epoch": 0.8233253269282093, "percentage": 41.17, "elapsed_time": "5:54:14", "remaining_time": "8:26:16"} +{"current_steps": 3090, "total_steps": 7494, "loss": 0.6453, "lr": 0.00010971375942670251, "epoch": 0.8246597277822257, "percentage": 41.23, "elapsed_time": "5:54:55", "remaining_time": "8:25:51"} +{"current_steps": 3095, "total_steps": 7494, "loss": 0.6047, "lr": 0.00010955881539570581, "epoch": 0.8259941286362423, "percentage": 41.3, "elapsed_time": "5:55:40", "remaining_time": "8:25:31"} +{"current_steps": 3100, "total_steps": 7494, "loss": 0.5913, "lr": 0.00010940368388111008, "epoch": 0.8273285294902589, "percentage": 41.37, "elapsed_time": "5:56:26", "remaining_time": "8:25:13"} +{"current_steps": 3105, "total_steps": 7494, "loss": 0.6101, "lr": 0.00010924836572451287, "epoch": 0.8286629303442754, "percentage": 41.43, "elapsed_time": "5:57:21", "remaining_time": "8:25:07"} +{"current_steps": 3110, "total_steps": 7494, "loss": 0.6102, "lr": 0.00010909286176852432, "epoch": 0.829997331198292, "percentage": 41.5, "elapsed_time": "5:58:02", "remaining_time": "8:24:42"} +{"current_steps": 3115, "total_steps": 7494, "loss": 0.6019, "lr": 0.0001089371728567625, "epoch": 0.8313317320523085, "percentage": 41.57, "elapsed_time": "5:58:44", "remaining_time": "8:24:19"} +{"current_steps": 3120, "total_steps": 7494, "loss": 0.6014, "lr": 0.00010878129983384886, "epoch": 0.8326661329063251, "percentage": 41.63, "elapsed_time": "5:59:31", "remaining_time": "8:24:01"} +{"current_steps": 3125, "total_steps": 7494, "loss": 0.5978, "lr": 0.00010862524354540369, "epoch": 0.8340005337603416, "percentage": 41.7, "elapsed_time": "6:00:17", "remaining_time": "8:23:42"} +{"current_steps": 3130, "total_steps": 7494, "loss": 0.6117, "lr": 0.00010846900483804152, "epoch": 0.8353349346143581, "percentage": 41.77, "elapsed_time": "6:00:59", "remaining_time": "8:23:19"} +{"current_steps": 3135, "total_steps": 7494, "loss": 0.6267, "lr": 0.00010831258455936645, "epoch": 0.8366693354683747, "percentage": 41.83, "elapsed_time": "6:02:12", "remaining_time": "8:23:37"} +{"current_steps": 3140, "total_steps": 7494, "loss": 0.6126, "lr": 0.00010815598355796771, "epoch": 0.8380037363223912, "percentage": 41.9, "elapsed_time": "6:02:57", "remaining_time": "8:23:16"} +{"current_steps": 3145, "total_steps": 7494, "loss": 0.6168, "lr": 0.0001079992026834149, "epoch": 0.8393381371764078, "percentage": 41.97, "elapsed_time": "6:03:40", "remaining_time": "8:22:54"} +{"current_steps": 3150, "total_steps": 7494, "loss": 0.6087, "lr": 0.00010784224278625345, "epoch": 0.8406725380304243, "percentage": 42.03, "elapsed_time": "6:04:23", "remaining_time": "8:22:31"} +{"current_steps": 3155, "total_steps": 7494, "loss": 0.5997, "lr": 0.00010768510471799996, "epoch": 0.8420069388844409, "percentage": 42.1, "elapsed_time": "6:05:07", "remaining_time": "8:22:08"} +{"current_steps": 3160, "total_steps": 7494, "loss": 0.6084, "lr": 0.00010752778933113774, "epoch": 0.8433413397384575, "percentage": 42.17, "elapsed_time": "6:05:54", "remaining_time": "8:21:51"} +{"current_steps": 3165, "total_steps": 7494, "loss": 0.6241, "lr": 0.00010737029747911191, "epoch": 0.844675740592474, "percentage": 42.23, "elapsed_time": "6:06:41", "remaining_time": "8:21:32"} +{"current_steps": 3170, "total_steps": 7494, "loss": 0.6125, "lr": 0.00010721263001632503, "epoch": 0.8460101414464906, "percentage": 42.3, "elapsed_time": "6:07:22", "remaining_time": "8:21:06"} +{"current_steps": 3175, "total_steps": 7494, "loss": 0.6148, "lr": 0.00010705478779813235, "epoch": 0.847344542300507, "percentage": 42.37, "elapsed_time": "6:08:05", "remaining_time": "8:20:43"} +{"current_steps": 3180, "total_steps": 7494, "loss": 0.5979, "lr": 0.00010689677168083711, "epoch": 0.8486789431545236, "percentage": 42.43, "elapsed_time": "6:08:52", "remaining_time": "8:20:24"} +{"current_steps": 3185, "total_steps": 7494, "loss": 0.6144, "lr": 0.00010673858252168603, "epoch": 0.8500133440085401, "percentage": 42.5, "elapsed_time": "6:09:39", "remaining_time": "8:20:06"} +{"current_steps": 3190, "total_steps": 7494, "loss": 0.6103, "lr": 0.00010658022117886457, "epoch": 0.8513477448625567, "percentage": 42.57, "elapsed_time": "6:10:21", "remaining_time": "8:19:41"} +{"current_steps": 3195, "total_steps": 7494, "loss": 0.6168, "lr": 0.00010642168851149229, "epoch": 0.8526821457165733, "percentage": 42.63, "elapsed_time": "6:11:29", "remaining_time": "8:19:51"} +{"current_steps": 3200, "total_steps": 7494, "loss": 0.6018, "lr": 0.00010626298537961821, "epoch": 0.8540165465705898, "percentage": 42.7, "elapsed_time": "6:12:15", "remaining_time": "8:19:31"} +{"current_steps": 3205, "total_steps": 7494, "loss": 0.6099, "lr": 0.00010610411264421611, "epoch": 0.8553509474246064, "percentage": 42.77, "elapsed_time": "6:14:13", "remaining_time": "8:20:47"} +{"current_steps": 3210, "total_steps": 7494, "loss": 0.6128, "lr": 0.0001059450711671799, "epoch": 0.8566853482786229, "percentage": 42.83, "elapsed_time": "6:14:57", "remaining_time": "8:20:25"} +{"current_steps": 3215, "total_steps": 7494, "loss": 0.6224, "lr": 0.0001057858618113189, "epoch": 0.8580197491326395, "percentage": 42.9, "elapsed_time": "6:15:39", "remaining_time": "8:19:59"} +{"current_steps": 3220, "total_steps": 7494, "loss": 0.606, "lr": 0.00010562648544035323, "epoch": 0.859354149986656, "percentage": 42.97, "elapsed_time": "6:16:26", "remaining_time": "8:19:40"} +{"current_steps": 3225, "total_steps": 7494, "loss": 0.5854, "lr": 0.00010546694291890902, "epoch": 0.8606885508406725, "percentage": 43.03, "elapsed_time": "6:17:13", "remaining_time": "8:19:20"} +{"current_steps": 3230, "total_steps": 7494, "loss": 0.6144, "lr": 0.00010530723511251382, "epoch": 0.8620229516946891, "percentage": 43.1, "elapsed_time": "6:17:58", "remaining_time": "8:18:58"} +{"current_steps": 3235, "total_steps": 7494, "loss": 0.6078, "lr": 0.0001051473628875918, "epoch": 0.8633573525487056, "percentage": 43.17, "elapsed_time": "6:18:40", "remaining_time": "8:18:31"} +{"current_steps": 3240, "total_steps": 7494, "loss": 0.6201, "lr": 0.00010498732711145918, "epoch": 0.8646917534027222, "percentage": 43.23, "elapsed_time": "6:19:25", "remaining_time": "8:18:10"} +{"current_steps": 3245, "total_steps": 7494, "loss": 0.5843, "lr": 0.00010482712865231942, "epoch": 0.8660261542567387, "percentage": 43.3, "elapsed_time": "6:20:10", "remaining_time": "8:17:48"} +{"current_steps": 3250, "total_steps": 7494, "loss": 0.6054, "lr": 0.00010466676837925857, "epoch": 0.8673605551107553, "percentage": 43.37, "elapsed_time": "6:21:28", "remaining_time": "8:18:09"} +{"current_steps": 3255, "total_steps": 7494, "loss": 0.6173, "lr": 0.00010450624716224045, "epoch": 0.8686949559647719, "percentage": 43.43, "elapsed_time": "6:22:10", "remaining_time": "8:17:43"} +{"current_steps": 3260, "total_steps": 7494, "loss": 0.6004, "lr": 0.00010434556587210214, "epoch": 0.8700293568187883, "percentage": 43.5, "elapsed_time": "6:22:55", "remaining_time": "8:17:19"} +{"current_steps": 3265, "total_steps": 7494, "loss": 0.6214, "lr": 0.000104184725380549, "epoch": 0.8713637576728049, "percentage": 43.57, "elapsed_time": "6:24:17", "remaining_time": "8:17:44"} +{"current_steps": 3270, "total_steps": 7494, "loss": 0.6112, "lr": 0.0001040237265601502, "epoch": 0.8726981585268214, "percentage": 43.63, "elapsed_time": "6:25:14", "remaining_time": "8:17:38"} +{"current_steps": 3275, "total_steps": 7494, "loss": 0.6037, "lr": 0.00010386257028433366, "epoch": 0.874032559380838, "percentage": 43.7, "elapsed_time": "6:25:56", "remaining_time": "8:17:11"} +{"current_steps": 3280, "total_steps": 7494, "loss": 0.6033, "lr": 0.00010370125742738173, "epoch": 0.8753669602348545, "percentage": 43.77, "elapsed_time": "6:26:39", "remaining_time": "8:16:46"} +{"current_steps": 3285, "total_steps": 7494, "loss": 0.6264, "lr": 0.00010353978886442605, "epoch": 0.8767013610888711, "percentage": 43.84, "elapsed_time": "6:27:29", "remaining_time": "8:16:28"} +{"current_steps": 3290, "total_steps": 7494, "loss": 0.6302, "lr": 0.00010337816547144308, "epoch": 0.8780357619428877, "percentage": 43.9, "elapsed_time": "6:28:12", "remaining_time": "8:16:03"} +{"current_steps": 3295, "total_steps": 7494, "loss": 0.6155, "lr": 0.00010321638812524917, "epoch": 0.8793701627969042, "percentage": 43.97, "elapsed_time": "6:31:12", "remaining_time": "8:18:32"} +{"current_steps": 3300, "total_steps": 7494, "loss": 0.6024, "lr": 0.00010305445770349593, "epoch": 0.8807045636509208, "percentage": 44.04, "elapsed_time": "6:31:55", "remaining_time": "8:18:05"} +{"current_steps": 3305, "total_steps": 7494, "loss": 0.6057, "lr": 0.00010289237508466536, "epoch": 0.8820389645049372, "percentage": 44.1, "elapsed_time": "6:32:52", "remaining_time": "8:17:58"} +{"current_steps": 3310, "total_steps": 7494, "loss": 0.5999, "lr": 0.00010273014114806517, "epoch": 0.8833733653589538, "percentage": 44.17, "elapsed_time": "6:33:37", "remaining_time": "8:17:33"} +{"current_steps": 3315, "total_steps": 7494, "loss": 0.6134, "lr": 0.000102567756773824, "epoch": 0.8847077662129704, "percentage": 44.24, "elapsed_time": "6:34:18", "remaining_time": "8:17:05"} +{"current_steps": 3320, "total_steps": 7494, "loss": 0.6009, "lr": 0.00010240522284288657, "epoch": 0.8860421670669869, "percentage": 44.3, "elapsed_time": "6:35:02", "remaining_time": "8:16:39"} +{"current_steps": 3325, "total_steps": 7494, "loss": 0.6131, "lr": 0.00010224254023700899, "epoch": 0.8873765679210035, "percentage": 44.37, "elapsed_time": "6:35:50", "remaining_time": "8:16:18"} +{"current_steps": 3330, "total_steps": 7494, "loss": 0.6147, "lr": 0.00010207970983875395, "epoch": 0.88871096877502, "percentage": 44.44, "elapsed_time": "6:37:33", "remaining_time": "8:17:07"} +{"current_steps": 3335, "total_steps": 7494, "loss": 0.609, "lr": 0.00010191673253148589, "epoch": 0.8900453696290366, "percentage": 44.5, "elapsed_time": "6:38:18", "remaining_time": "8:16:42"} +{"current_steps": 3340, "total_steps": 7494, "loss": 0.611, "lr": 0.00010175360919936623, "epoch": 0.8913797704830531, "percentage": 44.57, "elapsed_time": "6:39:42", "remaining_time": "8:17:07"} +{"current_steps": 3345, "total_steps": 7494, "loss": 0.5914, "lr": 0.00010159034072734865, "epoch": 0.8927141713370697, "percentage": 44.64, "elapsed_time": "6:40:26", "remaining_time": "8:16:41"} +{"current_steps": 3350, "total_steps": 7494, "loss": 0.6028, "lr": 0.00010142692800117416, "epoch": 0.8940485721910862, "percentage": 44.7, "elapsed_time": "6:41:09", "remaining_time": "8:16:14"} +{"current_steps": 3355, "total_steps": 7494, "loss": 0.6085, "lr": 0.00010126337190736636, "epoch": 0.8953829730451027, "percentage": 44.77, "elapsed_time": "6:41:54", "remaining_time": "8:15:49"} +{"current_steps": 3360, "total_steps": 7494, "loss": 0.6069, "lr": 0.00010109967333322669, "epoch": 0.8967173738991193, "percentage": 44.84, "elapsed_time": "6:42:40", "remaining_time": "8:15:25"} +{"current_steps": 3365, "total_steps": 7494, "loss": 0.6048, "lr": 0.00010093583316682945, "epoch": 0.8980517747531358, "percentage": 44.9, "elapsed_time": "6:43:24", "remaining_time": "8:14:59"} +{"current_steps": 3370, "total_steps": 7494, "loss": 0.6036, "lr": 0.00010077185229701722, "epoch": 0.8993861756071524, "percentage": 44.97, "elapsed_time": "6:44:07", "remaining_time": "8:14:32"} +{"current_steps": 3375, "total_steps": 7494, "loss": 0.5992, "lr": 0.00010060773161339574, "epoch": 0.900720576461169, "percentage": 45.04, "elapsed_time": "6:44:53", "remaining_time": "8:14:08"} +{"current_steps": 3380, "total_steps": 7494, "loss": 0.5989, "lr": 0.00010044347200632943, "epoch": 0.9020549773151855, "percentage": 45.1, "elapsed_time": "6:45:37", "remaining_time": "8:13:42"} +{"current_steps": 3385, "total_steps": 7494, "loss": 0.6095, "lr": 0.00010027907436693623, "epoch": 0.9033893781692021, "percentage": 45.17, "elapsed_time": "6:46:22", "remaining_time": "8:13:17"} +{"current_steps": 3390, "total_steps": 7494, "loss": 0.6125, "lr": 0.00010011453958708297, "epoch": 0.9047237790232185, "percentage": 45.24, "elapsed_time": "6:47:08", "remaining_time": "8:12:53"} +{"current_steps": 3395, "total_steps": 7494, "loss": 0.609, "lr": 9.994986855938047e-05, "epoch": 0.9060581798772351, "percentage": 45.3, "elapsed_time": "6:47:49", "remaining_time": "8:12:23"} +{"current_steps": 3400, "total_steps": 7494, "loss": 0.6019, "lr": 9.978506217717874e-05, "epoch": 0.9073925807312516, "percentage": 45.37, "elapsed_time": "6:48:34", "remaining_time": "8:11:58"} +{"current_steps": 3405, "total_steps": 7494, "loss": 0.6129, "lr": 9.962012133456204e-05, "epoch": 0.9087269815852682, "percentage": 45.44, "elapsed_time": "6:49:30", "remaining_time": "8:11:46"} +{"current_steps": 3410, "total_steps": 7494, "loss": 0.5989, "lr": 9.945504692634409e-05, "epoch": 0.9100613824392848, "percentage": 45.5, "elapsed_time": "6:50:17", "remaining_time": "8:11:22"} +{"current_steps": 3415, "total_steps": 7494, "loss": 0.6009, "lr": 9.928983984806326e-05, "epoch": 0.9113957832933013, "percentage": 45.57, "elapsed_time": "6:51:00", "remaining_time": "8:10:55"} +{"current_steps": 3420, "total_steps": 7494, "loss": 0.6028, "lr": 9.912450099597765e-05, "epoch": 0.9127301841473179, "percentage": 45.64, "elapsed_time": "6:51:45", "remaining_time": "8:10:29"} +{"current_steps": 3425, "total_steps": 7494, "loss": 0.608, "lr": 9.895903126706019e-05, "epoch": 0.9140645850013344, "percentage": 45.7, "elapsed_time": "6:52:52", "remaining_time": "8:10:30"} +{"current_steps": 3430, "total_steps": 7494, "loss": 0.5938, "lr": 9.879343155899382e-05, "epoch": 0.915398985855351, "percentage": 45.77, "elapsed_time": "6:53:38", "remaining_time": "8:10:06"} +{"current_steps": 3435, "total_steps": 7494, "loss": 0.6054, "lr": 9.862770277016676e-05, "epoch": 0.9167333867093675, "percentage": 45.84, "elapsed_time": "6:54:20", "remaining_time": "8:09:36"} +{"current_steps": 3440, "total_steps": 7494, "loss": 0.6017, "lr": 9.846184579966733e-05, "epoch": 0.918067787563384, "percentage": 45.9, "elapsed_time": "6:55:05", "remaining_time": "8:09:10"} +{"current_steps": 3445, "total_steps": 7494, "loss": 0.6113, "lr": 9.829586154727933e-05, "epoch": 0.9194021884174006, "percentage": 45.97, "elapsed_time": "6:55:47", "remaining_time": "8:08:41"} +{"current_steps": 3450, "total_steps": 7494, "loss": 0.5973, "lr": 9.812975091347706e-05, "epoch": 0.9207365892714171, "percentage": 46.04, "elapsed_time": "6:56:33", "remaining_time": "8:08:16"} +{"current_steps": 3455, "total_steps": 7494, "loss": 0.6098, "lr": 9.796351479942047e-05, "epoch": 0.9220709901254337, "percentage": 46.1, "elapsed_time": "6:57:16", "remaining_time": "8:07:48"} +{"current_steps": 3460, "total_steps": 7494, "loss": 0.6065, "lr": 9.779715410695015e-05, "epoch": 0.9234053909794502, "percentage": 46.17, "elapsed_time": "6:58:00", "remaining_time": "8:07:21"} +{"current_steps": 3465, "total_steps": 7494, "loss": 0.6102, "lr": 9.76306697385827e-05, "epoch": 0.9247397918334668, "percentage": 46.24, "elapsed_time": "6:58:43", "remaining_time": "8:06:52"} +{"current_steps": 3470, "total_steps": 7494, "loss": 0.6204, "lr": 9.746406259750552e-05, "epoch": 0.9260741926874834, "percentage": 46.3, "elapsed_time": "6:59:29", "remaining_time": "8:06:28"} +{"current_steps": 3475, "total_steps": 7494, "loss": 0.5921, "lr": 9.729733358757213e-05, "epoch": 0.9274085935414998, "percentage": 46.37, "elapsed_time": "7:00:47", "remaining_time": "8:06:39"} +{"current_steps": 3480, "total_steps": 7494, "loss": 0.6044, "lr": 9.713048361329715e-05, "epoch": 0.9287429943955164, "percentage": 46.44, "elapsed_time": "7:01:54", "remaining_time": "8:06:39"} +{"current_steps": 3485, "total_steps": 7494, "loss": 0.6209, "lr": 9.696351357985154e-05, "epoch": 0.9300773952495329, "percentage": 46.5, "elapsed_time": "7:02:39", "remaining_time": "8:06:12"} +{"current_steps": 3490, "total_steps": 7494, "loss": 0.618, "lr": 9.679642439305744e-05, "epoch": 0.9314117961035495, "percentage": 46.57, "elapsed_time": "7:03:25", "remaining_time": "8:05:47"} +{"current_steps": 3495, "total_steps": 7494, "loss": 0.5986, "lr": 9.662921695938354e-05, "epoch": 0.932746196957566, "percentage": 46.64, "elapsed_time": "7:04:09", "remaining_time": "8:05:19"} +{"current_steps": 3500, "total_steps": 7494, "loss": 0.6074, "lr": 9.646189218593992e-05, "epoch": 0.9340805978115826, "percentage": 46.7, "elapsed_time": "7:04:53", "remaining_time": "8:04:51"} +{"current_steps": 3505, "total_steps": 7494, "loss": 0.6169, "lr": 9.629445098047334e-05, "epoch": 0.9354149986655992, "percentage": 46.77, "elapsed_time": "7:06:27", "remaining_time": "8:05:20"} +{"current_steps": 3510, "total_steps": 7494, "loss": 0.5954, "lr": 9.61268942513621e-05, "epoch": 0.9367493995196157, "percentage": 46.84, "elapsed_time": "7:07:12", "remaining_time": "8:04:54"} +{"current_steps": 3515, "total_steps": 7494, "loss": 0.6126, "lr": 9.595922290761128e-05, "epoch": 0.9380838003736323, "percentage": 46.9, "elapsed_time": "7:08:38", "remaining_time": "8:05:13"} +{"current_steps": 3520, "total_steps": 7494, "loss": 0.5916, "lr": 9.579143785884779e-05, "epoch": 0.9394182012276487, "percentage": 46.97, "elapsed_time": "7:09:21", "remaining_time": "8:04:44"} +{"current_steps": 3525, "total_steps": 7494, "loss": 0.6158, "lr": 9.562354001531532e-05, "epoch": 0.9407526020816653, "percentage": 47.04, "elapsed_time": "7:11:31", "remaining_time": "8:05:52"} +{"current_steps": 3530, "total_steps": 7494, "loss": 0.5935, "lr": 9.545553028786952e-05, "epoch": 0.9420870029356819, "percentage": 47.1, "elapsed_time": "7:12:17", "remaining_time": "8:05:26"} +{"current_steps": 3535, "total_steps": 7494, "loss": 0.6033, "lr": 9.5287409587973e-05, "epoch": 0.9434214037896984, "percentage": 47.17, "elapsed_time": "7:13:01", "remaining_time": "8:04:58"} +{"current_steps": 3540, "total_steps": 7494, "loss": 0.6005, "lr": 9.511917882769042e-05, "epoch": 0.944755804643715, "percentage": 47.24, "elapsed_time": "7:14:43", "remaining_time": "8:05:33"} +{"current_steps": 3545, "total_steps": 7494, "loss": 0.6097, "lr": 9.495083891968351e-05, "epoch": 0.9460902054977315, "percentage": 47.3, "elapsed_time": "7:15:55", "remaining_time": "8:05:36"} +{"current_steps": 3550, "total_steps": 7494, "loss": 0.6122, "lr": 9.478239077720615e-05, "epoch": 0.9474246063517481, "percentage": 47.37, "elapsed_time": "7:16:41", "remaining_time": "8:05:09"} +{"current_steps": 3555, "total_steps": 7494, "loss": 0.6013, "lr": 9.461383531409937e-05, "epoch": 0.9487590072057646, "percentage": 47.44, "elapsed_time": "7:17:27", "remaining_time": "8:04:43"} +{"current_steps": 3560, "total_steps": 7494, "loss": 0.6099, "lr": 9.444517344478645e-05, "epoch": 0.9500934080597812, "percentage": 47.5, "elapsed_time": "7:18:39", "remaining_time": "8:04:44"} +{"current_steps": 3565, "total_steps": 7494, "loss": 0.6045, "lr": 9.427640608426789e-05, "epoch": 0.9514278089137977, "percentage": 47.57, "elapsed_time": "7:19:23", "remaining_time": "8:04:15"} +{"current_steps": 3570, "total_steps": 7494, "loss": 0.5991, "lr": 9.410753414811654e-05, "epoch": 0.9527622097678142, "percentage": 47.64, "elapsed_time": "7:20:10", "remaining_time": "8:03:49"} +{"current_steps": 3575, "total_steps": 7494, "loss": 0.6299, "lr": 9.393855855247254e-05, "epoch": 0.9540966106218308, "percentage": 47.7, "elapsed_time": "7:20:54", "remaining_time": "8:03:20"} +{"current_steps": 3580, "total_steps": 7494, "loss": 0.6189, "lr": 9.376948021403838e-05, "epoch": 0.9554310114758473, "percentage": 47.77, "elapsed_time": "7:21:39", "remaining_time": "8:02:51"} +{"current_steps": 3585, "total_steps": 7494, "loss": 0.6087, "lr": 9.360030005007399e-05, "epoch": 0.9567654123298639, "percentage": 47.84, "elapsed_time": "7:22:23", "remaining_time": "8:02:22"} +{"current_steps": 3590, "total_steps": 7494, "loss": 0.6124, "lr": 9.343101897839169e-05, "epoch": 0.9580998131838805, "percentage": 47.9, "elapsed_time": "7:23:32", "remaining_time": "8:02:20"} +{"current_steps": 3595, "total_steps": 7494, "loss": 0.5915, "lr": 9.326163791735116e-05, "epoch": 0.959434214037897, "percentage": 47.97, "elapsed_time": "7:24:16", "remaining_time": "8:01:50"} +{"current_steps": 3600, "total_steps": 7494, "loss": 0.6081, "lr": 9.309215778585461e-05, "epoch": 0.9607686148919136, "percentage": 48.04, "elapsed_time": "7:25:35", "remaining_time": "8:01:59"} +{"current_steps": 3605, "total_steps": 7494, "loss": 0.6151, "lr": 9.29225795033417e-05, "epoch": 0.96210301574593, "percentage": 48.11, "elapsed_time": "7:26:27", "remaining_time": "8:01:37"} +{"current_steps": 3610, "total_steps": 7494, "loss": 0.6258, "lr": 9.275290398978454e-05, "epoch": 0.9634374165999466, "percentage": 48.17, "elapsed_time": "7:27:15", "remaining_time": "8:01:12"} +{"current_steps": 3615, "total_steps": 7494, "loss": 0.6089, "lr": 9.258313216568273e-05, "epoch": 0.9647718174539631, "percentage": 48.24, "elapsed_time": "7:28:02", "remaining_time": "8:00:45"} +{"current_steps": 3620, "total_steps": 7494, "loss": 0.6155, "lr": 9.241326495205836e-05, "epoch": 0.9661062183079797, "percentage": 48.31, "elapsed_time": "7:28:47", "remaining_time": "8:00:16"} +{"current_steps": 3625, "total_steps": 7494, "loss": 0.5971, "lr": 9.224330327045105e-05, "epoch": 0.9674406191619963, "percentage": 48.37, "elapsed_time": "7:29:32", "remaining_time": "7:59:48"} +{"current_steps": 3630, "total_steps": 7494, "loss": 0.6101, "lr": 9.207324804291285e-05, "epoch": 0.9687750200160128, "percentage": 48.44, "elapsed_time": "7:30:16", "remaining_time": "7:59:18"} +{"current_steps": 3635, "total_steps": 7494, "loss": 0.6062, "lr": 9.190310019200338e-05, "epoch": 0.9701094208700294, "percentage": 48.51, "elapsed_time": "7:31:05", "remaining_time": "7:58:53"} +{"current_steps": 3640, "total_steps": 7494, "loss": 0.6246, "lr": 9.173286064078465e-05, "epoch": 0.9714438217240459, "percentage": 48.57, "elapsed_time": "7:31:50", "remaining_time": "7:58:23"} +{"current_steps": 3645, "total_steps": 7494, "loss": 0.6205, "lr": 9.156253031281625e-05, "epoch": 0.9727782225780625, "percentage": 48.64, "elapsed_time": "7:32:33", "remaining_time": "7:57:53"} +{"current_steps": 3650, "total_steps": 7494, "loss": 0.6159, "lr": 9.139211013215013e-05, "epoch": 0.974112623432079, "percentage": 48.71, "elapsed_time": "7:33:18", "remaining_time": "7:57:24"} +{"current_steps": 3655, "total_steps": 7494, "loss": 0.6124, "lr": 9.122160102332583e-05, "epoch": 0.9754470242860955, "percentage": 48.77, "elapsed_time": "7:34:05", "remaining_time": "7:56:56"} +{"current_steps": 3660, "total_steps": 7494, "loss": 0.5969, "lr": 9.105100391136523e-05, "epoch": 0.9767814251401121, "percentage": 48.84, "elapsed_time": "7:34:49", "remaining_time": "7:56:27"} +{"current_steps": 3665, "total_steps": 7494, "loss": 0.597, "lr": 9.088031972176764e-05, "epoch": 0.9781158259941286, "percentage": 48.91, "elapsed_time": "7:35:33", "remaining_time": "7:55:56"} +{"current_steps": 3670, "total_steps": 7494, "loss": 0.6177, "lr": 9.070954938050482e-05, "epoch": 0.9794502268481452, "percentage": 48.97, "elapsed_time": "7:37:06", "remaining_time": "7:56:17"} +{"current_steps": 3675, "total_steps": 7494, "loss": 0.6078, "lr": 9.053869381401589e-05, "epoch": 0.9807846277021617, "percentage": 49.04, "elapsed_time": "7:37:52", "remaining_time": "7:55:49"} +{"current_steps": 3680, "total_steps": 7494, "loss": 0.6087, "lr": 9.036775394920228e-05, "epoch": 0.9821190285561783, "percentage": 49.11, "elapsed_time": "7:38:59", "remaining_time": "7:55:42"} +{"current_steps": 3685, "total_steps": 7494, "loss": 0.6044, "lr": 9.01967307134228e-05, "epoch": 0.9834534294101949, "percentage": 49.17, "elapsed_time": "7:39:42", "remaining_time": "7:55:10"} +{"current_steps": 3690, "total_steps": 7494, "loss": 0.5962, "lr": 9.00256250344885e-05, "epoch": 0.9847878302642114, "percentage": 49.24, "elapsed_time": "7:40:26", "remaining_time": "7:54:40"} +{"current_steps": 3695, "total_steps": 7494, "loss": 0.5963, "lr": 8.985443784065774e-05, "epoch": 0.9861222311182279, "percentage": 49.31, "elapsed_time": "7:41:13", "remaining_time": "7:54:12"} +{"current_steps": 3700, "total_steps": 7494, "loss": 0.6052, "lr": 8.968317006063107e-05, "epoch": 0.9874566319722444, "percentage": 49.37, "elapsed_time": "7:41:57", "remaining_time": "7:53:41"} +{"current_steps": 3705, "total_steps": 7494, "loss": 0.5855, "lr": 8.951182262354624e-05, "epoch": 0.988791032826261, "percentage": 49.44, "elapsed_time": "7:43:22", "remaining_time": "7:53:53"} +{"current_steps": 3710, "total_steps": 7494, "loss": 0.6119, "lr": 8.934039645897316e-05, "epoch": 0.9901254336802775, "percentage": 49.51, "elapsed_time": "7:44:09", "remaining_time": "7:53:25"} +{"current_steps": 3715, "total_steps": 7494, "loss": 0.6218, "lr": 8.916889249690877e-05, "epoch": 0.9914598345342941, "percentage": 49.57, "elapsed_time": "7:44:55", "remaining_time": "7:52:56"} +{"current_steps": 3720, "total_steps": 7494, "loss": 0.6203, "lr": 8.899731166777216e-05, "epoch": 0.9927942353883107, "percentage": 49.64, "elapsed_time": "7:45:38", "remaining_time": "7:52:24"} +{"current_steps": 3725, "total_steps": 7494, "loss": 0.5876, "lr": 8.882565490239935e-05, "epoch": 0.9941286362423272, "percentage": 49.71, "elapsed_time": "7:46:21", "remaining_time": "7:51:52"} +{"current_steps": 3730, "total_steps": 7494, "loss": 0.6016, "lr": 8.865392313203839e-05, "epoch": 0.9954630370963438, "percentage": 49.77, "elapsed_time": "7:47:09", "remaining_time": "7:51:24"} +{"current_steps": 3735, "total_steps": 7494, "loss": 0.625, "lr": 8.848211728834415e-05, "epoch": 0.9967974379503602, "percentage": 49.84, "elapsed_time": "7:47:53", "remaining_time": "7:50:53"} +{"current_steps": 3740, "total_steps": 7494, "loss": 0.6217, "lr": 8.831023830337348e-05, "epoch": 0.9981318388043768, "percentage": 49.91, "elapsed_time": "7:48:39", "remaining_time": "7:50:24"} +{"current_steps": 3745, "total_steps": 7494, "loss": 0.5884, "lr": 8.813828710957987e-05, "epoch": 0.9994662396583934, "percentage": 49.97, "elapsed_time": "7:49:48", "remaining_time": "7:50:18"} +{"current_steps": 3750, "total_steps": 7494, "loss": 0.5954, "lr": 8.796626463980863e-05, "epoch": 1.00080064051241, "percentage": 50.04, "elapsed_time": "7:50:41", "remaining_time": "7:49:56"} +{"current_steps": 3755, "total_steps": 7494, "loss": 0.6026, "lr": 8.779417182729181e-05, "epoch": 1.0021350413664265, "percentage": 50.11, "elapsed_time": "7:52:30", "remaining_time": "7:50:29"} +{"current_steps": 3760, "total_steps": 7494, "loss": 0.6066, "lr": 8.762200960564295e-05, "epoch": 1.003469442220443, "percentage": 50.17, "elapsed_time": "7:54:00", "remaining_time": "7:50:43"} +{"current_steps": 3765, "total_steps": 7494, "loss": 0.6009, "lr": 8.744977890885218e-05, "epoch": 1.0048038430744595, "percentage": 50.24, "elapsed_time": "7:55:18", "remaining_time": "7:50:46"} +{"current_steps": 3770, "total_steps": 7494, "loss": 0.6074, "lr": 8.727748067128116e-05, "epoch": 1.006138243928476, "percentage": 50.31, "elapsed_time": "7:56:07", "remaining_time": "7:50:18"} +{"current_steps": 3775, "total_steps": 7494, "loss": 0.6039, "lr": 8.71051158276579e-05, "epoch": 1.0074726447824927, "percentage": 50.37, "elapsed_time": "7:56:52", "remaining_time": "7:49:48"} +{"current_steps": 3780, "total_steps": 7494, "loss": 0.6119, "lr": 8.693268531307182e-05, "epoch": 1.0088070456365092, "percentage": 50.44, "elapsed_time": "7:58:31", "remaining_time": "7:50:10"} +{"current_steps": 3785, "total_steps": 7494, "loss": 0.6057, "lr": 8.676019006296851e-05, "epoch": 1.0101414464905258, "percentage": 50.51, "elapsed_time": "7:59:15", "remaining_time": "7:49:38"} +{"current_steps": 3790, "total_steps": 7494, "loss": 0.6095, "lr": 8.658763101314484e-05, "epoch": 1.0114758473445422, "percentage": 50.57, "elapsed_time": "8:00:37", "remaining_time": "7:49:43"} +{"current_steps": 3795, "total_steps": 7494, "loss": 0.5956, "lr": 8.64150090997438e-05, "epoch": 1.0128102481985588, "percentage": 50.64, "elapsed_time": "8:01:23", "remaining_time": "7:49:12"} +{"current_steps": 3800, "total_steps": 7494, "loss": 0.607, "lr": 8.624232525924936e-05, "epoch": 1.0141446490525754, "percentage": 50.71, "elapsed_time": "8:02:34", "remaining_time": "7:49:06"} +{"current_steps": 3805, "total_steps": 7494, "loss": 0.6059, "lr": 8.606958042848145e-05, "epoch": 1.015479049906592, "percentage": 50.77, "elapsed_time": "8:03:49", "remaining_time": "7:49:04"} +{"current_steps": 3810, "total_steps": 7494, "loss": 0.5885, "lr": 8.589677554459094e-05, "epoch": 1.0168134507606086, "percentage": 50.84, "elapsed_time": "8:05:03", "remaining_time": "7:49:00"} +{"current_steps": 3815, "total_steps": 7494, "loss": 0.5863, "lr": 8.572391154505444e-05, "epoch": 1.018147851614625, "percentage": 50.91, "elapsed_time": "8:05:51", "remaining_time": "7:48:31"} +{"current_steps": 3820, "total_steps": 7494, "loss": 0.5957, "lr": 8.555098936766927e-05, "epoch": 1.0194822524686415, "percentage": 50.97, "elapsed_time": "8:06:39", "remaining_time": "7:48:03"} +{"current_steps": 3825, "total_steps": 7494, "loss": 0.6157, "lr": 8.537800995054838e-05, "epoch": 1.0208166533226581, "percentage": 51.04, "elapsed_time": "8:07:24", "remaining_time": "7:47:31"} +{"current_steps": 3830, "total_steps": 7494, "loss": 0.5826, "lr": 8.520497423211527e-05, "epoch": 1.0221510541766747, "percentage": 51.11, "elapsed_time": "8:08:38", "remaining_time": "7:47:27"} +{"current_steps": 3835, "total_steps": 7494, "loss": 0.6114, "lr": 8.503188315109881e-05, "epoch": 1.0234854550306913, "percentage": 51.17, "elapsed_time": "8:09:52", "remaining_time": "7:47:23"} +{"current_steps": 3840, "total_steps": 7494, "loss": 0.5968, "lr": 8.485873764652832e-05, "epoch": 1.0248198558847077, "percentage": 51.24, "elapsed_time": "8:10:41", "remaining_time": "7:46:55"} +{"current_steps": 3845, "total_steps": 7494, "loss": 0.585, "lr": 8.468553865772826e-05, "epoch": 1.0261542567387243, "percentage": 51.31, "elapsed_time": "8:12:54", "remaining_time": "7:47:46"} +{"current_steps": 3850, "total_steps": 7494, "loss": 0.5997, "lr": 8.451228712431332e-05, "epoch": 1.0274886575927409, "percentage": 51.37, "elapsed_time": "8:13:39", "remaining_time": "7:47:14"} +{"current_steps": 3855, "total_steps": 7494, "loss": 0.6076, "lr": 8.433898398618319e-05, "epoch": 1.0288230584467575, "percentage": 51.44, "elapsed_time": "8:14:26", "remaining_time": "7:46:44"} +{"current_steps": 3860, "total_steps": 7494, "loss": 0.5866, "lr": 8.416563018351758e-05, "epoch": 1.0301574593007738, "percentage": 51.51, "elapsed_time": "8:15:37", "remaining_time": "7:46:36"} +{"current_steps": 3865, "total_steps": 7494, "loss": 0.6109, "lr": 8.399222665677105e-05, "epoch": 1.0314918601547904, "percentage": 51.57, "elapsed_time": "8:16:54", "remaining_time": "7:46:33"} +{"current_steps": 3870, "total_steps": 7494, "loss": 0.5897, "lr": 8.381877434666784e-05, "epoch": 1.032826261008807, "percentage": 51.64, "elapsed_time": "8:18:19", "remaining_time": "7:46:39"} +{"current_steps": 3875, "total_steps": 7494, "loss": 0.5923, "lr": 8.364527419419696e-05, "epoch": 1.0341606618628236, "percentage": 51.71, "elapsed_time": "8:19:30", "remaining_time": "7:46:30"} +{"current_steps": 3880, "total_steps": 7494, "loss": 0.6003, "lr": 8.347172714060686e-05, "epoch": 1.0354950627168402, "percentage": 51.77, "elapsed_time": "8:20:41", "remaining_time": "7:46:21"} +{"current_steps": 3885, "total_steps": 7494, "loss": 0.587, "lr": 8.32981341274005e-05, "epoch": 1.0368294635708566, "percentage": 51.84, "elapsed_time": "8:21:27", "remaining_time": "7:45:49"} +{"current_steps": 3890, "total_steps": 7494, "loss": 0.598, "lr": 8.312449609633014e-05, "epoch": 1.0381638644248732, "percentage": 51.91, "elapsed_time": "8:22:11", "remaining_time": "7:45:16"} +{"current_steps": 3895, "total_steps": 7494, "loss": 0.591, "lr": 8.295081398939227e-05, "epoch": 1.0394982652788898, "percentage": 51.97, "elapsed_time": "8:23:31", "remaining_time": "7:45:15"} +{"current_steps": 3900, "total_steps": 7494, "loss": 0.5922, "lr": 8.277708874882252e-05, "epoch": 1.0408326661329064, "percentage": 52.04, "elapsed_time": "8:24:20", "remaining_time": "7:44:46"} +{"current_steps": 3905, "total_steps": 7494, "loss": 0.5935, "lr": 8.26033213170905e-05, "epoch": 1.042167066986923, "percentage": 52.11, "elapsed_time": "8:25:48", "remaining_time": "7:44:52"} +{"current_steps": 3910, "total_steps": 7494, "loss": 0.6112, "lr": 8.242951263689468e-05, "epoch": 1.0435014678409393, "percentage": 52.18, "elapsed_time": "8:26:59", "remaining_time": "7:44:43"} +{"current_steps": 3915, "total_steps": 7494, "loss": 0.5971, "lr": 8.225566365115738e-05, "epoch": 1.044835868694956, "percentage": 52.24, "elapsed_time": "8:27:42", "remaining_time": "7:44:08"} +{"current_steps": 3920, "total_steps": 7494, "loss": 0.5968, "lr": 8.20817753030195e-05, "epoch": 1.0461702695489725, "percentage": 52.31, "elapsed_time": "8:28:29", "remaining_time": "7:43:36"} +{"current_steps": 3925, "total_steps": 7494, "loss": 0.6191, "lr": 8.190784853583554e-05, "epoch": 1.0475046704029891, "percentage": 52.38, "elapsed_time": "8:29:15", "remaining_time": "7:43:04"} +{"current_steps": 3930, "total_steps": 7494, "loss": 0.6043, "lr": 8.17338842931684e-05, "epoch": 1.0488390712570057, "percentage": 52.44, "elapsed_time": "8:30:30", "remaining_time": "7:42:58"} +{"current_steps": 3935, "total_steps": 7494, "loss": 0.5914, "lr": 8.155988351878433e-05, "epoch": 1.050173472111022, "percentage": 52.51, "elapsed_time": "8:31:14", "remaining_time": "7:42:23"} +{"current_steps": 3940, "total_steps": 7494, "loss": 0.621, "lr": 8.138584715664766e-05, "epoch": 1.0515078729650387, "percentage": 52.58, "elapsed_time": "8:33:34", "remaining_time": "7:43:15"} +{"current_steps": 3945, "total_steps": 7494, "loss": 0.6087, "lr": 8.121177615091591e-05, "epoch": 1.0528422738190553, "percentage": 52.64, "elapsed_time": "8:34:55", "remaining_time": "7:43:14"} +{"current_steps": 3950, "total_steps": 7494, "loss": 0.5978, "lr": 8.103767144593445e-05, "epoch": 1.0541766746730719, "percentage": 52.71, "elapsed_time": "8:35:40", "remaining_time": "7:42:40"} +{"current_steps": 3955, "total_steps": 7494, "loss": 0.5914, "lr": 8.086353398623154e-05, "epoch": 1.0555110755270882, "percentage": 52.78, "elapsed_time": "8:36:26", "remaining_time": "7:42:07"} +{"current_steps": 3960, "total_steps": 7494, "loss": 0.6052, "lr": 8.068936471651308e-05, "epoch": 1.0568454763811048, "percentage": 52.84, "elapsed_time": "8:37:36", "remaining_time": "7:41:55"} +{"current_steps": 3965, "total_steps": 7494, "loss": 0.594, "lr": 8.051516458165759e-05, "epoch": 1.0581798772351214, "percentage": 52.91, "elapsed_time": "8:38:21", "remaining_time": "7:41:21"} +{"current_steps": 3970, "total_steps": 7494, "loss": 0.6053, "lr": 8.0340934526711e-05, "epoch": 1.059514278089138, "percentage": 52.98, "elapsed_time": "8:39:32", "remaining_time": "7:41:10"} +{"current_steps": 3975, "total_steps": 7494, "loss": 0.5954, "lr": 8.016667549688157e-05, "epoch": 1.0608486789431546, "percentage": 53.04, "elapsed_time": "8:40:42", "remaining_time": "7:40:58"} +{"current_steps": 3980, "total_steps": 7494, "loss": 0.5988, "lr": 7.999238843753474e-05, "epoch": 1.062183079797171, "percentage": 53.11, "elapsed_time": "8:41:52", "remaining_time": "7:40:46"} +{"current_steps": 3985, "total_steps": 7494, "loss": 0.6255, "lr": 7.981807429418803e-05, "epoch": 1.0635174806511876, "percentage": 53.18, "elapsed_time": "8:43:16", "remaining_time": "7:40:46"} +{"current_steps": 3990, "total_steps": 7494, "loss": 0.5849, "lr": 7.96437340125059e-05, "epoch": 1.0648518815052042, "percentage": 53.24, "elapsed_time": "8:44:03", "remaining_time": "7:40:13"} +{"current_steps": 3995, "total_steps": 7494, "loss": 0.6035, "lr": 7.946936853829458e-05, "epoch": 1.0661862823592207, "percentage": 53.31, "elapsed_time": "8:44:48", "remaining_time": "7:39:39"} +{"current_steps": 4000, "total_steps": 7494, "loss": 0.5986, "lr": 7.929497881749699e-05, "epoch": 1.0675206832132373, "percentage": 53.38, "elapsed_time": "8:45:35", "remaining_time": "7:39:06"} +{"current_steps": 4005, "total_steps": 7494, "loss": 0.6101, "lr": 7.912056579618759e-05, "epoch": 1.0688550840672537, "percentage": 53.44, "elapsed_time": "8:46:29", "remaining_time": "7:38:39"} +{"current_steps": 4010, "total_steps": 7494, "loss": 0.5826, "lr": 7.894613042056721e-05, "epoch": 1.0701894849212703, "percentage": 53.51, "elapsed_time": "8:47:21", "remaining_time": "7:38:10"} +{"current_steps": 4015, "total_steps": 7494, "loss": 0.6027, "lr": 7.877167363695805e-05, "epoch": 1.071523885775287, "percentage": 53.58, "elapsed_time": "8:48:08", "remaining_time": "7:37:37"} +{"current_steps": 4020, "total_steps": 7494, "loss": 0.5863, "lr": 7.859719639179834e-05, "epoch": 1.0728582866293035, "percentage": 53.64, "elapsed_time": "8:48:54", "remaining_time": "7:37:04"} +{"current_steps": 4025, "total_steps": 7494, "loss": 0.6048, "lr": 7.842269963163735e-05, "epoch": 1.07419268748332, "percentage": 53.71, "elapsed_time": "8:49:41", "remaining_time": "7:36:30"} +{"current_steps": 4030, "total_steps": 7494, "loss": 0.5987, "lr": 7.824818430313028e-05, "epoch": 1.0755270883373365, "percentage": 53.78, "elapsed_time": "8:50:30", "remaining_time": "7:35:59"} +{"current_steps": 4035, "total_steps": 7494, "loss": 0.6152, "lr": 7.807365135303299e-05, "epoch": 1.076861489191353, "percentage": 53.84, "elapsed_time": "8:51:16", "remaining_time": "7:35:25"} +{"current_steps": 4040, "total_steps": 7494, "loss": 0.5986, "lr": 7.789910172819693e-05, "epoch": 1.0781958900453696, "percentage": 53.91, "elapsed_time": "8:52:00", "remaining_time": "7:34:50"} +{"current_steps": 4045, "total_steps": 7494, "loss": 0.6208, "lr": 7.772453637556411e-05, "epoch": 1.0795302908993862, "percentage": 53.98, "elapsed_time": "8:52:46", "remaining_time": "7:34:16"} +{"current_steps": 4050, "total_steps": 7494, "loss": 0.6002, "lr": 7.754995624216176e-05, "epoch": 1.0808646917534026, "percentage": 54.04, "elapsed_time": "8:53:56", "remaining_time": "7:34:03"} +{"current_steps": 4055, "total_steps": 7494, "loss": 0.5955, "lr": 7.737536227509734e-05, "epoch": 1.0821990926074192, "percentage": 54.11, "elapsed_time": "8:54:44", "remaining_time": "7:33:30"} +{"current_steps": 4060, "total_steps": 7494, "loss": 0.6277, "lr": 7.720075542155336e-05, "epoch": 1.0835334934614358, "percentage": 54.18, "elapsed_time": "8:55:29", "remaining_time": "7:32:55"} +{"current_steps": 4065, "total_steps": 7494, "loss": 0.6163, "lr": 7.702613662878223e-05, "epoch": 1.0848678943154524, "percentage": 54.24, "elapsed_time": "8:56:15", "remaining_time": "7:32:21"} +{"current_steps": 4070, "total_steps": 7494, "loss": 0.5985, "lr": 7.685150684410114e-05, "epoch": 1.086202295169469, "percentage": 54.31, "elapsed_time": "8:57:25", "remaining_time": "7:32:07"} +{"current_steps": 4075, "total_steps": 7494, "loss": 0.6014, "lr": 7.667686701488688e-05, "epoch": 1.0875366960234856, "percentage": 54.38, "elapsed_time": "8:58:34", "remaining_time": "7:31:52"} +{"current_steps": 4080, "total_steps": 7494, "loss": 0.6066, "lr": 7.650221808857081e-05, "epoch": 1.088871096877502, "percentage": 54.44, "elapsed_time": "8:59:18", "remaining_time": "7:31:16"} +{"current_steps": 4085, "total_steps": 7494, "loss": 0.5888, "lr": 7.632756101263358e-05, "epoch": 1.0902054977315185, "percentage": 54.51, "elapsed_time": "9:00:01", "remaining_time": "7:30:39"} +{"current_steps": 4090, "total_steps": 7494, "loss": 0.6023, "lr": 7.615289673460003e-05, "epoch": 1.0915398985855351, "percentage": 54.58, "elapsed_time": "9:00:52", "remaining_time": "7:30:09"} +{"current_steps": 4095, "total_steps": 7494, "loss": 0.5906, "lr": 7.59782262020341e-05, "epoch": 1.0928742994395517, "percentage": 54.64, "elapsed_time": "9:02:12", "remaining_time": "7:30:03"} +{"current_steps": 4100, "total_steps": 7494, "loss": 0.6024, "lr": 7.580355036253372e-05, "epoch": 1.094208700293568, "percentage": 54.71, "elapsed_time": "9:02:54", "remaining_time": "7:29:25"} +{"current_steps": 4105, "total_steps": 7494, "loss": 0.6077, "lr": 7.562887016372551e-05, "epoch": 1.0955431011475847, "percentage": 54.78, "elapsed_time": "9:03:48", "remaining_time": "7:28:57"} +{"current_steps": 4110, "total_steps": 7494, "loss": 0.602, "lr": 7.54541865532598e-05, "epoch": 1.0968775020016013, "percentage": 54.84, "elapsed_time": "9:04:35", "remaining_time": "7:28:23"} +{"current_steps": 4115, "total_steps": 7494, "loss": 0.6016, "lr": 7.527950047880543e-05, "epoch": 1.0982119028556179, "percentage": 54.91, "elapsed_time": "9:05:24", "remaining_time": "7:27:51"} +{"current_steps": 4120, "total_steps": 7494, "loss": 0.6074, "lr": 7.51048128880446e-05, "epoch": 1.0995463037096345, "percentage": 54.98, "elapsed_time": "9:06:06", "remaining_time": "7:27:13"} +{"current_steps": 4125, "total_steps": 7494, "loss": 0.6027, "lr": 7.493012472866769e-05, "epoch": 1.1008807045636508, "percentage": 55.04, "elapsed_time": "9:06:50", "remaining_time": "7:26:36"} +{"current_steps": 4130, "total_steps": 7494, "loss": 0.6022, "lr": 7.47554369483682e-05, "epoch": 1.1022151054176674, "percentage": 55.11, "elapsed_time": "9:07:36", "remaining_time": "7:26:02"} +{"current_steps": 4135, "total_steps": 7494, "loss": 0.5945, "lr": 7.458075049483762e-05, "epoch": 1.103549506271684, "percentage": 55.18, "elapsed_time": "9:08:24", "remaining_time": "7:25:29"} +{"current_steps": 4140, "total_steps": 7494, "loss": 0.6033, "lr": 7.44060663157602e-05, "epoch": 1.1048839071257006, "percentage": 55.24, "elapsed_time": "9:09:46", "remaining_time": "7:25:23"} +{"current_steps": 4145, "total_steps": 7494, "loss": 0.6026, "lr": 7.423138535880779e-05, "epoch": 1.1062183079797172, "percentage": 55.31, "elapsed_time": "9:10:30", "remaining_time": "7:24:47"} +{"current_steps": 4150, "total_steps": 7494, "loss": 0.6106, "lr": 7.405670857163489e-05, "epoch": 1.1075527088337336, "percentage": 55.38, "elapsed_time": "9:12:27", "remaining_time": "7:25:09"} +{"current_steps": 4155, "total_steps": 7494, "loss": 0.6031, "lr": 7.388203690187325e-05, "epoch": 1.1088871096877502, "percentage": 55.44, "elapsed_time": "9:13:35", "remaining_time": "7:24:52"} +{"current_steps": 4160, "total_steps": 7494, "loss": 0.5892, "lr": 7.370737129712695e-05, "epoch": 1.1102215105417668, "percentage": 55.51, "elapsed_time": "9:14:46", "remaining_time": "7:24:37"} +{"current_steps": 4165, "total_steps": 7494, "loss": 0.6097, "lr": 7.353271270496713e-05, "epoch": 1.1115559113957834, "percentage": 55.58, "elapsed_time": "9:15:31", "remaining_time": "7:24:01"} +{"current_steps": 4170, "total_steps": 7494, "loss": 0.6053, "lr": 7.335806207292687e-05, "epoch": 1.1128903122498, "percentage": 55.64, "elapsed_time": "9:16:18", "remaining_time": "7:23:26"} +{"current_steps": 4175, "total_steps": 7494, "loss": 0.6063, "lr": 7.31834203484961e-05, "epoch": 1.1142247131038163, "percentage": 55.71, "elapsed_time": "9:17:04", "remaining_time": "7:22:51"} +{"current_steps": 4180, "total_steps": 7494, "loss": 0.6083, "lr": 7.300878847911642e-05, "epoch": 1.115559113957833, "percentage": 55.78, "elapsed_time": "9:18:13", "remaining_time": "7:22:34"} +{"current_steps": 4185, "total_steps": 7494, "loss": 0.5863, "lr": 7.283416741217595e-05, "epoch": 1.1168935148118495, "percentage": 55.84, "elapsed_time": "9:18:59", "remaining_time": "7:21:58"} +{"current_steps": 4190, "total_steps": 7494, "loss": 0.6158, "lr": 7.26595580950042e-05, "epoch": 1.118227915665866, "percentage": 55.91, "elapsed_time": "9:20:12", "remaining_time": "7:21:45"} +{"current_steps": 4195, "total_steps": 7494, "loss": 0.5857, "lr": 7.248496147486695e-05, "epoch": 1.1195623165198825, "percentage": 55.98, "elapsed_time": "9:21:22", "remaining_time": "7:21:28"} +{"current_steps": 4200, "total_steps": 7494, "loss": 0.6139, "lr": 7.23103784989611e-05, "epoch": 1.120896717373899, "percentage": 56.04, "elapsed_time": "9:22:38", "remaining_time": "7:21:16"} +{"current_steps": 4205, "total_steps": 7494, "loss": 0.633, "lr": 7.213581011440954e-05, "epoch": 1.1222311182279157, "percentage": 56.11, "elapsed_time": "9:23:33", "remaining_time": "7:20:48"} +{"current_steps": 4210, "total_steps": 7494, "loss": 0.6032, "lr": 7.1961257268256e-05, "epoch": 1.1235655190819323, "percentage": 56.18, "elapsed_time": "9:25:32", "remaining_time": "7:21:08"} +{"current_steps": 4215, "total_steps": 7494, "loss": 0.5935, "lr": 7.178672090745986e-05, "epoch": 1.1248999199359488, "percentage": 56.24, "elapsed_time": "9:27:56", "remaining_time": "7:21:49"} +{"current_steps": 4220, "total_steps": 7494, "loss": 0.6054, "lr": 7.161220197889114e-05, "epoch": 1.1262343207899652, "percentage": 56.31, "elapsed_time": "9:29:06", "remaining_time": "7:21:32"} +{"current_steps": 4225, "total_steps": 7494, "loss": 0.6039, "lr": 7.143770142932524e-05, "epoch": 1.1275687216439818, "percentage": 56.38, "elapsed_time": "9:29:52", "remaining_time": "7:20:55"} +{"current_steps": 4230, "total_steps": 7494, "loss": 0.5982, "lr": 7.126322020543785e-05, "epoch": 1.1289031224979984, "percentage": 56.45, "elapsed_time": "9:30:38", "remaining_time": "7:20:19"} +{"current_steps": 4235, "total_steps": 7494, "loss": 0.5973, "lr": 7.108875925379991e-05, "epoch": 1.130237523352015, "percentage": 56.51, "elapsed_time": "9:31:50", "remaining_time": "7:20:02"} +{"current_steps": 4240, "total_steps": 7494, "loss": 0.6178, "lr": 7.091431952087221e-05, "epoch": 1.1315719242060316, "percentage": 56.58, "elapsed_time": "9:33:08", "remaining_time": "7:19:51"} +{"current_steps": 4245, "total_steps": 7494, "loss": 0.5956, "lr": 7.073990195300058e-05, "epoch": 1.132906325060048, "percentage": 56.65, "elapsed_time": "9:33:51", "remaining_time": "7:19:13"} +{"current_steps": 4250, "total_steps": 7494, "loss": 0.6004, "lr": 7.056550749641056e-05, "epoch": 1.1342407259140646, "percentage": 56.71, "elapsed_time": "9:35:34", "remaining_time": "7:19:20"} +{"current_steps": 4255, "total_steps": 7494, "loss": 0.6009, "lr": 7.039113709720227e-05, "epoch": 1.1355751267680811, "percentage": 56.78, "elapsed_time": "9:37:24", "remaining_time": "7:19:32"} +{"current_steps": 4260, "total_steps": 7494, "loss": 0.5925, "lr": 7.021679170134533e-05, "epoch": 1.1369095276220977, "percentage": 56.85, "elapsed_time": "9:38:13", "remaining_time": "7:18:57"} +{"current_steps": 4265, "total_steps": 7494, "loss": 0.5966, "lr": 7.004247225467381e-05, "epoch": 1.1382439284761143, "percentage": 56.91, "elapsed_time": "9:38:57", "remaining_time": "7:18:19"} +{"current_steps": 4270, "total_steps": 7494, "loss": 0.6006, "lr": 6.986817970288082e-05, "epoch": 1.1395783293301307, "percentage": 56.98, "elapsed_time": "9:39:42", "remaining_time": "7:17:41"} +{"current_steps": 4275, "total_steps": 7494, "loss": 0.5863, "lr": 6.969391499151371e-05, "epoch": 1.1409127301841473, "percentage": 57.05, "elapsed_time": "9:40:28", "remaining_time": "7:17:05"} +{"current_steps": 4280, "total_steps": 7494, "loss": 0.5983, "lr": 6.95196790659688e-05, "epoch": 1.1422471310381639, "percentage": 57.11, "elapsed_time": "9:41:16", "remaining_time": "7:16:29"} +{"current_steps": 4285, "total_steps": 7494, "loss": 0.6097, "lr": 6.934547287148614e-05, "epoch": 1.1435815318921805, "percentage": 57.18, "elapsed_time": "9:42:00", "remaining_time": "7:15:51"} +{"current_steps": 4290, "total_steps": 7494, "loss": 0.6038, "lr": 6.917129735314455e-05, "epoch": 1.1449159327461969, "percentage": 57.25, "elapsed_time": "9:42:43", "remaining_time": "7:15:12"} +{"current_steps": 4295, "total_steps": 7494, "loss": 0.5861, "lr": 6.899715345585649e-05, "epoch": 1.1462503336002134, "percentage": 57.31, "elapsed_time": "9:43:31", "remaining_time": "7:14:37"} +{"current_steps": 4300, "total_steps": 7494, "loss": 0.6057, "lr": 6.882304212436272e-05, "epoch": 1.14758473445423, "percentage": 57.38, "elapsed_time": "9:44:18", "remaining_time": "7:14:01"} +{"current_steps": 4305, "total_steps": 7494, "loss": 0.6244, "lr": 6.864896430322745e-05, "epoch": 1.1489191353082466, "percentage": 57.45, "elapsed_time": "9:45:14", "remaining_time": "7:13:31"} +{"current_steps": 4310, "total_steps": 7494, "loss": 0.5833, "lr": 6.84749209368331e-05, "epoch": 1.1502535361622632, "percentage": 57.51, "elapsed_time": "9:45:57", "remaining_time": "7:12:52"} +{"current_steps": 4315, "total_steps": 7494, "loss": 0.5968, "lr": 6.830091296937509e-05, "epoch": 1.1515879370162796, "percentage": 57.58, "elapsed_time": "9:46:42", "remaining_time": "7:12:15"} +{"current_steps": 4320, "total_steps": 7494, "loss": 0.6016, "lr": 6.812694134485686e-05, "epoch": 1.1529223378702962, "percentage": 57.65, "elapsed_time": "9:47:30", "remaining_time": "7:11:39"} +{"current_steps": 4325, "total_steps": 7494, "loss": 0.6048, "lr": 6.795300700708466e-05, "epoch": 1.1542567387243128, "percentage": 57.71, "elapsed_time": "9:48:16", "remaining_time": "7:11:02"} +{"current_steps": 4330, "total_steps": 7494, "loss": 0.5935, "lr": 6.777911089966245e-05, "epoch": 1.1555911395783294, "percentage": 57.78, "elapsed_time": "9:48:59", "remaining_time": "7:10:22"} +{"current_steps": 4335, "total_steps": 7494, "loss": 0.6142, "lr": 6.760525396598686e-05, "epoch": 1.156925540432346, "percentage": 57.85, "elapsed_time": "9:50:16", "remaining_time": "7:10:08"} +{"current_steps": 4340, "total_steps": 7494, "loss": 0.5889, "lr": 6.74314371492419e-05, "epoch": 1.1582599412863623, "percentage": 57.91, "elapsed_time": "9:51:05", "remaining_time": "7:09:34"} +{"current_steps": 4345, "total_steps": 7494, "loss": 0.6017, "lr": 6.725766139239399e-05, "epoch": 1.159594342140379, "percentage": 57.98, "elapsed_time": "9:51:50", "remaining_time": "7:08:55"} +{"current_steps": 4350, "total_steps": 7494, "loss": 0.5988, "lr": 6.708392763818681e-05, "epoch": 1.1609287429943955, "percentage": 58.05, "elapsed_time": "9:52:35", "remaining_time": "7:08:17"} +{"current_steps": 4355, "total_steps": 7494, "loss": 0.6136, "lr": 6.691023682913616e-05, "epoch": 1.1622631438484121, "percentage": 58.11, "elapsed_time": "9:53:20", "remaining_time": "7:07:39"} +{"current_steps": 4360, "total_steps": 7494, "loss": 0.5954, "lr": 6.673658990752484e-05, "epoch": 1.1635975447024287, "percentage": 58.18, "elapsed_time": "9:54:09", "remaining_time": "7:07:05"} +{"current_steps": 4365, "total_steps": 7494, "loss": 0.5896, "lr": 6.656298781539764e-05, "epoch": 1.164931945556445, "percentage": 58.25, "elapsed_time": "9:54:55", "remaining_time": "7:06:27"} +{"current_steps": 4370, "total_steps": 7494, "loss": 0.6066, "lr": 6.638943149455598e-05, "epoch": 1.1662663464104617, "percentage": 58.31, "elapsed_time": "9:55:37", "remaining_time": "7:05:47"} +{"current_steps": 4375, "total_steps": 7494, "loss": 0.5965, "lr": 6.621592188655314e-05, "epoch": 1.1676007472644783, "percentage": 58.38, "elapsed_time": "9:56:24", "remaining_time": "7:05:11"} +{"current_steps": 4380, "total_steps": 7494, "loss": 0.5927, "lr": 6.604245993268893e-05, "epoch": 1.1689351481184949, "percentage": 58.45, "elapsed_time": "9:57:11", "remaining_time": "7:04:34"} +{"current_steps": 4385, "total_steps": 7494, "loss": 0.5992, "lr": 6.586904657400457e-05, "epoch": 1.1702695489725112, "percentage": 58.51, "elapsed_time": "9:57:57", "remaining_time": "7:03:57"} +{"current_steps": 4390, "total_steps": 7494, "loss": 0.5812, "lr": 6.569568275127769e-05, "epoch": 1.1716039498265278, "percentage": 58.58, "elapsed_time": "9:58:41", "remaining_time": "7:03:18"} +{"current_steps": 4395, "total_steps": 7494, "loss": 0.5828, "lr": 6.552236940501725e-05, "epoch": 1.1729383506805444, "percentage": 58.65, "elapsed_time": "9:59:50", "remaining_time": "7:02:57"} +{"current_steps": 4400, "total_steps": 7494, "loss": 0.5854, "lr": 6.534910747545825e-05, "epoch": 1.174272751534561, "percentage": 58.71, "elapsed_time": "10:01:19", "remaining_time": "7:02:50"} +{"current_steps": 4405, "total_steps": 7494, "loss": 0.6129, "lr": 6.517589790255686e-05, "epoch": 1.1756071523885776, "percentage": 58.78, "elapsed_time": "10:02:15", "remaining_time": "7:02:20"} +{"current_steps": 4410, "total_steps": 7494, "loss": 0.606, "lr": 6.500274162598512e-05, "epoch": 1.1769415532425942, "percentage": 58.85, "elapsed_time": "10:03:01", "remaining_time": "7:01:42"} +{"current_steps": 4415, "total_steps": 7494, "loss": 0.598, "lr": 6.482963958512599e-05, "epoch": 1.1782759540966106, "percentage": 58.91, "elapsed_time": "10:03:44", "remaining_time": "7:01:02"} +{"current_steps": 4420, "total_steps": 7494, "loss": 0.593, "lr": 6.465659271906823e-05, "epoch": 1.1796103549506272, "percentage": 58.98, "elapsed_time": "10:04:33", "remaining_time": "7:00:27"} +{"current_steps": 4425, "total_steps": 7494, "loss": 0.6013, "lr": 6.448360196660116e-05, "epoch": 1.1809447558046438, "percentage": 59.05, "elapsed_time": "10:05:23", "remaining_time": "6:59:52"} +{"current_steps": 4430, "total_steps": 7494, "loss": 0.5937, "lr": 6.43106682662098e-05, "epoch": 1.1822791566586603, "percentage": 59.11, "elapsed_time": "10:06:36", "remaining_time": "6:59:33"} +{"current_steps": 4435, "total_steps": 7494, "loss": 0.5813, "lr": 6.413779255606961e-05, "epoch": 1.1836135575126767, "percentage": 59.18, "elapsed_time": "10:07:46", "remaining_time": "6:59:12"} +{"current_steps": 4440, "total_steps": 7494, "loss": 0.6091, "lr": 6.396497577404143e-05, "epoch": 1.1849479583666933, "percentage": 59.25, "elapsed_time": "10:08:34", "remaining_time": "6:58:36"} +{"current_steps": 4445, "total_steps": 7494, "loss": 0.5939, "lr": 6.379221885766643e-05, "epoch": 1.18628235922071, "percentage": 59.31, "elapsed_time": "10:09:25", "remaining_time": "6:58:01"} +{"current_steps": 4450, "total_steps": 7494, "loss": 0.5896, "lr": 6.361952274416106e-05, "epoch": 1.1876167600747265, "percentage": 59.38, "elapsed_time": "10:10:10", "remaining_time": "6:57:23"} +{"current_steps": 4455, "total_steps": 7494, "loss": 0.5932, "lr": 6.344688837041177e-05, "epoch": 1.188951160928743, "percentage": 59.45, "elapsed_time": "10:10:55", "remaining_time": "6:56:44"} +{"current_steps": 4460, "total_steps": 7494, "loss": 0.6017, "lr": 6.32743166729702e-05, "epoch": 1.1902855617827595, "percentage": 59.51, "elapsed_time": "10:11:41", "remaining_time": "6:56:06"} +{"current_steps": 4465, "total_steps": 7494, "loss": 0.6135, "lr": 6.310180858804794e-05, "epoch": 1.191619962636776, "percentage": 59.58, "elapsed_time": "10:12:29", "remaining_time": "6:55:30"} +{"current_steps": 4470, "total_steps": 7494, "loss": 0.6066, "lr": 6.292936505151145e-05, "epoch": 1.1929543634907926, "percentage": 59.65, "elapsed_time": "10:13:16", "remaining_time": "6:54:53"} +{"current_steps": 4475, "total_steps": 7494, "loss": 0.5821, "lr": 6.275698699887699e-05, "epoch": 1.1942887643448092, "percentage": 59.71, "elapsed_time": "10:14:01", "remaining_time": "6:54:14"} +{"current_steps": 4480, "total_steps": 7494, "loss": 0.5997, "lr": 6.258467536530565e-05, "epoch": 1.1956231651988256, "percentage": 59.78, "elapsed_time": "10:14:47", "remaining_time": "6:53:36"} +{"current_steps": 4485, "total_steps": 7494, "loss": 0.6013, "lr": 6.241243108559811e-05, "epoch": 1.1969575660528422, "percentage": 59.85, "elapsed_time": "10:15:34", "remaining_time": "6:52:59"} +{"current_steps": 4490, "total_steps": 7494, "loss": 0.6148, "lr": 6.224025509418971e-05, "epoch": 1.1982919669068588, "percentage": 59.91, "elapsed_time": "10:16:20", "remaining_time": "6:52:21"} +{"current_steps": 4495, "total_steps": 7494, "loss": 0.5996, "lr": 6.206814832514525e-05, "epoch": 1.1996263677608754, "percentage": 59.98, "elapsed_time": "10:17:06", "remaining_time": "6:51:43"} +{"current_steps": 4500, "total_steps": 7494, "loss": 0.5956, "lr": 6.189611171215405e-05, "epoch": 1.200960768614892, "percentage": 60.05, "elapsed_time": "10:17:52", "remaining_time": "6:51:05"} +{"current_steps": 4505, "total_steps": 7494, "loss": 0.6053, "lr": 6.172414618852488e-05, "epoch": 1.2022951694689086, "percentage": 60.11, "elapsed_time": "10:18:47", "remaining_time": "6:50:33"} +{"current_steps": 4510, "total_steps": 7494, "loss": 0.5858, "lr": 6.155225268718069e-05, "epoch": 1.203629570322925, "percentage": 60.18, "elapsed_time": "10:19:34", "remaining_time": "6:49:55"} +{"current_steps": 4515, "total_steps": 7494, "loss": 0.5931, "lr": 6.138043214065385e-05, "epoch": 1.2049639711769415, "percentage": 60.25, "elapsed_time": "10:20:19", "remaining_time": "6:49:17"} +{"current_steps": 4520, "total_steps": 7494, "loss": 0.5874, "lr": 6.120868548108093e-05, "epoch": 1.2062983720309581, "percentage": 60.31, "elapsed_time": "10:21:05", "remaining_time": "6:48:39"} +{"current_steps": 4525, "total_steps": 7494, "loss": 0.5992, "lr": 6.103701364019754e-05, "epoch": 1.2076327728849747, "percentage": 60.38, "elapsed_time": "10:21:50", "remaining_time": "6:48:00"} +{"current_steps": 4530, "total_steps": 7494, "loss": 0.6078, "lr": 6.0865417549333536e-05, "epoch": 1.208967173738991, "percentage": 60.45, "elapsed_time": "10:22:38", "remaining_time": "6:47:23"} +{"current_steps": 4535, "total_steps": 7494, "loss": 0.6084, "lr": 6.0693898139407786e-05, "epoch": 1.2103015745930077, "percentage": 60.52, "elapsed_time": "10:23:25", "remaining_time": "6:46:46"} +{"current_steps": 4540, "total_steps": 7494, "loss": 0.593, "lr": 6.0522456340923085e-05, "epoch": 1.2116359754470243, "percentage": 60.58, "elapsed_time": "10:24:10", "remaining_time": "6:46:07"} +{"current_steps": 4545, "total_steps": 7494, "loss": 0.5874, "lr": 6.0351093083961267e-05, "epoch": 1.2129703763010409, "percentage": 60.65, "elapsed_time": "10:24:53", "remaining_time": "6:45:27"} +{"current_steps": 4550, "total_steps": 7494, "loss": 0.596, "lr": 6.017980929817807e-05, "epoch": 1.2143047771550575, "percentage": 60.72, "elapsed_time": "10:25:40", "remaining_time": "6:44:50"} +{"current_steps": 4555, "total_steps": 7494, "loss": 0.5988, "lr": 6.000860591279801e-05, "epoch": 1.2156391780090738, "percentage": 60.78, "elapsed_time": "10:26:27", "remaining_time": "6:44:12"} +{"current_steps": 4560, "total_steps": 7494, "loss": 0.6011, "lr": 5.9837483856609527e-05, "epoch": 1.2169735788630904, "percentage": 60.85, "elapsed_time": "10:27:12", "remaining_time": "6:43:33"} +{"current_steps": 4565, "total_steps": 7494, "loss": 0.5963, "lr": 5.966644405795982e-05, "epoch": 1.218307979717107, "percentage": 60.92, "elapsed_time": "10:27:55", "remaining_time": "6:42:53"} +{"current_steps": 4570, "total_steps": 7494, "loss": 0.5878, "lr": 5.949548744474978e-05, "epoch": 1.2196423805711236, "percentage": 60.98, "elapsed_time": "10:28:40", "remaining_time": "6:42:14"} +{"current_steps": 4575, "total_steps": 7494, "loss": 0.6043, "lr": 5.9324614944429095e-05, "epoch": 1.22097678142514, "percentage": 61.05, "elapsed_time": "10:29:29", "remaining_time": "6:41:38"} +{"current_steps": 4580, "total_steps": 7494, "loss": 0.6088, "lr": 5.915382748399105e-05, "epoch": 1.2223111822791566, "percentage": 61.12, "elapsed_time": "10:30:15", "remaining_time": "6:40:59"} +{"current_steps": 4585, "total_steps": 7494, "loss": 0.6147, "lr": 5.8983125989967646e-05, "epoch": 1.2236455831331732, "percentage": 61.18, "elapsed_time": "10:31:00", "remaining_time": "6:40:21"} +{"current_steps": 4590, "total_steps": 7494, "loss": 0.5941, "lr": 5.881251138842453e-05, "epoch": 1.2249799839871898, "percentage": 61.25, "elapsed_time": "10:31:45", "remaining_time": "6:39:42"} +{"current_steps": 4595, "total_steps": 7494, "loss": 0.6006, "lr": 5.864198460495585e-05, "epoch": 1.2263143848412064, "percentage": 61.32, "elapsed_time": "10:32:33", "remaining_time": "6:39:04"} +{"current_steps": 4600, "total_steps": 7494, "loss": 0.5973, "lr": 5.847154656467944e-05, "epoch": 1.227648785695223, "percentage": 61.38, "elapsed_time": "10:33:18", "remaining_time": "6:38:26"} +{"current_steps": 4605, "total_steps": 7494, "loss": 0.593, "lr": 5.830119819223166e-05, "epoch": 1.2289831865492393, "percentage": 61.45, "elapsed_time": "10:34:12", "remaining_time": "6:37:52"} +{"current_steps": 4610, "total_steps": 7494, "loss": 0.5908, "lr": 5.8130940411762406e-05, "epoch": 1.230317587403256, "percentage": 61.52, "elapsed_time": "10:34:57", "remaining_time": "6:37:13"} +{"current_steps": 4615, "total_steps": 7494, "loss": 0.6099, "lr": 5.79607741469301e-05, "epoch": 1.2316519882572725, "percentage": 61.58, "elapsed_time": "10:35:45", "remaining_time": "6:36:36"} +{"current_steps": 4620, "total_steps": 7494, "loss": 0.6041, "lr": 5.779070032089674e-05, "epoch": 1.232986389111289, "percentage": 61.65, "elapsed_time": "10:36:33", "remaining_time": "6:35:59"} +{"current_steps": 4625, "total_steps": 7494, "loss": 0.5923, "lr": 5.762071985632276e-05, "epoch": 1.2343207899653055, "percentage": 61.72, "elapsed_time": "10:37:18", "remaining_time": "6:35:20"} +{"current_steps": 4630, "total_steps": 7494, "loss": 0.5906, "lr": 5.745083367536217e-05, "epoch": 1.235655190819322, "percentage": 61.78, "elapsed_time": "10:38:28", "remaining_time": "6:34:56"} +{"current_steps": 4635, "total_steps": 7494, "loss": 0.604, "lr": 5.7281042699657465e-05, "epoch": 1.2369895916733387, "percentage": 61.85, "elapsed_time": "10:39:14", "remaining_time": "6:34:18"} +{"current_steps": 4640, "total_steps": 7494, "loss": 0.598, "lr": 5.71113478503346e-05, "epoch": 1.2383239925273553, "percentage": 61.92, "elapsed_time": "10:40:01", "remaining_time": "6:33:40"} +{"current_steps": 4645, "total_steps": 7494, "loss": 0.602, "lr": 5.694175004799814e-05, "epoch": 1.2396583933813718, "percentage": 61.98, "elapsed_time": "10:40:47", "remaining_time": "6:33:01"} +{"current_steps": 4650, "total_steps": 7494, "loss": 0.5888, "lr": 5.6772250212726025e-05, "epoch": 1.2409927942353882, "percentage": 62.05, "elapsed_time": "10:41:32", "remaining_time": "6:32:22"} +{"current_steps": 4655, "total_steps": 7494, "loss": 0.5901, "lr": 5.660284926406484e-05, "epoch": 1.2423271950894048, "percentage": 62.12, "elapsed_time": "10:42:16", "remaining_time": "6:31:42"} +{"current_steps": 4660, "total_steps": 7494, "loss": 0.6052, "lr": 5.64335481210247e-05, "epoch": 1.2436615959434214, "percentage": 62.18, "elapsed_time": "10:43:01", "remaining_time": "6:31:03"} +{"current_steps": 4665, "total_steps": 7494, "loss": 0.5926, "lr": 5.626434770207414e-05, "epoch": 1.244995996797438, "percentage": 62.25, "elapsed_time": "10:43:50", "remaining_time": "6:30:26"} +{"current_steps": 4670, "total_steps": 7494, "loss": 0.5929, "lr": 5.60952489251354e-05, "epoch": 1.2463303976514546, "percentage": 62.32, "elapsed_time": "10:44:35", "remaining_time": "6:29:47"} +{"current_steps": 4675, "total_steps": 7494, "loss": 0.6034, "lr": 5.592625270757928e-05, "epoch": 1.247664798505471, "percentage": 62.38, "elapsed_time": "10:45:20", "remaining_time": "6:29:08"} +{"current_steps": 4680, "total_steps": 7494, "loss": 0.5839, "lr": 5.575735996622011e-05, "epoch": 1.2489991993594876, "percentage": 62.45, "elapsed_time": "10:46:06", "remaining_time": "6:28:29"} +{"current_steps": 4685, "total_steps": 7494, "loss": 0.5984, "lr": 5.558857161731093e-05, "epoch": 1.2503336002135041, "percentage": 62.52, "elapsed_time": "10:47:43", "remaining_time": "6:28:21"} +{"current_steps": 4690, "total_steps": 7494, "loss": 0.5965, "lr": 5.541988857653847e-05, "epoch": 1.2516680010675207, "percentage": 62.58, "elapsed_time": "10:48:30", "remaining_time": "6:27:43"} +{"current_steps": 4695, "total_steps": 7494, "loss": 0.5945, "lr": 5.5251311759018046e-05, "epoch": 1.2530024019215373, "percentage": 62.65, "elapsed_time": "10:49:39", "remaining_time": "6:27:18"} +{"current_steps": 4700, "total_steps": 7494, "loss": 0.5964, "lr": 5.508284207928879e-05, "epoch": 1.2543368027755537, "percentage": 62.72, "elapsed_time": "10:51:41", "remaining_time": "6:27:24"} +{"current_steps": 4705, "total_steps": 7494, "loss": 0.5897, "lr": 5.491448045130865e-05, "epoch": 1.2556712036295703, "percentage": 62.78, "elapsed_time": "10:52:36", "remaining_time": "6:26:51"} +{"current_steps": 4710, "total_steps": 7494, "loss": 0.5852, "lr": 5.4746227788449236e-05, "epoch": 1.257005604483587, "percentage": 62.85, "elapsed_time": "10:53:21", "remaining_time": "6:26:11"} +{"current_steps": 4715, "total_steps": 7494, "loss": 0.5992, "lr": 5.457808500349115e-05, "epoch": 1.2583400053376035, "percentage": 62.92, "elapsed_time": "10:54:06", "remaining_time": "6:25:31"} +{"current_steps": 4720, "total_steps": 7494, "loss": 0.5964, "lr": 5.441005300861887e-05, "epoch": 1.2596744061916199, "percentage": 62.98, "elapsed_time": "10:54:53", "remaining_time": "6:24:53"} +{"current_steps": 4725, "total_steps": 7494, "loss": 0.6162, "lr": 5.424213271541578e-05, "epoch": 1.2610088070456364, "percentage": 63.05, "elapsed_time": "10:56:06", "remaining_time": "6:24:30"} +{"current_steps": 4730, "total_steps": 7494, "loss": 0.5928, "lr": 5.4074325034859336e-05, "epoch": 1.262343207899653, "percentage": 63.12, "elapsed_time": "10:57:11", "remaining_time": "6:24:02"} +{"current_steps": 4735, "total_steps": 7494, "loss": 0.6071, "lr": 5.390663087731605e-05, "epoch": 1.2636776087536696, "percentage": 63.18, "elapsed_time": "10:57:59", "remaining_time": "6:23:23"} +{"current_steps": 4740, "total_steps": 7494, "loss": 0.5859, "lr": 5.3739051152536506e-05, "epoch": 1.2650120096076862, "percentage": 63.25, "elapsed_time": "10:59:16", "remaining_time": "6:23:02"} +{"current_steps": 4745, "total_steps": 7494, "loss": 0.5996, "lr": 5.357158676965059e-05, "epoch": 1.2663464104617028, "percentage": 63.32, "elapsed_time": "11:01:18", "remaining_time": "6:23:07"} +{"current_steps": 4750, "total_steps": 7494, "loss": 0.6024, "lr": 5.3404238637162364e-05, "epoch": 1.2676808113157192, "percentage": 63.38, "elapsed_time": "11:02:02", "remaining_time": "6:22:26"} +{"current_steps": 4755, "total_steps": 7494, "loss": 0.5936, "lr": 5.323700766294526e-05, "epoch": 1.2690152121697358, "percentage": 63.45, "elapsed_time": "11:02:46", "remaining_time": "6:21:46"} +{"current_steps": 4760, "total_steps": 7494, "loss": 0.5917, "lr": 5.306989475423712e-05, "epoch": 1.2703496130237524, "percentage": 63.52, "elapsed_time": "11:03:33", "remaining_time": "6:21:07"} +{"current_steps": 4765, "total_steps": 7494, "loss": 0.6058, "lr": 5.2902900817635264e-05, "epoch": 1.2716840138777687, "percentage": 63.58, "elapsed_time": "11:04:22", "remaining_time": "6:20:29"} +{"current_steps": 4770, "total_steps": 7494, "loss": 0.6186, "lr": 5.273602675909159e-05, "epoch": 1.2730184147317853, "percentage": 63.65, "elapsed_time": "11:05:06", "remaining_time": "6:19:49"} +{"current_steps": 4775, "total_steps": 7494, "loss": 0.6053, "lr": 5.256927348390765e-05, "epoch": 1.274352815585802, "percentage": 63.72, "elapsed_time": "11:05:51", "remaining_time": "6:19:09"} +{"current_steps": 4780, "total_steps": 7494, "loss": 0.599, "lr": 5.24026418967297e-05, "epoch": 1.2756872164398185, "percentage": 63.78, "elapsed_time": "11:06:38", "remaining_time": "6:18:30"} +{"current_steps": 4785, "total_steps": 7494, "loss": 0.5832, "lr": 5.2236132901543895e-05, "epoch": 1.2770216172938351, "percentage": 63.85, "elapsed_time": "11:08:00", "remaining_time": "6:18:11"} +{"current_steps": 4790, "total_steps": 7494, "loss": 0.595, "lr": 5.2069747401671334e-05, "epoch": 1.2783560181478517, "percentage": 63.92, "elapsed_time": "11:08:47", "remaining_time": "6:17:32"} +{"current_steps": 4795, "total_steps": 7494, "loss": 0.6005, "lr": 5.1903486299763026e-05, "epoch": 1.279690419001868, "percentage": 63.98, "elapsed_time": "11:09:33", "remaining_time": "6:16:52"} +{"current_steps": 4800, "total_steps": 7494, "loss": 0.6083, "lr": 5.173735049779523e-05, "epoch": 1.2810248198558847, "percentage": 64.05, "elapsed_time": "11:10:41", "remaining_time": "6:16:25"} +{"current_steps": 4805, "total_steps": 7494, "loss": 0.5984, "lr": 5.1571340897064454e-05, "epoch": 1.2823592207099013, "percentage": 64.12, "elapsed_time": "11:12:25", "remaining_time": "6:16:18"} +{"current_steps": 4810, "total_steps": 7494, "loss": 0.5876, "lr": 5.140545839818242e-05, "epoch": 1.2836936215639179, "percentage": 64.18, "elapsed_time": "11:13:12", "remaining_time": "6:15:39"} +{"current_steps": 4815, "total_steps": 7494, "loss": 0.5784, "lr": 5.1239703901071506e-05, "epoch": 1.2850280224179342, "percentage": 64.25, "elapsed_time": "11:13:59", "remaining_time": "6:14:59"} +{"current_steps": 4820, "total_steps": 7494, "loss": 0.5942, "lr": 5.1074078304959474e-05, "epoch": 1.2863624232719508, "percentage": 64.32, "elapsed_time": "11:15:11", "remaining_time": "6:14:34"} +{"current_steps": 4825, "total_steps": 7494, "loss": 0.6019, "lr": 5.090858250837495e-05, "epoch": 1.2876968241259674, "percentage": 64.38, "elapsed_time": "11:15:57", "remaining_time": "6:13:54"} +{"current_steps": 4830, "total_steps": 7494, "loss": 0.5932, "lr": 5.0743217409142344e-05, "epoch": 1.289031224979984, "percentage": 64.45, "elapsed_time": "11:16:45", "remaining_time": "6:13:16"} +{"current_steps": 4835, "total_steps": 7494, "loss": 0.6023, "lr": 5.057798390437696e-05, "epoch": 1.2903656258340006, "percentage": 64.52, "elapsed_time": "11:17:30", "remaining_time": "6:12:35"} +{"current_steps": 4840, "total_steps": 7494, "loss": 0.5968, "lr": 5.0412882890480266e-05, "epoch": 1.2917000266880172, "percentage": 64.59, "elapsed_time": "11:18:17", "remaining_time": "6:11:56"} +{"current_steps": 4845, "total_steps": 7494, "loss": 0.6027, "lr": 5.0247915263134984e-05, "epoch": 1.2930344275420336, "percentage": 64.65, "elapsed_time": "11:19:03", "remaining_time": "6:11:16"} +{"current_steps": 4850, "total_steps": 7494, "loss": 0.6145, "lr": 5.0083081917300086e-05, "epoch": 1.2943688283960502, "percentage": 64.72, "elapsed_time": "11:19:49", "remaining_time": "6:10:36"} +{"current_steps": 4855, "total_steps": 7494, "loss": 0.6125, "lr": 4.991838374720618e-05, "epoch": 1.2957032292500668, "percentage": 64.79, "elapsed_time": "11:20:35", "remaining_time": "6:09:56"} +{"current_steps": 4860, "total_steps": 7494, "loss": 0.5791, "lr": 4.975382164635051e-05, "epoch": 1.2970376301040831, "percentage": 64.85, "elapsed_time": "11:21:19", "remaining_time": "6:09:15"} +{"current_steps": 4865, "total_steps": 7494, "loss": 0.6033, "lr": 4.9589396507492044e-05, "epoch": 1.2983720309580997, "percentage": 64.92, "elapsed_time": "11:22:04", "remaining_time": "6:08:35"} +{"current_steps": 4870, "total_steps": 7494, "loss": 0.6003, "lr": 4.942510922264686e-05, "epoch": 1.2997064318121163, "percentage": 64.99, "elapsed_time": "11:23:11", "remaining_time": "6:08:06"} +{"current_steps": 4875, "total_steps": 7494, "loss": 0.593, "lr": 4.926096068308312e-05, "epoch": 1.301040832666133, "percentage": 65.05, "elapsed_time": "11:24:26", "remaining_time": "6:07:42"} +{"current_steps": 4880, "total_steps": 7494, "loss": 0.6053, "lr": 4.90969517793162e-05, "epoch": 1.3023752335201495, "percentage": 65.12, "elapsed_time": "11:25:39", "remaining_time": "6:07:16"} +{"current_steps": 4885, "total_steps": 7494, "loss": 0.6022, "lr": 4.893308340110407e-05, "epoch": 1.303709634374166, "percentage": 65.19, "elapsed_time": "11:26:52", "remaining_time": "6:06:50"} +{"current_steps": 4890, "total_steps": 7494, "loss": 0.6077, "lr": 4.876935643744229e-05, "epoch": 1.3050440352281825, "percentage": 65.25, "elapsed_time": "11:27:36", "remaining_time": "6:06:09"} +{"current_steps": 4895, "total_steps": 7494, "loss": 0.6017, "lr": 4.860577177655922e-05, "epoch": 1.306378436082199, "percentage": 65.32, "elapsed_time": "11:28:23", "remaining_time": "6:05:30"} +{"current_steps": 4900, "total_steps": 7494, "loss": 0.5987, "lr": 4.844233030591122e-05, "epoch": 1.3077128369362157, "percentage": 65.39, "elapsed_time": "11:29:11", "remaining_time": "6:04:50"} +{"current_steps": 4905, "total_steps": 7494, "loss": 0.5963, "lr": 4.827903291217785e-05, "epoch": 1.3090472377902322, "percentage": 65.45, "elapsed_time": "11:30:04", "remaining_time": "6:04:14"} +{"current_steps": 4910, "total_steps": 7494, "loss": 0.5979, "lr": 4.8115880481257066e-05, "epoch": 1.3103816386442486, "percentage": 65.52, "elapsed_time": "11:30:50", "remaining_time": "6:03:34"} +{"current_steps": 4915, "total_steps": 7494, "loss": 0.5967, "lr": 4.795287389826035e-05, "epoch": 1.3117160394982652, "percentage": 65.59, "elapsed_time": "11:31:35", "remaining_time": "6:02:53"} +{"current_steps": 4920, "total_steps": 7494, "loss": 0.5878, "lr": 4.779001404750797e-05, "epoch": 1.3130504403522818, "percentage": 65.65, "elapsed_time": "11:32:23", "remaining_time": "6:02:14"} +{"current_steps": 4925, "total_steps": 7494, "loss": 0.6056, "lr": 4.762730181252415e-05, "epoch": 1.3143848412062984, "percentage": 65.72, "elapsed_time": "11:33:07", "remaining_time": "6:01:33"} +{"current_steps": 4930, "total_steps": 7494, "loss": 0.581, "lr": 4.746473807603235e-05, "epoch": 1.315719242060315, "percentage": 65.79, "elapsed_time": "11:35:17", "remaining_time": "6:01:36"} +{"current_steps": 4935, "total_steps": 7494, "loss": 0.6075, "lr": 4.730232371995029e-05, "epoch": 1.3170536429143316, "percentage": 65.85, "elapsed_time": "11:36:37", "remaining_time": "6:01:13"} +{"current_steps": 4940, "total_steps": 7494, "loss": 0.6037, "lr": 4.714005962538543e-05, "epoch": 1.318388043768348, "percentage": 65.92, "elapsed_time": "11:37:25", "remaining_time": "6:00:34"} +{"current_steps": 4945, "total_steps": 7494, "loss": 0.6063, "lr": 4.6977946672630004e-05, "epoch": 1.3197224446223645, "percentage": 65.99, "elapsed_time": "11:38:12", "remaining_time": "5:59:54"} +{"current_steps": 4950, "total_steps": 7494, "loss": 0.6076, "lr": 4.681598574115622e-05, "epoch": 1.3210568454763811, "percentage": 66.05, "elapsed_time": "11:38:57", "remaining_time": "5:59:13"} +{"current_steps": 4955, "total_steps": 7494, "loss": 0.5986, "lr": 4.665417770961166e-05, "epoch": 1.3223912463303977, "percentage": 66.12, "elapsed_time": "11:40:11", "remaining_time": "5:58:47"} +{"current_steps": 4960, "total_steps": 7494, "loss": 0.5879, "lr": 4.6492523455814415e-05, "epoch": 1.323725647184414, "percentage": 66.19, "elapsed_time": "11:41:24", "remaining_time": "5:58:20"} +{"current_steps": 4965, "total_steps": 7494, "loss": 0.5941, "lr": 4.633102385674821e-05, "epoch": 1.3250600480384307, "percentage": 66.25, "elapsed_time": "11:42:09", "remaining_time": "5:57:39"} +{"current_steps": 4970, "total_steps": 7494, "loss": 0.5929, "lr": 4.616967978855788e-05, "epoch": 1.3263944488924473, "percentage": 66.32, "elapsed_time": "11:42:55", "remaining_time": "5:56:58"} +{"current_steps": 4975, "total_steps": 7494, "loss": 0.5828, "lr": 4.6008492126544476e-05, "epoch": 1.3277288497464639, "percentage": 66.39, "elapsed_time": "11:44:03", "remaining_time": "5:56:29"} +{"current_steps": 4980, "total_steps": 7494, "loss": 0.6022, "lr": 4.584746174516045e-05, "epoch": 1.3290632506004805, "percentage": 66.45, "elapsed_time": "11:44:49", "remaining_time": "5:55:48"} +{"current_steps": 4985, "total_steps": 7494, "loss": 0.5843, "lr": 4.568658951800512e-05, "epoch": 1.330397651454497, "percentage": 66.52, "elapsed_time": "11:46:41", "remaining_time": "5:55:40"} +{"current_steps": 4990, "total_steps": 7494, "loss": 0.6073, "lr": 4.552587631781969e-05, "epoch": 1.3317320523085134, "percentage": 66.59, "elapsed_time": "11:47:26", "remaining_time": "5:54:59"} +{"current_steps": 4995, "total_steps": 7494, "loss": 0.5901, "lr": 4.536532301648271e-05, "epoch": 1.33306645316253, "percentage": 66.65, "elapsed_time": "11:48:39", "remaining_time": "5:54:32"} +{"current_steps": 5000, "total_steps": 7494, "loss": 0.5923, "lr": 4.5204930485005306e-05, "epoch": 1.3344008540165466, "percentage": 66.72, "elapsed_time": "11:49:48", "remaining_time": "5:54:03"} +{"current_steps": 5005, "total_steps": 7494, "loss": 0.5955, "lr": 4.504469959352627e-05, "epoch": 1.335735254870563, "percentage": 66.79, "elapsed_time": "11:50:40", "remaining_time": "5:53:25"} +{"current_steps": 5010, "total_steps": 7494, "loss": 0.5977, "lr": 4.488463121130762e-05, "epoch": 1.3370696557245796, "percentage": 66.85, "elapsed_time": "11:51:27", "remaining_time": "5:52:44"} +{"current_steps": 5015, "total_steps": 7494, "loss": 0.5918, "lr": 4.472472620672976e-05, "epoch": 1.3384040565785962, "percentage": 66.92, "elapsed_time": "11:53:08", "remaining_time": "5:52:31"} +{"current_steps": 5020, "total_steps": 7494, "loss": 0.6004, "lr": 4.4564985447286614e-05, "epoch": 1.3397384574326128, "percentage": 66.99, "elapsed_time": "11:53:51", "remaining_time": "5:51:48"} +{"current_steps": 5025, "total_steps": 7494, "loss": 0.6061, "lr": 4.440540979958124e-05, "epoch": 1.3410728582866294, "percentage": 67.05, "elapsed_time": "11:55:14", "remaining_time": "5:51:25"} +{"current_steps": 5030, "total_steps": 7494, "loss": 0.5899, "lr": 4.4246000129320867e-05, "epoch": 1.342407259140646, "percentage": 67.12, "elapsed_time": "11:56:40", "remaining_time": "5:51:04"} +{"current_steps": 5035, "total_steps": 7494, "loss": 0.6129, "lr": 4.408675730131227e-05, "epoch": 1.3437416599946623, "percentage": 67.19, "elapsed_time": "11:57:28", "remaining_time": "5:50:23"} +{"current_steps": 5040, "total_steps": 7494, "loss": 0.6047, "lr": 4.3927682179457144e-05, "epoch": 1.345076060848679, "percentage": 67.25, "elapsed_time": "11:58:37", "remaining_time": "5:49:54"} +{"current_steps": 5045, "total_steps": 7494, "loss": 0.6056, "lr": 4.376877562674737e-05, "epoch": 1.3464104617026955, "percentage": 67.32, "elapsed_time": "11:59:24", "remaining_time": "5:49:13"} +{"current_steps": 5050, "total_steps": 7494, "loss": 0.6056, "lr": 4.3610038505260264e-05, "epoch": 1.347744862556712, "percentage": 67.39, "elapsed_time": "12:00:07", "remaining_time": "5:48:30"} +{"current_steps": 5055, "total_steps": 7494, "loss": 0.5998, "lr": 4.3451471676154035e-05, "epoch": 1.3490792634107285, "percentage": 67.45, "elapsed_time": "12:04:00", "remaining_time": "5:49:19"} +{"current_steps": 5060, "total_steps": 7494, "loss": 0.5861, "lr": 4.329307599966306e-05, "epoch": 1.350413664264745, "percentage": 67.52, "elapsed_time": "12:04:45", "remaining_time": "5:48:37"} +{"current_steps": 5065, "total_steps": 7494, "loss": 0.6008, "lr": 4.313485233509309e-05, "epoch": 1.3517480651187617, "percentage": 67.59, "elapsed_time": "12:05:29", "remaining_time": "5:47:55"} +{"current_steps": 5070, "total_steps": 7494, "loss": 0.5961, "lr": 4.297680154081686e-05, "epoch": 1.3530824659727783, "percentage": 67.65, "elapsed_time": "12:06:15", "remaining_time": "5:47:13"} +{"current_steps": 5075, "total_steps": 7494, "loss": 0.5814, "lr": 4.2818924474269126e-05, "epoch": 1.3544168668267949, "percentage": 67.72, "elapsed_time": "12:07:28", "remaining_time": "5:46:45"} +{"current_steps": 5080, "total_steps": 7494, "loss": 0.5819, "lr": 4.266122199194226e-05, "epoch": 1.3557512676808114, "percentage": 67.79, "elapsed_time": "12:08:15", "remaining_time": "5:46:04"} +{"current_steps": 5085, "total_steps": 7494, "loss": 0.5979, "lr": 4.250369494938146e-05, "epoch": 1.3570856685348278, "percentage": 67.85, "elapsed_time": "12:09:27", "remaining_time": "5:45:34"} +{"current_steps": 5090, "total_steps": 7494, "loss": 0.6068, "lr": 4.234634420118021e-05, "epoch": 1.3584200693888444, "percentage": 67.92, "elapsed_time": "12:10:14", "remaining_time": "5:44:53"} +{"current_steps": 5095, "total_steps": 7494, "loss": 0.5945, "lr": 4.218917060097547e-05, "epoch": 1.359754470242861, "percentage": 67.99, "elapsed_time": "12:11:23", "remaining_time": "5:44:22"} +{"current_steps": 5100, "total_steps": 7494, "loss": 0.5893, "lr": 4.203217500144326e-05, "epoch": 1.3610888710968774, "percentage": 68.05, "elapsed_time": "12:12:10", "remaining_time": "5:43:41"} +{"current_steps": 5105, "total_steps": 7494, "loss": 0.6088, "lr": 4.187535825429396e-05, "epoch": 1.362423271950894, "percentage": 68.12, "elapsed_time": "12:13:03", "remaining_time": "5:43:03"} +{"current_steps": 5110, "total_steps": 7494, "loss": 0.5972, "lr": 4.171872121026753e-05, "epoch": 1.3637576728049106, "percentage": 68.19, "elapsed_time": "12:13:50", "remaining_time": "5:42:21"} +{"current_steps": 5115, "total_steps": 7494, "loss": 0.593, "lr": 4.1562264719129165e-05, "epoch": 1.3650920736589272, "percentage": 68.25, "elapsed_time": "12:14:37", "remaining_time": "5:41:40"} +{"current_steps": 5120, "total_steps": 7494, "loss": 0.596, "lr": 4.140598962966447e-05, "epoch": 1.3664264745129437, "percentage": 68.32, "elapsed_time": "12:15:25", "remaining_time": "5:40:59"} +{"current_steps": 5125, "total_steps": 7494, "loss": 0.5977, "lr": 4.124989678967503e-05, "epoch": 1.3677608753669603, "percentage": 68.39, "elapsed_time": "12:16:10", "remaining_time": "5:40:17"} +{"current_steps": 5130, "total_steps": 7494, "loss": 0.5867, "lr": 4.109398704597357e-05, "epoch": 1.3690952762209767, "percentage": 68.45, "elapsed_time": "12:17:26", "remaining_time": "5:39:49"} +{"current_steps": 5135, "total_steps": 7494, "loss": 0.589, "lr": 4.093826124437962e-05, "epoch": 1.3704296770749933, "percentage": 68.52, "elapsed_time": "12:18:43", "remaining_time": "5:39:22"} +{"current_steps": 5140, "total_steps": 7494, "loss": 0.6006, "lr": 4.078272022971481e-05, "epoch": 1.37176407792901, "percentage": 68.59, "elapsed_time": "12:19:32", "remaining_time": "5:38:41"} +{"current_steps": 5145, "total_steps": 7494, "loss": 0.6014, "lr": 4.06273648457982e-05, "epoch": 1.3730984787830265, "percentage": 68.65, "elapsed_time": "12:21:07", "remaining_time": "5:38:21"} +{"current_steps": 5150, "total_steps": 7494, "loss": 0.586, "lr": 4.0472195935441904e-05, "epoch": 1.3744328796370429, "percentage": 68.72, "elapsed_time": "12:21:50", "remaining_time": "5:37:38"} +{"current_steps": 5155, "total_steps": 7494, "loss": 0.5996, "lr": 4.031721434044635e-05, "epoch": 1.3757672804910595, "percentage": 68.79, "elapsed_time": "12:22:38", "remaining_time": "5:36:57"} +{"current_steps": 5160, "total_steps": 7494, "loss": 0.6038, "lr": 4.016242090159574e-05, "epoch": 1.377101681345076, "percentage": 68.86, "elapsed_time": "12:23:27", "remaining_time": "5:36:17"} +{"current_steps": 5165, "total_steps": 7494, "loss": 0.6015, "lr": 4.0007816458653566e-05, "epoch": 1.3784360821990926, "percentage": 68.92, "elapsed_time": "12:24:13", "remaining_time": "5:35:34"} +{"current_steps": 5170, "total_steps": 7494, "loss": 0.596, "lr": 3.9853401850358036e-05, "epoch": 1.3797704830531092, "percentage": 68.99, "elapsed_time": "12:24:56", "remaining_time": "5:34:51"} +{"current_steps": 5175, "total_steps": 7494, "loss": 0.5981, "lr": 3.969917791441739e-05, "epoch": 1.3811048839071258, "percentage": 69.06, "elapsed_time": "12:25:44", "remaining_time": "5:34:10"} +{"current_steps": 5180, "total_steps": 7494, "loss": 0.5955, "lr": 3.954514548750553e-05, "epoch": 1.3824392847611422, "percentage": 69.12, "elapsed_time": "12:26:31", "remaining_time": "5:33:29"} +{"current_steps": 5185, "total_steps": 7494, "loss": 0.5907, "lr": 3.939130540525746e-05, "epoch": 1.3837736856151588, "percentage": 69.19, "elapsed_time": "12:27:18", "remaining_time": "5:32:47"} +{"current_steps": 5190, "total_steps": 7494, "loss": 0.5861, "lr": 3.923765850226456e-05, "epoch": 1.3851080864691754, "percentage": 69.26, "elapsed_time": "12:28:00", "remaining_time": "5:32:04"} +{"current_steps": 5195, "total_steps": 7494, "loss": 0.5892, "lr": 3.908420561207032e-05, "epoch": 1.3864424873231918, "percentage": 69.32, "elapsed_time": "12:29:19", "remaining_time": "5:31:36"} +{"current_steps": 5200, "total_steps": 7494, "loss": 0.6142, "lr": 3.893094756716569e-05, "epoch": 1.3877768881772083, "percentage": 69.39, "elapsed_time": "12:30:05", "remaining_time": "5:30:54"} +{"current_steps": 5205, "total_steps": 7494, "loss": 0.6024, "lr": 3.87778851989845e-05, "epoch": 1.389111289031225, "percentage": 69.46, "elapsed_time": "12:32:03", "remaining_time": "5:30:44"} +{"current_steps": 5210, "total_steps": 7494, "loss": 0.5973, "lr": 3.862501933789908e-05, "epoch": 1.3904456898852415, "percentage": 69.52, "elapsed_time": "12:32:47", "remaining_time": "5:30:00"} +{"current_steps": 5215, "total_steps": 7494, "loss": 0.5952, "lr": 3.847235081321573e-05, "epoch": 1.3917800907392581, "percentage": 69.59, "elapsed_time": "12:35:03", "remaining_time": "5:29:58"} +{"current_steps": 5220, "total_steps": 7494, "loss": 0.5938, "lr": 3.831988045317007e-05, "epoch": 1.3931144915932747, "percentage": 69.66, "elapsed_time": "12:35:47", "remaining_time": "5:29:14"} +{"current_steps": 5225, "total_steps": 7494, "loss": 0.6054, "lr": 3.816760908492282e-05, "epoch": 1.394448892447291, "percentage": 69.72, "elapsed_time": "12:37:11", "remaining_time": "5:28:49"} +{"current_steps": 5230, "total_steps": 7494, "loss": 0.5886, "lr": 3.8015537534555e-05, "epoch": 1.3957832933013077, "percentage": 69.79, "elapsed_time": "12:37:57", "remaining_time": "5:28:06"} +{"current_steps": 5235, "total_steps": 7494, "loss": 0.598, "lr": 3.786366662706372e-05, "epoch": 1.3971176941553243, "percentage": 69.86, "elapsed_time": "12:38:41", "remaining_time": "5:27:23"} +{"current_steps": 5240, "total_steps": 7494, "loss": 0.5837, "lr": 3.771199718635758e-05, "epoch": 1.3984520950093409, "percentage": 69.92, "elapsed_time": "12:39:29", "remaining_time": "5:26:41"} +{"current_steps": 5245, "total_steps": 7494, "loss": 0.6062, "lr": 3.756053003525213e-05, "epoch": 1.3997864958633572, "percentage": 69.99, "elapsed_time": "12:40:15", "remaining_time": "5:25:59"} +{"current_steps": 5250, "total_steps": 7494, "loss": 0.6059, "lr": 3.7409265995465577e-05, "epoch": 1.4011208967173738, "percentage": 70.06, "elapsed_time": "12:41:44", "remaining_time": "5:25:35"} +{"current_steps": 5255, "total_steps": 7494, "loss": 0.6073, "lr": 3.725820588761422e-05, "epoch": 1.4024552975713904, "percentage": 70.12, "elapsed_time": "12:42:27", "remaining_time": "5:24:51"} +{"current_steps": 5260, "total_steps": 7494, "loss": 0.6076, "lr": 3.7107350531207944e-05, "epoch": 1.403789698425407, "percentage": 70.19, "elapsed_time": "12:43:14", "remaining_time": "5:24:09"} +{"current_steps": 5265, "total_steps": 7494, "loss": 0.5942, "lr": 3.6956700744645934e-05, "epoch": 1.4051240992794236, "percentage": 70.26, "elapsed_time": "12:44:01", "remaining_time": "5:23:27"} +{"current_steps": 5270, "total_steps": 7494, "loss": 0.5898, "lr": 3.6806257345212136e-05, "epoch": 1.4064585001334402, "percentage": 70.32, "elapsed_time": "12:44:50", "remaining_time": "5:22:46"} +{"current_steps": 5275, "total_steps": 7494, "loss": 0.6009, "lr": 3.665602114907075e-05, "epoch": 1.4077929009874566, "percentage": 70.39, "elapsed_time": "12:45:33", "remaining_time": "5:22:02"} +{"current_steps": 5280, "total_steps": 7494, "loss": 0.6023, "lr": 3.650599297126198e-05, "epoch": 1.4091273018414732, "percentage": 70.46, "elapsed_time": "12:46:20", "remaining_time": "5:21:20"} +{"current_steps": 5285, "total_steps": 7494, "loss": 0.6002, "lr": 3.63561736256975e-05, "epoch": 1.4104617026954898, "percentage": 70.52, "elapsed_time": "12:47:05", "remaining_time": "5:20:37"} +{"current_steps": 5290, "total_steps": 7494, "loss": 0.601, "lr": 3.6206563925156e-05, "epoch": 1.4117961035495064, "percentage": 70.59, "elapsed_time": "12:48:22", "remaining_time": "5:20:07"} +{"current_steps": 5295, "total_steps": 7494, "loss": 0.5908, "lr": 3.605716468127889e-05, "epoch": 1.4131305044035227, "percentage": 70.66, "elapsed_time": "12:49:52", "remaining_time": "5:19:43"} +{"current_steps": 5300, "total_steps": 7494, "loss": 0.5883, "lr": 3.590797670456586e-05, "epoch": 1.4144649052575393, "percentage": 70.72, "elapsed_time": "12:50:40", "remaining_time": "5:19:01"} +{"current_steps": 5305, "total_steps": 7494, "loss": 0.573, "lr": 3.575900080437036e-05, "epoch": 1.415799306111556, "percentage": 70.79, "elapsed_time": "12:51:32", "remaining_time": "5:18:21"} +{"current_steps": 5310, "total_steps": 7494, "loss": 0.5964, "lr": 3.561023778889545e-05, "epoch": 1.4171337069655725, "percentage": 70.86, "elapsed_time": "12:52:50", "remaining_time": "5:17:52"} +{"current_steps": 5315, "total_steps": 7494, "loss": 0.5869, "lr": 3.546168846518915e-05, "epoch": 1.418468107819589, "percentage": 70.92, "elapsed_time": "12:53:33", "remaining_time": "5:17:08"} +{"current_steps": 5320, "total_steps": 7494, "loss": 0.5968, "lr": 3.531335363914027e-05, "epoch": 1.4198025086736055, "percentage": 70.99, "elapsed_time": "12:54:41", "remaining_time": "5:16:34"} +{"current_steps": 5325, "total_steps": 7494, "loss": 0.5922, "lr": 3.516523411547397e-05, "epoch": 1.421136909527622, "percentage": 71.06, "elapsed_time": "12:55:26", "remaining_time": "5:15:51"} +{"current_steps": 5330, "total_steps": 7494, "loss": 0.6091, "lr": 3.5017330697747276e-05, "epoch": 1.4224713103816387, "percentage": 71.12, "elapsed_time": "12:56:13", "remaining_time": "5:15:09"} +{"current_steps": 5335, "total_steps": 7494, "loss": 0.6012, "lr": 3.486964418834495e-05, "epoch": 1.4238057112356552, "percentage": 71.19, "elapsed_time": "12:57:01", "remaining_time": "5:14:27"} +{"current_steps": 5340, "total_steps": 7494, "loss": 0.5959, "lr": 3.472217538847496e-05, "epoch": 1.4251401120896716, "percentage": 71.26, "elapsed_time": "12:58:23", "remaining_time": "5:13:58"} +{"current_steps": 5345, "total_steps": 7494, "loss": 0.604, "lr": 3.457492509816416e-05, "epoch": 1.4264745129436882, "percentage": 71.32, "elapsed_time": "12:59:58", "remaining_time": "5:13:35"} +{"current_steps": 5350, "total_steps": 7494, "loss": 0.5921, "lr": 3.442789411625402e-05, "epoch": 1.4278089137977048, "percentage": 71.39, "elapsed_time": "13:01:40", "remaining_time": "5:13:15"} +{"current_steps": 5355, "total_steps": 7494, "loss": 0.6039, "lr": 3.428108324039626e-05, "epoch": 1.4291433146517214, "percentage": 71.46, "elapsed_time": "13:03:34", "remaining_time": "5:12:59"} +{"current_steps": 5360, "total_steps": 7494, "loss": 0.5998, "lr": 3.413449326704843e-05, "epoch": 1.430477715505738, "percentage": 71.52, "elapsed_time": "13:05:15", "remaining_time": "5:12:38"} +{"current_steps": 5365, "total_steps": 7494, "loss": 0.5847, "lr": 3.3988124991469764e-05, "epoch": 1.4318121163597546, "percentage": 71.59, "elapsed_time": "13:06:37", "remaining_time": "5:12:09"} +{"current_steps": 5370, "total_steps": 7494, "loss": 0.5912, "lr": 3.384197920771676e-05, "epoch": 1.433146517213771, "percentage": 71.66, "elapsed_time": "13:07:22", "remaining_time": "5:11:25"} +{"current_steps": 5375, "total_steps": 7494, "loss": 0.5934, "lr": 3.36960567086388e-05, "epoch": 1.4344809180677875, "percentage": 71.72, "elapsed_time": "13:09:33", "remaining_time": "5:11:16"} +{"current_steps": 5380, "total_steps": 7494, "loss": 0.6079, "lr": 3.355035828587403e-05, "epoch": 1.4358153189218041, "percentage": 71.79, "elapsed_time": "13:10:19", "remaining_time": "5:10:32"} +{"current_steps": 5385, "total_steps": 7494, "loss": 0.5836, "lr": 3.340488472984493e-05, "epoch": 1.4371497197758207, "percentage": 71.86, "elapsed_time": "13:11:05", "remaining_time": "5:09:49"} +{"current_steps": 5390, "total_steps": 7494, "loss": 0.6062, "lr": 3.3259636829754086e-05, "epoch": 1.438484120629837, "percentage": 71.92, "elapsed_time": "13:11:49", "remaining_time": "5:09:05"} +{"current_steps": 5395, "total_steps": 7494, "loss": 0.5921, "lr": 3.3114615373579827e-05, "epoch": 1.4398185214838537, "percentage": 71.99, "elapsed_time": "13:12:37", "remaining_time": "5:08:22"} +{"current_steps": 5305, "total_steps": 7494, "loss": 0.6039, "lr": 3.575900080437036e-05, "epoch": 1.415799306111556, "percentage": 70.79, "elapsed_time": "0:10:08", "remaining_time": "0:04:11"} +{"current_steps": 5310, "total_steps": 7494, "loss": 0.5867, "lr": 3.561023778889545e-05, "epoch": 1.4171337069655725, "percentage": 70.86, "elapsed_time": "0:11:23", "remaining_time": "0:04:41"} +{"current_steps": 5315, "total_steps": 7494, "loss": 0.5905, "lr": 3.546168846518915e-05, "epoch": 1.418468107819589, "percentage": 70.92, "elapsed_time": "0:12:37", "remaining_time": "0:05:10"} +{"current_steps": 5320, "total_steps": 7494, "loss": 0.5893, "lr": 3.531335363914027e-05, "epoch": 1.4198025086736055, "percentage": 70.99, "elapsed_time": "0:13:52", "remaining_time": "0:05:40"} +{"current_steps": 5325, "total_steps": 7494, "loss": 0.6034, "lr": 3.516523411547397e-05, "epoch": 1.421136909527622, "percentage": 71.06, "elapsed_time": "0:14:33", "remaining_time": "0:05:55"} +{"current_steps": 5330, "total_steps": 7494, "loss": 0.5959, "lr": 3.5017330697747276e-05, "epoch": 1.4224713103816387, "percentage": 71.12, "elapsed_time": "0:15:12", "remaining_time": "0:06:10"} +{"current_steps": 5335, "total_steps": 7494, "loss": 0.5995, "lr": 3.486964418834495e-05, "epoch": 1.4238057112356552, "percentage": 71.19, "elapsed_time": "0:16:12", "remaining_time": "0:06:33"} +{"current_steps": 5340, "total_steps": 7494, "loss": 0.5976, "lr": 3.472217538847496e-05, "epoch": 1.4251401120896716, "percentage": 71.26, "elapsed_time": "0:16:48", "remaining_time": "0:06:46"} +{"current_steps": 5345, "total_steps": 7494, "loss": 0.5888, "lr": 3.457492509816416e-05, "epoch": 1.4264745129436882, "percentage": 71.32, "elapsed_time": "0:17:21", "remaining_time": "0:06:58"} +{"current_steps": 5350, "total_steps": 7494, "loss": 0.6041, "lr": 3.442789411625402e-05, "epoch": 1.4278089137977048, "percentage": 71.39, "elapsed_time": "0:18:20", "remaining_time": "0:07:21"} +{"current_steps": 5355, "total_steps": 7494, "loss": 0.6022, "lr": 3.428108324039626e-05, "epoch": 1.4291433146517214, "percentage": 71.46, "elapsed_time": "0:18:54", "remaining_time": "0:07:33"} +{"current_steps": 5360, "total_steps": 7494, "loss": 0.5765, "lr": 3.413449326704843e-05, "epoch": 1.430477715505738, "percentage": 71.52, "elapsed_time": "0:19:26", "remaining_time": "0:07:44"} +{"current_steps": 5365, "total_steps": 7494, "loss": 0.6153, "lr": 3.3988124991469764e-05, "epoch": 1.4318121163597546, "percentage": 71.59, "elapsed_time": "0:20:18", "remaining_time": "0:08:03"} +{"current_steps": 5370, "total_steps": 7494, "loss": 0.5835, "lr": 3.384197920771676e-05, "epoch": 1.433146517213771, "percentage": 71.66, "elapsed_time": "0:20:58", "remaining_time": "0:08:17"} +{"current_steps": 5375, "total_steps": 7494, "loss": 0.6115, "lr": 3.36960567086388e-05, "epoch": 1.4344809180677875, "percentage": 71.72, "elapsed_time": "0:21:31", "remaining_time": "0:08:28"} +{"current_steps": 5380, "total_steps": 7494, "loss": 0.5911, "lr": 3.355035828587403e-05, "epoch": 1.4358153189218041, "percentage": 71.79, "elapsed_time": "0:22:04", "remaining_time": "0:08:40"} +{"current_steps": 5385, "total_steps": 7494, "loss": 0.5891, "lr": 3.340488472984493e-05, "epoch": 1.4371497197758207, "percentage": 71.86, "elapsed_time": "0:23:03", "remaining_time": "0:09:01"} +{"current_steps": 5390, "total_steps": 7494, "loss": 0.5966, "lr": 3.3259636829754086e-05, "epoch": 1.438484120629837, "percentage": 71.92, "elapsed_time": "0:23:35", "remaining_time": "0:09:12"} +{"current_steps": 5395, "total_steps": 7494, "loss": 0.5841, "lr": 3.3114615373579827e-05, "epoch": 1.4398185214838537, "percentage": 71.99, "elapsed_time": "0:24:07", "remaining_time": "0:09:23"} +{"current_steps": 5400, "total_steps": 7494, "loss": 0.6039, "lr": 3.296982114807207e-05, "epoch": 1.4411529223378703, "percentage": 72.06, "elapsed_time": "0:25:09", "remaining_time": "0:09:45"} +{"current_steps": 5405, "total_steps": 7494, "loss": 0.5931, "lr": 3.282525493874798e-05, "epoch": 1.4424873231918869, "percentage": 72.12, "elapsed_time": "0:25:49", "remaining_time": "0:09:59"} +{"current_steps": 5410, "total_steps": 7494, "loss": 0.6009, "lr": 3.2680917529887746e-05, "epoch": 1.4438217240459035, "percentage": 72.19, "elapsed_time": "0:26:21", "remaining_time": "0:10:09"} +{"current_steps": 5415, "total_steps": 7494, "loss": 0.5807, "lr": 3.2536809704530206e-05, "epoch": 1.44515612489992, "percentage": 72.26, "elapsed_time": "0:27:12", "remaining_time": "0:10:26"} +{"current_steps": 5420, "total_steps": 7494, "loss": 0.5964, "lr": 3.239293224446879e-05, "epoch": 1.4464905257539364, "percentage": 72.32, "elapsed_time": "0:27:53", "remaining_time": "0:10:40"} +{"current_steps": 5425, "total_steps": 7494, "loss": 0.5842, "lr": 3.224928593024719e-05, "epoch": 1.447824926607953, "percentage": 72.39, "elapsed_time": "0:28:24", "remaining_time": "0:10:50"} +{"current_steps": 5430, "total_steps": 7494, "loss": 0.6061, "lr": 3.210587154115501e-05, "epoch": 1.4491593274619696, "percentage": 72.46, "elapsed_time": "0:28:57", "remaining_time": "0:11:00"} +{"current_steps": 5435, "total_steps": 7494, "loss": 0.5967, "lr": 3.196268985522376e-05, "epoch": 1.450493728315986, "percentage": 72.52, "elapsed_time": "0:30:00", "remaining_time": "0:11:22"} +{"current_steps": 5440, "total_steps": 7494, "loss": 0.5873, "lr": 3.1819741649222485e-05, "epoch": 1.4518281291700026, "percentage": 72.59, "elapsed_time": "0:30:31", "remaining_time": "0:11:31"} +{"current_steps": 5445, "total_steps": 7494, "loss": 0.6164, "lr": 3.167702769865354e-05, "epoch": 1.4531625300240192, "percentage": 72.66, "elapsed_time": "0:31:02", "remaining_time": "0:11:40"} +{"current_steps": 5450, "total_steps": 7494, "loss": 0.5957, "lr": 3.153454877774849e-05, "epoch": 1.4544969308780358, "percentage": 72.72, "elapsed_time": "0:32:05", "remaining_time": "0:12:02"} +{"current_steps": 5455, "total_steps": 7494, "loss": 0.5899, "lr": 3.139230565946387e-05, "epoch": 1.4558313317320524, "percentage": 72.79, "elapsed_time": "0:32:39", "remaining_time": "0:12:12"} +{"current_steps": 5460, "total_steps": 7494, "loss": 0.6072, "lr": 3.1250299115476874e-05, "epoch": 1.457165732586069, "percentage": 72.86, "elapsed_time": "0:33:10", "remaining_time": "0:12:21"} +{"current_steps": 5465, "total_steps": 7494, "loss": 0.5976, "lr": 3.110852991618135e-05, "epoch": 1.4585001334400853, "percentage": 72.93, "elapsed_time": "0:33:53", "remaining_time": "0:12:35"} +{"current_steps": 5470, "total_steps": 7494, "loss": 0.5945, "lr": 3.0966998830683536e-05, "epoch": 1.459834534294102, "percentage": 72.99, "elapsed_time": "0:34:46", "remaining_time": "0:12:51"} +{"current_steps": 5475, "total_steps": 7494, "loss": 0.591, "lr": 3.082570662679782e-05, "epoch": 1.4611689351481185, "percentage": 73.06, "elapsed_time": "0:35:17", "remaining_time": "0:13:00"} +{"current_steps": 5480, "total_steps": 7494, "loss": 0.5945, "lr": 3.068465407104275e-05, "epoch": 1.4625033360021351, "percentage": 73.13, "elapsed_time": "0:35:48", "remaining_time": "0:13:09"} +{"current_steps": 5485, "total_steps": 7494, "loss": 0.5788, "lr": 3.054384192863664e-05, "epoch": 1.4638377368561515, "percentage": 73.19, "elapsed_time": "0:36:54", "remaining_time": "0:13:30"} +{"current_steps": 5490, "total_steps": 7494, "loss": 0.5879, "lr": 3.0403270963493657e-05, "epoch": 1.465172137710168, "percentage": 73.26, "elapsed_time": "0:37:27", "remaining_time": "0:13:40"} +{"current_steps": 5495, "total_steps": 7494, "loss": 0.5984, "lr": 3.026294193821954e-05, "epoch": 1.4665065385641847, "percentage": 73.33, "elapsed_time": "0:37:58", "remaining_time": "0:13:48"} +{"current_steps": 5500, "total_steps": 7494, "loss": 0.5935, "lr": 3.012285561410742e-05, "epoch": 1.4678409394182013, "percentage": 73.39, "elapsed_time": "0:38:52", "remaining_time": "0:14:05"} +{"current_steps": 5505, "total_steps": 7494, "loss": 0.5937, "lr": 2.9983012751133852e-05, "epoch": 1.4691753402722179, "percentage": 73.46, "elapsed_time": "0:39:44", "remaining_time": "0:14:21"} +{"current_steps": 5510, "total_steps": 7494, "loss": 0.5861, "lr": 2.9843414107954588e-05, "epoch": 1.4705097411262344, "percentage": 73.53, "elapsed_time": "0:40:15", "remaining_time": "0:14:29"} +{"current_steps": 5515, "total_steps": 7494, "loss": 0.6058, "lr": 2.9704060441900402e-05, "epoch": 1.4718441419802508, "percentage": 73.59, "elapsed_time": "0:40:48", "remaining_time": "0:14:38"} +{"current_steps": 5505, "total_steps": 7494, "loss": 0.5937, "lr": 2.9983012751133852e-05, "epoch": 1.4691753402722179, "percentage": 73.46, "elapsed_time": "0:08:47", "remaining_time": "0:03:10"} +{"current_steps": 5510, "total_steps": 7494, "loss": 0.5861, "lr": 2.9843414107954588e-05, "epoch": 1.4705097411262344, "percentage": 73.53, "elapsed_time": "0:11:21", "remaining_time": "0:04:05"} +{"current_steps": 5515, "total_steps": 7494, "loss": 0.6058, "lr": 2.9704060441900402e-05, "epoch": 1.4718441419802508, "percentage": 73.59, "elapsed_time": "0:14:15", "remaining_time": "0:05:06"} +{"current_steps": 5520, "total_steps": 7494, "loss": 0.5924, "lr": 2.956495250897311e-05, "epoch": 1.4731785428342674, "percentage": 73.66, "elapsed_time": "0:19:42", "remaining_time": "0:07:02"} +{"current_steps": 5525, "total_steps": 7494, "loss": 0.5716, "lr": 2.9426091063841444e-05, "epoch": 1.474512943688284, "percentage": 73.73, "elapsed_time": "0:20:20", "remaining_time": "0:07:14"} +{"current_steps": 5530, "total_steps": 7494, "loss": 0.5955, "lr": 2.9287476859836817e-05, "epoch": 1.4758473445423004, "percentage": 73.79, "elapsed_time": "0:21:30", "remaining_time": "0:07:38"} +{"current_steps": 5505, "total_steps": 7494, "loss": 0.5937, "lr": 2.9983012751133852e-05, "epoch": 1.4691753402722179, "percentage": 73.46, "elapsed_time": "0:17:21", "remaining_time": "0:06:16"} +{"current_steps": 5510, "total_steps": 7494, "loss": 0.586, "lr": 2.9843414107954588e-05, "epoch": 1.4705097411262344, "percentage": 73.53, "elapsed_time": "0:19:44", "remaining_time": "0:07:06"} +{"current_steps": 5515, "total_steps": 7494, "loss": 0.6058, "lr": 2.9704060441900402e-05, "epoch": 1.4718441419802508, "percentage": 73.59, "elapsed_time": "0:23:54", "remaining_time": "0:08:34"} +{"current_steps": 5520, "total_steps": 7494, "loss": 0.5923, "lr": 2.956495250897311e-05, "epoch": 1.4731785428342674, "percentage": 73.66, "elapsed_time": "0:25:44", "remaining_time": "0:09:12"} +{"current_steps": 5525, "total_steps": 7494, "loss": 0.5716, "lr": 2.9426091063841444e-05, "epoch": 1.474512943688284, "percentage": 73.73, "elapsed_time": "0:28:50", "remaining_time": "0:10:16"} +{"current_steps": 5505, "total_steps": 7494, "loss": 0.5937, "lr": 2.9983012751133852e-05, "epoch": 1.4691753402722179, "percentage": 73.46, "elapsed_time": "0:09:23", "remaining_time": "0:03:23"} +{"current_steps": 5510, "total_steps": 7494, "loss": 0.586, "lr": 2.9843414107954588e-05, "epoch": 1.4705097411262344, "percentage": 73.53, "elapsed_time": "0:10:28", "remaining_time": "0:03:46"} +{"current_steps": 5515, "total_steps": 7494, "loss": 0.6058, "lr": 2.9704060441900402e-05, "epoch": 1.4718441419802508, "percentage": 73.59, "elapsed_time": "0:11:38", "remaining_time": "0:04:10"} +{"current_steps": 5520, "total_steps": 7494, "loss": 0.5923, "lr": 2.956495250897311e-05, "epoch": 1.4731785428342674, "percentage": 73.66, "elapsed_time": "0:12:49", "remaining_time": "0:04:35"} +{"current_steps": 5525, "total_steps": 7494, "loss": 0.5716, "lr": 2.9426091063841444e-05, "epoch": 1.474512943688284, "percentage": 73.73, "elapsed_time": "0:13:29", "remaining_time": "0:04:48"} +{"current_steps": 5530, "total_steps": 7494, "loss": 0.5956, "lr": 2.9287476859836817e-05, "epoch": 1.4758473445423004, "percentage": 73.79, "elapsed_time": "0:14:09", "remaining_time": "0:05:01"} +{"current_steps": 5535, "total_steps": 7494, "loss": 0.6053, "lr": 2.9149110648949447e-05, "epoch": 1.477181745396317, "percentage": 73.86, "elapsed_time": "0:15:10", "remaining_time": "0:05:22"} +{"current_steps": 5540, "total_steps": 7494, "loss": 0.5969, "lr": 2.9010993181824158e-05, "epoch": 1.4785161462503336, "percentage": 73.93, "elapsed_time": "0:15:44", "remaining_time": "0:05:33"} +{"current_steps": 5545, "total_steps": 7494, "loss": 0.5957, "lr": 2.8873125207756255e-05, "epoch": 1.4798505471043502, "percentage": 73.99, "elapsed_time": "0:16:21", "remaining_time": "0:05:44"} +{"current_steps": 5550, "total_steps": 7494, "loss": 0.5978, "lr": 2.8735507474687603e-05, "epoch": 1.4811849479583667, "percentage": 74.06, "elapsed_time": "0:17:22", "remaining_time": "0:06:04"} +{"current_steps": 5555, "total_steps": 7494, "loss": 0.5844, "lr": 2.859814072920249e-05, "epoch": 1.4825193488123833, "percentage": 74.13, "elapsed_time": "0:17:55", "remaining_time": "0:06:15"} +{"current_steps": 5560, "total_steps": 7494, "loss": 0.5988, "lr": 2.846102571652352e-05, "epoch": 1.4838537496663997, "percentage": 74.19, "elapsed_time": "0:18:28", "remaining_time": "0:06:25"} +{"current_steps": 5565, "total_steps": 7494, "loss": 0.5953, "lr": 2.8324163180507716e-05, "epoch": 1.4851881505204163, "percentage": 74.26, "elapsed_time": "0:19:21", "remaining_time": "0:06:42"} +{"current_steps": 5570, "total_steps": 7494, "loss": 0.5881, "lr": 2.8187553863642314e-05, "epoch": 1.486522551374433, "percentage": 74.33, "elapsed_time": "0:20:02", "remaining_time": "0:06:55"} +{"current_steps": 5575, "total_steps": 7494, "loss": 0.6051, "lr": 2.8051198507040876e-05, "epoch": 1.4878569522284495, "percentage": 74.39, "elapsed_time": "0:20:36", "remaining_time": "0:07:05"} +{"current_steps": 5580, "total_steps": 7494, "loss": 0.5943, "lr": 2.7915097850439238e-05, "epoch": 1.4891913530824659, "percentage": 74.46, "elapsed_time": "0:21:12", "remaining_time": "0:07:16"} +{"current_steps": 5585, "total_steps": 7494, "loss": 0.5906, "lr": 2.7779252632191394e-05, "epoch": 1.4905257539364825, "percentage": 74.53, "elapsed_time": "0:22:15", "remaining_time": "0:07:36"} +{"current_steps": 5590, "total_steps": 7494, "loss": 0.5987, "lr": 2.7643663589265642e-05, "epoch": 1.491860154790499, "percentage": 74.59, "elapsed_time": "0:22:49", "remaining_time": "0:07:46"} +{"current_steps": 5595, "total_steps": 7494, "loss": 0.605, "lr": 2.750833145724049e-05, "epoch": 1.4931945556445156, "percentage": 74.66, "elapsed_time": "0:23:23", "remaining_time": "0:07:56"} +{"current_steps": 5600, "total_steps": 7494, "loss": 0.5993, "lr": 2.7373256970300663e-05, "epoch": 1.4945289564985322, "percentage": 74.73, "elapsed_time": "0:24:26", "remaining_time": "0:08:15"} +{"current_steps": 5605, "total_steps": 7494, "loss": 0.6093, "lr": 2.7238440861233176e-05, "epoch": 1.4958633573525488, "percentage": 74.79, "elapsed_time": "0:25:07", "remaining_time": "0:08:28"} +{"current_steps": 5610, "total_steps": 7494, "loss": 0.603, "lr": 2.710388386142335e-05, "epoch": 1.4971977582065652, "percentage": 74.86, "elapsed_time": "0:25:40", "remaining_time": "0:08:37"} +{"current_steps": 5615, "total_steps": 7494, "loss": 0.6003, "lr": 2.6969586700850753e-05, "epoch": 1.4985321590605818, "percentage": 74.93, "elapsed_time": "0:26:33", "remaining_time": "0:08:53"} +{"current_steps": 5620, "total_steps": 7494, "loss": 0.5914, "lr": 2.6835550108085373e-05, "epoch": 1.4998665599145984, "percentage": 74.99, "elapsed_time": "0:27:16", "remaining_time": "0:09:05"} +{"current_steps": 5625, "total_steps": 7494, "loss": 0.5887, "lr": 2.67017748102836e-05, "epoch": 1.5012009607686148, "percentage": 75.06, "elapsed_time": "0:27:49", "remaining_time": "0:09:14"} +{"current_steps": 5630, "total_steps": 7494, "loss": 0.6003, "lr": 2.6568261533184233e-05, "epoch": 1.5025353616226313, "percentage": 75.13, "elapsed_time": "0:28:25", "remaining_time": "0:09:24"} +{"current_steps": 5635, "total_steps": 7494, "loss": 0.5896, "lr": 2.643501100110463e-05, "epoch": 1.503869762476648, "percentage": 75.19, "elapsed_time": "0:29:28", "remaining_time": "0:09:43"} +{"current_steps": 5640, "total_steps": 7494, "loss": 0.597, "lr": 2.6302023936936776e-05, "epoch": 1.5052041633306645, "percentage": 75.26, "elapsed_time": "0:30:01", "remaining_time": "0:09:52"} +{"current_steps": 5645, "total_steps": 7494, "loss": 0.5937, "lr": 2.616930106214323e-05, "epoch": 1.5065385641846811, "percentage": 75.33, "elapsed_time": "0:30:34", "remaining_time": "0:10:01"} +{"current_steps": 5650, "total_steps": 7494, "loss": 0.5876, "lr": 2.6036843096753394e-05, "epoch": 1.5078729650386977, "percentage": 75.39, "elapsed_time": "0:31:37", "remaining_time": "0:10:19"} +{"current_steps": 5655, "total_steps": 7494, "loss": 0.602, "lr": 2.5904650759359528e-05, "epoch": 1.5092073658927143, "percentage": 75.46, "elapsed_time": "0:32:13", "remaining_time": "0:10:28"} +{"current_steps": 5660, "total_steps": 7494, "loss": 0.5901, "lr": 2.5772724767112753e-05, "epoch": 1.5105417667467307, "percentage": 75.53, "elapsed_time": "0:32:46", "remaining_time": "0:10:37"} +{"current_steps": 5665, "total_steps": 7494, "loss": 0.6093, "lr": 2.564106583571933e-05, "epoch": 1.5118761676007473, "percentage": 75.59, "elapsed_time": "0:33:32", "remaining_time": "0:10:49"} +{"current_steps": 5670, "total_steps": 7494, "loss": 0.5901, "lr": 2.550967467943668e-05, "epoch": 1.5132105684547636, "percentage": 75.66, "elapsed_time": "0:34:25", "remaining_time": "0:11:04"} +{"current_steps": 5675, "total_steps": 7494, "loss": 0.5955, "lr": 2.537855201106955e-05, "epoch": 1.5145449693087802, "percentage": 75.73, "elapsed_time": "0:34:58", "remaining_time": "0:11:12"} +{"current_steps": 5680, "total_steps": 7494, "loss": 0.6044, "lr": 2.5247698541966066e-05, "epoch": 1.5158793701627968, "percentage": 75.79, "elapsed_time": "0:35:32", "remaining_time": "0:11:20"} +{"current_steps": 5685, "total_steps": 7494, "loss": 0.5948, "lr": 2.511711498201397e-05, "epoch": 1.5172137710168134, "percentage": 75.86, "elapsed_time": "0:36:39", "remaining_time": "0:11:39"} +{"current_steps": 5690, "total_steps": 7494, "loss": 0.5948, "lr": 2.4986802039636773e-05, "epoch": 1.51854817187083, "percentage": 75.93, "elapsed_time": "0:37:13", "remaining_time": "0:11:47"} +{"current_steps": 5695, "total_steps": 7494, "loss": 0.5963, "lr": 2.485676042178976e-05, "epoch": 1.5198825727248466, "percentage": 75.99, "elapsed_time": "0:37:46", "remaining_time": "0:11:56"} +{"current_steps": 5700, "total_steps": 7494, "loss": 0.6006, "lr": 2.4726990833956363e-05, "epoch": 1.5212169735788632, "percentage": 76.06, "elapsed_time": "0:38:39", "remaining_time": "0:12:10"} +{"current_steps": 5705, "total_steps": 7494, "loss": 0.5886, "lr": 2.45974939801442e-05, "epoch": 1.5225513744328798, "percentage": 76.13, "elapsed_time": "0:39:38", "remaining_time": "0:12:25"} +{"current_steps": 5710, "total_steps": 7494, "loss": 0.5832, "lr": 2.446827056288131e-05, "epoch": 1.5238857752868962, "percentage": 76.19, "elapsed_time": "0:40:10", "remaining_time": "0:12:33"} +{"current_steps": 5715, "total_steps": 7494, "loss": 0.5965, "lr": 2.4339321283212276e-05, "epoch": 1.5252201761409128, "percentage": 76.26, "elapsed_time": "0:40:46", "remaining_time": "0:12:41"} +{"current_steps": 5720, "total_steps": 7494, "loss": 0.6029, "lr": 2.421064684069453e-05, "epoch": 1.5265545769949291, "percentage": 76.33, "elapsed_time": "0:41:51", "remaining_time": "0:12:58"} +{"current_steps": 5725, "total_steps": 7494, "loss": 0.5996, "lr": 2.4082247933394414e-05, "epoch": 1.5278889778489457, "percentage": 76.39, "elapsed_time": "0:42:24", "remaining_time": "0:13:06"} +{"current_steps": 5730, "total_steps": 7494, "loss": 0.5953, "lr": 2.3954125257883558e-05, "epoch": 1.5292233787029623, "percentage": 76.46, "elapsed_time": "0:42:58", "remaining_time": "0:13:13"} +{"current_steps": 5735, "total_steps": 7494, "loss": 0.5951, "lr": 2.382627950923501e-05, "epoch": 1.530557779556979, "percentage": 76.53, "elapsed_time": "0:43:57", "remaining_time": "0:13:28"} +{"current_steps": 5740, "total_steps": 7494, "loss": 0.5958, "lr": 2.3698711381019398e-05, "epoch": 1.5318921804109955, "percentage": 76.59, "elapsed_time": "0:44:41", "remaining_time": "0:13:39"} +{"current_steps": 5745, "total_steps": 7494, "loss": 0.5852, "lr": 2.3571421565301315e-05, "epoch": 1.533226581265012, "percentage": 76.66, "elapsed_time": "0:45:13", "remaining_time": "0:13:46"} +{"current_steps": 5750, "total_steps": 7494, "loss": 0.6006, "lr": 2.3444410752635512e-05, "epoch": 1.5345609821190287, "percentage": 76.73, "elapsed_time": "0:45:51", "remaining_time": "0:13:54"} +{"current_steps": 5755, "total_steps": 7494, "loss": 0.5877, "lr": 2.331767963206302e-05, "epoch": 1.535895382973045, "percentage": 76.79, "elapsed_time": "0:46:54", "remaining_time": "0:14:10"} +{"current_steps": 5760, "total_steps": 7494, "loss": 0.592, "lr": 2.319122889110763e-05, "epoch": 1.5372297838270617, "percentage": 76.86, "elapsed_time": "0:47:28", "remaining_time": "0:14:17"} +{"current_steps": 5765, "total_steps": 7494, "loss": 0.5867, "lr": 2.3065059215772057e-05, "epoch": 1.5385641846810783, "percentage": 76.93, "elapsed_time": "0:48:01", "remaining_time": "0:14:24"} +{"current_steps": 5770, "total_steps": 7494, "loss": 0.585, "lr": 2.2939171290534127e-05, "epoch": 1.5398985855350946, "percentage": 76.99, "elapsed_time": "0:49:01", "remaining_time": "0:14:38"} +{"current_steps": 5775, "total_steps": 7494, "loss": 0.5943, "lr": 2.281356579834324e-05, "epoch": 1.5412329863891112, "percentage": 77.06, "elapsed_time": "0:49:42", "remaining_time": "0:14:47"} +{"current_steps": 5780, "total_steps": 7494, "loss": 0.5857, "lr": 2.2688243420616573e-05, "epoch": 1.5425673872431278, "percentage": 77.13, "elapsed_time": "0:50:15", "remaining_time": "0:14:54"} +{"current_steps": 5785, "total_steps": 7494, "loss": 0.6055, "lr": 2.2563204837235323e-05, "epoch": 1.5439017880971444, "percentage": 77.2, "elapsed_time": "0:50:56", "remaining_time": "0:15:02"} +{"current_steps": 5790, "total_steps": 7494, "loss": 0.5776, "lr": 2.243845072654115e-05, "epoch": 1.545236188951161, "percentage": 77.26, "elapsed_time": "0:51:57", "remaining_time": "0:15:17"} +{"current_steps": 5795, "total_steps": 7494, "loss": 0.5935, "lr": 2.2313981765332464e-05, "epoch": 1.5465705898051776, "percentage": 77.33, "elapsed_time": "0:52:30", "remaining_time": "0:15:23"} +{"current_steps": 5800, "total_steps": 7494, "loss": 0.594, "lr": 2.2189798628860604e-05, "epoch": 1.5479049906591942, "percentage": 77.4, "elapsed_time": "0:53:03", "remaining_time": "0:15:29"} +{"current_steps": 5805, "total_steps": 7494, "loss": 0.5893, "lr": 2.206590199082642e-05, "epoch": 1.5492393915132106, "percentage": 77.46, "elapsed_time": "0:54:15", "remaining_time": "0:15:47"} +{"current_steps": 5810, "total_steps": 7494, "loss": 0.5924, "lr": 2.194229252337639e-05, "epoch": 1.5505737923672271, "percentage": 77.53, "elapsed_time": "0:54:57", "remaining_time": "0:15:55"} +{"current_steps": 5815, "total_steps": 7494, "loss": 0.5864, "lr": 2.181897089709913e-05, "epoch": 1.5519081932212435, "percentage": 77.6, "elapsed_time": "0:55:29", "remaining_time": "0:16:01"} +{"current_steps": 5820, "total_steps": 7494, "loss": 0.5812, "lr": 2.1695937781021736e-05, "epoch": 1.55324259407526, "percentage": 77.66, "elapsed_time": "0:56:11", "remaining_time": "0:16:09"} +{"current_steps": 5825, "total_steps": 7494, "loss": 0.5903, "lr": 2.1573193842606007e-05, "epoch": 1.5545769949292767, "percentage": 77.73, "elapsed_time": "0:57:13", "remaining_time": "0:16:23"} +{"current_steps": 5830, "total_steps": 7494, "loss": 0.5912, "lr": 2.1450739747745034e-05, "epoch": 1.5559113957832933, "percentage": 77.8, "elapsed_time": "0:57:47", "remaining_time": "0:16:29"} +{"current_steps": 5835, "total_steps": 7494, "loss": 0.5867, "lr": 2.1328576160759486e-05, "epoch": 1.5572457966373099, "percentage": 77.86, "elapsed_time": "0:58:21", "remaining_time": "0:16:35"} +{"current_steps": 5840, "total_steps": 7494, "loss": 0.6189, "lr": 2.1206703744393936e-05, "epoch": 1.5585801974913265, "percentage": 77.93, "elapsed_time": "0:59:23", "remaining_time": "0:16:49"} +{"current_steps": 5845, "total_steps": 7494, "loss": 0.5924, "lr": 2.1085123159813398e-05, "epoch": 1.559914598345343, "percentage": 78.0, "elapsed_time": "1:00:07", "remaining_time": "0:16:57"} +{"current_steps": 5850, "total_steps": 7494, "loss": 0.5842, "lr": 2.0963835066599703e-05, "epoch": 1.5612489991993594, "percentage": 78.06, "elapsed_time": "1:00:39", "remaining_time": "0:17:02"} +{"current_steps": 5855, "total_steps": 7494, "loss": 0.6054, "lr": 2.084284012274781e-05, "epoch": 1.562583400053376, "percentage": 78.13, "elapsed_time": "1:01:21", "remaining_time": "0:17:10"} +{"current_steps": 5860, "total_steps": 7494, "loss": 0.5818, "lr": 2.0722138984662415e-05, "epoch": 1.5639178009073926, "percentage": 78.2, "elapsed_time": "1:02:22", "remaining_time": "0:17:23"} +{"current_steps": 5865, "total_steps": 7494, "loss": 0.5926, "lr": 2.0601732307154283e-05, "epoch": 1.565252201761409, "percentage": 78.26, "elapsed_time": "1:02:57", "remaining_time": "0:17:29"} +{"current_steps": 5870, "total_steps": 7494, "loss": 0.5767, "lr": 2.048162074343665e-05, "epoch": 1.5665866026154256, "percentage": 78.33, "elapsed_time": "1:03:30", "remaining_time": "0:17:34"} +{"current_steps": 5875, "total_steps": 7494, "loss": 0.5886, "lr": 2.036180494512181e-05, "epoch": 1.5679210034694422, "percentage": 78.4, "elapsed_time": "1:04:27", "remaining_time": "0:17:45"} +{"current_steps": 5880, "total_steps": 7494, "loss": 0.6043, "lr": 2.024228556221752e-05, "epoch": 1.5692554043234588, "percentage": 78.46, "elapsed_time": "1:05:13", "remaining_time": "0:17:54"} +{"current_steps": 5885, "total_steps": 7494, "loss": 0.5994, "lr": 2.0123063243123395e-05, "epoch": 1.5705898051774754, "percentage": 78.53, "elapsed_time": "1:05:45", "remaining_time": "0:17:58"} +{"current_steps": 5890, "total_steps": 7494, "loss": 0.5866, "lr": 2.000413863462754e-05, "epoch": 1.571924206031492, "percentage": 78.6, "elapsed_time": "1:06:25", "remaining_time": "0:18:05"} +{"current_steps": 5895, "total_steps": 7494, "loss": 0.5792, "lr": 1.988551238190288e-05, "epoch": 1.5732586068855086, "percentage": 78.66, "elapsed_time": "1:07:29", "remaining_time": "0:18:18"} +{"current_steps": 5900, "total_steps": 7494, "loss": 0.5951, "lr": 1.9767185128503817e-05, "epoch": 1.574593007739525, "percentage": 78.73, "elapsed_time": "1:08:05", "remaining_time": "0:18:23"} +{"current_steps": 5905, "total_steps": 7494, "loss": 0.5988, "lr": 1.9649157516362663e-05, "epoch": 1.5759274085935415, "percentage": 78.8, "elapsed_time": "1:08:47", "remaining_time": "0:18:30"} +{"current_steps": 5910, "total_steps": 7494, "loss": 0.5936, "lr": 1.953143018578607e-05, "epoch": 1.577261809447558, "percentage": 78.86, "elapsed_time": "1:09:40", "remaining_time": "0:18:40"} +{"current_steps": 5915, "total_steps": 7494, "loss": 0.5975, "lr": 1.9414003775451754e-05, "epoch": 1.5785962103015745, "percentage": 78.93, "elapsed_time": "1:10:33", "remaining_time": "0:18:50"} +{"current_steps": 5920, "total_steps": 7494, "loss": 0.5988, "lr": 1.9296878922404868e-05, "epoch": 1.579930611155591, "percentage": 79.0, "elapsed_time": "1:11:07", "remaining_time": "0:18:54"} +{"current_steps": 5925, "total_steps": 7494, "loss": 0.5962, "lr": 1.9180056262054575e-05, "epoch": 1.5812650120096077, "percentage": 79.06, "elapsed_time": "1:11:44", "remaining_time": "0:18:59"} +{"current_steps": 5930, "total_steps": 7494, "loss": 0.5953, "lr": 1.9063536428170682e-05, "epoch": 1.5825994128636243, "percentage": 79.13, "elapsed_time": "1:12:48", "remaining_time": "0:19:12"} +{"current_steps": 5935, "total_steps": 7494, "loss": 0.5955, "lr": 1.8947320052880106e-05, "epoch": 1.5839338137176409, "percentage": 79.2, "elapsed_time": "1:13:28", "remaining_time": "0:19:18"} +{"current_steps": 5940, "total_steps": 7494, "loss": 0.6018, "lr": 1.8831407766663513e-05, "epoch": 1.5852682145716575, "percentage": 79.26, "elapsed_time": "1:14:01", "remaining_time": "0:19:21"} +{"current_steps": 5945, "total_steps": 7494, "loss": 0.5972, "lr": 1.8715800198351824e-05, "epoch": 1.5866026154256738, "percentage": 79.33, "elapsed_time": "1:14:51", "remaining_time": "0:19:30"} +{"current_steps": 5950, "total_steps": 7494, "loss": 0.5792, "lr": 1.8600497975122877e-05, "epoch": 1.5879370162796904, "percentage": 79.4, "elapsed_time": "1:15:49", "remaining_time": "0:19:40"} +{"current_steps": 5955, "total_steps": 7494, "loss": 0.5942, "lr": 1.8485501722498024e-05, "epoch": 1.589271417133707, "percentage": 79.46, "elapsed_time": "1:16:22", "remaining_time": "0:19:44"} +{"current_steps": 5960, "total_steps": 7494, "loss": 0.589, "lr": 1.8370812064338624e-05, "epoch": 1.5906058179877234, "percentage": 79.53, "elapsed_time": "1:16:59", "remaining_time": "0:19:48"} +{"current_steps": 5965, "total_steps": 7494, "loss": 0.5868, "lr": 1.8256429622842818e-05, "epoch": 1.59194021884174, "percentage": 79.6, "elapsed_time": "1:17:59", "remaining_time": "0:19:59"} +{"current_steps": 5970, "total_steps": 7494, "loss": 0.5879, "lr": 1.814235501854206e-05, "epoch": 1.5932746196957566, "percentage": 79.66, "elapsed_time": "1:18:43", "remaining_time": "0:20:05"} +{"current_steps": 5975, "total_steps": 7494, "loss": 0.5983, "lr": 1.8028588870297774e-05, "epoch": 1.5946090205497732, "percentage": 79.73, "elapsed_time": "1:19:15", "remaining_time": "0:20:09"} +{"current_steps": 5980, "total_steps": 7494, "loss": 0.5974, "lr": 1.7915131795297956e-05, "epoch": 1.5959434214037898, "percentage": 79.8, "elapsed_time": "1:19:59", "remaining_time": "0:20:15"} +{"current_steps": 5985, "total_steps": 7494, "loss": 0.5891, "lr": 1.7801984409053897e-05, "epoch": 1.5972778222578063, "percentage": 79.86, "elapsed_time": "1:21:03", "remaining_time": "0:20:26"} +{"current_steps": 5990, "total_steps": 7494, "loss": 0.5892, "lr": 1.7689147325396822e-05, "epoch": 1.598612223111823, "percentage": 79.93, "elapsed_time": "1:21:40", "remaining_time": "0:20:30"} +{"current_steps": 5995, "total_steps": 7494, "loss": 0.6015, "lr": 1.757662115647448e-05, "epoch": 1.5999466239658393, "percentage": 80.0, "elapsed_time": "1:22:14", "remaining_time": "0:20:33"} +{"current_steps": 6000, "total_steps": 7494, "loss": 0.5953, "lr": 1.7464406512747964e-05, "epoch": 1.601281024819856, "percentage": 80.06, "elapsed_time": "1:23:13", "remaining_time": "0:20:43"} +{"current_steps": 6005, "total_steps": 7494, "loss": 0.5993, "lr": 1.7352504002988303e-05, "epoch": 1.6026154256738723, "percentage": 80.13, "elapsed_time": "1:24:14", "remaining_time": "0:20:53"} +{"current_steps": 6010, "total_steps": 7494, "loss": 0.6101, "lr": 1.7240914234273126e-05, "epoch": 1.6039498265278889, "percentage": 80.2, "elapsed_time": "1:24:47", "remaining_time": "0:20:56"} +{"current_steps": 6015, "total_steps": 7494, "loss": 0.5892, "lr": 1.7129637811983507e-05, "epoch": 1.6052842273819055, "percentage": 80.26, "elapsed_time": "1:25:28", "remaining_time": "0:21:00"} +{"current_steps": 6020, "total_steps": 7494, "loss": 0.5985, "lr": 1.7018675339800557e-05, "epoch": 1.606618628235922, "percentage": 80.33, "elapsed_time": "1:26:31", "remaining_time": "0:21:11"} +{"current_steps": 6025, "total_steps": 7494, "loss": 0.5916, "lr": 1.690802741970217e-05, "epoch": 1.6079530290899386, "percentage": 80.4, "elapsed_time": "1:27:13", "remaining_time": "0:21:15"} +{"current_steps": 6030, "total_steps": 7494, "loss": 0.5843, "lr": 1.6797694651959806e-05, "epoch": 1.6092874299439552, "percentage": 80.46, "elapsed_time": "1:27:47", "remaining_time": "0:21:18"} +{"current_steps": 6035, "total_steps": 7494, "loss": 0.6001, "lr": 1.6687677635135218e-05, "epoch": 1.6106218307979718, "percentage": 80.53, "elapsed_time": "1:28:39", "remaining_time": "0:21:26"} +{"current_steps": 6040, "total_steps": 7494, "loss": 0.6013, "lr": 1.657797696607714e-05, "epoch": 1.6119562316519882, "percentage": 80.6, "elapsed_time": "1:29:36", "remaining_time": "0:21:34"} +{"current_steps": 6045, "total_steps": 7494, "loss": 0.6014, "lr": 1.6468593239918136e-05, "epoch": 1.6132906325060048, "percentage": 80.66, "elapsed_time": "1:31:23", "remaining_time": "0:21:54"} +{"current_steps": 6050, "total_steps": 7494, "loss": 0.5872, "lr": 1.635952705007136e-05, "epoch": 1.6146250333600214, "percentage": 80.73, "elapsed_time": "1:32:27", "remaining_time": "0:22:04"} +{"current_steps": 6055, "total_steps": 7494, "loss": 0.606, "lr": 1.6250778988227248e-05, "epoch": 1.6159594342140378, "percentage": 80.8, "elapsed_time": "1:35:08", "remaining_time": "0:22:36"} +{"current_steps": 6060, "total_steps": 7494, "loss": 0.5827, "lr": 1.614234964435044e-05, "epoch": 1.6172938350680544, "percentage": 80.86, "elapsed_time": "1:36:46", "remaining_time": "0:22:54"} +{"current_steps": 6065, "total_steps": 7494, "loss": 0.597, "lr": 1.603423960667645e-05, "epoch": 1.618628235922071, "percentage": 80.93, "elapsed_time": "1:37:54", "remaining_time": "0:23:04"} +{"current_steps": 6070, "total_steps": 7494, "loss": 0.6014, "lr": 1.5926449461708577e-05, "epoch": 1.6199626367760875, "percentage": 81.0, "elapsed_time": "1:39:07", "remaining_time": "0:23:15"} +{"current_steps": 6075, "total_steps": 7494, "loss": 0.5997, "lr": 1.581897979421471e-05, "epoch": 1.6212970376301041, "percentage": 81.06, "elapsed_time": "1:41:01", "remaining_time": "0:23:35"} +{"current_steps": 6080, "total_steps": 7494, "loss": 0.5958, "lr": 1.571183118722405e-05, "epoch": 1.6226314384841207, "percentage": 81.13, "elapsed_time": "1:42:03", "remaining_time": "0:23:44"} +{"current_steps": 6085, "total_steps": 7494, "loss": 0.6005, "lr": 1.5605004222024074e-05, "epoch": 1.6239658393381373, "percentage": 81.2, "elapsed_time": "1:43:29", "remaining_time": "0:23:57"} +{"current_steps": 6090, "total_steps": 7494, "loss": 0.6004, "lr": 1.549849947815737e-05, "epoch": 1.6253002401921537, "percentage": 81.27, "elapsed_time": "1:44:24", "remaining_time": "0:24:04"} +{"current_steps": 6095, "total_steps": 7494, "loss": 0.6025, "lr": 1.5392317533418366e-05, "epoch": 1.6266346410461703, "percentage": 81.33, "elapsed_time": "1:46:25", "remaining_time": "0:24:25"} +{"current_steps": 6100, "total_steps": 7494, "loss": 0.5856, "lr": 1.5286458963850363e-05, "epoch": 1.6279690419001867, "percentage": 81.4, "elapsed_time": "1:47:51", "remaining_time": "0:24:38"} +{"current_steps": 6105, "total_steps": 7494, "loss": 0.5891, "lr": 1.5180924343742316e-05, "epoch": 1.6293034427542032, "percentage": 81.47, "elapsed_time": "1:48:41", "remaining_time": "0:24:43"} +{"current_steps": 6110, "total_steps": 7494, "loss": 0.5782, "lr": 1.5075714245625689e-05, "epoch": 1.6306378436082198, "percentage": 81.53, "elapsed_time": "1:50:31", "remaining_time": "0:25:02"} +{"current_steps": 6115, "total_steps": 7494, "loss": 0.5857, "lr": 1.4970829240271448e-05, "epoch": 1.6319722444622364, "percentage": 81.6, "elapsed_time": "1:52:19", "remaining_time": "0:25:19"} +{"current_steps": 6120, "total_steps": 7494, "loss": 0.623, "lr": 1.4866269896686917e-05, "epoch": 1.633306645316253, "percentage": 81.67, "elapsed_time": "1:52:54", "remaining_time": "0:25:21"} +{"current_steps": 6125, "total_steps": 7494, "loss": 0.5999, "lr": 1.4762036782112624e-05, "epoch": 1.6346410461702696, "percentage": 81.73, "elapsed_time": "1:54:18", "remaining_time": "0:25:32"} +{"current_steps": 6105, "total_steps": 7494, "loss": 0.5891, "lr": 1.5180924343742316e-05, "epoch": 1.6293034427542032, "percentage": 81.47, "elapsed_time": "0:18:42", "remaining_time": "0:04:15"} +{"current_steps": 6110, "total_steps": 7494, "loss": 0.5782, "lr": 1.5075714245625689e-05, "epoch": 1.6306378436082198, "percentage": 81.53, "elapsed_time": "0:20:55", "remaining_time": "0:04:44"} +{"current_steps": 6115, "total_steps": 7494, "loss": 0.5857, "lr": 1.4970829240271448e-05, "epoch": 1.6319722444622364, "percentage": 81.6, "elapsed_time": "0:22:49", "remaining_time": "0:05:08"} +{"current_steps": 6120, "total_steps": 7494, "loss": 0.623, "lr": 1.4866269896686917e-05, "epoch": 1.633306645316253, "percentage": 81.67, "elapsed_time": "0:26:16", "remaining_time": "0:05:53"} +{"current_steps": 6125, "total_steps": 7494, "loss": 0.5999, "lr": 1.4762036782112624e-05, "epoch": 1.6346410461702696, "percentage": 81.73, "elapsed_time": "0:27:17", "remaining_time": "0:06:06"} +{"current_steps": 6130, "total_steps": 7494, "loss": 0.5883, "lr": 1.465813046201934e-05, "epoch": 1.6359754470242862, "percentage": 81.8, "elapsed_time": "0:29:34", "remaining_time": "0:06:34"} +{"current_steps": 6135, "total_steps": 7494, "loss": 0.5915, "lr": 1.4554551500104971e-05, "epoch": 1.6373098478783028, "percentage": 81.87, "elapsed_time": "0:32:12", "remaining_time": "0:07:08"} +{"current_steps": 6140, "total_steps": 7494, "loss": 0.5957, "lr": 1.4451300458291401e-05, "epoch": 1.6386442487323192, "percentage": 81.93, "elapsed_time": "0:32:54", "remaining_time": "0:07:15"} +{"current_steps": 6145, "total_steps": 7494, "loss": 0.588, "lr": 1.4348377896721635e-05, "epoch": 1.6399786495863358, "percentage": 82.0, "elapsed_time": "0:33:36", "remaining_time": "0:07:22"} +{"current_steps": 6150, "total_steps": 7494, "loss": 0.594, "lr": 1.4245784373756566e-05, "epoch": 1.6413130504403521, "percentage": 82.07, "elapsed_time": "0:36:30", "remaining_time": "0:07:58"} +{"current_steps": 6155, "total_steps": 7494, "loss": 0.6001, "lr": 1.4143520445972078e-05, "epoch": 1.6426474512943687, "percentage": 82.13, "elapsed_time": "0:37:10", "remaining_time": "0:08:05"} +{"current_steps": 6160, "total_steps": 7494, "loss": 0.6001, "lr": 1.4041586668155989e-05, "epoch": 1.6439818521483853, "percentage": 82.2, "elapsed_time": "0:37:47", "remaining_time": "0:08:11"} +{"current_steps": 6165, "total_steps": 7494, "loss": 0.5753, "lr": 1.3939983593304992e-05, "epoch": 1.645316253002402, "percentage": 82.27, "elapsed_time": "0:38:43", "remaining_time": "0:08:20"} +{"current_steps": 6170, "total_steps": 7494, "loss": 0.5935, "lr": 1.3838711772621743e-05, "epoch": 1.6466506538564185, "percentage": 82.33, "elapsed_time": "0:39:27", "remaining_time": "0:08:28"} +{"current_steps": 6175, "total_steps": 7494, "loss": 0.5997, "lr": 1.3737771755511811e-05, "epoch": 1.647985054710435, "percentage": 82.4, "elapsed_time": "0:40:02", "remaining_time": "0:08:33"} +{"current_steps": 6180, "total_steps": 7494, "loss": 0.5884, "lr": 1.3637164089580673e-05, "epoch": 1.6493194555644517, "percentage": 82.47, "elapsed_time": "0:40:40", "remaining_time": "0:08:38"} +{"current_steps": 6185, "total_steps": 7494, "loss": 0.5965, "lr": 1.3536889320630841e-05, "epoch": 1.650653856418468, "percentage": 82.53, "elapsed_time": "0:42:04", "remaining_time": "0:08:54"} +{"current_steps": 6190, "total_steps": 7494, "loss": 0.58, "lr": 1.3436947992658814e-05, "epoch": 1.6519882572724847, "percentage": 82.6, "elapsed_time": "0:43:03", "remaining_time": "0:09:04"} +{"current_steps": 6195, "total_steps": 7494, "loss": 0.594, "lr": 1.3337340647852135e-05, "epoch": 1.6533226581265013, "percentage": 82.67, "elapsed_time": "0:43:37", "remaining_time": "0:09:08"} +{"current_steps": 6200, "total_steps": 7494, "loss": 0.5991, "lr": 1.3238067826586491e-05, "epoch": 1.6546570589805176, "percentage": 82.73, "elapsed_time": "0:44:42", "remaining_time": "0:09:19"} +{"current_steps": 6205, "total_steps": 7494, "loss": 0.5967, "lr": 1.3139130067422792e-05, "epoch": 1.6559914598345342, "percentage": 82.8, "elapsed_time": "0:45:27", "remaining_time": "0:09:26"} +{"current_steps": 6210, "total_steps": 7494, "loss": 0.6057, "lr": 1.3040527907104126e-05, "epoch": 1.6573258606885508, "percentage": 82.87, "elapsed_time": "0:46:02", "remaining_time": "0:09:31"} +{"current_steps": 6215, "total_steps": 7494, "loss": 0.5899, "lr": 1.2942261880553012e-05, "epoch": 1.6586602615425674, "percentage": 82.93, "elapsed_time": "0:46:57", "remaining_time": "0:09:39"} +{"current_steps": 6220, "total_steps": 7494, "loss": 0.5864, "lr": 1.2844332520868433e-05, "epoch": 1.659994662396584, "percentage": 83.0, "elapsed_time": "0:47:41", "remaining_time": "0:09:46"} +{"current_steps": 6225, "total_steps": 7494, "loss": 0.5995, "lr": 1.2746740359322857e-05, "epoch": 1.6613290632506006, "percentage": 83.07, "elapsed_time": "0:48:15", "remaining_time": "0:09:50"} +{"current_steps": 6230, "total_steps": 7494, "loss": 0.6006, "lr": 1.2649485925359514e-05, "epoch": 1.6626634641046172, "percentage": 83.13, "elapsed_time": "0:48:52", "remaining_time": "0:09:54"} +{"current_steps": 6235, "total_steps": 7494, "loss": 0.5825, "lr": 1.2552569746589386e-05, "epoch": 1.6639978649586336, "percentage": 83.2, "elapsed_time": "0:49:55", "remaining_time": "0:10:04"} +{"current_steps": 6240, "total_steps": 7494, "loss": 0.5871, "lr": 1.245599234878846e-05, "epoch": 1.6653322658126501, "percentage": 83.27, "elapsed_time": "0:50:30", "remaining_time": "0:10:08"} +{"current_steps": 6245, "total_steps": 7494, "loss": 0.5959, "lr": 1.2359754255894737e-05, "epoch": 1.6666666666666665, "percentage": 83.33, "elapsed_time": "0:51:04", "remaining_time": "0:10:12"} +{"current_steps": 6250, "total_steps": 7494, "loss": 0.6018, "lr": 1.2263855990005527e-05, "epoch": 1.6680010675206831, "percentage": 83.4, "elapsed_time": "0:52:11", "remaining_time": "0:10:23"} +{"current_steps": 6255, "total_steps": 7494, "loss": 0.5963, "lr": 1.2168298071374543e-05, "epoch": 1.6693354683746997, "percentage": 83.47, "elapsed_time": "0:52:47", "remaining_time": "0:10:27"} +{"current_steps": 6260, "total_steps": 7494, "loss": 0.5883, "lr": 1.2073081018409112e-05, "epoch": 1.6706698692287163, "percentage": 83.53, "elapsed_time": "0:53:21", "remaining_time": "0:10:31"} +{"current_steps": 6265, "total_steps": 7494, "loss": 0.5954, "lr": 1.1978205347667303e-05, "epoch": 1.672004270082733, "percentage": 83.6, "elapsed_time": "0:54:09", "remaining_time": "0:10:37"} +{"current_steps": 6270, "total_steps": 7494, "loss": 0.5923, "lr": 1.1883671573855186e-05, "epoch": 1.6733386709367495, "percentage": 83.67, "elapsed_time": "0:55:02", "remaining_time": "0:10:44"} +{"current_steps": 6275, "total_steps": 7494, "loss": 0.5835, "lr": 1.1789480209824064e-05, "epoch": 1.674673071790766, "percentage": 83.73, "elapsed_time": "0:55:35", "remaining_time": "0:10:48"} +{"current_steps": 6280, "total_steps": 7494, "loss": 0.593, "lr": 1.1695631766567562e-05, "epoch": 1.6760074726447824, "percentage": 83.8, "elapsed_time": "0:56:10", "remaining_time": "0:10:51"} +{"current_steps": 6285, "total_steps": 7494, "loss": 0.5815, "lr": 1.1602126753219005e-05, "epoch": 1.677341873498799, "percentage": 83.87, "elapsed_time": "0:57:15", "remaining_time": "0:11:00"} +{"current_steps": 6290, "total_steps": 7494, "loss": 0.5976, "lr": 1.1508965677048585e-05, "epoch": 1.6786762743528156, "percentage": 83.93, "elapsed_time": "0:57:50", "remaining_time": "0:11:04"} +{"current_steps": 6295, "total_steps": 7494, "loss": 0.5845, "lr": 1.1416149043460562e-05, "epoch": 1.680010675206832, "percentage": 84.0, "elapsed_time": "0:58:24", "remaining_time": "0:11:07"} +{"current_steps": 6300, "total_steps": 7494, "loss": 0.6126, "lr": 1.132367735599066e-05, "epoch": 1.6813450760608486, "percentage": 84.07, "elapsed_time": "0:59:21", "remaining_time": "0:11:14"} +{"current_steps": 6305, "total_steps": 7494, "loss": 0.6014, "lr": 1.1231551116303162e-05, "epoch": 1.6826794769148652, "percentage": 84.13, "elapsed_time": "1:00:21", "remaining_time": "0:11:22"} +{"current_steps": 6310, "total_steps": 7494, "loss": 0.5883, "lr": 1.1139770824188334e-05, "epoch": 1.6840138777688818, "percentage": 84.2, "elapsed_time": "1:00:55", "remaining_time": "0:11:25"} +{"current_steps": 6315, "total_steps": 7494, "loss": 0.5877, "lr": 1.1048336977559666e-05, "epoch": 1.6853482786228984, "percentage": 84.27, "elapsed_time": "1:01:32", "remaining_time": "0:11:29"} +{"current_steps": 6320, "total_steps": 7494, "loss": 0.5978, "lr": 1.0957250072451084e-05, "epoch": 1.686682679476915, "percentage": 84.33, "elapsed_time": "1:02:39", "remaining_time": "0:11:38"} +{"current_steps": 6325, "total_steps": 7494, "loss": 0.6023, "lr": 1.0866510603014411e-05, "epoch": 1.6880170803309316, "percentage": 84.4, "elapsed_time": "1:03:14", "remaining_time": "0:11:41"} +{"current_steps": 6330, "total_steps": 7494, "loss": 0.598, "lr": 1.0776119061516613e-05, "epoch": 1.689351481184948, "percentage": 84.47, "elapsed_time": "1:03:48", "remaining_time": "0:11:43"} +{"current_steps": 6335, "total_steps": 7494, "loss": 0.5717, "lr": 1.0686075938337055e-05, "epoch": 1.6906858820389645, "percentage": 84.53, "elapsed_time": "1:04:51", "remaining_time": "0:11:52"} +{"current_steps": 6340, "total_steps": 7494, "loss": 0.6042, "lr": 1.0596381721964984e-05, "epoch": 1.692020282892981, "percentage": 84.6, "elapsed_time": "1:05:34", "remaining_time": "0:11:56"} +{"current_steps": 6345, "total_steps": 7494, "loss": 0.5825, "lr": 1.0507036898996787e-05, "epoch": 1.6933546837469975, "percentage": 84.67, "elapsed_time": "1:06:08", "remaining_time": "0:11:58"} +{"current_steps": 6350, "total_steps": 7494, "loss": 0.5914, "lr": 1.0418041954133346e-05, "epoch": 1.694689084601014, "percentage": 84.73, "elapsed_time": "1:06:50", "remaining_time": "0:12:02"} +{"current_steps": 6355, "total_steps": 7494, "loss": 0.5974, "lr": 1.032939737017745e-05, "epoch": 1.6960234854550307, "percentage": 84.8, "elapsed_time": "1:07:55", "remaining_time": "0:12:10"} +{"current_steps": 6360, "total_steps": 7494, "loss": 0.6183, "lr": 1.02411036280312e-05, "epoch": 1.6973578863090473, "percentage": 84.87, "elapsed_time": "1:08:29", "remaining_time": "0:12:12"} +{"current_steps": 6365, "total_steps": 7494, "loss": 0.5929, "lr": 1.0153161206693269e-05, "epoch": 1.6986922871630639, "percentage": 84.93, "elapsed_time": "1:09:03", "remaining_time": "0:12:14"} +{"current_steps": 6370, "total_steps": 7494, "loss": 0.5928, "lr": 1.0065570583256483e-05, "epoch": 1.7000266880170805, "percentage": 85.0, "elapsed_time": "1:10:06", "remaining_time": "0:12:22"} +{"current_steps": 6375, "total_steps": 7494, "loss": 0.5857, "lr": 9.978332232905114e-06, "epoch": 1.7013610888710968, "percentage": 85.07, "elapsed_time": "1:10:47", "remaining_time": "0:12:25"} +{"current_steps": 6380, "total_steps": 7494, "loss": 0.5944, "lr": 9.891446628912286e-06, "epoch": 1.7026954897251134, "percentage": 85.13, "elapsed_time": "1:11:22", "remaining_time": "0:12:27"} +{"current_steps": 6385, "total_steps": 7494, "loss": 0.5906, "lr": 9.804914242637541e-06, "epoch": 1.70402989057913, "percentage": 85.2, "elapsed_time": "1:12:05", "remaining_time": "0:12:31"} +{"current_steps": 6390, "total_steps": 7494, "loss": 0.5894, "lr": 9.718735543524103e-06, "epoch": 1.7053642914331464, "percentage": 85.27, "elapsed_time": "1:13:06", "remaining_time": "0:12:37"} +{"current_steps": 6395, "total_steps": 7494, "loss": 0.6003, "lr": 9.632910999096486e-06, "epoch": 1.706698692287163, "percentage": 85.33, "elapsed_time": "1:13:39", "remaining_time": "0:12:39"} +{"current_steps": 6400, "total_steps": 7494, "loss": 0.5922, "lr": 9.547441074957884e-06, "epoch": 1.7080330931411796, "percentage": 85.4, "elapsed_time": "1:14:13", "remaining_time": "0:12:41"} +{"current_steps": 6405, "total_steps": 7494, "loss": 0.5889, "lr": 9.462326234787621e-06, "epoch": 1.7093674939951962, "percentage": 85.47, "elapsed_time": "1:15:31", "remaining_time": "0:12:50"} +{"current_steps": 6410, "total_steps": 7494, "loss": 0.6031, "lr": 9.377566940338712e-06, "epoch": 1.7107018948492128, "percentage": 85.54, "elapsed_time": "1:16:15", "remaining_time": "0:12:53"} +{"current_steps": 6415, "total_steps": 7494, "loss": 0.5884, "lr": 9.293163651435298e-06, "epoch": 1.7120362957032293, "percentage": 85.6, "elapsed_time": "1:16:49", "remaining_time": "0:12:55"} +{"current_steps": 6420, "total_steps": 7494, "loss": 0.5808, "lr": 9.20911682597015e-06, "epoch": 1.713370696557246, "percentage": 85.67, "elapsed_time": "1:17:33", "remaining_time": "0:12:58"} +{"current_steps": 6425, "total_steps": 7494, "loss": 0.5697, "lr": 9.125426919902231e-06, "epoch": 1.7147050974112623, "percentage": 85.74, "elapsed_time": "1:18:35", "remaining_time": "0:13:04"} +{"current_steps": 6430, "total_steps": 7494, "loss": 0.5929, "lr": 9.042094387254212e-06, "epoch": 1.716039498265279, "percentage": 85.8, "elapsed_time": "1:19:09", "remaining_time": "0:13:05"} +{"current_steps": 6435, "total_steps": 7494, "loss": 0.5859, "lr": 8.959119680109918e-06, "epoch": 1.7173738991192953, "percentage": 85.87, "elapsed_time": "1:19:44", "remaining_time": "0:13:07"} +{"current_steps": 6440, "total_steps": 7494, "loss": 0.5943, "lr": 8.876503248612036e-06, "epoch": 1.7187082999733119, "percentage": 85.94, "elapsed_time": "1:20:48", "remaining_time": "0:13:13"} +{"current_steps": 6445, "total_steps": 7494, "loss": 0.5937, "lr": 8.794245540959546e-06, "epoch": 1.7200427008273285, "percentage": 86.0, "elapsed_time": "1:21:33", "remaining_time": "0:13:16"} +{"current_steps": 6450, "total_steps": 7494, "loss": 0.5809, "lr": 8.712347003405304e-06, "epoch": 1.721377101681345, "percentage": 86.07, "elapsed_time": "1:22:07", "remaining_time": "0:13:17"} +{"current_steps": 6455, "total_steps": 7494, "loss": 0.5871, "lr": 8.630808080253701e-06, "epoch": 1.7227115025353616, "percentage": 86.14, "elapsed_time": "1:22:52", "remaining_time": "0:13:20"} +{"current_steps": 6460, "total_steps": 7494, "loss": 0.591, "lr": 8.549629213858192e-06, "epoch": 1.7240459033893782, "percentage": 86.2, "elapsed_time": "1:23:55", "remaining_time": "0:13:26"} +{"current_steps": 6465, "total_steps": 7494, "loss": 0.5991, "lr": 8.468810844618842e-06, "epoch": 1.7253803042433948, "percentage": 86.27, "elapsed_time": "1:24:31", "remaining_time": "0:13:27"} +{"current_steps": 6470, "total_steps": 7494, "loss": 0.5931, "lr": 8.388353410980075e-06, "epoch": 1.7267147050974114, "percentage": 86.34, "elapsed_time": "1:25:06", "remaining_time": "0:13:28"} +{"current_steps": 6475, "total_steps": 7494, "loss": 0.5873, "lr": 8.308257349428154e-06, "epoch": 1.7280491059514278, "percentage": 86.4, "elapsed_time": "1:26:06", "remaining_time": "0:13:33"} +{"current_steps": 6480, "total_steps": 7494, "loss": 0.5853, "lr": 8.228523094488928e-06, "epoch": 1.7293835068054444, "percentage": 86.47, "elapsed_time": "1:26:54", "remaining_time": "0:13:36"} +{"current_steps": 6485, "total_steps": 7494, "loss": 0.6017, "lr": 8.149151078725416e-06, "epoch": 1.7307179076594608, "percentage": 86.54, "elapsed_time": "1:27:28", "remaining_time": "0:13:36"} +{"current_steps": 6490, "total_steps": 7494, "loss": 0.5879, "lr": 8.070141732735424e-06, "epoch": 1.7320523085134774, "percentage": 86.6, "elapsed_time": "1:28:10", "remaining_time": "0:13:38"} +{"current_steps": 6495, "total_steps": 7494, "loss": 0.5977, "lr": 7.991495485149294e-06, "epoch": 1.733386709367494, "percentage": 86.67, "elapsed_time": "1:29:15", "remaining_time": "0:13:43"} +{"current_steps": 6500, "total_steps": 7494, "loss": 0.5965, "lr": 7.913212762627539e-06, "epoch": 1.7347211102215105, "percentage": 86.74, "elapsed_time": "1:29:52", "remaining_time": "0:13:44"} +{"current_steps": 6505, "total_steps": 7494, "loss": 0.5932, "lr": 7.835293989858527e-06, "epoch": 1.7360555110755271, "percentage": 86.8, "elapsed_time": "1:30:40", "remaining_time": "0:13:47"} +{"current_steps": 6510, "total_steps": 7494, "loss": 0.5827, "lr": 7.75773958955614e-06, "epoch": 1.7373899119295437, "percentage": 86.87, "elapsed_time": "1:31:39", "remaining_time": "0:13:51"} +{"current_steps": 6515, "total_steps": 7494, "loss": 0.5967, "lr": 7.680549982457553e-06, "epoch": 1.7387243127835603, "percentage": 86.94, "elapsed_time": "1:32:31", "remaining_time": "0:13:54"} +{"current_steps": 6520, "total_steps": 7494, "loss": 0.604, "lr": 7.6037255873209165e-06, "epoch": 1.7400587136375767, "percentage": 87.0, "elapsed_time": "1:33:05", "remaining_time": "0:13:54"} +{"current_steps": 6525, "total_steps": 7494, "loss": 0.5963, "lr": 7.527266820923089e-06, "epoch": 1.7413931144915933, "percentage": 87.07, "elapsed_time": "1:33:45", "remaining_time": "0:13:55"} +{"current_steps": 6530, "total_steps": 7494, "loss": 0.5928, "lr": 7.45117409805733e-06, "epoch": 1.7427275153456097, "percentage": 87.14, "elapsed_time": "1:34:50", "remaining_time": "0:14:00"} +{"current_steps": 6535, "total_steps": 7494, "loss": 0.5901, "lr": 7.375447831531128e-06, "epoch": 1.7440619161996262, "percentage": 87.2, "elapsed_time": "1:35:29", "remaining_time": "0:14:00"} +{"current_steps": 6540, "total_steps": 7494, "loss": 0.5914, "lr": 7.300088432163945e-06, "epoch": 1.7453963170536428, "percentage": 87.27, "elapsed_time": "1:36:04", "remaining_time": "0:14:00"} +{"current_steps": 6545, "total_steps": 7494, "loss": 0.5722, "lr": 7.2250963087849e-06, "epoch": 1.7467307179076594, "percentage": 87.34, "elapsed_time": "1:36:55", "remaining_time": "0:14:03"} +{"current_steps": 6550, "total_steps": 7494, "loss": 0.5961, "lr": 7.1504718682306754e-06, "epoch": 1.748065118761676, "percentage": 87.4, "elapsed_time": "1:37:54", "remaining_time": "0:14:06"} +{"current_steps": 6555, "total_steps": 7494, "loss": 0.5846, "lr": 7.076215515343256e-06, "epoch": 1.7493995196156926, "percentage": 87.47, "elapsed_time": "1:38:29", "remaining_time": "0:14:06"} +{"current_steps": 6560, "total_steps": 7494, "loss": 0.6116, "lr": 7.0023276529676655e-06, "epoch": 1.7507339204697092, "percentage": 87.54, "elapsed_time": "1:39:09", "remaining_time": "0:14:07"} +{"current_steps": 6565, "total_steps": 7494, "loss": 0.5868, "lr": 6.928808681949919e-06, "epoch": 1.7520683213237258, "percentage": 87.6, "elapsed_time": "1:40:11", "remaining_time": "0:14:10"} +{"current_steps": 6570, "total_steps": 7494, "loss": 0.6064, "lr": 6.855659001134739e-06, "epoch": 1.7534027221777422, "percentage": 87.67, "elapsed_time": "1:40:55", "remaining_time": "0:14:11"} +{"current_steps": 6575, "total_steps": 7494, "loss": 0.5873, "lr": 6.78287900736342e-06, "epoch": 1.7547371230317588, "percentage": 87.74, "elapsed_time": "1:41:28", "remaining_time": "0:14:11"} +{"current_steps": 6580, "total_steps": 7494, "loss": 0.583, "lr": 6.710469095471701e-06, "epoch": 1.7560715238857751, "percentage": 87.8, "elapsed_time": "1:42:18", "remaining_time": "0:14:12"} +{"current_steps": 6585, "total_steps": 7494, "loss": 0.591, "lr": 6.638429658287603e-06, "epoch": 1.7574059247397917, "percentage": 87.87, "elapsed_time": "1:43:19", "remaining_time": "0:14:15"} +{"current_steps": 6590, "total_steps": 7494, "loss": 0.5869, "lr": 6.566761086629285e-06, "epoch": 1.7587403255938083, "percentage": 87.94, "elapsed_time": "1:43:56", "remaining_time": "0:14:15"} +{"current_steps": 6595, "total_steps": 7494, "loss": 0.5977, "lr": 6.495463769302952e-06, "epoch": 1.760074726447825, "percentage": 88.0, "elapsed_time": "1:44:33", "remaining_time": "0:14:15"} +{"current_steps": 6600, "total_steps": 7494, "loss": 0.6004, "lr": 6.424538093100745e-06, "epoch": 1.7614091273018415, "percentage": 88.07, "elapsed_time": "1:45:31", "remaining_time": "0:14:17"} +{"current_steps": 6605, "total_steps": 7494, "loss": 0.5969, "lr": 6.353984442798582e-06, "epoch": 1.762743528155858, "percentage": 88.14, "elapsed_time": "1:46:31", "remaining_time": "0:14:20"} +{"current_steps": 6610, "total_steps": 7494, "loss": 0.5831, "lr": 6.283803201154173e-06, "epoch": 1.7640779290098747, "percentage": 88.2, "elapsed_time": "1:47:06", "remaining_time": "0:14:19"} +{"current_steps": 6615, "total_steps": 7494, "loss": 0.5882, "lr": 6.213994748904866e-06, "epoch": 1.765412329863891, "percentage": 88.27, "elapsed_time": "1:47:49", "remaining_time": "0:14:19"} +{"current_steps": 6620, "total_steps": 7494, "loss": 0.5923, "lr": 6.144559464765605e-06, "epoch": 1.7667467307179077, "percentage": 88.34, "elapsed_time": "1:48:55", "remaining_time": "0:14:22"} +{"current_steps": 6625, "total_steps": 7494, "loss": 0.5955, "lr": 6.075497725426862e-06, "epoch": 1.7680811315719243, "percentage": 88.4, "elapsed_time": "1:49:35", "remaining_time": "0:14:22"} +{"current_steps": 6630, "total_steps": 7494, "loss": 0.6022, "lr": 6.0068099055526505e-06, "epoch": 1.7694155324259406, "percentage": 88.47, "elapsed_time": "1:50:10", "remaining_time": "0:14:21"} +{"current_steps": 6635, "total_steps": 7494, "loss": 0.5987, "lr": 5.938496377778395e-06, "epoch": 1.7707499332799572, "percentage": 88.54, "elapsed_time": "1:51:03", "remaining_time": "0:14:22"} +{"current_steps": 6640, "total_steps": 7494, "loss": 0.5945, "lr": 5.870557512709001e-06, "epoch": 1.7720843341339738, "percentage": 88.6, "elapsed_time": "1:51:59", "remaining_time": "0:14:24"} +{"current_steps": 6645, "total_steps": 7494, "loss": 0.6031, "lr": 5.802993678916773e-06, "epoch": 1.7734187349879904, "percentage": 88.67, "elapsed_time": "1:52:35", "remaining_time": "0:14:23"} +{"current_steps": 6650, "total_steps": 7494, "loss": 0.5958, "lr": 5.7358052429394785e-06, "epoch": 1.774753135842007, "percentage": 88.74, "elapsed_time": "1:53:14", "remaining_time": "0:14:22"} +{"current_steps": 6655, "total_steps": 7494, "loss": 0.5946, "lr": 5.668992569278347e-06, "epoch": 1.7760875366960236, "percentage": 88.8, "elapsed_time": "1:54:15", "remaining_time": "0:14:24"} +{"current_steps": 6660, "total_steps": 7494, "loss": 0.5753, "lr": 5.602556020396004e-06, "epoch": 1.7774219375500402, "percentage": 88.87, "elapsed_time": "1:55:03", "remaining_time": "0:14:24"} +{"current_steps": 6665, "total_steps": 7494, "loss": 0.5938, "lr": 5.5364959567146514e-06, "epoch": 1.7787563384040566, "percentage": 88.94, "elapsed_time": "1:55:37", "remaining_time": "0:14:22"} +{"current_steps": 6670, "total_steps": 7494, "loss": 0.5976, "lr": 5.470812736614014e-06, "epoch": 1.7800907392580732, "percentage": 89.0, "elapsed_time": "1:56:25", "remaining_time": "0:14:22"} +{"current_steps": 6675, "total_steps": 7494, "loss": 0.5907, "lr": 5.405506716429378e-06, "epoch": 1.7814251401120895, "percentage": 89.07, "elapsed_time": "1:57:26", "remaining_time": "0:14:24"} +{"current_steps": 6680, "total_steps": 7494, "loss": 0.5768, "lr": 5.340578250449742e-06, "epoch": 1.7827595409661061, "percentage": 89.14, "elapsed_time": "1:58:07", "remaining_time": "0:14:23"} +{"current_steps": 6685, "total_steps": 7494, "loss": 0.604, "lr": 5.276027690915868e-06, "epoch": 1.7840939418201227, "percentage": 89.2, "elapsed_time": "1:58:43", "remaining_time": "0:14:22"} +{"current_steps": 6690, "total_steps": 7494, "loss": 0.6026, "lr": 5.211855388018282e-06, "epoch": 1.7854283426741393, "percentage": 89.27, "elapsed_time": "1:59:35", "remaining_time": "0:14:22"} +{"current_steps": 6695, "total_steps": 7494, "loss": 0.6054, "lr": 5.148061689895519e-06, "epoch": 1.786762743528156, "percentage": 89.34, "elapsed_time": "2:00:32", "remaining_time": "0:14:23"} +{"current_steps": 6700, "total_steps": 7494, "loss": 0.5845, "lr": 5.084646942632123e-06, "epoch": 1.7880971443821725, "percentage": 89.4, "elapsed_time": "2:01:08", "remaining_time": "0:14:21"} +{"current_steps": 6705, "total_steps": 7494, "loss": 0.5873, "lr": 5.0216114902567995e-06, "epoch": 1.789431545236189, "percentage": 89.47, "elapsed_time": "2:02:04", "remaining_time": "0:14:21"} +{"current_steps": 6710, "total_steps": 7494, "loss": 0.5838, "lr": 4.9589556747406e-06, "epoch": 1.7907659460902055, "percentage": 89.54, "elapsed_time": "2:03:04", "remaining_time": "0:14:22"} +{"current_steps": 6715, "total_steps": 7494, "loss": 0.579, "lr": 4.896679835994965e-06, "epoch": 1.792100346944222, "percentage": 89.61, "elapsed_time": "2:03:53", "remaining_time": "0:14:22"} +{"current_steps": 6720, "total_steps": 7494, "loss": 0.577, "lr": 4.834784311869985e-06, "epoch": 1.7934347477982386, "percentage": 89.67, "elapsed_time": "2:04:29", "remaining_time": "0:14:20"} +{"current_steps": 6725, "total_steps": 7494, "loss": 0.6021, "lr": 4.773269438152516e-06, "epoch": 1.794769148652255, "percentage": 89.74, "elapsed_time": "2:05:15", "remaining_time": "0:14:19"} +{"current_steps": 6730, "total_steps": 7494, "loss": 0.5739, "lr": 4.712135548564333e-06, "epoch": 1.7961035495062716, "percentage": 89.81, "elapsed_time": "2:06:16", "remaining_time": "0:14:20"} +{"current_steps": 6735, "total_steps": 7494, "loss": 0.5972, "lr": 4.651382974760382e-06, "epoch": 1.7974379503602882, "percentage": 89.87, "elapsed_time": "2:06:57", "remaining_time": "0:14:18"} +{"current_steps": 6740, "total_steps": 7494, "loss": 0.5844, "lr": 4.591012046326944e-06, "epoch": 1.7987723512143048, "percentage": 89.94, "elapsed_time": "2:07:33", "remaining_time": "0:14:16"} +{"current_steps": 6745, "total_steps": 7494, "loss": 0.5912, "lr": 4.5310230907798285e-06, "epoch": 1.8001067520683214, "percentage": 90.01, "elapsed_time": "2:08:27", "remaining_time": "0:14:15"} +{"current_steps": 6750, "total_steps": 7494, "loss": 0.5864, "lr": 4.471416433562638e-06, "epoch": 1.801441152922338, "percentage": 90.07, "elapsed_time": "2:09:23", "remaining_time": "0:14:15"} +{"current_steps": 6755, "total_steps": 7494, "loss": 0.5825, "lr": 4.412192398044997e-06, "epoch": 1.8027755537763546, "percentage": 90.14, "elapsed_time": "2:10:01", "remaining_time": "0:14:13"} +{"current_steps": 6760, "total_steps": 7494, "loss": 0.5923, "lr": 4.353351305520747e-06, "epoch": 1.804109954630371, "percentage": 90.21, "elapsed_time": "2:10:41", "remaining_time": "0:14:11"} +{"current_steps": 6765, "total_steps": 7494, "loss": 0.6047, "lr": 4.2948934752062655e-06, "epoch": 1.8054443554843875, "percentage": 90.27, "elapsed_time": "2:11:41", "remaining_time": "0:14:11"} +{"current_steps": 6770, "total_steps": 7494, "loss": 0.5978, "lr": 4.2368192242387355e-06, "epoch": 1.806778756338404, "percentage": 90.34, "elapsed_time": "2:12:32", "remaining_time": "0:14:10"} +{"current_steps": 6775, "total_steps": 7494, "loss": 0.5728, "lr": 4.179128867674348e-06, "epoch": 1.8081131571924205, "percentage": 90.41, "elapsed_time": "2:13:08", "remaining_time": "0:14:07"} +{"current_steps": 6780, "total_steps": 7494, "loss": 0.5937, "lr": 4.121822718486664e-06, "epoch": 1.809447558046437, "percentage": 90.47, "elapsed_time": "2:13:53", "remaining_time": "0:14:06"} +{"current_steps": 6785, "total_steps": 7494, "loss": 0.6062, "lr": 4.064901087564918e-06, "epoch": 1.8107819589004537, "percentage": 90.54, "elapsed_time": "2:14:55", "remaining_time": "0:14:05"} +{"current_steps": 6790, "total_steps": 7494, "loss": 0.5764, "lr": 4.008364283712298e-06, "epoch": 1.8121163597544703, "percentage": 90.61, "elapsed_time": "2:15:36", "remaining_time": "0:14:03"} +{"current_steps": 6795, "total_steps": 7494, "loss": 0.5842, "lr": 3.9522126136442515e-06, "epoch": 1.8134507606084869, "percentage": 90.67, "elapsed_time": "2:16:14", "remaining_time": "0:14:00"} +{"current_steps": 6800, "total_steps": 7494, "loss": 0.5886, "lr": 3.896446381986901e-06, "epoch": 1.8147851614625035, "percentage": 90.74, "elapsed_time": "2:17:07", "remaining_time": "0:13:59"} +{"current_steps": 6805, "total_steps": 7494, "loss": 0.5814, "lr": 3.841065891275328e-06, "epoch": 1.8161195623165198, "percentage": 90.81, "elapsed_time": "2:18:20", "remaining_time": "0:14:00"} +{"current_steps": 6810, "total_steps": 7494, "loss": 0.5715, "lr": 3.786071441951918e-06, "epoch": 1.8174539631705364, "percentage": 90.87, "elapsed_time": "2:18:59", "remaining_time": "0:13:57"} +{"current_steps": 6815, "total_steps": 7494, "loss": 0.599, "lr": 3.7314633323647952e-06, "epoch": 1.818788364024553, "percentage": 90.94, "elapsed_time": "2:19:39", "remaining_time": "0:13:54"} +{"current_steps": 6820, "total_steps": 7494, "loss": 0.5895, "lr": 3.6772418587661474e-06, "epoch": 1.8201227648785694, "percentage": 91.01, "elapsed_time": "2:20:37", "remaining_time": "0:13:53"} +{"current_steps": 6825, "total_steps": 7494, "loss": 0.6095, "lr": 3.623407315310667e-06, "epoch": 1.821457165732586, "percentage": 91.07, "elapsed_time": "2:21:27", "remaining_time": "0:13:52"} +{"current_steps": 6830, "total_steps": 7494, "loss": 0.5932, "lr": 3.5699599940538836e-06, "epoch": 1.8227915665866026, "percentage": 91.14, "elapsed_time": "2:22:06", "remaining_time": "0:13:48"} +{"current_steps": 6835, "total_steps": 7494, "loss": 0.6144, "lr": 3.5169001849506496e-06, "epoch": 1.8241259674406192, "percentage": 91.21, "elapsed_time": "2:22:50", "remaining_time": "0:13:46"} +{"current_steps": 6840, "total_steps": 7494, "loss": 0.5942, "lr": 3.4642281758535645e-06, "epoch": 1.8254603682946358, "percentage": 91.27, "elapsed_time": "2:23:49", "remaining_time": "0:13:45"} +{"current_steps": 6845, "total_steps": 7494, "loss": 0.5938, "lr": 3.4119442525113283e-06, "epoch": 1.8267947691486524, "percentage": 91.34, "elapsed_time": "2:24:35", "remaining_time": "0:13:42"} +{"current_steps": 6850, "total_steps": 7494, "loss": 0.5848, "lr": 3.3600486985673163e-06, "epoch": 1.828129170002669, "percentage": 91.41, "elapsed_time": "2:25:12", "remaining_time": "0:13:39"} +{"current_steps": 6855, "total_steps": 7494, "loss": 0.5941, "lr": 3.308541795557948e-06, "epoch": 1.8294635708566853, "percentage": 91.47, "elapsed_time": "2:26:03", "remaining_time": "0:13:36"} +{"current_steps": 6860, "total_steps": 7494, "loss": 0.5902, "lr": 3.2574238229111704e-06, "epoch": 1.830797971710702, "percentage": 91.54, "elapsed_time": "2:26:58", "remaining_time": "0:13:34"} +{"current_steps": 6865, "total_steps": 7494, "loss": 0.582, "lr": 3.2066950579450024e-06, "epoch": 1.8321323725647183, "percentage": 91.61, "elapsed_time": "2:27:40", "remaining_time": "0:13:31"} +{"current_steps": 6870, "total_steps": 7494, "loss": 0.5792, "lr": 3.156355775865968e-06, "epoch": 1.8334667734187349, "percentage": 91.67, "elapsed_time": "2:28:18", "remaining_time": "0:13:28"} +{"current_steps": 6875, "total_steps": 7494, "loss": 0.5816, "lr": 3.106406249767607e-06, "epoch": 1.8348011742727515, "percentage": 91.74, "elapsed_time": "2:29:13", "remaining_time": "0:13:26"} +{"current_steps": 6880, "total_steps": 7494, "loss": 0.604, "lr": 3.056846750629041e-06, "epoch": 1.836135575126768, "percentage": 91.81, "elapsed_time": "2:30:04", "remaining_time": "0:13:23"} +{"current_steps": 6885, "total_steps": 7494, "loss": 0.5963, "lr": 3.007677547313436e-06, "epoch": 1.8374699759807847, "percentage": 91.87, "elapsed_time": "2:30:43", "remaining_time": "0:13:19"} +{"current_steps": 6890, "total_steps": 7494, "loss": 0.5962, "lr": 2.958898906566626e-06, "epoch": 1.8388043768348012, "percentage": 91.94, "elapsed_time": "2:31:26", "remaining_time": "0:13:16"} +{"current_steps": 6895, "total_steps": 7494, "loss": 0.5975, "lr": 2.910511093015588e-06, "epoch": 1.8401387776888178, "percentage": 92.01, "elapsed_time": "2:32:22", "remaining_time": "0:13:14"} +{"current_steps": 6900, "total_steps": 7494, "loss": 0.5879, "lr": 2.8625143691670404e-06, "epoch": 1.8414731785428344, "percentage": 92.07, "elapsed_time": "2:33:11", "remaining_time": "0:13:11"} +{"current_steps": 6905, "total_steps": 7494, "loss": 0.5852, "lr": 2.8149089954060287e-06, "epoch": 1.8428075793968508, "percentage": 92.14, "elapsed_time": "2:34:04", "remaining_time": "0:13:08"} +{"current_steps": 6910, "total_steps": 7494, "loss": 0.6108, "lr": 2.767695229994507e-06, "epoch": 1.8441419802508674, "percentage": 92.21, "elapsed_time": "2:34:49", "remaining_time": "0:13:05"} +{"current_steps": 6915, "total_steps": 7494, "loss": 0.5894, "lr": 2.720873329069895e-06, "epoch": 1.8454763811048838, "percentage": 92.27, "elapsed_time": "2:35:45", "remaining_time": "0:13:02"} +{"current_steps": 6920, "total_steps": 7494, "loss": 0.5904, "lr": 2.6744435466437535e-06, "epoch": 1.8468107819589004, "percentage": 92.34, "elapsed_time": "2:36:31", "remaining_time": "0:12:58"} +{"current_steps": 6925, "total_steps": 7494, "loss": 0.5878, "lr": 2.6284061346004055e-06, "epoch": 1.848145182812917, "percentage": 92.41, "elapsed_time": "2:37:09", "remaining_time": "0:12:54"} +{"current_steps": 6930, "total_steps": 7494, "loss": 0.5966, "lr": 2.5827613426954664e-06, "epoch": 1.8494795836669335, "percentage": 92.47, "elapsed_time": "2:37:58", "remaining_time": "0:12:51"} +{"current_steps": 6935, "total_steps": 7494, "loss": 0.5922, "lr": 2.537509418554631e-06, "epoch": 1.8508139845209501, "percentage": 92.54, "elapsed_time": "2:38:50", "remaining_time": "0:12:48"} +{"current_steps": 6940, "total_steps": 7494, "loss": 0.599, "lr": 2.4926506076722417e-06, "epoch": 1.8521483853749667, "percentage": 92.61, "elapsed_time": "2:39:31", "remaining_time": "0:12:44"} +{"current_steps": 6945, "total_steps": 7494, "loss": 0.5852, "lr": 2.4481851534099707e-06, "epoch": 1.8534827862289833, "percentage": 92.67, "elapsed_time": "2:40:13", "remaining_time": "0:12:39"} +{"current_steps": 6950, "total_steps": 7494, "loss": 0.6024, "lr": 2.404113296995505e-06, "epoch": 1.8548171870829997, "percentage": 92.74, "elapsed_time": "2:41:03", "remaining_time": "0:12:36"} +{"current_steps": 6955, "total_steps": 7494, "loss": 0.59, "lr": 2.360435277521275e-06, "epoch": 1.8561515879370163, "percentage": 92.81, "elapsed_time": "2:41:56", "remaining_time": "0:12:33"} +{"current_steps": 6960, "total_steps": 7494, "loss": 0.6038, "lr": 2.3171513319430596e-06, "epoch": 1.8574859887910327, "percentage": 92.87, "elapsed_time": "2:42:34", "remaining_time": "0:12:28"} +{"current_steps": 6965, "total_steps": 7494, "loss": 0.5971, "lr": 2.274261695078841e-06, "epoch": 1.8588203896450493, "percentage": 92.94, "elapsed_time": "2:43:19", "remaining_time": "0:12:24"} +{"current_steps": 6970, "total_steps": 7494, "loss": 0.5697, "lr": 2.231766599607371e-06, "epoch": 1.8601547904990658, "percentage": 93.01, "elapsed_time": "2:44:10", "remaining_time": "0:12:20"} +{"current_steps": 6975, "total_steps": 7494, "loss": 0.591, "lr": 2.1896662760670618e-06, "epoch": 1.8614891913530824, "percentage": 93.07, "elapsed_time": "2:44:58", "remaining_time": "0:12:16"} +{"current_steps": 6980, "total_steps": 7494, "loss": 0.5952, "lr": 2.1479609528546328e-06, "epoch": 1.862823592207099, "percentage": 93.14, "elapsed_time": "2:45:35", "remaining_time": "0:12:11"} +{"current_steps": 6985, "total_steps": 7494, "loss": 0.5975, "lr": 2.106650856223899e-06, "epoch": 1.8641579930611156, "percentage": 93.21, "elapsed_time": "2:46:21", "remaining_time": "0:12:07"} +{"current_steps": 6990, "total_steps": 7494, "loss": 0.5847, "lr": 2.0657362102845576e-06, "epoch": 1.8654923939151322, "percentage": 93.27, "elapsed_time": "2:47:12", "remaining_time": "0:12:03"} +{"current_steps": 6995, "total_steps": 7494, "loss": 0.5717, "lr": 2.0252172370009646e-06, "epoch": 1.8668267947691488, "percentage": 93.34, "elapsed_time": "2:47:56", "remaining_time": "0:11:58"} +{"current_steps": 7000, "total_steps": 7494, "loss": 0.6034, "lr": 1.985094156190925e-06, "epoch": 1.8681611956231652, "percentage": 93.41, "elapsed_time": "2:48:35", "remaining_time": "0:11:53"} +{"current_steps": 7005, "total_steps": 7494, "loss": 0.5913, "lr": 1.9453671855244963e-06, "epoch": 1.8694955964771818, "percentage": 93.47, "elapsed_time": "2:49:33", "remaining_time": "0:11:50"} +{"current_steps": 7010, "total_steps": 7494, "loss": 0.5972, "lr": 1.906036540522829e-06, "epoch": 1.8708299973311981, "percentage": 93.54, "elapsed_time": "2:50:25", "remaining_time": "0:11:46"} +{"current_steps": 7015, "total_steps": 7494, "loss": 0.5984, "lr": 1.8671024345569773e-06, "epoch": 1.8721643981852147, "percentage": 93.61, "elapsed_time": "2:51:08", "remaining_time": "0:11:41"} +{"current_steps": 7020, "total_steps": 7494, "loss": 0.5821, "lr": 1.8285650788467415e-06, "epoch": 1.8734987990392313, "percentage": 93.67, "elapsed_time": "2:51:47", "remaining_time": "0:11:35"} +{"current_steps": 7025, "total_steps": 7494, "loss": 0.5909, "lr": 1.7904246824595514e-06, "epoch": 1.874833199893248, "percentage": 93.74, "elapsed_time": "2:52:39", "remaining_time": "0:11:31"} +{"current_steps": 7030, "total_steps": 7494, "loss": 0.6039, "lr": 1.7526814523092763e-06, "epoch": 1.8761676007472645, "percentage": 93.81, "elapsed_time": "2:53:31", "remaining_time": "0:11:27"} +{"current_steps": 7035, "total_steps": 7494, "loss": 0.6158, "lr": 1.7153355931551592e-06, "epoch": 1.8775020016012811, "percentage": 93.88, "elapsed_time": "2:54:12", "remaining_time": "0:11:22"} +{"current_steps": 7040, "total_steps": 7494, "loss": 0.6037, "lr": 1.678387307600676e-06, "epoch": 1.8788364024552977, "percentage": 93.94, "elapsed_time": "2:54:57", "remaining_time": "0:11:16"} +{"current_steps": 7045, "total_steps": 7494, "loss": 0.5846, "lr": 1.6418367960924271e-06, "epoch": 1.880170803309314, "percentage": 94.01, "elapsed_time": "2:55:47", "remaining_time": "0:11:12"} +{"current_steps": 7050, "total_steps": 7494, "loss": 0.5923, "lr": 1.6056842569190987e-06, "epoch": 1.8815052041633307, "percentage": 94.08, "elapsed_time": "2:56:37", "remaining_time": "0:11:07"} +{"current_steps": 7055, "total_steps": 7494, "loss": 0.5891, "lr": 1.5699298862103276e-06, "epoch": 1.8828396050173473, "percentage": 94.14, "elapsed_time": "2:57:17", "remaining_time": "0:11:01"} +{"current_steps": 7060, "total_steps": 7494, "loss": 0.6002, "lr": 1.5345738779356714e-06, "epoch": 1.8841740058713636, "percentage": 94.21, "elapsed_time": "2:58:02", "remaining_time": "0:10:56"} +{"current_steps": 7065, "total_steps": 7494, "loss": 0.5748, "lr": 1.4996164239035408e-06, "epoch": 1.8855084067253802, "percentage": 94.28, "elapsed_time": "2:58:54", "remaining_time": "0:10:51"} +{"current_steps": 7070, "total_steps": 7494, "loss": 0.5957, "lr": 1.4650577137601843e-06, "epoch": 1.8868428075793968, "percentage": 94.34, "elapsed_time": "2:59:41", "remaining_time": "0:10:46"} +{"current_steps": 7075, "total_steps": 7494, "loss": 0.5924, "lr": 1.4308979349886146e-06, "epoch": 1.8881772084334134, "percentage": 94.41, "elapsed_time": "3:00:20", "remaining_time": "0:10:40"} +{"current_steps": 7080, "total_steps": 7494, "loss": 0.6024, "lr": 1.3971372729076503e-06, "epoch": 1.88951160928743, "percentage": 94.48, "elapsed_time": "3:01:06", "remaining_time": "0:10:35"} +{"current_steps": 7085, "total_steps": 7494, "loss": 0.5972, "lr": 1.3637759106708501e-06, "epoch": 1.8908460101414466, "percentage": 94.54, "elapsed_time": "3:01:59", "remaining_time": "0:10:30"} +{"current_steps": 7090, "total_steps": 7494, "loss": 0.58, "lr": 1.3308140292655645e-06, "epoch": 1.8921804109954632, "percentage": 94.61, "elapsed_time": "3:03:48", "remaining_time": "0:10:28"} +{"current_steps": 7095, "total_steps": 7494, "loss": 0.5763, "lr": 1.2982518075119352e-06, "epoch": 1.8935148118494796, "percentage": 94.68, "elapsed_time": "3:04:28", "remaining_time": "0:10:22"} +{"current_steps": 7100, "total_steps": 7494, "loss": 0.595, "lr": 1.2660894220619139e-06, "epoch": 1.8948492127034962, "percentage": 94.74, "elapsed_time": "3:05:16", "remaining_time": "0:10:16"} +{"current_steps": 7105, "total_steps": 7494, "loss": 0.597, "lr": 1.2343270473983286e-06, "epoch": 1.8961836135575125, "percentage": 94.81, "elapsed_time": "3:06:15", "remaining_time": "0:10:11"} +{"current_steps": 7110, "total_steps": 7494, "loss": 0.5831, "lr": 1.202964855833935e-06, "epoch": 1.8975180144115291, "percentage": 94.88, "elapsed_time": "3:06:57", "remaining_time": "0:10:05"} +{"current_steps": 7115, "total_steps": 7494, "loss": 0.5972, "lr": 1.1720030175104506e-06, "epoch": 1.8988524152655457, "percentage": 94.94, "elapsed_time": "3:07:40", "remaining_time": "0:09:59"} +{"current_steps": 7120, "total_steps": 7494, "loss": 0.5787, "lr": 1.1414417003976634e-06, "epoch": 1.9001868161195623, "percentage": 95.01, "elapsed_time": "3:08:31", "remaining_time": "0:09:54"} +{"current_steps": 7125, "total_steps": 7494, "loss": 0.5852, "lr": 1.1112810702925163e-06, "epoch": 1.901521216973579, "percentage": 95.08, "elapsed_time": "3:09:18", "remaining_time": "0:09:48"} +{"current_steps": 7130, "total_steps": 7494, "loss": 0.584, "lr": 1.0815212908181825e-06, "epoch": 1.9028556178275955, "percentage": 95.14, "elapsed_time": "3:10:01", "remaining_time": "0:09:42"} +{"current_steps": 7135, "total_steps": 7494, "loss": 0.5959, "lr": 1.0521625234232333e-06, "epoch": 1.904190018681612, "percentage": 95.21, "elapsed_time": "3:10:45", "remaining_time": "0:09:35"} +{"current_steps": 7140, "total_steps": 7494, "loss": 0.6016, "lr": 1.023204927380672e-06, "epoch": 1.9055244195356285, "percentage": 95.28, "elapsed_time": "3:11:33", "remaining_time": "0:09:29"} +{"current_steps": 7145, "total_steps": 7494, "loss": 0.5931, "lr": 9.946486597871672e-07, "epoch": 1.906858820389645, "percentage": 95.34, "elapsed_time": "3:12:22", "remaining_time": "0:09:23"} +{"current_steps": 7150, "total_steps": 7494, "loss": 0.5861, "lr": 9.664938755621632e-07, "epoch": 1.9081932212436616, "percentage": 95.41, "elapsed_time": "3:13:04", "remaining_time": "0:09:17"} +{"current_steps": 7155, "total_steps": 7494, "loss": 0.5903, "lr": 9.387407274469793e-07, "epoch": 1.909527622097678, "percentage": 95.48, "elapsed_time": "3:13:48", "remaining_time": "0:09:10"} +{"current_steps": 7160, "total_steps": 7494, "loss": 0.5876, "lr": 9.113893660041033e-07, "epoch": 1.9108620229516946, "percentage": 95.54, "elapsed_time": "3:14:36", "remaining_time": "0:09:04"} +{"current_steps": 7165, "total_steps": 7494, "loss": 0.5817, "lr": 8.844399396162577e-07, "epoch": 1.9121964238057112, "percentage": 95.61, "elapsed_time": "3:15:23", "remaining_time": "0:08:58"} +{"current_steps": 7170, "total_steps": 7494, "loss": 0.6009, "lr": 8.578925944856596e-07, "epoch": 1.9135308246597278, "percentage": 95.68, "elapsed_time": "3:16:05", "remaining_time": "0:08:51"} +{"current_steps": 7175, "total_steps": 7494, "loss": 0.5763, "lr": 8.317474746332126e-07, "epoch": 1.9148652255137444, "percentage": 95.74, "elapsed_time": "3:16:52", "remaining_time": "0:08:45"} +{"current_steps": 7180, "total_steps": 7494, "loss": 0.5944, "lr": 8.060047218977323e-07, "epoch": 1.916199626367761, "percentage": 95.81, "elapsed_time": "3:17:40", "remaining_time": "0:08:38"} +{"current_steps": 7185, "total_steps": 7494, "loss": 0.5917, "lr": 7.806644759351471e-07, "epoch": 1.9175340272217776, "percentage": 95.88, "elapsed_time": "3:18:26", "remaining_time": "0:08:32"} +{"current_steps": 7190, "total_steps": 7494, "loss": 0.5953, "lr": 7.557268742177908e-07, "epoch": 1.918868428075794, "percentage": 95.94, "elapsed_time": "3:19:09", "remaining_time": "0:08:25"} +{"current_steps": 7195, "total_steps": 7494, "loss": 0.5895, "lr": 7.311920520336106e-07, "epoch": 1.9202028289298105, "percentage": 96.01, "elapsed_time": "3:19:56", "remaining_time": "0:08:18"} +{"current_steps": 7200, "total_steps": 7494, "loss": 0.5909, "lr": 7.070601424854522e-07, "epoch": 1.921537229783827, "percentage": 96.08, "elapsed_time": "3:20:44", "remaining_time": "0:08:11"} +{"current_steps": 7205, "total_steps": 7494, "loss": 0.5963, "lr": 6.833312764903343e-07, "epoch": 1.9228716306378435, "percentage": 96.14, "elapsed_time": "3:21:39", "remaining_time": "0:08:05"} +{"current_steps": 7210, "total_steps": 7494, "loss": 0.5888, "lr": 6.600055827787581e-07, "epoch": 1.92420603149186, "percentage": 96.21, "elapsed_time": "3:22:21", "remaining_time": "0:07:58"} +{"current_steps": 7215, "total_steps": 7494, "loss": 0.6123, "lr": 6.370831878939747e-07, "epoch": 1.9255404323458767, "percentage": 96.28, "elapsed_time": "3:23:09", "remaining_time": "0:07:51"} +{"current_steps": 7220, "total_steps": 7494, "loss": 0.5789, "lr": 6.1456421619131e-07, "epoch": 1.9268748331998933, "percentage": 96.34, "elapsed_time": "3:23:56", "remaining_time": "0:07:44"} +{"current_steps": 7225, "total_steps": 7494, "loss": 0.5894, "lr": 5.924487898375158e-07, "epoch": 1.9282092340539099, "percentage": 96.41, "elapsed_time": "3:24:42", "remaining_time": "0:07:37"} +{"current_steps": 7230, "total_steps": 7494, "loss": 0.6039, "lr": 5.707370288100782e-07, "epoch": 1.9295436349079265, "percentage": 96.48, "elapsed_time": "3:25:26", "remaining_time": "0:07:30"} +{"current_steps": 7235, "total_steps": 7494, "loss": 0.6047, "lr": 5.494290508965605e-07, "epoch": 1.9308780357619428, "percentage": 96.54, "elapsed_time": "3:26:15", "remaining_time": "0:07:23"} +{"current_steps": 7240, "total_steps": 7494, "loss": 0.5834, "lr": 5.285249716940026e-07, "epoch": 1.9322124366159594, "percentage": 96.61, "elapsed_time": "3:27:04", "remaining_time": "0:07:15"} +{"current_steps": 7245, "total_steps": 7494, "loss": 0.5967, "lr": 5.080249046082563e-07, "epoch": 1.933546837469976, "percentage": 96.68, "elapsed_time": "3:27:48", "remaining_time": "0:07:08"} +{"current_steps": 7250, "total_steps": 7494, "loss": 0.6052, "lr": 4.879289608533926e-07, "epoch": 1.9348812383239924, "percentage": 96.74, "elapsed_time": "3:28:32", "remaining_time": "0:07:01"} +{"current_steps": 7255, "total_steps": 7494, "loss": 0.5865, "lr": 4.6823724945107e-07, "epoch": 1.936215639178009, "percentage": 96.81, "elapsed_time": "3:29:20", "remaining_time": "0:06:53"} +{"current_steps": 7260, "total_steps": 7494, "loss": 0.5955, "lr": 4.489498772299843e-07, "epoch": 1.9375500400320256, "percentage": 96.88, "elapsed_time": "3:30:06", "remaining_time": "0:06:46"} +{"current_steps": 7265, "total_steps": 7494, "loss": 0.5929, "lr": 4.3006694882526947e-07, "epoch": 1.9388844408860422, "percentage": 96.94, "elapsed_time": "3:30:51", "remaining_time": "0:06:38"} +{"current_steps": 7270, "total_steps": 7494, "loss": 0.5921, "lr": 4.115885666779062e-07, "epoch": 1.9402188417400588, "percentage": 97.01, "elapsed_time": "3:31:35", "remaining_time": "0:06:31"} +{"current_steps": 7275, "total_steps": 7494, "loss": 0.5803, "lr": 3.9351483103420566e-07, "epoch": 1.9415532425940754, "percentage": 97.08, "elapsed_time": "3:32:22", "remaining_time": "0:06:23"} +{"current_steps": 7280, "total_steps": 7494, "loss": 0.5856, "lr": 3.758458399452519e-07, "epoch": 1.942887643448092, "percentage": 97.14, "elapsed_time": "3:33:10", "remaining_time": "0:06:15"} +{"current_steps": 7285, "total_steps": 7494, "loss": 0.5865, "lr": 3.585816892663351e-07, "epoch": 1.9442220443021083, "percentage": 97.21, "elapsed_time": "3:33:52", "remaining_time": "0:06:08"} +{"current_steps": 7290, "total_steps": 7494, "loss": 0.5944, "lr": 3.4172247265650267e-07, "epoch": 1.945556445156125, "percentage": 97.28, "elapsed_time": "3:34:38", "remaining_time": "0:06:00"} +{"current_steps": 7295, "total_steps": 7494, "loss": 0.5971, "lr": 3.252682815779922e-07, "epoch": 1.9468908460101413, "percentage": 97.34, "elapsed_time": "3:35:23", "remaining_time": "0:05:52"} +{"current_steps": 7300, "total_steps": 7494, "loss": 0.5976, "lr": 3.0921920529574096e-07, "epoch": 1.9482252468641579, "percentage": 97.41, "elapsed_time": "3:36:11", "remaining_time": "0:05:44"} +{"current_steps": 7305, "total_steps": 7494, "loss": 0.59, "lr": 2.9357533087694397e-07, "epoch": 1.9495596477181745, "percentage": 97.48, "elapsed_time": "3:37:05", "remaining_time": "0:05:37"} +{"current_steps": 7310, "total_steps": 7494, "loss": 0.5876, "lr": 2.7833674319052977e-07, "epoch": 1.950894048572191, "percentage": 97.54, "elapsed_time": "3:37:52", "remaining_time": "0:05:29"} +{"current_steps": 7315, "total_steps": 7494, "loss": 0.5919, "lr": 2.6350352490672746e-07, "epoch": 1.9522284494262077, "percentage": 97.61, "elapsed_time": "3:38:40", "remaining_time": "0:05:21"} +{"current_steps": 7320, "total_steps": 7494, "loss": 0.5899, "lr": 2.49075756496625e-07, "epoch": 1.9535628502802243, "percentage": 97.68, "elapsed_time": "3:39:27", "remaining_time": "0:05:13"} +{"current_steps": 7325, "total_steps": 7494, "loss": 0.6066, "lr": 2.3505351623170353e-07, "epoch": 1.9548972511342408, "percentage": 97.74, "elapsed_time": "3:40:10", "remaining_time": "0:05:04"} +{"current_steps": 7330, "total_steps": 7494, "loss": 0.6077, "lr": 2.2143688018343707e-07, "epoch": 1.9562316519882574, "percentage": 97.81, "elapsed_time": "3:40:57", "remaining_time": "0:04:56"} +{"current_steps": 7335, "total_steps": 7494, "loss": 0.5969, "lr": 2.0822592222287659e-07, "epoch": 1.9575660528422738, "percentage": 97.88, "elapsed_time": "3:41:46", "remaining_time": "0:04:48"} +{"current_steps": 7340, "total_steps": 7494, "loss": 0.5785, "lr": 1.9542071402024185e-07, "epoch": 1.9589004536962904, "percentage": 97.95, "elapsed_time": "3:42:31", "remaining_time": "0:04:40"} +{"current_steps": 7345, "total_steps": 7494, "loss": 0.5777, "lr": 1.830213250445467e-07, "epoch": 1.9602348545503068, "percentage": 98.01, "elapsed_time": "3:43:15", "remaining_time": "0:04:31"} +{"current_steps": 7350, "total_steps": 7494, "loss": 0.6075, "lr": 1.7102782256319115e-07, "epoch": 1.9615692554043234, "percentage": 98.08, "elapsed_time": "3:44:00", "remaining_time": "0:04:23"} +{"current_steps": 7355, "total_steps": 7494, "loss": 0.6058, "lr": 1.5944027164163652e-07, "epoch": 1.96290365625834, "percentage": 98.15, "elapsed_time": "3:44:50", "remaining_time": "0:04:14"} +{"current_steps": 7360, "total_steps": 7494, "loss": 0.5973, "lr": 1.4825873514302257e-07, "epoch": 1.9642380571123566, "percentage": 98.21, "elapsed_time": "3:45:36", "remaining_time": "0:04:06"} +{"current_steps": 7365, "total_steps": 7494, "loss": 0.5972, "lr": 1.3748327372784252e-07, "epoch": 1.9655724579663731, "percentage": 98.28, "elapsed_time": "3:46:19", "remaining_time": "0:03:57"} +{"current_steps": 7370, "total_steps": 7494, "loss": 0.5934, "lr": 1.271139458536019e-07, "epoch": 1.9669068588203897, "percentage": 98.35, "elapsed_time": "3:47:04", "remaining_time": "0:03:49"} +{"current_steps": 7375, "total_steps": 7494, "loss": 0.5912, "lr": 1.1715080777451868e-07, "epoch": 1.9682412596744063, "percentage": 98.41, "elapsed_time": "3:47:52", "remaining_time": "0:03:40"} +{"current_steps": 7380, "total_steps": 7494, "loss": 0.5878, "lr": 1.0759391354119017e-07, "epoch": 1.9695756605284227, "percentage": 98.48, "elapsed_time": "3:48:36", "remaining_time": "0:03:31"} +{"current_steps": 7385, "total_steps": 7494, "loss": 0.5962, "lr": 9.844331500034331e-08, "epoch": 1.9709100613824393, "percentage": 98.55, "elapsed_time": "3:49:21", "remaining_time": "0:03:23"} +{"current_steps": 7390, "total_steps": 7494, "loss": 0.6091, "lr": 8.969906179449316e-08, "epoch": 1.9722444622364559, "percentage": 98.61, "elapsed_time": "3:50:09", "remaining_time": "0:03:14"} +{"current_steps": 7395, "total_steps": 7494, "loss": 0.6054, "lr": 8.136120136174318e-08, "epoch": 1.9735788630904723, "percentage": 98.68, "elapsed_time": "3:50:56", "remaining_time": "0:03:05"} +{"current_steps": 7400, "total_steps": 7494, "loss": 0.6083, "lr": 7.342977893546875e-08, "epoch": 1.9749132639444889, "percentage": 98.75, "elapsed_time": "3:51:41", "remaining_time": "0:02:56"} +{"current_steps": 7405, "total_steps": 7494, "loss": 0.5744, "lr": 6.590483754409237e-08, "epoch": 1.9762476647985054, "percentage": 98.81, "elapsed_time": "3:52:36", "remaining_time": "0:02:47"} +{"current_steps": 7410, "total_steps": 7494, "loss": 0.589, "lr": 5.878641801087547e-08, "epoch": 1.977582065652522, "percentage": 98.88, "elapsed_time": "3:53:23", "remaining_time": "0:02:38"} +{"current_steps": 7415, "total_steps": 7494, "loss": 0.5908, "lr": 5.207455895365198e-08, "epoch": 1.9789164665065386, "percentage": 98.95, "elapsed_time": "3:54:12", "remaining_time": "0:02:29"} +{"current_steps": 7420, "total_steps": 7494, "loss": 0.5963, "lr": 4.5769296784653463e-08, "epoch": 1.9802508673605552, "percentage": 99.01, "elapsed_time": "3:54:54", "remaining_time": "0:02:20"} +{"current_steps": 7425, "total_steps": 7494, "loss": 0.5982, "lr": 3.9870665710300954e-08, "epoch": 1.9815852682145718, "percentage": 99.08, "elapsed_time": "3:55:38", "remaining_time": "0:02:11"} +{"current_steps": 7430, "total_steps": 7494, "loss": 0.5929, "lr": 3.437869773101343e-08, "epoch": 1.9829196690685882, "percentage": 99.15, "elapsed_time": "3:56:26", "remaining_time": "0:02:02"} +{"current_steps": 7435, "total_steps": 7494, "loss": 0.5782, "lr": 2.929342264103296e-08, "epoch": 1.9842540699226048, "percentage": 99.21, "elapsed_time": "3:57:14", "remaining_time": "0:01:52"} +{"current_steps": 7440, "total_steps": 7494, "loss": 0.5853, "lr": 2.4614868028274837e-08, "epoch": 1.9855884707766212, "percentage": 99.28, "elapsed_time": "3:57:57", "remaining_time": "0:01:43"} +{"current_steps": 7445, "total_steps": 7494, "loss": 0.5842, "lr": 2.034305927416935e-08, "epoch": 1.9869228716306377, "percentage": 99.35, "elapsed_time": "3:58:43", "remaining_time": "0:01:34"} +{"current_steps": 7450, "total_steps": 7494, "loss": 0.5771, "lr": 1.647801955354522e-08, "epoch": 1.9882572724846543, "percentage": 99.41, "elapsed_time": "3:59:30", "remaining_time": "0:01:24"} +{"current_steps": 7455, "total_steps": 7494, "loss": 0.5851, "lr": 1.301976983445474e-08, "epoch": 1.989591673338671, "percentage": 99.48, "elapsed_time": "4:00:15", "remaining_time": "0:01:15"} +{"current_steps": 7460, "total_steps": 7494, "loss": 0.6131, "lr": 9.968328878115495e-09, "epoch": 1.9909260741926875, "percentage": 99.55, "elapsed_time": "4:00:58", "remaining_time": "0:01:05"} +{"current_steps": 7465, "total_steps": 7494, "loss": 0.607, "lr": 7.3237132387604646e-09, "epoch": 1.9922604750467041, "percentage": 99.61, "elapsed_time": "4:01:44", "remaining_time": "0:00:56"} +{"current_steps": 7470, "total_steps": 7494, "loss": 0.5819, "lr": 5.0859372635964065e-09, "epoch": 1.9935948759007207, "percentage": 99.68, "elapsed_time": "4:02:30", "remaining_time": "0:00:46"} +{"current_steps": 7475, "total_steps": 7494, "loss": 0.5919, "lr": 3.2550130926789487e-09, "epoch": 1.994929276754737, "percentage": 99.75, "elapsed_time": "4:03:18", "remaining_time": "0:00:37"} +{"current_steps": 7480, "total_steps": 7494, "loss": 0.5921, "lr": 1.8309506588959356e-09, "epoch": 1.9962636776087537, "percentage": 99.81, "elapsed_time": "4:04:01", "remaining_time": "0:00:27"} +{"current_steps": 7485, "total_steps": 7494, "loss": 0.6098, "lr": 8.137576878508578e-10, "epoch": 1.9975980784627703, "percentage": 99.88, "elapsed_time": "4:04:47", "remaining_time": "0:00:17"} +{"current_steps": 7490, "total_steps": 7494, "loss": 0.5871, "lr": 2.0343969787950387e-10, "epoch": 1.9989324793167866, "percentage": 99.95, "elapsed_time": "4:05:33", "remaining_time": "0:00:07"} +{"current_steps": 7494, "total_steps": 7494, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "4:06:22", "remaining_time": "0:00:00"} diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..aab881e --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,16525 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 2.0, + "eval_steps": 500, + "global_step": 7494, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0013344008540165466, + "grad_norm": 7.722733096580246, + "learning_rate": 7.999999999999999e-07, + "loss": 0.8094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8109167218208313, + "step": 5, + "valid_targets_mean": 17002.7, + "valid_targets_min": 549 + }, + { + "epoch": 0.0026688017080330933, + "grad_norm": 7.174760064448044, + "learning_rate": 1.8e-06, + "loss": 0.7891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.8015649318695068, + "step": 10, + "valid_targets_mean": 15526.4, + "valid_targets_min": 632 + }, + { + "epoch": 0.0040032025620496394, + "grad_norm": 4.8505743485010075, + "learning_rate": 2.8e-06, + "loss": 0.7545, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7334458827972412, + "step": 15, + "valid_targets_mean": 16465.6, + "valid_targets_min": 720 + }, + { + "epoch": 0.0053376034160661865, + "grad_norm": 2.68270427913022, + "learning_rate": 3.7999999999999996e-06, + "loss": 0.751, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7277793288230896, + "step": 20, + "valid_targets_mean": 15549.5, + "valid_targets_min": 612 + }, + { + "epoch": 0.006672004270082733, + "grad_norm": 1.120496904003529, + "learning_rate": 4.8e-06, + "loss": 0.6974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7064324617385864, + "step": 25, + "valid_targets_mean": 14978.5, + "valid_targets_min": 643 + }, + { + "epoch": 0.008006405124099279, + "grad_norm": 0.9291840952692353, + "learning_rate": 5.7999999999999995e-06, + "loss": 0.7026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.7051266431808472, + "step": 30, + "valid_targets_mean": 16092.5, + "valid_targets_min": 573 + }, + { + "epoch": 0.009340805978115827, + "grad_norm": 0.5938965072427588, + "learning_rate": 6.8e-06, + "loss": 0.671, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6741308569908142, + "step": 35, + "valid_targets_mean": 15905.5, + "valid_targets_min": 764 + }, + { + "epoch": 0.010675206832132373, + "grad_norm": 0.39881741842407664, + "learning_rate": 7.799999999999998e-06, + "loss": 0.686, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6620453000068665, + "step": 40, + "valid_targets_mean": 17101.4, + "valid_targets_min": 491 + }, + { + "epoch": 0.01200960768614892, + "grad_norm": 0.30052510531289645, + "learning_rate": 8.799999999999999e-06, + "loss": 0.6603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6401622295379639, + "step": 45, + "valid_targets_mean": 16533.7, + "valid_targets_min": 668 + }, + { + "epoch": 0.013344008540165465, + "grad_norm": 0.2422091402873916, + "learning_rate": 9.799999999999998e-06, + "loss": 0.6859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6876528859138489, + "step": 50, + "valid_targets_mean": 15775.3, + "valid_targets_min": 553 + }, + { + "epoch": 0.014678409394182012, + "grad_norm": 0.18435404196588112, + "learning_rate": 1.0799999999999998e-05, + "loss": 0.6601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6202096343040466, + "step": 55, + "valid_targets_mean": 16902.1, + "valid_targets_min": 355 + }, + { + "epoch": 0.016012810248198558, + "grad_norm": 0.2015230015509419, + "learning_rate": 1.1799999999999999e-05, + "loss": 0.6605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6784886121749878, + "step": 60, + "valid_targets_mean": 15094.7, + "valid_targets_min": 699 + }, + { + "epoch": 0.017347211102215106, + "grad_norm": 0.18391518955306396, + "learning_rate": 1.2799999999999998e-05, + "loss": 0.6674, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6657936573028564, + "step": 65, + "valid_targets_mean": 16728.3, + "valid_targets_min": 751 + }, + { + "epoch": 0.018681611956231654, + "grad_norm": 0.18728851278657252, + "learning_rate": 1.3799999999999998e-05, + "loss": 0.6615, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6592050790786743, + "step": 70, + "valid_targets_mean": 15899.9, + "valid_targets_min": 89 + }, + { + "epoch": 0.020016012810248198, + "grad_norm": 0.18276533786350968, + "learning_rate": 1.4799999999999999e-05, + "loss": 0.6482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6309381723403931, + "step": 75, + "valid_targets_mean": 16547.5, + "valid_targets_min": 379 + }, + { + "epoch": 0.021350413664264746, + "grad_norm": 0.15304572919199264, + "learning_rate": 1.5799999999999998e-05, + "loss": 0.6546, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6724115014076233, + "step": 80, + "valid_targets_mean": 16472.0, + "valid_targets_min": 275 + }, + { + "epoch": 0.02268481451828129, + "grad_norm": 0.17202347874272747, + "learning_rate": 1.68e-05, + "loss": 0.6514, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6392582654953003, + "step": 85, + "valid_targets_mean": 15872.7, + "valid_targets_min": 570 + }, + { + "epoch": 0.02401921537229784, + "grad_norm": 0.1605220259750001, + "learning_rate": 1.78e-05, + "loss": 0.6534, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6394810676574707, + "step": 90, + "valid_targets_mean": 16103.1, + "valid_targets_min": 838 + }, + { + "epoch": 0.025353616226314386, + "grad_norm": 0.1856380489569822, + "learning_rate": 1.8799999999999996e-05, + "loss": 0.6642, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6631790399551392, + "step": 95, + "valid_targets_mean": 16072.2, + "valid_targets_min": 521 + }, + { + "epoch": 0.02668801708033093, + "grad_norm": 0.17012529774883547, + "learning_rate": 1.98e-05, + "loss": 0.6403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6355913877487183, + "step": 100, + "valid_targets_mean": 15947.1, + "valid_targets_min": 572 + }, + { + "epoch": 0.02802241793434748, + "grad_norm": 0.18944071384180122, + "learning_rate": 2.0799999999999997e-05, + "loss": 0.6474, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.630897045135498, + "step": 105, + "valid_targets_mean": 16317.5, + "valid_targets_min": 775 + }, + { + "epoch": 0.029356818788364023, + "grad_norm": 0.28359974957392275, + "learning_rate": 2.1799999999999998e-05, + "loss": 0.6414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6439160704612732, + "step": 110, + "valid_targets_mean": 17678.0, + "valid_targets_min": 412 + }, + { + "epoch": 0.03069121964238057, + "grad_norm": 0.20867511279432566, + "learning_rate": 2.28e-05, + "loss": 0.653, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6740957498550415, + "step": 115, + "valid_targets_mean": 14610.8, + "valid_targets_min": 607 + }, + { + "epoch": 0.032025620496397116, + "grad_norm": 0.22034953051672115, + "learning_rate": 2.38e-05, + "loss": 0.6551, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6769538521766663, + "step": 120, + "valid_targets_mean": 15110.7, + "valid_targets_min": 364 + }, + { + "epoch": 0.03336002135041367, + "grad_norm": 0.19858036390829426, + "learning_rate": 2.4799999999999996e-05, + "loss": 0.6566, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6704879999160767, + "step": 125, + "valid_targets_mean": 16683.8, + "valid_targets_min": 364 + }, + { + "epoch": 0.03469442220443021, + "grad_norm": 0.17343296109636808, + "learning_rate": 2.5799999999999997e-05, + "loss": 0.641, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6155713796615601, + "step": 130, + "valid_targets_mean": 16543.7, + "valid_targets_min": 430 + }, + { + "epoch": 0.036028823058446756, + "grad_norm": 0.21961900685930796, + "learning_rate": 2.6799999999999998e-05, + "loss": 0.6375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6220330595970154, + "step": 135, + "valid_targets_mean": 16411.1, + "valid_targets_min": 692 + }, + { + "epoch": 0.03736322391246331, + "grad_norm": 0.22084342992200506, + "learning_rate": 2.7799999999999995e-05, + "loss": 0.6648, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6999180912971497, + "step": 140, + "valid_targets_mean": 14523.8, + "valid_targets_min": 288 + }, + { + "epoch": 0.03869762476647985, + "grad_norm": 0.2310359062397061, + "learning_rate": 2.88e-05, + "loss": 0.6534, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6643216013908386, + "step": 145, + "valid_targets_mean": 16719.3, + "valid_targets_min": 594 + }, + { + "epoch": 0.040032025620496396, + "grad_norm": 0.186516441432285, + "learning_rate": 2.9799999999999996e-05, + "loss": 0.6485, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6516410112380981, + "step": 150, + "valid_targets_mean": 17415.4, + "valid_targets_min": 853 + }, + { + "epoch": 0.04136642647451294, + "grad_norm": 0.2534333458932033, + "learning_rate": 3.0799999999999996e-05, + "loss": 0.654, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6449211239814758, + "step": 155, + "valid_targets_mean": 15443.2, + "valid_targets_min": 360 + }, + { + "epoch": 0.04270082732852949, + "grad_norm": 0.29545907304950525, + "learning_rate": 3.1799999999999994e-05, + "loss": 0.6442, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6491722464561462, + "step": 160, + "valid_targets_mean": 16999.6, + "valid_targets_min": 609 + }, + { + "epoch": 0.044035228182546036, + "grad_norm": 0.26013562588749856, + "learning_rate": 3.28e-05, + "loss": 0.6282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6321196556091309, + "step": 165, + "valid_targets_mean": 16109.6, + "valid_targets_min": 623 + }, + { + "epoch": 0.04536962903656258, + "grad_norm": 0.20357197994388182, + "learning_rate": 3.3799999999999995e-05, + "loss": 0.6459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6354120969772339, + "step": 170, + "valid_targets_mean": 16442.6, + "valid_targets_min": 413 + }, + { + "epoch": 0.04670402989057913, + "grad_norm": 0.2528215866301578, + "learning_rate": 3.48e-05, + "loss": 0.6257, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6035679578781128, + "step": 175, + "valid_targets_mean": 16467.2, + "valid_targets_min": 508 + }, + { + "epoch": 0.04803843074459568, + "grad_norm": 0.29491368956485453, + "learning_rate": 3.5799999999999996e-05, + "loss": 0.6617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6350039839744568, + "step": 180, + "valid_targets_mean": 16867.5, + "valid_targets_min": 731 + }, + { + "epoch": 0.04937283159861222, + "grad_norm": 0.2644554424332122, + "learning_rate": 3.679999999999999e-05, + "loss": 0.6367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6491011381149292, + "step": 185, + "valid_targets_mean": 16007.8, + "valid_targets_min": 850 + }, + { + "epoch": 0.05070723245262877, + "grad_norm": 0.26708080017347674, + "learning_rate": 3.78e-05, + "loss": 0.6586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6851446628570557, + "step": 190, + "valid_targets_mean": 14931.2, + "valid_targets_min": 365 + }, + { + "epoch": 0.05204163330664532, + "grad_norm": 0.32544168158249764, + "learning_rate": 3.8799999999999994e-05, + "loss": 0.6426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6339905858039856, + "step": 195, + "valid_targets_mean": 16106.9, + "valid_targets_min": 101 + }, + { + "epoch": 0.05337603416066186, + "grad_norm": 0.27173833321054686, + "learning_rate": 3.979999999999999e-05, + "loss": 0.6433, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6287566423416138, + "step": 200, + "valid_targets_mean": 16933.6, + "valid_targets_min": 126 + }, + { + "epoch": 0.054710435014678406, + "grad_norm": 0.22284495398618304, + "learning_rate": 4.08e-05, + "loss": 0.6543, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6004332900047302, + "step": 205, + "valid_targets_mean": 16562.4, + "valid_targets_min": 541 + }, + { + "epoch": 0.05604483586869496, + "grad_norm": 0.34011968889770705, + "learning_rate": 4.18e-05, + "loss": 0.6531, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6229228973388672, + "step": 210, + "valid_targets_mean": 15680.9, + "valid_targets_min": 717 + }, + { + "epoch": 0.0573792367227115, + "grad_norm": 0.22699273620693833, + "learning_rate": 4.28e-05, + "loss": 0.6408, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.588473916053772, + "step": 215, + "valid_targets_mean": 16374.6, + "valid_targets_min": 550 + }, + { + "epoch": 0.058713637576728046, + "grad_norm": 0.34995893426720126, + "learning_rate": 4.3799999999999994e-05, + "loss": 0.6479, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6611473560333252, + "step": 220, + "valid_targets_mean": 16212.5, + "valid_targets_min": 789 + }, + { + "epoch": 0.0600480384307446, + "grad_norm": 0.28994318186176626, + "learning_rate": 4.48e-05, + "loss": 0.6398, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.627586841583252, + "step": 225, + "valid_targets_mean": 16141.5, + "valid_targets_min": 745 + }, + { + "epoch": 0.06138243928476114, + "grad_norm": 0.29147818946690207, + "learning_rate": 4.5799999999999995e-05, + "loss": 0.6594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6853932738304138, + "step": 230, + "valid_targets_mean": 14766.9, + "valid_targets_min": 429 + }, + { + "epoch": 0.0627168401387777, + "grad_norm": 0.22883342494533743, + "learning_rate": 4.68e-05, + "loss": 0.6482, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6339342594146729, + "step": 235, + "valid_targets_mean": 15721.2, + "valid_targets_min": 183 + }, + { + "epoch": 0.06405124099279423, + "grad_norm": 0.2461647251551573, + "learning_rate": 4.7799999999999996e-05, + "loss": 0.6426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6382437944412231, + "step": 240, + "valid_targets_mean": 15432.7, + "valid_targets_min": 475 + }, + { + "epoch": 0.06538564184681078, + "grad_norm": 0.26152022660942825, + "learning_rate": 4.8799999999999994e-05, + "loss": 0.637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6458475589752197, + "step": 245, + "valid_targets_mean": 16287.8, + "valid_targets_min": 629 + }, + { + "epoch": 0.06672004270082733, + "grad_norm": 0.2515010561393975, + "learning_rate": 4.98e-05, + "loss": 0.6589, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6445261240005493, + "step": 250, + "valid_targets_mean": 16890.9, + "valid_targets_min": 720 + }, + { + "epoch": 0.06805444355484387, + "grad_norm": 0.29505128400263414, + "learning_rate": 5.0799999999999995e-05, + "loss": 0.6496, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6435770988464355, + "step": 255, + "valid_targets_mean": 15024.3, + "valid_targets_min": 676 + }, + { + "epoch": 0.06938884440886042, + "grad_norm": 0.3188315335754373, + "learning_rate": 5.179999999999999e-05, + "loss": 0.6354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6181894540786743, + "step": 260, + "valid_targets_mean": 16111.8, + "valid_targets_min": 690 + }, + { + "epoch": 0.07072324526287697, + "grad_norm": 0.35692218300890305, + "learning_rate": 5.279999999999999e-05, + "loss": 0.6368, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6286272406578064, + "step": 265, + "valid_targets_mean": 15167.3, + "valid_targets_min": 109 + }, + { + "epoch": 0.07205764611689351, + "grad_norm": 0.3502722942708975, + "learning_rate": 5.38e-05, + "loss": 0.6445, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.615933895111084, + "step": 270, + "valid_targets_mean": 16902.7, + "valid_targets_min": 139 + }, + { + "epoch": 0.07339204697091006, + "grad_norm": 0.3215557581594254, + "learning_rate": 5.48e-05, + "loss": 0.6404, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6237388849258423, + "step": 275, + "valid_targets_mean": 16192.2, + "valid_targets_min": 636 + }, + { + "epoch": 0.07472644782492661, + "grad_norm": 0.39899551445003084, + "learning_rate": 5.5799999999999994e-05, + "loss": 0.63, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5924405455589294, + "step": 280, + "valid_targets_mean": 15586.0, + "valid_targets_min": 539 + }, + { + "epoch": 0.07606084867894315, + "grad_norm": 0.36329343959447064, + "learning_rate": 5.679999999999999e-05, + "loss": 0.6413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6253823041915894, + "step": 285, + "valid_targets_mean": 15027.2, + "valid_targets_min": 706 + }, + { + "epoch": 0.0773952495329597, + "grad_norm": 0.3552887259009282, + "learning_rate": 5.78e-05, + "loss": 0.633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6298519372940063, + "step": 290, + "valid_targets_mean": 15274.9, + "valid_targets_min": 253 + }, + { + "epoch": 0.07872965038697624, + "grad_norm": 0.5427295323238193, + "learning_rate": 5.88e-05, + "loss": 0.6317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6390588283538818, + "step": 295, + "valid_targets_mean": 16540.1, + "valid_targets_min": 134 + }, + { + "epoch": 0.08006405124099279, + "grad_norm": 0.35816189246454916, + "learning_rate": 5.98e-05, + "loss": 0.6602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6374964714050293, + "step": 300, + "valid_targets_mean": 15592.1, + "valid_targets_min": 595 + }, + { + "epoch": 0.08139845209500934, + "grad_norm": 0.27987335172366956, + "learning_rate": 6.0799999999999994e-05, + "loss": 0.6367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6291804313659668, + "step": 305, + "valid_targets_mean": 15667.8, + "valid_targets_min": 688 + }, + { + "epoch": 0.08273285294902588, + "grad_norm": 0.39583641768435684, + "learning_rate": 6.18e-05, + "loss": 0.6459, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.627192497253418, + "step": 310, + "valid_targets_mean": 16965.0, + "valid_targets_min": 748 + }, + { + "epoch": 0.08406725380304243, + "grad_norm": 0.34497427719209073, + "learning_rate": 6.28e-05, + "loss": 0.6357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6164098381996155, + "step": 315, + "valid_targets_mean": 16704.1, + "valid_targets_min": 632 + }, + { + "epoch": 0.08540165465705898, + "grad_norm": 0.5235857704611651, + "learning_rate": 6.379999999999999e-05, + "loss": 0.6412, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6287165880203247, + "step": 320, + "valid_targets_mean": 15693.0, + "valid_targets_min": 617 + }, + { + "epoch": 0.08673605551107552, + "grad_norm": 0.5312837364567617, + "learning_rate": 6.479999999999999e-05, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6154929995536804, + "step": 325, + "valid_targets_mean": 16596.4, + "valid_targets_min": 348 + }, + { + "epoch": 0.08807045636509207, + "grad_norm": 0.5265871873124938, + "learning_rate": 6.579999999999999e-05, + "loss": 0.6242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6224241852760315, + "step": 330, + "valid_targets_mean": 15641.3, + "valid_targets_min": 623 + }, + { + "epoch": 0.08940485721910862, + "grad_norm": 0.45762649729585103, + "learning_rate": 6.68e-05, + "loss": 0.6308, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6392424702644348, + "step": 335, + "valid_targets_mean": 17120.2, + "valid_targets_min": 799 + }, + { + "epoch": 0.09073925807312516, + "grad_norm": 0.4694075757636562, + "learning_rate": 6.78e-05, + "loss": 0.6419, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6159706115722656, + "step": 340, + "valid_targets_mean": 16286.1, + "valid_targets_min": 720 + }, + { + "epoch": 0.09207365892714171, + "grad_norm": 0.5016929581867708, + "learning_rate": 6.879999999999999e-05, + "loss": 0.6334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6220609545707703, + "step": 345, + "valid_targets_mean": 17040.8, + "valid_targets_min": 628 + }, + { + "epoch": 0.09340805978115826, + "grad_norm": 0.6373560197992398, + "learning_rate": 6.979999999999999e-05, + "loss": 0.6437, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6372533440589905, + "step": 350, + "valid_targets_mean": 15782.5, + "valid_targets_min": 616 + }, + { + "epoch": 0.0947424606351748, + "grad_norm": 0.5016876713993831, + "learning_rate": 7.079999999999999e-05, + "loss": 0.6437, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6407184600830078, + "step": 355, + "valid_targets_mean": 16137.4, + "valid_targets_min": 734 + }, + { + "epoch": 0.09607686148919135, + "grad_norm": 0.6364967752399274, + "learning_rate": 7.18e-05, + "loss": 0.6294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6185452342033386, + "step": 360, + "valid_targets_mean": 17217.6, + "valid_targets_min": 906 + }, + { + "epoch": 0.0974112623432079, + "grad_norm": 0.5233293275358429, + "learning_rate": 7.28e-05, + "loss": 0.6413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.634662926197052, + "step": 365, + "valid_targets_mean": 16162.9, + "valid_targets_min": 526 + }, + { + "epoch": 0.09874566319722444, + "grad_norm": 0.5448113397417333, + "learning_rate": 7.379999999999999e-05, + "loss": 0.6352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.637201189994812, + "step": 370, + "valid_targets_mean": 15398.7, + "valid_targets_min": 6 + }, + { + "epoch": 0.100080064051241, + "grad_norm": 0.5456285463552911, + "learning_rate": 7.479999999999999e-05, + "loss": 0.6426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6574046611785889, + "step": 375, + "valid_targets_mean": 15670.4, + "valid_targets_min": 483 + }, + { + "epoch": 0.10141446490525755, + "grad_norm": 0.38739916988200274, + "learning_rate": 7.579999999999999e-05, + "loss": 0.6297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5901604890823364, + "step": 380, + "valid_targets_mean": 17108.8, + "valid_targets_min": 105 + }, + { + "epoch": 0.10274886575927408, + "grad_norm": 0.5322073833756792, + "learning_rate": 7.68e-05, + "loss": 0.6355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6376615762710571, + "step": 385, + "valid_targets_mean": 17225.1, + "valid_targets_min": 719 + }, + { + "epoch": 0.10408326661329063, + "grad_norm": 0.4785089017506761, + "learning_rate": 7.780000000000001e-05, + "loss": 0.6413, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6684964895248413, + "step": 390, + "valid_targets_mean": 15992.3, + "valid_targets_min": 683 + }, + { + "epoch": 0.10541766746730719, + "grad_norm": 0.5065768208339545, + "learning_rate": 7.879999999999999e-05, + "loss": 0.63, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6249961256980896, + "step": 395, + "valid_targets_mean": 15035.4, + "valid_targets_min": 419 + }, + { + "epoch": 0.10675206832132372, + "grad_norm": 0.5140100470937524, + "learning_rate": 7.98e-05, + "loss": 0.6405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6756935119628906, + "step": 400, + "valid_targets_mean": 16192.8, + "valid_targets_min": 664 + }, + { + "epoch": 0.10808646917534027, + "grad_norm": 0.4375144441663607, + "learning_rate": 8.079999999999999e-05, + "loss": 0.6473, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6521981954574585, + "step": 405, + "valid_targets_mean": 15850.0, + "valid_targets_min": 448 + }, + { + "epoch": 0.10942087002935681, + "grad_norm": 0.2929651892552746, + "learning_rate": 8.18e-05, + "loss": 0.6357, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6364883184432983, + "step": 410, + "valid_targets_mean": 15711.7, + "valid_targets_min": 545 + }, + { + "epoch": 0.11075527088337336, + "grad_norm": 0.4564153270660509, + "learning_rate": 8.28e-05, + "loss": 0.6131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6293573379516602, + "step": 415, + "valid_targets_mean": 15629.3, + "valid_targets_min": 682 + }, + { + "epoch": 0.11208967173738991, + "grad_norm": 0.3507225963416143, + "learning_rate": 8.379999999999999e-05, + "loss": 0.6145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6214045286178589, + "step": 420, + "valid_targets_mean": 16229.8, + "valid_targets_min": 462 + }, + { + "epoch": 0.11342407259140645, + "grad_norm": 0.4192240853043197, + "learning_rate": 8.48e-05, + "loss": 0.6274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.619477391242981, + "step": 425, + "valid_targets_mean": 15496.3, + "valid_targets_min": 687 + }, + { + "epoch": 0.114758473445423, + "grad_norm": 0.45349034065464183, + "learning_rate": 8.579999999999998e-05, + "loss": 0.6338, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6174418926239014, + "step": 430, + "valid_targets_mean": 17214.9, + "valid_targets_min": 602 + }, + { + "epoch": 0.11609287429943956, + "grad_norm": 0.4890743720349672, + "learning_rate": 8.68e-05, + "loss": 0.6439, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6422944068908691, + "step": 435, + "valid_targets_mean": 14807.0, + "valid_targets_min": 548 + }, + { + "epoch": 0.11742727515345609, + "grad_norm": 0.3945142664933707, + "learning_rate": 8.779999999999999e-05, + "loss": 0.6323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6414684057235718, + "step": 440, + "valid_targets_mean": 16481.1, + "valid_targets_min": 754 + }, + { + "epoch": 0.11876167600747264, + "grad_norm": 0.396589484423819, + "learning_rate": 8.879999999999999e-05, + "loss": 0.6283, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6542065739631653, + "step": 445, + "valid_targets_mean": 17148.1, + "valid_targets_min": 482 + }, + { + "epoch": 0.1200960768614892, + "grad_norm": 0.4356111519880911, + "learning_rate": 8.98e-05, + "loss": 0.637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6526371240615845, + "step": 450, + "valid_targets_mean": 15223.1, + "valid_targets_min": 466 + }, + { + "epoch": 0.12143047771550573, + "grad_norm": 0.3812490978850452, + "learning_rate": 9.079999999999998e-05, + "loss": 0.6232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6449786424636841, + "step": 455, + "valid_targets_mean": 16120.0, + "valid_targets_min": 85 + }, + { + "epoch": 0.12276487856952228, + "grad_norm": 0.5466324629441199, + "learning_rate": 9.18e-05, + "loss": 0.6288, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6684505939483643, + "step": 460, + "valid_targets_mean": 14551.1, + "valid_targets_min": 535 + }, + { + "epoch": 0.12409927942353884, + "grad_norm": 0.440898309600464, + "learning_rate": 9.279999999999999e-05, + "loss": 0.6389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6249978542327881, + "step": 465, + "valid_targets_mean": 16389.1, + "valid_targets_min": 601 + }, + { + "epoch": 0.1254336802775554, + "grad_norm": 0.4812074587417184, + "learning_rate": 9.379999999999999e-05, + "loss": 0.6294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6114672422409058, + "step": 470, + "valid_targets_mean": 15764.7, + "valid_targets_min": 677 + }, + { + "epoch": 0.12676808113157192, + "grad_norm": 0.33120352620579174, + "learning_rate": 9.479999999999999e-05, + "loss": 0.6481, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6427431106567383, + "step": 475, + "valid_targets_mean": 16125.9, + "valid_targets_min": 566 + }, + { + "epoch": 0.12810248198558846, + "grad_norm": 0.4938707791865049, + "learning_rate": 9.58e-05, + "loss": 0.6352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6327007412910461, + "step": 480, + "valid_targets_mean": 15312.6, + "valid_targets_min": 722 + }, + { + "epoch": 0.12943688283960503, + "grad_norm": 0.6100558208938732, + "learning_rate": 9.68e-05, + "loss": 0.6405, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6266542673110962, + "step": 485, + "valid_targets_mean": 15428.1, + "valid_targets_min": 151 + }, + { + "epoch": 0.13077128369362157, + "grad_norm": 0.6172374578198562, + "learning_rate": 9.779999999999999e-05, + "loss": 0.6278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6328811049461365, + "step": 490, + "valid_targets_mean": 16432.2, + "valid_targets_min": 460 + }, + { + "epoch": 0.1321056845476381, + "grad_norm": 0.6025395448579794, + "learning_rate": 9.879999999999999e-05, + "loss": 0.6328, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6516920924186707, + "step": 495, + "valid_targets_mean": 17290.2, + "valid_targets_min": 234 + }, + { + "epoch": 0.13344008540165467, + "grad_norm": 0.7137832676715946, + "learning_rate": 9.979999999999999e-05, + "loss": 0.6409, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6384673118591309, + "step": 500, + "valid_targets_mean": 16150.1, + "valid_targets_min": 452 + }, + { + "epoch": 0.1347744862556712, + "grad_norm": 0.5110710358565494, + "learning_rate": 0.0001008, + "loss": 0.637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6318944692611694, + "step": 505, + "valid_targets_mean": 16285.9, + "valid_targets_min": 541 + }, + { + "epoch": 0.13610888710968774, + "grad_norm": 0.4387540839417831, + "learning_rate": 0.00010179999999999998, + "loss": 0.6318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6122161149978638, + "step": 510, + "valid_targets_mean": 17210.2, + "valid_targets_min": 663 + }, + { + "epoch": 0.1374432879637043, + "grad_norm": 0.3564577512761047, + "learning_rate": 0.00010279999999999999, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6141184568405151, + "step": 515, + "valid_targets_mean": 15328.4, + "valid_targets_min": 223 + }, + { + "epoch": 0.13877768881772085, + "grad_norm": 0.6811113729467204, + "learning_rate": 0.00010379999999999999, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6268406510353088, + "step": 520, + "valid_targets_mean": 17020.2, + "valid_targets_min": 685 + }, + { + "epoch": 0.14011208967173738, + "grad_norm": 0.6298148606182943, + "learning_rate": 0.00010479999999999999, + "loss": 0.6396, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6501023769378662, + "step": 525, + "valid_targets_mean": 17929.1, + "valid_targets_min": 509 + }, + { + "epoch": 0.14144649052575395, + "grad_norm": 0.4732100884671107, + "learning_rate": 0.0001058, + "loss": 0.6326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.668642520904541, + "step": 530, + "valid_targets_mean": 15325.7, + "valid_targets_min": 749 + }, + { + "epoch": 0.14278089137977049, + "grad_norm": 0.6101088915867378, + "learning_rate": 0.00010679999999999998, + "loss": 0.6309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6329489946365356, + "step": 535, + "valid_targets_mean": 14211.2, + "valid_targets_min": 543 + }, + { + "epoch": 0.14411529223378702, + "grad_norm": 0.6164583822509117, + "learning_rate": 0.00010779999999999999, + "loss": 0.643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6332310438156128, + "step": 540, + "valid_targets_mean": 16027.2, + "valid_targets_min": 513 + }, + { + "epoch": 0.1454496930878036, + "grad_norm": 0.46354108969743496, + "learning_rate": 0.0001088, + "loss": 0.6337, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6408779621124268, + "step": 545, + "valid_targets_mean": 15994.5, + "valid_targets_min": 665 + }, + { + "epoch": 0.14678409394182013, + "grad_norm": 0.6728497617605657, + "learning_rate": 0.00010979999999999999, + "loss": 0.6524, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6410496830940247, + "step": 550, + "valid_targets_mean": 15271.2, + "valid_targets_min": 672 + }, + { + "epoch": 0.14811849479583666, + "grad_norm": 0.452251096886965, + "learning_rate": 0.0001108, + "loss": 0.6142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6183743476867676, + "step": 555, + "valid_targets_mean": 16031.0, + "valid_targets_min": 620 + }, + { + "epoch": 0.14945289564985323, + "grad_norm": 0.4940079278296469, + "learning_rate": 0.00011179999999999998, + "loss": 0.6373, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6272560358047485, + "step": 560, + "valid_targets_mean": 15618.4, + "valid_targets_min": 490 + }, + { + "epoch": 0.15078729650386977, + "grad_norm": 0.40199346202147485, + "learning_rate": 0.00011279999999999999, + "loss": 0.6092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6106986999511719, + "step": 565, + "valid_targets_mean": 17251.2, + "valid_targets_min": 744 + }, + { + "epoch": 0.1521216973578863, + "grad_norm": 0.7062551724607816, + "learning_rate": 0.0001138, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6443933844566345, + "step": 570, + "valid_targets_mean": 15404.6, + "valid_targets_min": 591 + }, + { + "epoch": 0.15345609821190287, + "grad_norm": 0.5295131206766565, + "learning_rate": 0.00011479999999999999, + "loss": 0.6334, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6361149549484253, + "step": 575, + "valid_targets_mean": 16901.2, + "valid_targets_min": 875 + }, + { + "epoch": 0.1547904990659194, + "grad_norm": 0.4347384689835901, + "learning_rate": 0.0001158, + "loss": 0.6426, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6205735206604004, + "step": 580, + "valid_targets_mean": 16786.3, + "valid_targets_min": 369 + }, + { + "epoch": 0.15612489991993594, + "grad_norm": 0.5775856333359377, + "learning_rate": 0.00011679999999999998, + "loss": 0.6461, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6474686861038208, + "step": 585, + "valid_targets_mean": 14895.8, + "valid_targets_min": 108 + }, + { + "epoch": 0.15745930077395248, + "grad_norm": 0.7282618772499635, + "learning_rate": 0.00011779999999999999, + "loss": 0.6436, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6281576752662659, + "step": 590, + "valid_targets_mean": 14939.4, + "valid_targets_min": 477 + }, + { + "epoch": 0.15879370162796905, + "grad_norm": 0.4692524239463527, + "learning_rate": 0.0001188, + "loss": 0.6271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6387741565704346, + "step": 595, + "valid_targets_mean": 17040.3, + "valid_targets_min": 731 + }, + { + "epoch": 0.16012810248198558, + "grad_norm": 0.5058728730875969, + "learning_rate": 0.00011979999999999998, + "loss": 0.6226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.609712541103363, + "step": 600, + "valid_targets_mean": 15650.8, + "valid_targets_min": 463 + }, + { + "epoch": 0.16146250333600212, + "grad_norm": 0.46751037120907246, + "learning_rate": 0.0001208, + "loss": 0.6379, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.665306806564331, + "step": 605, + "valid_targets_mean": 15767.0, + "valid_targets_min": 775 + }, + { + "epoch": 0.1627969041900187, + "grad_norm": 0.41517754616987906, + "learning_rate": 0.00012179999999999999, + "loss": 0.6316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5787537097930908, + "step": 610, + "valid_targets_mean": 16859.7, + "valid_targets_min": 750 + }, + { + "epoch": 0.16413130504403523, + "grad_norm": 0.45185294422831457, + "learning_rate": 0.00012279999999999998, + "loss": 0.6256, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6185984015464783, + "step": 615, + "valid_targets_mean": 15708.6, + "valid_targets_min": 642 + }, + { + "epoch": 0.16546570589805176, + "grad_norm": 0.8923654038299266, + "learning_rate": 0.0001238, + "loss": 0.6395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6756001114845276, + "step": 620, + "valid_targets_mean": 15895.9, + "valid_targets_min": 364 + }, + { + "epoch": 0.16680010675206833, + "grad_norm": 0.6558823229700756, + "learning_rate": 0.00012479999999999997, + "loss": 0.6414, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6151660680770874, + "step": 625, + "valid_targets_mean": 17162.6, + "valid_targets_min": 735 + }, + { + "epoch": 0.16813450760608487, + "grad_norm": 0.4618405285160889, + "learning_rate": 0.0001258, + "loss": 0.6317, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6160898804664612, + "step": 630, + "valid_targets_mean": 15995.3, + "valid_targets_min": 353 + }, + { + "epoch": 0.1694689084601014, + "grad_norm": 0.5370756194829018, + "learning_rate": 0.0001268, + "loss": 0.6339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6276133060455322, + "step": 635, + "valid_targets_mean": 15865.4, + "valid_targets_min": 682 + }, + { + "epoch": 0.17080330931411797, + "grad_norm": 0.45147493000289246, + "learning_rate": 0.0001278, + "loss": 0.6319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6035290360450745, + "step": 640, + "valid_targets_mean": 15300.2, + "valid_targets_min": 473 + }, + { + "epoch": 0.1721377101681345, + "grad_norm": 0.4248585296196485, + "learning_rate": 0.0001288, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6245103478431702, + "step": 645, + "valid_targets_mean": 16338.7, + "valid_targets_min": 561 + }, + { + "epoch": 0.17347211102215104, + "grad_norm": 0.45315242194661487, + "learning_rate": 0.00012979999999999998, + "loss": 0.6429, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6325228214263916, + "step": 650, + "valid_targets_mean": 16460.1, + "valid_targets_min": 91 + }, + { + "epoch": 0.1748065118761676, + "grad_norm": 0.39926687744237155, + "learning_rate": 0.00013079999999999998, + "loss": 0.6401, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6352002620697021, + "step": 655, + "valid_targets_mean": 16758.9, + "valid_targets_min": 760 + }, + { + "epoch": 0.17614091273018415, + "grad_norm": 0.5573738851094832, + "learning_rate": 0.0001318, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6075339317321777, + "step": 660, + "valid_targets_mean": 16955.9, + "valid_targets_min": 827 + }, + { + "epoch": 0.17747531358420068, + "grad_norm": 0.6041112170658741, + "learning_rate": 0.00013279999999999998, + "loss": 0.6387, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6145156621932983, + "step": 665, + "valid_targets_mean": 16214.3, + "valid_targets_min": 617 + }, + { + "epoch": 0.17880971443821725, + "grad_norm": 0.6691609500323099, + "learning_rate": 0.0001338, + "loss": 0.6424, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6259413957595825, + "step": 670, + "valid_targets_mean": 15774.5, + "valid_targets_min": 721 + }, + { + "epoch": 0.1801441152922338, + "grad_norm": 0.5510175966492971, + "learning_rate": 0.00013479999999999997, + "loss": 0.6444, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6546534299850464, + "step": 675, + "valid_targets_mean": 16692.4, + "valid_targets_min": 415 + }, + { + "epoch": 0.18147851614625032, + "grad_norm": 0.45284578631102296, + "learning_rate": 0.0001358, + "loss": 0.6242, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6178637742996216, + "step": 680, + "valid_targets_mean": 15854.1, + "valid_targets_min": 364 + }, + { + "epoch": 0.1828129170002669, + "grad_norm": 0.5598143553534308, + "learning_rate": 0.0001368, + "loss": 0.6377, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6420258283615112, + "step": 685, + "valid_targets_mean": 16098.6, + "valid_targets_min": 690 + }, + { + "epoch": 0.18414731785428343, + "grad_norm": 0.4898643325722064, + "learning_rate": 0.0001378, + "loss": 0.6253, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6103246212005615, + "step": 690, + "valid_targets_mean": 15935.0, + "valid_targets_min": 46 + }, + { + "epoch": 0.18548171870829996, + "grad_norm": 0.48853693142080784, + "learning_rate": 0.00013879999999999999, + "loss": 0.625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6008676886558533, + "step": 695, + "valid_targets_mean": 15636.2, + "valid_targets_min": 800 + }, + { + "epoch": 0.18681611956231653, + "grad_norm": 0.6347995761312584, + "learning_rate": 0.00013979999999999998, + "loss": 0.6324, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.653724730014801, + "step": 700, + "valid_targets_mean": 14665.4, + "valid_targets_min": 224 + }, + { + "epoch": 0.18815052041633307, + "grad_norm": 0.7828402154942533, + "learning_rate": 0.00014079999999999998, + "loss": 0.6318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6152931451797485, + "step": 705, + "valid_targets_mean": 17113.1, + "valid_targets_min": 428 + }, + { + "epoch": 0.1894849212703496, + "grad_norm": 0.5241474516392837, + "learning_rate": 0.0001418, + "loss": 0.6333, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6403192281723022, + "step": 710, + "valid_targets_mean": 15791.3, + "valid_targets_min": 683 + }, + { + "epoch": 0.19081932212436617, + "grad_norm": 0.4632704579471851, + "learning_rate": 0.00014279999999999997, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6158638000488281, + "step": 715, + "valid_targets_mean": 16625.1, + "valid_targets_min": 534 + }, + { + "epoch": 0.1921537229783827, + "grad_norm": 0.46117923760781826, + "learning_rate": 0.0001438, + "loss": 0.6072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6315052509307861, + "step": 720, + "valid_targets_mean": 15794.5, + "valid_targets_min": 596 + }, + { + "epoch": 0.19348812383239924, + "grad_norm": 0.647822630194712, + "learning_rate": 0.0001448, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6225035190582275, + "step": 725, + "valid_targets_mean": 15483.7, + "valid_targets_min": 698 + }, + { + "epoch": 0.1948225246864158, + "grad_norm": 0.49037071545761785, + "learning_rate": 0.0001458, + "loss": 0.6339, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6174116134643555, + "step": 730, + "valid_targets_mean": 17187.7, + "valid_targets_min": 514 + }, + { + "epoch": 0.19615692554043235, + "grad_norm": 1.2177701556230174, + "learning_rate": 0.0001468, + "loss": 0.6278, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6415305137634277, + "step": 735, + "valid_targets_mean": 14950.6, + "valid_targets_min": 576 + }, + { + "epoch": 0.19749132639444889, + "grad_norm": 0.6247158077856722, + "learning_rate": 0.0001478, + "loss": 0.6382, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6371544599533081, + "step": 740, + "valid_targets_mean": 14802.8, + "valid_targets_min": 318 + }, + { + "epoch": 0.19882572724846545, + "grad_norm": 0.6322408214786107, + "learning_rate": 0.00014879999999999998, + "loss": 0.6266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5996054410934448, + "step": 745, + "valid_targets_mean": 15770.3, + "valid_targets_min": 134 + }, + { + "epoch": 0.200160128102482, + "grad_norm": 0.5899230568781816, + "learning_rate": 0.00014979999999999998, + "loss": 0.6311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.648550271987915, + "step": 750, + "valid_targets_mean": 15592.2, + "valid_targets_min": 146 + }, + { + "epoch": 0.20149452895649853, + "grad_norm": 0.5356162186310743, + "learning_rate": 0.00014999986979857214, + "loss": 0.6291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6485459804534912, + "step": 755, + "valid_targets_mean": 15480.7, + "valid_targets_min": 7 + }, + { + "epoch": 0.2028289298105151, + "grad_norm": 0.5996675499754749, + "learning_rate": 0.00014999934085604638, + "loss": 0.6301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6440800428390503, + "step": 760, + "valid_targets_mean": 15474.6, + "valid_targets_min": 473 + }, + { + "epoch": 0.20416333066453163, + "grad_norm": 0.6652446495332728, + "learning_rate": 0.00014999840503770068, + "loss": 0.6316, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6223655939102173, + "step": 765, + "valid_targets_mean": 15384.0, + "valid_targets_min": 433 + }, + { + "epoch": 0.20549773151854817, + "grad_norm": 0.5183540862933816, + "learning_rate": 0.00014999706234861205, + "loss": 0.643, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6405179500579834, + "step": 770, + "valid_targets_mean": 15208.1, + "valid_targets_min": 559 + }, + { + "epoch": 0.20683213237256473, + "grad_norm": 0.46844848194628597, + "learning_rate": 0.00014999531279606457, + "loss": 0.6354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6337324380874634, + "step": 775, + "valid_targets_mean": 16525.7, + "valid_targets_min": 511 + }, + { + "epoch": 0.20816653322658127, + "grad_norm": 0.671172585627433, + "learning_rate": 0.00014999315638954965, + "loss": 0.6348, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6305123567581177, + "step": 780, + "valid_targets_mean": 17233.3, + "valid_targets_min": 778 + }, + { + "epoch": 0.2095009340805978, + "grad_norm": 0.6074185020725967, + "learning_rate": 0.000149990593140766, + "loss": 0.6352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6281955242156982, + "step": 785, + "valid_targets_mean": 16683.3, + "valid_targets_min": 494 + }, + { + "epoch": 0.21083533493461437, + "grad_norm": 0.7479959234194301, + "learning_rate": 0.00014998762306361933, + "loss": 0.6319, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6173586249351501, + "step": 790, + "valid_targets_mean": 16722.9, + "valid_targets_min": 662 + }, + { + "epoch": 0.2121697357886309, + "grad_norm": 0.6232754007313384, + "learning_rate": 0.00014998424617422253, + "loss": 0.6247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6114662289619446, + "step": 795, + "valid_targets_mean": 17318.8, + "valid_targets_min": 707 + }, + { + "epoch": 0.21350413664264745, + "grad_norm": 2.474421684415322, + "learning_rate": 0.00014998046249089538, + "loss": 0.6309, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.630775511264801, + "step": 800, + "valid_targets_mean": 16087.6, + "valid_targets_min": 558 + }, + { + "epoch": 0.214838537496664, + "grad_norm": 0.5272341185487777, + "learning_rate": 0.00014997627203416458, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6349064111709595, + "step": 805, + "valid_targets_mean": 15673.0, + "valid_targets_min": 574 + }, + { + "epoch": 0.21617293835068055, + "grad_norm": 0.5074946180799155, + "learning_rate": 0.00014997167482676366, + "loss": 0.6285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.653042197227478, + "step": 810, + "valid_targets_mean": 14152.6, + "valid_targets_min": 718 + }, + { + "epoch": 0.2175073392046971, + "grad_norm": 0.6304000671143047, + "learning_rate": 0.00014996667089363272, + "loss": 0.6266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6242920160293579, + "step": 815, + "valid_targets_mean": 15896.4, + "valid_targets_min": 308 + }, + { + "epoch": 0.21884174005871362, + "grad_norm": 0.4929101127177894, + "learning_rate": 0.00014996126026191832, + "loss": 0.6425, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6394720077514648, + "step": 820, + "valid_targets_mean": 16951.1, + "valid_targets_min": 495 + }, + { + "epoch": 0.2201761409127302, + "grad_norm": 0.4831309890625364, + "learning_rate": 0.00014995544296097355, + "loss": 0.6282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6423969864845276, + "step": 825, + "valid_targets_mean": 14961.2, + "valid_targets_min": 736 + }, + { + "epoch": 0.22151054176674673, + "grad_norm": 0.5671978591902495, + "learning_rate": 0.00014994921902235757, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6383193135261536, + "step": 830, + "valid_targets_mean": 15189.4, + "valid_targets_min": 465 + }, + { + "epoch": 0.22284494262076326, + "grad_norm": 0.5408721097421353, + "learning_rate": 0.0001499425884798356, + "loss": 0.62, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6238391399383545, + "step": 835, + "valid_targets_mean": 15876.2, + "valid_targets_min": 650 + }, + { + "epoch": 0.22417934347477983, + "grad_norm": 0.5091528558852999, + "learning_rate": 0.00014993555136937872, + "loss": 0.6298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.616040825843811, + "step": 840, + "valid_targets_mean": 16239.6, + "valid_targets_min": 409 + }, + { + "epoch": 0.22551374432879637, + "grad_norm": 0.6991679506883416, + "learning_rate": 0.0001499281077291637, + "loss": 0.6358, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6669756174087524, + "step": 845, + "valid_targets_mean": 15986.7, + "valid_targets_min": 463 + }, + { + "epoch": 0.2268481451828129, + "grad_norm": 2.418185394050847, + "learning_rate": 0.00014992025759957267, + "loss": 0.6569, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6653257012367249, + "step": 850, + "valid_targets_mean": 15783.3, + "valid_targets_min": 673 + }, + { + "epoch": 0.22818254603682947, + "grad_norm": 0.9727676116589085, + "learning_rate": 0.0001499120010231931, + "loss": 0.6297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6188017129898071, + "step": 855, + "valid_targets_mean": 16147.9, + "valid_targets_min": 532 + }, + { + "epoch": 0.229516946890846, + "grad_norm": 0.9375704480379955, + "learning_rate": 0.00014990333804481738, + "loss": 0.6312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6338417530059814, + "step": 860, + "valid_targets_mean": 16900.2, + "valid_targets_min": 239 + }, + { + "epoch": 0.23085134774486255, + "grad_norm": 0.6205540371276664, + "learning_rate": 0.00014989426871144266, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6344268321990967, + "step": 865, + "valid_targets_mean": 16510.0, + "valid_targets_min": 803 + }, + { + "epoch": 0.2321857485988791, + "grad_norm": 0.3787711944460734, + "learning_rate": 0.00014988479307227062, + "loss": 0.6153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6353251338005066, + "step": 870, + "valid_targets_mean": 14899.5, + "valid_targets_min": 302 + }, + { + "epoch": 0.23352014945289565, + "grad_norm": 0.526714631887211, + "learning_rate": 0.00014987491117870717, + "loss": 0.632, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6151652336120605, + "step": 875, + "valid_targets_mean": 16548.4, + "valid_targets_min": 816 + }, + { + "epoch": 0.23485455030691219, + "grad_norm": 0.9469141187868311, + "learning_rate": 0.00014986462308436214, + "loss": 0.619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6323580741882324, + "step": 880, + "valid_targets_mean": 14792.8, + "valid_targets_min": 610 + }, + { + "epoch": 0.23618895116092875, + "grad_norm": 0.5545869906721276, + "learning_rate": 0.00014985392884504903, + "loss": 0.6327, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6401712894439697, + "step": 885, + "valid_targets_mean": 15866.4, + "valid_targets_min": 441 + }, + { + "epoch": 0.2375233520149453, + "grad_norm": 0.6671209209088051, + "learning_rate": 0.00014984282851878477, + "loss": 0.6277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6353170871734619, + "step": 890, + "valid_targets_mean": 16787.9, + "valid_targets_min": 513 + }, + { + "epoch": 0.23885775286896183, + "grad_norm": 0.707216009088664, + "learning_rate": 0.00014983132216578923, + "loss": 0.6277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6237537860870361, + "step": 895, + "valid_targets_mean": 16321.5, + "valid_targets_min": 555 + }, + { + "epoch": 0.2401921537229784, + "grad_norm": 0.44220574683340125, + "learning_rate": 0.00014981940984848508, + "loss": 0.6095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5769079923629761, + "step": 900, + "valid_targets_mean": 16333.7, + "valid_targets_min": 625 + }, + { + "epoch": 0.24152655457699493, + "grad_norm": 0.567649333484972, + "learning_rate": 0.00014980709163149732, + "loss": 0.6352, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6523852944374084, + "step": 905, + "valid_targets_mean": 15671.2, + "valid_targets_min": 517 + }, + { + "epoch": 0.24286095543101147, + "grad_norm": 0.39550289799836713, + "learning_rate": 0.000149794367581653, + "loss": 0.6286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6379982233047485, + "step": 910, + "valid_targets_mean": 16212.5, + "valid_targets_min": 365 + }, + { + "epoch": 0.24419535628502803, + "grad_norm": 0.5657359448312539, + "learning_rate": 0.00014978123776798082, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6022660732269287, + "step": 915, + "valid_targets_mean": 17185.0, + "valid_targets_min": 373 + }, + { + "epoch": 0.24552975713904457, + "grad_norm": 0.46551913820916074, + "learning_rate": 0.00014976770226171084, + "loss": 0.6211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5838291049003601, + "step": 920, + "valid_targets_mean": 17635.7, + "valid_targets_min": 673 + }, + { + "epoch": 0.2468641579930611, + "grad_norm": 0.628573995916106, + "learning_rate": 0.00014975376113627394, + "loss": 0.6243, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6010740399360657, + "step": 925, + "valid_targets_mean": 17160.6, + "valid_targets_min": 653 + }, + { + "epoch": 0.24819855884707767, + "grad_norm": 0.5886488234344668, + "learning_rate": 0.00014973941446730154, + "loss": 0.6417, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6382604837417603, + "step": 930, + "valid_targets_mean": 16632.9, + "valid_targets_min": 434 + }, + { + "epoch": 0.2495329597010942, + "grad_norm": 0.48658287775706377, + "learning_rate": 0.00014972466233262517, + "loss": 0.6268, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6358413696289062, + "step": 935, + "valid_targets_mean": 16748.2, + "valid_targets_min": 386 + }, + { + "epoch": 0.2508673605551108, + "grad_norm": 0.6165528347204787, + "learning_rate": 0.00014970950481227603, + "loss": 0.6271, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6221519708633423, + "step": 940, + "valid_targets_mean": 15600.3, + "valid_targets_min": 423 + }, + { + "epoch": 0.2522017614091273, + "grad_norm": 0.5163784973495187, + "learning_rate": 0.00014969394198848456, + "loss": 0.6291, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6757415533065796, + "step": 945, + "valid_targets_mean": 14300.9, + "valid_targets_min": 655 + }, + { + "epoch": 0.25353616226314385, + "grad_norm": 0.4121567337420054, + "learning_rate": 0.00014967797394567993, + "loss": 0.6102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5853270292282104, + "step": 950, + "valid_targets_mean": 16034.4, + "valid_targets_min": 506 + }, + { + "epoch": 0.2548705631171604, + "grad_norm": 0.7577521485230333, + "learning_rate": 0.00014966160077048982, + "loss": 0.6088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6212820410728455, + "step": 955, + "valid_targets_mean": 16407.6, + "valid_targets_min": 112 + }, + { + "epoch": 0.2562049639711769, + "grad_norm": 0.5797059241277471, + "learning_rate": 0.00014964482255173958, + "loss": 0.6355, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6175366640090942, + "step": 960, + "valid_targets_mean": 15787.3, + "valid_targets_min": 17 + }, + { + "epoch": 0.25753936482519346, + "grad_norm": 0.6745773228660589, + "learning_rate": 0.00014962763938045206, + "loss": 0.6343, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6257587671279907, + "step": 965, + "valid_targets_mean": 14691.4, + "valid_targets_min": 854 + }, + { + "epoch": 0.25887376567921005, + "grad_norm": 0.719661214105207, + "learning_rate": 0.00014961005134984693, + "loss": 0.6238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6064175367355347, + "step": 970, + "valid_targets_mean": 17340.3, + "valid_targets_min": 692 + }, + { + "epoch": 0.2602081665332266, + "grad_norm": 0.7928522671161337, + "learning_rate": 0.00014959205855534036, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6479929685592651, + "step": 975, + "valid_targets_mean": 16809.3, + "valid_targets_min": 201 + }, + { + "epoch": 0.26154256738724313, + "grad_norm": 0.42078558451857806, + "learning_rate": 0.00014957366109454427, + "loss": 0.6165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6084697246551514, + "step": 980, + "valid_targets_mean": 16258.8, + "valid_targets_min": 664 + }, + { + "epoch": 0.26287696824125967, + "grad_norm": 0.5847517399099696, + "learning_rate": 0.00014955485906726596, + "loss": 0.631, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6284216642379761, + "step": 985, + "valid_targets_mean": 15576.3, + "valid_targets_min": 452 + }, + { + "epoch": 0.2642113690952762, + "grad_norm": 0.5762291412718675, + "learning_rate": 0.00014953565257550756, + "loss": 0.6403, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.620425283908844, + "step": 990, + "valid_targets_mean": 16763.7, + "valid_targets_min": 403 + }, + { + "epoch": 0.26554576994929274, + "grad_norm": 0.6979661040448024, + "learning_rate": 0.00014951604172346535, + "loss": 0.6321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6719156503677368, + "step": 995, + "valid_targets_mean": 14564.9, + "valid_targets_min": 620 + }, + { + "epoch": 0.26688017080330934, + "grad_norm": 0.6488310360831638, + "learning_rate": 0.00014949602661752944, + "loss": 0.6361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6312586069107056, + "step": 1000, + "valid_targets_mean": 17267.3, + "valid_targets_min": 488 + }, + { + "epoch": 0.2682145716573259, + "grad_norm": 0.7100211577778035, + "learning_rate": 0.0001494756073662829, + "loss": 0.6048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5785956978797913, + "step": 1005, + "valid_targets_mean": 16819.7, + "valid_targets_min": 548 + }, + { + "epoch": 0.2695489725113424, + "grad_norm": 0.5186043844844956, + "learning_rate": 0.00014945478408050135, + "loss": 0.6241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5791152119636536, + "step": 1010, + "valid_targets_mean": 17192.7, + "valid_targets_min": 702 + }, + { + "epoch": 0.27088337336535895, + "grad_norm": 0.4865216909323894, + "learning_rate": 0.00014943355687315239, + "loss": 0.6346, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6338467597961426, + "step": 1015, + "valid_targets_mean": 15711.4, + "valid_targets_min": 225 + }, + { + "epoch": 0.2722177742193755, + "grad_norm": 2.9839267781053938, + "learning_rate": 0.0001494119258593948, + "loss": 0.6198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6054257154464722, + "step": 1020, + "valid_targets_mean": 16202.0, + "valid_targets_min": 651 + }, + { + "epoch": 0.273552175073392, + "grad_norm": 0.4682102838085987, + "learning_rate": 0.00014938989115657815, + "loss": 0.6438, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6480819582939148, + "step": 1025, + "valid_targets_mean": 16784.9, + "valid_targets_min": 461 + }, + { + "epoch": 0.2748865759274086, + "grad_norm": 0.5780484239113524, + "learning_rate": 0.00014936745288424198, + "loss": 0.6411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6359916925430298, + "step": 1030, + "valid_targets_mean": 16367.8, + "valid_targets_min": 624 + }, + { + "epoch": 0.27622097678142515, + "grad_norm": 0.4748800236035067, + "learning_rate": 0.0001493446111641152, + "loss": 0.6388, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6322864294052124, + "step": 1035, + "valid_targets_mean": 17037.6, + "valid_targets_min": 290 + }, + { + "epoch": 0.2775553776354417, + "grad_norm": 0.5475367460557771, + "learning_rate": 0.00014932136612011554, + "loss": 0.619, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5975278615951538, + "step": 1040, + "valid_targets_mean": 14834.2, + "valid_targets_min": 317 + }, + { + "epoch": 0.27888977848945823, + "grad_norm": 0.5803392107957903, + "learning_rate": 0.00014929771787834868, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6173809170722961, + "step": 1045, + "valid_targets_mean": 14989.7, + "valid_targets_min": 712 + }, + { + "epoch": 0.28022417934347477, + "grad_norm": 0.5695332004442396, + "learning_rate": 0.00014927366656710772, + "loss": 0.6361, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6184433102607727, + "step": 1050, + "valid_targets_mean": 16500.4, + "valid_targets_min": 609 + }, + { + "epoch": 0.2815585801974913, + "grad_norm": 0.5210619813808601, + "learning_rate": 0.00014924921231687245, + "loss": 0.6446, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6179799437522888, + "step": 1055, + "valid_targets_mean": 16106.9, + "valid_targets_min": 119 + }, + { + "epoch": 0.2828929810515079, + "grad_norm": 0.6614658274322637, + "learning_rate": 0.0001492243552603086, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6067185997962952, + "step": 1060, + "valid_targets_mean": 16331.0, + "valid_targets_min": 623 + }, + { + "epoch": 0.28422738190552443, + "grad_norm": 0.9608258567454809, + "learning_rate": 0.00014919909553226716, + "loss": 0.629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5961272716522217, + "step": 1065, + "valid_targets_mean": 17423.3, + "valid_targets_min": 43 + }, + { + "epoch": 0.28556178275954097, + "grad_norm": 0.7810276450704127, + "learning_rate": 0.00014917343326978366, + "loss": 0.626, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6217774152755737, + "step": 1070, + "valid_targets_mean": 16327.2, + "valid_targets_min": 767 + }, + { + "epoch": 0.2868961836135575, + "grad_norm": 0.8791876590438911, + "learning_rate": 0.00014914736861207733, + "loss": 0.614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6118861436843872, + "step": 1075, + "valid_targets_mean": 16543.7, + "valid_targets_min": 316 + }, + { + "epoch": 0.28823058446757405, + "grad_norm": 1.1384137467784206, + "learning_rate": 0.0001491209017005505, + "loss": 0.634, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6420910358428955, + "step": 1080, + "valid_targets_mean": 15269.9, + "valid_targets_min": 541 + }, + { + "epoch": 0.2895649853215906, + "grad_norm": 0.9186506276668647, + "learning_rate": 0.00014909403267878771, + "loss": 0.6226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6265588998794556, + "step": 1085, + "valid_targets_mean": 15304.5, + "valid_targets_min": 279 + }, + { + "epoch": 0.2908993861756072, + "grad_norm": 0.6353711384570834, + "learning_rate": 0.000149066761692555, + "loss": 0.6507, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6470847129821777, + "step": 1090, + "valid_targets_mean": 15632.7, + "valid_targets_min": 653 + }, + { + "epoch": 0.2922337870296237, + "grad_norm": 0.8185383898766663, + "learning_rate": 0.00014903908888979904, + "loss": 0.6703, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.647415816783905, + "step": 1095, + "valid_targets_mean": 16790.4, + "valid_targets_min": 571 + }, + { + "epoch": 0.29356818788364025, + "grad_norm": 0.8184426394736861, + "learning_rate": 0.00014901101442064637, + "loss": 0.6394, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6400127410888672, + "step": 1100, + "valid_targets_mean": 16172.6, + "valid_targets_min": 620 + }, + { + "epoch": 0.2949025887376568, + "grad_norm": 0.556673335317666, + "learning_rate": 0.00014898253843740271, + "loss": 0.6191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6126173734664917, + "step": 1105, + "valid_targets_mean": 16876.9, + "valid_targets_min": 63 + }, + { + "epoch": 0.2962369895916733, + "grad_norm": 0.6295377941122368, + "learning_rate": 0.00014895366109455189, + "loss": 0.6227, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6384031772613525, + "step": 1110, + "valid_targets_mean": 14548.6, + "valid_targets_min": 587 + }, + { + "epoch": 0.29757139044568987, + "grad_norm": 0.5248335147680199, + "learning_rate": 0.00014892438254875522, + "loss": 0.6332, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6321662068367004, + "step": 1115, + "valid_targets_mean": 15943.8, + "valid_targets_min": 510 + }, + { + "epoch": 0.29890579129970646, + "grad_norm": 0.46918917861931686, + "learning_rate": 0.00014889470295885047, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6436111927032471, + "step": 1120, + "valid_targets_mean": 15795.2, + "valid_targets_min": 555 + }, + { + "epoch": 0.300240192153723, + "grad_norm": 0.5296984184134944, + "learning_rate": 0.0001488646224858512, + "loss": 0.622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6454466581344604, + "step": 1125, + "valid_targets_mean": 16186.7, + "valid_targets_min": 481 + }, + { + "epoch": 0.30157459300773953, + "grad_norm": 0.45293649555504717, + "learning_rate": 0.00014883414129294575, + "loss": 0.6249, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6144802570343018, + "step": 1130, + "valid_targets_mean": 16900.4, + "valid_targets_min": 208 + }, + { + "epoch": 0.30290899386175607, + "grad_norm": 0.6521647010742185, + "learning_rate": 0.00014880325954549635, + "loss": 0.6111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6205244064331055, + "step": 1135, + "valid_targets_mean": 16414.0, + "valid_targets_min": 542 + }, + { + "epoch": 0.3042433947157726, + "grad_norm": 0.47504287072364365, + "learning_rate": 0.00014877197741103827, + "loss": 0.6169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6137683391571045, + "step": 1140, + "valid_targets_mean": 16874.0, + "valid_targets_min": 20 + }, + { + "epoch": 0.30557779556978915, + "grad_norm": 0.48482488804825913, + "learning_rate": 0.00014874029505927897, + "loss": 0.628, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.600907564163208, + "step": 1145, + "valid_targets_mean": 15816.4, + "valid_targets_min": 445 + }, + { + "epoch": 0.30691219642380574, + "grad_norm": 0.590376880482206, + "learning_rate": 0.00014870821266209705, + "loss": 0.6389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6424787640571594, + "step": 1150, + "valid_targets_mean": 16383.6, + "valid_targets_min": 341 + }, + { + "epoch": 0.3082465972778223, + "grad_norm": 0.7933903651046492, + "learning_rate": 0.00014867573039354138, + "loss": 0.636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.624193012714386, + "step": 1155, + "valid_targets_mean": 16836.2, + "valid_targets_min": 606 + }, + { + "epoch": 0.3095809981318388, + "grad_norm": 0.9457148294169705, + "learning_rate": 0.00014864284842983018, + "loss": 0.6384, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6270631551742554, + "step": 1160, + "valid_targets_mean": 17508.7, + "valid_targets_min": 773 + }, + { + "epoch": 0.31091539898585535, + "grad_norm": 0.7378226203734249, + "learning_rate": 0.00014860956694935003, + "loss": 0.6175, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5961403846740723, + "step": 1165, + "valid_targets_mean": 15587.0, + "valid_targets_min": 528 + }, + { + "epoch": 0.3122497998398719, + "grad_norm": 0.8823224927738156, + "learning_rate": 0.0001485758861326549, + "loss": 0.611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6161226034164429, + "step": 1170, + "valid_targets_mean": 15393.7, + "valid_targets_min": 213 + }, + { + "epoch": 0.3135842006938884, + "grad_norm": 0.639113418443212, + "learning_rate": 0.00014854180616246523, + "loss": 0.6145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6032258868217468, + "step": 1175, + "valid_targets_mean": 14761.5, + "valid_targets_min": 699 + }, + { + "epoch": 0.31491860154790496, + "grad_norm": 0.9033165887917867, + "learning_rate": 0.00014850732722366682, + "loss": 0.6354, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6307148933410645, + "step": 1180, + "valid_targets_mean": 16037.6, + "valid_targets_min": 501 + }, + { + "epoch": 0.31625300240192156, + "grad_norm": 0.5532447648291372, + "learning_rate": 0.00014847244950330998, + "loss": 0.627, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6076141595840454, + "step": 1185, + "valid_targets_mean": 15901.8, + "valid_targets_min": 662 + }, + { + "epoch": 0.3175874032559381, + "grad_norm": 0.5412595599268045, + "learning_rate": 0.00014843717319060833, + "loss": 0.6318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623320460319519, + "step": 1190, + "valid_targets_mean": 15982.0, + "valid_targets_min": 595 + }, + { + "epoch": 0.31892180410995463, + "grad_norm": 0.712340033605185, + "learning_rate": 0.00014840149847693794, + "loss": 0.6272, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6320945024490356, + "step": 1195, + "valid_targets_mean": 16020.9, + "valid_targets_min": 367 + }, + { + "epoch": 0.32025620496397117, + "grad_norm": 0.5170839825925028, + "learning_rate": 0.00014836542555583628, + "loss": 0.6184, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6051146984100342, + "step": 1200, + "valid_targets_mean": 15806.9, + "valid_targets_min": 681 + }, + { + "epoch": 0.3215906058179877, + "grad_norm": 0.42832852584741143, + "learning_rate": 0.000148328954623001, + "loss": 0.6301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6123482584953308, + "step": 1205, + "valid_targets_mean": 16524.5, + "valid_targets_min": 545 + }, + { + "epoch": 0.32292500667200424, + "grad_norm": 0.4873892662092641, + "learning_rate": 0.00014829208587628908, + "loss": 0.6165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6147938370704651, + "step": 1210, + "valid_targets_mean": 15223.3, + "valid_targets_min": 414 + }, + { + "epoch": 0.32425940752602084, + "grad_norm": 0.493152065483101, + "learning_rate": 0.0001482548195157156, + "loss": 0.6172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6495429277420044, + "step": 1215, + "valid_targets_mean": 14667.0, + "valid_targets_min": 498 + }, + { + "epoch": 0.3255938083800374, + "grad_norm": 0.5157810714523037, + "learning_rate": 0.00014821715574345277, + "loss": 0.6091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6138304471969604, + "step": 1220, + "valid_targets_mean": 16354.4, + "valid_targets_min": 517 + }, + { + "epoch": 0.3269282092340539, + "grad_norm": 0.6056960255078041, + "learning_rate": 0.0001481790947638288, + "loss": 0.6176, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6478211283683777, + "step": 1225, + "valid_targets_mean": 15326.2, + "valid_targets_min": 697 + }, + { + "epoch": 0.32826261008807045, + "grad_norm": 0.45968806774958004, + "learning_rate": 0.00014814063678332667, + "loss": 0.6144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6101811528205872, + "step": 1230, + "valid_targets_mean": 16237.8, + "valid_targets_min": 276 + }, + { + "epoch": 0.329597010942087, + "grad_norm": 0.466696207487788, + "learning_rate": 0.00014810178201058323, + "loss": 0.6105, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6029187440872192, + "step": 1235, + "valid_targets_mean": 15636.9, + "valid_targets_min": 784 + }, + { + "epoch": 0.3309314117961035, + "grad_norm": 0.4547794279301651, + "learning_rate": 0.00014806253065638786, + "loss": 0.6111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5900842547416687, + "step": 1240, + "valid_targets_mean": 17622.9, + "valid_targets_min": 432 + }, + { + "epoch": 0.3322658126501201, + "grad_norm": 0.5035430798808832, + "learning_rate": 0.00014802288293368148, + "loss": 0.6128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6072174310684204, + "step": 1245, + "valid_targets_mean": 16158.9, + "valid_targets_min": 641 + }, + { + "epoch": 0.33360021350413666, + "grad_norm": 0.5291824098972122, + "learning_rate": 0.0001479828390575553, + "loss": 0.6247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6279348134994507, + "step": 1250, + "valid_targets_mean": 15845.8, + "valid_targets_min": 636 + }, + { + "epoch": 0.3349346143581532, + "grad_norm": 0.4913251882169057, + "learning_rate": 0.00014794239924524968, + "loss": 0.6225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6031299233436584, + "step": 1255, + "valid_targets_mean": 16978.3, + "valid_targets_min": 469 + }, + { + "epoch": 0.33626901521216973, + "grad_norm": 0.49690910233477986, + "learning_rate": 0.00014790156371615303, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6335940361022949, + "step": 1260, + "valid_targets_mean": 16518.6, + "valid_targets_min": 293 + }, + { + "epoch": 0.33760341606618627, + "grad_norm": 0.5468966794986143, + "learning_rate": 0.00014786033269180044, + "loss": 0.6068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6059638261795044, + "step": 1265, + "valid_targets_mean": 16844.9, + "valid_targets_min": 324 + }, + { + "epoch": 0.3389378169202028, + "grad_norm": 0.4983062105935614, + "learning_rate": 0.00014781870639587262, + "loss": 0.6282, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6372385025024414, + "step": 1270, + "valid_targets_mean": 15898.1, + "valid_targets_min": 319 + }, + { + "epoch": 0.3402722177742194, + "grad_norm": 0.3892479665426188, + "learning_rate": 0.0001477766850541947, + "loss": 0.6341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6155767440795898, + "step": 1275, + "valid_targets_mean": 17163.2, + "valid_targets_min": 456 + }, + { + "epoch": 0.34160661862823594, + "grad_norm": 0.652787264480223, + "learning_rate": 0.00014773426889473493, + "loss": 0.629, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.622187077999115, + "step": 1280, + "valid_targets_mean": 15787.9, + "valid_targets_min": 356 + }, + { + "epoch": 0.3429410194822525, + "grad_norm": 0.5070064814221472, + "learning_rate": 0.0001476914581476034, + "loss": 0.6411, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6333944797515869, + "step": 1285, + "valid_targets_mean": 16448.7, + "valid_targets_min": 543 + }, + { + "epoch": 0.344275420336269, + "grad_norm": 0.48844856808258474, + "learning_rate": 0.000147648253045051, + "loss": 0.616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5810629725456238, + "step": 1290, + "valid_targets_mean": 16389.3, + "valid_targets_min": 801 + }, + { + "epoch": 0.34560982119028555, + "grad_norm": 0.41518816293543753, + "learning_rate": 0.0001476046538214679, + "loss": 0.6124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6386691331863403, + "step": 1295, + "valid_targets_mean": 14671.7, + "valid_targets_min": 156 + }, + { + "epoch": 0.3469442220443021, + "grad_norm": 0.47948509536370426, + "learning_rate": 0.00014756066071338247, + "loss": 0.6378, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6576275825500488, + "step": 1300, + "valid_targets_mean": 15235.0, + "valid_targets_min": 711 + }, + { + "epoch": 0.3482786228983187, + "grad_norm": 0.4595820910884694, + "learning_rate": 0.00014751627395945984, + "loss": 0.6217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6192502379417419, + "step": 1305, + "valid_targets_mean": 16238.1, + "valid_targets_min": 333 + }, + { + "epoch": 0.3496130237523352, + "grad_norm": 0.4291054247965342, + "learning_rate": 0.0001474714938005008, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6437174081802368, + "step": 1310, + "valid_targets_mean": 15684.9, + "valid_targets_min": 607 + }, + { + "epoch": 0.35094742460635175, + "grad_norm": 0.39671682397098906, + "learning_rate": 0.00014742632047944033, + "loss": 0.637, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6374814510345459, + "step": 1315, + "valid_targets_mean": 15847.1, + "valid_targets_min": 709 + }, + { + "epoch": 0.3522818254603683, + "grad_norm": 0.47859741034274256, + "learning_rate": 0.00014738075424134634, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6308225989341736, + "step": 1320, + "valid_targets_mean": 15888.9, + "valid_targets_min": 708 + }, + { + "epoch": 0.35361622631438483, + "grad_norm": 0.6507671044429603, + "learning_rate": 0.00014733479533341837, + "loss": 0.6195, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6275373697280884, + "step": 1325, + "valid_targets_mean": 15963.1, + "valid_targets_min": 376 + }, + { + "epoch": 0.35495062716840137, + "grad_norm": 0.6399738378817154, + "learning_rate": 0.00014728844400498616, + "loss": 0.6254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6041469573974609, + "step": 1330, + "valid_targets_mean": 17098.5, + "valid_targets_min": 772 + }, + { + "epoch": 0.35628502802241796, + "grad_norm": 0.4984880266031328, + "learning_rate": 0.00014724170050750836, + "loss": 0.6215, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6045820713043213, + "step": 1335, + "valid_targets_mean": 16711.2, + "valid_targets_min": 481 + }, + { + "epoch": 0.3576194288764345, + "grad_norm": 0.5423169689023574, + "learning_rate": 0.00014719456509457122, + "loss": 0.6297, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6203999519348145, + "step": 1340, + "valid_targets_mean": 15233.5, + "valid_targets_min": 569 + }, + { + "epoch": 0.35895382973045104, + "grad_norm": 0.4838132943128504, + "learning_rate": 0.00014714703802188713, + "loss": 0.6265, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6400591135025024, + "step": 1345, + "valid_targets_mean": 16153.9, + "valid_targets_min": 654 + }, + { + "epoch": 0.3602882305844676, + "grad_norm": 0.413527598858469, + "learning_rate": 0.0001470991195472932, + "loss": 0.6318, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5825143456459045, + "step": 1350, + "valid_targets_mean": 17444.9, + "valid_targets_min": 268 + }, + { + "epoch": 0.3616226314384841, + "grad_norm": 0.49583200763125385, + "learning_rate": 0.00014705080993075, + "loss": 0.6186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6185584664344788, + "step": 1355, + "valid_targets_mean": 16056.9, + "valid_targets_min": 606 + }, + { + "epoch": 0.36295703229250065, + "grad_norm": 0.4207625378865751, + "learning_rate": 0.00014700210943433998, + "loss": 0.6284, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6178081035614014, + "step": 1360, + "valid_targets_mean": 16616.0, + "valid_targets_min": 445 + }, + { + "epoch": 0.36429143314651724, + "grad_norm": 0.47838668743172985, + "learning_rate": 0.00014695301832226627, + "loss": 0.6353, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6175183057785034, + "step": 1365, + "valid_targets_mean": 15540.1, + "valid_targets_min": 386 + }, + { + "epoch": 0.3656258340005338, + "grad_norm": 0.44229725453471697, + "learning_rate": 0.00014690353686085098, + "loss": 0.6165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6205130815505981, + "step": 1370, + "valid_targets_mean": 15817.3, + "valid_targets_min": 201 + }, + { + "epoch": 0.3669602348545503, + "grad_norm": 0.46623196564659064, + "learning_rate": 0.00014685366531853395, + "loss": 0.6232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6131946444511414, + "step": 1375, + "valid_targets_mean": 15407.4, + "valid_targets_min": 681 + }, + { + "epoch": 0.36829463570856685, + "grad_norm": 0.44006049355952626, + "learning_rate": 0.00014680340396587118, + "loss": 0.6233, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6441381573677063, + "step": 1380, + "valid_targets_mean": 15845.8, + "valid_targets_min": 571 + }, + { + "epoch": 0.3696290365625834, + "grad_norm": 0.6111464695074394, + "learning_rate": 0.0001467527530755335, + "loss": 0.6084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6167534589767456, + "step": 1385, + "valid_targets_mean": 16684.4, + "valid_targets_min": 366 + }, + { + "epoch": 0.37096343741659993, + "grad_norm": 0.8324813489326134, + "learning_rate": 0.000146701712922305, + "loss": 0.6202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.612213671207428, + "step": 1390, + "valid_targets_mean": 16478.6, + "valid_targets_min": 720 + }, + { + "epoch": 0.37229783827061647, + "grad_norm": 0.670291546771116, + "learning_rate": 0.00014665028378308138, + "loss": 0.6251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6236619353294373, + "step": 1395, + "valid_targets_mean": 15837.5, + "valid_targets_min": 594 + }, + { + "epoch": 0.37363223912463306, + "grad_norm": 0.8512140790165293, + "learning_rate": 0.00014659846593686885, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6356359124183655, + "step": 1400, + "valid_targets_mean": 15852.3, + "valid_targets_min": 474 + }, + { + "epoch": 0.3749666399786496, + "grad_norm": 0.5723739765713398, + "learning_rate": 0.0001465462596647822, + "loss": 0.6298, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6180834770202637, + "step": 1405, + "valid_targets_mean": 15452.5, + "valid_targets_min": 789 + }, + { + "epoch": 0.37630104083266613, + "grad_norm": 0.6075008541552803, + "learning_rate": 0.0001464936652500435, + "loss": 0.6008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6029921770095825, + "step": 1410, + "valid_targets_mean": 16629.1, + "valid_targets_min": 662 + }, + { + "epoch": 0.37763544168668267, + "grad_norm": 0.4676746690221598, + "learning_rate": 0.0001464406829779806, + "loss": 0.6157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6156923770904541, + "step": 1415, + "valid_targets_mean": 15352.8, + "valid_targets_min": 708 + }, + { + "epoch": 0.3789698425406992, + "grad_norm": 0.5817747303529482, + "learning_rate": 0.0001463873131360254, + "loss": 0.6106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6119555234909058, + "step": 1420, + "valid_targets_mean": 16914.2, + "valid_targets_min": 664 + }, + { + "epoch": 0.38030424339471575, + "grad_norm": 0.432992609011377, + "learning_rate": 0.0001463335560137124, + "loss": 0.6156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6189119815826416, + "step": 1425, + "valid_targets_mean": 16088.6, + "valid_targets_min": 429 + }, + { + "epoch": 0.38163864424873234, + "grad_norm": 0.40579421448961717, + "learning_rate": 0.00014627941190267717, + "loss": 0.6152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6119743585586548, + "step": 1430, + "valid_targets_mean": 16528.0, + "valid_targets_min": 748 + }, + { + "epoch": 0.3829730451027489, + "grad_norm": 0.6198382928720174, + "learning_rate": 0.00014622488109665468, + "loss": 0.6285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6378297805786133, + "step": 1435, + "valid_targets_mean": 16510.3, + "valid_targets_min": 563 + }, + { + "epoch": 0.3843074459567654, + "grad_norm": 0.5220468831850059, + "learning_rate": 0.0001461699638914777, + "loss": 0.6203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6250759363174438, + "step": 1440, + "valid_targets_mean": 15598.2, + "valid_targets_min": 533 + }, + { + "epoch": 0.38564184681078195, + "grad_norm": 0.5528435347529946, + "learning_rate": 0.00014611466058507536, + "loss": 0.616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6076961755752563, + "step": 1445, + "valid_targets_mean": 15165.0, + "valid_targets_min": 472 + }, + { + "epoch": 0.3869762476647985, + "grad_norm": 0.4755246533026965, + "learning_rate": 0.00014605897147747132, + "loss": 0.6251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6179888248443604, + "step": 1450, + "valid_targets_mean": 15599.8, + "valid_targets_min": 707 + }, + { + "epoch": 0.388310648518815, + "grad_norm": 0.4844726542546722, + "learning_rate": 0.0001460028968707822, + "loss": 0.6302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6419791579246521, + "step": 1455, + "valid_targets_mean": 14379.4, + "valid_targets_min": 522 + }, + { + "epoch": 0.3896450493728316, + "grad_norm": 0.48494595176664035, + "learning_rate": 0.0001459464370692161, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6191474795341492, + "step": 1460, + "valid_targets_mean": 16336.0, + "valid_targets_min": 494 + }, + { + "epoch": 0.39097945022684816, + "grad_norm": 0.6255867368178756, + "learning_rate": 0.0001458895923790707, + "loss": 0.6212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6456395387649536, + "step": 1465, + "valid_targets_mean": 15574.0, + "valid_targets_min": 524 + }, + { + "epoch": 0.3923138510808647, + "grad_norm": 0.4644640635135548, + "learning_rate": 0.0001458323631087318, + "loss": 0.6206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6031760573387146, + "step": 1470, + "valid_targets_mean": 16420.4, + "valid_targets_min": 505 + }, + { + "epoch": 0.39364825193488123, + "grad_norm": 0.387187368792563, + "learning_rate": 0.00014577474956867155, + "loss": 0.6028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6073260307312012, + "step": 1475, + "valid_targets_mean": 15389.3, + "valid_targets_min": 496 + }, + { + "epoch": 0.39498265278889777, + "grad_norm": 0.57060581290841, + "learning_rate": 0.00014571675207144676, + "loss": 0.6285, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6272798776626587, + "step": 1480, + "valid_targets_mean": 14589.4, + "valid_targets_min": 680 + }, + { + "epoch": 0.3963170536429143, + "grad_norm": 0.5222086273973913, + "learning_rate": 0.00014565837093169728, + "loss": 0.6326, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.619460940361023, + "step": 1485, + "valid_targets_mean": 16074.4, + "valid_targets_min": 494 + }, + { + "epoch": 0.3976514544969309, + "grad_norm": 0.43806267201083776, + "learning_rate": 0.00014559960646614418, + "loss": 0.6314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6153547763824463, + "step": 1490, + "valid_targets_mean": 15761.4, + "valid_targets_min": 649 + }, + { + "epoch": 0.39898585535094744, + "grad_norm": 0.4311441690905246, + "learning_rate": 0.00014554045899358814, + "loss": 0.6203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6338887214660645, + "step": 1495, + "valid_targets_mean": 16588.6, + "valid_targets_min": 700 + }, + { + "epoch": 0.400320256204964, + "grad_norm": 0.39354710766071277, + "learning_rate": 0.00014548092883490772, + "loss": 0.6219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6525273323059082, + "step": 1500, + "valid_targets_mean": 16091.5, + "valid_targets_min": 356 + }, + { + "epoch": 0.4016546570589805, + "grad_norm": 0.3264072177146715, + "learning_rate": 0.00014542101631305745, + "loss": 0.6341, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6408512592315674, + "step": 1505, + "valid_targets_mean": 15003.0, + "valid_targets_min": 524 + }, + { + "epoch": 0.40298905791299705, + "grad_norm": 0.42613217106930396, + "learning_rate": 0.00014536072175306628, + "loss": 0.616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6036968231201172, + "step": 1510, + "valid_targets_mean": 15678.4, + "valid_targets_min": 325 + }, + { + "epoch": 0.4043234587670136, + "grad_norm": 0.5010042319742402, + "learning_rate": 0.00014530004548203573, + "loss": 0.6096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6010334491729736, + "step": 1515, + "valid_targets_mean": 15991.1, + "valid_targets_min": 491 + }, + { + "epoch": 0.4056578596210302, + "grad_norm": 0.46145582386046646, + "learning_rate": 0.00014523898782913818, + "loss": 0.6363, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5833079218864441, + "step": 1520, + "valid_targets_mean": 17355.7, + "valid_targets_min": 257 + }, + { + "epoch": 0.4069922604750467, + "grad_norm": 0.4769221033091848, + "learning_rate": 0.00014517754912561496, + "loss": 0.6225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6384181976318359, + "step": 1525, + "valid_targets_mean": 16321.8, + "valid_targets_min": 399 + }, + { + "epoch": 0.40832666132906326, + "grad_norm": 0.40610205983033637, + "learning_rate": 0.00014511572970477457, + "loss": 0.6092, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5959339737892151, + "step": 1530, + "valid_targets_mean": 16648.0, + "valid_targets_min": 488 + }, + { + "epoch": 0.4096610621830798, + "grad_norm": 0.6294123329894471, + "learning_rate": 0.00014505352990199107, + "loss": 0.6212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.617108941078186, + "step": 1535, + "valid_targets_mean": 16604.0, + "valid_targets_min": 566 + }, + { + "epoch": 0.41099546303709633, + "grad_norm": 0.6048603260456543, + "learning_rate": 0.000144990950054702, + "loss": 0.6203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6036360263824463, + "step": 1540, + "valid_targets_mean": 15739.4, + "valid_targets_min": 383 + }, + { + "epoch": 0.41232986389111287, + "grad_norm": 0.5753985039391059, + "learning_rate": 0.0001449279905024067, + "loss": 0.6229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.624218225479126, + "step": 1545, + "valid_targets_mean": 17004.7, + "valid_targets_min": 430 + }, + { + "epoch": 0.41366426474512946, + "grad_norm": 0.4074871541259797, + "learning_rate": 0.00014486465158666443, + "loss": 0.622, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6364642977714539, + "step": 1550, + "valid_targets_mean": 15261.5, + "valid_targets_min": 461 + }, + { + "epoch": 0.414998665599146, + "grad_norm": 0.7777037216192905, + "learning_rate": 0.00014480093365109252, + "loss": 0.6375, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.625815212726593, + "step": 1555, + "valid_targets_mean": 16165.8, + "valid_targets_min": 86 + }, + { + "epoch": 0.41633306645316254, + "grad_norm": 0.813927001051695, + "learning_rate": 0.00014473683704136454, + "loss": 0.6183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.613219141960144, + "step": 1560, + "valid_targets_mean": 15473.5, + "valid_targets_min": 520 + }, + { + "epoch": 0.4176674673071791, + "grad_norm": 0.624851558395919, + "learning_rate": 0.0001446723621052083, + "loss": 0.6182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6244171857833862, + "step": 1565, + "valid_targets_mean": 15542.5, + "valid_targets_min": 796 + }, + { + "epoch": 0.4190018681611956, + "grad_norm": 0.7299434520023005, + "learning_rate": 0.00014460750919240416, + "loss": 0.6069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.597712516784668, + "step": 1570, + "valid_targets_mean": 16187.9, + "valid_targets_min": 126 + }, + { + "epoch": 0.42033626901521215, + "grad_norm": 0.7996751395350323, + "learning_rate": 0.00014454227865478292, + "loss": 0.6221, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6417670249938965, + "step": 1575, + "valid_targets_mean": 15753.5, + "valid_targets_min": 593 + }, + { + "epoch": 0.42167066986922874, + "grad_norm": 0.7643157528008785, + "learning_rate": 0.0001444766708462241, + "loss": 0.636, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.638425350189209, + "step": 1580, + "valid_targets_mean": 15052.7, + "valid_targets_min": 315 + }, + { + "epoch": 0.4230050707232453, + "grad_norm": 1.6220602331806422, + "learning_rate": 0.0001444106861226539, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6398119926452637, + "step": 1585, + "valid_targets_mean": 16265.2, + "valid_targets_min": 581 + }, + { + "epoch": 0.4243394715772618, + "grad_norm": 0.8975330770047389, + "learning_rate": 0.00014434432484204335, + "loss": 0.6263, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6489125490188599, + "step": 1590, + "valid_targets_mean": 15977.6, + "valid_targets_min": 679 + }, + { + "epoch": 0.42567387243127836, + "grad_norm": 0.6599629728623814, + "learning_rate": 0.0001442775873644062, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6266319155693054, + "step": 1595, + "valid_targets_mean": 16949.8, + "valid_targets_min": 289 + }, + { + "epoch": 0.4270082732852949, + "grad_norm": 1.0255720761078193, + "learning_rate": 0.00014421047405179725, + "loss": 0.6314, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.655253529548645, + "step": 1600, + "valid_targets_mean": 16475.8, + "valid_targets_min": 122 + }, + { + "epoch": 0.42834267413931143, + "grad_norm": 0.5940148209535145, + "learning_rate": 0.00014414298526831012, + "loss": 0.6274, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.604961097240448, + "step": 1605, + "valid_targets_mean": 16166.2, + "valid_targets_min": 519 + }, + { + "epoch": 0.429677074993328, + "grad_norm": 0.6891749029440575, + "learning_rate": 0.00014407512138007547, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6220706701278687, + "step": 1610, + "valid_targets_mean": 15656.4, + "valid_targets_min": 479 + }, + { + "epoch": 0.43101147584734456, + "grad_norm": 0.4005516569017509, + "learning_rate": 0.0001440068827552588, + "loss": 0.6082, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.625106692314148, + "step": 1615, + "valid_targets_mean": 15519.3, + "valid_targets_min": 486 + }, + { + "epoch": 0.4323458767013611, + "grad_norm": 0.5272590178673885, + "learning_rate": 0.0001439382697640587, + "loss": 0.6416, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6334394216537476, + "step": 1620, + "valid_targets_mean": 15268.3, + "valid_targets_min": 726 + }, + { + "epoch": 0.43368027755537764, + "grad_norm": 0.3943863363540411, + "learning_rate": 0.00014386928277870461, + "loss": 0.6022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6156237721443176, + "step": 1625, + "valid_targets_mean": 16021.8, + "valid_targets_min": 636 + }, + { + "epoch": 0.4350146784093942, + "grad_norm": 0.44002913415369016, + "learning_rate": 0.00014379992217345504, + "loss": 0.6372, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6078697443008423, + "step": 1630, + "valid_targets_mean": 15966.3, + "valid_targets_min": 620 + }, + { + "epoch": 0.4363490792634107, + "grad_norm": 0.5474567909345269, + "learning_rate": 0.0001437301883245953, + "loss": 0.6217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5955013036727905, + "step": 1635, + "valid_targets_mean": 16371.5, + "valid_targets_min": 74 + }, + { + "epoch": 0.43768348011742725, + "grad_norm": 0.37821018625798675, + "learning_rate": 0.0001436600816104356, + "loss": 0.6169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6408905982971191, + "step": 1640, + "valid_targets_mean": 16821.0, + "valid_targets_min": 802 + }, + { + "epoch": 0.43901788097144384, + "grad_norm": 0.633186477597186, + "learning_rate": 0.000143589602411309, + "loss": 0.6192, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234664916992188, + "step": 1645, + "valid_targets_mean": 15221.4, + "valid_targets_min": 500 + }, + { + "epoch": 0.4403522818254604, + "grad_norm": 0.6339409024098717, + "learning_rate": 0.00014351875110956927, + "loss": 0.6159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6487512588500977, + "step": 1650, + "valid_targets_mean": 15942.3, + "valid_targets_min": 385 + }, + { + "epoch": 0.4416866826794769, + "grad_norm": 0.3375878572865069, + "learning_rate": 0.00014344752808958887, + "loss": 0.6345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6520563960075378, + "step": 1655, + "valid_targets_mean": 16000.6, + "valid_targets_min": 719 + }, + { + "epoch": 0.44302108353349345, + "grad_norm": 0.38773310648770776, + "learning_rate": 0.0001433759337377569, + "loss": 0.6159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6261415481567383, + "step": 1660, + "valid_targets_mean": 15071.0, + "valid_targets_min": 435 + }, + { + "epoch": 0.44435548438751, + "grad_norm": 0.38867253963185605, + "learning_rate": 0.00014330396844247685, + "loss": 0.6133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5830848217010498, + "step": 1665, + "valid_targets_mean": 17879.8, + "valid_targets_min": 419 + }, + { + "epoch": 0.44568988524152653, + "grad_norm": 1.5177148462768428, + "learning_rate": 0.0001432316325941647, + "loss": 0.6224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6349464058876038, + "step": 1670, + "valid_targets_mean": 15402.8, + "valid_targets_min": 518 + }, + { + "epoch": 0.4470242860955431, + "grad_norm": 0.4944692858526399, + "learning_rate": 0.00014315892658524665, + "loss": 0.6286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6335951685905457, + "step": 1675, + "valid_targets_mean": 15292.9, + "valid_targets_min": 143 + }, + { + "epoch": 0.44835868694955966, + "grad_norm": 0.49903902666348443, + "learning_rate": 0.0001430858508101571, + "loss": 0.6024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6011691689491272, + "step": 1680, + "valid_targets_mean": 16015.8, + "valid_targets_min": 486 + }, + { + "epoch": 0.4496930878035762, + "grad_norm": 0.5951332149681916, + "learning_rate": 0.00014301240566533637, + "loss": 0.6395, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6320478916168213, + "step": 1685, + "valid_targets_mean": 16208.7, + "valid_targets_min": 594 + }, + { + "epoch": 0.45102748865759273, + "grad_norm": 0.4581806243474604, + "learning_rate": 0.00014293859154922866, + "loss": 0.6121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6136428117752075, + "step": 1690, + "valid_targets_mean": 15048.1, + "valid_targets_min": 339 + }, + { + "epoch": 0.45236188951160927, + "grad_norm": 0.5610547921187975, + "learning_rate": 0.00014286440886227995, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6516221761703491, + "step": 1695, + "valid_targets_mean": 15288.6, + "valid_targets_min": 393 + }, + { + "epoch": 0.4536962903656258, + "grad_norm": 0.4888275216939204, + "learning_rate": 0.00014278985800693562, + "loss": 0.6394, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6383839845657349, + "step": 1700, + "valid_targets_mean": 16269.8, + "valid_targets_min": 699 + }, + { + "epoch": 0.4550306912196424, + "grad_norm": 0.3750982099561412, + "learning_rate": 0.0001427149393876384, + "loss": 0.6132, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5994255542755127, + "step": 1705, + "valid_targets_mean": 15503.7, + "valid_targets_min": 469 + }, + { + "epoch": 0.45636509207365894, + "grad_norm": 0.5220259390241854, + "learning_rate": 0.00014263965341082622, + "loss": 0.6216, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6135061383247375, + "step": 1710, + "valid_targets_mean": 16014.8, + "valid_targets_min": 777 + }, + { + "epoch": 0.4576994929276755, + "grad_norm": 0.44611862398704427, + "learning_rate": 0.00014256400048492994, + "loss": 0.6389, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6459407806396484, + "step": 1715, + "valid_targets_mean": 16696.7, + "valid_targets_min": 428 + }, + { + "epoch": 0.459033893781692, + "grad_norm": 0.7215196076760709, + "learning_rate": 0.00014248798102037106, + "loss": 0.6025, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5831271409988403, + "step": 1720, + "valid_targets_mean": 16603.4, + "valid_targets_min": 510 + }, + { + "epoch": 0.46036829463570855, + "grad_norm": 0.68883263340678, + "learning_rate": 0.0001424115954295597, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6232255101203918, + "step": 1725, + "valid_targets_mean": 15403.0, + "valid_targets_min": 550 + }, + { + "epoch": 0.4617026954897251, + "grad_norm": 0.6747839578442204, + "learning_rate": 0.00014233484412689212, + "loss": 0.6234, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6511488556861877, + "step": 1730, + "valid_targets_mean": 14797.5, + "valid_targets_min": 516 + }, + { + "epoch": 0.4630370963437417, + "grad_norm": 0.6377290200940263, + "learning_rate": 0.00014225772752874866, + "loss": 0.6114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5981515645980835, + "step": 1735, + "valid_targets_mean": 16110.6, + "valid_targets_min": 524 + }, + { + "epoch": 0.4643714971977582, + "grad_norm": 0.5027780947825067, + "learning_rate": 0.00014218024605349133, + "loss": 0.6043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6172059774398804, + "step": 1740, + "valid_targets_mean": 16348.3, + "valid_targets_min": 350 + }, + { + "epoch": 0.46570589805177476, + "grad_norm": 0.40475216068056086, + "learning_rate": 0.00014210240012146178, + "loss": 0.6141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6198212504386902, + "step": 1745, + "valid_targets_mean": 16360.2, + "valid_targets_min": 11 + }, + { + "epoch": 0.4670402989057913, + "grad_norm": 0.36279653577965554, + "learning_rate": 0.00014202419015497863, + "loss": 0.6251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5892041921615601, + "step": 1750, + "valid_targets_mean": 14806.2, + "valid_targets_min": 599 + }, + { + "epoch": 0.46837469975980783, + "grad_norm": 0.5529952048740383, + "learning_rate": 0.00014194561657833563, + "loss": 0.6238, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6133667826652527, + "step": 1755, + "valid_targets_mean": 15809.3, + "valid_targets_min": 682 + }, + { + "epoch": 0.46970910061382437, + "grad_norm": 0.6537360232818689, + "learning_rate": 0.000141866679817799, + "loss": 0.6126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6035851240158081, + "step": 1760, + "valid_targets_mean": 16271.0, + "valid_targets_min": 305 + }, + { + "epoch": 0.47104350146784096, + "grad_norm": 0.5789436462540626, + "learning_rate": 0.00014178738030160527, + "loss": 0.623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6485693454742432, + "step": 1765, + "valid_targets_mean": 15430.4, + "valid_targets_min": 501 + }, + { + "epoch": 0.4723779023218575, + "grad_norm": 0.8720659405356321, + "learning_rate": 0.000141707718459959, + "loss": 0.6191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6286308765411377, + "step": 1770, + "valid_targets_mean": 16587.6, + "valid_targets_min": 643 + }, + { + "epoch": 0.47371230317587404, + "grad_norm": 0.7511852245287411, + "learning_rate": 0.00014162769472503032, + "loss": 0.6017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5902373790740967, + "step": 1775, + "valid_targets_mean": 16709.7, + "valid_targets_min": 474 + }, + { + "epoch": 0.4750467040298906, + "grad_norm": 0.8184258903731754, + "learning_rate": 0.00014154730953095274, + "loss": 0.6015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5919774174690247, + "step": 1780, + "valid_targets_mean": 16877.2, + "valid_targets_min": 455 + }, + { + "epoch": 0.4763811048839071, + "grad_norm": 0.773629076068772, + "learning_rate": 0.0001414665633138206, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6243022680282593, + "step": 1785, + "valid_targets_mean": 16179.8, + "valid_targets_min": 540 + }, + { + "epoch": 0.47771550573792365, + "grad_norm": 0.8716843697927165, + "learning_rate": 0.00014138545651168683, + "loss": 0.6299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6102423667907715, + "step": 1790, + "valid_targets_mean": 16395.6, + "valid_targets_min": 20 + }, + { + "epoch": 0.47904990659194024, + "grad_norm": 0.6836681436980766, + "learning_rate": 0.00014130398956456062, + "loss": 0.6121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6184238195419312, + "step": 1795, + "valid_targets_mean": 16681.8, + "valid_targets_min": 618 + }, + { + "epoch": 0.4803843074459568, + "grad_norm": 0.7379214609664572, + "learning_rate": 0.00014122216291440496, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6008614301681519, + "step": 1800, + "valid_targets_mean": 16840.3, + "valid_targets_min": 635 + }, + { + "epoch": 0.4817187082999733, + "grad_norm": 0.6448470422300319, + "learning_rate": 0.00014113997700513422, + "loss": 0.6247, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6125494241714478, + "step": 1805, + "valid_targets_mean": 16632.3, + "valid_targets_min": 394 + }, + { + "epoch": 0.48305310915398986, + "grad_norm": 0.7507255061402137, + "learning_rate": 0.00014105743228261174, + "loss": 0.5971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5912197232246399, + "step": 1810, + "valid_targets_mean": 15968.4, + "valid_targets_min": 14 + }, + { + "epoch": 0.4843875100080064, + "grad_norm": 0.6923025633359248, + "learning_rate": 0.00014097452919464748, + "loss": 0.6275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6405831575393677, + "step": 1815, + "valid_targets_mean": 15824.7, + "valid_targets_min": 791 + }, + { + "epoch": 0.48572191086202293, + "grad_norm": 0.7189502878051086, + "learning_rate": 0.00014089126819099557, + "loss": 0.6076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5731747150421143, + "step": 1820, + "valid_targets_mean": 15942.4, + "valid_targets_min": 76 + }, + { + "epoch": 0.4870563117160395, + "grad_norm": 0.6224947383076709, + "learning_rate": 0.00014080764972335184, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6464651823043823, + "step": 1825, + "valid_targets_mean": 16088.4, + "valid_targets_min": 302 + }, + { + "epoch": 0.48839071257005606, + "grad_norm": 0.7083902377315511, + "learning_rate": 0.00014072367424535135, + "loss": 0.6162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6100757122039795, + "step": 1830, + "valid_targets_mean": 14989.7, + "valid_targets_min": 707 + }, + { + "epoch": 0.4897251134240726, + "grad_norm": 0.56069038755494, + "learning_rate": 0.000140639342212566, + "loss": 0.6172, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5954641699790955, + "step": 1835, + "valid_targets_mean": 17395.5, + "valid_targets_min": 581 + }, + { + "epoch": 0.49105951427808914, + "grad_norm": 0.7780348082684239, + "learning_rate": 0.000140554654082502, + "loss": 0.6136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6116977334022522, + "step": 1840, + "valid_targets_mean": 16951.9, + "valid_targets_min": 791 + }, + { + "epoch": 0.4923939151321057, + "grad_norm": 0.5613734141188126, + "learning_rate": 0.0001404696103145975, + "loss": 0.6327, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6341204047203064, + "step": 1845, + "valid_targets_mean": 15912.0, + "valid_targets_min": 424 + }, + { + "epoch": 0.4937283159861222, + "grad_norm": 0.5646169834365188, + "learning_rate": 0.0001403842113702198, + "loss": 0.6096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6076234579086304, + "step": 1850, + "valid_targets_mean": 16483.9, + "valid_targets_min": 410 + }, + { + "epoch": 0.49506271684013875, + "grad_norm": 0.42454431593189007, + "learning_rate": 0.00014029845771266325, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5989246368408203, + "step": 1855, + "valid_targets_mean": 15265.2, + "valid_targets_min": 701 + }, + { + "epoch": 0.49639711769415534, + "grad_norm": 0.42970395034884246, + "learning_rate": 0.00014021234980714648, + "loss": 0.6311, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6091680526733398, + "step": 1860, + "valid_targets_mean": 15967.2, + "valid_targets_min": 740 + }, + { + "epoch": 0.4977315185481719, + "grad_norm": 0.467813457018178, + "learning_rate": 0.00014012588812080992, + "loss": 0.6301, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6140797138214111, + "step": 1865, + "valid_targets_mean": 16113.7, + "valid_targets_min": 258 + }, + { + "epoch": 0.4990659194021884, + "grad_norm": 0.4443571651380167, + "learning_rate": 0.00014003907312271319, + "loss": 0.6167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6168869137763977, + "step": 1870, + "valid_targets_mean": 16914.2, + "valid_targets_min": 670 + }, + { + "epoch": 0.500400320256205, + "grad_norm": 0.3688517851382228, + "learning_rate": 0.0001399519052838329, + "loss": 0.6169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6044825315475464, + "step": 1875, + "valid_targets_mean": 16600.2, + "valid_targets_min": 515 + }, + { + "epoch": 0.5017347211102215, + "grad_norm": 0.4272311555518661, + "learning_rate": 0.00013986438507705958, + "loss": 0.6232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6084432005882263, + "step": 1880, + "valid_targets_mean": 15952.6, + "valid_targets_min": 693 + }, + { + "epoch": 0.503069121964238, + "grad_norm": 0.4084671985107604, + "learning_rate": 0.00013977651297719548, + "loss": 0.6223, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6196306347846985, + "step": 1885, + "valid_targets_mean": 16205.8, + "valid_targets_min": 462 + }, + { + "epoch": 0.5044035228182546, + "grad_norm": 0.47467835510882866, + "learning_rate": 0.00013968828946095193, + "loss": 0.6094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6280183792114258, + "step": 1890, + "valid_targets_mean": 15579.6, + "valid_targets_min": 443 + }, + { + "epoch": 0.5057379236722711, + "grad_norm": 0.3734668638187962, + "learning_rate": 0.00013959971500694668, + "loss": 0.6166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5934363603591919, + "step": 1895, + "valid_targets_mean": 15840.3, + "valid_targets_min": 16 + }, + { + "epoch": 0.5070723245262877, + "grad_norm": 0.3692138856481344, + "learning_rate": 0.00013951079009570132, + "loss": 0.6212, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6200092434883118, + "step": 1900, + "valid_targets_mean": 16037.6, + "valid_targets_min": 758 + }, + { + "epoch": 0.5084067253803043, + "grad_norm": 0.3823174475553723, + "learning_rate": 0.00013942151520963868, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6433672904968262, + "step": 1905, + "valid_targets_mean": 16325.7, + "valid_targets_min": 727 + }, + { + "epoch": 0.5097411262343208, + "grad_norm": 0.3497586948857913, + "learning_rate": 0.00013933189083308031, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6540859937667847, + "step": 1910, + "valid_targets_mean": 17292.9, + "valid_targets_min": 285 + }, + { + "epoch": 0.5110755270883374, + "grad_norm": 0.4591645468700426, + "learning_rate": 0.00013924191745224364, + "loss": 0.612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6253089904785156, + "step": 1915, + "valid_targets_mean": 15474.2, + "valid_targets_min": 430 + }, + { + "epoch": 0.5124099279423538, + "grad_norm": 0.31031712977802206, + "learning_rate": 0.00013915159555523957, + "loss": 0.6345, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5882706642150879, + "step": 1920, + "valid_targets_mean": 16923.8, + "valid_targets_min": 715 + }, + { + "epoch": 0.5137443287963704, + "grad_norm": 0.4022558108020764, + "learning_rate": 0.00013906092563206968, + "loss": 0.6057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6023075580596924, + "step": 1925, + "valid_targets_mean": 15661.2, + "valid_targets_min": 502 + }, + { + "epoch": 0.5150787296503869, + "grad_norm": 0.4368678641461343, + "learning_rate": 0.00013896990817462363, + "loss": 0.6312, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6641368865966797, + "step": 1930, + "valid_targets_mean": 16154.9, + "valid_targets_min": 651 + }, + { + "epoch": 0.5164131305044035, + "grad_norm": 0.6467331098405801, + "learning_rate": 0.00013887854367667645, + "loss": 0.6222, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6303449273109436, + "step": 1935, + "valid_targets_mean": 16546.6, + "valid_targets_min": 902 + }, + { + "epoch": 0.5177475313584201, + "grad_norm": 0.5977986197066303, + "learning_rate": 0.00013878683263388587, + "loss": 0.6267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6208200454711914, + "step": 1940, + "valid_targets_mean": 14945.0, + "valid_targets_min": 254 + }, + { + "epoch": 0.5190819322124366, + "grad_norm": 0.5304666492399011, + "learning_rate": 0.00013869477554378972, + "loss": 0.6228, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6293059587478638, + "step": 1945, + "valid_targets_mean": 14679.3, + "valid_targets_min": 105 + }, + { + "epoch": 0.5204163330664532, + "grad_norm": 0.5484478107642148, + "learning_rate": 0.00013860237290580306, + "loss": 0.6051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5901466012001038, + "step": 1950, + "valid_targets_mean": 16352.2, + "valid_targets_min": 468 + }, + { + "epoch": 0.5217507339204697, + "grad_norm": 0.4753019705870865, + "learning_rate": 0.00013850962522121569, + "loss": 0.6279, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5876643657684326, + "step": 1955, + "valid_targets_mean": 16744.3, + "valid_targets_min": 527 + }, + { + "epoch": 0.5230851347744863, + "grad_norm": 0.41422385606660383, + "learning_rate": 0.00013841653299318915, + "loss": 0.616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6483991146087646, + "step": 1960, + "valid_targets_mean": 16353.5, + "valid_targets_min": 848 + }, + { + "epoch": 0.5244195356285029, + "grad_norm": 0.36682178106347624, + "learning_rate": 0.00013832309672675428, + "loss": 0.6014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6216505169868469, + "step": 1965, + "valid_targets_mean": 15764.5, + "valid_targets_min": 229 + }, + { + "epoch": 0.5257539364825193, + "grad_norm": 0.46701722935809503, + "learning_rate": 0.00013822931692880828, + "loss": 0.6229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6098369359970093, + "step": 1970, + "valid_targets_mean": 16463.2, + "valid_targets_min": 482 + }, + { + "epoch": 0.5270883373365359, + "grad_norm": 0.4445692469326501, + "learning_rate": 0.00013813519410811208, + "loss": 0.617, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6049668788909912, + "step": 1975, + "valid_targets_mean": 15474.1, + "valid_targets_min": 103 + }, + { + "epoch": 0.5284227381905524, + "grad_norm": 0.5320742477880946, + "learning_rate": 0.00013804072877528746, + "loss": 0.6305, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6137555241584778, + "step": 1980, + "valid_targets_mean": 16337.1, + "valid_targets_min": 363 + }, + { + "epoch": 0.529757139044569, + "grad_norm": 0.34825869011443694, + "learning_rate": 0.0001379459214428144, + "loss": 0.6107, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.595025897026062, + "step": 1985, + "valid_targets_mean": 15993.6, + "valid_targets_min": 757 + }, + { + "epoch": 0.5310915398985855, + "grad_norm": 0.42944867097054756, + "learning_rate": 0.0001378507726250283, + "loss": 0.6194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.606879472732544, + "step": 1990, + "valid_targets_mean": 16933.6, + "valid_targets_min": 739 + }, + { + "epoch": 0.5324259407526021, + "grad_norm": 0.30582752584201905, + "learning_rate": 0.00013775528283811695, + "loss": 0.6142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.582551896572113, + "step": 1995, + "valid_targets_mean": 17717.3, + "valid_targets_min": 558 + }, + { + "epoch": 0.5337603416066187, + "grad_norm": 0.5787030570229632, + "learning_rate": 0.00013765945260011815, + "loss": 0.6181, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6295760273933411, + "step": 2000, + "valid_targets_mean": 15776.8, + "valid_targets_min": 310 + }, + { + "epoch": 0.5350947424606352, + "grad_norm": 0.3901846487164271, + "learning_rate": 0.0001375632824309165, + "loss": 0.6153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5916974544525146, + "step": 2005, + "valid_targets_mean": 17248.5, + "valid_targets_min": 690 + }, + { + "epoch": 0.5364291433146517, + "grad_norm": 0.3384774790194208, + "learning_rate": 0.00013746677285224082, + "loss": 0.6166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6312397718429565, + "step": 2010, + "valid_targets_mean": 15347.2, + "valid_targets_min": 452 + }, + { + "epoch": 0.5377635441686682, + "grad_norm": 0.501250109397787, + "learning_rate": 0.00013736992438766123, + "loss": 0.61, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6018697023391724, + "step": 2015, + "valid_targets_mean": 15687.4, + "valid_targets_min": 24 + }, + { + "epoch": 0.5390979450226848, + "grad_norm": 0.4100739032531526, + "learning_rate": 0.00013727273756258633, + "loss": 0.6096, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6109263300895691, + "step": 2020, + "valid_targets_mean": 16601.7, + "valid_targets_min": 548 + }, + { + "epoch": 0.5404323458767014, + "grad_norm": 0.4246630081006453, + "learning_rate": 0.00013717521290426034, + "loss": 0.6103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6461702585220337, + "step": 2025, + "valid_targets_mean": 17573.6, + "valid_targets_min": 486 + }, + { + "epoch": 0.5417667467307179, + "grad_norm": 0.35833577488702584, + "learning_rate": 0.00013707735094176026, + "loss": 0.6141, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5970995426177979, + "step": 2030, + "valid_targets_mean": 17222.7, + "valid_targets_min": 184 + }, + { + "epoch": 0.5431011475847345, + "grad_norm": 0.4129068769918055, + "learning_rate": 0.00013697915220599294, + "loss": 0.62, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6218748092651367, + "step": 2035, + "valid_targets_mean": 15113.5, + "valid_targets_min": 459 + }, + { + "epoch": 0.544435548438751, + "grad_norm": 0.3387496968435161, + "learning_rate": 0.0001368806172296923, + "loss": 0.6114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.612634539604187, + "step": 2040, + "valid_targets_mean": 17110.6, + "valid_targets_min": 188 + }, + { + "epoch": 0.5457699492927676, + "grad_norm": 0.3745412071832409, + "learning_rate": 0.00013678174654741638, + "loss": 0.599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5897716879844666, + "step": 2045, + "valid_targets_mean": 17232.0, + "valid_targets_min": 521 + }, + { + "epoch": 0.547104350146784, + "grad_norm": 0.38399513390890655, + "learning_rate": 0.00013668254069554439, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6049580574035645, + "step": 2050, + "valid_targets_mean": 15198.6, + "valid_targets_min": 582 + }, + { + "epoch": 0.5484387510008006, + "grad_norm": 0.48936350323324096, + "learning_rate": 0.00013658300021227387, + "loss": 0.6241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6280665397644043, + "step": 2055, + "valid_targets_mean": 16052.8, + "valid_targets_min": 739 + }, + { + "epoch": 0.5497731518548172, + "grad_norm": 0.41651646905962314, + "learning_rate": 0.00013648312563761784, + "loss": 0.5985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6201366186141968, + "step": 2060, + "valid_targets_mean": 15825.8, + "valid_targets_min": 436 + }, + { + "epoch": 0.5511075527088337, + "grad_norm": 0.5106499293556461, + "learning_rate": 0.0001363829175134017, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5888843536376953, + "step": 2065, + "valid_targets_mean": 16064.7, + "valid_targets_min": 253 + }, + { + "epoch": 0.5524419535628503, + "grad_norm": 0.502558200477223, + "learning_rate": 0.00013628237638326038, + "loss": 0.6182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6001168489456177, + "step": 2070, + "valid_targets_mean": 16753.5, + "valid_targets_min": 794 + }, + { + "epoch": 0.5537763544168668, + "grad_norm": 0.4044504847668435, + "learning_rate": 0.0001361815027926354, + "loss": 0.611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6267122030258179, + "step": 2075, + "valid_targets_mean": 17083.9, + "valid_targets_min": 460 + }, + { + "epoch": 0.5551107552708834, + "grad_norm": 0.35978073598074256, + "learning_rate": 0.00013608029728877195, + "loss": 0.6056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.602839469909668, + "step": 2080, + "valid_targets_mean": 16182.3, + "valid_targets_min": 445 + }, + { + "epoch": 0.5564451561248999, + "grad_norm": 0.427878030892968, + "learning_rate": 0.00013597876042071574, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6435970664024353, + "step": 2085, + "valid_targets_mean": 14700.1, + "valid_targets_min": 471 + }, + { + "epoch": 0.5577795569789165, + "grad_norm": 0.35363582855209424, + "learning_rate": 0.00013587689273931032, + "loss": 0.612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.631229817867279, + "step": 2090, + "valid_targets_mean": 15248.1, + "valid_targets_min": 115 + }, + { + "epoch": 0.559113957832933, + "grad_norm": 0.3728911369275915, + "learning_rate": 0.00013577469479719376, + "loss": 0.6292, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6266062259674072, + "step": 2095, + "valid_targets_mean": 16060.7, + "valid_targets_min": 196 + }, + { + "epoch": 0.5604483586869495, + "grad_norm": 0.44761295623444686, + "learning_rate": 0.00013567216714879593, + "loss": 0.6036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5844216346740723, + "step": 2100, + "valid_targets_mean": 16994.4, + "valid_targets_min": 505 + }, + { + "epoch": 0.5617827595409661, + "grad_norm": 0.576099808761112, + "learning_rate": 0.00013556931035033526, + "loss": 0.6206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6165690422058105, + "step": 2105, + "valid_targets_mean": 15846.1, + "valid_targets_min": 99 + }, + { + "epoch": 0.5631171603949826, + "grad_norm": 0.6302577465009878, + "learning_rate": 0.00013546612495981603, + "loss": 0.6209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6065033674240112, + "step": 2110, + "valid_targets_mean": 15524.7, + "valid_targets_min": 727 + }, + { + "epoch": 0.5644515612489992, + "grad_norm": 0.42523423516149084, + "learning_rate": 0.00013536261153702494, + "loss": 0.6081, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.613208532333374, + "step": 2115, + "valid_targets_mean": 15701.8, + "valid_targets_min": 452 + }, + { + "epoch": 0.5657859621030158, + "grad_norm": 0.4123570282242918, + "learning_rate": 0.0001352587706435284, + "loss": 0.5997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.571455717086792, + "step": 2120, + "valid_targets_mean": 15546.9, + "valid_targets_min": 271 + }, + { + "epoch": 0.5671203629570323, + "grad_norm": 0.5144475642174654, + "learning_rate": 0.00013515460284266933, + "loss": 0.6137, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6285332441329956, + "step": 2125, + "valid_targets_mean": 15709.9, + "valid_targets_min": 410 + }, + { + "epoch": 0.5684547638110489, + "grad_norm": 0.3301739903679853, + "learning_rate": 0.0001350501086995642, + "loss": 0.6081, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6021836400032043, + "step": 2130, + "valid_targets_mean": 16203.4, + "valid_targets_min": 100 + }, + { + "epoch": 0.5697891646650654, + "grad_norm": 0.575131486232284, + "learning_rate": 0.00013494528878109978, + "loss": 0.6266, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6023844480514526, + "step": 2135, + "valid_targets_mean": 15848.4, + "valid_targets_min": 591 + }, + { + "epoch": 0.5711235655190819, + "grad_norm": 0.4526311432190505, + "learning_rate": 0.00013484014365593036, + "loss": 0.618, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5874459743499756, + "step": 2140, + "valid_targets_mean": 16963.9, + "valid_targets_min": 476 + }, + { + "epoch": 0.5724579663730984, + "grad_norm": 0.3441773102647398, + "learning_rate": 0.00013473467389447436, + "loss": 0.6084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6037788987159729, + "step": 2145, + "valid_targets_mean": 15695.8, + "valid_targets_min": 254 + }, + { + "epoch": 0.573792367227115, + "grad_norm": 0.5246780101265172, + "learning_rate": 0.0001346288800689114, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6016116738319397, + "step": 2150, + "valid_targets_mean": 15866.1, + "valid_targets_min": 654 + }, + { + "epoch": 0.5751267680811316, + "grad_norm": 0.4340969676204016, + "learning_rate": 0.00013452276275317926, + "loss": 0.6276, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6183035373687744, + "step": 2155, + "valid_targets_mean": 15315.3, + "valid_targets_min": 769 + }, + { + "epoch": 0.5764611689351481, + "grad_norm": 0.35865324150374944, + "learning_rate": 0.00013441632252297054, + "loss": 0.6048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5798181295394897, + "step": 2160, + "valid_targets_mean": 16757.2, + "valid_targets_min": 148 + }, + { + "epoch": 0.5777955697891647, + "grad_norm": 0.33904093328772805, + "learning_rate": 0.0001343095599557297, + "loss": 0.6178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6391230821609497, + "step": 2165, + "valid_targets_mean": 15397.4, + "valid_targets_min": 119 + }, + { + "epoch": 0.5791299706431812, + "grad_norm": 0.4478119414772001, + "learning_rate": 0.00013420247563064998, + "loss": 0.6254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5979142189025879, + "step": 2170, + "valid_targets_mean": 15297.2, + "valid_targets_min": 417 + }, + { + "epoch": 0.5804643714971978, + "grad_norm": 0.5707769603321923, + "learning_rate": 0.0001340950701286701, + "loss": 0.6199, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5975048542022705, + "step": 2175, + "valid_targets_mean": 16655.5, + "valid_targets_min": 452 + }, + { + "epoch": 0.5817987723512144, + "grad_norm": 0.4824505778403902, + "learning_rate": 0.0001339873440324712, + "loss": 0.6229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6108227372169495, + "step": 2180, + "valid_targets_mean": 15969.7, + "valid_targets_min": 282 + }, + { + "epoch": 0.5831331732052308, + "grad_norm": 0.4770877551156547, + "learning_rate": 0.00013387929792647366, + "loss": 0.6077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6048794984817505, + "step": 2185, + "valid_targets_mean": 15896.6, + "valid_targets_min": 567 + }, + { + "epoch": 0.5844675740592474, + "grad_norm": 0.4814622819368835, + "learning_rate": 0.00013377093239683396, + "loss": 0.6245, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6156436800956726, + "step": 2190, + "valid_targets_mean": 15846.9, + "valid_targets_min": 558 + }, + { + "epoch": 0.5858019749132639, + "grad_norm": 0.5145484936853344, + "learning_rate": 0.0001336622480314414, + "loss": 0.6367, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6479911804199219, + "step": 2195, + "valid_targets_mean": 14547.5, + "valid_targets_min": 122 + }, + { + "epoch": 0.5871363757672805, + "grad_norm": 0.4777740945717533, + "learning_rate": 0.00013355324541991512, + "loss": 0.6069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6272017955780029, + "step": 2200, + "valid_targets_mean": 15204.7, + "valid_targets_min": 645 + }, + { + "epoch": 0.588470776621297, + "grad_norm": 0.44934121785856823, + "learning_rate": 0.00013344392515360055, + "loss": 0.5964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6105179786682129, + "step": 2205, + "valid_targets_mean": 15131.6, + "valid_targets_min": 839 + }, + { + "epoch": 0.5898051774753136, + "grad_norm": 0.43607143864022113, + "learning_rate": 0.0001333342878255667, + "loss": 0.6124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6004830598831177, + "step": 2210, + "valid_targets_mean": 16907.6, + "valid_targets_min": 98 + }, + { + "epoch": 0.5911395783293302, + "grad_norm": 0.48902472019677856, + "learning_rate": 0.00013322433403060237, + "loss": 0.6144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6342414021492004, + "step": 2215, + "valid_targets_mean": 15085.4, + "valid_targets_min": 624 + }, + { + "epoch": 0.5924739791833467, + "grad_norm": 0.5744440751634579, + "learning_rate": 0.0001331140643652134, + "loss": 0.6057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5978758931159973, + "step": 2220, + "valid_targets_mean": 16446.8, + "valid_targets_min": 740 + }, + { + "epoch": 0.5938083800373632, + "grad_norm": 0.6905757317466992, + "learning_rate": 0.00013300347942761916, + "loss": 0.6097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6037940979003906, + "step": 2225, + "valid_targets_mean": 16368.0, + "valid_targets_min": 344 + }, + { + "epoch": 0.5951427808913797, + "grad_norm": 0.5554220490082593, + "learning_rate": 0.00013289257981774944, + "loss": 0.6196, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6129052639007568, + "step": 2230, + "valid_targets_mean": 15976.8, + "valid_targets_min": 899 + }, + { + "epoch": 0.5964771817453963, + "grad_norm": 0.4593156602009199, + "learning_rate": 0.0001327813661372411, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6253645420074463, + "step": 2235, + "valid_targets_mean": 15467.9, + "valid_targets_min": 537 + }, + { + "epoch": 0.5978115825994129, + "grad_norm": 0.4420033121389991, + "learning_rate": 0.00013266983898943495, + "loss": 0.6006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5838278532028198, + "step": 2240, + "valid_targets_mean": 17585.7, + "valid_targets_min": 733 + }, + { + "epoch": 0.5991459834534294, + "grad_norm": 0.448148923585819, + "learning_rate": 0.00013255799897937218, + "loss": 0.6258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6293032169342041, + "step": 2245, + "valid_targets_mean": 16851.1, + "valid_targets_min": 606 + }, + { + "epoch": 0.600480384307446, + "grad_norm": 0.6604916443254276, + "learning_rate": 0.0001324458467137915, + "loss": 0.6229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.650986909866333, + "step": 2250, + "valid_targets_mean": 15488.0, + "valid_targets_min": 592 + }, + { + "epoch": 0.6018147851614625, + "grad_norm": 0.4361931344736495, + "learning_rate": 0.00013233338280112548, + "loss": 0.6093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6127656698226929, + "step": 2255, + "valid_targets_mean": 17069.4, + "valid_targets_min": 222 + }, + { + "epoch": 0.6031491860154791, + "grad_norm": 0.3799066011210021, + "learning_rate": 0.00013222060785149744, + "loss": 0.6198, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6276907920837402, + "step": 2260, + "valid_targets_mean": 15284.9, + "valid_targets_min": 272 + }, + { + "epoch": 0.6044835868694955, + "grad_norm": 0.3698011849611436, + "learning_rate": 0.00013210752247671813, + "loss": 0.63, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6076016426086426, + "step": 2265, + "valid_targets_mean": 14670.1, + "valid_targets_min": 830 + }, + { + "epoch": 0.6058179877235121, + "grad_norm": 0.4567594623942834, + "learning_rate": 0.00013199412729028226, + "loss": 0.6124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6216099262237549, + "step": 2270, + "valid_targets_mean": 14361.8, + "valid_targets_min": 566 + }, + { + "epoch": 0.6071523885775287, + "grad_norm": 0.4259876052088613, + "learning_rate": 0.00013188042290736542, + "loss": 0.6219, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6279948949813843, + "step": 2275, + "valid_targets_mean": 16835.0, + "valid_targets_min": 414 + }, + { + "epoch": 0.6084867894315452, + "grad_norm": 0.469714123948217, + "learning_rate": 0.00013176640994482056, + "loss": 0.5975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.577383279800415, + "step": 2280, + "valid_targets_mean": 16238.7, + "valid_targets_min": 226 + }, + { + "epoch": 0.6098211902855618, + "grad_norm": 0.38761602035741405, + "learning_rate": 0.00013165208902117466, + "loss": 0.6194, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6232035160064697, + "step": 2285, + "valid_targets_mean": 17474.3, + "valid_targets_min": 789 + }, + { + "epoch": 0.6111555911395783, + "grad_norm": 0.43628422989244825, + "learning_rate": 0.0001315374607566254, + "loss": 0.6161, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6185094118118286, + "step": 2290, + "valid_targets_mean": 16039.3, + "valid_targets_min": 689 + }, + { + "epoch": 0.6124899919935949, + "grad_norm": 0.3939730845351852, + "learning_rate": 0.0001314225257730379, + "loss": 0.6226, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6232194900512695, + "step": 2295, + "valid_targets_mean": 15926.9, + "valid_targets_min": 430 + }, + { + "epoch": 0.6138243928476115, + "grad_norm": 0.4853802959237896, + "learning_rate": 0.00013130728469394113, + "loss": 0.6149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5909043550491333, + "step": 2300, + "valid_targets_mean": 15626.2, + "valid_targets_min": 541 + }, + { + "epoch": 0.615158793701628, + "grad_norm": 0.5303294991223937, + "learning_rate": 0.00013119173814452474, + "loss": 0.6145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6119722127914429, + "step": 2305, + "valid_targets_mean": 15990.4, + "valid_targets_min": 679 + }, + { + "epoch": 0.6164931945556446, + "grad_norm": 0.3768392664163849, + "learning_rate": 0.0001310758867516355, + "loss": 0.6148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5962955951690674, + "step": 2310, + "valid_targets_mean": 16253.9, + "valid_targets_min": 951 + }, + { + "epoch": 0.617827595409661, + "grad_norm": 0.29568158860296945, + "learning_rate": 0.00013095973114377401, + "loss": 0.6037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6145303845405579, + "step": 2315, + "valid_targets_mean": 16354.1, + "valid_targets_min": 689 + }, + { + "epoch": 0.6191619962636776, + "grad_norm": 0.3957310816668994, + "learning_rate": 0.00013084327195109127, + "loss": 0.6237, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6277497410774231, + "step": 2320, + "valid_targets_mean": 14964.2, + "valid_targets_min": 516 + }, + { + "epoch": 0.6204963971176941, + "grad_norm": 0.40507218781702686, + "learning_rate": 0.0001307265098053852, + "loss": 0.6294, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.613028883934021, + "step": 2325, + "valid_targets_mean": 14705.0, + "valid_targets_min": 516 + }, + { + "epoch": 0.6218307979717107, + "grad_norm": 0.4138873732218475, + "learning_rate": 0.00013060944534009727, + "loss": 0.6133, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6178252696990967, + "step": 2330, + "valid_targets_mean": 16135.6, + "valid_targets_min": 617 + }, + { + "epoch": 0.6231651988257273, + "grad_norm": 0.44550182331310156, + "learning_rate": 0.00013049207919030913, + "loss": 0.624, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6519665718078613, + "step": 2335, + "valid_targets_mean": 15362.8, + "valid_targets_min": 598 + }, + { + "epoch": 0.6244995996797438, + "grad_norm": 0.5069298867814076, + "learning_rate": 0.000130374411992739, + "loss": 0.6252, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6520801186561584, + "step": 2340, + "valid_targets_mean": 15502.6, + "valid_targets_min": 739 + }, + { + "epoch": 0.6258340005337604, + "grad_norm": 0.44255482876271746, + "learning_rate": 0.00013025644438573828, + "loss": 0.6261, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.633766770362854, + "step": 2345, + "valid_targets_mean": 15763.8, + "valid_targets_min": 470 + }, + { + "epoch": 0.6271684013877769, + "grad_norm": 0.34513764917726825, + "learning_rate": 0.0001301381770092882, + "loss": 0.613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6351778507232666, + "step": 2350, + "valid_targets_mean": 15281.8, + "valid_targets_min": 672 + }, + { + "epoch": 0.6285028022417934, + "grad_norm": 0.43679301344497834, + "learning_rate": 0.00013001961050499618, + "loss": 0.6101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6534307599067688, + "step": 2355, + "valid_targets_mean": 14878.5, + "valid_targets_min": 372 + }, + { + "epoch": 0.6298372030958099, + "grad_norm": 0.4870298254856093, + "learning_rate": 0.00012990074551609248, + "loss": 0.5978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5946311354637146, + "step": 2360, + "valid_targets_mean": 16314.5, + "valid_targets_min": 538 + }, + { + "epoch": 0.6311716039498265, + "grad_norm": 0.6945525869442485, + "learning_rate": 0.00012978158268742656, + "loss": 0.5993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6251997947692871, + "step": 2365, + "valid_targets_mean": 15368.2, + "valid_targets_min": 417 + }, + { + "epoch": 0.6325060048038431, + "grad_norm": 0.5790098785319283, + "learning_rate": 0.00012966212266546384, + "loss": 0.6259, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6421008110046387, + "step": 2370, + "valid_targets_mean": 16325.9, + "valid_targets_min": 458 + }, + { + "epoch": 0.6338404056578596, + "grad_norm": 0.792785744317409, + "learning_rate": 0.0001295423660982819, + "loss": 0.6286, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5836455821990967, + "step": 2375, + "valid_targets_mean": 16256.2, + "valid_targets_min": 428 + }, + { + "epoch": 0.6351748065118762, + "grad_norm": 0.5822492847083458, + "learning_rate": 0.00012942231363556717, + "loss": 0.6269, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6273260116577148, + "step": 2380, + "valid_targets_mean": 15313.9, + "valid_targets_min": 845 + }, + { + "epoch": 0.6365092073658927, + "grad_norm": 0.9406504357088764, + "learning_rate": 0.00012930196592861123, + "loss": 0.5945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6099258661270142, + "step": 2385, + "valid_targets_mean": 15458.6, + "valid_targets_min": 200 + }, + { + "epoch": 0.6378436082199093, + "grad_norm": 0.607913266165502, + "learning_rate": 0.0001291813236303075, + "loss": 0.6173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6085502505302429, + "step": 2390, + "valid_targets_mean": 16758.3, + "valid_targets_min": 657 + }, + { + "epoch": 0.6391780090739259, + "grad_norm": 0.7781891932389111, + "learning_rate": 0.0001290603873951475, + "loss": 0.6167, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6008795499801636, + "step": 2395, + "valid_targets_mean": 15621.0, + "valid_targets_min": 320 + }, + { + "epoch": 0.6405124099279423, + "grad_norm": 0.6539333928835719, + "learning_rate": 0.0001289391578792174, + "loss": 0.6095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5965677499771118, + "step": 2400, + "valid_targets_mean": 15319.6, + "valid_targets_min": 691 + }, + { + "epoch": 0.6418468107819589, + "grad_norm": 0.8999958153317562, + "learning_rate": 0.0001288176357401944, + "loss": 0.614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5982319116592407, + "step": 2405, + "valid_targets_mean": 16186.3, + "valid_targets_min": 669 + }, + { + "epoch": 0.6431812116359754, + "grad_norm": 0.58521594108338, + "learning_rate": 0.00012869582163734327, + "loss": 0.6158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5869446396827698, + "step": 2410, + "valid_targets_mean": 14848.0, + "valid_targets_min": 681 + }, + { + "epoch": 0.644515612489992, + "grad_norm": 0.7184768983435939, + "learning_rate": 0.00012857371623151265, + "loss": 0.6008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5802595615386963, + "step": 2415, + "valid_targets_mean": 16208.6, + "valid_targets_min": 428 + }, + { + "epoch": 0.6458500133440085, + "grad_norm": 0.6102088903744022, + "learning_rate": 0.00012845132018513147, + "loss": 0.6121, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6337521076202393, + "step": 2420, + "valid_targets_mean": 15364.2, + "valid_targets_min": 511 + }, + { + "epoch": 0.6471844141980251, + "grad_norm": 0.7605142158941254, + "learning_rate": 0.00012832863416220556, + "loss": 0.6229, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.648051917552948, + "step": 2425, + "valid_targets_mean": 15182.1, + "valid_targets_min": 438 + }, + { + "epoch": 0.6485188150520417, + "grad_norm": 0.6256768708161232, + "learning_rate": 0.00012820565882831365, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6141934394836426, + "step": 2430, + "valid_targets_mean": 14725.9, + "valid_targets_min": 551 + }, + { + "epoch": 0.6498532159060582, + "grad_norm": 0.7451804423044297, + "learning_rate": 0.00012808239485060426, + "loss": 0.6015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6086957454681396, + "step": 2435, + "valid_targets_mean": 16796.6, + "valid_targets_min": 22 + }, + { + "epoch": 0.6511876167600748, + "grad_norm": 0.5513334048003805, + "learning_rate": 0.00012795884289779161, + "loss": 0.6091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5970527529716492, + "step": 2440, + "valid_targets_mean": 16409.0, + "valid_targets_min": 357 + }, + { + "epoch": 0.6525220176140912, + "grad_norm": 0.5601606873656281, + "learning_rate": 0.00012783500364015233, + "loss": 0.6038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6198552846908569, + "step": 2445, + "valid_targets_mean": 15023.3, + "valid_targets_min": 490 + }, + { + "epoch": 0.6538564184681078, + "grad_norm": 0.5710220241717955, + "learning_rate": 0.00012771087774952165, + "loss": 0.6173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6311722993850708, + "step": 2450, + "valid_targets_mean": 16240.5, + "valid_targets_min": 547 + }, + { + "epoch": 0.6551908193221244, + "grad_norm": 0.6210885846793824, + "learning_rate": 0.00012758646589928975, + "loss": 0.6113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5842134952545166, + "step": 2455, + "valid_targets_mean": 15439.6, + "valid_targets_min": 794 + }, + { + "epoch": 0.6565252201761409, + "grad_norm": 0.5047368505662938, + "learning_rate": 0.00012746176876439824, + "loss": 0.6304, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6596218347549438, + "step": 2460, + "valid_targets_mean": 14011.9, + "valid_targets_min": 274 + }, + { + "epoch": 0.6578596210301575, + "grad_norm": 0.5719219448735884, + "learning_rate": 0.00012733678702133642, + "loss": 0.604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6103248596191406, + "step": 2465, + "valid_targets_mean": 15900.6, + "valid_targets_min": 327 + }, + { + "epoch": 0.659194021884174, + "grad_norm": 0.36671511433182047, + "learning_rate": 0.00012721152134813755, + "loss": 0.616, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5883936882019043, + "step": 2470, + "valid_targets_mean": 16086.2, + "valid_targets_min": 102 + }, + { + "epoch": 0.6605284227381906, + "grad_norm": 0.5035071153244577, + "learning_rate": 0.00012708597242437524, + "loss": 0.6111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6350337266921997, + "step": 2475, + "valid_targets_mean": 14267.4, + "valid_targets_min": 274 + }, + { + "epoch": 0.661862823592207, + "grad_norm": 0.49047354453068903, + "learning_rate": 0.00012696014093115974, + "loss": 0.6239, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6190519332885742, + "step": 2480, + "valid_targets_mean": 16891.8, + "valid_targets_min": 219 + }, + { + "epoch": 0.6631972244462236, + "grad_norm": 0.3639431845661133, + "learning_rate": 0.00012683402755113432, + "loss": 0.6011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5651915669441223, + "step": 2485, + "valid_targets_mean": 16542.9, + "valid_targets_min": 599 + }, + { + "epoch": 0.6645316253002402, + "grad_norm": 0.3092175056739848, + "learning_rate": 0.0001267076329684714, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5737978219985962, + "step": 2490, + "valid_targets_mean": 16735.8, + "valid_targets_min": 397 + }, + { + "epoch": 0.6658660261542567, + "grad_norm": 0.42866256823259696, + "learning_rate": 0.0001265809578688691, + "loss": 0.6128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5863039493560791, + "step": 2495, + "valid_targets_mean": 15345.5, + "valid_targets_min": 488 + }, + { + "epoch": 0.6672004270082733, + "grad_norm": 0.4798819084708603, + "learning_rate": 0.00012645400293954714, + "loss": 0.6182, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.620308518409729, + "step": 2500, + "valid_targets_mean": 15893.3, + "valid_targets_min": 616 + }, + { + "epoch": 0.6685348278622898, + "grad_norm": 0.3719505049119626, + "learning_rate": 0.0001263267688692435, + "loss": 0.6264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6290452480316162, + "step": 2505, + "valid_targets_mean": 15592.1, + "valid_targets_min": 290 + }, + { + "epoch": 0.6698692287163064, + "grad_norm": 0.4398503675850329, + "learning_rate": 0.00012619925634821052, + "loss": 0.6123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6252307891845703, + "step": 2510, + "valid_targets_mean": 16358.0, + "valid_targets_min": 579 + }, + { + "epoch": 0.671203629570323, + "grad_norm": 0.33044335456370993, + "learning_rate": 0.00012607146606821105, + "loss": 0.6048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6037730574607849, + "step": 2515, + "valid_targets_mean": 16456.2, + "valid_targets_min": 468 + }, + { + "epoch": 0.6725380304243395, + "grad_norm": 0.4138312255865989, + "learning_rate": 0.00012594339872251483, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6162407398223877, + "step": 2520, + "valid_targets_mean": 16273.4, + "valid_targets_min": 419 + }, + { + "epoch": 0.673872431278356, + "grad_norm": 0.5338733241457372, + "learning_rate": 0.00012581505500589474, + "loss": 0.6156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.616795539855957, + "step": 2525, + "valid_targets_mean": 15318.8, + "valid_targets_min": 594 + }, + { + "epoch": 0.6752068321323725, + "grad_norm": 0.5538178472599126, + "learning_rate": 0.00012568643561462298, + "loss": 0.6093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6517888307571411, + "step": 2530, + "valid_targets_mean": 16193.2, + "valid_targets_min": 707 + }, + { + "epoch": 0.6765412329863891, + "grad_norm": 0.39314855325609094, + "learning_rate": 0.00012555754124646729, + "loss": 0.6061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6136894226074219, + "step": 2535, + "valid_targets_mean": 15608.1, + "valid_targets_min": 690 + }, + { + "epoch": 0.6778756338404056, + "grad_norm": 0.28736129685480677, + "learning_rate": 0.0001254283726006871, + "loss": 0.6034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6169589757919312, + "step": 2540, + "valid_targets_mean": 16580.6, + "valid_targets_min": 391 + }, + { + "epoch": 0.6792100346944222, + "grad_norm": 0.40453438597245944, + "learning_rate": 0.00012529893037803, + "loss": 0.6168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6047553420066833, + "step": 2545, + "valid_targets_mean": 16454.1, + "valid_targets_min": 411 + }, + { + "epoch": 0.6805444355484388, + "grad_norm": 0.40703301810718967, + "learning_rate": 0.00012516921528072752, + "loss": 0.6037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6294437646865845, + "step": 2550, + "valid_targets_mean": 16483.0, + "valid_targets_min": 503 + }, + { + "epoch": 0.6818788364024553, + "grad_norm": 0.4332954316346514, + "learning_rate": 0.00012503922801249172, + "loss": 0.6323, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6062746644020081, + "step": 2555, + "valid_targets_mean": 16690.6, + "valid_targets_min": 831 + }, + { + "epoch": 0.6832132372564719, + "grad_norm": 0.4330673352480961, + "learning_rate": 0.00012490896927851118, + "loss": 0.6149, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6028146147727966, + "step": 2560, + "valid_targets_mean": 16890.8, + "valid_targets_min": 574 + }, + { + "epoch": 0.6845476381104884, + "grad_norm": 0.5758835807464072, + "learning_rate": 0.0001247784397854471, + "loss": 0.6063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6124927997589111, + "step": 2565, + "valid_targets_mean": 16613.3, + "valid_targets_min": 336 + }, + { + "epoch": 0.685882038964505, + "grad_norm": 0.3759062706106212, + "learning_rate": 0.0001246476402414297, + "loss": 0.6173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6371479034423828, + "step": 2570, + "valid_targets_mean": 15202.9, + "valid_targets_min": 311 + }, + { + "epoch": 0.6872164398185214, + "grad_norm": 0.40747309474183957, + "learning_rate": 0.0001245165713560541, + "loss": 0.6197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6243611574172974, + "step": 2575, + "valid_targets_mean": 16138.9, + "valid_targets_min": 451 + }, + { + "epoch": 0.688550840672538, + "grad_norm": 0.33101064658709073, + "learning_rate": 0.00012438523384037675, + "loss": 0.621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6176421642303467, + "step": 2580, + "valid_targets_mean": 15277.3, + "valid_targets_min": 575 + }, + { + "epoch": 0.6898852415265546, + "grad_norm": 0.38388904529906687, + "learning_rate": 0.0001242536284069113, + "loss": 0.5967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5699970126152039, + "step": 2585, + "valid_targets_mean": 16336.4, + "valid_targets_min": 164 + }, + { + "epoch": 0.6912196423805711, + "grad_norm": 0.3477844139398198, + "learning_rate": 0.00012412175576962504, + "loss": 0.608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5966440439224243, + "step": 2590, + "valid_targets_mean": 16631.5, + "valid_targets_min": 441 + }, + { + "epoch": 0.6925540432345877, + "grad_norm": 0.5440458794110384, + "learning_rate": 0.00012398961664393467, + "loss": 0.6197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6081477403640747, + "step": 2595, + "valid_targets_mean": 16263.5, + "valid_targets_min": 192 + }, + { + "epoch": 0.6938884440886042, + "grad_norm": 0.3152153844701328, + "learning_rate": 0.0001238572117467027, + "loss": 0.6225, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6415140628814697, + "step": 2600, + "valid_targets_mean": 15497.3, + "valid_targets_min": 244 + }, + { + "epoch": 0.6952228449426208, + "grad_norm": 0.5474956644762842, + "learning_rate": 0.0001237245417962335, + "loss": 0.6049, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6185272336006165, + "step": 2605, + "valid_targets_mean": 16156.6, + "valid_targets_min": 659 + }, + { + "epoch": 0.6965572457966374, + "grad_norm": 0.37662200390415895, + "learning_rate": 0.0001235916075122693, + "loss": 0.6206, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6300753355026245, + "step": 2610, + "valid_targets_mean": 15374.1, + "valid_targets_min": 139 + }, + { + "epoch": 0.6978916466506538, + "grad_norm": 0.41421104102571804, + "learning_rate": 0.00012345840961598638, + "loss": 0.6321, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6131690740585327, + "step": 2615, + "valid_targets_mean": 15966.3, + "valid_targets_min": 593 + }, + { + "epoch": 0.6992260475046704, + "grad_norm": 0.43574279785165043, + "learning_rate": 0.00012332494882999113, + "loss": 0.6159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6403422355651855, + "step": 2620, + "valid_targets_mean": 15165.6, + "valid_targets_min": 20 + }, + { + "epoch": 0.7005604483586869, + "grad_norm": 0.4314840648934718, + "learning_rate": 0.00012319122587831614, + "loss": 0.6, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6263567209243774, + "step": 2625, + "valid_targets_mean": 15291.8, + "valid_targets_min": 733 + }, + { + "epoch": 0.7018948492127035, + "grad_norm": 0.3696921147982537, + "learning_rate": 0.00012305724148641627, + "loss": 0.6098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6040724515914917, + "step": 2630, + "valid_targets_mean": 15731.2, + "valid_targets_min": 587 + }, + { + "epoch": 0.70322925006672, + "grad_norm": 0.36503865159227195, + "learning_rate": 0.00012292299638116472, + "loss": 0.6145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6203213334083557, + "step": 2635, + "valid_targets_mean": 16185.4, + "valid_targets_min": 423 + }, + { + "epoch": 0.7045636509207366, + "grad_norm": 0.6179094979585101, + "learning_rate": 0.00012278849129084902, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.59694904088974, + "step": 2640, + "valid_targets_mean": 15701.0, + "valid_targets_min": 711 + }, + { + "epoch": 0.7058980517747532, + "grad_norm": 0.554016016939682, + "learning_rate": 0.00012265372694516714, + "loss": 0.6179, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.613195538520813, + "step": 2645, + "valid_targets_mean": 15156.6, + "valid_targets_min": 417 + }, + { + "epoch": 0.7072324526287697, + "grad_norm": 0.5981015163954772, + "learning_rate": 0.00012251870407522364, + "loss": 0.6177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5936011672019958, + "step": 2650, + "valid_targets_mean": 16011.4, + "valid_targets_min": 570 + }, + { + "epoch": 0.7085668534827863, + "grad_norm": 0.49781827733569967, + "learning_rate": 0.00012238342341352546, + "loss": 0.6005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5743311047554016, + "step": 2655, + "valid_targets_mean": 16041.1, + "valid_targets_min": 467 + }, + { + "epoch": 0.7099012543368027, + "grad_norm": 0.7260313002631965, + "learning_rate": 0.00012224788569397806, + "loss": 0.6208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623327374458313, + "step": 2660, + "valid_targets_mean": 15888.8, + "valid_targets_min": 820 + }, + { + "epoch": 0.7112356551908193, + "grad_norm": 0.7328475215596345, + "learning_rate": 0.0001221120916518816, + "loss": 0.6232, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6027488708496094, + "step": 2665, + "valid_targets_mean": 15739.6, + "valid_targets_min": 250 + }, + { + "epoch": 0.7125700560448359, + "grad_norm": 0.7596978663656118, + "learning_rate": 0.0001219760420239267, + "loss": 0.5925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5970748662948608, + "step": 2670, + "valid_targets_mean": 16778.7, + "valid_targets_min": 534 + }, + { + "epoch": 0.7139044568988524, + "grad_norm": 0.6594651660933113, + "learning_rate": 0.00012183973754819051, + "loss": 0.593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5764331817626953, + "step": 2675, + "valid_targets_mean": 16637.8, + "valid_targets_min": 581 + }, + { + "epoch": 0.715238857752869, + "grad_norm": 0.7628936372865166, + "learning_rate": 0.00012170317896413284, + "loss": 0.6018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6267425417900085, + "step": 2680, + "valid_targets_mean": 15401.4, + "valid_targets_min": 732 + }, + { + "epoch": 0.7165732586068855, + "grad_norm": 0.4698922890537805, + "learning_rate": 0.00012156636701259202, + "loss": 0.6038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.596757173538208, + "step": 2685, + "valid_targets_mean": 15641.7, + "valid_targets_min": 727 + }, + { + "epoch": 0.7179076594609021, + "grad_norm": 0.605004344317738, + "learning_rate": 0.00012142930243578092, + "loss": 0.6007, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5908167958259583, + "step": 2690, + "valid_targets_mean": 15483.9, + "valid_targets_min": 775 + }, + { + "epoch": 0.7192420603149186, + "grad_norm": 0.5619485743558523, + "learning_rate": 0.00012129198597728285, + "loss": 0.6157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6099591255187988, + "step": 2695, + "valid_targets_mean": 14776.2, + "valid_targets_min": 387 + }, + { + "epoch": 0.7205764611689351, + "grad_norm": 0.6598145305998949, + "learning_rate": 0.00012115441838204767, + "loss": 0.6158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6329494118690491, + "step": 2700, + "valid_targets_mean": 16702.2, + "valid_targets_min": 523 + }, + { + "epoch": 0.7219108620229517, + "grad_norm": 0.6613863881062565, + "learning_rate": 0.00012101660039638766, + "loss": 0.5824, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5732811689376831, + "step": 2705, + "valid_targets_mean": 15127.5, + "valid_targets_min": 488 + }, + { + "epoch": 0.7232452628769682, + "grad_norm": 0.6893698621225195, + "learning_rate": 0.00012087853276797346, + "loss": 0.6129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5944296717643738, + "step": 2710, + "valid_targets_mean": 15252.4, + "valid_targets_min": 756 + }, + { + "epoch": 0.7245796637309848, + "grad_norm": 0.609549826313975, + "learning_rate": 0.00012074021624583005, + "loss": 0.6202, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6550873517990112, + "step": 2715, + "valid_targets_mean": 15639.0, + "valid_targets_min": 326 + }, + { + "epoch": 0.7259140645850013, + "grad_norm": 0.6535800226145355, + "learning_rate": 0.00012060165158033268, + "loss": 0.5989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5854440927505493, + "step": 2720, + "valid_targets_mean": 16359.4, + "valid_targets_min": 363 + }, + { + "epoch": 0.7272484654390179, + "grad_norm": 0.5139845099693757, + "learning_rate": 0.00012046283952320275, + "loss": 0.613, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6016006469726562, + "step": 2725, + "valid_targets_mean": 17065.6, + "valid_targets_min": 419 + }, + { + "epoch": 0.7285828662930345, + "grad_norm": 0.6014899717015251, + "learning_rate": 0.00012032378082750382, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5890054702758789, + "step": 2730, + "valid_targets_mean": 15969.3, + "valid_targets_min": 503 + }, + { + "epoch": 0.729917267147051, + "grad_norm": 0.5691533934968931, + "learning_rate": 0.00012018447624763748, + "loss": 0.6203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6279616951942444, + "step": 2735, + "valid_targets_mean": 15455.8, + "valid_targets_min": 119 + }, + { + "epoch": 0.7312516680010676, + "grad_norm": 0.6335124799219327, + "learning_rate": 0.00012004492653933923, + "loss": 0.6089, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6014554500579834, + "step": 2740, + "valid_targets_mean": 17150.6, + "valid_targets_min": 505 + }, + { + "epoch": 0.732586068855084, + "grad_norm": 0.5169723465682857, + "learning_rate": 0.0001199051324596744, + "loss": 0.6106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6194249391555786, + "step": 2745, + "valid_targets_mean": 16123.2, + "valid_targets_min": 422 + }, + { + "epoch": 0.7339204697091006, + "grad_norm": 0.6738124101769285, + "learning_rate": 0.00011976509476703408, + "loss": 0.612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6056435108184814, + "step": 2750, + "valid_targets_mean": 16243.4, + "valid_targets_min": 484 + }, + { + "epoch": 0.7352548705631171, + "grad_norm": 0.3664524912963626, + "learning_rate": 0.00011962481422113098, + "loss": 0.6197, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.646386981010437, + "step": 2755, + "valid_targets_mean": 16190.9, + "valid_targets_min": 898 + }, + { + "epoch": 0.7365892714171337, + "grad_norm": 0.44792117478863985, + "learning_rate": 0.00011948429158299523, + "loss": 0.5971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5956047773361206, + "step": 2760, + "valid_targets_mean": 15734.4, + "valid_targets_min": 91 + }, + { + "epoch": 0.7379236722711503, + "grad_norm": 0.4124501979620836, + "learning_rate": 0.00011934352761497043, + "loss": 0.6128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5855376720428467, + "step": 2765, + "valid_targets_mean": 15115.3, + "valid_targets_min": 686 + }, + { + "epoch": 0.7392580731251668, + "grad_norm": 0.3230024437807969, + "learning_rate": 0.00011920252308070936, + "loss": 0.611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234885454177856, + "step": 2770, + "valid_targets_mean": 16610.5, + "valid_targets_min": 501 + }, + { + "epoch": 0.7405924739791834, + "grad_norm": 0.39710487024270547, + "learning_rate": 0.00011906127874516985, + "loss": 0.6344, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380666494369507, + "step": 2775, + "valid_targets_mean": 15587.7, + "valid_targets_min": 190 + }, + { + "epoch": 0.7419268748331999, + "grad_norm": 0.4097828989932021, + "learning_rate": 0.00011891979537461069, + "loss": 0.6043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6162174940109253, + "step": 2780, + "valid_targets_mean": 14953.7, + "valid_targets_min": 491 + }, + { + "epoch": 0.7432612756872164, + "grad_norm": 0.38996309275492613, + "learning_rate": 0.00011877807373658751, + "loss": 0.6157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6415692567825317, + "step": 2785, + "valid_targets_mean": 15363.2, + "valid_targets_min": 380 + }, + { + "epoch": 0.7445956765412329, + "grad_norm": 0.3618667775211813, + "learning_rate": 0.00011863611459994845, + "loss": 0.5936, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5952189564704895, + "step": 2790, + "valid_targets_mean": 16200.4, + "valid_targets_min": 399 + }, + { + "epoch": 0.7459300773952495, + "grad_norm": 0.3267117936332756, + "learning_rate": 0.00011849391873483016, + "loss": 0.6124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5991407036781311, + "step": 2795, + "valid_targets_mean": 17319.6, + "valid_targets_min": 755 + }, + { + "epoch": 0.7472644782492661, + "grad_norm": 0.3016648304278165, + "learning_rate": 0.00011835148691265355, + "loss": 0.5987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6235275268554688, + "step": 2800, + "valid_targets_mean": 15123.5, + "valid_targets_min": 520 + }, + { + "epoch": 0.7485988791032826, + "grad_norm": 0.3221823783108136, + "learning_rate": 0.00011820881990611963, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6053809523582458, + "step": 2805, + "valid_targets_mean": 16131.7, + "valid_targets_min": 591 + }, + { + "epoch": 0.7499332799572992, + "grad_norm": 0.43562984477012173, + "learning_rate": 0.00011806591848920521, + "loss": 0.6111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6194973587989807, + "step": 2810, + "valid_targets_mean": 16540.3, + "valid_targets_min": 669 + }, + { + "epoch": 0.7512676808113157, + "grad_norm": 0.3698450346299921, + "learning_rate": 0.00011792278343715892, + "loss": 0.6255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6236314177513123, + "step": 2815, + "valid_targets_mean": 15602.0, + "valid_targets_min": 604 + }, + { + "epoch": 0.7526020816653323, + "grad_norm": 0.4818546251164576, + "learning_rate": 0.00011777941552649674, + "loss": 0.6097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6257940530776978, + "step": 2820, + "valid_targets_mean": 16670.9, + "valid_targets_min": 544 + }, + { + "epoch": 0.7539364825193489, + "grad_norm": 0.4397285169168285, + "learning_rate": 0.00011763581553499803, + "loss": 0.6251, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6217588186264038, + "step": 2825, + "valid_targets_mean": 15189.8, + "valid_targets_min": 513 + }, + { + "epoch": 0.7552708833733653, + "grad_norm": 0.3478095634132381, + "learning_rate": 0.00011749198424170117, + "loss": 0.5954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5979966521263123, + "step": 2830, + "valid_targets_mean": 16085.6, + "valid_targets_min": 279 + }, + { + "epoch": 0.7566052842273819, + "grad_norm": 0.35110205846176734, + "learning_rate": 0.00011734792242689934, + "loss": 0.6087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6225411891937256, + "step": 2835, + "valid_targets_mean": 16043.0, + "valid_targets_min": 698 + }, + { + "epoch": 0.7579396850813984, + "grad_norm": 0.326064120745074, + "learning_rate": 0.00011720363087213629, + "loss": 0.6068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6108662486076355, + "step": 2840, + "valid_targets_mean": 15808.2, + "valid_targets_min": 351 + }, + { + "epoch": 0.759274085935415, + "grad_norm": 0.49202452785265866, + "learning_rate": 0.00011705911036020222, + "loss": 0.6124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6325043439865112, + "step": 2845, + "valid_targets_mean": 16098.4, + "valid_targets_min": 589 + }, + { + "epoch": 0.7606084867894315, + "grad_norm": 0.3350239081325133, + "learning_rate": 0.00011691436167512938, + "loss": 0.614, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6329668164253235, + "step": 2850, + "valid_targets_mean": 14940.1, + "valid_targets_min": 425 + }, + { + "epoch": 0.7619428876434481, + "grad_norm": 0.3760125143483495, + "learning_rate": 0.00011676938560218781, + "loss": 0.6254, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.612138032913208, + "step": 2855, + "valid_targets_mean": 15901.7, + "valid_targets_min": 40 + }, + { + "epoch": 0.7632772884974647, + "grad_norm": 0.33540908595554625, + "learning_rate": 0.00011662418292788127, + "loss": 0.5968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5743190050125122, + "step": 2860, + "valid_targets_mean": 16764.1, + "valid_targets_min": 354 + }, + { + "epoch": 0.7646116893514812, + "grad_norm": 0.2754574689920214, + "learning_rate": 0.00011647875443994271, + "loss": 0.6114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6536933779716492, + "step": 2865, + "valid_targets_mean": 15792.1, + "valid_targets_min": 432 + }, + { + "epoch": 0.7659460902054978, + "grad_norm": 0.31623825970777014, + "learning_rate": 0.00011633310092733027, + "loss": 0.612, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6481964588165283, + "step": 2870, + "valid_targets_mean": 15686.6, + "valid_targets_min": 91 + }, + { + "epoch": 0.7672804910595142, + "grad_norm": 0.3081228003901501, + "learning_rate": 0.00011618722318022273, + "loss": 0.6033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5976066589355469, + "step": 2875, + "valid_targets_mean": 16311.7, + "valid_targets_min": 497 + }, + { + "epoch": 0.7686148919135308, + "grad_norm": 0.39985682958457286, + "learning_rate": 0.00011604112199001546, + "loss": 0.6155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6129624843597412, + "step": 2880, + "valid_targets_mean": 16037.5, + "valid_targets_min": 553 + }, + { + "epoch": 0.7699492927675474, + "grad_norm": 0.3088978935138083, + "learning_rate": 0.00011589479814931598, + "loss": 0.6315, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6401019096374512, + "step": 2885, + "valid_targets_mean": 15580.1, + "valid_targets_min": 188 + }, + { + "epoch": 0.7712836936215639, + "grad_norm": 0.3825137255624278, + "learning_rate": 0.0001157482524519397, + "loss": 0.6069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6044080853462219, + "step": 2890, + "valid_targets_mean": 16121.2, + "valid_targets_min": 443 + }, + { + "epoch": 0.7726180944755805, + "grad_norm": 0.35342809771327477, + "learning_rate": 0.00011560148569290558, + "loss": 0.6207, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.639106273651123, + "step": 2895, + "valid_targets_mean": 15362.5, + "valid_targets_min": 633 + }, + { + "epoch": 0.773952495329597, + "grad_norm": 0.386043678780904, + "learning_rate": 0.00011545449866843194, + "loss": 0.61, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5949431657791138, + "step": 2900, + "valid_targets_mean": 15466.7, + "valid_targets_min": 730 + }, + { + "epoch": 0.7752868961836136, + "grad_norm": 0.3245398180178222, + "learning_rate": 0.00011530729217593198, + "loss": 0.6188, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5934869050979614, + "step": 2905, + "valid_targets_mean": 15376.7, + "valid_targets_min": 371 + }, + { + "epoch": 0.77662129703763, + "grad_norm": 0.44593536867847916, + "learning_rate": 0.00011515986701400955, + "loss": 0.6055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5876243114471436, + "step": 2910, + "valid_targets_mean": 16781.6, + "valid_targets_min": 704 + }, + { + "epoch": 0.7779556978916466, + "grad_norm": 0.46221191788580496, + "learning_rate": 0.00011501222398245478, + "loss": 0.6069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6441828012466431, + "step": 2915, + "valid_targets_mean": 15654.8, + "valid_targets_min": 497 + }, + { + "epoch": 0.7792900987456632, + "grad_norm": 0.40081314933909024, + "learning_rate": 0.00011486436388223977, + "loss": 0.6077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.595112144947052, + "step": 2920, + "valid_targets_mean": 15317.9, + "valid_targets_min": 503 + }, + { + "epoch": 0.7806244995996797, + "grad_norm": 0.5596690090788919, + "learning_rate": 0.00011471628751551426, + "loss": 0.6068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5922015905380249, + "step": 2925, + "valid_targets_mean": 16044.5, + "valid_targets_min": 613 + }, + { + "epoch": 0.7819589004536963, + "grad_norm": 0.3589995388472471, + "learning_rate": 0.0001145679956856012, + "loss": 0.6103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6053141951560974, + "step": 2930, + "valid_targets_mean": 17100.2, + "valid_targets_min": 789 + }, + { + "epoch": 0.7832933013077128, + "grad_norm": 0.4884923328918617, + "learning_rate": 0.00011441948919699249, + "loss": 0.5993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6002500057220459, + "step": 2935, + "valid_targets_mean": 16290.3, + "valid_targets_min": 466 + }, + { + "epoch": 0.7846277021617294, + "grad_norm": 0.4779545116170051, + "learning_rate": 0.00011427076885534445, + "loss": 0.6165, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5972024202346802, + "step": 2940, + "valid_targets_mean": 15572.7, + "valid_targets_min": 310 + }, + { + "epoch": 0.785962103015746, + "grad_norm": 0.36583593978213447, + "learning_rate": 0.00011412183546747374, + "loss": 0.6275, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6454517841339111, + "step": 2945, + "valid_targets_mean": 15348.2, + "valid_targets_min": 109 + }, + { + "epoch": 0.7872965038697625, + "grad_norm": 0.3622837852549798, + "learning_rate": 0.00011397268984135266, + "loss": 0.6104, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5890398621559143, + "step": 2950, + "valid_targets_mean": 16108.4, + "valid_targets_min": 390 + }, + { + "epoch": 0.7886309047237791, + "grad_norm": 0.28721242725922963, + "learning_rate": 0.00011382333278610503, + "loss": 0.6128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6144457459449768, + "step": 2955, + "valid_targets_mean": 15895.4, + "valid_targets_min": 419 + }, + { + "epoch": 0.7899653055777955, + "grad_norm": 0.39829683210774786, + "learning_rate": 0.00011367376511200157, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5917114019393921, + "step": 2960, + "valid_targets_mean": 15565.9, + "valid_targets_min": 311 + }, + { + "epoch": 0.7912997064318121, + "grad_norm": 0.3738329809252565, + "learning_rate": 0.00011352398763045569, + "loss": 0.6111, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5774213671684265, + "step": 2965, + "valid_targets_mean": 15889.3, + "valid_targets_min": 293 + }, + { + "epoch": 0.7926341072858286, + "grad_norm": 0.39971448523023917, + "learning_rate": 0.00011337400115401905, + "loss": 0.5908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6107337474822998, + "step": 2970, + "valid_targets_mean": 15658.9, + "valid_targets_min": 735 + }, + { + "epoch": 0.7939685081398452, + "grad_norm": 0.4915041380921517, + "learning_rate": 0.00011322380649637704, + "loss": 0.6056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6147445440292358, + "step": 2975, + "valid_targets_mean": 16253.0, + "valid_targets_min": 679 + }, + { + "epoch": 0.7953029089938618, + "grad_norm": 0.46231586052243284, + "learning_rate": 0.00011307340447234449, + "loss": 0.6138, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5767396092414856, + "step": 2980, + "valid_targets_mean": 17331.9, + "valid_targets_min": 234 + }, + { + "epoch": 0.7966373098478783, + "grad_norm": 0.4211986440934076, + "learning_rate": 0.00011292279589786115, + "loss": 0.5993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6300714015960693, + "step": 2985, + "valid_targets_mean": 16442.2, + "valid_targets_min": 695 + }, + { + "epoch": 0.7979717107018949, + "grad_norm": 0.31346676252674627, + "learning_rate": 0.00011277198158998744, + "loss": 0.6094, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5963038206100464, + "step": 2990, + "valid_targets_mean": 16258.1, + "valid_targets_min": 639 + }, + { + "epoch": 0.7993061115559114, + "grad_norm": 0.3152167692640102, + "learning_rate": 0.00011262096236689978, + "loss": 0.6156, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6168862581253052, + "step": 2995, + "valid_targets_mean": 16518.8, + "valid_targets_min": 139 + }, + { + "epoch": 0.800640512409928, + "grad_norm": 0.3798525858644061, + "learning_rate": 0.0001124697390478863, + "loss": 0.5946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5764780640602112, + "step": 3000, + "valid_targets_mean": 15923.1, + "valid_targets_min": 802 + }, + { + "epoch": 0.8019749132639445, + "grad_norm": 0.57419267937008, + "learning_rate": 0.00011231831245334238, + "loss": 0.6174, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5927503705024719, + "step": 3005, + "valid_targets_mean": 17187.9, + "valid_targets_min": 907 + }, + { + "epoch": 0.803309314117961, + "grad_norm": 0.43237740910495476, + "learning_rate": 0.00011216668340476618, + "loss": 0.5986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6266282796859741, + "step": 3010, + "valid_targets_mean": 15425.8, + "valid_targets_min": 346 + }, + { + "epoch": 0.8046437149719776, + "grad_norm": 0.4015442907401617, + "learning_rate": 0.00011201485272475416, + "loss": 0.6186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6169252395629883, + "step": 3015, + "valid_targets_mean": 15839.9, + "valid_targets_min": 772 + }, + { + "epoch": 0.8059781158259941, + "grad_norm": 0.9122981083934059, + "learning_rate": 0.00011186282123699664, + "loss": 0.6125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5926787853240967, + "step": 3020, + "valid_targets_mean": 14898.1, + "valid_targets_min": 193 + }, + { + "epoch": 0.8073125166800107, + "grad_norm": 0.36552132119276587, + "learning_rate": 0.00011171058976627341, + "loss": 0.6114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5867595672607422, + "step": 3025, + "valid_targets_mean": 15765.2, + "valid_targets_min": 341 + }, + { + "epoch": 0.8086469175340272, + "grad_norm": 0.41497109551666145, + "learning_rate": 0.00011155815913844906, + "loss": 0.6052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6065448522567749, + "step": 3030, + "valid_targets_mean": 14955.9, + "valid_targets_min": 417 + }, + { + "epoch": 0.8099813183880438, + "grad_norm": 0.4398597996121229, + "learning_rate": 0.00011140553018046872, + "loss": 0.6166, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6327465772628784, + "step": 3035, + "valid_targets_mean": 14344.6, + "valid_targets_min": 119 + }, + { + "epoch": 0.8113157192420604, + "grad_norm": 0.33965885966385906, + "learning_rate": 0.00011125270372035342, + "loss": 0.6056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5998932123184204, + "step": 3040, + "valid_targets_mean": 16106.6, + "valid_targets_min": 538 + }, + { + "epoch": 0.8126501200960768, + "grad_norm": 0.3850178772215109, + "learning_rate": 0.00011109968058719565, + "loss": 0.6035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6161537766456604, + "step": 3045, + "valid_targets_mean": 15463.7, + "valid_targets_min": 68 + }, + { + "epoch": 0.8139845209500934, + "grad_norm": 0.3256813424259837, + "learning_rate": 0.00011094646161115489, + "loss": 0.5999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5910052061080933, + "step": 3050, + "valid_targets_mean": 16663.1, + "valid_targets_min": 644 + }, + { + "epoch": 0.8153189218041099, + "grad_norm": 0.334038106311323, + "learning_rate": 0.00011079304762345307, + "loss": 0.6041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.598740816116333, + "step": 3055, + "valid_targets_mean": 16783.4, + "valid_targets_min": 595 + }, + { + "epoch": 0.8166533226581265, + "grad_norm": 0.48713259307598056, + "learning_rate": 0.00011063943945637005, + "loss": 0.5932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5953688621520996, + "step": 3060, + "valid_targets_mean": 17433.8, + "valid_targets_min": 384 + }, + { + "epoch": 0.817987723512143, + "grad_norm": 0.4173434520228628, + "learning_rate": 0.00011048563794323915, + "loss": 0.6041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6344270706176758, + "step": 3065, + "valid_targets_mean": 15606.3, + "valid_targets_min": 801 + }, + { + "epoch": 0.8193221243661596, + "grad_norm": 0.3197471666286986, + "learning_rate": 0.00011033164391844259, + "loss": 0.6086, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6131141185760498, + "step": 3070, + "valid_targets_mean": 15585.1, + "valid_targets_min": 425 + }, + { + "epoch": 0.8206565252201762, + "grad_norm": 0.3067640922164882, + "learning_rate": 0.00011017745821740696, + "loss": 0.6091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6086834669113159, + "step": 3075, + "valid_targets_mean": 15632.0, + "valid_targets_min": 592 + }, + { + "epoch": 0.8219909260741927, + "grad_norm": 0.443444899287974, + "learning_rate": 0.00011002308167659877, + "loss": 0.6186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5912847518920898, + "step": 3080, + "valid_targets_mean": 16956.1, + "valid_targets_min": 133 + }, + { + "epoch": 0.8233253269282093, + "grad_norm": 0.464873034571983, + "learning_rate": 0.00010986851513351976, + "loss": 0.6211, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6237614154815674, + "step": 3085, + "valid_targets_mean": 15150.4, + "valid_targets_min": 309 + }, + { + "epoch": 0.8246597277822257, + "grad_norm": 0.34073479026514153, + "learning_rate": 0.00010971375942670251, + "loss": 0.6453, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.65798020362854, + "step": 3090, + "valid_targets_mean": 16809.9, + "valid_targets_min": 143 + }, + { + "epoch": 0.8259941286362423, + "grad_norm": 0.3599346066190022, + "learning_rate": 0.00010955881539570581, + "loss": 0.6047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6177526116371155, + "step": 3095, + "valid_targets_mean": 15655.3, + "valid_targets_min": 531 + }, + { + "epoch": 0.8273285294902589, + "grad_norm": 0.2629035887316631, + "learning_rate": 0.00010940368388111008, + "loss": 0.5913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5859917402267456, + "step": 3100, + "valid_targets_mean": 15790.0, + "valid_targets_min": 654 + }, + { + "epoch": 0.8286629303442754, + "grad_norm": 0.3614709856971453, + "learning_rate": 0.00010924836572451287, + "loss": 0.6101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6259796023368835, + "step": 3105, + "valid_targets_mean": 16146.6, + "valid_targets_min": 671 + }, + { + "epoch": 0.829997331198292, + "grad_norm": 0.36915904463117755, + "learning_rate": 0.00010909286176852432, + "loss": 0.6102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.619566798210144, + "step": 3110, + "valid_targets_mean": 16112.4, + "valid_targets_min": 702 + }, + { + "epoch": 0.8313317320523085, + "grad_norm": 0.4478320563958947, + "learning_rate": 0.0001089371728567625, + "loss": 0.6019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5884507298469543, + "step": 3115, + "valid_targets_mean": 16453.3, + "valid_targets_min": 323 + }, + { + "epoch": 0.8326661329063251, + "grad_norm": 0.48113079680139226, + "learning_rate": 0.00010878129983384886, + "loss": 0.6014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5973682999610901, + "step": 3120, + "valid_targets_mean": 16576.3, + "valid_targets_min": 642 + }, + { + "epoch": 0.8340005337603416, + "grad_norm": 0.41747659934580694, + "learning_rate": 0.00010862524354540369, + "loss": 0.5978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5979155898094177, + "step": 3125, + "valid_targets_mean": 16300.0, + "valid_targets_min": 486 + }, + { + "epoch": 0.8353349346143581, + "grad_norm": 0.403178875264998, + "learning_rate": 0.00010846900483804152, + "loss": 0.6117, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6228663325309753, + "step": 3130, + "valid_targets_mean": 16295.0, + "valid_targets_min": 296 + }, + { + "epoch": 0.8366693354683747, + "grad_norm": 0.6520737963100881, + "learning_rate": 0.00010831258455936645, + "loss": 0.6267, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.634268045425415, + "step": 3135, + "valid_targets_mean": 15397.2, + "valid_targets_min": 500 + }, + { + "epoch": 0.8380037363223912, + "grad_norm": 0.4924864447083112, + "learning_rate": 0.00010815598355796771, + "loss": 0.6126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6175791025161743, + "step": 3140, + "valid_targets_mean": 15168.5, + "valid_targets_min": 613 + }, + { + "epoch": 0.8393381371764078, + "grad_norm": 0.3766799859442458, + "learning_rate": 0.0001079992026834149, + "loss": 0.6168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6296804547309875, + "step": 3145, + "valid_targets_mean": 16058.6, + "valid_targets_min": 647 + }, + { + "epoch": 0.8406725380304243, + "grad_norm": 0.3022993394113949, + "learning_rate": 0.00010784224278625345, + "loss": 0.6087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5977729558944702, + "step": 3150, + "valid_targets_mean": 16427.4, + "valid_targets_min": 547 + }, + { + "epoch": 0.8420069388844409, + "grad_norm": 0.3598287609839585, + "learning_rate": 0.00010768510471799996, + "loss": 0.5997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6242843866348267, + "step": 3155, + "valid_targets_mean": 16881.4, + "valid_targets_min": 487 + }, + { + "epoch": 0.8433413397384575, + "grad_norm": 0.3742423879144425, + "learning_rate": 0.00010752778933113774, + "loss": 0.6084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.609407365322113, + "step": 3160, + "valid_targets_mean": 15541.2, + "valid_targets_min": 619 + }, + { + "epoch": 0.844675740592474, + "grad_norm": 0.36522569966843305, + "learning_rate": 0.00010737029747911191, + "loss": 0.6241, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6038820743560791, + "step": 3165, + "valid_targets_mean": 16314.2, + "valid_targets_min": 778 + }, + { + "epoch": 0.8460101414464906, + "grad_norm": 0.3285028310007243, + "learning_rate": 0.00010721263001632503, + "loss": 0.6125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6167506575584412, + "step": 3170, + "valid_targets_mean": 16436.5, + "valid_targets_min": 98 + }, + { + "epoch": 0.847344542300507, + "grad_norm": 0.36921107249552737, + "learning_rate": 0.00010705478779813235, + "loss": 0.6148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6403708457946777, + "step": 3175, + "valid_targets_mean": 15671.0, + "valid_targets_min": 505 + }, + { + "epoch": 0.8486789431545236, + "grad_norm": 0.3430439116198908, + "learning_rate": 0.00010689677168083711, + "loss": 0.5979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6421139240264893, + "step": 3180, + "valid_targets_mean": 14922.0, + "valid_targets_min": 498 + }, + { + "epoch": 0.8500133440085401, + "grad_norm": 0.3799550119601048, + "learning_rate": 0.00010673858252168603, + "loss": 0.6144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6063963174819946, + "step": 3185, + "valid_targets_mean": 15838.3, + "valid_targets_min": 432 + }, + { + "epoch": 0.8513477448625567, + "grad_norm": 0.3060774420584932, + "learning_rate": 0.00010658022117886457, + "loss": 0.6103, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6487347483634949, + "step": 3190, + "valid_targets_mean": 16051.5, + "valid_targets_min": 735 + }, + { + "epoch": 0.8526821457165733, + "grad_norm": 0.3733579759265676, + "learning_rate": 0.00010642168851149229, + "loss": 0.6168, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6070621013641357, + "step": 3195, + "valid_targets_mean": 16092.5, + "valid_targets_min": 303 + }, + { + "epoch": 0.8540165465705898, + "grad_norm": 0.38626581096154744, + "learning_rate": 0.00010626298537961821, + "loss": 0.6018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6229579448699951, + "step": 3200, + "valid_targets_mean": 16702.4, + "valid_targets_min": 688 + }, + { + "epoch": 0.8553509474246064, + "grad_norm": 0.36477867910412903, + "learning_rate": 0.00010610411264421611, + "loss": 0.6099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6154232025146484, + "step": 3205, + "valid_targets_mean": 16684.9, + "valid_targets_min": 718 + }, + { + "epoch": 0.8566853482786229, + "grad_norm": 0.36198405688505025, + "learning_rate": 0.0001059450711671799, + "loss": 0.6128, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6101678013801575, + "step": 3210, + "valid_targets_mean": 15619.2, + "valid_targets_min": 259 + }, + { + "epoch": 0.8580197491326395, + "grad_norm": 0.32113133660955206, + "learning_rate": 0.0001057858618113189, + "loss": 0.6224, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6320436596870422, + "step": 3215, + "valid_targets_mean": 15215.8, + "valid_targets_min": 744 + }, + { + "epoch": 0.859354149986656, + "grad_norm": 0.3435642080760044, + "learning_rate": 0.00010562648544035323, + "loss": 0.606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6011517643928528, + "step": 3220, + "valid_targets_mean": 15546.4, + "valid_targets_min": 395 + }, + { + "epoch": 0.8606885508406725, + "grad_norm": 0.31579139858324407, + "learning_rate": 0.00010546694291890902, + "loss": 0.5854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6084245443344116, + "step": 3225, + "valid_targets_mean": 14603.2, + "valid_targets_min": 737 + }, + { + "epoch": 0.8620229516946891, + "grad_norm": 0.34765535513552315, + "learning_rate": 0.00010530723511251382, + "loss": 0.6144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6162877082824707, + "step": 3230, + "valid_targets_mean": 15704.7, + "valid_targets_min": 468 + }, + { + "epoch": 0.8633573525487056, + "grad_norm": 0.4299871031279047, + "learning_rate": 0.0001051473628875918, + "loss": 0.6078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6121437549591064, + "step": 3235, + "valid_targets_mean": 15767.7, + "valid_targets_min": 344 + }, + { + "epoch": 0.8646917534027222, + "grad_norm": 0.5574544856474637, + "learning_rate": 0.00010498732711145918, + "loss": 0.6201, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6257040500640869, + "step": 3240, + "valid_targets_mean": 15540.5, + "valid_targets_min": 820 + }, + { + "epoch": 0.8660261542567387, + "grad_norm": 0.42323183273983017, + "learning_rate": 0.00010482712865231942, + "loss": 0.5843, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5765583515167236, + "step": 3245, + "valid_targets_mean": 16329.5, + "valid_targets_min": 473 + }, + { + "epoch": 0.8673605551107553, + "grad_norm": 0.28174129439551565, + "learning_rate": 0.00010466676837925857, + "loss": 0.6054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6117812395095825, + "step": 3250, + "valid_targets_mean": 16464.4, + "valid_targets_min": 584 + }, + { + "epoch": 0.8686949559647719, + "grad_norm": 0.3346385254721476, + "learning_rate": 0.00010450624716224045, + "loss": 0.6173, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6023174524307251, + "step": 3255, + "valid_targets_mean": 15990.7, + "valid_targets_min": 709 + }, + { + "epoch": 0.8700293568187883, + "grad_norm": 0.2584890129520337, + "learning_rate": 0.00010434556587210214, + "loss": 0.6004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6040849685668945, + "step": 3260, + "valid_targets_mean": 17105.3, + "valid_targets_min": 670 + }, + { + "epoch": 0.8713637576728049, + "grad_norm": 0.3297204401029785, + "learning_rate": 0.000104184725380549, + "loss": 0.6214, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5984177589416504, + "step": 3265, + "valid_targets_mean": 16792.4, + "valid_targets_min": 341 + }, + { + "epoch": 0.8726981585268214, + "grad_norm": 0.3848946663409018, + "learning_rate": 0.0001040237265601502, + "loss": 0.6112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.589970588684082, + "step": 3270, + "valid_targets_mean": 17034.3, + "valid_targets_min": 10 + }, + { + "epoch": 0.874032559380838, + "grad_norm": 0.2959705381837207, + "learning_rate": 0.00010386257028433366, + "loss": 0.6037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6227315664291382, + "step": 3275, + "valid_targets_mean": 14472.7, + "valid_targets_min": 248 + }, + { + "epoch": 0.8753669602348545, + "grad_norm": 0.4417862059825601, + "learning_rate": 0.00010370125742738173, + "loss": 0.6033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5997108221054077, + "step": 3280, + "valid_targets_mean": 16168.1, + "valid_targets_min": 538 + }, + { + "epoch": 0.8767013610888711, + "grad_norm": 0.37525797564764835, + "learning_rate": 0.00010353978886442605, + "loss": 0.6264, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6209875345230103, + "step": 3285, + "valid_targets_mean": 15834.1, + "valid_targets_min": 137 + }, + { + "epoch": 0.8780357619428877, + "grad_norm": 0.3241866530396012, + "learning_rate": 0.00010337816547144308, + "loss": 0.6302, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6284918189048767, + "step": 3290, + "valid_targets_mean": 15657.5, + "valid_targets_min": 822 + }, + { + "epoch": 0.8793701627969042, + "grad_norm": 0.3160018728632203, + "learning_rate": 0.00010321638812524917, + "loss": 0.6155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6200350522994995, + "step": 3295, + "valid_targets_mean": 16819.1, + "valid_targets_min": 361 + }, + { + "epoch": 0.8807045636509208, + "grad_norm": 0.322845974931051, + "learning_rate": 0.00010305445770349593, + "loss": 0.6024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6223856806755066, + "step": 3300, + "valid_targets_mean": 16542.1, + "valid_targets_min": 402 + }, + { + "epoch": 0.8820389645049372, + "grad_norm": 0.4608365284178052, + "learning_rate": 0.00010289237508466536, + "loss": 0.6057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6043040752410889, + "step": 3305, + "valid_targets_mean": 15211.4, + "valid_targets_min": 534 + }, + { + "epoch": 0.8833733653589538, + "grad_norm": 0.4690910299930012, + "learning_rate": 0.00010273014114806517, + "loss": 0.5999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6026057004928589, + "step": 3310, + "valid_targets_mean": 15156.6, + "valid_targets_min": 572 + }, + { + "epoch": 0.8847077662129704, + "grad_norm": 0.4201149153301678, + "learning_rate": 0.000102567756773824, + "loss": 0.6134, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5694378018379211, + "step": 3315, + "valid_targets_mean": 16189.5, + "valid_targets_min": 693 + }, + { + "epoch": 0.8860421670669869, + "grad_norm": 0.4201365080338633, + "learning_rate": 0.00010240522284288657, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6202242374420166, + "step": 3320, + "valid_targets_mean": 14022.6, + "valid_targets_min": 413 + }, + { + "epoch": 0.8873765679210035, + "grad_norm": 0.4654591928652114, + "learning_rate": 0.00010224254023700899, + "loss": 0.6131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6067278385162354, + "step": 3325, + "valid_targets_mean": 16067.8, + "valid_targets_min": 703 + }, + { + "epoch": 0.88871096877502, + "grad_norm": 0.35180283178941474, + "learning_rate": 0.00010207970983875395, + "loss": 0.6147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6386433839797974, + "step": 3330, + "valid_targets_mean": 15235.7, + "valid_targets_min": 610 + }, + { + "epoch": 0.8900453696290366, + "grad_norm": 0.33352068396479145, + "learning_rate": 0.00010191673253148589, + "loss": 0.609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6070728302001953, + "step": 3335, + "valid_targets_mean": 15675.0, + "valid_targets_min": 390 + }, + { + "epoch": 0.8913797704830531, + "grad_norm": 0.3736462263125514, + "learning_rate": 0.00010175360919936623, + "loss": 0.611, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5979476571083069, + "step": 3340, + "valid_targets_mean": 16730.8, + "valid_targets_min": 463 + }, + { + "epoch": 0.8927141713370697, + "grad_norm": 0.3270191279863833, + "learning_rate": 0.00010159034072734865, + "loss": 0.5914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5909374356269836, + "step": 3345, + "valid_targets_mean": 16453.6, + "valid_targets_min": 380 + }, + { + "epoch": 0.8940485721910862, + "grad_norm": 0.36081202928209205, + "learning_rate": 0.00010142692800117416, + "loss": 0.6028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6175713539123535, + "step": 3350, + "valid_targets_mean": 16360.4, + "valid_targets_min": 549 + }, + { + "epoch": 0.8953829730451027, + "grad_norm": 0.28276237364863666, + "learning_rate": 0.00010126337190736636, + "loss": 0.6085, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6301509141921997, + "step": 3355, + "valid_targets_mean": 15152.6, + "valid_targets_min": 71 + }, + { + "epoch": 0.8967173738991193, + "grad_norm": 0.2872918873302433, + "learning_rate": 0.00010109967333322669, + "loss": 0.6069, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6228970289230347, + "step": 3360, + "valid_targets_mean": 15857.6, + "valid_targets_min": 736 + }, + { + "epoch": 0.8980517747531358, + "grad_norm": 0.3265392681478234, + "learning_rate": 0.00010093583316682945, + "loss": 0.6048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.63560950756073, + "step": 3365, + "valid_targets_mean": 14328.4, + "valid_targets_min": 516 + }, + { + "epoch": 0.8993861756071524, + "grad_norm": 0.28161790268306824, + "learning_rate": 0.00010077185229701722, + "loss": 0.6036, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.597403883934021, + "step": 3370, + "valid_targets_mean": 15919.6, + "valid_targets_min": 292 + }, + { + "epoch": 0.900720576461169, + "grad_norm": 0.3825874335065564, + "learning_rate": 0.00010060773161339574, + "loss": 0.5992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.624705970287323, + "step": 3375, + "valid_targets_mean": 15714.4, + "valid_targets_min": 82 + }, + { + "epoch": 0.9020549773151855, + "grad_norm": 0.5458605458372956, + "learning_rate": 0.00010044347200632943, + "loss": 0.5989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5926228761672974, + "step": 3380, + "valid_targets_mean": 15382.2, + "valid_targets_min": 485 + }, + { + "epoch": 0.9033893781692021, + "grad_norm": 0.44645818132465365, + "learning_rate": 0.00010027907436693623, + "loss": 0.6095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6042912006378174, + "step": 3385, + "valid_targets_mean": 14443.6, + "valid_targets_min": 414 + }, + { + "epoch": 0.9047237790232185, + "grad_norm": 0.34305195074771816, + "learning_rate": 0.00010011453958708297, + "loss": 0.6125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5844123363494873, + "step": 3390, + "valid_targets_mean": 15720.4, + "valid_targets_min": 502 + }, + { + "epoch": 0.9060581798772351, + "grad_norm": 0.41868384483343835, + "learning_rate": 9.994986855938047e-05, + "loss": 0.609, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.588081955909729, + "step": 3395, + "valid_targets_mean": 16701.1, + "valid_targets_min": 664 + }, + { + "epoch": 0.9073925807312516, + "grad_norm": 0.3945502563027158, + "learning_rate": 9.978506217717874e-05, + "loss": 0.6019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.579233705997467, + "step": 3400, + "valid_targets_mean": 16139.0, + "valid_targets_min": 676 + }, + { + "epoch": 0.9087269815852682, + "grad_norm": 0.4392212981591805, + "learning_rate": 9.962012133456204e-05, + "loss": 0.6129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6045866012573242, + "step": 3405, + "valid_targets_mean": 16258.9, + "valid_targets_min": 368 + }, + { + "epoch": 0.9100613824392848, + "grad_norm": 0.5664907112861385, + "learning_rate": 9.945504692634409e-05, + "loss": 0.5989, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.576043963432312, + "step": 3410, + "valid_targets_mean": 15018.4, + "valid_targets_min": 648 + }, + { + "epoch": 0.9113957832933013, + "grad_norm": 0.5588994820568607, + "learning_rate": 9.928983984806326e-05, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6139967441558838, + "step": 3415, + "valid_targets_mean": 16057.7, + "valid_targets_min": 538 + }, + { + "epoch": 0.9127301841473179, + "grad_norm": 0.5421048040367675, + "learning_rate": 9.912450099597765e-05, + "loss": 0.6028, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6360303163528442, + "step": 3420, + "valid_targets_mean": 15415.0, + "valid_targets_min": 705 + }, + { + "epoch": 0.9140645850013344, + "grad_norm": 0.6742729587621604, + "learning_rate": 9.895903126706019e-05, + "loss": 0.608, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6016721129417419, + "step": 3425, + "valid_targets_mean": 15982.4, + "valid_targets_min": 450 + }, + { + "epoch": 0.915398985855351, + "grad_norm": 0.523298202464321, + "learning_rate": 9.879343155899382e-05, + "loss": 0.5938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5959682464599609, + "step": 3430, + "valid_targets_mean": 15555.7, + "valid_targets_min": 795 + }, + { + "epoch": 0.9167333867093675, + "grad_norm": 0.556504006712715, + "learning_rate": 9.862770277016676e-05, + "loss": 0.6054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6146102547645569, + "step": 3435, + "valid_targets_mean": 16316.7, + "valid_targets_min": 716 + }, + { + "epoch": 0.918067787563384, + "grad_norm": 0.5926906258765555, + "learning_rate": 9.846184579966733e-05, + "loss": 0.6017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5958269238471985, + "step": 3440, + "valid_targets_mean": 16558.8, + "valid_targets_min": 502 + }, + { + "epoch": 0.9194021884174006, + "grad_norm": 0.6279864400454699, + "learning_rate": 9.829586154727933e-05, + "loss": 0.6113, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5914964079856873, + "step": 3445, + "valid_targets_mean": 15705.2, + "valid_targets_min": 843 + }, + { + "epoch": 0.9207365892714171, + "grad_norm": 0.5296792410221006, + "learning_rate": 9.812975091347706e-05, + "loss": 0.5973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6114808320999146, + "step": 3450, + "valid_targets_mean": 15067.1, + "valid_targets_min": 576 + }, + { + "epoch": 0.9220709901254337, + "grad_norm": 0.5816183075645648, + "learning_rate": 9.796351479942047e-05, + "loss": 0.6098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.593274712562561, + "step": 3455, + "valid_targets_mean": 16594.1, + "valid_targets_min": 438 + }, + { + "epoch": 0.9234053909794502, + "grad_norm": 0.5769841624751353, + "learning_rate": 9.779715410695015e-05, + "loss": 0.6065, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5925379395484924, + "step": 3460, + "valid_targets_mean": 16822.5, + "valid_targets_min": 408 + }, + { + "epoch": 0.9247397918334668, + "grad_norm": 0.6119656142684935, + "learning_rate": 9.76306697385827e-05, + "loss": 0.6102, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5965239405632019, + "step": 3465, + "valid_targets_mean": 16336.2, + "valid_targets_min": 721 + }, + { + "epoch": 0.9260741926874834, + "grad_norm": 0.5978678471828447, + "learning_rate": 9.746406259750552e-05, + "loss": 0.6204, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623969554901123, + "step": 3470, + "valid_targets_mean": 14696.4, + "valid_targets_min": 574 + }, + { + "epoch": 0.9274085935414998, + "grad_norm": 0.5392574518557786, + "learning_rate": 9.729733358757213e-05, + "loss": 0.5921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6138155460357666, + "step": 3475, + "valid_targets_mean": 16144.3, + "valid_targets_min": 762 + }, + { + "epoch": 0.9287429943955164, + "grad_norm": 0.546975568741761, + "learning_rate": 9.713048361329715e-05, + "loss": 0.6044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5964043140411377, + "step": 3480, + "valid_targets_mean": 16867.3, + "valid_targets_min": 407 + }, + { + "epoch": 0.9300773952495329, + "grad_norm": 0.590321559873573, + "learning_rate": 9.696351357985154e-05, + "loss": 0.6209, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6271519660949707, + "step": 3485, + "valid_targets_mean": 14657.9, + "valid_targets_min": 652 + }, + { + "epoch": 0.9314117961035495, + "grad_norm": 0.4609890304723043, + "learning_rate": 9.679642439305744e-05, + "loss": 0.618, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6284685730934143, + "step": 3490, + "valid_targets_mean": 16037.7, + "valid_targets_min": 769 + }, + { + "epoch": 0.932746196957566, + "grad_norm": 0.5460416444420783, + "learning_rate": 9.662921695938354e-05, + "loss": 0.5986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6472452282905579, + "step": 3495, + "valid_targets_mean": 15298.9, + "valid_targets_min": 659 + }, + { + "epoch": 0.9340805978115826, + "grad_norm": 0.4599174267849713, + "learning_rate": 9.646189218593992e-05, + "loss": 0.6074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5882945656776428, + "step": 3500, + "valid_targets_mean": 15542.3, + "valid_targets_min": 453 + }, + { + "epoch": 0.9354149986655992, + "grad_norm": 0.5595444795518102, + "learning_rate": 9.629445098047334e-05, + "loss": 0.6169, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6238095760345459, + "step": 3505, + "valid_targets_mean": 16269.1, + "valid_targets_min": 338 + }, + { + "epoch": 0.9367493995196157, + "grad_norm": 0.3894759895544851, + "learning_rate": 9.61268942513621e-05, + "loss": 0.5954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5966178774833679, + "step": 3510, + "valid_targets_mean": 15001.4, + "valid_targets_min": 760 + }, + { + "epoch": 0.9380838003736323, + "grad_norm": 0.4979215250445888, + "learning_rate": 9.595922290761128e-05, + "loss": 0.6126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6272135972976685, + "step": 3515, + "valid_targets_mean": 16634.0, + "valid_targets_min": 628 + }, + { + "epoch": 0.9394182012276487, + "grad_norm": 0.3927564720256912, + "learning_rate": 9.579143785884779e-05, + "loss": 0.5916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5718698501586914, + "step": 3520, + "valid_targets_mean": 16832.0, + "valid_targets_min": 886 + }, + { + "epoch": 0.9407526020816653, + "grad_norm": 0.43211562604456244, + "learning_rate": 9.562354001531532e-05, + "loss": 0.6158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5840474367141724, + "step": 3525, + "valid_targets_mean": 15508.1, + "valid_targets_min": 355 + }, + { + "epoch": 0.9420870029356819, + "grad_norm": 0.4128672941000394, + "learning_rate": 9.545553028786952e-05, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5857966542243958, + "step": 3530, + "valid_targets_mean": 15651.6, + "valid_targets_min": 727 + }, + { + "epoch": 0.9434214037896984, + "grad_norm": 0.3634747021780349, + "learning_rate": 9.5287409587973e-05, + "loss": 0.6033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6025322675704956, + "step": 3535, + "valid_targets_mean": 15089.4, + "valid_targets_min": 629 + }, + { + "epoch": 0.944755804643715, + "grad_norm": 0.3521546765730756, + "learning_rate": 9.511917882769042e-05, + "loss": 0.6005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6014447808265686, + "step": 3540, + "valid_targets_mean": 16103.0, + "valid_targets_min": 922 + }, + { + "epoch": 0.9460902054977315, + "grad_norm": 0.3187808407216376, + "learning_rate": 9.495083891968351e-05, + "loss": 0.6097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5850682854652405, + "step": 3545, + "valid_targets_mean": 15095.1, + "valid_targets_min": 163 + }, + { + "epoch": 0.9474246063517481, + "grad_norm": 0.3198484300211676, + "learning_rate": 9.478239077720615e-05, + "loss": 0.6122, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6104428768157959, + "step": 3550, + "valid_targets_mean": 16228.7, + "valid_targets_min": 764 + }, + { + "epoch": 0.9487590072057646, + "grad_norm": 0.3181476862431669, + "learning_rate": 9.461383531409937e-05, + "loss": 0.6013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6085827350616455, + "step": 3555, + "valid_targets_mean": 16036.3, + "valid_targets_min": 441 + }, + { + "epoch": 0.9500934080597812, + "grad_norm": 0.29736598906741296, + "learning_rate": 9.444517344478645e-05, + "loss": 0.6099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5716111660003662, + "step": 3560, + "valid_targets_mean": 16294.4, + "valid_targets_min": 588 + }, + { + "epoch": 0.9514278089137977, + "grad_norm": 0.3542780709853529, + "learning_rate": 9.427640608426789e-05, + "loss": 0.6045, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.600184977054596, + "step": 3565, + "valid_targets_mean": 16048.9, + "valid_targets_min": 431 + }, + { + "epoch": 0.9527622097678142, + "grad_norm": 0.2694226538412474, + "learning_rate": 9.410753414811654e-05, + "loss": 0.5991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5748517513275146, + "step": 3570, + "valid_targets_mean": 16511.5, + "valid_targets_min": 652 + }, + { + "epoch": 0.9540966106218308, + "grad_norm": 0.34003100557255933, + "learning_rate": 9.393855855247254e-05, + "loss": 0.6299, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6436910033226013, + "step": 3575, + "valid_targets_mean": 16154.0, + "valid_targets_min": 647 + }, + { + "epoch": 0.9554310114758473, + "grad_norm": 0.30757421140605506, + "learning_rate": 9.376948021403838e-05, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5963718891143799, + "step": 3580, + "valid_targets_mean": 16212.5, + "valid_targets_min": 185 + }, + { + "epoch": 0.9567654123298639, + "grad_norm": 0.24627952846755352, + "learning_rate": 9.360030005007399e-05, + "loss": 0.6087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5852136015892029, + "step": 3585, + "valid_targets_mean": 15584.9, + "valid_targets_min": 424 + }, + { + "epoch": 0.9580998131838805, + "grad_norm": 0.4008105415564908, + "learning_rate": 9.343101897839169e-05, + "loss": 0.6124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.637090802192688, + "step": 3590, + "valid_targets_mean": 15035.9, + "valid_targets_min": 489 + }, + { + "epoch": 0.959434214037897, + "grad_norm": 0.3175824226253769, + "learning_rate": 9.326163791735116e-05, + "loss": 0.5915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6040235161781311, + "step": 3595, + "valid_targets_mean": 16532.5, + "valid_targets_min": 980 + }, + { + "epoch": 0.9607686148919136, + "grad_norm": 0.2967552407153772, + "learning_rate": 9.309215778585461e-05, + "loss": 0.6081, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6449960470199585, + "step": 3600, + "valid_targets_mean": 16095.4, + "valid_targets_min": 539 + }, + { + "epoch": 0.96210301574593, + "grad_norm": 0.27300528101957167, + "learning_rate": 9.29225795033417e-05, + "loss": 0.6151, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.600953221321106, + "step": 3605, + "valid_targets_mean": 16097.2, + "valid_targets_min": 574 + }, + { + "epoch": 0.9634374165999466, + "grad_norm": 0.34659082635686456, + "learning_rate": 9.275290398978454e-05, + "loss": 0.6258, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6250200271606445, + "step": 3610, + "valid_targets_mean": 14943.5, + "valid_targets_min": 359 + }, + { + "epoch": 0.9647718174539631, + "grad_norm": 0.2768182893205293, + "learning_rate": 9.258313216568273e-05, + "loss": 0.6089, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6249918937683105, + "step": 3615, + "valid_targets_mean": 16153.6, + "valid_targets_min": 514 + }, + { + "epoch": 0.9661062183079797, + "grad_norm": 0.2856620183403404, + "learning_rate": 9.241326495205836e-05, + "loss": 0.6155, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6104844808578491, + "step": 3620, + "valid_targets_mean": 15287.8, + "valid_targets_min": 692 + }, + { + "epoch": 0.9674406191619963, + "grad_norm": 0.28353965965788425, + "learning_rate": 9.224330327045105e-05, + "loss": 0.5971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5877224802970886, + "step": 3625, + "valid_targets_mean": 15522.9, + "valid_targets_min": 805 + }, + { + "epoch": 0.9687750200160128, + "grad_norm": 0.24175798876635027, + "learning_rate": 9.207324804291285e-05, + "loss": 0.6101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5926316976547241, + "step": 3630, + "valid_targets_mean": 16090.8, + "valid_targets_min": 517 + }, + { + "epoch": 0.9701094208700294, + "grad_norm": 0.27316066602702954, + "learning_rate": 9.190310019200338e-05, + "loss": 0.6062, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5892231464385986, + "step": 3635, + "valid_targets_mean": 16473.6, + "valid_targets_min": 460 + }, + { + "epoch": 0.9714438217240459, + "grad_norm": 0.2955367891918511, + "learning_rate": 9.173286064078465e-05, + "loss": 0.6246, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6512964963912964, + "step": 3640, + "valid_targets_mean": 15582.8, + "valid_targets_min": 567 + }, + { + "epoch": 0.9727782225780625, + "grad_norm": 0.27556938116596297, + "learning_rate": 9.156253031281625e-05, + "loss": 0.6205, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6214442253112793, + "step": 3645, + "valid_targets_mean": 14921.4, + "valid_targets_min": 761 + }, + { + "epoch": 0.974112623432079, + "grad_norm": 0.2582864150794311, + "learning_rate": 9.139211013215013e-05, + "loss": 0.6159, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.62605881690979, + "step": 3650, + "valid_targets_mean": 15899.8, + "valid_targets_min": 147 + }, + { + "epoch": 0.9754470242860955, + "grad_norm": 0.27919860547561176, + "learning_rate": 9.122160102332583e-05, + "loss": 0.6124, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5860695242881775, + "step": 3655, + "valid_targets_mean": 16154.2, + "valid_targets_min": 225 + }, + { + "epoch": 0.9767814251401121, + "grad_norm": 0.3429673890231037, + "learning_rate": 9.105100391136523e-05, + "loss": 0.5969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6048210263252258, + "step": 3660, + "valid_targets_mean": 15284.5, + "valid_targets_min": 830 + }, + { + "epoch": 0.9781158259941286, + "grad_norm": 0.25992997840803017, + "learning_rate": 9.088031972176764e-05, + "loss": 0.597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5927121639251709, + "step": 3665, + "valid_targets_mean": 16107.3, + "valid_targets_min": 804 + }, + { + "epoch": 0.9794502268481452, + "grad_norm": 0.3105241091189908, + "learning_rate": 9.070954938050482e-05, + "loss": 0.6177, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6217231750488281, + "step": 3670, + "valid_targets_mean": 15208.2, + "valid_targets_min": 336 + }, + { + "epoch": 0.9807846277021617, + "grad_norm": 0.29322134040149855, + "learning_rate": 9.053869381401589e-05, + "loss": 0.6078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6112452745437622, + "step": 3675, + "valid_targets_mean": 15493.6, + "valid_targets_min": 570 + }, + { + "epoch": 0.9821190285561783, + "grad_norm": 0.25629999684865057, + "learning_rate": 9.036775394920228e-05, + "loss": 0.6087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5787304639816284, + "step": 3680, + "valid_targets_mean": 17701.9, + "valid_targets_min": 313 + }, + { + "epoch": 0.9834534294101949, + "grad_norm": 0.31739063948027607, + "learning_rate": 9.01967307134228e-05, + "loss": 0.6044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5753624439239502, + "step": 3685, + "valid_targets_mean": 16942.6, + "valid_targets_min": 586 + }, + { + "epoch": 0.9847878302642114, + "grad_norm": 0.2630316702217527, + "learning_rate": 9.00256250344885e-05, + "loss": 0.5962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5995844602584839, + "step": 3690, + "valid_targets_mean": 17047.1, + "valid_targets_min": 488 + }, + { + "epoch": 0.9861222311182279, + "grad_norm": 0.2870742144270906, + "learning_rate": 8.985443784065774e-05, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234308481216431, + "step": 3695, + "valid_targets_mean": 16177.1, + "valid_targets_min": 441 + }, + { + "epoch": 0.9874566319722444, + "grad_norm": 0.2870968766409778, + "learning_rate": 8.968317006063107e-05, + "loss": 0.6052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6069310903549194, + "step": 3700, + "valid_targets_mean": 15818.8, + "valid_targets_min": 670 + }, + { + "epoch": 0.988791032826261, + "grad_norm": 0.3201633458743414, + "learning_rate": 8.951182262354624e-05, + "loss": 0.5855, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.596049427986145, + "step": 3705, + "valid_targets_mean": 15979.8, + "valid_targets_min": 926 + }, + { + "epoch": 0.9901254336802775, + "grad_norm": 0.45292184212025816, + "learning_rate": 8.934039645897316e-05, + "loss": 0.6119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6308547258377075, + "step": 3710, + "valid_targets_mean": 16358.6, + "valid_targets_min": 708 + }, + { + "epoch": 0.9914598345342941, + "grad_norm": 0.37136557232397777, + "learning_rate": 8.916889249690877e-05, + "loss": 0.6218, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6080734133720398, + "step": 3715, + "valid_targets_mean": 15775.9, + "valid_targets_min": 124 + }, + { + "epoch": 0.9927942353883107, + "grad_norm": 0.3059224517778049, + "learning_rate": 8.899731166777216e-05, + "loss": 0.6203, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5962896943092346, + "step": 3720, + "valid_targets_mean": 16839.4, + "valid_targets_min": 102 + }, + { + "epoch": 0.9941286362423272, + "grad_norm": 0.41060114220604527, + "learning_rate": 8.882565490239935e-05, + "loss": 0.5876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5867825746536255, + "step": 3725, + "valid_targets_mean": 15651.4, + "valid_targets_min": 476 + }, + { + "epoch": 0.9954630370963438, + "grad_norm": 0.287734059966752, + "learning_rate": 8.865392313203839e-05, + "loss": 0.6016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5873230695724487, + "step": 3730, + "valid_targets_mean": 15009.5, + "valid_targets_min": 634 + }, + { + "epoch": 0.9967974379503602, + "grad_norm": 0.3042666420646906, + "learning_rate": 8.848211728834415e-05, + "loss": 0.625, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6030747890472412, + "step": 3735, + "valid_targets_mean": 15472.2, + "valid_targets_min": 323 + }, + { + "epoch": 0.9981318388043768, + "grad_norm": 0.2796652765372023, + "learning_rate": 8.831023830337348e-05, + "loss": 0.6217, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6056950092315674, + "step": 3740, + "valid_targets_mean": 14817.1, + "valid_targets_min": 435 + }, + { + "epoch": 0.9994662396583934, + "grad_norm": 0.28730214935887727, + "learning_rate": 8.813828710957987e-05, + "loss": 0.5884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6174252033233643, + "step": 3745, + "valid_targets_mean": 15888.3, + "valid_targets_min": 496 + }, + { + "epoch": 1.00080064051241, + "grad_norm": 0.2735137322124431, + "learning_rate": 8.796626463980863e-05, + "loss": 0.5954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6183410286903381, + "step": 3750, + "valid_targets_mean": 17187.5, + "valid_targets_min": 700 + }, + { + "epoch": 1.0021350413664265, + "grad_norm": 0.23838304440126826, + "learning_rate": 8.779417182729181e-05, + "loss": 0.6026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5817262530326843, + "step": 3755, + "valid_targets_mean": 16220.9, + "valid_targets_min": 614 + }, + { + "epoch": 1.003469442220443, + "grad_norm": 0.44839831654591217, + "learning_rate": 8.762200960564295e-05, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6195690035820007, + "step": 3760, + "valid_targets_mean": 16122.4, + "valid_targets_min": 215 + }, + { + "epoch": 1.0048038430744595, + "grad_norm": 0.27158246380773216, + "learning_rate": 8.744977890885218e-05, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6100062131881714, + "step": 3765, + "valid_targets_mean": 15919.8, + "valid_targets_min": 800 + }, + { + "epoch": 1.006138243928476, + "grad_norm": 0.2806714085545213, + "learning_rate": 8.727748067128116e-05, + "loss": 0.6074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6355049014091492, + "step": 3770, + "valid_targets_mean": 14672.5, + "valid_targets_min": 587 + }, + { + "epoch": 1.0074726447824927, + "grad_norm": 0.2658647270458597, + "learning_rate": 8.71051158276579e-05, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.594117283821106, + "step": 3775, + "valid_targets_mean": 17941.1, + "valid_targets_min": 567 + }, + { + "epoch": 1.0088070456365092, + "grad_norm": 0.3368849544158226, + "learning_rate": 8.693268531307182e-05, + "loss": 0.6119, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6125128269195557, + "step": 3780, + "valid_targets_mean": 15490.7, + "valid_targets_min": 526 + }, + { + "epoch": 1.0101414464905258, + "grad_norm": 0.2855946808005626, + "learning_rate": 8.676019006296851e-05, + "loss": 0.6057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5923916101455688, + "step": 3785, + "valid_targets_mean": 16882.1, + "valid_targets_min": 344 + }, + { + "epoch": 1.0114758473445422, + "grad_norm": 0.2487870371227702, + "learning_rate": 8.658763101314484e-05, + "loss": 0.6095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5815153121948242, + "step": 3790, + "valid_targets_mean": 15732.1, + "valid_targets_min": 775 + }, + { + "epoch": 1.0128102481985588, + "grad_norm": 0.2702522146979926, + "learning_rate": 8.64150090997438e-05, + "loss": 0.5956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6120627522468567, + "step": 3795, + "valid_targets_mean": 15799.6, + "valid_targets_min": 644 + }, + { + "epoch": 1.0141446490525754, + "grad_norm": 0.31275492888858597, + "learning_rate": 8.624232525924936e-05, + "loss": 0.607, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6010204553604126, + "step": 3800, + "valid_targets_mean": 16183.2, + "valid_targets_min": 683 + }, + { + "epoch": 1.015479049906592, + "grad_norm": 0.2714797189470768, + "learning_rate": 8.606958042848145e-05, + "loss": 0.6059, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5856226682662964, + "step": 3805, + "valid_targets_mean": 16296.6, + "valid_targets_min": 519 + }, + { + "epoch": 1.0168134507606086, + "grad_norm": 0.24184649907456296, + "learning_rate": 8.589677554459094e-05, + "loss": 0.5885, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5947768688201904, + "step": 3810, + "valid_targets_mean": 17623.0, + "valid_targets_min": 91 + }, + { + "epoch": 1.018147851614625, + "grad_norm": 0.21960448002011657, + "learning_rate": 8.572391154505444e-05, + "loss": 0.5863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5928741693496704, + "step": 3815, + "valid_targets_mean": 15627.8, + "valid_targets_min": 783 + }, + { + "epoch": 1.0194822524686415, + "grad_norm": 0.33082622819338225, + "learning_rate": 8.555098936766927e-05, + "loss": 0.5957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6214810013771057, + "step": 3820, + "valid_targets_mean": 14932.7, + "valid_targets_min": 683 + }, + { + "epoch": 1.0208166533226581, + "grad_norm": 0.3375992376978062, + "learning_rate": 8.537800995054838e-05, + "loss": 0.6157, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6424602270126343, + "step": 3825, + "valid_targets_mean": 15787.0, + "valid_targets_min": 733 + }, + { + "epoch": 1.0221510541766747, + "grad_norm": 0.293029681044579, + "learning_rate": 8.520497423211527e-05, + "loss": 0.5826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5864099860191345, + "step": 3830, + "valid_targets_mean": 15670.6, + "valid_targets_min": 114 + }, + { + "epoch": 1.0234854550306913, + "grad_norm": 0.26359125702311575, + "learning_rate": 8.503188315109881e-05, + "loss": 0.6114, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.592563807964325, + "step": 3835, + "valid_targets_mean": 15773.3, + "valid_targets_min": 570 + }, + { + "epoch": 1.0248198558847077, + "grad_norm": 0.2762342311611941, + "learning_rate": 8.485873764652832e-05, + "loss": 0.5968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5965045094490051, + "step": 3840, + "valid_targets_mean": 16424.9, + "valid_targets_min": 771 + }, + { + "epoch": 1.0261542567387243, + "grad_norm": 0.29960406026858055, + "learning_rate": 8.468553865772826e-05, + "loss": 0.585, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5900242328643799, + "step": 3845, + "valid_targets_mean": 16089.0, + "valid_targets_min": 507 + }, + { + "epoch": 1.0274886575927409, + "grad_norm": 0.3654350862443785, + "learning_rate": 8.451228712431332e-05, + "loss": 0.5997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6008077263832092, + "step": 3850, + "valid_targets_mean": 17085.4, + "valid_targets_min": 679 + }, + { + "epoch": 1.0288230584467575, + "grad_norm": 0.39564743981799033, + "learning_rate": 8.433898398618319e-05, + "loss": 0.6076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5913037657737732, + "step": 3855, + "valid_targets_mean": 15768.2, + "valid_targets_min": 654 + }, + { + "epoch": 1.0301574593007738, + "grad_norm": 0.47340182038873624, + "learning_rate": 8.416563018351758e-05, + "loss": 0.5866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6292645931243896, + "step": 3860, + "valid_targets_mean": 14999.9, + "valid_targets_min": 510 + }, + { + "epoch": 1.0314918601547904, + "grad_norm": 0.39882755526734276, + "learning_rate": 8.399222665677105e-05, + "loss": 0.6109, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6066784858703613, + "step": 3865, + "valid_targets_mean": 16274.1, + "valid_targets_min": 731 + }, + { + "epoch": 1.032826261008807, + "grad_norm": 0.5133907696664676, + "learning_rate": 8.381877434666784e-05, + "loss": 0.5897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6070998907089233, + "step": 3870, + "valid_targets_mean": 14476.0, + "valid_targets_min": 631 + }, + { + "epoch": 1.0341606618628236, + "grad_norm": 0.37803881156149816, + "learning_rate": 8.364527419419696e-05, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5785161256790161, + "step": 3875, + "valid_targets_mean": 15344.3, + "valid_targets_min": 521 + }, + { + "epoch": 1.0354950627168402, + "grad_norm": 0.38545354922670294, + "learning_rate": 8.347172714060686e-05, + "loss": 0.6003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.62616366147995, + "step": 3880, + "valid_targets_mean": 15722.0, + "valid_targets_min": 436 + }, + { + "epoch": 1.0368294635708566, + "grad_norm": 0.27601606744784446, + "learning_rate": 8.32981341274005e-05, + "loss": 0.587, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5717325210571289, + "step": 3885, + "valid_targets_mean": 15027.5, + "valid_targets_min": 24 + }, + { + "epoch": 1.0381638644248732, + "grad_norm": 0.283209337819396, + "learning_rate": 8.312449609633014e-05, + "loss": 0.598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6005629301071167, + "step": 3890, + "valid_targets_mean": 16904.1, + "valid_targets_min": 633 + }, + { + "epoch": 1.0394982652788898, + "grad_norm": 0.2589442465778229, + "learning_rate": 8.295081398939227e-05, + "loss": 0.591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.622482180595398, + "step": 3895, + "valid_targets_mean": 15561.6, + "valid_targets_min": 558 + }, + { + "epoch": 1.0408326661329064, + "grad_norm": 0.2538028332575704, + "learning_rate": 8.277708874882252e-05, + "loss": 0.5922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5734326243400574, + "step": 3900, + "valid_targets_mean": 16120.2, + "valid_targets_min": 791 + }, + { + "epoch": 1.042167066986923, + "grad_norm": 0.2951707638591912, + "learning_rate": 8.26033213170905e-05, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5737336874008179, + "step": 3905, + "valid_targets_mean": 16694.7, + "valid_targets_min": 798 + }, + { + "epoch": 1.0435014678409393, + "grad_norm": 0.23428151714943055, + "learning_rate": 8.242951263689468e-05, + "loss": 0.6112, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6021207571029663, + "step": 3910, + "valid_targets_mean": 16208.7, + "valid_targets_min": 539 + }, + { + "epoch": 1.044835868694956, + "grad_norm": 0.3700479615812931, + "learning_rate": 8.225566365115738e-05, + "loss": 0.5971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.592542290687561, + "step": 3915, + "valid_targets_mean": 16273.6, + "valid_targets_min": 548 + }, + { + "epoch": 1.0461702695489725, + "grad_norm": 0.2645971281118714, + "learning_rate": 8.20817753030195e-05, + "loss": 0.5968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5795402526855469, + "step": 3920, + "valid_targets_mean": 16697.3, + "valid_targets_min": 403 + }, + { + "epoch": 1.0475046704029891, + "grad_norm": 0.3425426380482205, + "learning_rate": 8.190784853583554e-05, + "loss": 0.6191, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623998761177063, + "step": 3925, + "valid_targets_mean": 15397.3, + "valid_targets_min": 91 + }, + { + "epoch": 1.0488390712570057, + "grad_norm": 0.24545813741267344, + "learning_rate": 8.17338842931684e-05, + "loss": 0.6043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5687215328216553, + "step": 3930, + "valid_targets_mean": 17506.0, + "valid_targets_min": 546 + }, + { + "epoch": 1.050173472111022, + "grad_norm": 0.33126881411854414, + "learning_rate": 8.155988351878433e-05, + "loss": 0.5914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5726214647293091, + "step": 3935, + "valid_targets_mean": 15834.2, + "valid_targets_min": 876 + }, + { + "epoch": 1.0515078729650387, + "grad_norm": 0.5763101772706276, + "learning_rate": 8.138584715664766e-05, + "loss": 0.621, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5805267095565796, + "step": 3940, + "valid_targets_mean": 15561.8, + "valid_targets_min": 865 + }, + { + "epoch": 1.0528422738190553, + "grad_norm": 0.494034853848136, + "learning_rate": 8.121177615091591e-05, + "loss": 0.6087, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5953424572944641, + "step": 3945, + "valid_targets_mean": 15862.3, + "valid_targets_min": 40 + }, + { + "epoch": 1.0541766746730719, + "grad_norm": 0.5229883887191916, + "learning_rate": 8.103767144593445e-05, + "loss": 0.5978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5901090502738953, + "step": 3950, + "valid_targets_mean": 16749.9, + "valid_targets_min": 462 + }, + { + "epoch": 1.0555110755270882, + "grad_norm": 0.4728196990146652, + "learning_rate": 8.086353398623154e-05, + "loss": 0.5914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5970526337623596, + "step": 3955, + "valid_targets_mean": 16564.7, + "valid_targets_min": 624 + }, + { + "epoch": 1.0568454763811048, + "grad_norm": 0.5396700684131644, + "learning_rate": 8.068936471651308e-05, + "loss": 0.6052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5742120146751404, + "step": 3960, + "valid_targets_mean": 15665.1, + "valid_targets_min": 419 + }, + { + "epoch": 1.0581798772351214, + "grad_norm": 0.39065735194712553, + "learning_rate": 8.051516458165759e-05, + "loss": 0.594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6119595170021057, + "step": 3965, + "valid_targets_mean": 15060.5, + "valid_targets_min": 477 + }, + { + "epoch": 1.059514278089138, + "grad_norm": 0.4593056562963595, + "learning_rate": 8.0340934526711e-05, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6290844678878784, + "step": 3970, + "valid_targets_mean": 15527.7, + "valid_targets_min": 591 + }, + { + "epoch": 1.0608486789431546, + "grad_norm": 0.40920946492053945, + "learning_rate": 8.016667549688157e-05, + "loss": 0.5954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5855837464332581, + "step": 3975, + "valid_targets_mean": 16526.8, + "valid_targets_min": 493 + }, + { + "epoch": 1.062183079797171, + "grad_norm": 0.46026687220809426, + "learning_rate": 7.999238843753474e-05, + "loss": 0.5988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.588485598564148, + "step": 3980, + "valid_targets_mean": 15916.0, + "valid_targets_min": 814 + }, + { + "epoch": 1.0635174806511876, + "grad_norm": 0.41338177927826364, + "learning_rate": 7.981807429418803e-05, + "loss": 0.6255, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234038472175598, + "step": 3985, + "valid_targets_mean": 15702.3, + "valid_targets_min": 625 + }, + { + "epoch": 1.0648518815052042, + "grad_norm": 0.44812067294712354, + "learning_rate": 7.96437340125059e-05, + "loss": 0.5849, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5726232528686523, + "step": 3990, + "valid_targets_mean": 17405.6, + "valid_targets_min": 669 + }, + { + "epoch": 1.0661862823592207, + "grad_norm": 0.37211637583987855, + "learning_rate": 7.946936853829458e-05, + "loss": 0.6035, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6075381636619568, + "step": 3995, + "valid_targets_mean": 16482.9, + "valid_targets_min": 434 + }, + { + "epoch": 1.0675206832132373, + "grad_norm": 0.42373416536725417, + "learning_rate": 7.929497881749699e-05, + "loss": 0.5986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.594200611114502, + "step": 4000, + "valid_targets_mean": 17066.9, + "valid_targets_min": 779 + }, + { + "epoch": 1.0688550840672537, + "grad_norm": 0.3914037196829223, + "learning_rate": 7.912056579618759e-05, + "loss": 0.6101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5865424871444702, + "step": 4005, + "valid_targets_mean": 16414.9, + "valid_targets_min": 841 + }, + { + "epoch": 1.0701894849212703, + "grad_norm": 0.36788284503140656, + "learning_rate": 7.894613042056721e-05, + "loss": 0.5826, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6006873250007629, + "step": 4010, + "valid_targets_mean": 15932.2, + "valid_targets_min": 587 + }, + { + "epoch": 1.071523885775287, + "grad_norm": 0.2916092674005148, + "learning_rate": 7.877167363695805e-05, + "loss": 0.6027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6191377639770508, + "step": 4015, + "valid_targets_mean": 15171.0, + "valid_targets_min": 333 + }, + { + "epoch": 1.0728582866293035, + "grad_norm": 0.3703056092797146, + "learning_rate": 7.859719639179834e-05, + "loss": 0.5863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5682851672172546, + "step": 4020, + "valid_targets_mean": 16206.3, + "valid_targets_min": 368 + }, + { + "epoch": 1.07419268748332, + "grad_norm": 0.2758510848401202, + "learning_rate": 7.842269963163735e-05, + "loss": 0.6048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5797070264816284, + "step": 4025, + "valid_targets_mean": 17413.4, + "valid_targets_min": 704 + }, + { + "epoch": 1.0755270883373365, + "grad_norm": 0.3275128650166002, + "learning_rate": 7.824818430313028e-05, + "loss": 0.5987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5855237245559692, + "step": 4030, + "valid_targets_mean": 16071.4, + "valid_targets_min": 61 + }, + { + "epoch": 1.076861489191353, + "grad_norm": 0.3412770087192014, + "learning_rate": 7.807365135303299e-05, + "loss": 0.6152, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6232606172561646, + "step": 4035, + "valid_targets_mean": 15833.4, + "valid_targets_min": 608 + }, + { + "epoch": 1.0781958900453696, + "grad_norm": 0.33999788333188585, + "learning_rate": 7.789910172819693e-05, + "loss": 0.5986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5924199819564819, + "step": 4040, + "valid_targets_mean": 16710.9, + "valid_targets_min": 543 + }, + { + "epoch": 1.0795302908993862, + "grad_norm": 0.36260912648773397, + "learning_rate": 7.772453637556411e-05, + "loss": 0.6208, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6322931051254272, + "step": 4045, + "valid_targets_mean": 16038.3, + "valid_targets_min": 253 + }, + { + "epoch": 1.0808646917534026, + "grad_norm": 0.35220327417259206, + "learning_rate": 7.754995624216176e-05, + "loss": 0.6002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5823273658752441, + "step": 4050, + "valid_targets_mean": 16727.7, + "valid_targets_min": 578 + }, + { + "epoch": 1.0821990926074192, + "grad_norm": 0.4864103700141048, + "learning_rate": 7.737536227509734e-05, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5839403867721558, + "step": 4055, + "valid_targets_mean": 15676.5, + "valid_targets_min": 396 + }, + { + "epoch": 1.0835334934614358, + "grad_norm": 0.3790317408511732, + "learning_rate": 7.720075542155336e-05, + "loss": 0.6277, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6375101804733276, + "step": 4060, + "valid_targets_mean": 15747.6, + "valid_targets_min": 790 + }, + { + "epoch": 1.0848678943154524, + "grad_norm": 0.34787300200592175, + "learning_rate": 7.702613662878223e-05, + "loss": 0.6163, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6184200048446655, + "step": 4065, + "valid_targets_mean": 15998.6, + "valid_targets_min": 613 + }, + { + "epoch": 1.086202295169469, + "grad_norm": 0.27071999547248415, + "learning_rate": 7.685150684410114e-05, + "loss": 0.5985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5919818878173828, + "step": 4070, + "valid_targets_mean": 15357.0, + "valid_targets_min": 686 + }, + { + "epoch": 1.0875366960234856, + "grad_norm": 0.32451365522562825, + "learning_rate": 7.667686701488688e-05, + "loss": 0.6014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5560876131057739, + "step": 4075, + "valid_targets_mean": 17877.9, + "valid_targets_min": 375 + }, + { + "epoch": 1.088871096877502, + "grad_norm": 0.3881096398697237, + "learning_rate": 7.650221808857081e-05, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.596640408039093, + "step": 4080, + "valid_targets_mean": 16333.7, + "valid_targets_min": 552 + }, + { + "epoch": 1.0902054977315185, + "grad_norm": 0.28008609577192756, + "learning_rate": 7.632756101263358e-05, + "loss": 0.5888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5497901439666748, + "step": 4085, + "valid_targets_mean": 17502.5, + "valid_targets_min": 415 + }, + { + "epoch": 1.0915398985855351, + "grad_norm": 0.40852074144248085, + "learning_rate": 7.615289673460003e-05, + "loss": 0.6023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6026955842971802, + "step": 4090, + "valid_targets_mean": 14722.9, + "valid_targets_min": 499 + }, + { + "epoch": 1.0928742994395517, + "grad_norm": 0.3377885391386289, + "learning_rate": 7.59782262020341e-05, + "loss": 0.5906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6042886972427368, + "step": 4095, + "valid_targets_mean": 16119.0, + "valid_targets_min": 312 + }, + { + "epoch": 1.094208700293568, + "grad_norm": 0.3636416145030373, + "learning_rate": 7.580355036253372e-05, + "loss": 0.6024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5962235331535339, + "step": 4100, + "valid_targets_mean": 14884.0, + "valid_targets_min": 705 + }, + { + "epoch": 1.0955431011475847, + "grad_norm": 0.2796195315960068, + "learning_rate": 7.562887016372551e-05, + "loss": 0.6077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6036214828491211, + "step": 4105, + "valid_targets_mean": 15731.4, + "valid_targets_min": 565 + }, + { + "epoch": 1.0968775020016013, + "grad_norm": 0.3801739652085176, + "learning_rate": 7.54541865532598e-05, + "loss": 0.602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5916723012924194, + "step": 4110, + "valid_targets_mean": 16717.8, + "valid_targets_min": 686 + }, + { + "epoch": 1.0982119028556179, + "grad_norm": 0.29474613873650163, + "learning_rate": 7.527950047880543e-05, + "loss": 0.6016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6182796359062195, + "step": 4115, + "valid_targets_mean": 15451.0, + "valid_targets_min": 481 + }, + { + "epoch": 1.0995463037096345, + "grad_norm": 0.2653542372013782, + "learning_rate": 7.51048128880446e-05, + "loss": 0.6074, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6237516403198242, + "step": 4120, + "valid_targets_mean": 14658.4, + "valid_targets_min": 624 + }, + { + "epoch": 1.1008807045636508, + "grad_norm": 0.2580311694584571, + "learning_rate": 7.493012472866769e-05, + "loss": 0.6027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5956270098686218, + "step": 4125, + "valid_targets_mean": 16665.0, + "valid_targets_min": 631 + }, + { + "epoch": 1.1022151054176674, + "grad_norm": 0.33966126879080366, + "learning_rate": 7.47554369483682e-05, + "loss": 0.6022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6200779676437378, + "step": 4130, + "valid_targets_mean": 15626.4, + "valid_targets_min": 685 + }, + { + "epoch": 1.103549506271684, + "grad_norm": 0.3325337972812342, + "learning_rate": 7.458075049483762e-05, + "loss": 0.5945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5936934947967529, + "step": 4135, + "valid_targets_mean": 16802.8, + "valid_targets_min": 462 + }, + { + "epoch": 1.1048839071257006, + "grad_norm": 0.2800792855939298, + "learning_rate": 7.44060663157602e-05, + "loss": 0.6033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6194767951965332, + "step": 4140, + "valid_targets_mean": 16379.5, + "valid_targets_min": 769 + }, + { + "epoch": 1.1062183079797172, + "grad_norm": 0.29176434819055114, + "learning_rate": 7.423138535880779e-05, + "loss": 0.6026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5879778861999512, + "step": 4145, + "valid_targets_mean": 16280.6, + "valid_targets_min": 399 + }, + { + "epoch": 1.1075527088337336, + "grad_norm": 0.2835063383721158, + "learning_rate": 7.405670857163489e-05, + "loss": 0.6106, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6160388588905334, + "step": 4150, + "valid_targets_mean": 16408.5, + "valid_targets_min": 621 + }, + { + "epoch": 1.1088871096877502, + "grad_norm": 0.31251798770839306, + "learning_rate": 7.388203690187325e-05, + "loss": 0.6031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6266306638717651, + "step": 4155, + "valid_targets_mean": 14556.0, + "valid_targets_min": 758 + }, + { + "epoch": 1.1102215105417668, + "grad_norm": 0.3064354700564066, + "learning_rate": 7.370737129712695e-05, + "loss": 0.5892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5773193836212158, + "step": 4160, + "valid_targets_mean": 16209.6, + "valid_targets_min": 670 + }, + { + "epoch": 1.1115559113957834, + "grad_norm": 0.26141133680604506, + "learning_rate": 7.353271270496713e-05, + "loss": 0.6097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6453293561935425, + "step": 4165, + "valid_targets_mean": 15267.4, + "valid_targets_min": 713 + }, + { + "epoch": 1.1128903122498, + "grad_norm": 0.26244489234882723, + "learning_rate": 7.335806207292687e-05, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5935405492782593, + "step": 4170, + "valid_targets_mean": 16030.8, + "valid_targets_min": 835 + }, + { + "epoch": 1.1142247131038163, + "grad_norm": 0.3910474355938962, + "learning_rate": 7.31834203484961e-05, + "loss": 0.6063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6182336211204529, + "step": 4175, + "valid_targets_mean": 14981.8, + "valid_targets_min": 739 + }, + { + "epoch": 1.115559113957833, + "grad_norm": 0.3150996733557663, + "learning_rate": 7.300878847911642e-05, + "loss": 0.6083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6151427626609802, + "step": 4180, + "valid_targets_mean": 15251.6, + "valid_targets_min": 282 + }, + { + "epoch": 1.1168935148118495, + "grad_norm": 0.24806222257823488, + "learning_rate": 7.283416741217595e-05, + "loss": 0.5863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5705355405807495, + "step": 4185, + "valid_targets_mean": 17316.5, + "valid_targets_min": 748 + }, + { + "epoch": 1.118227915665866, + "grad_norm": 0.3124041203185742, + "learning_rate": 7.26595580950042e-05, + "loss": 0.6158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6485847234725952, + "step": 4190, + "valid_targets_mean": 15875.1, + "valid_targets_min": 863 + }, + { + "epoch": 1.1195623165198825, + "grad_norm": 0.37971496808314315, + "learning_rate": 7.248496147486695e-05, + "loss": 0.5857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5784488916397095, + "step": 4195, + "valid_targets_mean": 17062.4, + "valid_targets_min": 440 + }, + { + "epoch": 1.120896717373899, + "grad_norm": 0.7932004381188809, + "learning_rate": 7.23103784989611e-05, + "loss": 0.6139, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6217626929283142, + "step": 4200, + "valid_targets_mean": 15889.3, + "valid_targets_min": 733 + }, + { + "epoch": 1.1222311182279157, + "grad_norm": 0.4868104239933692, + "learning_rate": 7.213581011440954e-05, + "loss": 0.633, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6174220442771912, + "step": 4205, + "valid_targets_mean": 16341.5, + "valid_targets_min": 203 + }, + { + "epoch": 1.1235655190819323, + "grad_norm": 0.5902127688698259, + "learning_rate": 7.1961257268256e-05, + "loss": 0.6032, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6067975759506226, + "step": 4210, + "valid_targets_mean": 14791.9, + "valid_targets_min": 392 + }, + { + "epoch": 1.1248999199359488, + "grad_norm": 0.3536516478373195, + "learning_rate": 7.178672090745986e-05, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5986104011535645, + "step": 4215, + "valid_targets_mean": 16207.2, + "valid_targets_min": 606 + }, + { + "epoch": 1.1262343207899652, + "grad_norm": 0.30077100249154387, + "learning_rate": 7.161220197889114e-05, + "loss": 0.6054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6378801465034485, + "step": 4220, + "valid_targets_mean": 16880.7, + "valid_targets_min": 686 + }, + { + "epoch": 1.1275687216439818, + "grad_norm": 0.27729680429800824, + "learning_rate": 7.143770142932524e-05, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5797771215438843, + "step": 4225, + "valid_targets_mean": 17065.5, + "valid_targets_min": 723 + }, + { + "epoch": 1.1289031224979984, + "grad_norm": 0.27223236223082237, + "learning_rate": 7.126322020543785e-05, + "loss": 0.5982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5857571363449097, + "step": 4230, + "valid_targets_mean": 15327.6, + "valid_targets_min": 599 + }, + { + "epoch": 1.130237523352015, + "grad_norm": 0.2591278577330893, + "learning_rate": 7.108875925379991e-05, + "loss": 0.5973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5912514925003052, + "step": 4235, + "valid_targets_mean": 14846.1, + "valid_targets_min": 578 + }, + { + "epoch": 1.1315719242060316, + "grad_norm": 0.31767585730342623, + "learning_rate": 7.091431952087221e-05, + "loss": 0.6178, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6124032735824585, + "step": 4240, + "valid_targets_mean": 15918.7, + "valid_targets_min": 608 + }, + { + "epoch": 1.132906325060048, + "grad_norm": 0.24375473388947871, + "learning_rate": 7.073990195300058e-05, + "loss": 0.5956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5829209089279175, + "step": 4245, + "valid_targets_mean": 15267.2, + "valid_targets_min": 316 + }, + { + "epoch": 1.1342407259140646, + "grad_norm": 0.2127941498929142, + "learning_rate": 7.056550749641056e-05, + "loss": 0.6004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6242984533309937, + "step": 4250, + "valid_targets_mean": 15888.2, + "valid_targets_min": 725 + }, + { + "epoch": 1.1355751267680811, + "grad_norm": 0.3167067915599793, + "learning_rate": 7.039113709720227e-05, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5977542400360107, + "step": 4255, + "valid_targets_mean": 15727.3, + "valid_targets_min": 1003 + }, + { + "epoch": 1.1369095276220977, + "grad_norm": 0.27993316101713944, + "learning_rate": 7.021679170134533e-05, + "loss": 0.5925, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.587902843952179, + "step": 4260, + "valid_targets_mean": 16104.0, + "valid_targets_min": 364 + }, + { + "epoch": 1.1382439284761143, + "grad_norm": 0.31043922998417844, + "learning_rate": 7.004247225467381e-05, + "loss": 0.5966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5865461230278015, + "step": 4265, + "valid_targets_mean": 16515.5, + "valid_targets_min": 617 + }, + { + "epoch": 1.1395783293301307, + "grad_norm": 0.2689763541971217, + "learning_rate": 6.986817970288082e-05, + "loss": 0.6006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5762760639190674, + "step": 4270, + "valid_targets_mean": 16571.0, + "valid_targets_min": 837 + }, + { + "epoch": 1.1409127301841473, + "grad_norm": 0.22897307468939943, + "learning_rate": 6.969391499151371e-05, + "loss": 0.5863, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5768278241157532, + "step": 4275, + "valid_targets_mean": 15187.9, + "valid_targets_min": 395 + }, + { + "epoch": 1.1422471310381639, + "grad_norm": 0.2574952643742215, + "learning_rate": 6.95196790659688e-05, + "loss": 0.5983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6268581748008728, + "step": 4280, + "valid_targets_mean": 15087.0, + "valid_targets_min": 715 + }, + { + "epoch": 1.1435815318921805, + "grad_norm": 0.31001744346505816, + "learning_rate": 6.934547287148614e-05, + "loss": 0.6097, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6045074462890625, + "step": 4285, + "valid_targets_mean": 15647.8, + "valid_targets_min": 518 + }, + { + "epoch": 1.1449159327461969, + "grad_norm": 0.27988511418077017, + "learning_rate": 6.917129735314455e-05, + "loss": 0.6038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6157107949256897, + "step": 4290, + "valid_targets_mean": 15646.0, + "valid_targets_min": 486 + }, + { + "epoch": 1.1462503336002134, + "grad_norm": 0.284623906189759, + "learning_rate": 6.899715345585649e-05, + "loss": 0.5861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6071814298629761, + "step": 4295, + "valid_targets_mean": 16459.4, + "valid_targets_min": 307 + }, + { + "epoch": 1.14758473445423, + "grad_norm": 0.23613016291869346, + "learning_rate": 6.882304212436272e-05, + "loss": 0.6057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5901815891265869, + "step": 4300, + "valid_targets_mean": 16384.8, + "valid_targets_min": 661 + }, + { + "epoch": 1.1489191353082466, + "grad_norm": 0.7099036688341175, + "learning_rate": 6.864896430322745e-05, + "loss": 0.6244, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6605739593505859, + "step": 4305, + "valid_targets_mean": 15084.9, + "valid_targets_min": 755 + }, + { + "epoch": 1.1502535361622632, + "grad_norm": 0.2660867664547303, + "learning_rate": 6.84749209368331e-05, + "loss": 0.5833, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5416364669799805, + "step": 4310, + "valid_targets_mean": 17516.2, + "valid_targets_min": 413 + }, + { + "epoch": 1.1515879370162796, + "grad_norm": 0.24899135484110319, + "learning_rate": 6.830091296937509e-05, + "loss": 0.5968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5933257341384888, + "step": 4315, + "valid_targets_mean": 15933.6, + "valid_targets_min": 560 + }, + { + "epoch": 1.1529223378702962, + "grad_norm": 0.28429870191220086, + "learning_rate": 6.812694134485686e-05, + "loss": 0.6016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5702193379402161, + "step": 4320, + "valid_targets_mean": 16298.5, + "valid_targets_min": 391 + }, + { + "epoch": 1.1542567387243128, + "grad_norm": 0.3432717505307207, + "learning_rate": 6.795300700708466e-05, + "loss": 0.6048, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5982928276062012, + "step": 4325, + "valid_targets_mean": 16746.6, + "valid_targets_min": 780 + }, + { + "epoch": 1.1555911395783294, + "grad_norm": 0.30284190514883463, + "learning_rate": 6.777911089966245e-05, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6121088266372681, + "step": 4330, + "valid_targets_mean": 15415.2, + "valid_targets_min": 63 + }, + { + "epoch": 1.156925540432346, + "grad_norm": 0.30760369252329195, + "learning_rate": 6.760525396598686e-05, + "loss": 0.6142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6483354568481445, + "step": 4335, + "valid_targets_mean": 15703.1, + "valid_targets_min": 476 + }, + { + "epoch": 1.1582599412863623, + "grad_norm": 0.35568703892758397, + "learning_rate": 6.74314371492419e-05, + "loss": 0.5889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6182370185852051, + "step": 4340, + "valid_targets_mean": 15757.3, + "valid_targets_min": 501 + }, + { + "epoch": 1.159594342140379, + "grad_norm": 0.2984066417689251, + "learning_rate": 6.725766139239399e-05, + "loss": 0.6017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5672701597213745, + "step": 4345, + "valid_targets_mean": 15679.0, + "valid_targets_min": 305 + }, + { + "epoch": 1.1609287429943955, + "grad_norm": 0.35563150663132786, + "learning_rate": 6.708392763818681e-05, + "loss": 0.5988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5748165249824524, + "step": 4350, + "valid_targets_mean": 15702.1, + "valid_targets_min": 190 + }, + { + "epoch": 1.1622631438484121, + "grad_norm": 0.4725264739524481, + "learning_rate": 6.691023682913616e-05, + "loss": 0.6136, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6290553212165833, + "step": 4355, + "valid_targets_mean": 17302.8, + "valid_targets_min": 366 + }, + { + "epoch": 1.1635975447024287, + "grad_norm": 0.41649020656338065, + "learning_rate": 6.673658990752484e-05, + "loss": 0.5954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5825016498565674, + "step": 4360, + "valid_targets_mean": 16416.6, + "valid_targets_min": 252 + }, + { + "epoch": 1.164931945556445, + "grad_norm": 0.4726742196256588, + "learning_rate": 6.656298781539764e-05, + "loss": 0.5896, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5909591913223267, + "step": 4365, + "valid_targets_mean": 16828.3, + "valid_targets_min": 133 + }, + { + "epoch": 1.1662663464104617, + "grad_norm": 0.3577791658502569, + "learning_rate": 6.638943149455598e-05, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5973008275032043, + "step": 4370, + "valid_targets_mean": 15010.5, + "valid_targets_min": 464 + }, + { + "epoch": 1.1676007472644783, + "grad_norm": 0.45347121217280895, + "learning_rate": 6.621592188655314e-05, + "loss": 0.5965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5748577117919922, + "step": 4375, + "valid_targets_mean": 15569.6, + "valid_targets_min": 607 + }, + { + "epoch": 1.1689351481184949, + "grad_norm": 0.3649598802805446, + "learning_rate": 6.604245993268893e-05, + "loss": 0.5927, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5843199491500854, + "step": 4380, + "valid_targets_mean": 16538.5, + "valid_targets_min": 735 + }, + { + "epoch": 1.1702695489725112, + "grad_norm": 0.397739643309116, + "learning_rate": 6.586904657400457e-05, + "loss": 0.5992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5765359401702881, + "step": 4385, + "valid_targets_mean": 15469.5, + "valid_targets_min": 335 + }, + { + "epoch": 1.1716039498265278, + "grad_norm": 0.37300616388581065, + "learning_rate": 6.569568275127769e-05, + "loss": 0.5812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5807654857635498, + "step": 4390, + "valid_targets_mean": 16243.7, + "valid_targets_min": 879 + }, + { + "epoch": 1.1729383506805444, + "grad_norm": 0.3840703505859544, + "learning_rate": 6.552236940501725e-05, + "loss": 0.5828, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5711965560913086, + "step": 4395, + "valid_targets_mean": 14674.8, + "valid_targets_min": 456 + }, + { + "epoch": 1.174272751534561, + "grad_norm": 0.37863289411399653, + "learning_rate": 6.534910747545825e-05, + "loss": 0.5854, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5958431363105774, + "step": 4400, + "valid_targets_mean": 15368.2, + "valid_targets_min": 532 + }, + { + "epoch": 1.1756071523885776, + "grad_norm": 0.4477581792181912, + "learning_rate": 6.517589790255686e-05, + "loss": 0.6129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6343816518783569, + "step": 4405, + "valid_targets_mean": 14593.0, + "valid_targets_min": 375 + }, + { + "epoch": 1.1769415532425942, + "grad_norm": 0.3270473622838311, + "learning_rate": 6.500274162598512e-05, + "loss": 0.606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6062087416648865, + "step": 4410, + "valid_targets_mean": 15336.0, + "valid_targets_min": 486 + }, + { + "epoch": 1.1782759540966106, + "grad_norm": 0.4103892887347845, + "learning_rate": 6.482963958512599e-05, + "loss": 0.598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6063992977142334, + "step": 4415, + "valid_targets_mean": 15912.9, + "valid_targets_min": 730 + }, + { + "epoch": 1.1796103549506272, + "grad_norm": 0.3631692668594323, + "learning_rate": 6.465659271906823e-05, + "loss": 0.593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5838413238525391, + "step": 4420, + "valid_targets_mean": 16326.5, + "valid_targets_min": 407 + }, + { + "epoch": 1.1809447558046438, + "grad_norm": 0.3752812321904994, + "learning_rate": 6.448360196660116e-05, + "loss": 0.6013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5776430368423462, + "step": 4425, + "valid_targets_mean": 16754.6, + "valid_targets_min": 618 + }, + { + "epoch": 1.1822791566586603, + "grad_norm": 0.3642942093840262, + "learning_rate": 6.43106682662098e-05, + "loss": 0.5937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5928678512573242, + "step": 4430, + "valid_targets_mean": 15495.9, + "valid_targets_min": 383 + }, + { + "epoch": 1.1836135575126767, + "grad_norm": 0.3520645453564209, + "learning_rate": 6.413779255606961e-05, + "loss": 0.5813, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5934560894966125, + "step": 4435, + "valid_targets_mean": 15091.7, + "valid_targets_min": 171 + }, + { + "epoch": 1.1849479583666933, + "grad_norm": 0.21548984155232773, + "learning_rate": 6.396497577404143e-05, + "loss": 0.6091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.612282395362854, + "step": 4440, + "valid_targets_mean": 16170.2, + "valid_targets_min": 588 + }, + { + "epoch": 1.18628235922071, + "grad_norm": 0.21533211012293957, + "learning_rate": 6.379221885766643e-05, + "loss": 0.5939, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5665504932403564, + "step": 4445, + "valid_targets_mean": 16189.7, + "valid_targets_min": 318 + }, + { + "epoch": 1.1876167600747265, + "grad_norm": 0.43172732636361405, + "learning_rate": 6.361952274416106e-05, + "loss": 0.5896, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5815595984458923, + "step": 4450, + "valid_targets_mean": 17214.6, + "valid_targets_min": 615 + }, + { + "epoch": 1.188951160928743, + "grad_norm": 0.3749421262001143, + "learning_rate": 6.344688837041177e-05, + "loss": 0.5932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5799713134765625, + "step": 4455, + "valid_targets_mean": 18348.3, + "valid_targets_min": 332 + }, + { + "epoch": 1.1902855617827595, + "grad_norm": 0.3493641365006668, + "learning_rate": 6.32743166729702e-05, + "loss": 0.6017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5951375365257263, + "step": 4460, + "valid_targets_mean": 16188.1, + "valid_targets_min": 301 + }, + { + "epoch": 1.191619962636776, + "grad_norm": 0.3065563699541395, + "learning_rate": 6.310180858804794e-05, + "loss": 0.6135, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.61883544921875, + "step": 4465, + "valid_targets_mean": 15588.0, + "valid_targets_min": 425 + }, + { + "epoch": 1.1929543634907926, + "grad_norm": 0.36380231112006145, + "learning_rate": 6.292936505151145e-05, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6210154294967651, + "step": 4470, + "valid_targets_mean": 14523.7, + "valid_targets_min": 539 + }, + { + "epoch": 1.1942887643448092, + "grad_norm": 0.3314227814860259, + "learning_rate": 6.275698699887699e-05, + "loss": 0.5821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6138677000999451, + "step": 4475, + "valid_targets_mean": 16254.9, + "valid_targets_min": 57 + }, + { + "epoch": 1.1956231651988256, + "grad_norm": 0.3529872358081249, + "learning_rate": 6.258467536530565e-05, + "loss": 0.5997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5828440189361572, + "step": 4480, + "valid_targets_mean": 15555.3, + "valid_targets_min": 303 + }, + { + "epoch": 1.1969575660528422, + "grad_norm": 0.27354690781074714, + "learning_rate": 6.241243108559811e-05, + "loss": 0.6013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5828770399093628, + "step": 4485, + "valid_targets_mean": 16204.0, + "valid_targets_min": 495 + }, + { + "epoch": 1.1982919669068588, + "grad_norm": 0.24452469247733344, + "learning_rate": 6.224025509418971e-05, + "loss": 0.6148, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6097055673599243, + "step": 4490, + "valid_targets_mean": 14923.2, + "valid_targets_min": 726 + }, + { + "epoch": 1.1996263677608754, + "grad_norm": 0.25794393835991686, + "learning_rate": 6.206814832514525e-05, + "loss": 0.5996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6198200583457947, + "step": 4495, + "valid_targets_mean": 15636.4, + "valid_targets_min": 266 + }, + { + "epoch": 1.200960768614892, + "grad_norm": 0.3697274323238262, + "learning_rate": 6.189611171215405e-05, + "loss": 0.5956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6122844219207764, + "step": 4500, + "valid_targets_mean": 16200.8, + "valid_targets_min": 368 + }, + { + "epoch": 1.2022951694689086, + "grad_norm": 0.2851304729295163, + "learning_rate": 6.172414618852488e-05, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6054625511169434, + "step": 4505, + "valid_targets_mean": 17160.3, + "valid_targets_min": 814 + }, + { + "epoch": 1.203629570322925, + "grad_norm": 0.2603392404494807, + "learning_rate": 6.155225268718069e-05, + "loss": 0.5858, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6194175481796265, + "step": 4510, + "valid_targets_mean": 15548.8, + "valid_targets_min": 448 + }, + { + "epoch": 1.2049639711769415, + "grad_norm": 0.23632978796159737, + "learning_rate": 6.138043214065385e-05, + "loss": 0.5931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5853152871131897, + "step": 4515, + "valid_targets_mean": 16253.5, + "valid_targets_min": 526 + }, + { + "epoch": 1.2062983720309581, + "grad_norm": 0.4844945781749991, + "learning_rate": 6.120868548108093e-05, + "loss": 0.5874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6011490821838379, + "step": 4520, + "valid_targets_mean": 15423.4, + "valid_targets_min": 443 + }, + { + "epoch": 1.2076327728849747, + "grad_norm": 0.2819030369362368, + "learning_rate": 6.103701364019754e-05, + "loss": 0.5992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5920343995094299, + "step": 4525, + "valid_targets_mean": 16631.1, + "valid_targets_min": 647 + }, + { + "epoch": 1.208967173738991, + "grad_norm": 0.2918306704913203, + "learning_rate": 6.0865417549333536e-05, + "loss": 0.6078, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6191456317901611, + "step": 4530, + "valid_targets_mean": 15389.3, + "valid_targets_min": 542 + }, + { + "epoch": 1.2103015745930077, + "grad_norm": 0.26350998098499123, + "learning_rate": 6.0693898139407786e-05, + "loss": 0.6084, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6131468415260315, + "step": 4535, + "valid_targets_mean": 15042.1, + "valid_targets_min": 729 + }, + { + "epoch": 1.2116359754470243, + "grad_norm": 0.34680713886085474, + "learning_rate": 6.0522456340923085e-05, + "loss": 0.593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6055951118469238, + "step": 4540, + "valid_targets_mean": 15969.4, + "valid_targets_min": 154 + }, + { + "epoch": 1.2129703763010409, + "grad_norm": 0.2991580039441314, + "learning_rate": 6.0351093083961267e-05, + "loss": 0.5874, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.596157431602478, + "step": 4545, + "valid_targets_mean": 15783.5, + "valid_targets_min": 30 + }, + { + "epoch": 1.2143047771550575, + "grad_norm": 0.31461751378381264, + "learning_rate": 6.017980929817807e-05, + "loss": 0.596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6240620017051697, + "step": 4550, + "valid_targets_mean": 16475.7, + "valid_targets_min": 520 + }, + { + "epoch": 1.2156391780090738, + "grad_norm": 0.2880609654236511, + "learning_rate": 6.000860591279801e-05, + "loss": 0.5988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6084235906600952, + "step": 4555, + "valid_targets_mean": 14790.1, + "valid_targets_min": 761 + }, + { + "epoch": 1.2169735788630904, + "grad_norm": 0.4516901675082028, + "learning_rate": 5.9837483856609527e-05, + "loss": 0.6011, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5949472188949585, + "step": 4560, + "valid_targets_mean": 16267.4, + "valid_targets_min": 553 + }, + { + "epoch": 1.218307979717107, + "grad_norm": 0.3693560610908532, + "learning_rate": 5.966644405795982e-05, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6293297410011292, + "step": 4565, + "valid_targets_mean": 16069.2, + "valid_targets_min": 617 + }, + { + "epoch": 1.2196423805711236, + "grad_norm": 0.3723486353807144, + "learning_rate": 5.949548744474978e-05, + "loss": 0.5878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.569554328918457, + "step": 4570, + "valid_targets_mean": 15508.8, + "valid_targets_min": 697 + }, + { + "epoch": 1.22097678142514, + "grad_norm": 0.3842529043040275, + "learning_rate": 5.9324614944429095e-05, + "loss": 0.6043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5914621949195862, + "step": 4575, + "valid_targets_mean": 15604.2, + "valid_targets_min": 589 + }, + { + "epoch": 1.2223111822791566, + "grad_norm": 0.37655008091615877, + "learning_rate": 5.915382748399105e-05, + "loss": 0.6088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5930585265159607, + "step": 4580, + "valid_targets_mean": 16328.4, + "valid_targets_min": 508 + }, + { + "epoch": 1.2236455831331732, + "grad_norm": 0.37071745643114606, + "learning_rate": 5.8983125989967646e-05, + "loss": 0.6147, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6511808633804321, + "step": 4585, + "valid_targets_mean": 16443.6, + "valid_targets_min": 222 + }, + { + "epoch": 1.2249799839871898, + "grad_norm": 0.39020668353439725, + "learning_rate": 5.881251138842453e-05, + "loss": 0.5941, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.561487078666687, + "step": 4590, + "valid_targets_mean": 16465.2, + "valid_targets_min": 557 + }, + { + "epoch": 1.2263143848412064, + "grad_norm": 0.23579950042688647, + "learning_rate": 5.864198460495585e-05, + "loss": 0.6006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5959711670875549, + "step": 4595, + "valid_targets_mean": 15317.1, + "valid_targets_min": 360 + }, + { + "epoch": 1.227648785695223, + "grad_norm": 0.3149893359674708, + "learning_rate": 5.847154656467944e-05, + "loss": 0.5973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5710833072662354, + "step": 4600, + "valid_targets_mean": 16656.5, + "valid_targets_min": 359 + }, + { + "epoch": 1.2289831865492393, + "grad_norm": 0.296258079297135, + "learning_rate": 5.830119819223166e-05, + "loss": 0.593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5951532125473022, + "step": 4605, + "valid_targets_mean": 16023.0, + "valid_targets_min": 574 + }, + { + "epoch": 1.230317587403256, + "grad_norm": 0.3802746063275357, + "learning_rate": 5.8130940411762406e-05, + "loss": 0.5908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6089481711387634, + "step": 4610, + "valid_targets_mean": 17038.8, + "valid_targets_min": 477 + }, + { + "epoch": 1.2316519882572725, + "grad_norm": 0.3478708443012052, + "learning_rate": 5.79607741469301e-05, + "loss": 0.6099, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5820724964141846, + "step": 4615, + "valid_targets_mean": 16394.3, + "valid_targets_min": 679 + }, + { + "epoch": 1.232986389111289, + "grad_norm": 0.38691919321426016, + "learning_rate": 5.779070032089674e-05, + "loss": 0.6041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6047302484512329, + "step": 4620, + "valid_targets_mean": 15922.8, + "valid_targets_min": 297 + }, + { + "epoch": 1.2343207899653055, + "grad_norm": 0.3068426655265928, + "learning_rate": 5.762071985632276e-05, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5962592959403992, + "step": 4625, + "valid_targets_mean": 16840.9, + "valid_targets_min": 524 + }, + { + "epoch": 1.235655190819322, + "grad_norm": 0.3978013587115205, + "learning_rate": 5.745083367536217e-05, + "loss": 0.5906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5848004817962646, + "step": 4630, + "valid_targets_mean": 15698.9, + "valid_targets_min": 431 + }, + { + "epoch": 1.2369895916733387, + "grad_norm": 0.32933567857837664, + "learning_rate": 5.7281042699657465e-05, + "loss": 0.604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6038892865180969, + "step": 4635, + "valid_targets_mean": 16009.4, + "valid_targets_min": 744 + }, + { + "epoch": 1.2383239925273553, + "grad_norm": 0.38848421103646785, + "learning_rate": 5.71113478503346e-05, + "loss": 0.598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6145868301391602, + "step": 4640, + "valid_targets_mean": 16181.2, + "valid_targets_min": 31 + }, + { + "epoch": 1.2396583933813718, + "grad_norm": 0.30941335141012877, + "learning_rate": 5.694175004799814e-05, + "loss": 0.602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5926676988601685, + "step": 4645, + "valid_targets_mean": 16058.1, + "valid_targets_min": 562 + }, + { + "epoch": 1.2409927942353882, + "grad_norm": 0.3053881051934955, + "learning_rate": 5.6772250212726025e-05, + "loss": 0.5888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5941856503486633, + "step": 4650, + "valid_targets_mean": 14780.3, + "valid_targets_min": 563 + }, + { + "epoch": 1.2423271950894048, + "grad_norm": 0.25752081061216897, + "learning_rate": 5.660284926406484e-05, + "loss": 0.5901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6042780876159668, + "step": 4655, + "valid_targets_mean": 16847.3, + "valid_targets_min": 679 + }, + { + "epoch": 1.2436615959434214, + "grad_norm": 0.3718012087846061, + "learning_rate": 5.64335481210247e-05, + "loss": 0.6052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6086214184761047, + "step": 4660, + "valid_targets_mean": 17391.6, + "valid_targets_min": 509 + }, + { + "epoch": 1.244995996797438, + "grad_norm": 0.30488851628559444, + "learning_rate": 5.626434770207414e-05, + "loss": 0.5926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5924539566040039, + "step": 4665, + "valid_targets_mean": 16268.7, + "valid_targets_min": 322 + }, + { + "epoch": 1.2463303976514546, + "grad_norm": 0.3097058970074245, + "learning_rate": 5.60952489251354e-05, + "loss": 0.5929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5813044309616089, + "step": 4670, + "valid_targets_mean": 17170.6, + "valid_targets_min": 43 + }, + { + "epoch": 1.247664798505471, + "grad_norm": 0.3720595051065334, + "learning_rate": 5.592625270757928e-05, + "loss": 0.6034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6146562099456787, + "step": 4675, + "valid_targets_mean": 14678.0, + "valid_targets_min": 575 + }, + { + "epoch": 1.2489991993594876, + "grad_norm": 0.2834506741884633, + "learning_rate": 5.575735996622011e-05, + "loss": 0.5839, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.568305253982544, + "step": 4680, + "valid_targets_mean": 17661.6, + "valid_targets_min": 301 + }, + { + "epoch": 1.2503336002135041, + "grad_norm": 0.2976879759606349, + "learning_rate": 5.558857161731093e-05, + "loss": 0.5984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6380177736282349, + "step": 4685, + "valid_targets_mean": 15599.7, + "valid_targets_min": 330 + }, + { + "epoch": 1.2516680010675207, + "grad_norm": 0.2513140469642916, + "learning_rate": 5.541988857653847e-05, + "loss": 0.5965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6032347679138184, + "step": 4690, + "valid_targets_mean": 15771.1, + "valid_targets_min": 695 + }, + { + "epoch": 1.2530024019215373, + "grad_norm": 0.24123673240298785, + "learning_rate": 5.5251311759018046e-05, + "loss": 0.5945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6128364205360413, + "step": 4695, + "valid_targets_mean": 15270.5, + "valid_targets_min": 578 + }, + { + "epoch": 1.2543368027755537, + "grad_norm": 0.22916415274619137, + "learning_rate": 5.508284207928879e-05, + "loss": 0.5964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6064445972442627, + "step": 4700, + "valid_targets_mean": 15476.5, + "valid_targets_min": 33 + }, + { + "epoch": 1.2556712036295703, + "grad_norm": 0.23691348003106713, + "learning_rate": 5.491448045130865e-05, + "loss": 0.5897, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5725358128547668, + "step": 4705, + "valid_targets_mean": 17270.2, + "valid_targets_min": 338 + }, + { + "epoch": 1.257005604483587, + "grad_norm": 0.19993496434571217, + "learning_rate": 5.4746227788449236e-05, + "loss": 0.5852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5608433485031128, + "step": 4710, + "valid_targets_mean": 17248.0, + "valid_targets_min": 268 + }, + { + "epoch": 1.2583400053376035, + "grad_norm": 0.19404118932882974, + "learning_rate": 5.457808500349115e-05, + "loss": 0.5992, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6061972379684448, + "step": 4715, + "valid_targets_mean": 15697.4, + "valid_targets_min": 286 + }, + { + "epoch": 1.2596744061916199, + "grad_norm": 0.20080011898223393, + "learning_rate": 5.441005300861887e-05, + "loss": 0.5964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6121039986610413, + "step": 4720, + "valid_targets_mean": 15350.3, + "valid_targets_min": 358 + }, + { + "epoch": 1.2610088070456364, + "grad_norm": 0.21027729915005294, + "learning_rate": 5.424213271541578e-05, + "loss": 0.6162, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6112270355224609, + "step": 4725, + "valid_targets_mean": 16553.9, + "valid_targets_min": 753 + }, + { + "epoch": 1.262343207899653, + "grad_norm": 0.19841926561522874, + "learning_rate": 5.4074325034859336e-05, + "loss": 0.5928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5819110870361328, + "step": 4730, + "valid_targets_mean": 15418.9, + "valid_targets_min": 382 + }, + { + "epoch": 1.2636776087536696, + "grad_norm": 0.19495520891773752, + "learning_rate": 5.390663087731605e-05, + "loss": 0.6071, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5915564894676208, + "step": 4735, + "valid_targets_mean": 16489.7, + "valid_targets_min": 986 + }, + { + "epoch": 1.2650120096076862, + "grad_norm": 0.28836513173381045, + "learning_rate": 5.3739051152536506e-05, + "loss": 0.5859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5791863203048706, + "step": 4740, + "valid_targets_mean": 16232.9, + "valid_targets_min": 60 + }, + { + "epoch": 1.2663464104617028, + "grad_norm": 0.25722341253251046, + "learning_rate": 5.357158676965059e-05, + "loss": 0.5996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6200342178344727, + "step": 4745, + "valid_targets_mean": 16703.4, + "valid_targets_min": 869 + }, + { + "epoch": 1.2676808113157192, + "grad_norm": 0.22747725453073225, + "learning_rate": 5.3404238637162364e-05, + "loss": 0.6024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6098017692565918, + "step": 4750, + "valid_targets_mean": 16243.7, + "valid_targets_min": 122 + }, + { + "epoch": 1.2690152121697358, + "grad_norm": 0.23271601612942164, + "learning_rate": 5.323700766294526e-05, + "loss": 0.5936, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5844199657440186, + "step": 4755, + "valid_targets_mean": 15059.6, + "valid_targets_min": 373 + }, + { + "epoch": 1.2703496130237524, + "grad_norm": 0.2282372019798268, + "learning_rate": 5.306989475423712e-05, + "loss": 0.5917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.596099853515625, + "step": 4760, + "valid_targets_mean": 16810.2, + "valid_targets_min": 675 + }, + { + "epoch": 1.2716840138777687, + "grad_norm": 0.22572255703523167, + "learning_rate": 5.2902900817635264e-05, + "loss": 0.6058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6014312505722046, + "step": 4765, + "valid_targets_mean": 14895.7, + "valid_targets_min": 407 + }, + { + "epoch": 1.2730184147317853, + "grad_norm": 0.28794370507115435, + "learning_rate": 5.273602675909159e-05, + "loss": 0.6186, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6221282482147217, + "step": 4770, + "valid_targets_mean": 16150.4, + "valid_targets_min": 583 + }, + { + "epoch": 1.274352815585802, + "grad_norm": 0.21205356922803897, + "learning_rate": 5.256927348390765e-05, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5996368527412415, + "step": 4775, + "valid_targets_mean": 16298.7, + "valid_targets_min": 234 + }, + { + "epoch": 1.2756872164398185, + "grad_norm": 0.21155388741611245, + "learning_rate": 5.24026418967297e-05, + "loss": 0.599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6262991428375244, + "step": 4780, + "valid_targets_mean": 15940.4, + "valid_targets_min": 288 + }, + { + "epoch": 1.2770216172938351, + "grad_norm": 0.22995007264829823, + "learning_rate": 5.2236132901543895e-05, + "loss": 0.5832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6046526432037354, + "step": 4785, + "valid_targets_mean": 15612.3, + "valid_targets_min": 241 + }, + { + "epoch": 1.2783560181478517, + "grad_norm": 0.3215664591779135, + "learning_rate": 5.2069747401671334e-05, + "loss": 0.595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6015994548797607, + "step": 4790, + "valid_targets_mean": 15822.1, + "valid_targets_min": 424 + }, + { + "epoch": 1.279690419001868, + "grad_norm": 0.24392939420188084, + "learning_rate": 5.1903486299763026e-05, + "loss": 0.6005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5739015936851501, + "step": 4795, + "valid_targets_mean": 16372.1, + "valid_targets_min": 628 + }, + { + "epoch": 1.2810248198558847, + "grad_norm": 0.25390096114052607, + "learning_rate": 5.173735049779523e-05, + "loss": 0.6083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5909823775291443, + "step": 4800, + "valid_targets_mean": 16781.5, + "valid_targets_min": 571 + }, + { + "epoch": 1.2823592207099013, + "grad_norm": 0.26585673297614587, + "learning_rate": 5.1571340897064454e-05, + "loss": 0.5984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6485387086868286, + "step": 4805, + "valid_targets_mean": 14960.3, + "valid_targets_min": 437 + }, + { + "epoch": 1.2836936215639179, + "grad_norm": 0.429583415938752, + "learning_rate": 5.140545839818242e-05, + "loss": 0.5876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5757549405097961, + "step": 4810, + "valid_targets_mean": 16498.8, + "valid_targets_min": 577 + }, + { + "epoch": 1.2850280224179342, + "grad_norm": 0.20010540211949035, + "learning_rate": 5.1239703901071506e-05, + "loss": 0.5784, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5868698358535767, + "step": 4815, + "valid_targets_mean": 16137.8, + "valid_targets_min": 573 + }, + { + "epoch": 1.2863624232719508, + "grad_norm": 0.277590468805937, + "learning_rate": 5.1074078304959474e-05, + "loss": 0.5942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5904673933982849, + "step": 4820, + "valid_targets_mean": 15318.7, + "valid_targets_min": 600 + }, + { + "epoch": 1.2876968241259674, + "grad_norm": 0.19379932646177, + "learning_rate": 5.090858250837495e-05, + "loss": 0.6019, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5824383497238159, + "step": 4825, + "valid_targets_mean": 15670.2, + "valid_targets_min": 690 + }, + { + "epoch": 1.289031224979984, + "grad_norm": 0.22667207340100606, + "learning_rate": 5.0743217409142344e-05, + "loss": 0.5932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.565783679485321, + "step": 4830, + "valid_targets_mean": 17687.1, + "valid_targets_min": 569 + }, + { + "epoch": 1.2903656258340006, + "grad_norm": 0.21887335909403685, + "learning_rate": 5.057798390437696e-05, + "loss": 0.6023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5865060091018677, + "step": 4835, + "valid_targets_mean": 17334.3, + "valid_targets_min": 531 + }, + { + "epoch": 1.2917000266880172, + "grad_norm": 0.19635681305442218, + "learning_rate": 5.0412882890480266e-05, + "loss": 0.5968, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5752499103546143, + "step": 4840, + "valid_targets_mean": 16667.8, + "valid_targets_min": 385 + }, + { + "epoch": 1.2930344275420336, + "grad_norm": 0.22509479283485295, + "learning_rate": 5.0247915263134984e-05, + "loss": 0.6027, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5966780781745911, + "step": 4845, + "valid_targets_mean": 16138.8, + "valid_targets_min": 539 + }, + { + "epoch": 1.2943688283960502, + "grad_norm": 0.22523252216211342, + "learning_rate": 5.0083081917300086e-05, + "loss": 0.6145, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6485409736633301, + "step": 4850, + "valid_targets_mean": 16019.0, + "valid_targets_min": 565 + }, + { + "epoch": 1.2957032292500668, + "grad_norm": 0.19342715348483416, + "learning_rate": 4.991838374720618e-05, + "loss": 0.6125, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5838373899459839, + "step": 4855, + "valid_targets_mean": 15989.9, + "valid_targets_min": 423 + }, + { + "epoch": 1.2970376301040831, + "grad_norm": 0.22246829854069744, + "learning_rate": 4.975382164635051e-05, + "loss": 0.5791, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5719879269599915, + "step": 4860, + "valid_targets_mean": 15469.9, + "valid_targets_min": 469 + }, + { + "epoch": 1.2983720309580997, + "grad_norm": 0.2253572157609349, + "learning_rate": 4.9589396507492044e-05, + "loss": 0.6033, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6229650974273682, + "step": 4865, + "valid_targets_mean": 16063.2, + "valid_targets_min": 581 + }, + { + "epoch": 1.2997064318121163, + "grad_norm": 0.17878954418677784, + "learning_rate": 4.942510922264686e-05, + "loss": 0.6003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.559048056602478, + "step": 4870, + "valid_targets_mean": 16705.4, + "valid_targets_min": 728 + }, + { + "epoch": 1.301040832666133, + "grad_norm": 0.2048965948022605, + "learning_rate": 4.926096068308312e-05, + "loss": 0.593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6001508235931396, + "step": 4875, + "valid_targets_mean": 15511.5, + "valid_targets_min": 238 + }, + { + "epoch": 1.3023752335201495, + "grad_norm": 0.23779288166871065, + "learning_rate": 4.90969517793162e-05, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.622168779373169, + "step": 4880, + "valid_targets_mean": 16736.6, + "valid_targets_min": 464 + }, + { + "epoch": 1.303709634374166, + "grad_norm": 0.21782401030658538, + "learning_rate": 4.893308340110407e-05, + "loss": 0.6022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5979602932929993, + "step": 4885, + "valid_targets_mean": 15912.7, + "valid_targets_min": 672 + }, + { + "epoch": 1.3050440352281825, + "grad_norm": 0.27079239859218573, + "learning_rate": 4.876935643744229e-05, + "loss": 0.6077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.662260115146637, + "step": 4890, + "valid_targets_mean": 15808.6, + "valid_targets_min": 521 + }, + { + "epoch": 1.306378436082199, + "grad_norm": 0.208975210660639, + "learning_rate": 4.860577177655922e-05, + "loss": 0.6017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6019346117973328, + "step": 4895, + "valid_targets_mean": 16212.6, + "valid_targets_min": 646 + }, + { + "epoch": 1.3077128369362157, + "grad_norm": 0.3092531887221787, + "learning_rate": 4.844233030591122e-05, + "loss": 0.5987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6115128397941589, + "step": 4900, + "valid_targets_mean": 16733.5, + "valid_targets_min": 607 + }, + { + "epoch": 1.3090472377902322, + "grad_norm": 0.23607040987981687, + "learning_rate": 4.827903291217785e-05, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.610486626625061, + "step": 4905, + "valid_targets_mean": 15933.8, + "valid_targets_min": 573 + }, + { + "epoch": 1.3103816386442486, + "grad_norm": 0.22198054742229872, + "learning_rate": 4.8115880481257066e-05, + "loss": 0.5979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5951927304267883, + "step": 4910, + "valid_targets_mean": 15765.8, + "valid_targets_min": 629 + }, + { + "epoch": 1.3117160394982652, + "grad_norm": 0.2359077023791005, + "learning_rate": 4.795287389826035e-05, + "loss": 0.5967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.566422700881958, + "step": 4915, + "valid_targets_mean": 16070.0, + "valid_targets_min": 261 + }, + { + "epoch": 1.3130504403522818, + "grad_norm": 0.23498321132713004, + "learning_rate": 4.779001404750797e-05, + "loss": 0.5878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.567772388458252, + "step": 4920, + "valid_targets_mean": 18758.8, + "valid_targets_min": 786 + }, + { + "epoch": 1.3143848412062984, + "grad_norm": 0.1865459120511662, + "learning_rate": 4.762730181252415e-05, + "loss": 0.6056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6111925840377808, + "step": 4925, + "valid_targets_mean": 15379.9, + "valid_targets_min": 514 + }, + { + "epoch": 1.315719242060315, + "grad_norm": 0.22937962717615007, + "learning_rate": 4.746473807603235e-05, + "loss": 0.581, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5950619578361511, + "step": 4930, + "valid_targets_mean": 14893.1, + "valid_targets_min": 435 + }, + { + "epoch": 1.3170536429143316, + "grad_norm": 0.20591200810593613, + "learning_rate": 4.730232371995029e-05, + "loss": 0.6075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.629429042339325, + "step": 4935, + "valid_targets_mean": 15851.1, + "valid_targets_min": 443 + }, + { + "epoch": 1.318388043768348, + "grad_norm": 0.21808347777891596, + "learning_rate": 4.714005962538543e-05, + "loss": 0.6037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5948023200035095, + "step": 4940, + "valid_targets_mean": 16424.6, + "valid_targets_min": 581 + }, + { + "epoch": 1.3197224446223645, + "grad_norm": 0.20745975595609303, + "learning_rate": 4.6977946672630004e-05, + "loss": 0.6063, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5832745432853699, + "step": 4945, + "valid_targets_mean": 14841.7, + "valid_targets_min": 831 + }, + { + "epoch": 1.3210568454763811, + "grad_norm": 0.2122108754462692, + "learning_rate": 4.681598574115622e-05, + "loss": 0.6076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6011431813240051, + "step": 4950, + "valid_targets_mean": 14942.2, + "valid_targets_min": 491 + }, + { + "epoch": 1.3223912463303977, + "grad_norm": 0.21177215134869198, + "learning_rate": 4.665417770961166e-05, + "loss": 0.5986, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5770174264907837, + "step": 4955, + "valid_targets_mean": 16438.4, + "valid_targets_min": 937 + }, + { + "epoch": 1.323725647184414, + "grad_norm": 0.2055154833404559, + "learning_rate": 4.6492523455814415e-05, + "loss": 0.5879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5913348197937012, + "step": 4960, + "valid_targets_mean": 15420.0, + "valid_targets_min": 488 + }, + { + "epoch": 1.3250600480384307, + "grad_norm": 0.20887288536757667, + "learning_rate": 4.633102385674821e-05, + "loss": 0.5941, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5890672206878662, + "step": 4965, + "valid_targets_mean": 16079.2, + "valid_targets_min": 539 + }, + { + "epoch": 1.3263944488924473, + "grad_norm": 0.2011370090756563, + "learning_rate": 4.616967978855788e-05, + "loss": 0.5929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.579448938369751, + "step": 4970, + "valid_targets_mean": 14828.5, + "valid_targets_min": 266 + }, + { + "epoch": 1.3277288497464639, + "grad_norm": 0.2214769709247002, + "learning_rate": 4.6008492126544476e-05, + "loss": 0.5828, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6091501116752625, + "step": 4975, + "valid_targets_mean": 15823.4, + "valid_targets_min": 655 + }, + { + "epoch": 1.3290632506004805, + "grad_norm": 0.21158836520940907, + "learning_rate": 4.584746174516045e-05, + "loss": 0.6022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6131697297096252, + "step": 4980, + "valid_targets_mean": 15405.0, + "valid_targets_min": 235 + }, + { + "epoch": 1.330397651454497, + "grad_norm": 0.24173405329840256, + "learning_rate": 4.568658951800512e-05, + "loss": 0.5843, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6034678220748901, + "step": 4985, + "valid_targets_mean": 16839.0, + "valid_targets_min": 494 + }, + { + "epoch": 1.3317320523085134, + "grad_norm": 0.23491746410533076, + "learning_rate": 4.552587631781969e-05, + "loss": 0.6073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6017293930053711, + "step": 4990, + "valid_targets_mean": 16098.4, + "valid_targets_min": 40 + }, + { + "epoch": 1.33306645316253, + "grad_norm": 0.253333964366688, + "learning_rate": 4.536532301648271e-05, + "loss": 0.5901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6172199249267578, + "step": 4995, + "valid_targets_mean": 15348.4, + "valid_targets_min": 582 + }, + { + "epoch": 1.3344008540165466, + "grad_norm": 0.19692619276908743, + "learning_rate": 4.5204930485005306e-05, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6032106280326843, + "step": 5000, + "valid_targets_mean": 16151.9, + "valid_targets_min": 393 + }, + { + "epoch": 1.335735254870563, + "grad_norm": 0.20788187256604537, + "learning_rate": 4.504469959352627e-05, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5894028544425964, + "step": 5005, + "valid_targets_mean": 14931.8, + "valid_targets_min": 466 + }, + { + "epoch": 1.3370696557245796, + "grad_norm": 0.36348244446202216, + "learning_rate": 4.488463121130762e-05, + "loss": 0.5977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.605487585067749, + "step": 5010, + "valid_targets_mean": 16289.8, + "valid_targets_min": 899 + }, + { + "epoch": 1.3384040565785962, + "grad_norm": 0.23102762914503286, + "learning_rate": 4.472472620672976e-05, + "loss": 0.5918, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6059518456459045, + "step": 5015, + "valid_targets_mean": 16090.9, + "valid_targets_min": 639 + }, + { + "epoch": 1.3397384574326128, + "grad_norm": 0.23526289831427483, + "learning_rate": 4.4564985447286614e-05, + "loss": 0.6004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6051850318908691, + "step": 5020, + "valid_targets_mean": 15910.4, + "valid_targets_min": 417 + }, + { + "epoch": 1.3410728582866294, + "grad_norm": 0.2825165428791914, + "learning_rate": 4.440540979958124e-05, + "loss": 0.6061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6242756843566895, + "step": 5025, + "valid_targets_mean": 15441.1, + "valid_targets_min": 361 + }, + { + "epoch": 1.342407259140646, + "grad_norm": 0.2192602545171049, + "learning_rate": 4.4246000129320867e-05, + "loss": 0.5899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.585957407951355, + "step": 5030, + "valid_targets_mean": 16634.4, + "valid_targets_min": 463 + }, + { + "epoch": 1.3437416599946623, + "grad_norm": 0.26457067121397165, + "learning_rate": 4.408675730131227e-05, + "loss": 0.6129, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6116036176681519, + "step": 5035, + "valid_targets_mean": 15448.4, + "valid_targets_min": 504 + }, + { + "epoch": 1.345076060848679, + "grad_norm": 0.22036978697881862, + "learning_rate": 4.3927682179457144e-05, + "loss": 0.6047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6069991588592529, + "step": 5040, + "valid_targets_mean": 15667.9, + "valid_targets_min": 768 + }, + { + "epoch": 1.3464104617026955, + "grad_norm": 0.20238586364496838, + "learning_rate": 4.376877562674737e-05, + "loss": 0.6056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5942937135696411, + "step": 5045, + "valid_targets_mean": 16723.7, + "valid_targets_min": 631 + }, + { + "epoch": 1.347744862556712, + "grad_norm": 0.2126814911909632, + "learning_rate": 4.3610038505260264e-05, + "loss": 0.6056, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6149522066116333, + "step": 5050, + "valid_targets_mean": 14714.7, + "valid_targets_min": 482 + }, + { + "epoch": 1.3490792634107285, + "grad_norm": 0.20604689807287094, + "learning_rate": 4.3451471676154035e-05, + "loss": 0.5998, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6014049053192139, + "step": 5055, + "valid_targets_mean": 15980.6, + "valid_targets_min": 162 + }, + { + "epoch": 1.350413664264745, + "grad_norm": 0.20624419122922974, + "learning_rate": 4.329307599966306e-05, + "loss": 0.5861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5753385424613953, + "step": 5060, + "valid_targets_mean": 16103.3, + "valid_targets_min": 630 + }, + { + "epoch": 1.3517480651187617, + "grad_norm": 0.220186367340207, + "learning_rate": 4.313485233509309e-05, + "loss": 0.6008, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5982659459114075, + "step": 5065, + "valid_targets_mean": 16369.3, + "valid_targets_min": 374 + }, + { + "epoch": 1.3530824659727783, + "grad_norm": 0.24604574295768564, + "learning_rate": 4.297680154081686e-05, + "loss": 0.5961, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5799025297164917, + "step": 5070, + "valid_targets_mean": 15543.4, + "valid_targets_min": 284 + }, + { + "epoch": 1.3544168668267949, + "grad_norm": 0.2233422233797041, + "learning_rate": 4.2818924474269126e-05, + "loss": 0.5814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5851439833641052, + "step": 5075, + "valid_targets_mean": 16586.4, + "valid_targets_min": 608 + }, + { + "epoch": 1.3557512676808114, + "grad_norm": 0.20406773644050366, + "learning_rate": 4.266122199194226e-05, + "loss": 0.5819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5653451681137085, + "step": 5080, + "valid_targets_mean": 17330.1, + "valid_targets_min": 870 + }, + { + "epoch": 1.3570856685348278, + "grad_norm": 0.22946144750187072, + "learning_rate": 4.250369494938146e-05, + "loss": 0.5979, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5864439606666565, + "step": 5085, + "valid_targets_mean": 15451.2, + "valid_targets_min": 434 + }, + { + "epoch": 1.3584200693888444, + "grad_norm": 0.2431015210548431, + "learning_rate": 4.234634420118021e-05, + "loss": 0.6068, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.623619019985199, + "step": 5090, + "valid_targets_mean": 15702.2, + "valid_targets_min": 660 + }, + { + "epoch": 1.359754470242861, + "grad_norm": 0.17903038907752314, + "learning_rate": 4.218917060097547e-05, + "loss": 0.5945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5696024298667908, + "step": 5095, + "valid_targets_mean": 16674.5, + "valid_targets_min": 100 + }, + { + "epoch": 1.3610888710968774, + "grad_norm": 0.1715613252946905, + "learning_rate": 4.203217500144326e-05, + "loss": 0.5893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5678576827049255, + "step": 5100, + "valid_targets_mean": 16900.0, + "valid_targets_min": 490 + }, + { + "epoch": 1.362423271950894, + "grad_norm": 0.18937189520289122, + "learning_rate": 4.187535825429396e-05, + "loss": 0.6088, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6141047477722168, + "step": 5105, + "valid_targets_mean": 15568.6, + "valid_targets_min": 638 + }, + { + "epoch": 1.3637576728049106, + "grad_norm": 0.18294726253792917, + "learning_rate": 4.171872121026753e-05, + "loss": 0.5972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6077937483787537, + "step": 5110, + "valid_targets_mean": 15063.0, + "valid_targets_min": 708 + }, + { + "epoch": 1.3650920736589272, + "grad_norm": 0.1987739881577311, + "learning_rate": 4.1562264719129165e-05, + "loss": 0.593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5811140537261963, + "step": 5115, + "valid_targets_mean": 16650.8, + "valid_targets_min": 432 + }, + { + "epoch": 1.3664264745129437, + "grad_norm": 0.2080084244520698, + "learning_rate": 4.140598962966447e-05, + "loss": 0.596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5925748348236084, + "step": 5120, + "valid_targets_mean": 14376.4, + "valid_targets_min": 540 + }, + { + "epoch": 1.3677608753669603, + "grad_norm": 0.31546162795988003, + "learning_rate": 4.124989678967503e-05, + "loss": 0.5977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6151330471038818, + "step": 5125, + "valid_targets_mean": 16339.4, + "valid_targets_min": 447 + }, + { + "epoch": 1.3690952762209767, + "grad_norm": 0.23693111572394246, + "learning_rate": 4.109398704597357e-05, + "loss": 0.5867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5888723731040955, + "step": 5130, + "valid_targets_mean": 16056.1, + "valid_targets_min": 394 + }, + { + "epoch": 1.3704296770749933, + "grad_norm": 0.21582845063895006, + "learning_rate": 4.093826124437962e-05, + "loss": 0.589, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5797953009605408, + "step": 5135, + "valid_targets_mean": 16444.4, + "valid_targets_min": 119 + }, + { + "epoch": 1.37176407792901, + "grad_norm": 0.22102332173033082, + "learning_rate": 4.078272022971481e-05, + "loss": 0.6006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5976300239562988, + "step": 5140, + "valid_targets_mean": 15232.9, + "valid_targets_min": 433 + }, + { + "epoch": 1.3730984787830265, + "grad_norm": 0.21257064967375525, + "learning_rate": 4.06273648457982e-05, + "loss": 0.6014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6460756063461304, + "step": 5145, + "valid_targets_mean": 14771.5, + "valid_targets_min": 649 + }, + { + "epoch": 1.3744328796370429, + "grad_norm": 0.21938234079342284, + "learning_rate": 4.0472195935441904e-05, + "loss": 0.586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6117610931396484, + "step": 5150, + "valid_targets_mean": 16004.5, + "valid_targets_min": 512 + }, + { + "epoch": 1.3757672804910595, + "grad_norm": 0.23306877868076897, + "learning_rate": 4.031721434044635e-05, + "loss": 0.5996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6196531057357788, + "step": 5155, + "valid_targets_mean": 15975.8, + "valid_targets_min": 618 + }, + { + "epoch": 1.377101681345076, + "grad_norm": 0.19937402973955345, + "learning_rate": 4.016242090159574e-05, + "loss": 0.6038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5912162065505981, + "step": 5160, + "valid_targets_mean": 15855.6, + "valid_targets_min": 262 + }, + { + "epoch": 1.3784360821990926, + "grad_norm": 0.16528255884024484, + "learning_rate": 4.0007816458653566e-05, + "loss": 0.6015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5705872178077698, + "step": 5165, + "valid_targets_mean": 16436.0, + "valid_targets_min": 262 + }, + { + "epoch": 1.3797704830531092, + "grad_norm": 0.2305999394156692, + "learning_rate": 3.9853401850358036e-05, + "loss": 0.596, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5944071412086487, + "step": 5170, + "valid_targets_mean": 16191.2, + "valid_targets_min": 349 + }, + { + "epoch": 1.3811048839071258, + "grad_norm": 0.22219990738356493, + "learning_rate": 3.969917791441739e-05, + "loss": 0.5981, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5921786427497864, + "step": 5175, + "valid_targets_mean": 17374.1, + "valid_targets_min": 268 + }, + { + "epoch": 1.3824392847611422, + "grad_norm": 0.21281241031463616, + "learning_rate": 3.954514548750553e-05, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6060578227043152, + "step": 5180, + "valid_targets_mean": 16728.2, + "valid_targets_min": 293 + }, + { + "epoch": 1.3837736856151588, + "grad_norm": 0.21240254524115104, + "learning_rate": 3.939130540525746e-05, + "loss": 0.5907, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5911335945129395, + "step": 5185, + "valid_targets_mean": 16488.3, + "valid_targets_min": 554 + }, + { + "epoch": 1.3851080864691754, + "grad_norm": 0.19390611371519534, + "learning_rate": 3.923765850226456e-05, + "loss": 0.5861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5753046274185181, + "step": 5190, + "valid_targets_mean": 16045.1, + "valid_targets_min": 671 + }, + { + "epoch": 1.3864424873231918, + "grad_norm": 0.20217722105575986, + "learning_rate": 3.908420561207032e-05, + "loss": 0.5892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6015340089797974, + "step": 5195, + "valid_targets_mean": 15448.1, + "valid_targets_min": 556 + }, + { + "epoch": 1.3877768881772083, + "grad_norm": 0.237505877780031, + "learning_rate": 3.893094756716569e-05, + "loss": 0.6142, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6200620532035828, + "step": 5200, + "valid_targets_mean": 14185.8, + "valid_targets_min": 687 + }, + { + "epoch": 1.389111289031225, + "grad_norm": 0.3198811804284461, + "learning_rate": 3.87778851989845e-05, + "loss": 0.6024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5919672250747681, + "step": 5205, + "valid_targets_mean": 17366.0, + "valid_targets_min": 635 + }, + { + "epoch": 1.3904456898852415, + "grad_norm": 0.2103159972730984, + "learning_rate": 3.862501933789908e-05, + "loss": 0.5973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6027743816375732, + "step": 5210, + "valid_targets_mean": 15103.6, + "valid_targets_min": 474 + }, + { + "epoch": 1.3917800907392581, + "grad_norm": 0.24002562914948206, + "learning_rate": 3.847235081321573e-05, + "loss": 0.5952, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5700179934501648, + "step": 5215, + "valid_targets_mean": 17431.1, + "valid_targets_min": 204 + }, + { + "epoch": 1.3931144915932747, + "grad_norm": 0.1611356551754476, + "learning_rate": 3.831988045317007e-05, + "loss": 0.5938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5655096769332886, + "step": 5220, + "valid_targets_mean": 16851.1, + "valid_targets_min": 506 + }, + { + "epoch": 1.394448892447291, + "grad_norm": 0.263787542839795, + "learning_rate": 3.816760908492282e-05, + "loss": 0.6054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.590351939201355, + "step": 5225, + "valid_targets_mean": 16870.1, + "valid_targets_min": 645 + }, + { + "epoch": 1.3957832933013077, + "grad_norm": 0.22225719444101186, + "learning_rate": 3.8015537534555e-05, + "loss": 0.5886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6013718247413635, + "step": 5230, + "valid_targets_mean": 15676.9, + "valid_targets_min": 389 + }, + { + "epoch": 1.3971176941553243, + "grad_norm": 0.18685737512531117, + "learning_rate": 3.786366662706372e-05, + "loss": 0.598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5739297866821289, + "step": 5235, + "valid_targets_mean": 15324.5, + "valid_targets_min": 84 + }, + { + "epoch": 1.3984520950093409, + "grad_norm": 0.16037104282602255, + "learning_rate": 3.771199718635758e-05, + "loss": 0.5837, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5539162755012512, + "step": 5240, + "valid_targets_mean": 18008.3, + "valid_targets_min": 298 + }, + { + "epoch": 1.3997864958633572, + "grad_norm": 0.29003098065924876, + "learning_rate": 3.756053003525213e-05, + "loss": 0.6062, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6276518106460571, + "step": 5245, + "valid_targets_mean": 15736.6, + "valid_targets_min": 687 + }, + { + "epoch": 1.4011208967173738, + "grad_norm": 0.20843741485202597, + "learning_rate": 3.7409265995465577e-05, + "loss": 0.6059, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6018944978713989, + "step": 5250, + "valid_targets_mean": 15948.7, + "valid_targets_min": 483 + }, + { + "epoch": 1.4024552975713904, + "grad_norm": 0.18513610440099582, + "learning_rate": 3.725820588761422e-05, + "loss": 0.6073, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6068531274795532, + "step": 5255, + "valid_targets_mean": 16082.1, + "valid_targets_min": 457 + }, + { + "epoch": 1.403789698425407, + "grad_norm": 0.20095844719914072, + "learning_rate": 3.7107350531207944e-05, + "loss": 0.6076, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6160079836845398, + "step": 5260, + "valid_targets_mean": 15276.1, + "valid_targets_min": 584 + }, + { + "epoch": 1.4051240992794236, + "grad_norm": 0.20259429006491972, + "learning_rate": 3.6956700744645934e-05, + "loss": 0.5942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.597230851650238, + "step": 5265, + "valid_targets_mean": 16055.2, + "valid_targets_min": 258 + }, + { + "epoch": 1.4064585001334402, + "grad_norm": 0.1892258550707547, + "learning_rate": 3.6806257345212136e-05, + "loss": 0.5898, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5700638294219971, + "step": 5270, + "valid_targets_mean": 17513.9, + "valid_targets_min": 595 + }, + { + "epoch": 1.4077929009874566, + "grad_norm": 0.23737922547821871, + "learning_rate": 3.665602114907075e-05, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5867282152175903, + "step": 5275, + "valid_targets_mean": 16111.4, + "valid_targets_min": 383 + }, + { + "epoch": 1.4091273018414732, + "grad_norm": 0.17824476807657583, + "learning_rate": 3.650599297126198e-05, + "loss": 0.6023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6063085794448853, + "step": 5280, + "valid_targets_mean": 16692.3, + "valid_targets_min": 619 + }, + { + "epoch": 1.4104617026954898, + "grad_norm": 0.32076707277791566, + "learning_rate": 3.63561736256975e-05, + "loss": 0.6002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5818400979042053, + "step": 5285, + "valid_targets_mean": 16016.4, + "valid_targets_min": 355 + }, + { + "epoch": 1.4117961035495064, + "grad_norm": 0.2886623838106024, + "learning_rate": 3.6206563925156e-05, + "loss": 0.601, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5962020754814148, + "step": 5290, + "valid_targets_mean": 16352.5, + "valid_targets_min": 527 + }, + { + "epoch": 1.4131305044035227, + "grad_norm": 0.22448882632941783, + "learning_rate": 3.605716468127889e-05, + "loss": 0.5908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5873814225196838, + "step": 5295, + "valid_targets_mean": 16176.9, + "valid_targets_min": 507 + }, + { + "epoch": 1.4144649052575393, + "grad_norm": 0.1974506656033717, + "learning_rate": 3.590797670456586e-05, + "loss": 0.5883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5660135746002197, + "step": 5300, + "valid_targets_mean": 16553.2, + "valid_targets_min": 796 + }, + { + "epoch": 1.415799306111556, + "grad_norm": 0.19723366786559937, + "learning_rate": 3.575900080437036e-05, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5775608420372009, + "step": 5305, + "valid_targets_mean": 17046.9, + "valid_targets_min": 697 + }, + { + "epoch": 1.4171337069655725, + "grad_norm": 0.16682747011523738, + "learning_rate": 3.561023778889545e-05, + "loss": 0.5867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5756033658981323, + "step": 5310, + "valid_targets_mean": 16093.6, + "valid_targets_min": 438 + }, + { + "epoch": 1.418468107819589, + "grad_norm": 0.18365559629082295, + "learning_rate": 3.546168846518915e-05, + "loss": 0.5905, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5974948406219482, + "step": 5315, + "valid_targets_mean": 16326.9, + "valid_targets_min": 676 + }, + { + "epoch": 1.4198025086736055, + "grad_norm": 0.19089087086415163, + "learning_rate": 3.531335363914027e-05, + "loss": 0.5893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6205319166183472, + "step": 5320, + "valid_targets_mean": 15791.9, + "valid_targets_min": 708 + }, + { + "epoch": 1.421136909527622, + "grad_norm": 0.19662505005309017, + "learning_rate": 3.516523411547397e-05, + "loss": 0.6034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5730395317077637, + "step": 5325, + "valid_targets_mean": 15740.1, + "valid_targets_min": 447 + }, + { + "epoch": 1.4224713103816387, + "grad_norm": 0.18149916207996997, + "learning_rate": 3.5017330697747276e-05, + "loss": 0.5959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6132838726043701, + "step": 5330, + "valid_targets_mean": 15944.4, + "valid_targets_min": 322 + }, + { + "epoch": 1.4238057112356552, + "grad_norm": 0.20843189835772197, + "learning_rate": 3.486964418834495e-05, + "loss": 0.5995, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.589570939540863, + "step": 5335, + "valid_targets_mean": 14380.5, + "valid_targets_min": 32 + }, + { + "epoch": 1.4251401120896716, + "grad_norm": 0.16785233882242875, + "learning_rate": 3.472217538847496e-05, + "loss": 0.5976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6078864336013794, + "step": 5340, + "valid_targets_mean": 16013.7, + "valid_targets_min": 535 + }, + { + "epoch": 1.4264745129436882, + "grad_norm": 0.1908103124634614, + "learning_rate": 3.457492509816416e-05, + "loss": 0.5888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5652427673339844, + "step": 5345, + "valid_targets_mean": 15611.4, + "valid_targets_min": 697 + }, + { + "epoch": 1.4278089137977048, + "grad_norm": 0.21767883656025544, + "learning_rate": 3.442789411625402e-05, + "loss": 0.6041, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5779842734336853, + "step": 5350, + "valid_targets_mean": 15840.2, + "valid_targets_min": 470 + }, + { + "epoch": 1.4291433146517214, + "grad_norm": 0.22827072357848074, + "learning_rate": 3.428108324039626e-05, + "loss": 0.6022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5914899706840515, + "step": 5355, + "valid_targets_mean": 17542.0, + "valid_targets_min": 688 + }, + { + "epoch": 1.430477715505738, + "grad_norm": 0.21643481421261868, + "learning_rate": 3.413449326704843e-05, + "loss": 0.5765, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5556655526161194, + "step": 5360, + "valid_targets_mean": 16455.6, + "valid_targets_min": 489 + }, + { + "epoch": 1.4318121163597546, + "grad_norm": 0.19922598541740116, + "learning_rate": 3.3988124991469764e-05, + "loss": 0.6153, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6300039291381836, + "step": 5365, + "valid_targets_mean": 15127.3, + "valid_targets_min": 357 + }, + { + "epoch": 1.433146517213771, + "grad_norm": 0.1635470558764958, + "learning_rate": 3.384197920771676e-05, + "loss": 0.5835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5532587170600891, + "step": 5370, + "valid_targets_mean": 18515.0, + "valid_targets_min": 504 + }, + { + "epoch": 1.4344809180677875, + "grad_norm": 0.23513178207713545, + "learning_rate": 3.36960567086388e-05, + "loss": 0.6115, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6326612830162048, + "step": 5375, + "valid_targets_mean": 15665.2, + "valid_targets_min": 526 + }, + { + "epoch": 1.4358153189218041, + "grad_norm": 0.23912023489322257, + "learning_rate": 3.355035828587403e-05, + "loss": 0.5911, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6104973554611206, + "step": 5380, + "valid_targets_mean": 15362.2, + "valid_targets_min": 407 + }, + { + "epoch": 1.4371497197758207, + "grad_norm": 0.20331336753143553, + "learning_rate": 3.340488472984493e-05, + "loss": 0.5891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6072074770927429, + "step": 5385, + "valid_targets_mean": 15468.0, + "valid_targets_min": 171 + }, + { + "epoch": 1.438484120629837, + "grad_norm": 0.22083205722667518, + "learning_rate": 3.3259636829754086e-05, + "loss": 0.5966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.593048095703125, + "step": 5390, + "valid_targets_mean": 15959.7, + "valid_targets_min": 494 + }, + { + "epoch": 1.4398185214838537, + "grad_norm": 0.19609468469659475, + "learning_rate": 3.3114615373579827e-05, + "loss": 0.5841, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.602197527885437, + "step": 5395, + "valid_targets_mean": 16073.3, + "valid_targets_min": 443 + }, + { + "epoch": 1.4411529223378703, + "grad_norm": 0.25854344244132677, + "learning_rate": 3.296982114807207e-05, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6135181188583374, + "step": 5400, + "valid_targets_mean": 15603.4, + "valid_targets_min": 553 + }, + { + "epoch": 1.4424873231918869, + "grad_norm": 0.19332611302622635, + "learning_rate": 3.282525493874798e-05, + "loss": 0.5931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5894027352333069, + "step": 5405, + "valid_targets_mean": 15872.3, + "valid_targets_min": 389 + }, + { + "epoch": 1.4438217240459035, + "grad_norm": 0.23148888062136433, + "learning_rate": 3.2680917529887746e-05, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5799127817153931, + "step": 5410, + "valid_targets_mean": 17129.0, + "valid_targets_min": 726 + }, + { + "epoch": 1.44515612489992, + "grad_norm": 0.1671400646116706, + "learning_rate": 3.2536809704530206e-05, + "loss": 0.5807, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5970917344093323, + "step": 5415, + "valid_targets_mean": 16345.1, + "valid_targets_min": 383 + }, + { + "epoch": 1.4464905257539364, + "grad_norm": 0.18397653462430913, + "learning_rate": 3.239293224446879e-05, + "loss": 0.5964, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5879602432250977, + "step": 5420, + "valid_targets_mean": 16521.5, + "valid_targets_min": 676 + }, + { + "epoch": 1.447824926607953, + "grad_norm": 0.20694154995459813, + "learning_rate": 3.224928593024719e-05, + "loss": 0.5842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.569869339466095, + "step": 5425, + "valid_targets_mean": 16836.6, + "valid_targets_min": 301 + }, + { + "epoch": 1.4491593274619696, + "grad_norm": 0.20357671075946887, + "learning_rate": 3.210587154115501e-05, + "loss": 0.6061, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5855426788330078, + "step": 5430, + "valid_targets_mean": 16225.1, + "valid_targets_min": 708 + }, + { + "epoch": 1.450493728315986, + "grad_norm": 0.18250478657118246, + "learning_rate": 3.196268985522376e-05, + "loss": 0.5967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.578062891960144, + "step": 5435, + "valid_targets_mean": 15699.8, + "valid_targets_min": 617 + }, + { + "epoch": 1.4518281291700026, + "grad_norm": 0.19470223738557854, + "learning_rate": 3.1819741649222485e-05, + "loss": 0.5873, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5918402671813965, + "step": 5440, + "valid_targets_mean": 15734.7, + "valid_targets_min": 299 + }, + { + "epoch": 1.4531625300240192, + "grad_norm": 0.18052433407931184, + "learning_rate": 3.167702769865354e-05, + "loss": 0.6164, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6201403141021729, + "step": 5445, + "valid_targets_mean": 16596.1, + "valid_targets_min": 449 + }, + { + "epoch": 1.4544969308780358, + "grad_norm": 0.18538396940027405, + "learning_rate": 3.153454877774849e-05, + "loss": 0.5957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5928632020950317, + "step": 5450, + "valid_targets_mean": 16370.0, + "valid_targets_min": 359 + }, + { + "epoch": 1.4558313317320524, + "grad_norm": 0.19658172576763985, + "learning_rate": 3.139230565946387e-05, + "loss": 0.5899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5843933820724487, + "step": 5455, + "valid_targets_mean": 15637.9, + "valid_targets_min": 726 + }, + { + "epoch": 1.457165732586069, + "grad_norm": 0.1831526268026529, + "learning_rate": 3.1250299115476874e-05, + "loss": 0.6072, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5988274812698364, + "step": 5460, + "valid_targets_mean": 15774.7, + "valid_targets_min": 696 + }, + { + "epoch": 1.4585001334400853, + "grad_norm": 0.19210346886635393, + "learning_rate": 3.110852991618135e-05, + "loss": 0.5976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5973889231681824, + "step": 5465, + "valid_targets_mean": 15370.5, + "valid_targets_min": 533 + }, + { + "epoch": 1.459834534294102, + "grad_norm": 0.20169036516535757, + "learning_rate": 3.0966998830683536e-05, + "loss": 0.5945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6419908404350281, + "step": 5470, + "valid_targets_mean": 15717.3, + "valid_targets_min": 286 + }, + { + "epoch": 1.4611689351481185, + "grad_norm": 0.20011851692619234, + "learning_rate": 3.082570662679782e-05, + "loss": 0.591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6058547496795654, + "step": 5475, + "valid_targets_mean": 15943.1, + "valid_targets_min": 368 + }, + { + "epoch": 1.4625033360021351, + "grad_norm": 0.19040363954948747, + "learning_rate": 3.068465407104275e-05, + "loss": 0.5945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5980136394500732, + "step": 5480, + "valid_targets_mean": 16190.1, + "valid_targets_min": 496 + }, + { + "epoch": 1.4638377368561515, + "grad_norm": 0.18646996658321627, + "learning_rate": 3.054384192863664e-05, + "loss": 0.5788, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5953836441040039, + "step": 5485, + "valid_targets_mean": 15646.8, + "valid_targets_min": 423 + }, + { + "epoch": 1.465172137710168, + "grad_norm": 0.207569334773845, + "learning_rate": 3.0403270963493657e-05, + "loss": 0.5879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6002626419067383, + "step": 5490, + "valid_targets_mean": 15257.1, + "valid_targets_min": 338 + }, + { + "epoch": 1.4665065385641847, + "grad_norm": 0.22537560589636887, + "learning_rate": 3.026294193821954e-05, + "loss": 0.5984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6118378639221191, + "step": 5495, + "valid_targets_mean": 14416.0, + "valid_targets_min": 683 + }, + { + "epoch": 1.4678409394182013, + "grad_norm": 0.16379355795931236, + "learning_rate": 3.012285561410742e-05, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6207247376441956, + "step": 5500, + "valid_targets_mean": 16059.9, + "valid_targets_min": 588 + }, + { + "epoch": 1.4691753402722179, + "grad_norm": 0.2080506615201531, + "learning_rate": 2.9983012751133852e-05, + "loss": 0.5937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5791140794754028, + "step": 5505, + "valid_targets_mean": 16530.1, + "valid_targets_min": 523 + }, + { + "epoch": 1.4705097411262344, + "grad_norm": 0.19122494750135094, + "learning_rate": 2.9843414107954588e-05, + "loss": 0.586, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5696684718132019, + "step": 5510, + "valid_targets_mean": 17553.1, + "valid_targets_min": 389 + }, + { + "epoch": 1.4718441419802508, + "grad_norm": 0.19492474448887173, + "learning_rate": 2.9704060441900402e-05, + "loss": 0.6058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6235105395317078, + "step": 5515, + "valid_targets_mean": 15722.7, + "valid_targets_min": 628 + }, + { + "epoch": 1.4731785428342674, + "grad_norm": 0.19044348278999745, + "learning_rate": 2.956495250897311e-05, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5901477336883545, + "step": 5520, + "valid_targets_mean": 15814.6, + "valid_targets_min": 574 + }, + { + "epoch": 1.474512943688284, + "grad_norm": 0.2750435525308448, + "learning_rate": 2.9426091063841444e-05, + "loss": 0.5716, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5935043096542358, + "step": 5525, + "valid_targets_mean": 16115.7, + "valid_targets_min": 649 + }, + { + "epoch": 1.4758473445423004, + "grad_norm": 0.23200701546196978, + "learning_rate": 2.9287476859836817e-05, + "loss": 0.5956, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.594383955001831, + "step": 5530, + "valid_targets_mean": 15149.1, + "valid_targets_min": 760 + }, + { + "epoch": 1.477181745396317, + "grad_norm": 0.27083238636421597, + "learning_rate": 2.9149110648949447e-05, + "loss": 0.6053, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6178330183029175, + "step": 5535, + "valid_targets_mean": 15509.2, + "valid_targets_min": 501 + }, + { + "epoch": 1.4785161462503336, + "grad_norm": 0.21162805713737548, + "learning_rate": 2.9010993181824158e-05, + "loss": 0.5969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.60970139503479, + "step": 5540, + "valid_targets_mean": 17768.8, + "valid_targets_min": 724 + }, + { + "epoch": 1.4798505471043502, + "grad_norm": 0.21777734779683613, + "learning_rate": 2.8873125207756255e-05, + "loss": 0.5957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5937681198120117, + "step": 5545, + "valid_targets_mean": 15974.1, + "valid_targets_min": 504 + }, + { + "epoch": 1.4811849479583667, + "grad_norm": 0.2114795871318019, + "learning_rate": 2.8735507474687603e-05, + "loss": 0.5978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5643002986907959, + "step": 5550, + "valid_targets_mean": 16197.7, + "valid_targets_min": 159 + }, + { + "epoch": 1.4825193488123833, + "grad_norm": 0.1561900761777701, + "learning_rate": 2.859814072920249e-05, + "loss": 0.5844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5664620995521545, + "step": 5555, + "valid_targets_mean": 16723.9, + "valid_targets_min": 553 + }, + { + "epoch": 1.4838537496663997, + "grad_norm": 0.21967858614223346, + "learning_rate": 2.846102571652352e-05, + "loss": 0.5988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5975771546363831, + "step": 5560, + "valid_targets_mean": 15892.9, + "valid_targets_min": 553 + }, + { + "epoch": 1.4851881505204163, + "grad_norm": 0.1709140812610374, + "learning_rate": 2.8324163180507716e-05, + "loss": 0.5953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5756304860115051, + "step": 5565, + "valid_targets_mean": 16787.1, + "valid_targets_min": 137 + }, + { + "epoch": 1.486522551374433, + "grad_norm": 0.24002195980945173, + "learning_rate": 2.8187553863642314e-05, + "loss": 0.5881, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5959300994873047, + "step": 5570, + "valid_targets_mean": 16814.7, + "valid_targets_min": 66 + }, + { + "epoch": 1.4878569522284495, + "grad_norm": 0.1824666847678956, + "learning_rate": 2.8051198507040876e-05, + "loss": 0.6051, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5945764780044556, + "step": 5575, + "valid_targets_mean": 16067.2, + "valid_targets_min": 688 + }, + { + "epoch": 1.4891913530824659, + "grad_norm": 0.2584334177787084, + "learning_rate": 2.7915097850439238e-05, + "loss": 0.5943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6012793779373169, + "step": 5580, + "valid_targets_mean": 17179.9, + "valid_targets_min": 501 + }, + { + "epoch": 1.4905257539364825, + "grad_norm": 0.18624677181070054, + "learning_rate": 2.7779252632191394e-05, + "loss": 0.5906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.597710371017456, + "step": 5585, + "valid_targets_mean": 16111.1, + "valid_targets_min": 132 + }, + { + "epoch": 1.491860154790499, + "grad_norm": 0.16420787753171032, + "learning_rate": 2.7643663589265642e-05, + "loss": 0.5987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6165971755981445, + "step": 5590, + "valid_targets_mean": 15712.7, + "valid_targets_min": 335 + }, + { + "epoch": 1.4931945556445156, + "grad_norm": 0.20323769592892854, + "learning_rate": 2.750833145724049e-05, + "loss": 0.605, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5955610275268555, + "step": 5595, + "valid_targets_mean": 16009.6, + "valid_targets_min": 599 + }, + { + "epoch": 1.4945289564985322, + "grad_norm": 0.202867279463156, + "learning_rate": 2.7373256970300663e-05, + "loss": 0.5993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6011368036270142, + "step": 5600, + "valid_targets_mean": 15059.6, + "valid_targets_min": 143 + }, + { + "epoch": 1.4958633573525488, + "grad_norm": 0.20246773736830392, + "learning_rate": 2.7238440861233176e-05, + "loss": 0.6093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6146905422210693, + "step": 5605, + "valid_targets_mean": 15709.0, + "valid_targets_min": 646 + }, + { + "epoch": 1.4971977582065652, + "grad_norm": 0.21797562189566266, + "learning_rate": 2.710388386142335e-05, + "loss": 0.603, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6222171783447266, + "step": 5610, + "valid_targets_mean": 16111.1, + "valid_targets_min": 743 + }, + { + "epoch": 1.4985321590605818, + "grad_norm": 0.21535300035765537, + "learning_rate": 2.6969586700850753e-05, + "loss": 0.6003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6006828546524048, + "step": 5615, + "valid_targets_mean": 16464.0, + "valid_targets_min": 948 + }, + { + "epoch": 1.4998665599145984, + "grad_norm": 0.1739006092855029, + "learning_rate": 2.6835550108085373e-05, + "loss": 0.5914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5925532579421997, + "step": 5620, + "valid_targets_mean": 15993.4, + "valid_targets_min": 618 + }, + { + "epoch": 1.5012009607686148, + "grad_norm": 0.17931968669047224, + "learning_rate": 2.67017748102836e-05, + "loss": 0.5887, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.575809895992279, + "step": 5625, + "valid_targets_mean": 16380.2, + "valid_targets_min": 120 + }, + { + "epoch": 1.5025353616226313, + "grad_norm": 0.23543154742608263, + "learning_rate": 2.6568261533184233e-05, + "loss": 0.6003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5761880874633789, + "step": 5630, + "valid_targets_mean": 16202.9, + "valid_targets_min": 678 + }, + { + "epoch": 1.503869762476648, + "grad_norm": 0.2439908369834107, + "learning_rate": 2.643501100110463e-05, + "loss": 0.5896, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5689970850944519, + "step": 5635, + "valid_targets_mean": 15896.8, + "valid_targets_min": 453 + }, + { + "epoch": 1.5052041633306645, + "grad_norm": 0.17114966912354662, + "learning_rate": 2.6302023936936776e-05, + "loss": 0.597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5948618650436401, + "step": 5640, + "valid_targets_mean": 15256.4, + "valid_targets_min": 279 + }, + { + "epoch": 1.5065385641846811, + "grad_norm": 0.19044671484603795, + "learning_rate": 2.616930106214323e-05, + "loss": 0.5937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.595179557800293, + "step": 5645, + "valid_targets_mean": 14453.9, + "valid_targets_min": 638 + }, + { + "epoch": 1.5078729650386977, + "grad_norm": 0.19342269370897394, + "learning_rate": 2.6036843096753394e-05, + "loss": 0.5876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5870005488395691, + "step": 5650, + "valid_targets_mean": 16089.0, + "valid_targets_min": 299 + }, + { + "epoch": 1.5092073658927143, + "grad_norm": 0.17657912515294857, + "learning_rate": 2.5904650759359528e-05, + "loss": 0.602, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5778599977493286, + "step": 5655, + "valid_targets_mean": 15060.4, + "valid_targets_min": 438 + }, + { + "epoch": 1.5105417667467307, + "grad_norm": 0.20241815062961938, + "learning_rate": 2.5772724767112753e-05, + "loss": 0.5901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5876519083976746, + "step": 5660, + "valid_targets_mean": 14550.5, + "valid_targets_min": 312 + }, + { + "epoch": 1.5118761676007473, + "grad_norm": 0.22708816876904175, + "learning_rate": 2.564106583571933e-05, + "loss": 0.6093, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6123473048210144, + "step": 5665, + "valid_targets_mean": 14711.3, + "valid_targets_min": 568 + }, + { + "epoch": 1.5132105684547636, + "grad_norm": 0.2055084291990726, + "learning_rate": 2.550967467943668e-05, + "loss": 0.5901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5626510381698608, + "step": 5670, + "valid_targets_mean": 16377.3, + "valid_targets_min": 296 + }, + { + "epoch": 1.5145449693087802, + "grad_norm": 0.19756636706354835, + "learning_rate": 2.537855201106955e-05, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5962499380111694, + "step": 5675, + "valid_targets_mean": 17226.2, + "valid_targets_min": 482 + }, + { + "epoch": 1.5158793701627968, + "grad_norm": 0.17030439598730115, + "learning_rate": 2.5247698541966066e-05, + "loss": 0.6044, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.605013370513916, + "step": 5680, + "valid_targets_mean": 15812.6, + "valid_targets_min": 572 + }, + { + "epoch": 1.5172137710168134, + "grad_norm": 0.1661861361650594, + "learning_rate": 2.511711498201397e-05, + "loss": 0.5948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6049402356147766, + "step": 5685, + "valid_targets_mean": 16516.9, + "valid_targets_min": 768 + }, + { + "epoch": 1.51854817187083, + "grad_norm": 0.2125530503596033, + "learning_rate": 2.4986802039636773e-05, + "loss": 0.5948, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5406869649887085, + "step": 5690, + "valid_targets_mean": 16043.2, + "valid_targets_min": 104 + }, + { + "epoch": 1.5198825727248466, + "grad_norm": 0.16553430129331403, + "learning_rate": 2.485676042178976e-05, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6006138920783997, + "step": 5695, + "valid_targets_mean": 15876.9, + "valid_targets_min": 741 + }, + { + "epoch": 1.5212169735788632, + "grad_norm": 0.17905158814387356, + "learning_rate": 2.4726990833956363e-05, + "loss": 0.6006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5899641513824463, + "step": 5700, + "valid_targets_mean": 14660.8, + "valid_targets_min": 469 + }, + { + "epoch": 1.5225513744328798, + "grad_norm": 0.17438147820585884, + "learning_rate": 2.45974939801442e-05, + "loss": 0.5886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5681999325752258, + "step": 5705, + "valid_targets_mean": 16089.6, + "valid_targets_min": 619 + }, + { + "epoch": 1.5238857752868962, + "grad_norm": 0.16255470219703333, + "learning_rate": 2.446827056288131e-05, + "loss": 0.5832, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6050971746444702, + "step": 5710, + "valid_targets_mean": 16768.1, + "valid_targets_min": 569 + }, + { + "epoch": 1.5252201761409128, + "grad_norm": 0.18263292032857117, + "learning_rate": 2.4339321283212276e-05, + "loss": 0.5965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6079804301261902, + "step": 5715, + "valid_targets_mean": 15433.3, + "valid_targets_min": 771 + }, + { + "epoch": 1.5265545769949291, + "grad_norm": 0.1532852778846096, + "learning_rate": 2.421064684069453e-05, + "loss": 0.6029, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5876133441925049, + "step": 5720, + "valid_targets_mean": 16846.8, + "valid_targets_min": 725 + }, + { + "epoch": 1.5278889778489457, + "grad_norm": 0.18064571046835637, + "learning_rate": 2.4082247933394414e-05, + "loss": 0.5996, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6196247935295105, + "step": 5725, + "valid_targets_mean": 15432.3, + "valid_targets_min": 379 + }, + { + "epoch": 1.5292233787029623, + "grad_norm": 0.16939114797997423, + "learning_rate": 2.3954125257883558e-05, + "loss": 0.5953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5634824633598328, + "step": 5730, + "valid_targets_mean": 16351.3, + "valid_targets_min": 783 + }, + { + "epoch": 1.530557779556979, + "grad_norm": 0.1717461062559749, + "learning_rate": 2.382627950923501e-05, + "loss": 0.5951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6182409524917603, + "step": 5735, + "valid_targets_mean": 15957.7, + "valid_targets_min": 405 + }, + { + "epoch": 1.5318921804109955, + "grad_norm": 0.1651763821054294, + "learning_rate": 2.3698711381019398e-05, + "loss": 0.5958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6126998662948608, + "step": 5740, + "valid_targets_mean": 15308.0, + "valid_targets_min": 352 + }, + { + "epoch": 1.533226581265012, + "grad_norm": 0.18787738214160157, + "learning_rate": 2.3571421565301315e-05, + "loss": 0.5852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6002779006958008, + "step": 5745, + "valid_targets_mean": 16487.5, + "valid_targets_min": 141 + }, + { + "epoch": 1.5345609821190287, + "grad_norm": 0.15003464307738298, + "learning_rate": 2.3444410752635512e-05, + "loss": 0.6006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5795835852622986, + "step": 5750, + "valid_targets_mean": 15138.5, + "valid_targets_min": 637 + }, + { + "epoch": 1.535895382973045, + "grad_norm": 0.1585655068584074, + "learning_rate": 2.331767963206302e-05, + "loss": 0.5877, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5767025947570801, + "step": 5755, + "valid_targets_mean": 15502.4, + "valid_targets_min": 35 + }, + { + "epoch": 1.5372297838270617, + "grad_norm": 0.15371045283803136, + "learning_rate": 2.319122889110763e-05, + "loss": 0.592, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5695284605026245, + "step": 5760, + "valid_targets_mean": 16759.5, + "valid_targets_min": 388 + }, + { + "epoch": 1.5385641846810783, + "grad_norm": 0.17458428014420008, + "learning_rate": 2.3065059215772057e-05, + "loss": 0.5867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6019597053527832, + "step": 5765, + "valid_targets_mean": 16116.3, + "valid_targets_min": 565 + }, + { + "epoch": 1.5398985855350946, + "grad_norm": 0.23360031742660345, + "learning_rate": 2.2939171290534127e-05, + "loss": 0.585, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5718658566474915, + "step": 5770, + "valid_targets_mean": 15808.1, + "valid_targets_min": 510 + }, + { + "epoch": 1.5412329863891112, + "grad_norm": 0.2098313727724575, + "learning_rate": 2.281356579834324e-05, + "loss": 0.5943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6123155355453491, + "step": 5775, + "valid_targets_mean": 16492.1, + "valid_targets_min": 311 + }, + { + "epoch": 1.5425673872431278, + "grad_norm": 0.21325154876376626, + "learning_rate": 2.2688243420616573e-05, + "loss": 0.5857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6063023805618286, + "step": 5780, + "valid_targets_mean": 14032.6, + "valid_targets_min": 627 + }, + { + "epoch": 1.5439017880971444, + "grad_norm": 0.18350668193667802, + "learning_rate": 2.2563204837235323e-05, + "loss": 0.6055, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6285330653190613, + "step": 5785, + "valid_targets_mean": 16362.7, + "valid_targets_min": 727 + }, + { + "epoch": 1.545236188951161, + "grad_norm": 0.22654982864260179, + "learning_rate": 2.243845072654115e-05, + "loss": 0.5776, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5971053838729858, + "step": 5790, + "valid_targets_mean": 15919.5, + "valid_targets_min": 324 + }, + { + "epoch": 1.5465705898051776, + "grad_norm": 0.18730563220805965, + "learning_rate": 2.2313981765332464e-05, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.592902660369873, + "step": 5795, + "valid_targets_mean": 15746.0, + "valid_targets_min": 482 + }, + { + "epoch": 1.5479049906591942, + "grad_norm": 0.18051058434162362, + "learning_rate": 2.2189798628860604e-05, + "loss": 0.594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5940338969230652, + "step": 5800, + "valid_targets_mean": 15031.1, + "valid_targets_min": 867 + }, + { + "epoch": 1.5492393915132106, + "grad_norm": 0.167045235586477, + "learning_rate": 2.206590199082642e-05, + "loss": 0.5893, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5510430335998535, + "step": 5805, + "valid_targets_mean": 16077.8, + "valid_targets_min": 303 + }, + { + "epoch": 1.5505737923672271, + "grad_norm": 0.1939197187907762, + "learning_rate": 2.194229252337639e-05, + "loss": 0.5924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5958045125007629, + "step": 5810, + "valid_targets_mean": 15662.2, + "valid_targets_min": 138 + }, + { + "epoch": 1.5519081932212435, + "grad_norm": 0.173011575574559, + "learning_rate": 2.181897089709913e-05, + "loss": 0.5864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6193079948425293, + "step": 5815, + "valid_targets_mean": 16200.1, + "valid_targets_min": 217 + }, + { + "epoch": 1.55324259407526, + "grad_norm": 0.14864675429494573, + "learning_rate": 2.1695937781021736e-05, + "loss": 0.5812, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5566189289093018, + "step": 5820, + "valid_targets_mean": 17615.3, + "valid_targets_min": 361 + }, + { + "epoch": 1.5545769949292767, + "grad_norm": 0.17403013700185496, + "learning_rate": 2.1573193842606007e-05, + "loss": 0.5903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.575369119644165, + "step": 5825, + "valid_targets_mean": 15289.2, + "valid_targets_min": 435 + }, + { + "epoch": 1.5559113957832933, + "grad_norm": 0.16472117596213087, + "learning_rate": 2.1450739747745034e-05, + "loss": 0.5912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6011247634887695, + "step": 5830, + "valid_targets_mean": 15707.9, + "valid_targets_min": 456 + }, + { + "epoch": 1.5572457966373099, + "grad_norm": 0.15586589372849496, + "learning_rate": 2.1328576160759486e-05, + "loss": 0.5867, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5761151313781738, + "step": 5835, + "valid_targets_mean": 15750.8, + "valid_targets_min": 444 + }, + { + "epoch": 1.5585801974913265, + "grad_norm": 0.18984736960378085, + "learning_rate": 2.1206703744393936e-05, + "loss": 0.6189, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6555172204971313, + "step": 5840, + "valid_targets_mean": 15906.1, + "valid_targets_min": 331 + }, + { + "epoch": 1.559914598345343, + "grad_norm": 0.2024767844688485, + "learning_rate": 2.1085123159813398e-05, + "loss": 0.5924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5954935550689697, + "step": 5845, + "valid_targets_mean": 15512.7, + "valid_targets_min": 636 + }, + { + "epoch": 1.5612489991993594, + "grad_norm": 0.14698357547390506, + "learning_rate": 2.0963835066599703e-05, + "loss": 0.5842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5737780332565308, + "step": 5850, + "valid_targets_mean": 16473.4, + "valid_targets_min": 485 + }, + { + "epoch": 1.562583400053376, + "grad_norm": 0.20815349745584602, + "learning_rate": 2.084284012274781e-05, + "loss": 0.6054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6138194799423218, + "step": 5855, + "valid_targets_mean": 15586.1, + "valid_targets_min": 653 + }, + { + "epoch": 1.5639178009073926, + "grad_norm": 0.1844791880337792, + "learning_rate": 2.0722138984662415e-05, + "loss": 0.5818, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.563116192817688, + "step": 5860, + "valid_targets_mean": 15610.7, + "valid_targets_min": 724 + }, + { + "epoch": 1.565252201761409, + "grad_norm": 0.16176616966994398, + "learning_rate": 2.0601732307154283e-05, + "loss": 0.5926, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6010968685150146, + "step": 5865, + "valid_targets_mean": 16884.6, + "valid_targets_min": 771 + }, + { + "epoch": 1.5665866026154256, + "grad_norm": 0.1515417804516231, + "learning_rate": 2.048162074343665e-05, + "loss": 0.5767, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5779093503952026, + "step": 5870, + "valid_targets_mean": 15809.6, + "valid_targets_min": 533 + }, + { + "epoch": 1.5679210034694422, + "grad_norm": 0.17709603738131607, + "learning_rate": 2.036180494512181e-05, + "loss": 0.5886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5752099752426147, + "step": 5875, + "valid_targets_mean": 15900.4, + "valid_targets_min": 672 + }, + { + "epoch": 1.5692554043234588, + "grad_norm": 0.15363365071776586, + "learning_rate": 2.024228556221752e-05, + "loss": 0.6043, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5751421451568604, + "step": 5880, + "valid_targets_mean": 16790.5, + "valid_targets_min": 661 + }, + { + "epoch": 1.5705898051774754, + "grad_norm": 0.14514475181042058, + "learning_rate": 2.0123063243123395e-05, + "loss": 0.5994, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5840705037117004, + "step": 5885, + "valid_targets_mean": 16916.9, + "valid_targets_min": 423 + }, + { + "epoch": 1.571924206031492, + "grad_norm": 0.16845004524499335, + "learning_rate": 2.000413863462754e-05, + "loss": 0.5866, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5833538770675659, + "step": 5890, + "valid_targets_mean": 17593.8, + "valid_targets_min": 364 + }, + { + "epoch": 1.5732586068855086, + "grad_norm": 0.1780532499338099, + "learning_rate": 1.988551238190288e-05, + "loss": 0.5792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5539240837097168, + "step": 5895, + "valid_targets_mean": 15630.7, + "valid_targets_min": 164 + }, + { + "epoch": 1.574593007739525, + "grad_norm": 0.16652297951499662, + "learning_rate": 1.9767185128503817e-05, + "loss": 0.5951, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6258705854415894, + "step": 5900, + "valid_targets_mean": 16201.0, + "valid_targets_min": 689 + }, + { + "epoch": 1.5759274085935415, + "grad_norm": 0.16054757168609174, + "learning_rate": 1.9649157516362663e-05, + "loss": 0.5988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5688210725784302, + "step": 5905, + "valid_targets_mean": 17501.1, + "valid_targets_min": 294 + }, + { + "epoch": 1.577261809447558, + "grad_norm": 0.17767923166761193, + "learning_rate": 1.953143018578607e-05, + "loss": 0.5936, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6063442826271057, + "step": 5910, + "valid_targets_mean": 15196.0, + "valid_targets_min": 429 + }, + { + "epoch": 1.5785962103015745, + "grad_norm": 0.16696992817675763, + "learning_rate": 1.9414003775451754e-05, + "loss": 0.5975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6127891540527344, + "step": 5915, + "valid_targets_mean": 15455.5, + "valid_targets_min": 590 + }, + { + "epoch": 1.579930611155591, + "grad_norm": 0.16544949042824092, + "learning_rate": 1.9296878922404868e-05, + "loss": 0.5988, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6133477091789246, + "step": 5920, + "valid_targets_mean": 15672.0, + "valid_targets_min": 624 + }, + { + "epoch": 1.5812650120096077, + "grad_norm": 0.15281722728969543, + "learning_rate": 1.9180056262054575e-05, + "loss": 0.5962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5834280252456665, + "step": 5925, + "valid_targets_mean": 16627.5, + "valid_targets_min": 653 + }, + { + "epoch": 1.5825994128636243, + "grad_norm": 0.17981677514443467, + "learning_rate": 1.9063536428170682e-05, + "loss": 0.5953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6035789251327515, + "step": 5930, + "valid_targets_mean": 15810.4, + "valid_targets_min": 307 + }, + { + "epoch": 1.5839338137176409, + "grad_norm": 0.16230505592790417, + "learning_rate": 1.8947320052880106e-05, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6399399042129517, + "step": 5935, + "valid_targets_mean": 14876.2, + "valid_targets_min": 627 + }, + { + "epoch": 1.5852682145716575, + "grad_norm": 0.18206963510342355, + "learning_rate": 1.8831407766663513e-05, + "loss": 0.6018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6215972304344177, + "step": 5940, + "valid_targets_mean": 16623.4, + "valid_targets_min": 209 + }, + { + "epoch": 1.5866026154256738, + "grad_norm": 0.15644039490129202, + "learning_rate": 1.8715800198351824e-05, + "loss": 0.5972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5751008987426758, + "step": 5945, + "valid_targets_mean": 15878.5, + "valid_targets_min": 312 + }, + { + "epoch": 1.5879370162796904, + "grad_norm": 0.13079245795628466, + "learning_rate": 1.8600497975122877e-05, + "loss": 0.5792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5741679668426514, + "step": 5950, + "valid_targets_mean": 15517.2, + "valid_targets_min": 597 + }, + { + "epoch": 1.589271417133707, + "grad_norm": 0.15528732944901663, + "learning_rate": 1.8485501722498024e-05, + "loss": 0.5942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5887077450752258, + "step": 5955, + "valid_targets_mean": 15592.5, + "valid_targets_min": 619 + }, + { + "epoch": 1.5906058179877234, + "grad_norm": 0.1635991793147494, + "learning_rate": 1.8370812064338624e-05, + "loss": 0.589, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5944458246231079, + "step": 5960, + "valid_targets_mean": 17228.2, + "valid_targets_min": 541 + }, + { + "epoch": 1.59194021884174, + "grad_norm": 0.17784795023411568, + "learning_rate": 1.8256429622842818e-05, + "loss": 0.5868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6193060874938965, + "step": 5965, + "valid_targets_mean": 16224.5, + "valid_targets_min": 468 + }, + { + "epoch": 1.5932746196957566, + "grad_norm": 0.1636364281337556, + "learning_rate": 1.814235501854206e-05, + "loss": 0.5879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5867465734481812, + "step": 5970, + "valid_targets_mean": 16228.0, + "valid_targets_min": 434 + }, + { + "epoch": 1.5946090205497732, + "grad_norm": 0.17496121191528463, + "learning_rate": 1.8028588870297774e-05, + "loss": 0.5983, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5999577045440674, + "step": 5975, + "valid_targets_mean": 14875.4, + "valid_targets_min": 534 + }, + { + "epoch": 1.5959434214037898, + "grad_norm": 0.1635867696428078, + "learning_rate": 1.7915131795297956e-05, + "loss": 0.5974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5883691310882568, + "step": 5980, + "valid_targets_mean": 17177.1, + "valid_targets_min": 580 + }, + { + "epoch": 1.5972778222578063, + "grad_norm": 0.15255090872222463, + "learning_rate": 1.7801984409053897e-05, + "loss": 0.5891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5758295655250549, + "step": 5985, + "valid_targets_mean": 16917.6, + "valid_targets_min": 597 + }, + { + "epoch": 1.598612223111823, + "grad_norm": 0.18049120683196274, + "learning_rate": 1.7689147325396822e-05, + "loss": 0.5892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6227512955665588, + "step": 5990, + "valid_targets_mean": 15918.9, + "valid_targets_min": 392 + }, + { + "epoch": 1.5999466239658393, + "grad_norm": 0.44262822676640395, + "learning_rate": 1.757662115647448e-05, + "loss": 0.6015, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6125069856643677, + "step": 5995, + "valid_targets_mean": 15745.6, + "valid_targets_min": 494 + }, + { + "epoch": 1.601281024819856, + "grad_norm": 0.16722709656486248, + "learning_rate": 1.7464406512747964e-05, + "loss": 0.5953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5720467567443848, + "step": 6000, + "valid_targets_mean": 15853.1, + "valid_targets_min": 445 + }, + { + "epoch": 1.6026154256738723, + "grad_norm": 0.17427989834524088, + "learning_rate": 1.7352504002988303e-05, + "loss": 0.5993, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6251067519187927, + "step": 6005, + "valid_targets_mean": 14854.0, + "valid_targets_min": 324 + }, + { + "epoch": 1.6039498265278889, + "grad_norm": 0.14081820776809867, + "learning_rate": 1.7240914234273126e-05, + "loss": 0.6101, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.610417366027832, + "step": 6010, + "valid_targets_mean": 16326.3, + "valid_targets_min": 464 + }, + { + "epoch": 1.6052842273819055, + "grad_norm": 0.16288453950282422, + "learning_rate": 1.7129637811983507e-05, + "loss": 0.5892, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5866801738739014, + "step": 6015, + "valid_targets_mean": 15117.6, + "valid_targets_min": 237 + }, + { + "epoch": 1.606618628235922, + "grad_norm": 0.1646206458231276, + "learning_rate": 1.7018675339800557e-05, + "loss": 0.5985, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5739710927009583, + "step": 6020, + "valid_targets_mean": 16634.2, + "valid_targets_min": 537 + }, + { + "epoch": 1.6079530290899386, + "grad_norm": 0.16128266803140606, + "learning_rate": 1.690802741970217e-05, + "loss": 0.5916, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5576621294021606, + "step": 6025, + "valid_targets_mean": 16370.4, + "valid_targets_min": 533 + }, + { + "epoch": 1.6092874299439552, + "grad_norm": 0.15110479462081494, + "learning_rate": 1.6797694651959806e-05, + "loss": 0.5843, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6075755953788757, + "step": 6030, + "valid_targets_mean": 16231.2, + "valid_targets_min": 414 + }, + { + "epoch": 1.6106218307979718, + "grad_norm": 0.15048779325112796, + "learning_rate": 1.6687677635135218e-05, + "loss": 0.6001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6099841594696045, + "step": 6035, + "valid_targets_mean": 14744.9, + "valid_targets_min": 398 + }, + { + "epoch": 1.6119562316519882, + "grad_norm": 0.14317332216610718, + "learning_rate": 1.657797696607714e-05, + "loss": 0.6013, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6132588386535645, + "step": 6040, + "valid_targets_mean": 15638.2, + "valid_targets_min": 555 + }, + { + "epoch": 1.6132906325060048, + "grad_norm": 0.16829366412089236, + "learning_rate": 1.6468593239918136e-05, + "loss": 0.6014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6245346069335938, + "step": 6045, + "valid_targets_mean": 15996.1, + "valid_targets_min": 193 + }, + { + "epoch": 1.6146250333600214, + "grad_norm": 0.16505711959570887, + "learning_rate": 1.635952705007136e-05, + "loss": 0.5872, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5829812288284302, + "step": 6050, + "valid_targets_mean": 17497.4, + "valid_targets_min": 419 + }, + { + "epoch": 1.6159594342140378, + "grad_norm": 0.15102892214056948, + "learning_rate": 1.6250778988227248e-05, + "loss": 0.606, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6144422292709351, + "step": 6055, + "valid_targets_mean": 16664.8, + "valid_targets_min": 620 + }, + { + "epoch": 1.6172938350680544, + "grad_norm": 0.13778739201523155, + "learning_rate": 1.614234964435044e-05, + "loss": 0.5827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5897339582443237, + "step": 6060, + "valid_targets_mean": 17281.9, + "valid_targets_min": 609 + }, + { + "epoch": 1.618628235922071, + "grad_norm": 0.1607951680128057, + "learning_rate": 1.603423960667645e-05, + "loss": 0.597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6235299706459045, + "step": 6065, + "valid_targets_mean": 16151.6, + "valid_targets_min": 681 + }, + { + "epoch": 1.6199626367760875, + "grad_norm": 0.13975207089816102, + "learning_rate": 1.5926449461708577e-05, + "loss": 0.6014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6146085262298584, + "step": 6070, + "valid_targets_mean": 16454.9, + "valid_targets_min": 657 + }, + { + "epoch": 1.6212970376301041, + "grad_norm": 0.13776347324920654, + "learning_rate": 1.581897979421471e-05, + "loss": 0.5997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6190211176872253, + "step": 6075, + "valid_targets_mean": 15920.2, + "valid_targets_min": 863 + }, + { + "epoch": 1.6226314384841207, + "grad_norm": 0.14646313951209627, + "learning_rate": 1.571183118722405e-05, + "loss": 0.5958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5927650928497314, + "step": 6080, + "valid_targets_mean": 15447.5, + "valid_targets_min": 369 + }, + { + "epoch": 1.6239658393381373, + "grad_norm": 0.14941326518295334, + "learning_rate": 1.5605004222024074e-05, + "loss": 0.6005, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6348234415054321, + "step": 6085, + "valid_targets_mean": 15996.3, + "valid_targets_min": 114 + }, + { + "epoch": 1.6253002401921537, + "grad_norm": 0.1730533751354215, + "learning_rate": 1.549849947815737e-05, + "loss": 0.6004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5779517292976379, + "step": 6090, + "valid_targets_mean": 15313.8, + "valid_targets_min": 702 + }, + { + "epoch": 1.6266346410461703, + "grad_norm": 0.1627881531753968, + "learning_rate": 1.5392317533418366e-05, + "loss": 0.6025, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5933674573898315, + "step": 6095, + "valid_targets_mean": 16250.2, + "valid_targets_min": 521 + }, + { + "epoch": 1.6279690419001867, + "grad_norm": 0.15670768313961111, + "learning_rate": 1.5286458963850363e-05, + "loss": 0.5856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5807504057884216, + "step": 6100, + "valid_targets_mean": 15859.4, + "valid_targets_min": 670 + }, + { + "epoch": 1.6293034427542032, + "grad_norm": 0.13926802970619206, + "learning_rate": 1.5180924343742316e-05, + "loss": 0.5891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.569827675819397, + "step": 6105, + "valid_targets_mean": 16856.4, + "valid_targets_min": 552 + }, + { + "epoch": 1.6306378436082198, + "grad_norm": 0.16598312188525904, + "learning_rate": 1.5075714245625689e-05, + "loss": 0.5782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6085491180419922, + "step": 6110, + "valid_targets_mean": 15201.6, + "valid_targets_min": 431 + }, + { + "epoch": 1.6319722444622364, + "grad_norm": 0.1458342645262622, + "learning_rate": 1.4970829240271448e-05, + "loss": 0.5857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5849499702453613, + "step": 6115, + "valid_targets_mean": 16259.1, + "valid_targets_min": 604 + }, + { + "epoch": 1.633306645316253, + "grad_norm": 0.1439106809413625, + "learning_rate": 1.4866269896686917e-05, + "loss": 0.623, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6008425951004028, + "step": 6120, + "valid_targets_mean": 16053.7, + "valid_targets_min": 379 + }, + { + "epoch": 1.6346410461702696, + "grad_norm": 0.15056600587009406, + "learning_rate": 1.4762036782112624e-05, + "loss": 0.5999, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5983825922012329, + "step": 6125, + "valid_targets_mean": 16599.0, + "valid_targets_min": 736 + }, + { + "epoch": 1.6359754470242862, + "grad_norm": 0.18809406813947385, + "learning_rate": 1.465813046201934e-05, + "loss": 0.5883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5702234506607056, + "step": 6130, + "valid_targets_mean": 16462.3, + "valid_targets_min": 532 + }, + { + "epoch": 1.6373098478783028, + "grad_norm": 0.15691191797848125, + "learning_rate": 1.4554551500104971e-05, + "loss": 0.5915, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6137266159057617, + "step": 6135, + "valid_targets_mean": 16040.9, + "valid_targets_min": 693 + }, + { + "epoch": 1.6386442487323192, + "grad_norm": 0.14355841984033843, + "learning_rate": 1.4451300458291401e-05, + "loss": 0.5957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6074045300483704, + "step": 6140, + "valid_targets_mean": 16056.3, + "valid_targets_min": 695 + }, + { + "epoch": 1.6399786495863358, + "grad_norm": 0.13679949081670345, + "learning_rate": 1.4348377896721635e-05, + "loss": 0.588, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5748726725578308, + "step": 6145, + "valid_targets_mean": 16659.3, + "valid_targets_min": 667 + }, + { + "epoch": 1.6413130504403521, + "grad_norm": 0.15897239188462342, + "learning_rate": 1.4245784373756566e-05, + "loss": 0.594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6073840856552124, + "step": 6150, + "valid_targets_mean": 14906.5, + "valid_targets_min": 395 + }, + { + "epoch": 1.6426474512943687, + "grad_norm": 0.16815252513846143, + "learning_rate": 1.4143520445972078e-05, + "loss": 0.6001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6236668229103088, + "step": 6155, + "valid_targets_mean": 15759.6, + "valid_targets_min": 578 + }, + { + "epoch": 1.6439818521483853, + "grad_norm": 0.143794484563453, + "learning_rate": 1.4041586668155989e-05, + "loss": 0.6001, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5926347374916077, + "step": 6160, + "valid_targets_mean": 16193.2, + "valid_targets_min": 494 + }, + { + "epoch": 1.645316253002402, + "grad_norm": 0.1454519692729659, + "learning_rate": 1.3939983593304992e-05, + "loss": 0.5753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5642212629318237, + "step": 6165, + "valid_targets_mean": 16872.0, + "valid_targets_min": 438 + }, + { + "epoch": 1.6466506538564185, + "grad_norm": 0.1376101516577718, + "learning_rate": 1.3838711772621743e-05, + "loss": 0.5935, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5688588619232178, + "step": 6170, + "valid_targets_mean": 15333.7, + "valid_targets_min": 565 + }, + { + "epoch": 1.647985054710435, + "grad_norm": 0.16223202014166033, + "learning_rate": 1.3737771755511811e-05, + "loss": 0.5997, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5690805912017822, + "step": 6175, + "valid_targets_mean": 15612.1, + "valid_targets_min": 23 + }, + { + "epoch": 1.6493194555644517, + "grad_norm": 0.1285767046281265, + "learning_rate": 1.3637164089580673e-05, + "loss": 0.5884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5544174313545227, + "step": 6180, + "valid_targets_mean": 17636.2, + "valid_targets_min": 203 + }, + { + "epoch": 1.650653856418468, + "grad_norm": 0.148398065035962, + "learning_rate": 1.3536889320630841e-05, + "loss": 0.5965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6234698295593262, + "step": 6185, + "valid_targets_mean": 16127.8, + "valid_targets_min": 706 + }, + { + "epoch": 1.6519882572724847, + "grad_norm": 0.14107759764387337, + "learning_rate": 1.3436947992658814e-05, + "loss": 0.58, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5890226364135742, + "step": 6190, + "valid_targets_mean": 16596.9, + "valid_targets_min": 617 + }, + { + "epoch": 1.6533226581265013, + "grad_norm": 0.16180436639057758, + "learning_rate": 1.3337340647852135e-05, + "loss": 0.594, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6033791899681091, + "step": 6195, + "valid_targets_mean": 15863.7, + "valid_targets_min": 650 + }, + { + "epoch": 1.6546570589805176, + "grad_norm": 0.1518895405995563, + "learning_rate": 1.3238067826586491e-05, + "loss": 0.5991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5961155891418457, + "step": 6200, + "valid_targets_mean": 15850.0, + "valid_targets_min": 498 + }, + { + "epoch": 1.6559914598345342, + "grad_norm": 0.17032843421286292, + "learning_rate": 1.3139130067422792e-05, + "loss": 0.5967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5981688499450684, + "step": 6205, + "valid_targets_mean": 16174.9, + "valid_targets_min": 533 + }, + { + "epoch": 1.6573258606885508, + "grad_norm": 0.15065060581950682, + "learning_rate": 1.3040527907104126e-05, + "loss": 0.6057, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5765440464019775, + "step": 6210, + "valid_targets_mean": 17820.4, + "valid_targets_min": 618 + }, + { + "epoch": 1.6586602615425674, + "grad_norm": 0.1597433167413591, + "learning_rate": 1.2942261880553012e-05, + "loss": 0.5899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5972633957862854, + "step": 6215, + "valid_targets_mean": 16479.0, + "valid_targets_min": 681 + }, + { + "epoch": 1.659994662396584, + "grad_norm": 0.15031409007903818, + "learning_rate": 1.2844332520868433e-05, + "loss": 0.5864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5601651668548584, + "step": 6220, + "valid_targets_mean": 15959.4, + "valid_targets_min": 692 + }, + { + "epoch": 1.6613290632506006, + "grad_norm": 0.14976374680290783, + "learning_rate": 1.2746740359322857e-05, + "loss": 0.5995, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6134690046310425, + "step": 6225, + "valid_targets_mean": 13893.3, + "valid_targets_min": 263 + }, + { + "epoch": 1.6626634641046172, + "grad_norm": 0.14880912909382793, + "learning_rate": 1.2649485925359514e-05, + "loss": 0.6006, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5879743099212646, + "step": 6230, + "valid_targets_mean": 15951.7, + "valid_targets_min": 787 + }, + { + "epoch": 1.6639978649586336, + "grad_norm": 0.162208271485178, + "learning_rate": 1.2552569746589386e-05, + "loss": 0.5825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6024885177612305, + "step": 6235, + "valid_targets_mean": 15375.4, + "valid_targets_min": 469 + }, + { + "epoch": 1.6653322658126501, + "grad_norm": 0.13271115663807362, + "learning_rate": 1.245599234878846e-05, + "loss": 0.5871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5827089548110962, + "step": 6240, + "valid_targets_mean": 15835.0, + "valid_targets_min": 546 + }, + { + "epoch": 1.6666666666666665, + "grad_norm": 0.12474651138273796, + "learning_rate": 1.2359754255894737e-05, + "loss": 0.5959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6084429025650024, + "step": 6245, + "valid_targets_mean": 16269.3, + "valid_targets_min": 337 + }, + { + "epoch": 1.6680010675206831, + "grad_norm": 0.1445050377364166, + "learning_rate": 1.2263855990005527e-05, + "loss": 0.6018, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5961320400238037, + "step": 6250, + "valid_targets_mean": 16289.6, + "valid_targets_min": 768 + }, + { + "epoch": 1.6693354683746997, + "grad_norm": 0.1482473852544307, + "learning_rate": 1.2168298071374543e-05, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5933790802955627, + "step": 6255, + "valid_targets_mean": 16351.3, + "valid_targets_min": 519 + }, + { + "epoch": 1.6706698692287163, + "grad_norm": 0.13539046411548533, + "learning_rate": 1.2073081018409112e-05, + "loss": 0.5883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5713330507278442, + "step": 6260, + "valid_targets_mean": 16472.3, + "valid_targets_min": 313 + }, + { + "epoch": 1.672004270082733, + "grad_norm": 0.14799011994133907, + "learning_rate": 1.1978205347667303e-05, + "loss": 0.5954, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6045159101486206, + "step": 6265, + "valid_targets_mean": 16547.1, + "valid_targets_min": 539 + }, + { + "epoch": 1.6733386709367495, + "grad_norm": 0.13725772965713526, + "learning_rate": 1.1883671573855186e-05, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5883108377456665, + "step": 6270, + "valid_targets_mean": 16727.8, + "valid_targets_min": 702 + }, + { + "epoch": 1.674673071790766, + "grad_norm": 0.13623216265241142, + "learning_rate": 1.1789480209824064e-05, + "loss": 0.5835, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5607722997665405, + "step": 6275, + "valid_targets_mean": 16476.7, + "valid_targets_min": 322 + }, + { + "epoch": 1.6760074726447824, + "grad_norm": 0.13015789908144226, + "learning_rate": 1.1695631766567562e-05, + "loss": 0.593, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5627079010009766, + "step": 6280, + "valid_targets_mean": 17736.7, + "valid_targets_min": 627 + }, + { + "epoch": 1.677341873498799, + "grad_norm": 0.1286182356071317, + "learning_rate": 1.1602126753219005e-05, + "loss": 0.5815, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5757423043251038, + "step": 6285, + "valid_targets_mean": 15710.1, + "valid_targets_min": 171 + }, + { + "epoch": 1.6786762743528156, + "grad_norm": 0.1499565174599278, + "learning_rate": 1.1508965677048585e-05, + "loss": 0.5976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5899896025657654, + "step": 6290, + "valid_targets_mean": 15419.5, + "valid_targets_min": 262 + }, + { + "epoch": 1.680010675206832, + "grad_norm": 0.16982584818577737, + "learning_rate": 1.1416149043460562e-05, + "loss": 0.5845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6001005172729492, + "step": 6295, + "valid_targets_mean": 15842.3, + "valid_targets_min": 440 + }, + { + "epoch": 1.6813450760608486, + "grad_norm": 0.14353702154030903, + "learning_rate": 1.132367735599066e-05, + "loss": 0.6126, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6028214693069458, + "step": 6300, + "valid_targets_mean": 16275.0, + "valid_targets_min": 205 + }, + { + "epoch": 1.6826794769148652, + "grad_norm": 0.1381931576513102, + "learning_rate": 1.1231551116303162e-05, + "loss": 0.6014, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.599789023399353, + "step": 6305, + "valid_targets_mean": 15538.0, + "valid_targets_min": 467 + }, + { + "epoch": 1.6840138777688818, + "grad_norm": 0.16697494527921555, + "learning_rate": 1.1139770824188334e-05, + "loss": 0.5883, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6271265745162964, + "step": 6310, + "valid_targets_mean": 16457.3, + "valid_targets_min": 567 + }, + { + "epoch": 1.6853482786228984, + "grad_norm": 0.1377080966130086, + "learning_rate": 1.1048336977559666e-05, + "loss": 0.5877, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5899460315704346, + "step": 6315, + "valid_targets_mean": 16787.1, + "valid_targets_min": 642 + }, + { + "epoch": 1.686682679476915, + "grad_norm": 0.16651128816051763, + "learning_rate": 1.0957250072451084e-05, + "loss": 0.5978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5856098532676697, + "step": 6320, + "valid_targets_mean": 15374.6, + "valid_targets_min": 547 + }, + { + "epoch": 1.6880170803309316, + "grad_norm": 0.13609784431985525, + "learning_rate": 1.0866510603014411e-05, + "loss": 0.6023, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6047021150588989, + "step": 6325, + "valid_targets_mean": 16535.2, + "valid_targets_min": 661 + }, + { + "epoch": 1.689351481184948, + "grad_norm": 0.14592184066797317, + "learning_rate": 1.0776119061516613e-05, + "loss": 0.598, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6073904037475586, + "step": 6330, + "valid_targets_mean": 16283.0, + "valid_targets_min": 651 + }, + { + "epoch": 1.6906858820389645, + "grad_norm": 0.12591510091278948, + "learning_rate": 1.0686075938337055e-05, + "loss": 0.5717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5525071620941162, + "step": 6335, + "valid_targets_mean": 16847.4, + "valid_targets_min": 599 + }, + { + "epoch": 1.692020282892981, + "grad_norm": 0.1484961336986223, + "learning_rate": 1.0596381721964984e-05, + "loss": 0.6042, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6173697710037231, + "step": 6340, + "valid_targets_mean": 14540.3, + "valid_targets_min": 564 + }, + { + "epoch": 1.6933546837469975, + "grad_norm": 0.1518980985701294, + "learning_rate": 1.0507036898996787e-05, + "loss": 0.5825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5898152589797974, + "step": 6345, + "valid_targets_mean": 16248.2, + "valid_targets_min": 655 + }, + { + "epoch": 1.694689084601014, + "grad_norm": 0.129878707444232, + "learning_rate": 1.0418041954133346e-05, + "loss": 0.5914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5593838095664978, + "step": 6350, + "valid_targets_mean": 15633.2, + "valid_targets_min": 294 + }, + { + "epoch": 1.6960234854550307, + "grad_norm": 0.132711070418758, + "learning_rate": 1.032939737017745e-05, + "loss": 0.5974, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5812194347381592, + "step": 6355, + "valid_targets_mean": 15864.6, + "valid_targets_min": 359 + }, + { + "epoch": 1.6973578863090473, + "grad_norm": 0.14825395712334374, + "learning_rate": 1.02411036280312e-05, + "loss": 0.6183, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6262049078941345, + "step": 6360, + "valid_targets_mean": 15748.1, + "valid_targets_min": 546 + }, + { + "epoch": 1.6986922871630639, + "grad_norm": 0.13486774328472748, + "learning_rate": 1.0153161206693269e-05, + "loss": 0.5929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5607184171676636, + "step": 6365, + "valid_targets_mean": 15879.1, + "valid_targets_min": 704 + }, + { + "epoch": 1.7000266880170805, + "grad_norm": 0.1531399398087951, + "learning_rate": 1.0065570583256483e-05, + "loss": 0.5928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5941235423088074, + "step": 6370, + "valid_targets_mean": 16422.2, + "valid_targets_min": 688 + }, + { + "epoch": 1.7013610888710968, + "grad_norm": 0.14345987977648245, + "learning_rate": 9.978332232905114e-06, + "loss": 0.5857, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.571819543838501, + "step": 6375, + "valid_targets_mean": 16778.1, + "valid_targets_min": 463 + }, + { + "epoch": 1.7026954897251134, + "grad_norm": 0.14740771989302237, + "learning_rate": 9.891446628912286e-06, + "loss": 0.5944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6348655223846436, + "step": 6380, + "valid_targets_mean": 14806.2, + "valid_targets_min": 91 + }, + { + "epoch": 1.70402989057913, + "grad_norm": 0.14720633715151338, + "learning_rate": 9.804914242637541e-06, + "loss": 0.5906, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5854336023330688, + "step": 6385, + "valid_targets_mean": 16334.8, + "valid_targets_min": 500 + }, + { + "epoch": 1.7053642914331464, + "grad_norm": 0.15414339297276425, + "learning_rate": 9.718735543524103e-06, + "loss": 0.5894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.585676908493042, + "step": 6390, + "valid_targets_mean": 16565.8, + "valid_targets_min": 25 + }, + { + "epoch": 1.706698692287163, + "grad_norm": 0.144630066463583, + "learning_rate": 9.632910999096486e-06, + "loss": 0.6003, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5819835066795349, + "step": 6395, + "valid_targets_mean": 16601.6, + "valid_targets_min": 609 + }, + { + "epoch": 1.7080330931411796, + "grad_norm": 0.14199837312391764, + "learning_rate": 9.547441074957884e-06, + "loss": 0.5922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5858323574066162, + "step": 6400, + "valid_targets_mean": 16673.0, + "valid_targets_min": 619 + }, + { + "epoch": 1.7093674939951962, + "grad_norm": 0.12787592866458353, + "learning_rate": 9.462326234787621e-06, + "loss": 0.5889, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5914207100868225, + "step": 6405, + "valid_targets_mean": 15893.9, + "valid_targets_min": 563 + }, + { + "epoch": 1.7107018948492128, + "grad_norm": 0.12777324318682454, + "learning_rate": 9.377566940338712e-06, + "loss": 0.6031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.604408323764801, + "step": 6410, + "valid_targets_mean": 17530.7, + "valid_targets_min": 120 + }, + { + "epoch": 1.7120362957032293, + "grad_norm": 0.13973583954593194, + "learning_rate": 9.293163651435298e-06, + "loss": 0.5884, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.582183837890625, + "step": 6415, + "valid_targets_mean": 16832.0, + "valid_targets_min": 432 + }, + { + "epoch": 1.713370696557246, + "grad_norm": 0.18585246281645018, + "learning_rate": 9.20911682597015e-06, + "loss": 0.5808, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6085513234138489, + "step": 6420, + "valid_targets_mean": 15203.5, + "valid_targets_min": 604 + }, + { + "epoch": 1.7147050974112623, + "grad_norm": 0.12632781741232604, + "learning_rate": 9.125426919902231e-06, + "loss": 0.5697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.582617998123169, + "step": 6425, + "valid_targets_mean": 16540.3, + "valid_targets_min": 710 + }, + { + "epoch": 1.716039498265279, + "grad_norm": 0.14588864430661452, + "learning_rate": 9.042094387254212e-06, + "loss": 0.5929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.588573694229126, + "step": 6430, + "valid_targets_mean": 14756.5, + "valid_targets_min": 124 + }, + { + "epoch": 1.7173738991192953, + "grad_norm": 0.14127921161289128, + "learning_rate": 8.959119680109918e-06, + "loss": 0.5859, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6098560094833374, + "step": 6435, + "valid_targets_mean": 15344.9, + "valid_targets_min": 514 + }, + { + "epoch": 1.7187082999733119, + "grad_norm": 0.12191637752010245, + "learning_rate": 8.876503248612036e-06, + "loss": 0.5943, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.594386100769043, + "step": 6440, + "valid_targets_mean": 15512.2, + "valid_targets_min": 459 + }, + { + "epoch": 1.7200427008273285, + "grad_norm": 0.13184433555587588, + "learning_rate": 8.794245540959546e-06, + "loss": 0.5937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5808385610580444, + "step": 6445, + "valid_targets_mean": 17211.4, + "valid_targets_min": 826 + }, + { + "epoch": 1.721377101681345, + "grad_norm": 0.12236297502276318, + "learning_rate": 8.712347003405304e-06, + "loss": 0.5809, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.579727828502655, + "step": 6450, + "valid_targets_mean": 15807.0, + "valid_targets_min": 630 + }, + { + "epoch": 1.7227115025353616, + "grad_norm": 0.12733970081519047, + "learning_rate": 8.630808080253701e-06, + "loss": 0.5871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5996691584587097, + "step": 6455, + "valid_targets_mean": 16812.1, + "valid_targets_min": 789 + }, + { + "epoch": 1.7240459033893782, + "grad_norm": 0.12927177044213958, + "learning_rate": 8.549629213858192e-06, + "loss": 0.591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6019003391265869, + "step": 6460, + "valid_targets_mean": 16805.8, + "valid_targets_min": 364 + }, + { + "epoch": 1.7253803042433948, + "grad_norm": 0.12821859951783265, + "learning_rate": 8.468810844618842e-06, + "loss": 0.5991, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5908550024032593, + "step": 6465, + "valid_targets_mean": 15914.5, + "valid_targets_min": 566 + }, + { + "epoch": 1.7267147050974114, + "grad_norm": 0.12463354968323265, + "learning_rate": 8.388353410980075e-06, + "loss": 0.5931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6119598150253296, + "step": 6470, + "valid_targets_mean": 16807.3, + "valid_targets_min": 448 + }, + { + "epoch": 1.7280491059514278, + "grad_norm": 0.1423546941527745, + "learning_rate": 8.308257349428154e-06, + "loss": 0.5873, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5823371410369873, + "step": 6475, + "valid_targets_mean": 16515.9, + "valid_targets_min": 533 + }, + { + "epoch": 1.7293835068054444, + "grad_norm": 0.13947593660909918, + "learning_rate": 8.228523094488928e-06, + "loss": 0.5853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6231012344360352, + "step": 6480, + "valid_targets_mean": 14861.1, + "valid_targets_min": 359 + }, + { + "epoch": 1.7307179076594608, + "grad_norm": 0.13401251190748847, + "learning_rate": 8.149151078725416e-06, + "loss": 0.6017, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6143298149108887, + "step": 6485, + "valid_targets_mean": 15608.4, + "valid_targets_min": 507 + }, + { + "epoch": 1.7320523085134774, + "grad_norm": 0.12714425848238867, + "learning_rate": 8.070141732735424e-06, + "loss": 0.5879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5799736380577087, + "step": 6490, + "valid_targets_mean": 16586.3, + "valid_targets_min": 460 + }, + { + "epoch": 1.733386709367494, + "grad_norm": 0.13113293232699752, + "learning_rate": 7.991495485149294e-06, + "loss": 0.5977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6002615690231323, + "step": 6495, + "valid_targets_mean": 15329.1, + "valid_targets_min": 865 + }, + { + "epoch": 1.7347211102215105, + "grad_norm": 0.12430560028875079, + "learning_rate": 7.913212762627539e-06, + "loss": 0.5965, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5728801488876343, + "step": 6500, + "valid_targets_mean": 16844.3, + "valid_targets_min": 480 + }, + { + "epoch": 1.7360555110755271, + "grad_norm": 0.1385872249129435, + "learning_rate": 7.835293989858527e-06, + "loss": 0.5932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5763715505599976, + "step": 6505, + "valid_targets_mean": 16026.6, + "valid_targets_min": 635 + }, + { + "epoch": 1.7373899119295437, + "grad_norm": 0.13575477026988048, + "learning_rate": 7.75773958955614e-06, + "loss": 0.5827, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5958987474441528, + "step": 6510, + "valid_targets_mean": 15166.1, + "valid_targets_min": 607 + }, + { + "epoch": 1.7387243127835603, + "grad_norm": 0.14375470702045678, + "learning_rate": 7.680549982457553e-06, + "loss": 0.5967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5804993510246277, + "step": 6515, + "valid_targets_mean": 15304.0, + "valid_targets_min": 463 + }, + { + "epoch": 1.7400587136375767, + "grad_norm": 0.13251025136148764, + "learning_rate": 7.6037255873209165e-06, + "loss": 0.604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6260999441146851, + "step": 6520, + "valid_targets_mean": 17056.7, + "valid_targets_min": 42 + }, + { + "epoch": 1.7413931144915933, + "grad_norm": 0.13207149689690997, + "learning_rate": 7.527266820923089e-06, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5891574025154114, + "step": 6525, + "valid_targets_mean": 16467.2, + "valid_targets_min": 54 + }, + { + "epoch": 1.7427275153456097, + "grad_norm": 0.12270209253540865, + "learning_rate": 7.45117409805733e-06, + "loss": 0.5928, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5965874195098877, + "step": 6530, + "valid_targets_mean": 15756.0, + "valid_targets_min": 467 + }, + { + "epoch": 1.7440619161996262, + "grad_norm": 0.14656779384139537, + "learning_rate": 7.375447831531128e-06, + "loss": 0.5901, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5620827674865723, + "step": 6535, + "valid_targets_mean": 15943.0, + "valid_targets_min": 791 + }, + { + "epoch": 1.7453963170536428, + "grad_norm": 0.12908583929661363, + "learning_rate": 7.300088432163945e-06, + "loss": 0.5914, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6227389574050903, + "step": 6540, + "valid_targets_mean": 16917.0, + "valid_targets_min": 303 + }, + { + "epoch": 1.7467307179076594, + "grad_norm": 0.140681704180509, + "learning_rate": 7.2250963087849e-06, + "loss": 0.5722, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.576507031917572, + "step": 6545, + "valid_targets_mean": 14793.1, + "valid_targets_min": 583 + }, + { + "epoch": 1.748065118761676, + "grad_norm": 0.14019687191999916, + "learning_rate": 7.1504718682306754e-06, + "loss": 0.5961, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5997872948646545, + "step": 6550, + "valid_targets_mean": 14530.4, + "valid_targets_min": 448 + }, + { + "epoch": 1.7493995196156926, + "grad_norm": 0.12345291128910027, + "learning_rate": 7.076215515343256e-06, + "loss": 0.5846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5840612649917603, + "step": 6555, + "valid_targets_mean": 15716.3, + "valid_targets_min": 255 + }, + { + "epoch": 1.7507339204697092, + "grad_norm": 0.1425058945838927, + "learning_rate": 7.0023276529676655e-06, + "loss": 0.6116, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6450003385543823, + "step": 6560, + "valid_targets_mean": 15855.2, + "valid_targets_min": 329 + }, + { + "epoch": 1.7520683213237258, + "grad_norm": 0.12452597354737815, + "learning_rate": 6.928808681949919e-06, + "loss": 0.5868, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5846118330955505, + "step": 6565, + "valid_targets_mean": 15287.1, + "valid_targets_min": 605 + }, + { + "epoch": 1.7534027221777422, + "grad_norm": 0.11444459062454918, + "learning_rate": 6.855659001134739e-06, + "loss": 0.6064, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.579085111618042, + "step": 6570, + "valid_targets_mean": 15837.1, + "valid_targets_min": 372 + }, + { + "epoch": 1.7547371230317588, + "grad_norm": 0.12798762634839495, + "learning_rate": 6.78287900736342e-06, + "loss": 0.5873, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.578317403793335, + "step": 6575, + "valid_targets_mean": 16501.7, + "valid_targets_min": 567 + }, + { + "epoch": 1.7560715238857751, + "grad_norm": 0.12134400921362967, + "learning_rate": 6.710469095471701e-06, + "loss": 0.583, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5920226573944092, + "step": 6580, + "valid_targets_mean": 17444.7, + "valid_targets_min": 266 + }, + { + "epoch": 1.7574059247397917, + "grad_norm": 0.12768102290297237, + "learning_rate": 6.638429658287603e-06, + "loss": 0.591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5544648170471191, + "step": 6585, + "valid_targets_mean": 15754.8, + "valid_targets_min": 629 + }, + { + "epoch": 1.7587403255938083, + "grad_norm": 0.1143794766814526, + "learning_rate": 6.566761086629285e-06, + "loss": 0.5869, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5953787565231323, + "step": 6590, + "valid_targets_mean": 17017.4, + "valid_targets_min": 766 + }, + { + "epoch": 1.760074726447825, + "grad_norm": 0.13194510810045934, + "learning_rate": 6.495463769302952e-06, + "loss": 0.5977, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6088513731956482, + "step": 6595, + "valid_targets_mean": 15849.3, + "valid_targets_min": 755 + }, + { + "epoch": 1.7614091273018415, + "grad_norm": 0.13380248430204805, + "learning_rate": 6.424538093100745e-06, + "loss": 0.6004, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5823229551315308, + "step": 6600, + "valid_targets_mean": 15976.0, + "valid_targets_min": 528 + }, + { + "epoch": 1.762743528155858, + "grad_norm": 0.11524897333434836, + "learning_rate": 6.353984442798582e-06, + "loss": 0.5969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5522147417068481, + "step": 6605, + "valid_targets_mean": 17450.5, + "valid_targets_min": 586 + }, + { + "epoch": 1.7640779290098747, + "grad_norm": 0.1315759288137918, + "learning_rate": 6.283803201154173e-06, + "loss": 0.5831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5800704956054688, + "step": 6610, + "valid_targets_mean": 17219.5, + "valid_targets_min": 418 + }, + { + "epoch": 1.765412329863891, + "grad_norm": 0.13343874209116965, + "learning_rate": 6.213994748904866e-06, + "loss": 0.5882, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5874321460723877, + "step": 6615, + "valid_targets_mean": 16498.7, + "valid_targets_min": 702 + }, + { + "epoch": 1.7667467307179077, + "grad_norm": 0.13166214820508826, + "learning_rate": 6.144559464765605e-06, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5657899379730225, + "step": 6620, + "valid_targets_mean": 16268.9, + "valid_targets_min": 446 + }, + { + "epoch": 1.7680811315719243, + "grad_norm": 0.14027113380235667, + "learning_rate": 6.075497725426862e-06, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6110091209411621, + "step": 6625, + "valid_targets_mean": 15386.6, + "valid_targets_min": 372 + }, + { + "epoch": 1.7694155324259406, + "grad_norm": 0.13038351513833302, + "learning_rate": 6.0068099055526505e-06, + "loss": 0.6022, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5834971070289612, + "step": 6630, + "valid_targets_mean": 16473.2, + "valid_targets_min": 552 + }, + { + "epoch": 1.7707499332799572, + "grad_norm": 0.13341949521409505, + "learning_rate": 5.938496377778395e-06, + "loss": 0.5987, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.589992880821228, + "step": 6635, + "valid_targets_mean": 15739.5, + "valid_targets_min": 682 + }, + { + "epoch": 1.7720843341339738, + "grad_norm": 0.127563718799623, + "learning_rate": 5.870557512709001e-06, + "loss": 0.5945, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5829722881317139, + "step": 6640, + "valid_targets_mean": 16187.3, + "valid_targets_min": 419 + }, + { + "epoch": 1.7734187349879904, + "grad_norm": 0.13086379830367054, + "learning_rate": 5.802993678916773e-06, + "loss": 0.6031, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5990883111953735, + "step": 6645, + "valid_targets_mean": 15799.8, + "valid_targets_min": 687 + }, + { + "epoch": 1.774753135842007, + "grad_norm": 0.1339382142200281, + "learning_rate": 5.7358052429394785e-06, + "loss": 0.5958, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5838741064071655, + "step": 6650, + "valid_targets_mean": 16166.3, + "valid_targets_min": 300 + }, + { + "epoch": 1.7760875366960236, + "grad_norm": 0.12436641926688305, + "learning_rate": 5.668992569278347e-06, + "loss": 0.5946, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6025828719139099, + "step": 6655, + "valid_targets_mean": 15163.1, + "valid_targets_min": 530 + }, + { + "epoch": 1.7774219375500402, + "grad_norm": 0.12139389266546576, + "learning_rate": 5.602556020396004e-06, + "loss": 0.5753, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5686994791030884, + "step": 6660, + "valid_targets_mean": 16358.0, + "valid_targets_min": 148 + }, + { + "epoch": 1.7787563384040566, + "grad_norm": 0.12719396458430962, + "learning_rate": 5.5364959567146514e-06, + "loss": 0.5938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5728775262832642, + "step": 6665, + "valid_targets_mean": 16011.3, + "valid_targets_min": 658 + }, + { + "epoch": 1.7800907392580732, + "grad_norm": 0.13944967945573655, + "learning_rate": 5.470812736614014e-06, + "loss": 0.5976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6120748519897461, + "step": 6670, + "valid_targets_mean": 14323.0, + "valid_targets_min": 637 + }, + { + "epoch": 1.7814251401120895, + "grad_norm": 0.12706901606619092, + "learning_rate": 5.405506716429378e-06, + "loss": 0.5907, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6091560125350952, + "step": 6675, + "valid_targets_mean": 16226.2, + "valid_targets_min": 196 + }, + { + "epoch": 1.7827595409661061, + "grad_norm": 0.11505706377936203, + "learning_rate": 5.340578250449742e-06, + "loss": 0.5768, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.558120846748352, + "step": 6680, + "valid_targets_mean": 16645.7, + "valid_targets_min": 521 + }, + { + "epoch": 1.7840939418201227, + "grad_norm": 0.12119249283018675, + "learning_rate": 5.276027690915868e-06, + "loss": 0.604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6369675397872925, + "step": 6685, + "valid_targets_mean": 16399.1, + "valid_targets_min": 380 + }, + { + "epoch": 1.7854283426741393, + "grad_norm": 0.11977714576766528, + "learning_rate": 5.211855388018282e-06, + "loss": 0.6026, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6144067049026489, + "step": 6690, + "valid_targets_mean": 16009.9, + "valid_targets_min": 765 + }, + { + "epoch": 1.786762743528156, + "grad_norm": 0.12002456110716048, + "learning_rate": 5.148061689895519e-06, + "loss": 0.6054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5942480564117432, + "step": 6695, + "valid_targets_mean": 15441.4, + "valid_targets_min": 699 + }, + { + "epoch": 1.7880971443821725, + "grad_norm": 0.12419839234916387, + "learning_rate": 5.084646942632123e-06, + "loss": 0.5845, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5599845051765442, + "step": 6700, + "valid_targets_mean": 16584.7, + "valid_targets_min": 620 + }, + { + "epoch": 1.789431545236189, + "grad_norm": 0.12276142930868597, + "learning_rate": 5.0216114902567995e-06, + "loss": 0.5873, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6189547777175903, + "step": 6705, + "valid_targets_mean": 14926.4, + "valid_targets_min": 505 + }, + { + "epoch": 1.7907659460902055, + "grad_norm": 0.11850993922110012, + "learning_rate": 4.9589556747406e-06, + "loss": 0.5838, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5783436298370361, + "step": 6710, + "valid_targets_mean": 16365.0, + "valid_targets_min": 315 + }, + { + "epoch": 1.792100346944222, + "grad_norm": 0.12343086819584895, + "learning_rate": 4.896679835994965e-06, + "loss": 0.579, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5465564131736755, + "step": 6715, + "valid_targets_mean": 16514.3, + "valid_targets_min": 169 + }, + { + "epoch": 1.7934347477982386, + "grad_norm": 0.11718639877344501, + "learning_rate": 4.834784311869985e-06, + "loss": 0.577, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5630457401275635, + "step": 6720, + "valid_targets_mean": 16447.2, + "valid_targets_min": 346 + }, + { + "epoch": 1.794769148652255, + "grad_norm": 0.12437660439211354, + "learning_rate": 4.773269438152516e-06, + "loss": 0.6021, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6006584167480469, + "step": 6725, + "valid_targets_mean": 14929.2, + "valid_targets_min": 609 + }, + { + "epoch": 1.7961035495062716, + "grad_norm": 0.11840169382440213, + "learning_rate": 4.712135548564333e-06, + "loss": 0.5739, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5946887135505676, + "step": 6730, + "valid_targets_mean": 16411.4, + "valid_targets_min": 821 + }, + { + "epoch": 1.7974379503602882, + "grad_norm": 0.11591503727537256, + "learning_rate": 4.651382974760382e-06, + "loss": 0.5972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6221188306808472, + "step": 6735, + "valid_targets_mean": 16008.2, + "valid_targets_min": 437 + }, + { + "epoch": 1.7987723512143048, + "grad_norm": 0.12495184922741498, + "learning_rate": 4.591012046326944e-06, + "loss": 0.5844, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6207176446914673, + "step": 6740, + "valid_targets_mean": 15785.4, + "valid_targets_min": 679 + }, + { + "epoch": 1.8001067520683214, + "grad_norm": 0.11777234439275203, + "learning_rate": 4.5310230907798285e-06, + "loss": 0.5912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5886247158050537, + "step": 6745, + "valid_targets_mean": 15777.8, + "valid_targets_min": 261 + }, + { + "epoch": 1.801441152922338, + "grad_norm": 0.13310005646330186, + "learning_rate": 4.471416433562638e-06, + "loss": 0.5864, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6195192337036133, + "step": 6750, + "valid_targets_mean": 16042.3, + "valid_targets_min": 728 + }, + { + "epoch": 1.8027755537763546, + "grad_norm": 0.3573687288701633, + "learning_rate": 4.412192398044997e-06, + "loss": 0.5825, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.547378420829773, + "step": 6755, + "valid_targets_mean": 16194.8, + "valid_targets_min": 22 + }, + { + "epoch": 1.804109954630371, + "grad_norm": 0.12228667808737118, + "learning_rate": 4.353351305520747e-06, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.615507185459137, + "step": 6760, + "valid_targets_mean": 17472.8, + "valid_targets_min": 639 + }, + { + "epoch": 1.8054443554843875, + "grad_norm": 0.12032619569895683, + "learning_rate": 4.2948934752062655e-06, + "loss": 0.6047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5853080749511719, + "step": 6765, + "valid_targets_mean": 17070.5, + "valid_targets_min": 516 + }, + { + "epoch": 1.806778756338404, + "grad_norm": 0.12726124020104732, + "learning_rate": 4.2368192242387355e-06, + "loss": 0.5978, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6125775575637817, + "step": 6770, + "valid_targets_mean": 14640.3, + "valid_targets_min": 333 + }, + { + "epoch": 1.8081131571924205, + "grad_norm": 0.1268406765012243, + "learning_rate": 4.179128867674348e-06, + "loss": 0.5728, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5960764288902283, + "step": 6775, + "valid_targets_mean": 17594.2, + "valid_targets_min": 261 + }, + { + "epoch": 1.809447558046437, + "grad_norm": 0.13020025506897828, + "learning_rate": 4.121822718486664e-06, + "loss": 0.5937, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5955917835235596, + "step": 6780, + "valid_targets_mean": 15496.2, + "valid_targets_min": 484 + }, + { + "epoch": 1.8107819589004537, + "grad_norm": 0.13462347960359008, + "learning_rate": 4.064901087564918e-06, + "loss": 0.6062, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6180999279022217, + "step": 6785, + "valid_targets_mean": 14829.8, + "valid_targets_min": 748 + }, + { + "epoch": 1.8121163597544703, + "grad_norm": 0.12520707920034008, + "learning_rate": 4.008364283712298e-06, + "loss": 0.5764, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6032578945159912, + "step": 6790, + "valid_targets_mean": 15743.1, + "valid_targets_min": 794 + }, + { + "epoch": 1.8134507606084869, + "grad_norm": 0.12153868786431792, + "learning_rate": 3.9522126136442515e-06, + "loss": 0.5842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5904735326766968, + "step": 6795, + "valid_targets_mean": 17683.8, + "valid_targets_min": 700 + }, + { + "epoch": 1.8147851614625035, + "grad_norm": 0.13380932238576912, + "learning_rate": 3.896446381986901e-06, + "loss": 0.5886, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5878794193267822, + "step": 6800, + "valid_targets_mean": 15747.5, + "valid_targets_min": 24 + }, + { + "epoch": 1.8161195623165198, + "grad_norm": 0.11363090802399065, + "learning_rate": 3.841065891275328e-06, + "loss": 0.5814, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5766637921333313, + "step": 6805, + "valid_targets_mean": 16026.2, + "valid_targets_min": 312 + }, + { + "epoch": 1.8174539631705364, + "grad_norm": 0.11903433960083935, + "learning_rate": 3.786071441951918e-06, + "loss": 0.5715, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5726655125617981, + "step": 6810, + "valid_targets_mean": 14966.9, + "valid_targets_min": 474 + }, + { + "epoch": 1.818788364024553, + "grad_norm": 0.10999529624986326, + "learning_rate": 3.7314633323647952e-06, + "loss": 0.599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5864944458007812, + "step": 6815, + "valid_targets_mean": 15981.9, + "valid_targets_min": 424 + }, + { + "epoch": 1.8201227648785694, + "grad_norm": 0.11513842609934516, + "learning_rate": 3.6772418587661474e-06, + "loss": 0.5895, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6018288135528564, + "step": 6820, + "valid_targets_mean": 16233.4, + "valid_targets_min": 612 + }, + { + "epoch": 1.821457165732586, + "grad_norm": 0.126039895611612, + "learning_rate": 3.623407315310667e-06, + "loss": 0.6095, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6270237565040588, + "step": 6825, + "valid_targets_mean": 15310.5, + "valid_targets_min": 510 + }, + { + "epoch": 1.8227915665866026, + "grad_norm": 0.1215457476544879, + "learning_rate": 3.5699599940538836e-06, + "loss": 0.5932, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5928213596343994, + "step": 6830, + "valid_targets_mean": 15371.1, + "valid_targets_min": 644 + }, + { + "epoch": 1.8241259674406192, + "grad_norm": 0.12623056542560115, + "learning_rate": 3.5169001849506496e-06, + "loss": 0.6144, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6307641863822937, + "step": 6835, + "valid_targets_mean": 15279.9, + "valid_targets_min": 545 + }, + { + "epoch": 1.8254603682946358, + "grad_norm": 0.11249761749010688, + "learning_rate": 3.4642281758535645e-06, + "loss": 0.5942, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5592288970947266, + "step": 6840, + "valid_targets_mean": 16210.7, + "valid_targets_min": 705 + }, + { + "epoch": 1.8267947691486524, + "grad_norm": 0.1098951823272564, + "learning_rate": 3.4119442525113283e-06, + "loss": 0.5938, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5647261738777161, + "step": 6845, + "valid_targets_mean": 15996.9, + "valid_targets_min": 517 + }, + { + "epoch": 1.828129170002669, + "grad_norm": 0.12384781447849601, + "learning_rate": 3.3600486985673163e-06, + "loss": 0.5848, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6426936388015747, + "step": 6850, + "valid_targets_mean": 14943.6, + "valid_targets_min": 753 + }, + { + "epoch": 1.8294635708566853, + "grad_norm": 0.13195995027485155, + "learning_rate": 3.308541795557948e-06, + "loss": 0.5941, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6188579201698303, + "step": 6855, + "valid_targets_mean": 14683.0, + "valid_targets_min": 586 + }, + { + "epoch": 1.830797971710702, + "grad_norm": 0.125628185782131, + "learning_rate": 3.2574238229111704e-06, + "loss": 0.5902, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5590197443962097, + "step": 6860, + "valid_targets_mean": 15653.1, + "valid_targets_min": 548 + }, + { + "epoch": 1.8321323725647183, + "grad_norm": 0.12472682756940785, + "learning_rate": 3.2066950579450024e-06, + "loss": 0.582, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5600212812423706, + "step": 6865, + "valid_targets_mean": 16062.4, + "valid_targets_min": 61 + }, + { + "epoch": 1.8334667734187349, + "grad_norm": 0.12207900265083974, + "learning_rate": 3.156355775865968e-06, + "loss": 0.5792, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5914990305900574, + "step": 6870, + "valid_targets_mean": 15910.1, + "valid_targets_min": 278 + }, + { + "epoch": 1.8348011742727515, + "grad_norm": 0.13258139999974625, + "learning_rate": 3.106406249767607e-06, + "loss": 0.5816, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.591293215751648, + "step": 6875, + "valid_targets_mean": 15699.3, + "valid_targets_min": 588 + }, + { + "epoch": 1.836135575126768, + "grad_norm": 0.1160461192943085, + "learning_rate": 3.056846750629041e-06, + "loss": 0.604, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5780788660049438, + "step": 6880, + "valid_targets_mean": 16653.1, + "valid_targets_min": 501 + }, + { + "epoch": 1.8374699759807847, + "grad_norm": 0.11635703270079688, + "learning_rate": 3.007677547313436e-06, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5911270380020142, + "step": 6885, + "valid_targets_mean": 16261.6, + "valid_targets_min": 799 + }, + { + "epoch": 1.8388043768348012, + "grad_norm": 0.10977172189530393, + "learning_rate": 2.958898906566626e-06, + "loss": 0.5962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5859546065330505, + "step": 6890, + "valid_targets_mean": 16357.7, + "valid_targets_min": 408 + }, + { + "epoch": 1.8401387776888178, + "grad_norm": 0.11719525454631909, + "learning_rate": 2.910511093015588e-06, + "loss": 0.5975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6086652278900146, + "step": 6895, + "valid_targets_mean": 15757.9, + "valid_targets_min": 643 + }, + { + "epoch": 1.8414731785428344, + "grad_norm": 0.12906155929183688, + "learning_rate": 2.8625143691670404e-06, + "loss": 0.5879, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6210035085678101, + "step": 6900, + "valid_targets_mean": 14412.2, + "valid_targets_min": 431 + }, + { + "epoch": 1.8428075793968508, + "grad_norm": 0.12002678379642992, + "learning_rate": 2.8149089954060287e-06, + "loss": 0.5852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5683364868164062, + "step": 6905, + "valid_targets_mean": 15993.1, + "valid_targets_min": 199 + }, + { + "epoch": 1.8441419802508674, + "grad_norm": 0.11656843705780746, + "learning_rate": 2.767695229994507e-06, + "loss": 0.6108, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6220520734786987, + "step": 6910, + "valid_targets_mean": 17196.1, + "valid_targets_min": 479 + }, + { + "epoch": 1.8454763811048838, + "grad_norm": 0.10599874066792718, + "learning_rate": 2.720873329069895e-06, + "loss": 0.5894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5496461391448975, + "step": 6915, + "valid_targets_mean": 17237.9, + "valid_targets_min": 595 + }, + { + "epoch": 1.8468107819589004, + "grad_norm": 0.11867440275148777, + "learning_rate": 2.6744435466437535e-06, + "loss": 0.5904, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6073455214500427, + "step": 6920, + "valid_targets_mean": 14592.5, + "valid_targets_min": 104 + }, + { + "epoch": 1.848145182812917, + "grad_norm": 0.10484802668554907, + "learning_rate": 2.6284061346004055e-06, + "loss": 0.5878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5743545889854431, + "step": 6925, + "valid_targets_mean": 16563.4, + "valid_targets_min": 383 + }, + { + "epoch": 1.8494795836669335, + "grad_norm": 0.11758213812901547, + "learning_rate": 2.5827613426954664e-06, + "loss": 0.5966, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6080979108810425, + "step": 6930, + "valid_targets_mean": 14695.3, + "valid_targets_min": 567 + }, + { + "epoch": 1.8508139845209501, + "grad_norm": 0.1232609498682966, + "learning_rate": 2.537509418554631e-06, + "loss": 0.5922, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5918781757354736, + "step": 6935, + "valid_targets_mean": 15298.3, + "valid_targets_min": 490 + }, + { + "epoch": 1.8521483853749667, + "grad_norm": 0.15512351459385357, + "learning_rate": 2.4926506076722417e-06, + "loss": 0.599, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5890061259269714, + "step": 6940, + "valid_targets_mean": 15713.8, + "valid_targets_min": 646 + }, + { + "epoch": 1.8534827862289833, + "grad_norm": 0.11156936934072108, + "learning_rate": 2.4481851534099707e-06, + "loss": 0.5852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5654975175857544, + "step": 6945, + "valid_targets_mean": 15386.7, + "valid_targets_min": 571 + }, + { + "epoch": 1.8548171870829997, + "grad_norm": 0.12304603218916753, + "learning_rate": 2.404113296995505e-06, + "loss": 0.6024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5728027820587158, + "step": 6950, + "valid_targets_mean": 15505.8, + "valid_targets_min": 659 + }, + { + "epoch": 1.8561515879370163, + "grad_norm": 0.11534915665069846, + "learning_rate": 2.360435277521275e-06, + "loss": 0.59, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5883013606071472, + "step": 6955, + "valid_targets_mean": 16474.5, + "valid_targets_min": 122 + }, + { + "epoch": 1.8574859887910327, + "grad_norm": 0.12014463570615995, + "learning_rate": 2.3171513319430596e-06, + "loss": 0.6038, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6192582845687866, + "step": 6960, + "valid_targets_mean": 14878.8, + "valid_targets_min": 459 + }, + { + "epoch": 1.8588203896450493, + "grad_norm": 0.10774896921661002, + "learning_rate": 2.274261695078841e-06, + "loss": 0.5971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5748175382614136, + "step": 6965, + "valid_targets_mean": 17166.3, + "valid_targets_min": 716 + }, + { + "epoch": 1.8601547904990658, + "grad_norm": 0.1078641120068596, + "learning_rate": 2.231766599607371e-06, + "loss": 0.5697, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5333196520805359, + "step": 6970, + "valid_targets_mean": 15537.1, + "valid_targets_min": 690 + }, + { + "epoch": 1.8614891913530824, + "grad_norm": 0.11864787077881608, + "learning_rate": 2.1896662760670618e-06, + "loss": 0.591, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6141413450241089, + "step": 6975, + "valid_targets_mean": 16036.9, + "valid_targets_min": 294 + }, + { + "epoch": 1.862823592207099, + "grad_norm": 0.11136294506461766, + "learning_rate": 2.1479609528546328e-06, + "loss": 0.5952, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5849490165710449, + "step": 6980, + "valid_targets_mean": 16131.3, + "valid_targets_min": 751 + }, + { + "epoch": 1.8641579930611156, + "grad_norm": 0.11410952923157061, + "learning_rate": 2.106650856223899e-06, + "loss": 0.5975, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5867966413497925, + "step": 6985, + "valid_targets_mean": 16985.9, + "valid_targets_min": 876 + }, + { + "epoch": 1.8654923939151322, + "grad_norm": 0.1128290098107921, + "learning_rate": 2.0657362102845576e-06, + "loss": 0.5847, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5945344567298889, + "step": 6990, + "valid_targets_mean": 14839.8, + "valid_targets_min": 673 + }, + { + "epoch": 1.8668267947691488, + "grad_norm": 0.11045443610042519, + "learning_rate": 2.0252172370009646e-06, + "loss": 0.5717, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5728679895401001, + "step": 6995, + "valid_targets_mean": 16231.9, + "valid_targets_min": 589 + }, + { + "epoch": 1.8681611956231652, + "grad_norm": 0.11519466042156558, + "learning_rate": 1.985094156190925e-06, + "loss": 0.6034, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.58236163854599, + "step": 7000, + "valid_targets_mean": 16598.3, + "valid_targets_min": 355 + }, + { + "epoch": 1.8694955964771818, + "grad_norm": 0.12345773340208867, + "learning_rate": 1.9453671855244963e-06, + "loss": 0.5913, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5991541147232056, + "step": 7005, + "valid_targets_mean": 16407.8, + "valid_targets_min": 662 + }, + { + "epoch": 1.8708299973311981, + "grad_norm": 0.11577989709027653, + "learning_rate": 1.906036540522829e-06, + "loss": 0.5972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6317030787467957, + "step": 7010, + "valid_targets_mean": 15361.4, + "valid_targets_min": 544 + }, + { + "epoch": 1.8721643981852147, + "grad_norm": 0.11308467546031899, + "learning_rate": 1.8671024345569773e-06, + "loss": 0.5984, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6096479296684265, + "step": 7015, + "valid_targets_mean": 16363.6, + "valid_targets_min": 699 + }, + { + "epoch": 1.8734987990392313, + "grad_norm": 0.10830315239475957, + "learning_rate": 1.8285650788467415e-06, + "loss": 0.5821, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5622441172599792, + "step": 7020, + "valid_targets_mean": 16065.3, + "valid_targets_min": 482 + }, + { + "epoch": 1.874833199893248, + "grad_norm": 0.11724510320410304, + "learning_rate": 1.7904246824595514e-06, + "loss": 0.5909, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5891350507736206, + "step": 7025, + "valid_targets_mean": 16113.2, + "valid_targets_min": 778 + }, + { + "epoch": 1.8761676007472645, + "grad_norm": 0.1148792581953953, + "learning_rate": 1.7526814523092763e-06, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6323190927505493, + "step": 7030, + "valid_targets_mean": 14901.9, + "valid_targets_min": 642 + }, + { + "epoch": 1.8775020016012811, + "grad_norm": 0.11797792259985213, + "learning_rate": 1.7153355931551592e-06, + "loss": 0.6158, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6224967241287231, + "step": 7035, + "valid_targets_mean": 15057.5, + "valid_targets_min": 605 + }, + { + "epoch": 1.8788364024552977, + "grad_norm": 0.1260175985764918, + "learning_rate": 1.678387307600676e-06, + "loss": 0.6037, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5865051746368408, + "step": 7040, + "valid_targets_mean": 15720.0, + "valid_targets_min": 510 + }, + { + "epoch": 1.880170803309314, + "grad_norm": 0.1067135636134446, + "learning_rate": 1.6418367960924271e-06, + "loss": 0.5846, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.580804705619812, + "step": 7045, + "valid_targets_mean": 15797.4, + "valid_targets_min": 478 + }, + { + "epoch": 1.8815052041633307, + "grad_norm": 0.10174351633184524, + "learning_rate": 1.6056842569190987e-06, + "loss": 0.5923, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5535533428192139, + "step": 7050, + "valid_targets_mean": 16996.6, + "valid_targets_min": 667 + }, + { + "epoch": 1.8828396050173473, + "grad_norm": 0.11244985512618108, + "learning_rate": 1.5699298862103276e-06, + "loss": 0.5891, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5968772172927856, + "step": 7055, + "valid_targets_mean": 16006.3, + "valid_targets_min": 383 + }, + { + "epoch": 1.8841740058713636, + "grad_norm": 0.11948717366431685, + "learning_rate": 1.5345738779356714e-06, + "loss": 0.6002, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6243698596954346, + "step": 7060, + "valid_targets_mean": 15559.3, + "valid_targets_min": 714 + }, + { + "epoch": 1.8855084067253802, + "grad_norm": 0.11580752047329682, + "learning_rate": 1.4996164239035408e-06, + "loss": 0.5748, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5642666816711426, + "step": 7065, + "valid_targets_mean": 15481.2, + "valid_targets_min": 735 + }, + { + "epoch": 1.8868428075793968, + "grad_norm": 0.10485005764097419, + "learning_rate": 1.4650577137601843e-06, + "loss": 0.5957, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5874780416488647, + "step": 7070, + "valid_targets_mean": 15717.2, + "valid_targets_min": 850 + }, + { + "epoch": 1.8881772084334134, + "grad_norm": 0.10417353191360103, + "learning_rate": 1.4308979349886146e-06, + "loss": 0.5924, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6178035736083984, + "step": 7075, + "valid_targets_mean": 17092.7, + "valid_targets_min": 778 + }, + { + "epoch": 1.88951160928743, + "grad_norm": 0.1058447762736142, + "learning_rate": 1.3971372729076503e-06, + "loss": 0.6024, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6247731447219849, + "step": 7080, + "valid_targets_mean": 15420.1, + "valid_targets_min": 713 + }, + { + "epoch": 1.8908460101414466, + "grad_norm": 0.10652874154039586, + "learning_rate": 1.3637759106708501e-06, + "loss": 0.5972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5917098522186279, + "step": 7085, + "valid_targets_mean": 16516.3, + "valid_targets_min": 553 + }, + { + "epoch": 1.8921804109954632, + "grad_norm": 0.10799915454444874, + "learning_rate": 1.3308140292655645e-06, + "loss": 0.58, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5906647443771362, + "step": 7090, + "valid_targets_mean": 16697.9, + "valid_targets_min": 344 + }, + { + "epoch": 1.8935148118494796, + "grad_norm": 0.11981808776170194, + "learning_rate": 1.2982518075119352e-06, + "loss": 0.5763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6170154809951782, + "step": 7095, + "valid_targets_mean": 15495.0, + "valid_targets_min": 146 + }, + { + "epoch": 1.8948492127034962, + "grad_norm": 0.11486360410426957, + "learning_rate": 1.2660894220619139e-06, + "loss": 0.595, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6035982370376587, + "step": 7100, + "valid_targets_mean": 16467.9, + "valid_targets_min": 593 + }, + { + "epoch": 1.8961836135575125, + "grad_norm": 0.10499519888203847, + "learning_rate": 1.2343270473983286e-06, + "loss": 0.597, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5793255567550659, + "step": 7105, + "valid_targets_mean": 16619.4, + "valid_targets_min": 537 + }, + { + "epoch": 1.8975180144115291, + "grad_norm": 0.12478283596005901, + "learning_rate": 1.202964855833935e-06, + "loss": 0.5831, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5687292814254761, + "step": 7110, + "valid_targets_mean": 15931.3, + "valid_targets_min": 570 + }, + { + "epoch": 1.8988524152655457, + "grad_norm": 0.10846084952146565, + "learning_rate": 1.1720030175104506e-06, + "loss": 0.5972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5962158441543579, + "step": 7115, + "valid_targets_mean": 16200.3, + "valid_targets_min": 478 + }, + { + "epoch": 1.9001868161195623, + "grad_norm": 0.11149955520672268, + "learning_rate": 1.1414417003976634e-06, + "loss": 0.5787, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.565889835357666, + "step": 7120, + "valid_targets_mean": 16230.9, + "valid_targets_min": 701 + }, + { + "epoch": 1.901521216973579, + "grad_norm": 0.09727284712006973, + "learning_rate": 1.1112810702925163e-06, + "loss": 0.5852, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5637081265449524, + "step": 7125, + "valid_targets_mean": 17315.3, + "valid_targets_min": 544 + }, + { + "epoch": 1.9028556178275955, + "grad_norm": 0.11391246609885147, + "learning_rate": 1.0815212908181825e-06, + "loss": 0.584, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5784386396408081, + "step": 7130, + "valid_targets_mean": 16232.3, + "valid_targets_min": 388 + }, + { + "epoch": 1.904190018681612, + "grad_norm": 0.10947631191296657, + "learning_rate": 1.0521625234232333e-06, + "loss": 0.5959, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6112264394760132, + "step": 7135, + "valid_targets_mean": 15190.9, + "valid_targets_min": 303 + }, + { + "epoch": 1.9055244195356285, + "grad_norm": 0.11228511943247846, + "learning_rate": 1.023204927380672e-06, + "loss": 0.6016, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5891322493553162, + "step": 7140, + "valid_targets_mean": 16496.0, + "valid_targets_min": 493 + }, + { + "epoch": 1.906858820389645, + "grad_norm": 0.10335632580031771, + "learning_rate": 9.946486597871672e-07, + "loss": 0.5931, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5750100612640381, + "step": 7145, + "valid_targets_mean": 16288.6, + "valid_targets_min": 337 + }, + { + "epoch": 1.9081932212436616, + "grad_norm": 0.10643300666622367, + "learning_rate": 9.664938755621632e-07, + "loss": 0.5861, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6035852432250977, + "step": 7150, + "valid_targets_mean": 15821.4, + "valid_targets_min": 343 + }, + { + "epoch": 1.909527622097678, + "grad_norm": 0.10814021288570172, + "learning_rate": 9.387407274469793e-07, + "loss": 0.5903, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5945829153060913, + "step": 7155, + "valid_targets_mean": 16528.9, + "valid_targets_min": 181 + }, + { + "epoch": 1.9108620229516946, + "grad_norm": 0.10771079524688575, + "learning_rate": 9.113893660041033e-07, + "loss": 0.5876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5860378742218018, + "step": 7160, + "valid_targets_mean": 15851.9, + "valid_targets_min": 530 + }, + { + "epoch": 1.9121964238057112, + "grad_norm": 0.10426780320770314, + "learning_rate": 8.844399396162577e-07, + "loss": 0.5817, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5573742389678955, + "step": 7165, + "valid_targets_mean": 16035.7, + "valid_targets_min": 576 + }, + { + "epoch": 1.9135308246597278, + "grad_norm": 0.11271184825740115, + "learning_rate": 8.578925944856596e-07, + "loss": 0.6009, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.607288122177124, + "step": 7170, + "valid_targets_mean": 16248.8, + "valid_targets_min": 883 + }, + { + "epoch": 1.9148652255137444, + "grad_norm": 0.10539783629888545, + "learning_rate": 8.317474746332126e-07, + "loss": 0.5763, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5683166980743408, + "step": 7175, + "valid_targets_mean": 16696.4, + "valid_targets_min": 464 + }, + { + "epoch": 1.916199626367761, + "grad_norm": 0.11251688734146195, + "learning_rate": 8.060047218977323e-07, + "loss": 0.5944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5919359922409058, + "step": 7180, + "valid_targets_mean": 15508.2, + "valid_targets_min": 299 + }, + { + "epoch": 1.9175340272217776, + "grad_norm": 0.11077719358664008, + "learning_rate": 7.806644759351471e-07, + "loss": 0.5917, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6042367219924927, + "step": 7185, + "valid_targets_mean": 16469.2, + "valid_targets_min": 608 + }, + { + "epoch": 1.918868428075794, + "grad_norm": 0.10978081665948485, + "learning_rate": 7.557268742177908e-07, + "loss": 0.5953, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5959744453430176, + "step": 7190, + "valid_targets_mean": 15302.7, + "valid_targets_min": 699 + }, + { + "epoch": 1.9202028289298105, + "grad_norm": 0.11271598718073285, + "learning_rate": 7.311920520336106e-07, + "loss": 0.5895, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6039493083953857, + "step": 7195, + "valid_targets_mean": 15806.0, + "valid_targets_min": 681 + }, + { + "epoch": 1.921537229783827, + "grad_norm": 0.09979538157727764, + "learning_rate": 7.070601424854522e-07, + "loss": 0.5909, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5759025812149048, + "step": 7200, + "valid_targets_mean": 17470.4, + "valid_targets_min": 650 + }, + { + "epoch": 1.9228716306378435, + "grad_norm": 0.11197812099612356, + "learning_rate": 6.833312764903343e-07, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6100215911865234, + "step": 7205, + "valid_targets_mean": 16637.7, + "valid_targets_min": 523 + }, + { + "epoch": 1.92420603149186, + "grad_norm": 0.11349120819192293, + "learning_rate": 6.600055827787581e-07, + "loss": 0.5888, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5917244553565979, + "step": 7210, + "valid_targets_mean": 15618.0, + "valid_targets_min": 571 + }, + { + "epoch": 1.9255404323458767, + "grad_norm": 0.10606001203762529, + "learning_rate": 6.370831878939747e-07, + "loss": 0.6123, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6029739379882812, + "step": 7215, + "valid_targets_mean": 16360.1, + "valid_targets_min": 539 + }, + { + "epoch": 1.9268748331998933, + "grad_norm": 0.11101483061117472, + "learning_rate": 6.1456421619131e-07, + "loss": 0.5789, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.590622067451477, + "step": 7220, + "valid_targets_mean": 14537.4, + "valid_targets_min": 532 + }, + { + "epoch": 1.9282092340539099, + "grad_norm": 0.10746309454661468, + "learning_rate": 5.924487898375158e-07, + "loss": 0.5894, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.610184907913208, + "step": 7225, + "valid_targets_mean": 15415.4, + "valid_targets_min": 471 + }, + { + "epoch": 1.9295436349079265, + "grad_norm": 0.10496606126519877, + "learning_rate": 5.707370288100782e-07, + "loss": 0.6039, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6027356386184692, + "step": 7230, + "valid_targets_mean": 16612.8, + "valid_targets_min": 429 + }, + { + "epoch": 1.9308780357619428, + "grad_norm": 0.12280401202824656, + "learning_rate": 5.494290508965605e-07, + "loss": 0.6047, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6241533756256104, + "step": 7235, + "valid_targets_mean": 14704.9, + "valid_targets_min": 454 + }, + { + "epoch": 1.9322124366159594, + "grad_norm": 0.10418094491281422, + "learning_rate": 5.285249716940026e-07, + "loss": 0.5834, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5590264201164246, + "step": 7240, + "valid_targets_mean": 17070.4, + "valid_targets_min": 516 + }, + { + "epoch": 1.933546837469976, + "grad_norm": 0.10925989299981413, + "learning_rate": 5.080249046082563e-07, + "loss": 0.5967, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6061210036277771, + "step": 7245, + "valid_targets_mean": 15973.7, + "valid_targets_min": 230 + }, + { + "epoch": 1.9348812383239924, + "grad_norm": 0.1038167631296208, + "learning_rate": 4.879289608533926e-07, + "loss": 0.6052, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5867657661437988, + "step": 7250, + "valid_targets_mean": 16210.0, + "valid_targets_min": 368 + }, + { + "epoch": 1.936215639178009, + "grad_norm": 0.10564140231065966, + "learning_rate": 4.6823724945107e-07, + "loss": 0.5865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5992836952209473, + "step": 7255, + "valid_targets_mean": 15896.8, + "valid_targets_min": 542 + }, + { + "epoch": 1.9375500400320256, + "grad_norm": 0.10121772563289091, + "learning_rate": 4.489498772299843e-07, + "loss": 0.5955, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5765215158462524, + "step": 7260, + "valid_targets_mean": 16066.0, + "valid_targets_min": 413 + }, + { + "epoch": 1.9388844408860422, + "grad_norm": 0.10685783716605916, + "learning_rate": 4.3006694882526947e-07, + "loss": 0.5929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5946753025054932, + "step": 7265, + "valid_targets_mean": 16010.7, + "valid_targets_min": 650 + }, + { + "epoch": 1.9402188417400588, + "grad_norm": 0.11537038648261387, + "learning_rate": 4.115885666779062e-07, + "loss": 0.5921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6231012344360352, + "step": 7270, + "valid_targets_mean": 15111.9, + "valid_targets_min": 675 + }, + { + "epoch": 1.9415532425940754, + "grad_norm": 0.10414761108882142, + "learning_rate": 3.9351483103420566e-07, + "loss": 0.5803, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5548113584518433, + "step": 7275, + "valid_targets_mean": 17432.2, + "valid_targets_min": 592 + }, + { + "epoch": 1.942887643448092, + "grad_norm": 0.10200057372451578, + "learning_rate": 3.758458399452519e-07, + "loss": 0.5856, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5601938962936401, + "step": 7280, + "valid_targets_mean": 16905.9, + "valid_targets_min": 193 + }, + { + "epoch": 1.9442220443021083, + "grad_norm": 0.10194804058111612, + "learning_rate": 3.585816892663351e-07, + "loss": 0.5865, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5662258863449097, + "step": 7285, + "valid_targets_mean": 16372.1, + "valid_targets_min": 483 + }, + { + "epoch": 1.945556445156125, + "grad_norm": 0.10425651405329209, + "learning_rate": 3.4172247265650267e-07, + "loss": 0.5944, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5972768664360046, + "step": 7290, + "valid_targets_mean": 15505.5, + "valid_targets_min": 326 + }, + { + "epoch": 1.9468908460101413, + "grad_norm": 0.10652966361544959, + "learning_rate": 3.252682815779922e-07, + "loss": 0.5971, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5889468789100647, + "step": 7295, + "valid_targets_mean": 15443.7, + "valid_targets_min": 320 + }, + { + "epoch": 1.9482252468641579, + "grad_norm": 0.10225399193367106, + "learning_rate": 3.0921920529574096e-07, + "loss": 0.5976, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6094781756401062, + "step": 7300, + "valid_targets_mean": 16137.0, + "valid_targets_min": 412 + }, + { + "epoch": 1.9495596477181745, + "grad_norm": 0.1058290729172914, + "learning_rate": 2.9357533087694397e-07, + "loss": 0.59, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6034204959869385, + "step": 7305, + "valid_targets_mean": 15746.1, + "valid_targets_min": 716 + }, + { + "epoch": 1.950894048572191, + "grad_norm": 0.09901387339508871, + "learning_rate": 2.7833674319052977e-07, + "loss": 0.5876, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5842059254646301, + "step": 7310, + "valid_targets_mean": 16711.1, + "valid_targets_min": 740 + }, + { + "epoch": 1.9522284494262077, + "grad_norm": 0.1028355506347445, + "learning_rate": 2.6350352490672746e-07, + "loss": 0.5919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6164946556091309, + "step": 7315, + "valid_targets_mean": 15863.6, + "valid_targets_min": 442 + }, + { + "epoch": 1.9535628502802243, + "grad_norm": 0.11315707367960545, + "learning_rate": 2.49075756496625e-07, + "loss": 0.5899, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5809638500213623, + "step": 7320, + "valid_targets_mean": 16541.0, + "valid_targets_min": 482 + }, + { + "epoch": 1.9548972511342408, + "grad_norm": 0.10266507868918702, + "learning_rate": 2.3505351623170353e-07, + "loss": 0.6066, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5731981992721558, + "step": 7325, + "valid_targets_mean": 15640.2, + "valid_targets_min": 553 + }, + { + "epoch": 1.9562316519882574, + "grad_norm": 0.10345989214210093, + "learning_rate": 2.2143688018343707e-07, + "loss": 0.6077, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5999371409416199, + "step": 7330, + "valid_targets_mean": 15955.4, + "valid_targets_min": 731 + }, + { + "epoch": 1.9575660528422738, + "grad_norm": 0.10090461630292039, + "learning_rate": 2.0822592222287659e-07, + "loss": 0.5969, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6222025156021118, + "step": 7335, + "valid_targets_mean": 16458.2, + "valid_targets_min": 634 + }, + { + "epoch": 1.9589004536962904, + "grad_norm": 0.11171063134597106, + "learning_rate": 1.9542071402024185e-07, + "loss": 0.5785, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6225034594535828, + "step": 7340, + "valid_targets_mean": 14275.8, + "valid_targets_min": 568 + }, + { + "epoch": 1.9602348545503068, + "grad_norm": 0.10472137138520929, + "learning_rate": 1.830213250445467e-07, + "loss": 0.5777, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5679185390472412, + "step": 7345, + "valid_targets_mean": 15203.7, + "valid_targets_min": 528 + }, + { + "epoch": 1.9615692554043234, + "grad_norm": 0.10556708209565631, + "learning_rate": 1.7102782256319115e-07, + "loss": 0.6075, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6184024810791016, + "step": 7350, + "valid_targets_mean": 15826.0, + "valid_targets_min": 543 + }, + { + "epoch": 1.96290365625834, + "grad_norm": 0.10908761627910832, + "learning_rate": 1.5944027164163652e-07, + "loss": 0.6058, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6222631931304932, + "step": 7355, + "valid_targets_mean": 15221.2, + "valid_targets_min": 610 + }, + { + "epoch": 1.9642380571123566, + "grad_norm": 0.1010896453599452, + "learning_rate": 1.4825873514302257e-07, + "loss": 0.5973, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5961298942565918, + "step": 7360, + "valid_targets_mean": 15682.6, + "valid_targets_min": 612 + }, + { + "epoch": 1.9655724579663731, + "grad_norm": 0.10025610273231542, + "learning_rate": 1.3748327372784252e-07, + "loss": 0.5972, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6105427145957947, + "step": 7365, + "valid_targets_mean": 16404.8, + "valid_targets_min": 555 + }, + { + "epoch": 1.9669068588203897, + "grad_norm": 0.10228371428791674, + "learning_rate": 1.271139458536019e-07, + "loss": 0.5934, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5717061161994934, + "step": 7370, + "valid_targets_mean": 16421.3, + "valid_targets_min": 753 + }, + { + "epoch": 1.9682412596744063, + "grad_norm": 0.10475497189588388, + "learning_rate": 1.1715080777451868e-07, + "loss": 0.5912, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.59098219871521, + "step": 7375, + "valid_targets_mean": 16878.4, + "valid_targets_min": 765 + }, + { + "epoch": 1.9695756605284227, + "grad_norm": 0.10015423663677037, + "learning_rate": 1.0759391354119017e-07, + "loss": 0.5878, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5767727494239807, + "step": 7380, + "valid_targets_mean": 15934.6, + "valid_targets_min": 502 + }, + { + "epoch": 1.9709100613824393, + "grad_norm": 0.10156387805197431, + "learning_rate": 9.844331500034331e-08, + "loss": 0.5962, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6096939444541931, + "step": 7385, + "valid_targets_mean": 16366.0, + "valid_targets_min": 625 + }, + { + "epoch": 1.9722444622364559, + "grad_norm": 0.10719608709343924, + "learning_rate": 8.969906179449316e-08, + "loss": 0.6091, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6203577518463135, + "step": 7390, + "valid_targets_mean": 15040.2, + "valid_targets_min": 584 + }, + { + "epoch": 1.9735788630904723, + "grad_norm": 0.11017698139830989, + "learning_rate": 8.136120136174318e-08, + "loss": 0.6054, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5938665270805359, + "step": 7395, + "valid_targets_mean": 16084.2, + "valid_targets_min": 461 + }, + { + "epoch": 1.9749132639444889, + "grad_norm": 0.10566871444745696, + "learning_rate": 7.342977893546875e-08, + "loss": 0.6083, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6060525178909302, + "step": 7400, + "valid_targets_mean": 16333.7, + "valid_targets_min": 849 + }, + { + "epoch": 1.9762476647985054, + "grad_norm": 0.09749390670046561, + "learning_rate": 6.590483754409237e-08, + "loss": 0.5744, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5636769533157349, + "step": 7405, + "valid_targets_mean": 16822.6, + "valid_targets_min": 209 + }, + { + "epoch": 1.977582065652522, + "grad_norm": 0.11092173648538958, + "learning_rate": 5.878641801087547e-08, + "loss": 0.589, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5932129621505737, + "step": 7410, + "valid_targets_mean": 15366.3, + "valid_targets_min": 620 + }, + { + "epoch": 1.9789164665065386, + "grad_norm": 0.10269954867675517, + "learning_rate": 5.207455895365198e-08, + "loss": 0.5908, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5902327299118042, + "step": 7415, + "valid_targets_mean": 15743.9, + "valid_targets_min": 474 + }, + { + "epoch": 1.9802508673605552, + "grad_norm": 0.10327250901637106, + "learning_rate": 4.5769296784653463e-08, + "loss": 0.5963, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.57696533203125, + "step": 7420, + "valid_targets_mean": 15775.1, + "valid_targets_min": 547 + }, + { + "epoch": 1.9815852682145718, + "grad_norm": 0.10474078714099273, + "learning_rate": 3.9870665710300954e-08, + "loss": 0.5982, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6041386127471924, + "step": 7425, + "valid_targets_mean": 15682.6, + "valid_targets_min": 338 + }, + { + "epoch": 1.9829196690685882, + "grad_norm": 0.11011438975518267, + "learning_rate": 3.437869773101343e-08, + "loss": 0.5929, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6006224155426025, + "step": 7430, + "valid_targets_mean": 14573.4, + "valid_targets_min": 364 + }, + { + "epoch": 1.9842540699226048, + "grad_norm": 0.10785042466983051, + "learning_rate": 2.929342264103296e-08, + "loss": 0.5782, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6067730784416199, + "step": 7435, + "valid_targets_mean": 17377.5, + "valid_targets_min": 199 + }, + { + "epoch": 1.9855884707766212, + "grad_norm": 0.10847529204402115, + "learning_rate": 2.4614868028274837e-08, + "loss": 0.5853, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5615088939666748, + "step": 7440, + "valid_targets_mean": 15786.1, + "valid_targets_min": 665 + }, + { + "epoch": 1.9869228716306377, + "grad_norm": 0.10017211729266047, + "learning_rate": 2.034305927416935e-08, + "loss": 0.5842, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5783184766769409, + "step": 7445, + "valid_targets_mean": 17086.3, + "valid_targets_min": 608 + }, + { + "epoch": 1.9882572724846543, + "grad_norm": 0.10239017393007949, + "learning_rate": 1.647801955354522e-08, + "loss": 0.5771, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.565893292427063, + "step": 7450, + "valid_targets_mean": 15870.3, + "valid_targets_min": 693 + }, + { + "epoch": 1.989591673338671, + "grad_norm": 0.10269734101477318, + "learning_rate": 1.301976983445474e-08, + "loss": 0.5851, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5717909336090088, + "step": 7455, + "valid_targets_mean": 16363.2, + "valid_targets_min": 453 + }, + { + "epoch": 1.9909260741926875, + "grad_norm": 0.10335049595234001, + "learning_rate": 9.968328878115495e-09, + "loss": 0.6131, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6074311137199402, + "step": 7460, + "valid_targets_mean": 15293.2, + "valid_targets_min": 243 + }, + { + "epoch": 1.9922604750467041, + "grad_norm": 0.10779248661193865, + "learning_rate": 7.3237132387604646e-09, + "loss": 0.607, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6135603189468384, + "step": 7465, + "valid_targets_mean": 15164.7, + "valid_targets_min": 429 + }, + { + "epoch": 1.9935948759007207, + "grad_norm": 0.10479306145925003, + "learning_rate": 5.0859372635964065e-09, + "loss": 0.5819, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5816622972488403, + "step": 7470, + "valid_targets_mean": 15709.1, + "valid_targets_min": 334 + }, + { + "epoch": 1.994929276754737, + "grad_norm": 0.1040250522239671, + "learning_rate": 3.2550130926789487e-09, + "loss": 0.5919, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6114310026168823, + "step": 7475, + "valid_targets_mean": 16027.9, + "valid_targets_min": 291 + }, + { + "epoch": 1.9962636776087537, + "grad_norm": 0.1063982033117486, + "learning_rate": 1.8309506588959356e-09, + "loss": 0.5921, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.6096254587173462, + "step": 7480, + "valid_targets_mean": 16148.9, + "valid_targets_min": 574 + }, + { + "epoch": 1.9975980784627703, + "grad_norm": 0.10167680252386486, + "learning_rate": 8.137576878508578e-10, + "loss": 0.6098, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5815737247467041, + "step": 7485, + "valid_targets_mean": 15848.2, + "valid_targets_min": 356 + }, + { + "epoch": 1.9989324793167866, + "grad_norm": 0.10102538478634103, + "learning_rate": 2.0343969787950387e-10, + "loss": 0.5871, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.5756806135177612, + "step": 7490, + "valid_targets_mean": 16549.2, + "valid_targets_min": 823 + }, + { + "epoch": 2.0, + "loss_nan_ranks": 0, + "loss_rank_avg": 0.598960816860199, + "step": 7494, + "total_flos": 2.3824840797454336e+16, + "train_loss": 0.11019459065355108, + "train_runtime": 14786.2521, + "train_samples_per_second": 129.744, + "train_steps_per_second": 0.507, + "valid_targets_mean": 15636.4, + "valid_targets_min": 509 + } + ], + "logging_steps": 5, + "max_steps": 7494, + "num_input_tokens_seen": 0, + "num_train_epochs": 2, + "save_steps": 100, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 2.3824840797454336e+16, + "train_batch_size": 1, + "trial_name": null, + "trial_params": null +} diff --git a/training_args.bin b/training_args.bin new file mode 100644 index 0000000..1bf0ac0 --- /dev/null +++ b/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e070991589618011b0b85a38b2f253a0d378231f98d4fc1017a0991f00299510 +size 8849 diff --git a/training_loss.png b/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..79e93080f9292b960ebf44bb42f1ffc26d2e419b GIT binary patch literal 47290 zcmeFZhgVfi7Cm^$NRXsRj*5y%k|dHrKm`RvL_~7VNX|(G1VKbH5=2Bq2_i@il2lL- zBuNG(NX{94r_k={S+i!X`2(ic>hAA*ym#-ds#E9ev-hqWs&-Y0oP>b{!!Yto$_g47 zhU<@EIK#w*@QLvE{$KEa;?5Vfov+)QIlCF&HN{j7ogHlKooy_Q*j!ETI$7G=o#PeY z=N08)vv78Ha1!U^v;FTkcE~jK~~c} zd1k=P`}*%aqJ`E=?Z*ea?7#4Mh557Pklo@vl1F?v*UKL-w=XA6ui^f~(X~Gmc_FX- zRbR*Na!boXPVa6MGsHbKcZzO{c_x-P_yyr%Nj4 zV;(YAwK>k{z!W^z6zR5-{@C@sc`FP2tEAT&y2e>{b{x?G=ji6*A@%OCh_-b4njb$j z;qMtrk*>cCOP&P=;#MquIV0w?<*dZ|@OIhn*xUR*TPqP#;nq*&(reD-RkV+jeq{CA z!HH77_xw4B?=26H^C=$V^ecZlN$-|2$;!$qU%FH~{xzx3{YP$*>#R;Vqv+w0k&(xr zO_Wts>YrZ>dmIyE+C4@}Lb4F)w}V&dxf+<4$A^oH%WqUq?7cnv!65ul*Fe4@9$X{X zZlJ8TxtSEc^sznjiu#Qkrtj`VjN$tY4h||`z1ldPSAF=t+{iuit3Uq)v-)C9j?7E) zZOjs@Kd#dWnh*yD1`hxJeP7CFYdGenp6s1F&kQP!n<7TOE3sZ2s`43`oqbeNBG&J_ zJzL_vd6$TJv*=p7nv78e|Jk$T9O~Qk_mf2J6}7eL9#F6j@@`M_kiawl$;sn@Nem(+ z|1(+Vct%xKwWq+CNGn&j_j~YY@#xst_qH~Sf`THLHAn3f`Zlgil3+eusIe_wo{EYJ zN5)MrLClfk@|7zE7T-C@7)8i#+_$!ME)zk2*R!?wGree7vuGUl3-Og`^KD80W^xU5fR^r5UwTw;5saA9q2Zc=`VzbS&b4u*>!{L}Bd$>J^~ z_Eno)u5&&@n{OK{fnD++%*6MV3ZR@X} z#v<6$&nC03*zIDQ+V_?nHIBOFv(Y75K0cLKuDNfo&C1)_o;7QUA9?5F?8?+6%Nyr5 zDS)1Peb9>!yVK@7{r1E2ckigZ*5?{NMR9Jfrg;82-S5(U#~uE_?>wp2@7ia}?DC1$ zXX*1vuIBNUgdoGZ2P5V4Rdw%7o8L(J*7)Oa(RV7b`W%6otcSn}@!Q`Xq6}-m{NWLk z@CW6C4>w4z_Xn~1Zs4pB`Be{BrAT^>vhHsX`EAz{vEI9!`SAfcV_Q#8&qyksajul~ z`);Y3#jWYQy6)~{qJ!?7B6j^f--A2Y*XD=p-|?J2edwC>u22MvFobAWSYKC? zk-_FlCs+zqSuuyH_7f=HiOI?DXJwuAT>W!@BGqqjoJPuPjfa+3Hv~2u%r_?o2QHfI zFU`%WT?2*Y6fj!CQr(CbFOGY!^_qL{W5)Zt^L_#_*Y2L49H&kZyY)K~-F0#zm=0%^ zX4&0Zt-DWp%wg=2=ttPS-@ku%hkZ@3{li@0*jb%=(fOV~tu8wojxS!kU^{*sKP4pv zQo}F4nntPp9jD_bPRMda8*VI&h`G*a=jd_nT04$>Bxp&MW(^1kpgU(4E}s`VvIzGz zst=)ps7-B{DD_x2JAU#cCp&w9zS+FF?EWSRF|mJjwKVNn9h2hhmccQpyT6EEUQ3Or zsgZH_@-l`9*cc9?;9eP)P?4)B9o2St{)#rh~KUT4` z)QmZwY z@0A-=Z%Nq`9cHR|a^eal0|SY@y?x8G3&%1uGtGuB$Zxf#W-dodQd3i>shvvG$lfp= zf0yet@r?k}t#JRIJFBRm07XUlI9K(&tp<0DYbA@{-sZ{12xd~a&c@c3QDZp0nBQK7 z0rRdoFDEBnN7l7q$lP;f)4W(2o9$G4X2_#Q_f@#$^Ykhgpk~Djh4vZQvc_%|GOqKv zuKYBOJaaR5xN?24?)8lvomHvH-xCvKRoip&nwm$3c8Al0S*X3uX3n3)Wc2h{VAJBk zZSUQ`Ka!o55~z_aR6fM16k+h^M>d3Xa9rH6#z&07kZay=dC&>250vh0O%v3zVk?v1 z@qD(|il&|RXFm+daYPL#n5Pt!&cSBCSLL&f!VyK0hz*_Z&Z1KE>P)Gg_wH(UJij6C z$B!S`qCY=QP7a67`eVkaYU*WDzHOffnq3IdjhVvMja`Y&U(q{m>5zKRVx)Ci5%itn z<7*ml8zPsMmX?wdcN!0GaN30}8};M~E{s6o;>D4oZoRQ;{hdm*_W>aLyd!mzDJJVYB8qK8Uw9dN0_`w;=ndt{Klfa~m{->S&r*xyG=)v)tNC zb4{XFLQ=9fgo-m>E9ZCj1&^iU(VtCtV3$>Hjwj7L5*;*9S68wXy zd`%LKM2UB%^QOKjJ3Bl2`VB3urRhhEq7g9Uf}S4jwR)Os`PZa2@2SS~2jCb$9T?G{ z@7D8rgkunPjL&SyZ(nkIZ+rfhqT+*w2~Azy7F;~MTdgUQy?%Skti=E-*5LUHp{_4X zo0yp`&0kxe8|a1N(=h0}ZA(i{{n5zCDE@Nh-3?*S&EIkKSZs1~i&<;RSEGb&e3{nw7b1-&Jh)2J5=>d zzjbi_`Cg^S&bNN2R!J4!xI&2DcV6?AaR=9ry=`ZR^_)!g{zzy1CO0<%eMp8SU2x;w z@4etOPG%fl0N5yHb9=k+n4Wup4-D3(;o;GlMn-!Rzx~}0!@@8W(OZCR_HQLf`$^%| zynFXfW$;?v7+y_#M+d!e_}4_?Fmh(`r`7vEvage2G@%MD3(3O9jbtJ=J^XuXrA`y^ zkYBG{y=rD(xk`Jx(o?v6iqc zKbhempO zdNZF-rkYrHy)opg+TfV($fEG$eYc(rsa6{TH$j)zyj5zO$7_Fgy%&Js=JfR3K>4PN z+w9MV7aFG-g{_Wwtq-{M!U8v;EeoGrxce)lt~Db&I}{CiXUDr3a#2^gn>`vd6y~>5 zS93bwO-@>fn0`4@yR@<4E&{8ww+8#VQ7po^ReHbTtMMl66MD=QQq?=SeYnp;Ezu05 zT;oXTJ+bNt&hD_0y5K@6)$gF%NBXRMSF-u?^fVa;%USeUz-@l;837?7V5ZmtVe77Z z$VY`+Tb?2YH5e@uQ_J3Jp5MXe1f;b55o0|lT}bO?e9u?UP!uT8Zej6RQ7;C>DdMqY zBE=%$mOKAFgQy%4Xao^ z^Cjkt3P%(%Zq1uFJY2M4y^Qu1>^){yR@~9b#{++lH9j)NHfW9*ho6qQOiM*oYghW4 z*0&dKq>@r7T)nq-2CpW9`GT1vvyU1j%nmm<_r~w)-8DwMn!SxN3g3jvyr{jfyA#jc zNVk<3B-nK_HvH=u3WWXM26#+}GFF25Rz~f&%r0cvycz|J|i#zMXe}{#en{(|;zU zU}@niTramcjp5hmdCdyfR;?bBtc2}D=wAsaBXE`b%o%!YEp>kBpbRtkUBWU;87l4;-s-dp3`r`$HexO{3Us2g9MuJWW4h3 z6x;lKAA0FHwd>xF#~$5n8jM#v-ydpj;e^Ysm&yG3k=^wnbF627Z(Z8A62iT!(#x&( z{0-P^ERvr2PoEyCosdaa%df9jK!F{c+LSIIjGx-7SLu1^+eoZ8Y;ZDc8`goKnH;Z% zLTbYwGSVJ^$m5tTk|piY~nvDb=ozKlx*bduqs09ufiRJa$;lroGzcZ$I^>S zW$kUTXK$l+TDBu4GLnK88bOF@-4X}c{5@#E@w59OY;oH%vsWSW726GPTkH+IGbIHu z!Qwf|?wbH;6mG!P<7;VodTnkX46@QO=r04eXQr-L^o$So^n|>7Cs@TAxL4F>A=Fdq zbP|?^b8>h9rb;DAL^Z#XoKZw3r*jlizS6B*^!vxCr~+X244_O0uKIX;aTUf{!w zrVXFVm?t!_fzAoA;DmHogfDG)q|;1K0YEV&Rn@&kOqINL?V56?#!PP^ zQA|t>Z8w0dk7%8TW`F+F0W7RDP_?%Q|F~Bo#6S+vfLNw`9X$Zu1y`P-i^Kh;POo0S z9+j>;di3Z9R6_@7e^AW&?L*=QU>FF&&L%CbpFh+Pc8qlJ+^%n7VWDcoA|&m4Sh|I| z@_7zk-ovY_t6Hhi1sCQkXfC+U)Iib>*<7B$!x$JC-bjr%vHI0RY=mZBiF>XT$-=b` zb%qgr57N*=pMACA=F;z;GM6*st*P@4PTU6DtB9$1{ra^7N^{c>#kN>OQ9*Y=?(n!Nx2_(-i{|!MePdr0)z6bYpIPfXKwQQ?Rh_qi(8(z z_wkYBx|$pUNjOnR_2(17+yDp+Ajj^c(T%CsH1gglyQjqBfuEuH=p!`Z#;(sk4EZu% zlUT$b^qf9hvG9@9mH7(vwM$D&DrJ%h#?ziS#Cb8Dot>x7oT)2u9CKLxb3^myO;VOr zAW+breV6LDM-S-sqJcr$@V1a;`*8~)hM9r#V_3e+w3fTO`)~je%P{L1>d=KxoRQiR zdjO!H?u#}#x8`i(mo9}u zOJ%LDp%M7t0ipB!;DAYAV{@)6TwEk}ecOqXeB6!G z9`5dGw?Ei%MfO#AoO`K~@Nqr6V4~3A(@&@M<>kWdl5>KBGlTZV#+<;x1VGe}0@;w- zuqOlcUvyJWAyzW#Ed+1tm*w(Cbbk*}elA?D96|DXmMGsOH{zD%+<+ZT-H z2FS9F$&5%~Sw0a3ZiVT4dWzE-y91J491Y`39JqGr(xK-W8Jm4;-mEKj6^n{k4RA^P zUTZch)7=zOQc^piUHQMrv5oC*QeMi%#l?`wNTM`SLPU#QisoWJd-ki1`2wWl5!8di zeG#2f*m{zSix44q`_@EZ(%RZu)Z-Uec5t;MpYNC%<0)A6)GfVBfbkoC#4n75`J(BM zRX!dP8cM~}{Oy~frsmVnk+^lO1)MFj8Ny7PJlac8%G2Mx31_`DqyvrktL*FokBEZx z$Nr` z&{x}~SDaFQCgL_QM_VgX8_@fseH};3U)0dP{Gl6~woqt)jUdCIDjO}p-VfKuK_&uTgY)Fcre7~!XYJ#>khX;FV({xzR8P4ZAGAj5z-hux=a7(K z0yaksXeAV{gOy&(C$H_AFHdEqifm@SHTV8#GrKMT#2-vcBOs<4BLAqUs6dyhy)EmU zi>uHxX}!5qP76(@@cBW=p$1)VZcTRQv3BL@&$r10hSHqG#h~;~J75;AZunT${+^fY zaGtq$vS32XZ_@^z**cA|$BG#O+Y)_u?FgNZ?EutbhWqeaSy^qUsNcE6OlSP*%a=eP zO7=OMn5Tw@_IDTKUJ z#7RR3zS!!w*KxdrLCU*iIJmxC>kgz=7YPS$U&VL{d;t08D2O#0u;M$!P1$QdSS0x3q|SE^L*ucGcfX`+CDB zCC0 zgjiEc%cwi|j{9oo&BgXBe2eQ-eyfxB@81V1Gl?0;tO7Bx;R46GxWs3_zH=Vc$u|gK z>$KkqC)JuMv7+TG_&C&0PMnRRa{%G-=K8i)8Bvjk_#XO$<@Os zYMx%sOgl7~(i+G)BRL1OsBiUy-eXQ;5p}Qz{=J3fV~7HWnq%quB1_84bYpNjEbWid z*V55)i#hkVmo8sMdPV`{Nt8`MO!x@v5eAsE+92Ez9sp$>g2;sPPF#ql@`l#XED2WD z>Y%OzogS$F7K&K|;@h8HaN__H6-p^#ljCIH2R;;!kk$_2TGb7I@7f+EBPS;hRDaqy zkqi{VPj3l>#2c-!K(H67XlWk+VixnR1$c`Y6eheCUP;}}&(GJYZiIvhz%J`jH)ie| zfpe#^vH#R8^ihRp$!u@jx)ln-K*jD_U*MO+o}r=-l}xI%%!_JqEMcWYugRERP!wR(PmoYnA}@v3yZNqu_~rwI)&L3{t_&mWtrE;I%Jen&{|vyoa@J}rX`1jHOcx4_u+p(e*-bKC?e zA92LW1K+>c{AYT4adRT|19#X>UEOeq&cq*%N$`aqRz+-efV>w#HagTrN>1JYM4NwJ z)fNeep@G{gQ65m3xl|L6Z$vl$_Exap37dl!;#fazSVO#!B{fI^A)u=HdU$%4UD|&N z;to9&Zut4@&#v^wX3fn#&+`mTy_f!Uy-gZEKh@C%fRk&xYu~d_sAY)SOP|wv#zz(S z_XlllYHw~8Dynr2!!-mv=8$><$cvJNM~)mZKsDDB$_?!4QiE~` zn2T`XL5~UMLTNUp&BKr{6L!N9sfe*{%mKD+NfM<9KFs_PAbmIxBE9{-Dk@}1DFckB zk|J@-;Vm<&IOVS>ut#}K8rercY%mD#osqV0=`VU$R>q+3w_7yOR|1<1)#$3}@buTO zx%ZlM0jWTvln*56p6^?&FlY*TMvKX-^}_|;=v6YXu&{WO2E@h1&5{iRakJnDbVt01 zEdz_+jw3z+!3gvP7tPGLd^dj|3+~v45DL)c6}5c+3^I*kB+Db9df3mL3CjyI%WXxx zXo!GuqX7gJz<2@RVxnSV?gPJj`DW zhIsn=`besQ(rdO&iIp)Zr+P0P8vphz4ASk7t}dh5pG6DH%TDfJgp~9+t()vytw%>j z0#F@9rA`0<8d?L8O*eoHQ1wl>2L&;V_N-v1dV+w*oHU<1*AAOWVy1|hjdK~ZrO z(lQb`die@LA43)H5Dk~X&-a!au%`%iy*$@uLIH|UfD$V2?k-lf_23X8v$vMR>JPbEA_|9$3fnuan`B^u62X;;R75t z%o|`5sA6PW>+_MohhPI`F7l3!0*9H!?^RStKsYz1cW3109)>C$FKW*st$G6}Ed)aV zN#35ZwwOeW!-#4*%skHG(!XI=iJ&z*(67)>IQ!f}< zSRw$Ik{0`HE}2#-=YlZ+c*I2jUC#l~l)(Hjd*-ge;?!lO`aVQRL;e9-EwfvH0OYV= zzkV4&=Z>K0B?EICU=B(koi74W$$91sDJVMiP{0-;PDfDlUZ`g40+b4Zyz$~L+;-Kw zt|lfX!@!f|brjpTK-b_j-Xd_T%5hAQNz(Jjj8E4a?E+i~#U|(i^W7JXR;D_L010eB zW-svD_r=G@@A0{cy1jg$CV8~;v6EMmWlT(tBZL(#WeNnKzV{-*OVy+Ykn4=TKff3f z5uphDpzHh~Qh4@=9-IZlSqo_>0?F=@o-6*K2E%tD6%&F~q{2^k7o@NaNPeisX=-Z5 zAMq8@?N$TsqX48uq>r9HeHyU>DqHCciGrpi92^|{o+}opV;XG;g9IiFjhCTQT4Jf~ zrA!TIJZMlrtKYmCTx8wN!Nb!sL!st`JQq8F&`OX>g#w>mW_yWkK4NytZMg;{C z?J>}bY9OeiQc@xSrH+AgG0`MW_n{wjLz{uJqwD=n6p9f{p@7C|kV~O@Zb$Z=O@S8WRt;jR4slH(1aLw*5i^;^qnK0b4x(?yq; zmyP%K_GW;^7@zi|k5f4BHphgt2|pDua*SH{Ye&b$HA#OP8cH1irT$G?T8+(A*qw6M z0_YgdWov$c;?o1naBVE_oiD%cmVS2igLEYV-~gzxub>Xxnjfs}<&2d0*xug0;ezBE zSK=+83F;6*+6?lxC=z_)o)u_OkN^4{Jp*E-3Gi1cT+s#j`TVZnvnT*IX?c2bh{(xQ zB0RMmpq_6@g|D`UwH{3)-8NAF+D1kk(9Hr_WM~6-3)CP7Fk_7MKu-HQ*VJWR+wS=1 ziauQzuhXxR_4%Pzu4^eR(9|Y?)WgVcfNewLy0QH=#t--iW611092|jnO7Gqm=+fvy zZLkdp(CBesMUuSZ=nCh{EwahNOEr#cbvL%bEFg^_L6iIU&@vEhYrsh4!#B@?oCri` zD=gRPQ)dJ~hgn;wqez;O&wKy=>DfDFPhEhp9};PK>cKDMz2QJ8qvprM#}|oX09)UT zH99J)mX=4m2BIxKIG89bBEk%uKs2|jeI=_S_9{hr3(}<{r%fFu)w;xF74+HUl0I5 zgzJHTzUAmxaHnZ}a@w#&;>3yjph=x8)%}Ln7#vRo6HL~>uUT1J_g=py*-*^|`^jK` zv(;~g`?u*QtZaUVTY3_W4t{5%+IdH}_=1O^2qsBjqrOhn?8 zdAaNCyX~Hij*edN#Gp&XLkZ9iUI9R2hT0F8)f4SJyYzy&c%SHul_Ho7p?u9eV6@}E zop^B`u#GV)i2D_2WanBX>R#vMY`QR&>Y-hFu-+izff{w7N&)=)Vj}6(^yVgr98eIy zr5=-)lj{N1s}*4iS)W1Z=0$)mLt@X)?rtwkRWBrIIt=JqabL;ZiL;!XL8=LY_dPs3 z3KkX|)_`$dHVs%2YfP3PsV6DYc{Dt1fLdJWM;yFnyRsqA1_32>;m65{_g^8qKDv>k zm7br!keDpO4}K=duXT|0z;dSZ7D^NJs=&xb58Rpndl+zYv=Bl))qd5z?b6`#Yw0U- zwB?oM6m+l8%a14yc+wKWp5IwUBbNvGTi<<#q6FlxC^ z!mso5DJNP}Ka_ogt$%6??3z?dW;OCO>{vz zZyzXTOijwOUuB~W16Wk%%qo5R;4_&Yh!yOfvbdA?0oQzpra#gIj}&k&%>- zFE2uhY4kXFIu;fdWFVk`oBegyLy7fCU;5*C^mIz}&#fscv%0?L$RmSmdxILLjOLaK zL0dv{hF@*QjghR8Kzh8ZiwqJwwu*xWUlsyzhapmOEnYsd7YvLN5)!)33NJGL{#bX6 z&KUX=#DqmgM#@K$laSo~t{xSkpju-$xh;PyzIu&cY9M;>doWC0y(*}T5+EExvl67s zi<&BjnH~YG27G8Wj!b(y%hyoB7fc|7URl)A6Z&^|z=2ehl>V^qC7`I604vCE{*B3( zd5miq(hh<}$kGKxit5<0U}#Hp9c)@9*O>s(9)c9_4U@T*lFAwkqZAh#w0sfb|&k{vew!ZbLV$dDUm*d6l+;A8}leFL(j0F*|o#yYR^0YKQ>{ojx?=y!9R@mzl?=8xQp;KmSH zmxi`aVrQWabMCEzX`?82n^y!jAH(=67I3TWK$Aw^kTLWC`o2Jl~Au1LoRnD@&hi0zW#6@m9{tb{ zq?G#^t-$kfw$4c0X6PHhq}df)Tz>kaEsjjALM-CW#BKvF$B;n{EO#|SL##kC)d4P_ zeqzl2R^A62c$}qqEKXG9{NPE5W92^O`sar?ofM$M1)1(JlUNO(HH-wBd~iqEbc;Yi zq5{@|f(ZwEq!twYhi=% z@Abdn9{2#`7Te@0M!=pWtENUdIy$-lHCR4fZ5U{YI^b$&etrWH@&RyfsHvD7C>KSZ z4q*C~ZsNW*;$TFmF7+mMVq%`^9;`{qhWoEY&xaA9Bll-MF6O zILix$5_4RQ!?CewuVFnHgJTuYZ#F|!%)ns>X=K+!Ie`2Z3W6Z`ys3^&3kAtY?QIwX z`Hl>s&^3#BuDt481qt5=d9xwgfjzGQji#}&QN*^e(t&CCdq2B&x`x}rcS!rCS|Ea> zZHHzQaRE^IXZlNNfb4}N&B@z!TF_s5cZDXF=T;!NK@cVG4xJfNGhx$$Q7_@mK6FJ! zz3)sn!1n9_uDUT`RkXpK4zwt;{1ts&YmnuplFjatOK*2xC^)!jLt`U}B6W0b#&r|y z=3AZnsD*_tUGDB(K|}&TX7UDB*Q{IGeSr-<6^s{bo;cTEs?>sE?ewRG^JQPxOyY5D zY!2!IG5fdQYdC4pk^zOz4>F%`0+2c{E=4;4iBcGeY=VxX^@pT}%RN`Qkyts^k@dkd zX*Lv(?RS#@>4PE`;#BHG;{dufXuBWl>IjgpW9I9nKrtWsaTeBp;ygugLOD`ydW zD5LuOTQ_q)9Ks+#E@wWezH|M0$ImR&qfL$rl+%~1h13Wk8xXT!9bcob>FNP5t=1du z0Pw!ygA2PJ(qBGMn<5mJ`lWYIz`ok727BB|<^oD08Sd|u!sJg6DoaRosShDPu)M$= zHZ(K@{)Ybv2?^ofj)yjh3iVub)%(7f3>Yue_4OlxOBsWH*S=E(2eG8u?@SK)mA`!1 zctSSK;Rrv0KkPqZN8S&u@W>jdi~#T*jk7G$K|DJsu7cZi_vOIfzwu+`##egdw?DbC zPbPv0i|y$KShEn2snPHwB#_)XizkDjt9Rwz2?Os9Eof`?D2sz_f=A~)F@~gd9{s9h zeLsMoC?gjDdIb_4MOfuI{5}wAes2!ok6DpDpS}!2{YD8(617+(ir(LEjbV-GOe} zm_4gkK?e=T&Mv4V$c+h&6gX2iV$W5A>jbMAt_`YnWC8%f*Ru!SfFRJ@@rj7WqLf%< zuV1I}ONHdnaZUOWSi}DDXI!73K}jZr7I9=PH&BQSRJyHJfM#O{r4%xA1GFU$ zLq6*x@K_~4OF8`dM1>fzjS1=fP$;pS@HIqCz^RZ|>KO>dKxG?-o~S7!QtBakE(~00 zti#~rYCs-nz~Ey!c~u{Q>vjN(4l?wDyP*M0s7Qlf0c{G*mePX*!@--4q%TBM#mpuY7uh;#~+|irC>UL7axiMD;(Geg>J(D3ZcmD%@7x+ z4nLicI#5`K=jS7#G-pK+^S-vLUuL{sFl}^bj)^KbMs(fnXE6Yd_ZBub3c#TPAIcur zoUWD~wbNdF_UL4 zUJvtE%m@GzW!1(gX}@C=GdkXZiqWs}@sE9dj99*DGc96&2nYy>DJYbjorPFDeo^^q z5MT&Pz@d}~ME)AF%Iq!zC$@km09(*CM1cdL5|Ab)yWTS1y?dAP=+OpgyY?5C(2r2= zfee}f{4$U|zsyV;D*V@T<*X3Jj7qIq=j_BYyn& zk(QQ*!BHbxrY3+zj*FuglbV35)0f)7^M@$*9m>wm28@izQ#jGIQ4OYcMu1T}i;tMj zYvik1oA!m+9z5GY26D!SK;^B7Z8zL5jswpUP?io0!?LJGvV!k4#c$68EjKniGQzH% zIwn@w{Ql=!X`^$_N2@Llk8!w^rMK3xkM$ypYF0G$^=*p}aBmpd4m1Epxz+>O68 z4>gukyTFJ5Xpe~GWF}yvaKJ+_2?}*iv0L{YH_$i7AYy94jhpYaZYQzUV~p6>&8?DF ziDfcml|efZod^Ogz+r2}Qev^52J;6J3>}|<*gwU~tLWlVbZ2`GrW`r>5hDtnunfdE z62<_1E&1#r@c?m!^A*d7QJW4ZnN*RDrU~^3VhjW-(65jHRfOy`@MuclLt2DHe6XXz zlA%*1302&tub3R%PzYSuf%uIWaWFiNcY8qFQUK>+cLSOJPXLH3V4z9qr%;(*%kH!0U23 zDQCW?tJl~LzgAcH?Q*%IXq9@;O@bn$oMu(@19w^K910Sa19_7gl`1;hB zntzoaLDHmlB7aTP`RYcJ80mUVN)|=n%D5@GV29XW+?mWeb^X*4X7A(my({zCi$cx{ zSxzl(9R%Ms9qv(%dP2>Iq5%PelXfPgMfj#6+cO$tGLWK9oH#*DOw6C4A3v#vRsuHc z!4u4~!|@$#gYB^{BOI&SSdWcAc>Xjl10YuTn3~Xe6!6_Za{@=$*ssF&kWG+ggfUz{ zi^C?2LnEi`1wiJT|H#XStVC!)VB( zDo3!g(*=f@^4FRJbiqLan14jm0c(5lk_?JEpoL&u8PWQHppdaN3LMMhe-T6|e5Tk@ z3ycqY{ZTZFTO2DwjOdDTx&i2K4QY^ZDMv}*@&Z=4T=03w88q1NB>!x(13n@dUE>Ao z{+aPthoE@}0H_2lK!(&`ltTc|L5ao$H;9277<*&N=K|2z>O&9iM=$g5XSp))v(d!9 z|6KRr{#@z*u7iWdQ*}tYekv<4<9`OE=mSgm?*ZAz1o^rDJtPg<8!JIF$NvF1Qh4ab z19ieelD-Lp^vT(;lM7Uuq6Ukbu^V zNi5`I*@s{=Tr_DR=it7L^`C|cO>iBZ8?f61p5`ZtH@mc~Lynf|*%4UPwl4l(;dm{a5XTm8X9 zTnXhwI@YE-WrmynZ?+;~nSQg=BJfo7mkp}-5Wj(KfXN2|dN^*ysT5HUHTrDs1+cI= zFqtojg5Sya8Q9Yk`=wp}{8)467V!u<|8HWhD2s1lGpm4f3_m|Ppt>qNlXTs5};vV{)im| zu14eN7Fiu-aUaG(7#7HTbZu~nFTjD8ggerJ*ua^#GX&KJ4wsrzV_!@JYdzsm(d?qL z&69^0A3Gdubcn<5)3`D*m+#Y@ylMdDcSjHeM=+j^0KeyII|g2wdQil0fYYyCg44Nd zJUnFRm@9(MOG|gNSiGz+)pIc5qeY;Mn>?ag19%k*2OxoCJaE3W32dJ>QhQKF#Xw!D z+F80%y9B)UC}@R>pj`+G3NGaN?UKTYqdK4#pq*7M&d}se*W}*p6BZVJ>#ew!p8a?0 zk^t(p$>FQsp+@-^Y88I-e9741y&?3kaEkNs)2H{~0S(}cAy?lmXj2f65XZ{L_6F}& zm!QS_@M=}`jP10~o*xqXfAlE%TRl)B5hMZFmHKrT@l0?k2%T2++K2uStV&<^e~*v< z+&``(%VBqDL(|HN@L-=iIX}eIxMPgq@KaBb^|5Mj93Ybqov_u@&L&{MTH%iyP11XY zPSQYvBkQk;$&21?Q$c#*Nbvn~k5d&@NdAkoTjCcnV(dyRPwmelYa~>Tf-vDenI5bL z?b5|CS{w|d5r3e8k|gHP%7APNCVn1mJrLc@Q#=TRDOeS?v}j#tf8GakPX@qVz_XTd z6DH(DGWAn?m`rw;^W-Ahl)rv{x7@R+p7$+eSd|k}&&!!YYStI!#e7(U@ zG2=hob~I$T@eTEwe@k@<-H_!!eJ`Z5mnuX7e<@VTi8Q!WkqKsbVexodKCUWD--%Y1yxJ{dae*BbT3HREA%oXf0H`T z!Qa)F*(m?zoP$UG-;0jF`d5S=!INacll;pfv?$H`Qif=%{QH0xK1jYd{l)$cup__FIUb5{HL!*7dsg>i7OkUNcuL`<$#`H|D^*3DoKz9A6Jd`fKm8{a79Ne z0a=?2TD^N>2$Edo8D*nY7qB?^0M+TsL-=Hv;I6ZS5cNTIyo#=3%ukH{D-Z|&-X0f# zgOvu;VQtC>P3%1}9QbL3KoIs=@NXT(CBZJ>_+UM0|5z4VD6&a{O!%Wy>0U_;iGSID zs3czpAf@s8 z|EeKh1?Xr4|6z!qfSNvJUcnLkPbp1)h+A{j{~ruHD2JNFiD))*A(mm7bog@r761k? z@YImq;@_3c0TK-e{HIhs$MR{~L~%M!{jGU;F!+b(=m%9Gp_v+S;@>iR zFwmD4lqm1X>E4GCHO0%a{wHkk(U4#UxQl2R&Q1?!pf4$#qY0z_hR-p+uZoBEC1tx7 zx@seq@Zz`abF+gxzd!o-&V(G)j*q7&@LuX1%)TWjik_+_)=pfcGlUd6zs44TYf}Uo z`q$m_sO|w?*3or?H$)7Jefwn(r$Tnb!vzpa5)vK`XZ=rtKkXhII(Xl7z2LUxTWU;| zNC`c|#FP-uFt}juowyP^3=GGA?8ZP7r@eSlKZEM0jG-a>z8f4?4rwq#C+l~_(J?D2 z0Oru56M_yJ0HQZgrsz1l-nC}lPIA?=MgIve+aH#=H6S&j&b$V_`~eKMz#byIx4zG6 zOz&z?U?3%&rrMwFDZqpC0^Zmsx;nuBk#KAg2l=0&04)GDkPeL_qo|!tlet-nPM_d( zaESG3!hu&Wdu0x$QUq$4X11o7<0w9iw4M)+D8VltxT#X zUvN7NW}Oq&Z(h9$8G5iNvbs)xojV4q(avmQB13sg`D(UF`9#Ae?gC@KoT z&I!PobrD@_=CfMyj}~ ziUpDOAj6;3&h<;??9;9CK93~k>i&LRrPPN5WOy=!|4AS(ujBiJr3}5sAoouBhAHq! z!0~+q{^gC-8k{wL02Gn*-XcZq5)ex8AL8O$*RKb0Dn)4bzf|E0N=;22ZoNU4cP7UkRUVUyL}dEJi#oU#6a(8zqg>m41hw{uJSJZJcgzmnNNTL3;fO0 zgseRE&^Jc_8_f(ozIMI=&hzKbL7z%qbHA*0fAb6ehirflK-R6H{asdQ^6wN) zyQ=?})h~Z>-hDSz0*Y`89c5_Vn)ztZotqBbpTsHzK2&$CUxW~JKAKzQ>qf|Hi>n9y zI-Huu!I1k8oP^=%q(M_a3OS&e4M-3h8a!Z_ssZYK>dPJd>vaAye0MPI%rqo8 zPG$i1J*_-F+jl#FmtB6_<S!OxoCoQFWkKt5zRT#t)wt<8pk zFGiM!w%oJ(nO@N4V_28at0;9H`!=F~<=#>B@bFh_v}McObhkmw~guo3zpl({@E zx!mgTJn^@ie6gyVh_eIP9-a08cj{s@IC9X7P>g`}MRRsZnpi>hZvnT&gJ1+~4^|=7 z*zV3wS?-uJSn%U{<5K=Ee{qyDV~G$}f&6gb`$NoMxB!2n16&#%T8kI9jy>b%qq;Pr zgme9G=lga7;t34$A8>^zfO29f zU6u_3l-LpBu_!kCJG1qd?~{ZV9F}50h|d`yg)0ZUlprP({UH7F_aC)N$iVRU8-hs+ z+*Iss&3KraM$XKCKna*XPSX6zX~vD!IB+;T)&eLLJ%U$L)_7P70sg<26f~^5i^*If zH$8wu?c#73K||j%G6O^5|NW>S066V_l8XnrJeWbwz(Xd)%Ur``d~eAA?}zk00+W9p zSXUo5Fm%ED_Df6syEWXa{xiTo<1x?si9DnWKM4Hqq*JcUUC9*FR|{%+w-q6E1itet z5r7@z@(N`V&$2x){y^IcS>x!Jl@!_XKhBglE+csKlN3Ny__@NCn_K~}HX{;w+sF=R zxe1`<9yt_Iie01_{4#6uvKu#jh_&!|CR`k5YOnwC2KE(e;28F*i*E(fV zbr2qIhJ5GXqFY$6hPSf~i(OslhQn1ir5|Y(9I44JI@^%qrh7`nL-Y0z5s?u&*+*$< z&bPH0J{cXl{|4QE8mN>7C`cdS#XtvQCX%Sc9M}N0t7&K$x%vQ2g`_$#U{81FDZ$w; zr15}&SnCNVi7uiB;Dg`(-kQ7k;SQaU+9#a1NfcN=zo8V`E-s=Nj{PB*{O#?>ss7i+ zwy$Dd5uliLe0Ejf*aBp|g&I5x1F%tJ{>U@{#&2W}$hYYgj9#q<^E@&O0wh^jXd{0L zGr)iA8b=fx2gk?Era7|Mt-8%GlKd~dh}W{>aImhOX92;DZbWTs*yYrXGui6Jw(@Tk zzIGi9u*8Q@EmLCz%y|g+SF6B@5#Zd!oF^amHX#EhutrCadIoSlL%-S=i7G-2hNqvP zgV@~MBw!?|yW=)+ALyAlskp9pv@NRB-PASXS|V(D8tGo)vRG%VLEHD2x5N4h_#Zb= z|7AmR$JTHR{_j2kI38%SCU7%P54o`6-B3uwtJoL~a|iYdy&!CP8k!F3A@5~!FmgUb z=MUh30y;Ggb?q!mm`1h&oL?W#lhkg007oP@IY&48QfEHPnB9^jP=kRI7krwX~Wn=KIOYNfWfuXT5%>A-n%_)=b}}Lo&hY*cHeyB@ul@{s3J;4LHS18*%q6FK=;= zA0NmEzz5#b<{6J$1$RBX(?>14rS%dcn9snT#vv&=Fj@erKNB1(-O;zRvpbU#H8ztS zD$0FY+rg{()^e}0({h5Ei;j)3Pbua$z_Wv8<*V}{?I6x$A3}mU5 z-kX9PoSf`2m%mEAgp&=R5JH#x-kk^Ra3H@0R%rnuw6+i4m>ct(yX5D6^PtN8wb-xy2HqqK9WnyZS=WZF6v$7rR_8riV>Wtc-8#6OC<5?iSCb< z88S>pbW48;ddJ+W>V#&n#HY@lZMec$iQc-1-cJT6xPKEp02h>u3BRG8jSUYNnjXMA zI7sja$z(t)Mt)~x1l$n^cC=*q+XWE)BfusdPJixz&a`+nE0e>iu;ul$Xz+(`6sodI zo=3s!XW*U3ula*CsnY3-3+H`n24@@&^UP--UKSi8>S%7`Yh?Ak8>z)oIYws9ps|Bk z1hJc0#PD8II3CvklD^ei6+}lo4|=B!9K5n|^nzZ@sVlwonfj&L9_M1p?9EQPp)+Kv ziCw{JR^;+prMRZ6+${`rzw0yJ>zk)`$H(6sXuCJFCQeOdDXYqdNF zeXOj?XPodc9bZ9~OL4AxPqOZMmDU6-oAURc~vMI`UQ%HWhM% zry0sX^OO+1j8QelcUpldtxM1(rZeOAD~hL9NP1%4n0uHEgYUSMy3}B4@(U63tghMaK)@uym5gD(zYok=^ekr=6Eh zycOWIIc_dfs;Ll9XRiGA`~TtWtHP@6qHZ_cEnNbF2qN8$gmg%5x{*e@8);BFMQQ2o?(PPq zJ3qS5;{R{X&AB-j+`+@%>s{|!V~#n-nAF+RU(c=88;)CLB=8i>G}dG)ZsiP3TTltn ztg>o2d!(zP2O$LN+*!SrVPr2?sN?UKj}_Eb?pB?fHL9uJ&}r0a0}A4z7|!8MRc_7W zx!ey3WCiAyk}0XFZO(Os4HSEINMfD_O(o=&N7FsIaWVh%!H+0UN~|k z#8VR5xKM}ZdGScwOzKh@Lw%|H>=b;0dxS-qd0sx7^j4v@t##-tRV`bW+P83SZ27nV zFJ*A0g*hCFuk(>}t^i!)WEv0C9O8_2=AWb*07tx4pjw~zE{@eq>C@tW3Ck)Kd;js# zf<3*s{Eg}E_iSlraw)~{MAmKu_l}QpZ5d$mI_Wv#ABdY_Ms{D05DR)Dc307vbOBx=~zW0OUDY zsEk;Scb4GUu5s)iNW4XNecMkHe9aY)r3mS3mlH#aeXV26)qdynwknT# zsG;JIZmVsas_8b6b=BX9iOPT5E+A1Q(V;I8HU7Nxm(f)s5U_SRj{rZT$RFZ`R0xW} z5B+}FiuFwP<^SkqqRCn(tUi1cWBS<>?YO9BJiip2J#VWRf6dl&O_|R1{6v9ctLVQF z?M)eO`>?=GqM19p9>b2{wTiUM<}Z&p#?RR{SZdQScwCM9f=fCgD=`Hz!JeDL1lWx# zMcjI_n4g{tLe^(!*@j#cb9sKz9^UYXv&{$xndU@=6Onf;Nn*Y>H+mcpc<^3u^56oH z_u5sj_xfAq`{VopvDM_yrK`^wYI*HXjI)6xHR@=Hx|C8aABne={*;(^Rm*XkJ6P(~ z%nWNuej&Fcoe8L9Hb4L4z*UyowleW~LX9(K^}`?aMa{UE`y2}cb}uLLepEVj=!cuu zE|SHt#s^X965N`RY%S(j)2nS#l`s(F#&4(I$I+&0t1{B$9uha}y?P)vgWX+?z7VXs zde}L_3=tWjLFFSfyItiC>{rHD^FKeJ-=uORW*2?tP0;kE#=?qH?3}0gA)PE^+ld4XI$^w=XebSO- zrr?VzO}?1_pa(u`5$Sh3rE2%SU?VvNE=nC@TnDnjeX=2g$7O-@{%7)$j^yJ`I=c7Wi5&#hX%KC!?XY??^yx5kF^$k>S zjLLYYob>(LmX73DR1)q368(dF&k{2ozT2ahZUGg=eM!_N~?5G)D=c>eg zzy)t1!z+khU}VIbv?&18ys01IheCRgjMgquV#6hNDYlI{i5_+^R#>uq-#}KZDclnp zAxGEj2%4_%34b1qyuikvtgx?%Gz}vh)a`a84E?RT=(K7|AmhW8Lp?QIJ6yI=aC=(? zHmYe%vn%SOnDIWsx_%jiGD^y2Vl66BKclzS4M<^Qd+FrUhESc=G*a3Bg#04}@Sb)b zZeBu~mU`J+SD-r5a3|PEm0mS@LKqjf0=aB>9}RM2FlXxXr1?DmQRhQx zpybf-?Ag@N`=UO=`_fbs%7{Ot%IZZypSsVy$w*a6++=#V*!_CHe+HDrenRP(YQ{i` zn5u|uL*~&AFth8!zd$E@o!4UCnfGV;{)nNQxA5ArX$xR~AT-i(W7P(v;E^nZ=Wb zOp?Ro;`foIIQ0Pb1~stnI{}~4U#K+i71?s7_n`+=ZgCs*#auR{OYRj!pdgOpO}i|{ zu$UN2(NtWt9PF3OXjXGJ9BtZ}(_&tLKiiGA>h zqQOSNJp;Ebz5k;}nD^(WnxyDbPHE&lj~5Jb8GRv<(?<6FDYI6i7U*-q^{bWPF~Tzr zp3fVpyR|bEL6%xi0f^#e(9(P;qT?9uBOh&;!O2aSg9X_;ndlNg0iD+ zOd&HQApw6R)0qoI)mkp!=Vn(!Lz)K>RlyEn%i4yes!3@4re%8ha_UK#!AgDHL9)g;~45yLUpAGYiCkM;|p zu=&~iOIPbHd(k2HDO0vvrLTpq8lw1zVqLlHUm3#*vX+|Dr*c4tcPYcD&ir{2KATo% z#wh=*8Yv8h_~piV8jbuTCNPI5#@>h#VK&t5ntrhCM)3Tl9f}1JnG!uRhnBD`UG=4i zbv#lSmCDN(?fh4SaEYb8E_|+y??|Q}cV?}}N%xjC;m*Nu*@TCXz0X0Zu;vp0GDe|w zy3Qa%r39;xiCp=sWXXilP7kg)LO<(kx~xYmKj0wD0)$8e+JBV`Nh7Bo=0!qTb#jNN ztH{wCu|_PR-HW?pq@KZNkMNh1vIlYjZ5n1*5+CCb_h_AWNw@kGW%D&OS3;SuOpT0w zvJ6ua&*g3R)%F8!<=F7{wzl?^6B0koks3cTq1a-!w@0Edk~fjcOg~HnUUB$9`u7O& zv-VuS2c{a-8gbSoYFtMARCK075fczmsA_$)J}u%xT-v)GwYDw`3N(KG){_7-hi)4s zJo~q1U$TO!x`?{frxp%HCu{`Y6!memYS1J0AtEO}x-_<%2o{RN`zm6gM_~mme~c`E zC|<-|aW7nzM$j5WYN3ZR?5oYY@%=OP2G8yML)#x1RJEZ!|!`XE@th=TasShH-;=Gm+~(wv4)45B^H)R zDcpPotz1+=ni9nA3d5OsEM4#8=X;Ly1v|a5ZOuY(1hFcR9lwcxWWZSqh08eYp~iHL z4*eJ?6Xt=VKQ7W`SVp0jaeJw4_{MElB-lqiRi31w4k|gu`9GmJxzbwn2*@+Qi zvkwPqB=GY@^?yU)vsRHNwx`A5-8~H~+djoz5*Y)NPDEKY=fc+IC+5Pg-D9d)&(Nbm zUX{pC$Y1OL&uk>v<^5gzmxy)j7Gqu(NCIE;|Xrfsixn`}0UrTDu4{%7hN5V(%2^Zb>y`{3Wy9E1D z_kB+6O$t7yaQ`uq4*x~kg)JKNI3OG`&C(n2sLpLo5?|Ptm$_vN}>DAC)D$hr0Ojvx7RIXy!fbcCzSpW=Ds@?icfPRu#OD* zsM$XP9!+BLI9$^du2dnqypeSU$$ys*4sH_61 zh>Smt6uA_{N3NdPAWsm%eZa330+vt}uF|}YhXa!@PK~@ z_;^T&E#q^-=x+e9B6mOtqgXhE% z)7PN8L3sHRU;@ckMOQ4mY?q|QHJojq#o`OYm^MX4`$PI`*5Wqh;|2A@X1%AXK;_WE z?QIy0t~BQ3f&Kd;-1}5^#*ewT6GvS)pM12mj!mM39Jxd=UsD$jaFax zLjtHu3TWL%=}V+6eK=#Wnj}w29IL}-C+UxuQ4vgVaXKUK5^7DS>$0WoH*V9l>lByx zYcApo>Boc|4TG7u!eL#Y|<^f(zs^jc(utCoTQ2#mH4Z?apKL;f2TKZ;60?jlkLUmt+hUU zeJuN$3k{6QKWDQ2m-(cgn5XV2u3c#=GL(hsSZo@F{*Q4(PQM}H%hq8B`jgf3omfqj zJosXflo&Q+PQF*=`Mk6CA`ycqFj?gdD-}Bv%Cym+4rUm1xi>JWMnUU>@a;Ch4W20` zhv>}wYd&n?+4vtDw%QYt^_@LJ92s8qf3SP!|6gaMkXNE2IOZ}B@NO2wUrtS%0X*2++^VJpcj;q!}R?ci{j%{yk#QL%EU zC`Y_BOMQHWxbP)>2bt$z9C|Zv4K`;~Biacg`#q|p<9-j) zK|l{!HV1*GNt4*niewSyP#(+)|4cUr$;#E%rI20-q;e3So^?vm_8-2k<5{2Q*kgtT&{eA-^B`HF|PS&mfO79VHKRkrqd*8L4EQ1Gky`loc$G!n14TWAv(-=*}EhS zSMrJOk$MIc{N9&*@M(nj>N4OoOVzUZmB@2s4i|P8rZa%Wcr&kI94E=b9z8pOZg7AJ z3M=d1LVmjGxoE$$_67zerWP;3akZdURa#>NCqML0^UqS^tNp+#_ZfP2h9)*%Ua~n_ z#E)+#O)Z7)`Qg@lzIMacMoM1AhqDS$VfR%suvRD%c@S~DYim0|&AWf9l?il?l(Ex`Mp#CsGzgZz8f`QZrkLS9sjGK8PLL`$^*%-gC-4FlHe+Y0UcXP@P+9oJ zj;VUbx7nB>ES^g7JMayBx<1vGPQf3QA}%ugDcidMc}Z?g9&a) zwBzS}5xT$s+!3B#Ilk$0Ir{CP!p<1|Ra_D>bEWI@7A%K?><^mV;4Nj!K>N&}^s<+Gl!gXNI{a^jty3 zq0>u?gV$72rb%1ncep*3I3!)MMC*T&S(XrxU<4K?q(lQmY2;O=)Led+Zg9J`o`{o^{X>j} z;T?PfJ}Ln30Dj;_3jFo?MN}cGM^F{#AxtqMsg;3>poXEz){r#t7|E(*SxT6sr5?jn z7)+Ex6l6e|GSKMJpe~6_I##@ne)qlR?s~aAWkF}$v?S(t_P00v5NO!5kML)|gGL12 zS_d9=#_`O#^PLU%PtpHX>8-9vTu9VUgQ;ecMevlu|3g{H_@zm1T>S!{J#7+<_jS`}Lu;2dhV-(Y? zR-eAINH}rQ0{h$9q9u}~P1;gIwu7u^5N{+anH+PKXXakC%cdo-4_{(Ls^rc!lS?la zMOR&mV^CoQzRHv#X5<78iFLk5jUbiZH)0i`6X(&?cDbjA%?L?EfwQtSem&)P`^Si zK`c1ISFgKiX$qdk39U$*8@W5S0j*|jSMyuoZ*?6tQdKCxu5~GAwX@gdpkoEl9s3@o zxlLMccEAV%Q3&UIelcZv8gMi4WN6R)>N5lcb#HJ02|WfPhH3o1URlHkWX+7nt_|q$ zsx41SjK1QQt0oHLI&hlcCPlEM4i3$))=6<}WI^uP`~aW(lt1by>~D>UdAq3bn0lnPtiR0?$HWu|9ugNizM3@lVe$^uCy}S*PIMzV$<) zN*k14KD^(*1uzVGbB}FlWY-EzYb`7L6d=e*9xsx;i#2UolsI`c0i9c33I!DQ_ zm3Jgo$nO(lX^->DVVN3`_2x~BO>_Qn7>Xr|kZ8C(NWFK}2G<_lXOh(8y33`y3nkfq zSdI}(Y=5AIvqp;0cOFuA;In3}-U4(Y4*h;h=lgh_UvtTGc`mR2p|qc1LP`D%qy}AIhYH+LlX3=jKQ}Oq=RI z`JT(?z~~)uU#2=#O6=tIo6PAuKF!;1Blk_u)ijhY@^xi!ss* zY^*zbI-!6D_y#TNX%Qzyb%2fP8uP<4U9v7FCkfP;xswBLd z2Qn)D98hw^us81T)k=lVz^+AoNZy(Mt{BH&`ZEdD3TK_E>*<2+0{Ob*H0ZSsL-iw# z*fQqFrzzQedyXntZ)$H=p3xdp6TXjbW(SYzR@FS9Yq%?-2YNqk}oUz#Ymt#y}4=sYL4T#Yf#yUbH)l;NAi))-Jo_JuH!{g z{m9I0<_?=S$Vjy^(lwDqgp!4FLiKymn-};y$FuCsV0&+ zSq6>F77SnBS!mUcIusQDpNY^&dBcnfST#K0kX-|NJ_ASuy;ipz@BwmsGv z9ANoy{R#6<{BG^|U>#;xh_neK?+@s%)sjF`i{3VXo2}4Yt=`lEz0*tnJ~6Yu)KB%j zi;QHyR&a(QcMM6Jiq5w+7n3cBCRy_4aL(w!HVhkRi)N5OYUkYG%$r|DdntS%oTDnz z@dpRjYe@AqS?;WbGBjVjzHHg-8qwVT4V-4as__A@F5{1EEj@1yq+GOoTo6OzqV=nl zO>}K@)-r|wM(QpDJsd-%4*MY6mmI@lDVtltI+jqcu@EG4-{oNE;LrTlE~tAwMZ3;Z zb-oS7wTSOY2<0iLL4W5>Qw~btHm`|GlzLU2h(d1~rF_*5-#*9hD*_q1&L87mLmsvb z2mr@`IWsgwU($u0Z6H!)>J^t`NXM34jhQw|&@M$MD)~jQImhUI+9D|+?0s|h!Z-Ea z7yC;Ny(Vw~-OsGjid=S&ILQe4k*cWq?B9C9Od~0iaSLk6i_Bv7z8NZk;U2nEmgR~= z2Pqnbet_$O@aH|@*-u{QaxMsH(@bS_BuGovNTP+!*R0HDI0zXB_%2ZxOcC6d#=n%0 zd&G15A#`z+Hh!m<6_-%8*|fy+N)1mhbrcL(Di`}6>6Pz$Kh^`~+4;6HrQgH;$bJZF z3mUOrTFKvj6#*#YTV7M4*>?kt-+S*w_B%)$*Fq?$k{2}ycg1gqCTNxk*^$IMKE4;r zN_zF&OogKS)F_wifRgl;^sO@v(nZ)Sf>j~oyyj2`lrV;1)Dv69uB3Z*P*!XPiUrFA zq6Ig8r3~@@IJT|!OXgQ6PPRz3USUO(iy=7fg%;vQ|8a5OEtDHK8)^i#Bn_26da;gf zYg3rol#XSr^_}VXaDuLmU$43eFVxZ7Iws;zN#WIEr`sz>Dc6Z9qKD9m?pfAa=S&0d z6gnvxp@pwpWvFRm1gYc~#>p^FroQc0{boR2^n=UNCN7ai|77!%Fua@l>u#x#!>T6$ zU~0fLhIRanbq_sDOUctS2KrFBeY}u}U?$GRQX-vnph);-J^31FL#az?o9-XitRp(M z8jTxbLwTl2OzwPyz9T`BxdjN|jA5-Qk}4*lxdW@ovJy2s@ya2}(o{@n7=Jw+d+ZqZ z-y?PRo>RefM&zv>(r?FWr`$Ji681Al;Q8=p#Jn58;X?XSoyh-KuVPh=?LhVnEu4lH z!Noz=Zii><96?i1b-IY9RD=FE9P~~FtE3;p`<&`ZA{C_s!b3;lJ)fR;YLV&U-y!8(oeF6U8*aaz5y4Mj{D|zASLDB?4?;&jAqF`Mz~GD0AiUaELYtQbI&sBmTHA^J8gvgXU{iC_-3%(&8SGJ z`e_;crR|;s`|q9{YO#SKhQ93c`g8O)a^5ie9Ob}-U*Gqff!gy#G#^s4MVCb_BC>JQ zPoGOnn3jNWkflz{A4)j9Xc#3^(gWB$!y#VXa~}_BrrDqURZvG9`@_cxUkdgT^t{R$ z%JOVDv#$RXuO5d7T%rDjED zN0KzM*MWdq^dyF8ou&)yvf;lwm>yEq92*2caFF|NG)>p8!}+Y4W^t~^OptWH8Tq@NKM$-p+8}mv6zj#h_#mg0#XtVuP_9$})2L!3g z&?B{zG2E_`EWr+D_8TvrDuf$Q>CzW{K1)E0G(WSBnf*~3n(7xO5oiR*@_O;#mqJ(l z1|(skEc5yo8+3 z)qWm%gpEq;)c-m4^Z7bQXzk|ABKqv(*7q*WOpW7ubH?lg zWu`vRMj)F)!Z2zBgi~^yy~990lwUF=XepU)lmzgt+h-CtLk{P$yNQpT4?P`j{4`Aq z8qf_WxD1EMu)kD3MDadi6^ z&_MC`V$VdrH(Vf;)RhCt4%lOTA5#aphk({=Gf-HB`zue|AOA7*J^2&DFi@m}CrI;) ze7`(nsLWq1*TH(zo-{daY5u0uCb@#mcAM+a6=fH;5iIZv=>Kg=%dnsJ(x|Z()BuAz zx6csY{f;zejbd&%TU)&S|FS;bCgA*N@M0KGK zOrsox(zRw{CoGYBR1XtIg?`no5gm)(8Wq+6m8KNNm<^2rk!-PTH+h%w$WuKJ&{I*y zY_EcrM>6O5MMG_3LqxUu5Rg>_gjzjD3SYf48?BuT4)`d`V#uRWU6ULD<7H^*Lky>| zrMhlp$ON!B9qqS|$5gn(%f^gPpb_`7nQCq|9j}#nc1h-DXTqJNRl<-RI`mxd!)ly6FRw4k7ko#QLFsH=wwZ_fv6(eb ziry%&Ib9_Q8xlebPc77s_HhG_^-Zfyk5ydu17H^ecuRcQcJcOU@r{oSru+uG7Ax0pJ2&Uo5|Rj zI8B{2>Y8Sgo3b=1d$fDT!lGjhx>Y?U6}yWtfUzT1Oa5j^n~z~ zTBfLR9tqn-h!P}BRho#~UjC)L52_0IZNoERrQRBY_PO<#{LK53_drl7_1-Jwhy=m9 zJeCM=yy!WiJbEZfJJUz)pEG;p zUpyOyT&Zvzxtic^1_V#XfL6owlUy4A0g}7yS$7bH+gBCEVNwFddSLnL?L5F^5uifG zOB*`A>3>7?iq!7_XtQmxAVBos=B*&?gmy_VOm0)OH<->A2=!OPkS}0mpeUZTK=2<+ zbdgxszQl(&(F^UbeNor`zsAzm8ZaQcx{I;pM)KvRt=3bXlfc?U9zbE zeOQ>fJ{qPk*+6O}{`{qy=c^hK*&j|QAXz@nJh+J>j`y~XWN2S@)Ys(iTsX2-fV)xp z8`|j)qpK|XeADDb*_^gzvqwI`6mfLB6wPt{K|KIFx6`bldm))rzz8z@WeE?srx;T| zEm7w*d};KJ6jm_Npl-PhXmR?=-1>JjNY4;7_+#w#Q)aTvo@pl2U%=b74mUYliT^rdphzq>!OXz3 z(@~bt+OcEjr=)y+?|(%k_P^R6+P^QOPPwNap+KV8{RmMlV~N%=u)ZTx!&99Y*pP~V$E{Dpq%{9 ztkm^G8+4ou3nEp;5UZ9aV&X>z82>*cP@(4%Vgzf&I9I8$)5!#SS=g!SwzxoFETAy?NIt3$EXHDqBG0Ph|_1G-{EH|$T6#hY34DfNC%DJof~ zZ}5oU4A_`e|ArNC=sV?!YjwD5m2CiEHuf*B0IA+M;3^9^p=6EFXf^&xC9Sf6L{=|H z7TNNW6D;!$0Pi+tB&T;| z?26;WjE5&TMR0+7L!`PwIs!HIrYb#rpcfcz#8BjFv03}{ z_|+*E2?Nz3N&yG*1fs59448U8x2EX=?zmu-fH)YI0rJR(OUqOWS-`YLAj~%eN!Krd zSRe-khn#$6-{yyvtWGSU*A{LQpL>J^S+i-Qf!J)wlYgy(5gQf`=<%-Fy$!wtEuXF& z`acz{f?_Xgj%q_pbwovA2rh(SauTZE-#Kf(mbU< zXIHfxUbWW@FNI+xAN~_)870{a3m961*0?xFlH}kAjsHPs8QQ^$S0-72?M+9OD3Ypy z8Zqq_S~(SCS94yyI_KnG3g^7)wo0rmv>UDC-X40VampU1=`rG>M=vVjEh}R3LBv#! zyRtbaZ^BYYj?#LIWLPpzqfo>lYD@jw!yiPSpn3-sFu#09>!@>emz%Ch=S8GEKdrOb zB%LkcAW!qWnCuyLF;vVA6L&TFF4gb*5o(EPl@M-QYnSyGhEtKhJIAZrrcC|v-E<_RDUDlzdngR$?l=R91Tp71j zYSfmec`PR0!e`(N6X|&hb~olR1O3Ln!=G?|I)%mRBjWnRtEznBJSaE~bA z)t2T>Y7P*M8_jfN0V=6@rd)M92zB^=vNBTTei3$2a}zjSx*%z7!Vq@;|K&cCFRGI+ z#ZZwRO6gITEY+_Twmrm0{2m$zxU?tMCm@5tAzvNf#`!zW-hKQZJ&*%-eP*cCG=X+I zNRoH+`nYR@4}ov;0V8cuccOZIFwskREc$k2(1A>nuD00@iEYr~#*+6R()6S?bBHY| zNrY$L8>5Z_w`RT~=FH@IxDAhxmvh@qwg>dG;F(k4h1kMogv|3Di^wc-Z6__j(;7AU z$+Xb}YD#+c`ud`2=z|9XCD34j-diuIy_KwLUg*tVk!)2x$unk)!6WiobLv;{ueSHO z_a9yOD7ChjuC*644SUO!ODYZ?5uFyK9H-6}&UuV$@34Ljl&m9pS0il%mHL!V0gm*r zUMcb``$BIbok8D~#95XVSk&_3Vsw%y#I?0fsN>q&TD{ZWkA=RMStPz-1lLPkoi&*0 z0$f3EAR>8UdO8S9B5P1vf`{a)pyXC=y;1*c+%zcYfCT`GvgV3kH}+DM1`jpeI2xOi#b_x=33dgerR?nG#<$IhveywK6tF>iQ+!`YR`LnI6|$ zdzX+6IHhhJx`&O(!_7~^Tf6H|!!P?R3&G8kfZzy_6n6u{mROy3m0srQfZ%We5X?K3 zcLb6Ealx362Yu^e?-7=qjmz-Uo*O+wTfrXeJ_kBDLWrRVCup(*=YX+B#Xit2!NW); zm!(q<8;pY1(@j5Z@^rpUpmsW^E4UyA42e>+tk|r^=zjNa!)}1ch& z@Q+>?XukU3vth*I?s(MSuS^zmg`lV1$IFv=d9t8^t{(^$UXSoj0XT_~zQA%dP#6LL z^9yM}fNsKT$FhH=qKv@-MZ_?6v)eI!a4sZ5P|Nf0X}w@ex5(_E0US;&)lxbX8F3YK zmsY0Ay(@(Ao)=tDgvkbaJJ9c?3i!Rd3xbb`M+=uzz13@|(JTroq`SsW4jGQlGJda) zw$yt=h;VUXL6G;l(OPK9`nnN_)kyZ11Mbb2fc1*{E$W4QMaozB_@cQgHI`|Ra9C3Tf1?q!K>p`Ddm+CDR1h3oH5~f3{B|ve zXb@Fy4k|!6%9DhgBXGX-!Z6ea6Nm=ORkDGTvJ-UbN=R}o4}Xgi=N089rp1$++KD)E zjk%0~P)*qf^OM~#K7OGI=9#G)7!r(wrZ{~K-ViYC;br@Qc;X2Cycx?1tGN##l49`C z_$6!M;=;)SLvlzLBrSlc6=2Zd|D9Ki{3U{QlW%uu*OT!!?6wSB*hye9NR;35E`jv&Bv)z+7{i5;12X_3M}+S;zrof zW+bC@22vAhU5}?QSqF;&zu^QOsGBAay^TG01J;228*oqRRTLp-;yUFYEDkC5yOP?= zyWJLfJd+u_roeR%dP@PgeW0_3bB5PWP#DeV6DGK<}tePYS8cAuuwC zY?GF620Cq3PII_R?}og~i1yWb5jT&}+pIxt2FVtgKwt;O##;@RH+QBL^$5PFE~zH~ z6^5J725Sa~|OkCD)QThK-#f2&vTw1Va9F`kIk-E}Ub9Rc$|3`a96*HunuX%-8K}j#4axTv6SH(%%vbsnhR!r3sT@Qr zD;_oqD-MfE8BW*A6{LzOh-cf;4M5k$-jMh20GdnkHZ4M1gOh`5ya4kpCwY@3a9i&D zzhkg5#SzW-K#2HD;HskFhuVr9e$s&Hmg?QD*WXS3)*u>GdVitD%~ z#KJa(TmxkzNecu^@U>6ve^Qp+@&r!0&bOXyH%l+w0!lwT&4WI7-MZH|{Q@@)`j?>E zeejC|Yx8#@v-e-!e~MH7b`f^FAu&%fJM8>_Rak*)XU+G`@;D7V03s~r_8hJJIgHL# zPbL)4H%j^`S*qbGB|UZDDvO26w7+$~Ue=F}aXrZEU`Ky~tgak=0Tnnpo6LbjWyA9t z);GsfAP1y7_ah{p8N9bXQR_GY_}V~Kg#}Uko<^uXw@J(j79%QgO~fOm6j9$%sR?NF z0B$;6#gIOA>>TDf0(U@N5?vHQ0&2nt$)9b>H`@DXS|+E)S$c(B7?3X>FTsp3uOR|= zyV);uqDTJLnU7J#nZ8V|1_RNwTja&afImrpTy@9VK~%5cGuPQ;!yBXTGb&V9KRiQk zx1pW^`CfuL*Dk0>lmghm4@c$pdl22JrZqz9Uo%(9 z`#}*Oyr>n+<#H$1<@7j1deIK{v{Dtoh?>Z+FYd>dY`h7<;ntHMhDYO%8Zs35SjUm>{gd zcy6|9HN1osJ1nT)xjqwZGD);qoO^qev~ZnE^=|x~2m|)Z`E|Zgvl~8AAF^%q@a+>y zTtZ|}X8dJC$-9o>7$|_W8{>JLKBBSzfe(zW z_5Ik(8om8Z`-#|^?&I@}zueQmSs@L6W`d1>Y0RgbL?sBm9+pfW0mX=^%hcD?Ndg`g zMv<$&s9tUWR^|)|)7Qa+v#qD1n>!IYmGhzs%N6 zHQ(+?R0&&0YBAV-E>sc)QgO4$GhLomp;(0A!PXQbpjEN3p3D->-Kwhs-FeW4>NH@I4V(}hVi9S4_ z?KYlR!+;R2_RqgORqD?6c~BtFaMq9@RR9RH%$=7uup!V*mde4zY;P3G4L~v$kQ&SU zTDL+UB_Rqf{?7xrD#U>vujsiEwj#8vYolocq;NqXXB~fmKJTqSH}w-Q&_nceZNy=3 zGW7s06d;F0a%WSgq3P3a$zE0*SW=a39RY2EjYkym%%2(v6cKXL(IOyas+5HDc1Mi? zv=vMp+T}7-My@>t0G(=qws8ES8>~wqR*XdYz1xH-ARvU&mN~eS7LCzTenti{0FC%v z99!SKqp@>|hpX24d^FqV6AR2c(wQg@v(f=B;C9oe>=y^$>6mh9BmOGcjajxJqPSVh^bsUK_u#2FTbcZ(WT@IaOF_ z6|}LJ0H^Pay>EAAp8pkq93x{%mVI1+I`09V&=Mg!&;*5lCL#tiQx6AW;qF8hF6eux z6_gD4K+p4Z+dYcrVH2>FvXK9FqgIqvS3=>@wgN8TH~;}`NaXZ*cqes#{`o)x&`Yy2 z>Ery7&!W{9PO`uD`K7vnfhHIjVZ17y87hbHU+SOU%juR(p#HvT%jOM5`)_+^`{~wA zcAyLtK&it{xP+U*fW-ceeQ3i4sqQYvDx`fD{1K&Leu?+KNk=CljyIwHmlQpqhsA&+ z2+#8ykYX4*@YRD;n!;#`G8FjC0T(6uoD8|~^Z;Qi8&0

wzt|hXq0grJU>sLk$5W z@iPoK+vbaJ%fa>nm4chq0quj82W7-LF*q=9Z^PU8yi+aJwIN?}P$a{WJUNOTLK@iE;j7&H2l%jx-gq~43Z*yWOV z1}}o=BKo2W08pg@j(Ydd(gsf@YluQxO0cPQ40Z%fd5bA-tMK30c@dMOgH)$yaNLJ^ zcixDyYHguzs=dQrd&^x|QNWxu#otK?{4+q81F77me69TS703Ys;7-R#8x5l-Ag`o| zpFfRT5WgrOL+GLmvf|g8r?xlM>E-S)ifW+EZRc#&a&tM4pfCV^+vo*RWuS?zxcQqj zS0o49{%m*hH#_^!Xq&(9*s?iWO3ItKl;I#9X%OQg_UVndNJ$v=Z))h}RxVS44Ix3& z-K<1~vzm3udS#LKQsaA@n%@UAv^I|@i|P{Mu=A+MTbL5DMg3~X(r;pi4zFWkyV6tG zlXOB**#C_|izT)X(-+c+w*{)k{*Fz#{6ZUJS|Xpm^5ycusqS^O_TdZHQI8y~-6-@u z6!$c*BYS{pZ}iSTYj-yMCiU3P=_mf`&9X#mziCgrjAFOM(G#KD^VG~{uA#MP>N>2T zrfGqs>C(qhlPyW!F8ohL#F{75u~V0I^%)lxs~WJig{4vOJe0C zw~P*vMluzWFN7ug1C~UJ`fxKJWdrd$xBq6p_F!Iz^(btbYl@9d<`X&JOyuA$E3e>f zy4(hN9n`dBlPb1W(HQ*|tXWWg)(I!q6>@U9ANOdLRi3(j_PNpOCqG+?Nl$!a}rZMk&_F_{#b?dAv~~`uLM?k0cG5(rvg+#%^!513 zR%SD9)r%QFXBaYP8=zIzGyiZQG%~v==P_I`6!qtbDM3%J@U(vjru3bQktWo>{70fu zyEh&x%ldkwV4yn%JqzOtrYze9Yj_Jr9SqdHg~$lt zEdQI_yxvc7B}b*ATY+s$rU-^AAWJJ`_&blLf=2}lki!0PzGI#8L53(*I?P<3 zpDbfVOj(v6x~0cYk){)l-=q+v!)L(07kk9=5qb5QBic{2$e%X6`a=t9`a998uRXSm z>FP8JHM;E?#vxS9Gze-wP4TqSKU}x3Y*SHsvZf%g^=9I9GLD6$UTnb zkN;xuvX6!%M;%th58O8kmwjd|-YoOxy~WbkpPNs?fXWq75Y)<_@Cv$AQO{3(;jC|U zI>l{0sKFg!{(mz;IwAAEieL zB6I1Umi|q)G%d?6$M`M2xVSdQ1GcqMJtZR{E#Avk-KVUzvB9;y>@{G)!c_{XBdU z0dz&_$;9&7^HSco%I0>%{oAa$e^NeDBTiwKkvKNUH5*u{}0!N3zrPc zdCqgr+55~K_OG{Dv_&G^%QnGSPW878=kH(ePrNQhzs9x&%1R$NqcRem^9omy~! zA@;|MvBw?MIa7D_QdJ5{d(bC2lO=x*9)9cKWwQ&#H|(e7eI?}w9h5izh=`YzTTTf8;_Jr$(h$=`~ysU z&|aO?^KZIO`PNZd+9Ep~UP2cdUUg7#R$1n2M&cFm5j?Lio|YiD=kAX2`;Ps{){u7J zBs5e|H2iA#RDL}QrI+|Nt-1SYZg~8*>6+r1wSfQUinbswcEh}qw>u}bw-^ivt2vAP zMES_FLd&lBpAe4CIT!a9CuilZOeI~cRrGW(dGp*Zx3>B-OSk=R_XhKdH^Vg5KOLiX z-Ksn}@;K!o#w|s6kd`FvhV2MFD^n<1mGx?}99+iGDzULq>ha2NP3Aks-#y>$O7!GY z#{N-(er#nGv1>Vx6>rGI;~^WJpXJ2HL{=+9wfsu=Yp&Xp4Kz7wGaA$mC@Ph`RnBSs z?Eav&kKpNqP&N_I_IQ+)IGa3XVBJ+gncF0GC$7uNb4YJzK!Z#xFU}x5SdIOhh@rbd z@>27MwqBY-U1sUgqA%KQIlh_$4$R4DOlq)k(iht1@kb~P6^gW+bB zUP5^eof%dqjvEND)Kzkj7ygi4xK7mYJiW)PZI4}mHInZycU}SyeQ0wpiFKfo>wey~ z0V|FjA=ik$!n?*WCb+i^Pswa>`Y2RUG;4%m@EU6m#n<_TdOlJjO;|RXaK_hvxbDeW zy#0b>aXsitw4Hshs`vrn`-blD5|T!zEW$ia#!n|P1XI19)AwTwCnGgPRE>jivd>Wp zX55C@(r#)oE-~04dhhRy^QeYW@JOiD$V4uKd1o&rlXs>Vd93==Jlv=W;%!Xr;6kcd zNo+_6c{QQ-buTfVmy#3cVQ3N@==S!Fm~gx_zGc!Lsve@`xCH`PRp*i2?H8O!D-# z-<_&=E#<48{GB$!iJZZP1fVUaU$y=#ogH0FIR(~h;~x3kQJ++y0}=76dlpLtmGeZx zloQWvWyyS6H!Tfr$&?@7#n#joX|@tio3`o9!PDwKJX;JdHR*B0jS6K8>zs6i9OfZ! zgNFEuPV#Cse}CSfhK9CCE-v#atCCS7nq-2wtp2NensF(zhdH^R#Ys&%dg3(CTA#P)m#0-E^FcRZ3rMTD@VUA)=-jK$RcyaJgh& zp}@`{Psd792e**((Ked4;&4TnzC4#N!iX-xat;$<6dWxG9F7Vp#)hB_g6t zCfon#y8TxrYjJ@JtP8t;c*&DD~Z@nDUw^^{a2x2q!M$a8~0#Q9STswbR z(+WDxUEGZWwj9Ig%Q5BQl=2yQjcm%(j(wk!ghzxNQqJBEH>w=q?VOrjzs6|!}ucvG~Qs1TKaMgQL_|hTEuE<>NmgMcrjOYg!3T%6z$bd$!qbrRQ5o; zTT65)|5z;UN%r1z{1@8Tqh4!%T~G0&1$nfe$~%;sJP9^kX;Ep>c4H%0Int%psx;O) zL1|0iCgbYy%0-Dq3tgwxXSe5fXU7O{L>gEq-7j)sY&n;v|MhEA^F;lr@Ja>Ef))n1 z$>?3WMoi#CK6&0qlOwN>ziRgOzgM@J>I`qAzq@<09ov4cV81drJ5k7O#+kPx!j3_? zM~hm{Bsa~zN2i-d7k|-Kf7=;cCFz&vaeDfT>by*$XLHe>gtmxvbgX^LX2QI9m_(V@ z?um4iP?YovmY;U43@&UmbQ5N>y7Cf!|K_cFat;6DH13Vcwg~yosYjx#^KOZobD4#? zd|gV$!I!_6UG}$F*SyJi{9Y{?7ecA$4v=&$_Fd0!hNi98PO!M?4)L##8^* z&U^FKCHvi-f~s7!sxDDlCS^7{~_0ppvKHmt?XJ7a^vCaLNU^b9+ zrCv$fswK+qF4OiL4ny~?gN7RX8432jO7~Vq)sZ-z6OllJ^_3DDisvku;!#9A6tq|n zED07XX`Skq&#P7Ii4+NADPJt4ef#AxF-pFwJ?SXQLslp2eWd#sajcE<-!pkK*h`qa zmmXX9(VQ6bmJVapuO6_LR_3c2gc3#is_xpUKl!=Jzf0 z@4tzF)SmP<30jTrN{dM~W9g~-5xwxV?y`SB*SB7h^sNb17(dKAepUWGs9zPj#xvlWZ-46=1tqQMHKgw#vzbFRj zkJ=BZqqsfw-bWaHEa`qExYh4dG+M7-a9Z={PvDpLXqTPd8fT{*lp@N*ZWhgYgQC? ze!Lc$2A-Oq#ch&Z7AJh{$>_iS<+oM8u$BULs7%F zZm`xb@aRl8#M*yW>7`<93Z=CWHF6JJF?3%jg9pZF1TeXJat`MCPCB~Z zcdm=CINgX>zkT&d8Yh+P=ESD{@b~OXlhQnL$oHyT8&{IFj`RBCT=>(^US5XVhwe8K zo%Bk=x&AoaIme>-&``?@dUZI{Z{i{zpaX~a>3^Hc=Q|%IM7$-VMh4vV3$;2GUBOZn z#{tn|5w30KqYFp6_fma}AwZth@~WRczp%Xbp*y1L#jDVtVfx9d%{8wDvvOz_XX1UG zviGu*A>avpww85+KC8|inkxSB)sjQ(wd>=y7SY_^$oEA!DBXw$hO%sBCjIKy$dRY4 z%|P#5lzV!ko=9!-ZKLDF&FUI9SD!_tOcw@6gQ6Z((y-Cn?Pa(&{GzHY!-N@%x!0(Y zr2FyggGiW$>#42y5?(wh)2grhs)C1->HX^O#os39O(9gOh+*HqC}S|Ra3%8Vtw_5*blGk$MyokdstiZ za%j?(Z&#L=vv6_Y0T~tCYffLjO?>yWgfYuuN6#i_-N3)o^x;mbgznL z#5opd>Ft=uC@E}Ov|3N9BC}ei$gEKfe~ewd(iZyd(k7rW~3W0d&He=`iMa*<$GM6 z(F?_ng`a+*FyN=EHWchhmZdf_G76Kpb?X+5sQJYRHFlsvHoou`w|jczQwbV|f+ZnM zYU|@8KkKzFf9R2c9-AxcS0L1k+2~@A?25cR>5=NarKu5x zoKf~!=(^9kSL=df=u&57XPwRC2GBScLAaxKXxL3av4EYOA$9t@te>E6MleCph!+HE zHv76i61R19SSF{YmLn!Bqwm>33{a(+j$5AjXtb@p$19 zrY~6*v)!*KRQ{k4LBEAoJ%UIU0RbUBJN}`Fu)Unm)@KELw_;N-G#Cp(15=`w{#5v$ zct)qD3i0ysVSriSS4^>7N>=o11iFM8j=jd8!6{8$1^7>SpQG}w?rw76*2$n)F!|rT zKjhsB0_0$##7}Wd{uqUULs7gAS{x3l)Oqd0FmIzIlg?_syemq>9*Ny5xQZlu?sTAHl;8U?By>Y?*iJzsCw z59H8XgtF^UA=DSjWFu0o(?TmwO>h14Z52&T%?Ndh31|Q|s?>UfmsO?zV8^rJU~2A^ zvudKk<_(HP;qV(dtBUr($3e^XQnSu)5`@%(6cS0dn3f`aci5roa*;=o*IJGG&39rv zqu0W&KX~vCapB0G)fW~PW>i-jK&@;;L$5y-&ZxxDe>w;TfUbN3{9Do?B~kdXa@W%5 zjhbDcD#GDiWx~|{H&MkRL7fkquW6{O;~}m`M~B*>2wE)wK6`I{=5qQy(foU^i5Zk_ zy@+o6s?4GyEv7N9RPXa4ZT^#!4{C0~WQFwxtW~I!{r#QIBVn3v60w}OT0ydKf{E8H zM&|~Hka198TwtM)XXxwG!X)0faU(h@ser~sRTXF2zG~VWN~~L2S+xL#_)X&U$4@)* z_5Ew^?vhkO#u3F$r*v>?1YdR*VV1wd@m%$}KD-IcES_;Obx=@HqKFwT@J!e&BAtKx zWY^OwE2-RP+^7u&sR1?GTnrcb(n)^eQjnR6g$USdb?XWmF>(J~H_GvXwA(L=+PXT* zvl>+MpJz(|={o%yY2MwFpRR_s;J)e3mMZ$X5|xrtWSRMl`0Ph0UTS}cI@5D(WLkoP z^z9VptP}&W>Qu9cI-PbdaC`!m4i1qR$JWV8JNl3Me6X09_otwtAb8rxkNm8ibwG;1 zP(OnOi}2;^%ZnbXzkVT0&HTy!TxV+#VX5DlFJjulEyb6fg`)Y7L45{Yw*%l^qy+wa zdI(c1u-5rMT{3*_1pvG4?d?TOlIb@pUT7XUqk35-*X$%w3u2f&i0dphYxJrnCWg#* zww@Ml1t!U%@zq;V3)7MOyPIpHX+Q=GGx;7oM(V6{#`4V0)bMj^r|_ROeELKNbU4hW zHpHb*?ENma$1mZnzzp@}5pW!Zg6=K#`TGoJwO=z3O-s{tR4r7OcW! z_9lVFNU;Pa=tX*oo4#_O2{1A;TH4#|mtSIV$=VFGHY=N0biOS?a}n%zWl($&bTL1l z_js?W=~nfo{d6@cf(yaWNc*}1A0;s1j@R6q0<>}hrv7NLqGHLyhW92{Exp@UZdv=Viw^Fd0P6 zd!o)#G?wmu9UTpZLzfIpkz5PLCMX(3UvHgXANm#kUWB^tD6(yrf-zY5=bdYi$aq+) z;*I8c>9MZNnvDskM%Fyz=gX9(fEaC_toxb3n8y?qq~}&t+_jx7*F^rJNSaP}i!mQ= zCA9;+9z-I)Lcu^Bf|&0ZSRXLMd3txh^1w;OaJSXbS1>RQD5$CVhIqtaMTL0Oc=E>~ z{LfTXIPz@a7_v961efGCUX)Dz$;ivojMiTOZQeNv%*^oVX~Rt@5&w#aULq7k(Ay>^ zLd@&8@*J1Yl3`#9g+r!b0yta#hdWR=zX-(7Hy#T?)Qbta3#FY*{nnH;a0oROi?=++h2FyL1?zIluln+Une zBzqjK3j4w6$#D}YMGXnmLy0D^Bytm$zXm^>lfS| zx0P^$I1@HHs;`mUnnoe?q3RQt5rW2o@o>v->3Pe&L<=8+HHbK2eBoU>cHvCU1 z<$uUHHB>b1;7oD#$==k`3=vyKci4X?qwu8#$YoR@;`Eq{f@%xOU?_0si}2eA7|0ii zG-Fsa$=lr70w(ZNU7tNOg`kIE zbMM4$V2RoYH#t6!pkk2U!YDzZ5Lx6VCpomp5m5MPul0tmuC8WKiW&PC$VgS&VFN=p z3(D~zET6J#)mX?Rei0T%fO;`u+X2*Z6yz*belRTOw+}alZU|kC;Xom9;=H5O0Gx2A zcc=$vPnZT#T-r=a)9ULP6weO(Mcmg6<#vbl1}r@Sf{wCJnobI0_EU)`QI@5m23xQ;0}x0*3}JVqj*b&{EdChvs-$$j`rf`DL#;;qyM2 zAZZN^jOJyusFG)Y9zgp5xoCIgS5d*jJZx5p+kj>1ACwnt%4XORY>Ym1SU^Ay5P zW=IL!>((2?51~9)3m)^gBSkj4Eo7^N-)~;_c=y-HL9c^vKtcl5x8>!9dre1_5N#tM zl@b#dPlweSF5UoSFHNR*vAJ3Ucj+%LziChYR851 zAGA|nLq>MR7Yn*62K0ccR>;Ks89iBzBvRGkb=^moskEW`YN|ExTm;VK%d=(A= literal 0 HcmV?d00001 diff --git a/vocab.json b/vocab.json new file mode 100644 index 0000000..6c49fc6 --- /dev/null +++ b/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833